| 1 | package main
|
|---|
| 2 |
|
|---|
| 3 | import (
|
|---|
| 4 | "bufio"
|
|---|
| 5 | "flag"
|
|---|
| 6 | "fmt"
|
|---|
| 7 | "os"
|
|---|
| 8 | "runtime"
|
|---|
| 9 | "sync/atomic"
|
|---|
| 10 | "time"
|
|---|
| 11 | "golang.org/x/text/language"
|
|---|
| 12 | "golang.org/x/text/message"
|
|---|
| 13 | )
|
|---|
| 14 |
|
|---|
| 15 | var clock_mode bool
|
|---|
| 16 | var threads_left int64
|
|---|
| 17 | var stop int32
|
|---|
| 18 | var duration float64
|
|---|
| 19 | var stop_count uint64
|
|---|
| 20 |
|
|---|
| 21 | func fflush(f *bufio.Writer) {
|
|---|
| 22 | defer f.Flush()
|
|---|
| 23 | f.Write([]byte("\r"))
|
|---|
| 24 | }
|
|---|
| 25 |
|
|---|
| 26 | func wait(start time.Time, is_tty bool) {
|
|---|
| 27 | f := bufio.NewWriter(os.Stdout)
|
|---|
| 28 | tdur := time.Duration(duration)
|
|---|
| 29 | for true {
|
|---|
| 30 | time.Sleep(100 * time.Millisecond)
|
|---|
| 31 | end := time.Now()
|
|---|
| 32 | delta := end.Sub(start)
|
|---|
| 33 | if is_tty {
|
|---|
| 34 | fmt.Printf(" %.1f",delta.Seconds())
|
|---|
| 35 | fflush(f)
|
|---|
| 36 | }
|
|---|
| 37 | if clock_mode && delta >= (tdur * time.Second) {
|
|---|
| 38 | break
|
|---|
| 39 | } else if !clock_mode && atomic.LoadInt64(&threads_left) == 0 {
|
|---|
| 40 | break
|
|---|
| 41 | }
|
|---|
| 42 | }
|
|---|
| 43 | }
|
|---|
| 44 |
|
|---|
| 45 | func partner(result chan uint64, mine chan int, next chan int) {
|
|---|
| 46 | count := uint64(0)
|
|---|
| 47 | for true {
|
|---|
| 48 | <- mine
|
|---|
| 49 | next <- 0
|
|---|
| 50 | count += 1
|
|---|
| 51 | if clock_mode && atomic.LoadInt32(&stop) == 1 { break }
|
|---|
| 52 | if !clock_mode && count >= stop_count { break }
|
|---|
| 53 | }
|
|---|
| 54 |
|
|---|
| 55 | atomic.AddInt64(&threads_left, -1);
|
|---|
| 56 | result <- count
|
|---|
| 57 | }
|
|---|
| 58 |
|
|---|
| 59 | func main() {
|
|---|
| 60 | var nprocs int
|
|---|
| 61 | var nthreads int
|
|---|
| 62 | var ring_size int
|
|---|
| 63 |
|
|---|
| 64 | nprocsOpt := flag.Int("p", 1, "The number of processors")
|
|---|
| 65 | nthreadsOpt := flag.Int("t", 1, "The number of threads")
|
|---|
| 66 | ring_sizeOpt := flag.Int("r", 2, "The number of threads per cycles")
|
|---|
| 67 | durationOpt := flag.Float64("d", 0, "Duration of the experiment in seconds")
|
|---|
| 68 | stopOpt := flag.Uint64("i", 0, "Duration of the experiment in iterations")
|
|---|
| 69 |
|
|---|
| 70 | flag.Parse()
|
|---|
| 71 |
|
|---|
| 72 | nprocs = *nprocsOpt
|
|---|
| 73 | nthreads = *nthreadsOpt
|
|---|
| 74 | ring_size = *ring_sizeOpt
|
|---|
| 75 | duration = *durationOpt
|
|---|
| 76 | stop_count = *stopOpt
|
|---|
| 77 |
|
|---|
| 78 | if duration > 0 && stop_count > 0 {
|
|---|
| 79 | panic(fmt.Sprintf("--duration and --iterations cannot be used together\n"))
|
|---|
| 80 | } else if duration > 0 {
|
|---|
| 81 | clock_mode = true
|
|---|
| 82 | stop_count = 0xFFFFFFFFFFFFFFFF
|
|---|
| 83 | fmt.Printf("Running for %f seconds\n", duration)
|
|---|
| 84 | } else if stop_count > 0 {
|
|---|
| 85 | clock_mode = false
|
|---|
| 86 | fmt.Printf("Running for %d iterations\n", stop_count)
|
|---|
| 87 | } else {
|
|---|
| 88 | duration = 5
|
|---|
| 89 | clock_mode = true
|
|---|
| 90 | fmt.Printf("Running for %f seconds\n", duration)
|
|---|
| 91 | }
|
|---|
| 92 |
|
|---|
| 93 | runtime.GOMAXPROCS(nprocs)
|
|---|
| 94 | tthreads := nthreads * ring_size
|
|---|
| 95 | threads_left = int64(tthreads)
|
|---|
| 96 |
|
|---|
| 97 | result := make(chan uint64)
|
|---|
| 98 | channels := make([]chan int, tthreads)
|
|---|
| 99 | for i := range channels {
|
|---|
| 100 | channels[i] = make(chan int, 1)
|
|---|
| 101 | }
|
|---|
| 102 |
|
|---|
| 103 | for i := 0; i < tthreads; i++ {
|
|---|
| 104 | pi := (i + nthreads) % tthreads
|
|---|
| 105 | go partner(result, channels[i], channels[pi])
|
|---|
| 106 | }
|
|---|
| 107 | fmt.Printf("Starting\n");
|
|---|
| 108 |
|
|---|
| 109 | atomic.StoreInt32(&stop, 0)
|
|---|
| 110 | start := time.Now()
|
|---|
| 111 | for i := 0; i < nthreads; i++ {
|
|---|
| 112 | channels[i] <- 0
|
|---|
| 113 | }
|
|---|
| 114 | wait(start, true);
|
|---|
| 115 |
|
|---|
| 116 | atomic.StoreInt32(&stop, 1)
|
|---|
| 117 | end := time.Now()
|
|---|
| 118 | delta := end.Sub(start)
|
|---|
| 119 |
|
|---|
| 120 | fmt.Printf("\nDone\n")
|
|---|
| 121 |
|
|---|
| 122 | global_counter := uint64(0)
|
|---|
| 123 | for i := 0; i < tthreads; i++ {
|
|---|
| 124 | global_counter += <- result
|
|---|
| 125 | }
|
|---|
| 126 |
|
|---|
| 127 | p := message.NewPrinter(language.English)
|
|---|
| 128 | p.Printf("Duration (ms) : %f\n", delta.Seconds());
|
|---|
| 129 | p.Printf("Number of processors: %d\n", nprocs);
|
|---|
| 130 | p.Printf("Number of threads : %d\n", tthreads);
|
|---|
| 131 | p.Printf("Cycle size (# thrds): %d\n", ring_size);
|
|---|
| 132 | p.Printf("Yields per second : %18.2f\n", float64(global_counter) / delta.Seconds())
|
|---|
| 133 | p.Printf("ns per yields : %18.2f\n", float64(delta.Nanoseconds()) / float64(global_counter))
|
|---|
| 134 | p.Printf("Total yields : %15d\n", global_counter)
|
|---|
| 135 | p.Printf("Yields per threads : %15d\n", global_counter / uint64(tthreads))
|
|---|
| 136 | p.Printf("Yields per procs : %15d\n", global_counter / uint64(nprocs))
|
|---|
| 137 | p.Printf("Yields/sec/procs : %18.2f\n", (float64(global_counter) / float64(nprocs)) / delta.Seconds())
|
|---|
| 138 | p.Printf("ns per yields/procs : %18.2f\n", float64(delta.Nanoseconds()) / (float64(global_counter) / float64(nprocs)))
|
|---|
| 139 |
|
|---|
| 140 | }
|
|---|