diff options
author | Birte Kristina Friesel <birte.friesel@uos.de> | 2024-02-23 12:13:20 +0100 |
---|---|---|
committer | Birte Kristina Friesel <birte.friesel@uos.de> | 2024-02-23 12:13:20 +0100 |
commit | 09a8f09e2c00e484d59ceab09519984fc487237f (patch) | |
tree | 3078d7a544db0ae06e0c2b821621aaa39802ae75 /Microbenchmarks | |
parent | 02619c6af481c62a5cb4c2c78a015de072b0e091 (diff) |
STREAM: no alloc/load overhead for now
Diffstat (limited to 'Microbenchmarks')
-rwxr-xr-x | Microbenchmarks/STREAM/run-rank.sh | 4 |
1 files changed, 2 insertions, 2 deletions
```diff
diff --git a/Microbenchmarks/STREAM/run-rank.sh b/Microbenchmarks/STREAM/run-rank.sh
index a745a3f..8a831c3 100755
--- a/Microbenchmarks/STREAM/run-rank.sh
+++ b/Microbenchmarks/STREAM/run-rank.sh
@@ -20,8 +20,8 @@ for i in 2097152 1048576 131072 16384 4096; do
 # From a performance perspective, 8 to 10 is usually best for sequential operations.
 for bl in 3 4 5 6 8 10; do
   echo
-  if make -B OP=${op} NR_DPUS=${nr_dpus} NR_TASKLETS=${nr_tasklets} BL=${bl} T=${dt} UNROLL=1 WITH_ALLOC_OVERHEAD=1 WITH_LOAD_OVERHEAD=1 WITH_FREE_OVERHEAD=1 \
-    || make -B OP=${op} NR_DPUS=${nr_dpus} NR_TASKLETS=${nr_tasklets} BL=${bl} T=${dt} UNROLL=0 WITH_ALLOC_OVERHEAD=1 WITH_LOAD_OVERHEAD=1 WITH_FREE_OVERHEAD=1; then
+  if make -B OP=${op} NR_DPUS=${nr_dpus} NR_TASKLETS=${nr_tasklets} BL=${bl} T=${dt} UNROLL=1 WITH_ALLOC_OVERHEAD=0 WITH_LOAD_OVERHEAD=0 WITH_FREE_OVERHEAD=0 \
+    || make -B OP=${op} NR_DPUS=${nr_dpus} NR_TASKLETS=${nr_tasklets} BL=${bl} T=${dt} UNROLL=0 WITH_ALLOC_OVERHEAD=0 WITH_LOAD_OVERHEAD=0 WITH_FREE_OVERHEAD=0; then
     # -w: number of un-timed warmup iterations
     # -e: number of timed iterations
     timeout --foreground -k 1m 30m bin/host_code -w 0 -e 100 -i $i -x 0 || true
```