summary refs log tree commit diff
path: root/VA/dimes-hetsim-hbm.sh
diff options
context:
space:
mode:
Diffstat (limited to 'VA/dimes-hetsim-hbm.sh')
-rwxr-xr-x VA/dimes-hetsim-hbm.sh 42
1 files changed, 34 insertions, 8 deletions
diff --git a/VA/dimes-hetsim-hbm.sh b/VA/dimes-hetsim-hbm.sh
index a7c9ef4..7c0df73 100755
--- a/VA/dimes-hetsim-hbm.sh
+++ b/VA/dimes-hetsim-hbm.sh
@@ -1,7 +1,6 @@
#!/bin/sh
cd baselines/cpu
-make -B NUMA=1
mkdir -p log/$(hostname)
fn=log/$(hostname)/dimes-hetsim-hbm
@@ -10,22 +9,49 @@ fn=log/$(hostname)/dimes-hetsim-hbm
(
-echo "single-node execution (1/2)" >&2
+make -B NUMA=1 NUMA_MEMCPY=1
+
+echo "CPU single-node operation with setup cost, cpu/out on same node (1/4)" >&2
parallel -j1 --eta --joblog ${fn}.1.joblog --resume --header : \
- ./va -i {input_size} -a {ram} -b {ram} -c {cpu} -t {nr_threads} -w 0 -e 5 \
+ ./va -i {input_size} -a {ram_in} -b {ram_out} -c {cpu} -C {ram_local} -t {nr_threads} -w 0 -e 40 \
::: nr_threads 1 2 4 8 12 16 \
- ::: cpu $(seq 0 7) \
- ::: ram $(seq 0 15) \
+ ::: ram_in $(seq 0 15) \
+ ::: cpu $(seq 0 7) $(seq 0 7) \
+ :::+ ram_local $(seq 0 15) \
+ :::+ ram_out $(seq 0 15) \
::: input_size 167772160
-echo "multi-node execution (2/2)" >&2
+make -B NUMA=1
+
+echo "single-node execution, cpu/out on same node (2/4)" >&2
parallel -j1 --eta --joblog ${fn}.2.joblog --resume --header : \
- ./va -i {input_size} -a {ram} -b {ram} -c {cpu} -t {nr_threads} -w 0 -e 40 \
+ ./va -i {input_size} -a {ram_in} -b {ram_out} -c {cpu} -t {nr_threads} -w 0 -e 5 \
+ ::: nr_threads 1 2 4 8 12 16 \
+ ::: ram_in $(seq 0 15) \
+ ::: cpu $(seq 0 7) $(seq 0 7) \
+ :::+ ram_out $(seq 0 15) \
+ ::: input_size 167772160
+
+echo "single-node execution, in/out on same node (3/4)" >&2
+
+parallel -j1 --eta --joblog ${fn}.3.joblog --resume --header : \
+ ./va -i {input_size} -a {ram_in} -b {ram_out} -c {cpu} -t {nr_threads} -w 0 -e 5 \
+ ::: nr_threads 1 2 4 8 12 16 \
+ ::: cpu $(seq 0 7) \
+ ::: ram_in $(seq 0 15) \
+ :::+ ram_out $(seq 0 15) \
+ ::: input_size 167772160
+
+echo "multi-node execution (4/4)" >&2
+
+parallel -j1 --eta --joblog ${fn}.4.joblog --resume --header : \
+ ./va -i {input_size} -a {ram_in} -b {ram_out} -c {cpu} -t {nr_threads} -w 0 -e 40 \
::: nr_threads 32 48 64 96 128 \
::: cpu -1 \
- ::: ram $(seq 0 15) \
+ ::: ram_in $(seq 0 15) \
+ ::: ram_out $(seq 0 15) \
::: input_size 167772160
) >> ${fn}.txt