summaryrefslogtreecommitdiff
path: root/BS/dimes-hetsim-hbm.sh
diff options
context:
space:
mode:
Diffstat (limited to 'BS/dimes-hetsim-hbm.sh')
-rwxr-xr-xBS/dimes-hetsim-hbm.sh16
1 files changed, 6 insertions, 10 deletions
diff --git a/BS/dimes-hetsim-hbm.sh b/BS/dimes-hetsim-hbm.sh
index 2aabe15..4e1500d 100755
--- a/BS/dimes-hetsim-hbm.sh
+++ b/BS/dimes-hetsim-hbm.sh
@@ -1,12 +1,10 @@
#!/bin/bash
-echo PrIM BS
-
cd baselines/cpu
make -B NUMA=1
mkdir -p log/$(hostname)
-fn=log/$(hostname)/$(date +%Y%m%d)
+fn=log/$(hostname)/dimes-hetsim-hbm
# upstream DPU version uses 2048576 * uint64 ≈ 16 MiB (DPU max: 64 MiB)
# upstream DPU version uses 2 queries
@@ -32,7 +30,7 @@ export -f run_benchmark
echo "single-node execution, DPU ref (1/4)" >&2
-parallel -j1 --eta --joblog ${fn}.1.joblog --header : \
+parallel -j1 --eta --joblog ${fn}.1.joblog --resume --header : \
run_benchmark i={i} nr_threads={nr_threads} ram={ram} cpu={cpu} \
input_size=${input_size_dpu} num_queries=${num_queries_dpu} \
::: i $(seq 1 5) \
@@ -42,7 +40,7 @@ parallel -j1 --eta --joblog ${fn}.1.joblog --header : \
echo "single-node execution, HBM ref (2/4)" >&2
-parallel -j1 --eta --joblog ${fn}.2.joblog --header : \
+parallel -j1 --eta --joblog ${fn}.2.joblog --resume --header : \
run_benchmark i={i} nr_threads={nr_threads} ram={ram} cpu={cpu} \
input_size=${input_size_hbm} num_queries=${num_queries_hbm} \
::: i $(seq 1 5) \
@@ -52,7 +50,7 @@ parallel -j1 --eta --joblog ${fn}.2.joblog --header : \
echo "multi-node execution, DPU ref (3/4)" >&2
-parallel -j1 --eta --joblog ${fn}.3.joblog --header : \
+parallel -j1 --eta --joblog ${fn}.3.joblog --resume --header : \
run_benchmark i={i} nr_threads={nr_threads} ram={ram} cpu={cpu} \
input_size=${input_size_dpu} num_queries=${num_queries_dpu} \
::: i $(seq 1 40) \
@@ -62,7 +60,7 @@ parallel -j1 --eta --joblog ${fn}.3.joblog --header : \
echo "multi-node execution, HBM ref (4/4)" >&2
-parallel -j1 --eta --joblog ${fn}.4.joblog --header : \
+parallel -j1 --eta --joblog ${fn}.4.joblog --resume --header : \
run_benchmark i={i} nr_threads={nr_threads} ram={ram} cpu={cpu} \
input_size=${input_size_hbm} num_queries=${num_queries_hbm} \
::: i $(seq 1 40) \
@@ -70,6 +68,4 @@ parallel -j1 --eta --joblog ${fn}.4.joblog --header : \
::: cpu -1 \
::: ram $(seq 0 15)
-) > ${fn}.txt
-
-xz -f -v -9 -M 800M ${fn}.txt
+) >> ${fn}.txt