diff options
Diffstat (limited to 'BFS')
| -rwxr-xr-x | BFS/benchmark-scripts/ccmcc25-sim.sh | 27 | ||||
| -rwxr-xr-x | BFS/benchmark-scripts/ccmcc25.sh | 27 | ||||
| -rw-r--r-- | BFS/host/app.c | 2 |
3 files changed, 44 insertions, 12 deletions
diff --git a/BFS/benchmark-scripts/ccmcc25-sim.sh b/BFS/benchmark-scripts/ccmcc25-sim.sh
new file mode 100755
index 0000000..bcbe284
--- /dev/null
+++ b/BFS/benchmark-scripts/ccmcc25-sim.sh
@@ -0,0 +1,27 @@
+#!/bin/bash
+
+mkdir -p log/$(hostname)
+
+run_benchmark_nmc() {
+ local "$@"
+ set -e
+ make -B NR_DPUS=${nr_dpus} NR_TASKLETS=${nr_tasklets} \
+ aspectc=1 aspectc_timing=1 dfatool_timing=0
+ bin/host_code -f ${data} 2>&1
+}
+
+export -f run_benchmark_nmc
+
+fn=log/$(hostname)/ccmcc25-sdk${sdk}-sim
+
+source ~/lib/local/upmem/upmem-2025.1.0-Linux-x86_64/upmem_env.sh simulator
+
+echo "prim-benchmarks BFS $(git describe --all --long) $(git rev-parse HEAD) $(date -R)" >> ${fn}.txt
+
+# BFS does not support repeated kernel invocations → repeat it here
+parallel -j1 --eta --joblog ${fn}.joblog --resume --header : \
+ run_benchmark_nmc nr_dpus={nr_dpus} nr_tasklets=16 data={data} \
+ ::: i $(seq 0 4) \
+ ::: data data/roadNet-CA.txt data/loc-gowalla_edges.txt \
+ ::: nr_dpus 1 2 4 8 16 32 48 64 \
+>> ${fn}.txt
diff --git a/BFS/benchmark-scripts/ccmcc25.sh b/BFS/benchmark-scripts/ccmcc25.sh
index 436d2eb..0dcf4bb 100755
--- a/BFS/benchmark-scripts/ccmcc25.sh
+++ b/BFS/benchmark-scripts/ccmcc25.sh
@@ -1,9 +1,6 @@
 #!/bin/bash
 
 mkdir -p log/$(hostname)
-fn=log/$(hostname)/ccmcc25
-
-source /opt/upmem/upmem-2025.1.0-Linux-x86_64/upmem_env.sh
 
 run_benchmark_nmc() {
  local "$@"
@@ -16,12 +13,20 @@ run_benchmark_nmc() {
 
 export -f run_benchmark_nmc
 
-echo "prim-benchmarks BFS $(git describe --all --long) $(git rev-parse HEAD) $(date -R)" >> ${fn}.txt
+for sdk in 2023.2.0 2024.1.0 2024.2.0 2025.1.0; do
+
+ fn=log/$(hostname)/ccmcc25-sdk${sdk}
+
+ source /opt/upmem/upmem-${sdk}-Linux-x86_64/upmem_env.sh
+
+ echo "prim-benchmarks BFS $(git describe --all --long) $(git rev-parse HEAD) $(date -R)" >> ${fn}.txt
+
+ # BFS does not support repeated kernel invocations → repeat it here
+ parallel -j1 --eta --joblog ${fn}.joblog --resume --header : \
+ run_benchmark_nmc nr_dpus={nr_dpus} nr_tasklets=16 numa_rank=any data={data} \
+ ::: i $(seq 0 10) \
+ ::: data data/roadNet-CA.txt data/loc-gowalla_edges.txt \
+ ::: nr_dpus 64 128 256 512 768 1024 1536 2048 2304 \
+ >> ${fn}.txt
 
-# BFS does not support repeated kernel invocations → repeat it here
-parallel -j1 --eta --joblog ${fn}.joblog --resume --header : \
- run_benchmark_nmc nr_dpus={nr_dpus} nr_tasklets=16 numa_rank=any data={data} \
- ::: i $(seq 0 10) \
- ::: data data/roadNet-CA.txt data/loc-gowalla_edges.txt \
- ::: nr_dpus 64 128 256 512 768 1024 1536 2048 2304 \
->> ${fn}.txt
+done
diff --git a/BFS/host/app.c b/BFS/host/app.c
index 66b4792..4431193 100644
--- a/BFS/host/app.c
+++ b/BFS/host/app.c
@@ -205,7 +205,7 @@ int main(int argc, char **argv)
  DPU_ASSERT(dpu_copy_to(dpu, DPU_MRAM_HEAP_POINTER_NAME,
  dpuNextFrontier_m,
  (uint8_t *) nextFrontier,
- ROUND_UP_TO_MULTIPLE_OF_8(numNodes / 64 * sizeof(uint64_t))))
+ ROUND_UP_TO_MULTIPLE_OF_8(numNodes / 64 * sizeof(uint64_t))));
  // NOTE: No need to copy current frontier because it is written before being read
  stopTimer(&timer, 2);
 
