blob: 25bba55ed674e9baf8d5ee8907b6141b0cb529ef (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
|
#!/bin/bash
# Benchmark driver for the prim-benchmarks TS workload.
#
# For every combination of NR_DPUS and NR_TASKLETS listed below, the host
# binary is rebuilt twice (once plain, once with the WITH_*_OVERHEAD flags
# enabled) and bin/ts_host is run after each successful build. Everything
# the runs print to stdout is shown on the terminal and also saved to
#   <hostname>/<YYYYMMDD>-fgbs24a.txt
# relative to the current working directory.
set -e

# Resolve the host name once so the results directory and the log path are
# guaranteed to agree, and quote it so it is never word-split or globbed.
host=$(hostname)
mkdir -p -- "${host}"
ts=$(date +%Y%m%d)
log_file="${host}/${ts}-fgbs24a.txt"

# Arguments passed to every bin/ts_host invocation.
ts_host_args=(-w 0 -e 100 -n 33554432)

# BL: use 2^(BL) B blocks for MRAM <-> WRAM transfers on PIM module
# T: data type
# -w: number of un-timed warmup iterations
# -e: number of timed iterations
# -i: ignored, always uses 262144 elements
# NOTE(review): the runs below pass -n 33554432 and never pass -i; confirm
# whether the -i note above is still accurate.
(
  echo "prim-benchmarks TS (dfatool fgbs24a edition)"
  echo "Started at $(date)"
  echo "Revision $(git describe --always)"
  for nr_dpus in 2304 2048 2543; do
    # upstream code only works with up to 8 tasklets. funky.
    # NOTE(review): 12 and 16 tasklets are benchmarked here as well;
    # presumably this tree lifts the upstream limit -- confirm.
    for nr_tasklets in 8 12 16; do
      echo
      # upstream code did not respect $BL in the makefile and used 256B (BL=8) instead.
      # This appears to be faster than BL=10.
      # make -B forces a full rebuild so the new compile-time settings apply.
      if make -B "NR_DPUS=${nr_dpus}" "NR_TASKLETS=${nr_tasklets}" BL=8; then
        # Abort a run after 30 minutes (SIGKILL one minute later if it is
        # still alive). '|| true' keeps 'set -e' from ending the whole
        # sweep when a single run fails or times out.
        timeout --foreground -k 1m 30m bin/ts_host "${ts_host_args[@]}" || true
      fi
      # Same configuration, with the overhead build flags switched on.
      if make -B "NR_DPUS=${nr_dpus}" "NR_TASKLETS=${nr_tasklets}" BL=8 WITH_ALLOC_OVERHEAD=1 WITH_LOAD_OVERHEAD=1 WITH_FREE_OVERHEAD=1; then
        timeout --foreground -k 1m 30m bin/ts_host "${ts_host_args[@]}" || true
      fi
    done
  done
  echo "Completed at $(date)"
) | tee "${log_file}"
|