summary refs log tree commit diff
path: root/Microbenchmarks/STREAM/dpu
diff options
context:
space:
mode:
author Daniel Friesel <daniel.friesel@uos.de> 2023-05-10 15:18:52 +0200
committer Daniel Friesel <daniel.friesel@uos.de> 2023-05-10 15:18:52 +0200
commit ce9cc7975bad005cb4f7cf260b92ee7e8c85249e (patch)
tree 34e23ee9c41d98f9303b85166b0edf34c6addf98 /Microbenchmarks/STREAM/dpu
parent f83c88050dd459ba3b3782b8ff83ef94a6313ad9 (diff)
STREAM: dfatool compat; variable data type
Diffstat (limited to 'Microbenchmarks/STREAM/dpu')
-rw-r--r-- Microbenchmarks/STREAM/dpu/add.c 8
-rw-r--r-- Microbenchmarks/STREAM/dpu/copyw.c 8
-rw-r--r-- Microbenchmarks/STREAM/dpu/scale.c 8
-rw-r--r-- Microbenchmarks/STREAM/dpu/triad.c 8
4 files changed, 24 insertions, 8 deletions
diff --git a/Microbenchmarks/STREAM/dpu/add.c b/Microbenchmarks/STREAM/dpu/add.c
index faf6504..12854ee 100644
--- a/Microbenchmarks/STREAM/dpu/add.c
+++ b/Microbenchmarks/STREAM/dpu/add.c
@@ -18,12 +18,16 @@ __host dpu_results_t DPU_RESULTS[NR_TASKLETS];
// Add
static void add_dpu(T *bufferC, T *bufferA, T *bufferB) {
-
+#if UNROLL
#pragma unroll
for (unsigned int i = 0; i < BLOCK_SIZE / sizeof(T); i++){
bufferC[i] = bufferA[i] + bufferB[i];
}
-
+#else
+ for (unsigned int i = 0; i < BLOCK_SIZE / sizeof(T); i++){
+ bufferC[i] = bufferA[i] + bufferB[i];
+ }
+#endif
}
// Barrier
diff --git a/Microbenchmarks/STREAM/dpu/copyw.c b/Microbenchmarks/STREAM/dpu/copyw.c
index eff7a3b..66dd319 100644
--- a/Microbenchmarks/STREAM/dpu/copyw.c
+++ b/Microbenchmarks/STREAM/dpu/copyw.c
@@ -18,12 +18,16 @@ __host dpu_results_t DPU_RESULTS[NR_TASKLETS];
// Copy
static void copyw_dpu(T *bufferB, T *bufferA) {
-
+#if UNROLL
#pragma unroll
for (unsigned int i = 0; i < BLOCK_SIZE / sizeof(T); i++){
bufferB[i] = bufferA[i];
}
-
+#else
+ for (unsigned int i = 0; i < BLOCK_SIZE / sizeof(T); i++){
+ bufferB[i] = bufferA[i];
+ }
+#endif
}
// Barrier
diff --git a/Microbenchmarks/STREAM/dpu/scale.c b/Microbenchmarks/STREAM/dpu/scale.c
index 4247aac..53a70a2 100644
--- a/Microbenchmarks/STREAM/dpu/scale.c
+++ b/Microbenchmarks/STREAM/dpu/scale.c
@@ -18,12 +18,16 @@ __host dpu_results_t DPU_RESULTS[NR_TASKLETS];
// Scale
static void scale_dpu(T *bufferB, T *bufferA, T scalar) {
-
+#if UNROLL
#pragma unroll
for (unsigned int i = 0; i < BLOCK_SIZE / sizeof(T); i++){
bufferB[i] = scalar * bufferA[i];
}
-
+#else
+ for (unsigned int i = 0; i < BLOCK_SIZE / sizeof(T); i++){
+ bufferB[i] = scalar * bufferA[i];
+ }
+#endif
}
// Barrier
diff --git a/Microbenchmarks/STREAM/dpu/triad.c b/Microbenchmarks/STREAM/dpu/triad.c
index e81cb59..9e641ea 100644
--- a/Microbenchmarks/STREAM/dpu/triad.c
+++ b/Microbenchmarks/STREAM/dpu/triad.c
@@ -18,12 +18,16 @@ __host dpu_results_t DPU_RESULTS[NR_TASKLETS];
// Triad
static void triad_dpu(T *bufferC, T *bufferA, T *bufferB, T scalar) {
-
+#if UNROLL
#pragma unroll
for (unsigned int i = 0; i < BLOCK_SIZE / sizeof(T); i++){
bufferC[i] = bufferA[i] + scalar * bufferB[i];
}
-
+#else
+ for (unsigned int i = 0; i < BLOCK_SIZE / sizeof(T); i++){
+ bufferC[i] = bufferA[i] + scalar * bufferB[i];
+ }
+#endif
}
// Barrier