summaryrefslogtreecommitdiff
path: root/TRNS/dimes-hetsim-nmc.sh
diff options
context:
space:
mode:
author Birte Kristina Friesel <birte.friesel@uos.de> 2024-07-25 15:42:29 +0200
committer Birte Kristina Friesel <birte.friesel@uos.de> 2024-07-25 15:42:50 +0200
commit b471467e738151e643be84d8e3757553aba524d0 (patch)
tree 9c7cc79c51b5d734141548104a113104106ccd1f /TRNS/dimes-hetsim-nmc.sh
parent b3d5b55cc00cb7977adfbde6c03599a345357767 (diff)
TRNS: fix write1 documentation
Diffstat (limited to 'TRNS/dimes-hetsim-nmc.sh')
-rwxr-xr-x TRNS/dimes-hetsim-nmc.sh 4
1 files changed, 2 insertions, 2 deletions
diff --git a/TRNS/dimes-hetsim-nmc.sh b/TRNS/dimes-hetsim-nmc.sh
index fb2640c..ef32b86 100755
--- a/TRNS/dimes-hetsim-nmc.sh
+++ b/TRNS/dimes-hetsim-nmc.sh
@@ -9,9 +9,9 @@ source /opt/upmem/upmem-2024.1.0-Linux-x86_64/upmem_env.sh
#
# Input: (M_ * m) × (N_ * n) matrix
# Output: (N_* n) × (M_ * m) matrix
-# Step 1: transpose (M_ * m) × N_ matrix that consits of tiles of size n
+# Step 1: transpose (M_ * m) × N_ matrix that consists of tiles of size n
# CPU version: explicit
-# DPU version: implicit (appropriate write operations to DPUs)
+# DPU version: implicit (M_ * m write operations of #DPUs * n elements to DPUs)
# Step 2: transpose m × n matrix; this happens N_ * M_ times.
# DPU version: Each tasklet transposes a single m × n matrix / tile.
# (16 × 8 tile takes up 1 KiB WRAM)