diff options
Diffstat (limited to 'TRNS/include')
-rw-r--r-- | TRNS/include/common.h | 42 | ||||
-rw-r--r-- | TRNS/include/dfatool_host.ah | 25 | ||||
-rw-r--r-- | TRNS/include/params.h | 68 | ||||
-rw-r--r-- | TRNS/include/timer.h | 5 |
4 files changed, 140 insertions, 0 deletions
diff --git a/TRNS/include/common.h b/TRNS/include/common.h new file mode 100644 index 0000000..6a94c62 --- /dev/null +++ b/TRNS/include/common.h @@ -0,0 +1,42 @@ +#ifndef _COMMON_H_ +#define _COMMON_H_ + +// Transfer size between MRAM and WRAM +#ifdef BL +#define BLOCK_SIZE_LOG2 BL +#define BLOCK_SIZE (1 << BLOCK_SIZE_LOG2) +#else +#define BLOCK_SIZE_LOG2 8 +#define BLOCK_SIZE (1 << BLOCK_SIZE_LOG2) +#define BL BLOCK_SIZE_LOG2 +#endif + +// Data type +#define T int64_t + +enum kernels { + kernel1 = 0, + kernel2 = 1, + nr_kernels = 2, +}; + +// Structures used by both the host and the dpu to communicate information +typedef struct { + uint32_t m; + uint32_t n; + uint32_t M_; + enum kernels kernel; +} dpu_arguments_t; + +#ifndef ENERGY +#define ENERGY 0 +#endif +#define PRINT 0 + +#define ANSI_COLOR_RED "\x1b[31m" +#define ANSI_COLOR_GREEN "\x1b[32m" +#define ANSI_COLOR_RESET "\x1b[0m" + +#define divceil(n, m) (((n)-1) / (m) + 1) +#define roundup(n, m) ((n / m) * m + m) +#endif diff --git a/TRNS/include/dfatool_host.ah b/TRNS/include/dfatool_host.ah new file mode 100644 index 0000000..94f6101 --- /dev/null +++ b/TRNS/include/dfatool_host.ah @@ -0,0 +1,25 @@ +#pragma once + +#include <sys/time.h> +#include "dfatool_host_dpu.ah" + +aspect DfatoolHostTiming : public DfatoolHostDPUTiming { + + DfatoolHostTiming() { + element_size = sizeof(T); + } + + advice call("% input_params(...)") : after() { + Params* p = tjp->result(); + input_size = p->M_ * p->m * p->N_ * p->n; + printf("[>>] TRNS | n_dpus=%u n_elements=%lu e_exp=%d\n", NR_DPUS, input_size, p->exp); + } + + advice call("% trns_host(...)") : after() { + printf("[--] TRNS | n_dpus=%u n_ranks=%u n_elements=%lu e_exp=%d\n", n_dpus, n_ranks, input_size, p.exp); + } + + advice execution("% main(...)") : after() { + printf("[<<] TRNS | n_dpus=%u n_elements=%lu e_exp=%d\n", NR_DPUS, input_size, p.exp); + } +}; diff --git a/TRNS/include/params.h b/TRNS/include/params.h new file mode 100644 index 0000000..385490e --- /dev/null +++ b/TRNS/include/params.h @@ -0,0 +1,68 @@ +#ifndef _PARAMS_H_ +#define _PARAMS_H_ + +#include "common.h" + +typedef struct Params { + unsigned int M_; + unsigned int m; + unsigned int N_; + unsigned int n; + int n_warmup; + int n_reps; + int exp; +}Params; + +static void usage() { + fprintf(stderr, + "\nUsage: ./program [options]" + "\n" + "\nGeneral options:" + "\n -h help" + "\n -w <W> # of untimed warmup iterations (default=1)" + "\n -e <E> # of timed repetition iterations (default=3)" + "\n -x <X> Weak (0) or strong (1) scaling (default=1)" + "\n" + "\nBenchmark-specific options:" + "\n -m <I> m (default=16 elements)" + "\n -n <I> n (default=8 elements)" + "\n -o <I> M_ (default=12288 elements)" + "\n -p <I> N_ (default=1 elements)" + "\n"); +} + +struct Params input_params(int argc, char **argv) { + struct Params p; + p.M_ = 12288; + p.m = 16; + p.N_ = 1; + p.n = 8; + p.n_warmup = 1; + p.n_reps = 3; + p.exp = 1; + + int opt; + while((opt = getopt(argc, argv, "hw:e:x:m:n:o:p:")) >= 0) { + switch(opt) { + case 'h': + usage(); + exit(0); + break; + case 'w': p.n_warmup = atoi(optarg); break; + case 'e': p.n_reps = atoi(optarg); break; + case 'x': p.exp = atoi(optarg); break; + case 'm': p.m = atoi(optarg); break; + case 'n': p.n = atoi(optarg); break; + case 'o': p.M_ = atoi(optarg); break; + case 'p': p.N_ = atoi(optarg); break; + default: + fprintf(stderr, "\nUnrecognized option!\n"); + usage(); + exit(0); + } + } + assert(NR_DPUS > 0 && "Invalid # of dpus!"); + + return p; +} +#endif diff --git a/TRNS/include/timer.h b/TRNS/include/timer.h new file mode 100644 index 0000000..8d5c3d5 --- /dev/null +++ b/TRNS/include/timer.h @@ -0,0 +1,5 @@ +#pragma once + +#define N_TIMERS 10 +#include "../../include/timer_base.h" +#undef N_TIMERS |