1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
|
#pragma once
#include <sys/time.h>
#include "dfatool_host_dpu.ah"
aspect DfatoolHostTiming : public DfatoolHostDPUTiming {
unsigned int n_rows_f1, n_rows_f2, n_cols_f1, n_cols_f2;
unsigned int element_size;
virtual int getKernel() { return kernel; }
DfatoolHostTiming() {
element_size = sizeof(T);
}
advice call("% input_params(...)") : after() {
Params* p = tjp->result();
/*
* Input: (M_ * m) × (N_ * n) matrix
*/
n_rows_f1 = p->M_;
n_rows_f2 = p->m;
n_cols_f1 = p->N_;
n_cols_f2 = p->n;
printf("[>>] TRNS | n_dpus=%u n_rows_f1=%u n_rows_f2=%u n_cols_f1=%u n_cols_f2=%u\n", NR_DPUS, n_rows_f1, n_rows_f2, n_cols_f1, n_cols_f2);
}
advice call("% trns_host(...)") : after() {
printf("[--] TRNS | n_dpus=%u n_rows_f1=%u n_rows_f2=%u n_cols_f1=%u n_cols_f2=%u\n", NR_DPUS, n_rows_f1, n_rows_f2, n_cols_f1, n_cols_f2);
}
advice execution("% main(...)") : after() {
printf("[<<] TRNS | n_dpus=%u n_rows_f1=%u n_rows_f2=%u n_cols_f1=%u n_cols_f2=%u\n", NR_DPUS, n_rows_f1, n_rows_f2, n_cols_f1, n_cols_f2);
}
};
|