blob: 121bf31df06187d5c0bf93c2b1de6c294bccc9bf (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
|
#ifndef _COMMON_H_
#define _COMMON_H_
// Transfer size between MRAM and WRAM.
// BL is the log2 of that size. The build may supply it (e.g. -DBL=10);
// when it does not, it falls back to 8, i.e. BLOCK_SIZE == 256.
#ifndef BL
#define BL 8
#endif
#define BLOCK_SIZE_LOG2 BL
#define BLOCK_SIZE (1 << BLOCK_SIZE_LOG2)
// Data type
// The element type T is selected at build time by defining one of the
// selector macros below (e.g. -DINT64); the first match in this order wins.
// DIV is the shift amount that divides by sizeof(T).
// If no selector is defined, T and DIV are left undefined.
//
// Every selector is tested with defined() so that an empty definition
// (#define UINT64) works the same as -DUINT64 and -Wundef stays quiet.
#include <stdint.h> // fixed-width integer types used for T and in this header
#if defined(UINT32)
#define T uint32_t
#define DIV 2 // Shift right to divide by sizeof(T)
#elif defined(UINT64)
#define T uint64_t
#define DIV 3 // Shift right to divide by sizeof(T)
#elif defined(INT32)
#define T int32_t
#define DIV 2 // Shift right to divide by sizeof(T)
#elif defined(INT64)
#define T int64_t
#define DIV 3 // Shift right to divide by sizeof(T)
#elif defined(FLOAT)
#define T float
#define DIV 2 // Shift right to divide by sizeof(T)
#elif defined(DOUBLE)
#define T double
#define DIV 3 // Shift right to divide by sizeof(T)
#elif defined(CHAR)
#define T char
#define DIV 0 // Shift right to divide by sizeof(T)
#elif defined(SHORT)
#define T short
#define DIV 1 // Shift right to divide by sizeof(T)
#endif
// Structures used by both the host and the dpu to communicate information

// Argument record (host/DPU shared layout: keep field order and types as-is).
typedef struct {
    uint32_t size;      // NOTE(review): presumably the input size; units not visible here
    enum kernels {
        kernel1 = 0,    // the only kernel declared in this header
        nr_kernels      // count of kernels; must remain the last enumerator
    } kernel;           // presumably selects which kernel to run — confirm against callers
    T t_count;          // NOTE(review): meaning is not visible in this header
} dpu_arguments_t;
// Results record (dpu_results_t). The field order and types are left exactly
// as they are because this layout is presumably shared between host and DPU
// code — confirm before changing it.
typedef struct {
// NOTE(review): presumably a cycle count from the performance counters (see PERF) — confirm
uint64_t cycles;
// Value of the configured element type T; its exact meaning is not visible in this header.
T t_count;
} dpu_results_t;
// Build-time feature switches.
// PERF, PERF_SYNC and ENERGY may each be supplied by the build
// (e.g. -DPERF=1); any that is absent defaults to 0.
#if !defined(PERF)
#define PERF 0 // Use perfcounters?
#endif
#if !defined(PERF_SYNC)
#define PERF_SYNC 0 // Use perfcounters to time sync primitives?
#endif
#if !defined(ENERGY)
#define ENERGY 0
#endif
// PRINT has no #ifndef guard: it is always defined here as 0.
#define PRINT 0
// ANSI escape sequences for colouring terminal output: ESC[31m selects a red
// foreground, ESC[32m a green foreground, and ESC[0m resets all attributes.
// They are string literals, so they can be concatenated with adjacent
// literals, e.g. ANSI_COLOR_RED "text" ANSI_COLOR_RESET.
#define ANSI_COLOR_RED "\x1b[31m"
#define ANSI_COLOR_GREEN "\x1b[32m"
#define ANSI_COLOR_RESET "\x1b[0m"
// divceil(n, m): ceiling of n / m for n >= 0 and m > 0.
// n == 0 is handled explicitly: the plain ((n)-1)/(m)+1 form yields 1 for a
// signed zero and wraps around for an unsigned zero, instead of 0.
// For n != 0 the result is exactly that of the ((n)-1)/(m)+1 form.
// Note: n is evaluated twice, so do not pass an expression with side effects.
#define divceil(n, m) ((n) == 0 ? 0 : ((n) - 1) / (m) + 1)
// roundup(n, m): the next multiple of m strictly above n's containing
// multiple, i.e. ((n / m) + 1) * m, for n >= 0 and m > 0.
// When n is already a multiple of m the result is n + m, not n, so callers
// that want "round up only if needed" must test n % m themselves first.
// Arguments are parenthesised so that expressions such as roundup(a + b, c)
// expand with the intended precedence. m is evaluated more than once.
#define roundup(n, m) (((n) / (m)) * (m) + (m))
#endif
|