From 55f2653aafa38ea1d53a43c104185218e0dad1f1 Mon Sep 17 00:00:00 2001 From: Birte Kristina Friesel Date: Wed, 14 May 2025 16:03:27 +0200 Subject: Use benchmark-specific input descriptions rather than opaque "#elements" --- include/dfatool_host_dpu.ah | 10 ++-------- 1 file changed, 2 insertions(+), 8 deletions(-) (limited to 'include') diff --git a/include/dfatool_host_dpu.ah b/include/dfatool_host_dpu.ah index 010c18c..c676f50 100644 --- a/include/dfatool_host_dpu.ah +++ b/include/dfatool_host_dpu.ah @@ -5,8 +5,6 @@ aspect DfatoolHostDPUTiming { struct timeval starttime; struct timeval stoptime; - unsigned long input_size; - unsigned int element_size; uint32_t n_ranks = 0; uint32_t n_dpus = 0; @@ -77,16 +75,12 @@ aspect DfatoolHostDPUTiming { tjp->proceed(); gettimeofday(&stoptime, NULL); double latency_us = (stoptime.tv_sec - starttime.tv_sec) * 1000000.0 + (stoptime.tv_usec - starttime.tv_usec); - printf("[::] dpu_launch @ %s:%d | n_dpus=%u n_ranks=%u e_kernel=kernel%d n_elements=%lu n_elements_per_dpu=%lu | latency_us=%f throughput_Mps=%f throughput_MiBps=%f\n", + printf("[::] dpu_launch @ %s:%d | n_dpus=%u n_ranks=%u e_kernel=kernel%d | latency_us=%f\n", tjp->filename(), tjp->line(), n_dpus, n_ranks, getKernel(), - input_size, - input_size / n_dpus, - latency_us, - input_size / latency_us, - input_size * element_size / (latency_us * M_to_Mi) + latency_us ); } -- cgit v1.2.3