blob: 42ec64688b917bbf45aa484d696354027370f0f3 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
|
#ifndef _KBENCH_H_
#define _KBENCH_H_
#include <stdint.h>
uintptr_t KBenchTS(void);
uintptr_t KBenchElapsedCounts(uintptr_t t0, uintptr_t t1);
double KBenchElapsedTime(uintptr_t t0, uintptr_t t1);
#ifdef KBENCH_IMPLEMENTATION
#ifdef __linux__
#include <time.h>
#endif
uintptr_t KBenchTS(void)
{
uintptr_t result = 0;
// macos+aarch64+clang: use CNTVCT_EL0
#if defined(__APPLE__) && defined(__clang__) && defined(__aarch64__)
__asm__ volatile("mrs %0, CNTVCT_EL0" : "=r"(result) :: "memory");
#endif
// linux: use clock_gettime
#if defined(__linux__)
struct timespec ts;
clock_gettime(CLOCK_MONOTONIC, &ts);
result = (uintptr_t)ts.tv_sec * 1e9 + (uintptr_t)ts.tv_nsec;
#endif
return result;
}
uintptr_t KBenchElapsedCounts(uintptr_t t0, uintptr_t t1)
{
// @@
return t1 - t0;
}
double KBenchElapsedTime(uintptr_t t0, uintptr_t t1)
{
uintptr_t elapsed = KBenchElapsedCounts(t0, t1);
double val = 0.0f;
// macos+aarch64+clang: divide by CNTFRQ_EL0
#if defined(__APPLE__) && defined(__clang__) && defined(__aarch64__)
uintptr_t cntfreq_el0 = 0;
__asm__ volatile("mrs %0, CNTFRQ_EL0" : "=r"(cntfreq_el0) :: "memory");
val = (double)elapsed / (double)cntfreq_el0;
#endif
// linux: use clock_gettime
#if defined(__linux__) && defined(__GNUC__) && defined(__amd64__)
val = (double)elapsed / 1e9;
#endif
return val;
}
#endif // KBENCH_IMPLEMENTATION
#endif // _KBENCH_H_
|