summaryrefslogtreecommitdiff
path: root/yuvbench/kbench.h
blob: 42ec64688b917bbf45aa484d696354027370f0f3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#ifndef _KBENCH_H_
#define _KBENCH_H_

#include <stdint.h>

uintptr_t KBenchTS(void);
uintptr_t KBenchElapsedCounts(uintptr_t t0, uintptr_t t1);
double KBenchElapsedTime(uintptr_t t0, uintptr_t t1);

#ifdef KBENCH_IMPLEMENTATION

#ifdef __linux__
#include <time.h>
#endif

uintptr_t KBenchTS(void)
{
    uintptr_t result = 0;
    // macos+aarch64+clang: use CNTVCT_EL0
#if defined(__APPLE__) && defined(__clang__) && defined(__aarch64__)
    __asm__ volatile("mrs %0, CNTVCT_EL0" : "=r"(result) :: "memory");
#endif
    // linux: use clock_gettime
#if defined(__linux__)
    struct timespec ts;
    clock_gettime(CLOCK_MONOTONIC, &ts);
    result = (uintptr_t)ts.tv_sec * 1e9 + (uintptr_t)ts.tv_nsec;
#endif
    return result;
}

uintptr_t KBenchElapsedCounts(uintptr_t t0, uintptr_t t1)
{
    // @@
    return t1 - t0;
}

double KBenchElapsedTime(uintptr_t t0, uintptr_t t1)
{
    uintptr_t elapsed = KBenchElapsedCounts(t0, t1);
    double val = 0.0f;
    // macos+aarch64+clang: divide by CNTFRQ_EL0
#if defined(__APPLE__) && defined(__clang__) && defined(__aarch64__)
    uintptr_t cntfreq_el0 = 0;
    __asm__ volatile("mrs %0, CNTFRQ_EL0" : "=r"(cntfreq_el0) :: "memory");
    val = (double)elapsed / (double)cntfreq_el0;
#endif
    // linux: use clock_gettime
#if defined(__linux__) && defined(__GNUC__) && defined(__amd64__)
    val = (double)elapsed / 1e9;
#endif
    return val;
}

#endif // KBENCH_IMPLEMENTATION
#endif // _KBENCH_H_