benchmark.cc (1389B)
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 | // TODO #if !defined( _MSC_VER ) #include <x86intrin.h> #endif #include "intrinsics.h" #include "benchmark.h" #include "platform_atomic.h" #define MAX_TIMERS 4096 struct Timer { NONCOPYABLE( Timer ); Timer() { } const char * fn; const char * file; int line; // TODO: use Stats atomic_u64 total_clocks; atomic_u64 num_calls; }; static Timer timers[ 4096 ]; static atomic_u32 num_timers( 0 ); ScopedTimer::ScopedTimer( u32 idx ) { initial_clock = __rdtsc(); timer_idx = idx; } ScopedTimer::~ScopedTimer() { u64 dt = __rdtsc() - initial_clock; fetch_add_relaxed( &timers[ timer_idx ].total_clocks, dt ); fetch_add_relaxed( &timers[ timer_idx ].num_calls, 1 ); } u32 benchmark_new_timer( const char * fn, const char * file, int line ) { u32 idx = fetch_add_relaxed( &num_timers, 1 ); assert( idx < MAX_TIMERS ); Timer & info = timers[ idx ]; info.fn = fn; info.file = file; info.line = line; store_relaxed( &info.total_clocks, 0 ); store_release( &info.num_calls, 0 ); return idx; } void benchmark_print_timers() { u32 n = load_acquire( &num_timers ); for( u32 i = 0; i < n; i++ ) { u64 clocks = load_relaxed( &timers[ i ].total_clocks ); u64 calls = load_relaxed( &timers[ i ].num_calls ); printf( "%s (%s:%d) called %lu times, %lu clocks, %lu avg\n", timers[ i ].fn, timers[ i ].file, timers[ i ].line, calls, clocks, clocks / calls ); } } |