You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
182 lines
4.6 KiB
182 lines
4.6 KiB
#include "cache.h" |
|
#include "thread-utils.h" |
|
#include "trace2/tr2_tgt.h" |
|
#include "trace2/tr2_tls.h" |
|
#include "trace2/tr2_tmr.h" |
|
|
|
/*
 * Two-way maximum / minimum of `a` and `b`.
 *
 * These are plain textual macros, so each argument may be evaluated
 * twice: only pass expressions that have no side effects.
 */
#define MY_MAX(a, b) ((a) > (b) ? (a) : (b))
#define MY_MIN(a, b) ((a) < (b) ? (a) : (b))
|
|
|
/* |
|
* A global timer block to aggregate values from the partial sums from |
|
* each thread. |
|
*/ |
|
static struct tr2_timer_block final_timer_block; /* access under tr2tls_mutex */ |
|
|
|
/* |
|
* Define metadata for each stopwatch timer. |
|
* |
|
* This array must match "enum trace2_timer_id" and the values |
|
* in "struct tr2_timer_block.timer[*]". |
|
*/ |
|
static struct tr2_timer_metadata tr2_timer_metadata[TRACE2_NUMBER_OF_TIMERS] = { |
|
[TRACE2_TIMER_ID_TEST1] = { |
|
.category = "test", |
|
.name = "test1", |
|
.want_per_thread_events = 0, |
|
}, |
|
[TRACE2_TIMER_ID_TEST2] = { |
|
.category = "test", |
|
.name = "test2", |
|
.want_per_thread_events = 1, |
|
}, |
|
|
|
/* Add additional metadata before here. */ |
|
}; |
|
|
|
void tr2_start_timer(enum trace2_timer_id tid) |
|
{ |
|
struct tr2tls_thread_ctx *ctx = tr2tls_get_self(); |
|
struct tr2_timer *t = &ctx->timer_block.timer[tid]; |
|
|
|
t->recursion_count++; |
|
if (t->recursion_count > 1) |
|
return; /* ignore recursive starts */ |
|
|
|
t->start_ns = getnanotime(); |
|
} |
|
|
|
void tr2_stop_timer(enum trace2_timer_id tid) |
|
{ |
|
struct tr2tls_thread_ctx *ctx = tr2tls_get_self(); |
|
struct tr2_timer *t = &ctx->timer_block.timer[tid]; |
|
uint64_t ns_now; |
|
uint64_t ns_interval; |
|
|
|
assert(t->recursion_count > 0); |
|
|
|
t->recursion_count--; |
|
if (t->recursion_count) |
|
return; /* still in recursive call(s) */ |
|
|
|
ns_now = getnanotime(); |
|
ns_interval = ns_now - t->start_ns; |
|
|
|
t->total_ns += ns_interval; |
|
|
|
/* |
|
* min_ns was initialized to zero (in the xcalloc()) rather |
|
* than UINT_MAX when the block of timers was allocated, |
|
* so we should always set both the min_ns and max_ns values |
|
* the first time that the timer is used. |
|
*/ |
|
if (!t->interval_count) { |
|
t->min_ns = ns_interval; |
|
t->max_ns = ns_interval; |
|
} else { |
|
t->min_ns = MY_MIN(ns_interval, t->min_ns); |
|
t->max_ns = MY_MAX(ns_interval, t->max_ns); |
|
} |
|
|
|
t->interval_count++; |
|
|
|
ctx->used_any_timer = 1; |
|
if (tr2_timer_metadata[tid].want_per_thread_events) |
|
ctx->used_any_per_thread_timer = 1; |
|
} |
|
|
|
void tr2_update_final_timers(void) |
|
{ |
|
struct tr2tls_thread_ctx *ctx = tr2tls_get_self(); |
|
enum trace2_timer_id tid; |
|
|
|
if (!ctx->used_any_timer) |
|
return; |
|
|
|
/* |
|
* Accessing `final_timer_block` requires holding `tr2tls_mutex`. |
|
* We assume that our caller is holding the lock. |
|
*/ |
|
|
|
for (tid = 0; tid < TRACE2_NUMBER_OF_TIMERS; tid++) { |
|
struct tr2_timer *t_final = &final_timer_block.timer[tid]; |
|
struct tr2_timer *t = &ctx->timer_block.timer[tid]; |
|
|
|
if (t->recursion_count) { |
|
/* |
|
* The current thread is exiting with |
|
* timer[tid] still running. |
|
* |
|
* Technically, this is a bug, but I'm going |
|
* to ignore it. |
|
* |
|
* I don't think it is worth calling die() |
|
* for. I don't think it is worth killing the |
|
* process for this bookkeeping error. We |
|
* might want to call warning(), but I'm going |
|
* to wait on that. |
|
* |
|
* The downside here is that total_ns won't |
|
* include the current open interval (now - |
|
* start_ns). I can live with that. |
|
*/ |
|
} |
|
|
|
if (!t->interval_count) |
|
continue; /* this timer was not used by this thread */ |
|
|
|
t_final->total_ns += t->total_ns; |
|
|
|
/* |
|
* final_timer_block.timer[tid].min_ns was initialized to |
|
* was initialized to zero rather than UINT_MAX, so we should |
|
* always set both the min_ns and max_ns values the first time |
|
* that we add a partial sum into it. |
|
*/ |
|
if (!t_final->interval_count) { |
|
t_final->min_ns = t->min_ns; |
|
t_final->max_ns = t->max_ns; |
|
} else { |
|
t_final->min_ns = MY_MIN(t_final->min_ns, t->min_ns); |
|
t_final->max_ns = MY_MAX(t_final->max_ns, t->max_ns); |
|
} |
|
|
|
t_final->interval_count += t->interval_count; |
|
} |
|
} |
|
|
|
/*
 * Report the calling thread's own timer values through `fn_apply`.
 *
 * A timer is reported only when its metadata requests per-thread events
 * and this thread completed at least one interval on it.  The callback
 * receives the timer's metadata, the thread's timer slot, and 0 as its
 * third argument.
 */
void tr2_emit_per_thread_timers(tr2_tgt_evt_timer_t *fn_apply)
{
	struct tr2tls_thread_ctx *self = tr2tls_get_self();
	enum trace2_timer_id tid;

	if (!self->used_any_per_thread_timer)
		return;

	for (tid = 0; tid < TRACE2_NUMBER_OF_TIMERS; tid++) {
		struct tr2_timer_metadata *meta = &tr2_timer_metadata[tid];
		struct tr2_timer *timer = &self->timer_block.timer[tid];

		if (!meta->want_per_thread_events)
			continue;
		if (!timer->interval_count)
			continue; /* not used by this thread */

		fn_apply(meta, timer, 0);
	}
}
|
|
|
/*
 * Report the aggregated timer values in `final_timer_block` through
 * `fn_apply`.
 *
 * Timers whose aggregated interval count is zero are skipped.  The
 * callback receives the timer's metadata, the aggregated timer slot,
 * and 1 as its third argument.
 *
 * `final_timer_block` may only be accessed with tr2tls_mutex held; this
 * function does not take the lock itself and assumes the caller
 * already holds it.
 */
void tr2_emit_final_timers(tr2_tgt_evt_timer_t *fn_apply)
{
	enum trace2_timer_id tid;

	for (tid = 0; tid < TRACE2_NUMBER_OF_TIMERS; tid++) {
		struct tr2_timer *sum = &final_timer_block.timer[tid];

		if (!sum->interval_count)
			continue; /* never used by any thread */

		fn_apply(&tr2_timer_metadata[tid], sum, 1);
	}
}
|
|
|