diff options
| author | Chris Wilson <chris@chris-wilson.co.uk> | 2013-08-22 01:30:02 +0100 | 
|---|---|---|
| committer | Chris Wilson <chris@chris-wilson.co.uk> | 2013-08-22 03:25:02 +0100 | 
| commit | b20a6b827924bfaf0bf92a1eae818385f90dfbea (patch) | |
| tree | ffbb5dbdd32021cfc48f5fe8f159c1d546e1d445 /overlay | |
| parent | 4572067c88276c6f72e33e6b204527f8a7ba4481 (diff) | |
overlay: Remove busy estimation
Too inaccurate to be useful.
Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Diffstat (limited to 'overlay')
| -rw-r--r-- | overlay/gpu-perf.c | 57 | ||||
| -rw-r--r-- | overlay/gpu-perf.h | 5 | 
2 files changed, 6 insertions, 56 deletions
| diff --git a/overlay/gpu-perf.c b/overlay/gpu-perf.c index bbebc5a8..d5e461c6 100644 --- a/overlay/gpu-perf.c +++ b/overlay/gpu-perf.c @@ -241,51 +241,6 @@ static int request_add(struct gpu_perf *gp, const void *event)  	return 1;  } -static int busy_start(struct gpu_perf *gp, const void *event) -{ -	const struct sample_event *sample = event; -	struct gpu_perf_comm *comm; -	struct gpu_perf_time *busy; - -	comm = lookup_comm(gp, sample->pid); -	if (comm == NULL) -		return 0; - -	busy = malloc(sizeof(*busy)); -	if (busy == NULL) -		return 0; - -	busy->ring = sample->raw[1]; -	busy->seqno = sample->raw[2]; -	busy->time = sample->time; -	busy->comm = comm; -	busy->next = gp->busy; -	gp->busy = busy; - -	return 0; -} - -static int busy_end(struct gpu_perf *gp, const void *event) -{ -	const struct sample_event *sample = event; -	struct gpu_perf_time *busy, **prev; - -	for (prev = &gp->busy; (busy = *prev) != NULL; prev = &busy->next) { -		if (busy->ring != sample->raw[1]) -			continue; - -		if (busy->seqno != sample->raw[2]) -			continue; - -		busy->comm->busy_time += sample->time - busy->time; -		*prev = busy->next; -		free(busy); -		return 1; -	} - -	return 0; -} -  static int flip_complete(struct gpu_perf *gp, const void *event)  {  	const struct sample_event *sample = event; @@ -309,11 +264,10 @@ static int wait_begin(struct gpu_perf *gp, const void *event)  		return 0;  	wait->comm = comm; -	wait->ring = sample->raw[1];  	wait->seqno = sample->raw[2];  	wait->time = sample->time; -	wait->next = gp->wait; -	gp->wait = wait; +	wait->next = gp->wait[sample->raw[1]]; +	gp->wait[sample->raw[1]] = wait;  	return 0;  } @@ -323,10 +277,7 @@ static int wait_end(struct gpu_perf *gp, const void *event)  	const struct sample_event *sample = event;  	struct gpu_perf_time *wait, **prev; -	for (prev = &gp->wait; (wait = *prev) != NULL; prev = &wait->next) { -		if (wait->ring != sample->raw[1]) -			continue; - +	for (prev = &gp->wait[sample->raw[1]]; (wait = *prev) != NULL; prev = &wait->next) {  		if (wait->seqno != sample->raw[2])  			continue; @@ -346,8 +297,6 @@ void gpu_perf_init(struct gpu_perf *gp, unsigned flags)  	gp->page_size = getpagesize();  	perf_tracepoint_open(gp, "i915", "i915_gem_request_add", request_add); -	if (perf_tracepoint_open(gp, "i915", "i915_gem_ring_complete", busy_end) == 0) -		perf_tracepoint_open(gp, "i915", "i915_gem_ring_dispatch", busy_start);  	if (perf_tracepoint_open(gp, "i915", "i915_gem_request_wait_begin", wait_begin) == 0)  		perf_tracepoint_open(gp, "i915", "i915_gem_request_wait_end", wait_end);  	perf_tracepoint_open(gp, "i915", "i915_flip_complete", flip_complete); diff --git a/overlay/gpu-perf.h b/overlay/gpu-perf.h index 56c783d6..3b91bd59 100644 --- a/overlay/gpu-perf.h +++ b/overlay/gpu-perf.h @@ -27,6 +27,8 @@  #include <stdint.h> +#define MAX_RINGS 4 +  struct gpu_perf {  	int page_size;  	int nr_cpus; @@ -52,10 +54,9 @@ struct gpu_perf {  	struct gpu_perf_time {  		struct gpu_perf_time *next;  		struct gpu_perf_comm *comm; -		int ring;  		uint32_t seqno;  		uint64_t time; -	} *wait, *busy; +	} *wait[MAX_RINGS];  };  void gpu_perf_init(struct gpu_perf *gp, unsigned flags); | 
