igt/gem_ctx_switch: Measure qlen for timing loops

Some platforms may execute the heavy workload very slowly, such that a batch of 1024 takes tens of seconds, immediately overrunning the 5s timeout on a pass. Added up over a few dozen passes, this turns a 120-second test into a 10-minute one. Counter this by doing a warmup loop to estimate the appropriate queue length (qlen) for timing. Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk> Reviewed-by: Joonas Lahtinen <joonas.lahtinen@linux.intel.com>
author: Chris Wilson <chris@chris-wilson.co.uk> 2018-03-16 15:53:57 +0000
committer: Chris Wilson <chris@chris-wilson.co.uk> 2018-03-23 10:35:17 +0000
commit: 20b8799898c844ad57e9cdb0238ffb7a44140d89 (patch)
tree: f3685aa9119cfccefb799ea58dbf09113a177a13
parent: 23a91ab7aa2227fabb09b48301ab70904a70aea7 (diff)
1 files changed, 40 insertions, 3 deletions
diff --git a/tests/gem_ctx_switch.c b/tests/gem_ctx_switch.c
index 4efece14..766ff9ae 100644
--- a/tests/gem_ctx_switch.c
+++ b/tests/gem_ctx_switch.c
@@ -51,6 +51,38 @@ static double elapsed(const struct timespec *start, const struct timespec *end)
 		(end->tv_nsec - start->tv_nsec)*1e-9);
 }
 
+static int measure_qlen(int fd,
+			struct drm_i915_gem_execbuffer2 *execbuf,
+			unsigned int *engine, unsigned int nengine,
+			int timeout)
+{
+	const struct drm_i915_gem_exec_object2 * const obj =
+		(struct drm_i915_gem_exec_object2 *)(uintptr_t)execbuf->buffers_ptr;
+	int qlen = 64;
+
+	for (unsigned int n = 0; n < nengine; n++) {
+		uint64_t saved = execbuf->flags;
+		struct timespec tv = {};
+
+		execbuf->flags |= engine[n];
+
+		igt_nsec_elapsed(&tv);
+		for (int loop = 0; loop < qlen; loop++)
+			gem_execbuf(fd, execbuf);
+		gem_sync(fd, obj->handle);
+
+		execbuf->flags = saved;
+
+		/*
+		 * Be conservative and aim not to overshoot timeout, so scale
+		 * down by 8 for hopefully a max of 12.5% error.
+		 */
+		qlen = qlen * timeout * 1e9 / igt_nsec_elapsed(&tv) / 8 + 1;
+	}
+
+	return qlen;
+}
+
 static void single(int fd, uint32_t handle,
 		   const struct intel_execution_engine *e,
 		   unsigned flags,
@@ -141,7 +173,7 @@ static void all(int fd, uint32_t handle, unsigned flags, int timeout)
 	const char *name[16];
 	uint32_t contexts[65];
 	unsigned int nengine;
-	int n;
+	int n, qlen;
 
 	nengine = 0;
 	for_each_physical_engine(fd, e) {
@@ -165,6 +197,10 @@ static void all(int fd, uint32_t handle, unsigned flags, int timeout)
 	execbuf.flags |= LOCAL_I915_EXEC_NO_RELOC;
 	igt_require(__gem_execbuf(fd, &execbuf) == 0);
 	gem_sync(fd, handle);
+
+	qlen = measure_qlen(fd, &execbuf, engine, nengine, timeout);
+	igt_info("Using timing depth of %d batches\n", qlen);
+
 	execbuf.buffers_ptr = to_user_pointer(obj);
 	execbuf.buffer_count = 2;
 
@@ -184,11 +220,12 @@ static void all(int fd, uint32_t handle, unsigned flags, int timeout)
 
 				clock_gettime(CLOCK_MONOTONIC, &start);
 				do {
-					for (int loop = 0; loop < 1024; loop++) {
+					for (int loop = 0; loop < qlen; loop++) {
 						execbuf.rsvd1 = contexts[loop % nctx];
 						gem_execbuf(fd, &execbuf);
 					}
-					count += 1024;
+					count += qlen;
+					gem_sync(fd, obj[0].handle);
 					clock_gettime(CLOCK_MONOTONIC, &now);
 				} while (elapsed(&start, &now) < timeout);
 				gem_sync(fd, obj[0].handle);
author	Chris Wilson <chris@chris-wilson.co.uk>	2018-03-16 15:53:57 +0000
committer	Chris Wilson <chris@chris-wilson.co.uk>	2018-03-23 10:35:17 +0000
commit	20b8799898c844ad57e9cdb0238ffb7a44140d89 (patch)
tree	f3685aa9119cfccefb799ea58dbf09113a177a13
parent	23a91ab7aa2227fabb09b48301ab70904a70aea7 (diff)