All of lore.kernel.org
 help / color / mirror / Atom feed
* [PATCH i-g-t 01/24] i915/gem_exec_latency: Measure the latency of context switching
@ 2019-03-22  9:21 ` Chris Wilson
  0 siblings, 0 replies; 113+ messages in thread
From: Chris Wilson @ 2019-03-22  9:21 UTC (permalink / raw)
  To: intel-gfx; +Cc: igt-dev

Measure the baseline latency between contexts in order to directly
compare that with the additional cost of preemption.

Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
---
 tests/i915/gem_exec_latency.c | 145 ++++++++++++++++++++++++++++++++++
 1 file changed, 145 insertions(+)

diff --git a/tests/i915/gem_exec_latency.c b/tests/i915/gem_exec_latency.c
index f308e0851..04ec7d9d2 100644
--- a/tests/i915/gem_exec_latency.c
+++ b/tests/i915/gem_exec_latency.c
@@ -629,6 +629,142 @@ rthog_latency_on_ring(int fd, unsigned int engine, const char *name, unsigned in
 	munmap(results, MMAP_SZ);
 }
 
+static void context_switch(int i915,
+			   unsigned int engine, const char *name,
+			   unsigned int flags)
+{
+	struct drm_i915_gem_exec_object2 obj[2];
+	struct drm_i915_gem_relocation_entry reloc[5];
+	struct drm_i915_gem_execbuffer2 eb;
+	uint32_t *cs, *bbe, *results, v;
+	unsigned int mmio_base;
+	struct igt_mean mean;
+	uint32_t ctx[2];
+
+	/* XXX i915_query()! */
+	switch (engine) {
+	case I915_EXEC_DEFAULT:
+	case I915_EXEC_RENDER:
+		mmio_base = 0x2000;
+		break;
+#if 0
+	case I915_EXEC_BSD:
+		mmio_base = 0x12000;
+		break;
+#endif
+	case I915_EXEC_BLT:
+		mmio_base = 0x22000;
+		break;
+
+	case I915_EXEC_VEBOX:
+		if (intel_gen(intel_get_drm_devid(i915)) >= 11)
+			mmio_base = 0x1d8000;
+		else
+			mmio_base = 0x1a000;
+		break;
+
+	default:
+		igt_skip("mmio base not known\n");
+	}
+
+	for (int i = 0; i < ARRAY_SIZE(ctx); i++)
+		ctx[i] = gem_context_create(i915);
+
+	if (flags & PREEMPT) {
+		gem_context_set_priority(i915, ctx[0], -1023);
+		gem_context_set_priority(i915, ctx[1], +1023);
+	}
+
+	memset(obj, 0, sizeof(obj));
+	obj[0].handle = gem_create(i915, 4096);
+	gem_set_caching(i915, obj[0].handle, 1);
+	results = gem_mmap__cpu(i915, obj[0].handle, 0, 4096, PROT_READ);
+	gem_set_domain(i915, obj[0].handle, I915_GEM_DOMAIN_CPU, 0);
+
+	obj[1].handle = gem_create(i915, 4096);
+	memset(reloc,0, sizeof(reloc));
+	obj[1].relocation_count = ARRAY_SIZE(reloc);
+	obj[1].relocs_ptr = to_user_pointer(reloc);
+	bbe = gem_mmap__wc(i915, obj[1].handle, 0, 4096, PROT_WRITE);
+	gem_set_domain(i915, obj[1].handle,
+		       I915_GEM_DOMAIN_WC, I915_GEM_DOMAIN_WC);
+
+	cs = bbe;
+	*cs++ = 0x5 << 23;
+	*cs++ = 0x24 << 23 | 2; /* SRM */
+	*cs++ = mmio_base + 0x358; /* TIMESTAMP */
+	reloc[0].target_handle = obj[0].handle;
+	reloc[0].offset = (cs - bbe) * sizeof(*cs);
+	*cs++ = 0;
+	*cs++ = 0;
+	*cs++ = MI_BATCH_BUFFER_START | 1;
+	reloc[1].target_handle = obj[1].handle;
+	reloc[1].offset = (cs - bbe) * sizeof(*cs);
+	*cs++ = 0;
+	*cs++ = 0;
+
+	cs = bbe + 64;
+	*cs++ = 0x24 << 23 | 2; /* SRM */
+	*cs++ = mmio_base + 0x358; /* TIMESTAMP */
+	reloc[2].target_handle = obj[0].handle;
+	reloc[2].offset = (cs - bbe) * sizeof(*cs);
+	*cs++ = reloc[2].delta = 4;
+	*cs++ = 0;
+	*cs++ = 0x29 << 23 | 2; /* LRM */
+	*cs++ = mmio_base + 0x600; /* GPR0 */
+	reloc[3].target_handle = obj[0].handle;
+	reloc[3].offset = (cs - bbe) * sizeof(*cs);
+	*cs++ = 0;
+	*cs++ = 0;
+	*cs++ = 0x24 << 23 | 2; /* SRM */
+	*cs++ = mmio_base + 0x600; /* GPR0 */
+	reloc[4].target_handle = obj[0].handle;
+	reloc[4].offset = (cs - bbe) * sizeof(*cs);
+	*cs++ = reloc[4].delta = 8;
+	*cs++ = 0;
+	*cs++ = 0xa << 23;
+
+	memset(&eb, 0, sizeof(eb));
+	eb.buffers_ptr = to_user_pointer(obj);
+	eb.buffer_count = ARRAY_SIZE(obj);
+	eb.flags = engine;
+	eb.flags |= LOCAL_I915_EXEC_NO_RELOC;
+
+	v = 0;
+	igt_mean_init(&mean);
+	igt_until_timeout(5) {
+		eb.rsvd1 = ctx[0];
+		eb.batch_start_offset = 0;
+		gem_execbuf(i915, &eb);
+
+		while (results[0] == v)
+			igt_assert(gem_bo_busy(i915, obj[1].handle));
+
+		eb.rsvd1 = ctx[1];
+		eb.batch_start_offset = 64 * sizeof(*cs);
+		gem_execbuf(i915, &eb);
+
+		*bbe = 0xa << 23;
+		gem_sync(i915, obj[1].handle);
+		*bbe = 0x5 << 23;
+
+		v = results[0];
+		igt_mean_add(&mean, (results[1] - results[2]) * rcs_clock);
+	}
+	igt_info("%s context switch latency%s: %.2f±%.2fus\n",
+		 name, flags & PREEMPT ? " (preempt)" : "",
+		 1e-3 * igt_mean_get(&mean),
+		 1e-3 * sqrt(igt_mean_get_variance(&mean)));
+	munmap(results, 4096);
+	munmap(bbe, 4096);
+
+	for (int i = 0; i < ARRAY_SIZE(obj); i++)
+		gem_close(i915, obj[i].handle);
+
+	for (int i = 0; i < ARRAY_SIZE(ctx); i++)
+		gem_context_destroy(i915, ctx[i]);
+}
+
 static double clockrate(int i915, int reg)
 {
 	volatile uint32_t *mmio;
@@ -754,12 +890,21 @@ igt_main
 							  e->exec_id | e->flags,
 							  e->name, CORK);
 
+				igt_subtest_f("%s-cs", e->name)
+					context_switch(device,
+						       e->exec_id | e->flags,
+						       e->name, 0);
 				igt_subtest_group {
 					igt_fixture {
 						gem_require_contexts(device);
 						igt_require(gem_scheduler_has_preemption(device));
 					}
 
+					igt_subtest_f("%s-cs-preempt", e->name)
+						context_switch(device,
+								e->exec_id | e->flags,
+								e->name, PREEMPT);
+
 					igt_subtest_f("%s-preemption", e->name)
 						latency_from_ring(device,
 								  e->exec_id | e->flags,
-- 
2.20.1

_______________________________________________
Intel-gfx mailing list
Intel-gfx@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/intel-gfx

^ permalink raw reply related	[flat|nested] 113+ messages in thread

end of thread, other threads:[~2019-03-26 15:54 UTC | newest]

Thread overview: 113+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2019-03-22  9:21 [PATCH i-g-t 01/24] i915/gem_exec_latency: Measure the latency of context switching Chris Wilson
2019-03-22  9:21 ` [igt-dev] " Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 02/24] lib: Add GPU power measurement Chris Wilson
2019-03-22  9:21   ` [Intel-gfx] " Chris Wilson
2019-03-26  8:36   ` [igt-dev] " Tvrtko Ursulin
2019-03-26  8:36     ` Tvrtko Ursulin
2019-03-26  8:49     ` Chris Wilson
2019-03-26  8:49       ` Chris Wilson
2019-03-26  9:18   ` [PATCH i-g-t v2] " Chris Wilson
2019-03-26  9:18     ` [igt-dev] " Chris Wilson
2019-03-26  9:52     ` Tvrtko Ursulin
2019-03-26  9:52       ` Tvrtko Ursulin
2019-03-26 10:06       ` Chris Wilson
2019-03-26 10:06         ` Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 03/24] i915/gem_exec_schedule: Measure semaphore power consumption Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-26  8:46   ` Tvrtko Ursulin
2019-03-26  8:46     ` [Intel-gfx] " Tvrtko Ursulin
2019-03-26  9:23     ` Chris Wilson
2019-03-26  9:23       ` Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 04/24] i915/gem_exec_whisper: Measure total power consumed Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-26  8:47   ` Tvrtko Ursulin
2019-03-26  8:47     ` Tvrtko Ursulin
2019-03-22  9:21 ` [PATCH i-g-t 05/24] i915/gem_exec_schedule: Verify that using HW semaphores doesn't block Chris Wilson
2019-03-22  9:21   ` [Intel-gfx] " Chris Wilson
2019-03-26  9:19   ` [igt-dev] " Tvrtko Ursulin
2019-03-26  9:19     ` Tvrtko Ursulin
2019-03-26 10:03     ` Chris Wilson
2019-03-26 10:03       ` [Intel-gfx] " Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 06/24] i915/gem_exec_nop: poll-sequential requires ordering between rings Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-26  9:38   ` Tvrtko Ursulin
2019-03-26  9:38     ` Tvrtko Ursulin
2019-03-22  9:21 ` [PATCH i-g-t 07/24] i915/gem_sync: Make switch-default asymmetric Chris Wilson
2019-03-22  9:21   ` [Intel-gfx] " Chris Wilson
2019-03-26  9:57   ` [igt-dev] " Tvrtko Ursulin
2019-03-26  9:57     ` [Intel-gfx] " Tvrtko Ursulin
2019-03-22  9:21 ` [PATCH i-g-t 08/24] i915/gem_ctx_param: Remove kneecapping Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-26  9:58   ` Tvrtko Ursulin
2019-03-26  9:58     ` Tvrtko Ursulin
2019-03-22  9:21 ` [PATCH i-g-t 09/24] i915/gem_exec_big: Add a single shot test Chris Wilson
2019-03-22  9:21   ` [Intel-gfx] " Chris Wilson
2019-03-26 10:06   ` [igt-dev] " Tvrtko Ursulin
2019-03-26 10:06     ` Tvrtko Ursulin
2019-03-26 10:21     ` Chris Wilson
2019-03-26 10:21       ` Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 10/24] kms_fence_pin_leak: Ask for the GPU before use Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-26 10:10   ` Tvrtko Ursulin
2019-03-26 10:10     ` Tvrtko Ursulin
2019-03-22  9:21 ` [PATCH i-g-t 11/24] drm-uapi: Import i915_drm.h upto 53073249452d Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 12/24] lib/i915: Improve gem_context error messages Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-26 10:14   ` Tvrtko Ursulin
2019-03-26 10:14     ` Tvrtko Ursulin
2019-03-22  9:21 ` [PATCH i-g-t 13/24] i915/gem_ctx_param: Test set/get (copy) VM Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-26 10:22   ` Tvrtko Ursulin
2019-03-26 10:22     ` Tvrtko Ursulin
2019-03-26 10:33     ` Tvrtko Ursulin
2019-03-26 10:33       ` Tvrtko Ursulin
2019-03-26 10:51       ` Chris Wilson
2019-03-26 10:51         ` Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 14/24] i915/gem_ctx_create: Basic checks for constructor properties Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-26 10:46   ` Tvrtko Ursulin
2019-03-26 10:46     ` Tvrtko Ursulin
2019-03-26 11:06     ` Chris Wilson
2019-03-26 11:06       ` [Intel-gfx] " Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 15/24] i915: Add gem_vm_create Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-26 11:21   ` Tvrtko Ursulin
2019-03-26 11:21     ` Tvrtko Ursulin
2019-03-26 11:37     ` Chris Wilson
2019-03-26 11:37       ` Chris Wilson
2019-03-26 11:48       ` Tvrtko Ursulin
2019-03-26 11:48         ` Tvrtko Ursulin
2019-03-26 14:11         ` Chris Wilson
2019-03-26 14:11           ` Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 16/24] drm-uapi: Import i915_drm.h upto 364df3d04d51 Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 17/24] i915: Add gem_ctx_clone Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-26 15:44   ` Tvrtko Ursulin
2019-03-26 15:44     ` Tvrtko Ursulin
2019-03-26 15:49     ` Chris Wilson
2019-03-26 15:49       ` Chris Wilson
2019-03-26 15:54     ` Chris Wilson
2019-03-26 15:54       ` Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 18/24] i915: Exercise creating context with shared GTT Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 19/24] i915/gem_ctx_switch: Exercise queues Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 20/24] i915/gem_exec_whisper: Fork all-engine tests one-per-engine Chris Wilson
2019-03-22  9:21   ` [Intel-gfx] " Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 21/24] i915/gem_exec_whisper: debugfs/next_seqno is defunct Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 22/24] i915: Add gem_ctx_engines Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-22 16:40   ` Andi Shyti
2019-03-22 16:40     ` [igt-dev] " Andi Shyti
2019-03-22 16:48     ` Chris Wilson
2019-03-22 16:48       ` [igt-dev] " Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 23/24] i915: Add gem_exec_balancer Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-22  9:21 ` [PATCH i-g-t 24/24] i915/gem_exec_balancer: Exercise bonded pairs Chris Wilson
2019-03-22  9:21   ` [igt-dev] " Chris Wilson
2019-03-22 10:22 ` [igt-dev] ✓ Fi.CI.BAT: success for series starting with [i-g-t,01/24] i915/gem_exec_latency: Measure the latency of context switching Patchwork
2019-03-23  6:38 ` [igt-dev] ✓ Fi.CI.IGT: " Patchwork
2019-03-26 11:00 ` [igt-dev] ✗ Fi.CI.BAT: failure for series starting with [i-g-t,01/24] i915/gem_exec_latency: Measure the latency of context switching (rev2) Patchwork

This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.