diff mbox series

drm/i915/selftest: Check that GPR are restored across noa_wait

Message ID 20200709215331.19994-1-chris@chris-wilson.co.uk (mailing list archive)
State New, archived
Headers show
Series drm/i915/selftest: Check that GPR are restored across noa_wait | expand

Commit Message

Chris Wilson July 9, 2020, 9:53 p.m. UTC
Perf implements a GPU delay (noa_wait) by looping until the CS timestamp
has passed a certain point. This use MI_MATH and the general purpose
registers of the user's context, and since it is clobbering the user
state it must carefully save and restore the user's data around the
noa_wait. We can verify this by loading some values in the GPR that we
know will be clobbered the noa_wait, and then inspecting the GPR after
the noa_wait completes and confirming that have been restored.

Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
Cc: Umesh Nerlige Ramappa <umesh.nerlige.ramappa@intel.com>
Cc: Lionel Landwerlin <lionel.g.landwerlin@intel.com>
---
 drivers/gpu/drm/i915/selftests/i915_perf.c | 124 +++++++++++++++++++++
 1 file changed, 124 insertions(+)

Comments

Lionel Landwerlin July 10, 2020, 5:34 a.m. UTC | #1
On 10/07/2020 00:53, Chris Wilson wrote:
> Perf implements a GPU delay (noa_wait) by looping until the CS timestamp
> has passed a certain point. This use MI_MATH and the general purpose
> registers of the user's context, and since it is clobbering the user
> state it must carefully save and restore the user's data around the
> noa_wait. We can verify this by loading some values in the GPR that we
> know will be clobbered the noa_wait, and then inspecting the GPR after
> the noa_wait completes and confirming that have been restored.
>
> Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
> Cc: Umesh Nerlige Ramappa <umesh.nerlige.ramappa@intel.com>
> Cc: Lionel Landwerlin <lionel.g.landwerlin@intel.com>

Reviewed-by: Lionel Landwerlin <lionel.g.landwerlin@intel.com>


Thanks a lot!

-Lionel

> ---
>   drivers/gpu/drm/i915/selftests/i915_perf.c | 124 +++++++++++++++++++++
>   1 file changed, 124 insertions(+)
>
> diff --git a/drivers/gpu/drm/i915/selftests/i915_perf.c b/drivers/gpu/drm/i915/selftests/i915_perf.c
> index be54570c407c..be63cfe82feb 100644
> --- a/drivers/gpu/drm/i915/selftests/i915_perf.c
> +++ b/drivers/gpu/drm/i915/selftests/i915_perf.c
> @@ -280,11 +280,135 @@ static int live_noa_delay(void *arg)
>   	return err;
>   }
>   
> +static int live_noa_gpr(void *arg)
> +{
> +	struct drm_i915_private *i915 = arg;
> +	struct i915_perf_stream *stream;
> +	struct intel_context *ce;
> +	struct i915_request *rq;
> +	u32 *cs, *store;
> +	void *scratch;
> +	u32 gpr0;
> +	int err;
> +	int i;
> +
> +	/* Check that the delay does not clobber user context state (GPR) */
> +
> +	stream = test_stream(&i915->perf);
> +	if (!stream)
> +		return -ENOMEM;
> +
> +	gpr0 = i915_mmio_reg_offset(GEN8_RING_CS_GPR(stream->engine->mmio_base, 0));
> +
> +	ce = intel_context_create(stream->engine);
> +	if (IS_ERR(ce)) {
> +		err = PTR_ERR(ce);
> +		goto out;
> +	}
> +
> +	scratch = kmap(ce->vm->scratch[0].base.page);
> +	memset(scratch, POISON_FREE, PAGE_SIZE);
> +
> +	rq = intel_context_create_request(ce);
> +	if (IS_ERR(rq)) {
> +		err = PTR_ERR(rq);
> +		goto out_ce;
> +	}
> +	i915_request_get(rq);
> +
> +	if (rq->engine->emit_init_breadcrumb) {
> +		err = rq->engine->emit_init_breadcrumb(rq);
> +		if (err) {
> +			i915_request_add(rq);
> +			goto out_rq;
> +		}
> +	}
> +
> +	cs = intel_ring_begin(rq, 2 * 32 + 2);
> +	if (IS_ERR(cs)) {
> +		i915_request_add(rq);
> +		goto out_rq;
> +	}
> +
> +	*cs++ = MI_LOAD_REGISTER_IMM(32);
> +	for (i = 0; i < 32; i++) {
> +		*cs++ = gpr0 + i * sizeof(u32);
> +		*cs++ = STACK_MAGIC;
> +	}
> +	*cs++ = MI_NOOP;
> +	intel_ring_advance(rq, cs);
> +
> +	err = rq->engine->emit_bb_start(rq,
> +					i915_ggtt_offset(stream->noa_wait), 0,
> +					I915_DISPATCH_SECURE);
> +	if (err) {
> +		i915_request_add(rq);
> +		goto out_rq;
> +	}
> +
> +	store = memset32(rq->engine->status_page.addr + 512, 0, 32);
> +	for (i = 0; i < 32; i++) {
> +		u32 cmd;
> +
> +		cs = intel_ring_begin(rq, 4);
> +		if (IS_ERR(cs)) {
> +			i915_request_add(rq);
> +			goto out_rq;
> +		}
> +
> +		cmd = MI_STORE_REGISTER_MEM;
> +		if (INTEL_GEN(i915) >= 8)
> +			cmd++;
> +		cmd |= MI_USE_GGTT;
> +
> +		*cs++ = cmd;
> +		*cs++ = gpr0 + i * sizeof(u32);
> +		*cs++ = i915_ggtt_offset(rq->engine->status_page.vma) +
> +			offset_in_page(store) +
> +			i * sizeof(u32);
> +		*cs++ = 0;
> +		intel_ring_advance(rq, cs);
> +	}
> +
> +	i915_request_add(rq);
> +
> +	if (i915_request_wait(rq, I915_WAIT_INTERRUPTIBLE, HZ / 2) < 0) {
> +		intel_gt_set_wedged(stream->engine->gt);
> +		err = -EIO;
> +		goto out_rq;
> +	}
> +
> +	for (i = 0; i < 32; i++) {
> +		if (store[i] == STACK_MAGIC)
> +			continue;
> +
> +		pr_err("GPR[%d] lost, found:%08x, expected:%08x!\n",
> +		       i, store[i], STACK_MAGIC);
> +		err = -EINVAL;
> +	}
> +
> +	if (memchr_inv(scratch, POISON_FREE, PAGE_SIZE)) {
> +		pr_err("scratch page overwritten!\n");
> +		igt_hexdump(scratch, 4096);
> +		err = -EINVAL;
> +	}
> +
> +out_rq:
> +	i915_request_put(rq);
> +out_ce:
> +	kunmap(ce->vm->scratch[0].base.page);
> +	intel_context_put(ce);
> +out:
> +	stream_destroy(stream);
> +	return err;
> +}
> +
>   int i915_perf_live_selftests(struct drm_i915_private *i915)
>   {
>   	static const struct i915_subtest tests[] = {
>   		SUBTEST(live_sanitycheck),
>   		SUBTEST(live_noa_delay),
> +		SUBTEST(live_noa_gpr),
>   	};
>   	struct i915_perf *perf = &i915->perf;
>   	int err;
diff mbox series

Patch

diff --git a/drivers/gpu/drm/i915/selftests/i915_perf.c b/drivers/gpu/drm/i915/selftests/i915_perf.c
index be54570c407c..be63cfe82feb 100644
--- a/drivers/gpu/drm/i915/selftests/i915_perf.c
+++ b/drivers/gpu/drm/i915/selftests/i915_perf.c
@@ -280,11 +280,135 @@  static int live_noa_delay(void *arg)
 	return err;
 }
 
+static int live_noa_gpr(void *arg)
+{
+	struct drm_i915_private *i915 = arg;
+	struct i915_perf_stream *stream;
+	struct intel_context *ce;
+	struct i915_request *rq;
+	u32 *cs, *store;
+	void *scratch;
+	u32 gpr0;
+	int err;
+	int i;
+
+	/* Check that the delay does not clobber user context state (GPR) */
+
+	stream = test_stream(&i915->perf);
+	if (!stream)
+		return -ENOMEM;
+
+	gpr0 = i915_mmio_reg_offset(GEN8_RING_CS_GPR(stream->engine->mmio_base, 0));
+
+	ce = intel_context_create(stream->engine);
+	if (IS_ERR(ce)) {
+		err = PTR_ERR(ce);
+		goto out;
+	}
+
+	scratch = kmap(ce->vm->scratch[0].base.page);
+	memset(scratch, POISON_FREE, PAGE_SIZE);
+
+	rq = intel_context_create_request(ce);
+	if (IS_ERR(rq)) {
+		err = PTR_ERR(rq);
+		goto out_ce;
+	}
+	i915_request_get(rq);
+
+	if (rq->engine->emit_init_breadcrumb) {
+		err = rq->engine->emit_init_breadcrumb(rq);
+		if (err) {
+			i915_request_add(rq);
+			goto out_rq;
+		}
+	}
+
+	cs = intel_ring_begin(rq, 2 * 32 + 2);
+	if (IS_ERR(cs)) {
+		i915_request_add(rq);
+		goto out_rq;
+	}
+
+	*cs++ = MI_LOAD_REGISTER_IMM(32);
+	for (i = 0; i < 32; i++) {
+		*cs++ = gpr0 + i * sizeof(u32);
+		*cs++ = STACK_MAGIC;
+	}
+	*cs++ = MI_NOOP;
+	intel_ring_advance(rq, cs);
+
+	err = rq->engine->emit_bb_start(rq,
+					i915_ggtt_offset(stream->noa_wait), 0,
+					I915_DISPATCH_SECURE);
+	if (err) {
+		i915_request_add(rq);
+		goto out_rq;
+	}
+
+	store = memset32(rq->engine->status_page.addr + 512, 0, 32);
+	for (i = 0; i < 32; i++) {
+		u32 cmd;
+
+		cs = intel_ring_begin(rq, 4);
+		if (IS_ERR(cs)) {
+			i915_request_add(rq);
+			goto out_rq;
+		}
+
+		cmd = MI_STORE_REGISTER_MEM;
+		if (INTEL_GEN(i915) >= 8)
+			cmd++;
+		cmd |= MI_USE_GGTT;
+
+		*cs++ = cmd;
+		*cs++ = gpr0 + i * sizeof(u32);
+		*cs++ = i915_ggtt_offset(rq->engine->status_page.vma) +
+			offset_in_page(store) +
+			i * sizeof(u32);
+		*cs++ = 0;
+		intel_ring_advance(rq, cs);
+	}
+
+	i915_request_add(rq);
+
+	if (i915_request_wait(rq, I915_WAIT_INTERRUPTIBLE, HZ / 2) < 0) {
+		intel_gt_set_wedged(stream->engine->gt);
+		err = -EIO;
+		goto out_rq;
+	}
+
+	for (i = 0; i < 32; i++) {
+		if (store[i] == STACK_MAGIC)
+			continue;
+
+		pr_err("GPR[%d] lost, found:%08x, expected:%08x!\n",
+		       i, store[i], STACK_MAGIC);
+		err = -EINVAL;
+	}
+
+	if (memchr_inv(scratch, POISON_FREE, PAGE_SIZE)) {
+		pr_err("scratch page overwritten!\n");
+		igt_hexdump(scratch, 4096);
+		err = -EINVAL;
+	}
+
+out_rq:
+	i915_request_put(rq);
+out_ce:
+	kunmap(ce->vm->scratch[0].base.page);
+	intel_context_put(ce);
+out:
+	stream_destroy(stream);
+	return err;
+}
+
 int i915_perf_live_selftests(struct drm_i915_private *i915)
 {
 	static const struct i915_subtest tests[] = {
 		SUBTEST(live_sanitycheck),
 		SUBTEST(live_noa_delay),
+		SUBTEST(live_noa_gpr),
 	};
 	struct i915_perf *perf = &i915->perf;
 	int err;