diff mbox series

[v2,2/4] drm/i915/selftests: exercise GPU access from the importer

Message ID 20221028155029.494736-2-matthew.auld@intel.com (mailing list archive)
State New, archived
Headers show
Series [v2,1/4] drm/i915/dmabuf: fix sg_table handling in map_dma_buf | expand

Commit Message

Matthew Auld Oct. 28, 2022, 3:50 p.m. UTC
Using PAGE_SIZE here potentially hides issues so bump that to something
larger. This should also make it possible for iommu to coalesce entries
for us. With that in place verify we can write from the GPU using the
importers sg_table, followed by checking that our writes match when read
from the CPU side.

v2: Switch over to igt_gpu_fill_dw(), which looks to be more widely
supported than the migrate stuff (at least OOTB).

References: https://gitlab.freedesktop.org/drm/intel/-/issues/7306
Signed-off-by: Matthew Auld <matthew.auld@intel.com>
Cc: Lionel Landwerlin <lionel.g.landwerlin@intel.com>
Cc: Tvrtko Ursulin <tvrtko.ursulin@linux.intel.com>
Cc: Ville Syrjälä <ville.syrjala@linux.intel.com>
Cc: Michael J. Ruhl <michael.j.ruhl@intel.com>
---
 .../drm/i915/gem/selftests/i915_gem_dmabuf.c  | 79 ++++++++++++++++++-
 1 file changed, 78 insertions(+), 1 deletion(-)

Comments

Ruhl, Michael J Oct. 28, 2022, 4:10 p.m. UTC | #1
>-----Original Message-----
>From: Auld, Matthew <matthew.auld@intel.com>
>Sent: Friday, October 28, 2022 11:50 AM
>To: intel-gfx@lists.freedesktop.org
>Cc: Landwerlin, Lionel G <lionel.g.landwerlin@intel.com>; Tvrtko Ursulin
><tvrtko.ursulin@linux.intel.com>; Ville Syrjälä <ville.syrjala@linux.intel.com>;
>Ruhl, Michael J <michael.j.ruhl@intel.com>
>Subject: [PATCH v2 2/4] drm/i915/selftests: exercise GPU access from the
>importer
>
>Using PAGE_SIZE here potentially hides issues so bump that to something
>larger. This should also make it possible for iommu to coalesce entries
>for us. With that in place verify we can write from the GPU using the
>importers sg_table, followed by checking that our writes match when read
>from the CPU side.
>
>v2: Switch over to igt_gpu_fill_dw(), which looks to be more widely
>supported than the migrate stuff (at least OOTB).
>
>References: https://gitlab.freedesktop.org/drm/intel/-/issues/7306
>Signed-off-by: Matthew Auld <matthew.auld@intel.com>
>Cc: Lionel Landwerlin <lionel.g.landwerlin@intel.com>
>Cc: Tvrtko Ursulin <tvrtko.ursulin@linux.intel.com>
>Cc: Ville Syrjälä <ville.syrjala@linux.intel.com>
>Cc: Michael J. Ruhl <michael.j.ruhl@intel.com>
>---
> .../drm/i915/gem/selftests/i915_gem_dmabuf.c  | 79
>++++++++++++++++++-
> 1 file changed, 78 insertions(+), 1 deletion(-)
>
>diff --git a/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
>b/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
>index f2f3cfad807b..e57f9390076c 100644
>--- a/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
>+++ b/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
>@@ -6,8 +6,12 @@
>
> #include "i915_drv.h"
> #include "i915_selftest.h"
>+#include "gem/i915_gem_context.h"
>
>+#include "mock_context.h"
> #include "mock_dmabuf.h"
>+#include "igt_gem_utils.h"
>+#include "selftests/mock_drm.h"
> #include "selftests/mock_gem_device.h"
>
> static int igt_dmabuf_export(void *arg)
>@@ -140,6 +144,75 @@ static int
>igt_dmabuf_import_same_driver_lmem(void *arg)
> 	return err;
> }
>
>+static int verify_access(struct drm_i915_private *i915,
>+			 struct drm_i915_gem_object *native_obj,
>+			 struct drm_i915_gem_object *import_obj)
>+{
>+	struct i915_gem_engines_iter it;
>+	struct i915_gem_context *ctx;
>+	struct intel_context *ce;
>+	struct i915_vma *vma;
>+	struct file *file;
>+	u32 *vaddr;
>+	int err = 0, i;
>+
>+	file = mock_file(i915);
>+	if (IS_ERR(file))
>+		return PTR_ERR(file);
>+
>+	ctx = live_context(i915, file);
>+	if (IS_ERR(ctx)) {
>+		err = PTR_ERR(ctx);
>+		goto out_file;
>+	}
>+
>+	for_each_gem_engine(ce, i915_gem_context_lock_engines(ctx), it) {
>+		if (intel_engine_can_store_dword(ce->engine))
>+			break;
>+	}
>+	i915_gem_context_unlock_engines(ctx);
>+	if (!ce)
>+		goto out_file;
>+
>+	vma = i915_vma_instance(import_obj, ce->vm, NULL);
>+	if (IS_ERR(vma)) {
>+		err = PTR_ERR(vma);
>+		goto out_file;
>+	}
>+
>+	err = i915_vma_pin(vma, 0, 0, PIN_USER);
>+	if (err)
>+		goto out_file;
>+
>+	err = igt_gpu_fill_dw(ce, vma, 0,
>+			      vma->size >> PAGE_SHIFT, 0xdeadbeaf);
>+	i915_vma_unpin(vma);
>+	if (err)
>+		goto out_file;
>+
>+	err = i915_gem_object_wait(import_obj, 0,
>MAX_SCHEDULE_TIMEOUT);
>+	if (err)
>+		goto out_file;
>+
>+	vaddr = i915_gem_object_pin_map_unlocked(native_obj,
>I915_MAP_WB);
>+	if (IS_ERR(vaddr)) {
>+		err = PTR_ERR(vaddr);
>+		goto out_file;
>+	}
>+
>+	for (i = 0; i < native_obj->base.size / sizeof(u32); i += PAGE_SIZE /
>sizeof(u32)) {
>+		if (vaddr[i] != 0xdeadbeaf) {
>+			pr_err("Data mismatch [%d]=%u\n", i, vaddr[i]);
>+			err = -EINVAL;
>+			goto out_file;
>+		}

Not sure what timing issues are related to this test, but this loop could have
some impact (takes a long time, assuming the object is LMEM).

Would checking the beginning, middle and end of each page be any less
beneficial than the current check?

Not a suggested change, but just a thought to ponder if the timing becomes
an issue...

This test looks reasonable to me.

Reviewed-by: Michael J. Ruhl <michael.j.ruhl@intel.com>

M

>+	}
>+
>+out_file:
>+	fput(file);
>+	return err;
>+}
>+
> static int igt_dmabuf_import_same_driver(struct drm_i915_private *i915,
> 					 struct intel_memory_region
>**regions,
> 					 unsigned int num_regions)
>@@ -154,7 +227,7 @@ static int igt_dmabuf_import_same_driver(struct
>drm_i915_private *i915,
>
> 	force_different_devices = true;
>
>-	obj = __i915_gem_object_create_user(i915, PAGE_SIZE,
>+	obj = __i915_gem_object_create_user(i915, SZ_8M,
> 					    regions, num_regions);
> 	if (IS_ERR(obj)) {
> 		pr_err("__i915_gem_object_create_user failed with
>err=%ld\n",
>@@ -206,6 +279,10 @@ static int igt_dmabuf_import_same_driver(struct
>drm_i915_private *i915,
>
> 	i915_gem_object_unlock(import_obj);
>
>+	err = verify_access(i915, obj, import_obj);
>+	if (err)
>+		goto out_import;
>+
> 	/* Now try a fake an importer */
> 	import_attach = dma_buf_attach(dmabuf, obj->base.dev->dev);
> 	if (IS_ERR(import_attach)) {
>--
>2.37.3
Matthew Auld Oct. 28, 2022, 4:26 p.m. UTC | #2
On 28/10/2022 17:10, Ruhl, Michael J wrote:
>> -----Original Message-----
>> From: Auld, Matthew <matthew.auld@intel.com>
>> Sent: Friday, October 28, 2022 11:50 AM
>> To: intel-gfx@lists.freedesktop.org
>> Cc: Landwerlin, Lionel G <lionel.g.landwerlin@intel.com>; Tvrtko Ursulin
>> <tvrtko.ursulin@linux.intel.com>; Ville Syrjälä <ville.syrjala@linux.intel.com>;
>> Ruhl, Michael J <michael.j.ruhl@intel.com>
>> Subject: [PATCH v2 2/4] drm/i915/selftests: exercise GPU access from the
>> importer
>>
>> Using PAGE_SIZE here potentially hides issues so bump that to something
>> larger. This should also make it possible for iommu to coalesce entries
>> for us. With that in place verify we can write from the GPU using the
>> importers sg_table, followed by checking that our writes match when read
>>from the CPU side.
>>
>> v2: Switch over to igt_gpu_fill_dw(), which looks to be more widely
>> supported than the migrate stuff (at least OOTB).
>>
>> References: https://gitlab.freedesktop.org/drm/intel/-/issues/7306
>> Signed-off-by: Matthew Auld <matthew.auld@intel.com>
>> Cc: Lionel Landwerlin <lionel.g.landwerlin@intel.com>
>> Cc: Tvrtko Ursulin <tvrtko.ursulin@linux.intel.com>
>> Cc: Ville Syrjälä <ville.syrjala@linux.intel.com>
>> Cc: Michael J. Ruhl <michael.j.ruhl@intel.com>
>> ---
>> .../drm/i915/gem/selftests/i915_gem_dmabuf.c  | 79
>> ++++++++++++++++++-
>> 1 file changed, 78 insertions(+), 1 deletion(-)
>>
>> diff --git a/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
>> b/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
>> index f2f3cfad807b..e57f9390076c 100644
>> --- a/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
>> +++ b/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
>> @@ -6,8 +6,12 @@
>>
>> #include "i915_drv.h"
>> #include "i915_selftest.h"
>> +#include "gem/i915_gem_context.h"
>>
>> +#include "mock_context.h"
>> #include "mock_dmabuf.h"
>> +#include "igt_gem_utils.h"
>> +#include "selftests/mock_drm.h"
>> #include "selftests/mock_gem_device.h"
>>
>> static int igt_dmabuf_export(void *arg)
>> @@ -140,6 +144,75 @@ static int
>> igt_dmabuf_import_same_driver_lmem(void *arg)
>> 	return err;
>> }
>>
>> +static int verify_access(struct drm_i915_private *i915,
>> +			 struct drm_i915_gem_object *native_obj,
>> +			 struct drm_i915_gem_object *import_obj)
>> +{
>> +	struct i915_gem_engines_iter it;
>> +	struct i915_gem_context *ctx;
>> +	struct intel_context *ce;
>> +	struct i915_vma *vma;
>> +	struct file *file;
>> +	u32 *vaddr;
>> +	int err = 0, i;
>> +
>> +	file = mock_file(i915);
>> +	if (IS_ERR(file))
>> +		return PTR_ERR(file);
>> +
>> +	ctx = live_context(i915, file);
>> +	if (IS_ERR(ctx)) {
>> +		err = PTR_ERR(ctx);
>> +		goto out_file;
>> +	}
>> +
>> +	for_each_gem_engine(ce, i915_gem_context_lock_engines(ctx), it) {
>> +		if (intel_engine_can_store_dword(ce->engine))
>> +			break;
>> +	}
>> +	i915_gem_context_unlock_engines(ctx);
>> +	if (!ce)
>> +		goto out_file;
>> +
>> +	vma = i915_vma_instance(import_obj, ce->vm, NULL);
>> +	if (IS_ERR(vma)) {
>> +		err = PTR_ERR(vma);
>> +		goto out_file;
>> +	}
>> +
>> +	err = i915_vma_pin(vma, 0, 0, PIN_USER);
>> +	if (err)
>> +		goto out_file;
>> +
>> +	err = igt_gpu_fill_dw(ce, vma, 0,
>> +			      vma->size >> PAGE_SHIFT, 0xdeadbeaf);
>> +	i915_vma_unpin(vma);
>> +	if (err)
>> +		goto out_file;
>> +
>> +	err = i915_gem_object_wait(import_obj, 0,
>> MAX_SCHEDULE_TIMEOUT);
>> +	if (err)
>> +		goto out_file;
>> +
>> +	vaddr = i915_gem_object_pin_map_unlocked(native_obj,
>> I915_MAP_WB);
>> +	if (IS_ERR(vaddr)) {
>> +		err = PTR_ERR(vaddr);
>> +		goto out_file;
>> +	}
>> +
>> +	for (i = 0; i < native_obj->base.size / sizeof(u32); i += PAGE_SIZE /
>> sizeof(u32)) {
>> +		if (vaddr[i] != 0xdeadbeaf) {
>> +			pr_err("Data mismatch [%d]=%u\n", i, vaddr[i]);
>> +			err = -EINVAL;
>> +			goto out_file;
>> +		}
> 
> Not sure what timing issues are related to this test, but this loop could have
> some impact (takes a long time, assuming the object is LMEM).
> 
> Would checking the beginning, middle and end of each page be any less
> beneficial than the current check?

We are currently just sampling the first dword of each page (that could 
perhaps be random instead). We could go further and sample a selection 
of random pages instead, if speed is a concern. Although here the pages 
must be in system memory. dma-buf in upstream will currently force 
migrate to system memory.

> 
> Not a suggested change, but just a thought to ponder if the timing becomes
> an issue...
> 
> This test looks reasonable to me.
> 
> Reviewed-by: Michael J. Ruhl <michael.j.ruhl@intel.com>
> 
> M
> 
>> +	}
>> +
>> +out_file:
>> +	fput(file);
>> +	return err;
>> +}
>> +
>> static int igt_dmabuf_import_same_driver(struct drm_i915_private *i915,
>> 					 struct intel_memory_region
>> **regions,
>> 					 unsigned int num_regions)
>> @@ -154,7 +227,7 @@ static int igt_dmabuf_import_same_driver(struct
>> drm_i915_private *i915,
>>
>> 	force_different_devices = true;
>>
>> -	obj = __i915_gem_object_create_user(i915, PAGE_SIZE,
>> +	obj = __i915_gem_object_create_user(i915, SZ_8M,
>> 					    regions, num_regions);
>> 	if (IS_ERR(obj)) {
>> 		pr_err("__i915_gem_object_create_user failed with
>> err=%ld\n",
>> @@ -206,6 +279,10 @@ static int igt_dmabuf_import_same_driver(struct
>> drm_i915_private *i915,
>>
>> 	i915_gem_object_unlock(import_obj);
>>
>> +	err = verify_access(i915, obj, import_obj);
>> +	if (err)
>> +		goto out_import;
>> +
>> 	/* Now try a fake an importer */
>> 	import_attach = dma_buf_attach(dmabuf, obj->base.dev->dev);
>> 	if (IS_ERR(import_attach)) {
>> --
>> 2.37.3
>
diff mbox series

Patch

diff --git a/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c b/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
index f2f3cfad807b..e57f9390076c 100644
--- a/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
+++ b/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
@@ -6,8 +6,12 @@ 
 
 #include "i915_drv.h"
 #include "i915_selftest.h"
+#include "gem/i915_gem_context.h"
 
+#include "mock_context.h"
 #include "mock_dmabuf.h"
+#include "igt_gem_utils.h"
+#include "selftests/mock_drm.h"
 #include "selftests/mock_gem_device.h"
 
 static int igt_dmabuf_export(void *arg)
@@ -140,6 +144,75 @@  static int igt_dmabuf_import_same_driver_lmem(void *arg)
 	return err;
 }
 
+static int verify_access(struct drm_i915_private *i915,
+			 struct drm_i915_gem_object *native_obj,
+			 struct drm_i915_gem_object *import_obj)
+{
+	struct i915_gem_engines_iter it;
+	struct i915_gem_context *ctx;
+	struct intel_context *ce;
+	struct i915_vma *vma;
+	struct file *file;
+	u32 *vaddr;
+	int err = 0, i;
+
+	file = mock_file(i915);
+	if (IS_ERR(file))
+		return PTR_ERR(file);
+
+	ctx = live_context(i915, file);
+	if (IS_ERR(ctx)) {
+		err = PTR_ERR(ctx);
+		goto out_file;
+	}
+
+	for_each_gem_engine(ce, i915_gem_context_lock_engines(ctx), it) {
+		if (intel_engine_can_store_dword(ce->engine))
+			break;
+	}
+	i915_gem_context_unlock_engines(ctx);
+	if (!ce)
+		goto out_file;
+
+	vma = i915_vma_instance(import_obj, ce->vm, NULL);
+	if (IS_ERR(vma)) {
+		err = PTR_ERR(vma);
+		goto out_file;
+	}
+
+	err = i915_vma_pin(vma, 0, 0, PIN_USER);
+	if (err)
+		goto out_file;
+
+	err = igt_gpu_fill_dw(ce, vma, 0,
+			      vma->size >> PAGE_SHIFT, 0xdeadbeaf);
+	i915_vma_unpin(vma);
+	if (err)
+		goto out_file;
+
+	err = i915_gem_object_wait(import_obj, 0, MAX_SCHEDULE_TIMEOUT);
+	if (err)
+		goto out_file;
+
+	vaddr = i915_gem_object_pin_map_unlocked(native_obj, I915_MAP_WB);
+	if (IS_ERR(vaddr)) {
+		err = PTR_ERR(vaddr);
+		goto out_file;
+	}
+
+	for (i = 0; i < native_obj->base.size / sizeof(u32); i += PAGE_SIZE / sizeof(u32)) {
+		if (vaddr[i] != 0xdeadbeaf) {
+			pr_err("Data mismatch [%d]=%u\n", i, vaddr[i]);
+			err = -EINVAL;
+			goto out_file;
+		}
+	}
+
+out_file:
+	fput(file);
+	return err;
+}
+
 static int igt_dmabuf_import_same_driver(struct drm_i915_private *i915,
 					 struct intel_memory_region **regions,
 					 unsigned int num_regions)
@@ -154,7 +227,7 @@  static int igt_dmabuf_import_same_driver(struct drm_i915_private *i915,
 
 	force_different_devices = true;
 
-	obj = __i915_gem_object_create_user(i915, PAGE_SIZE,
+	obj = __i915_gem_object_create_user(i915, SZ_8M,
 					    regions, num_regions);
 	if (IS_ERR(obj)) {
 		pr_err("__i915_gem_object_create_user failed with err=%ld\n",
@@ -206,6 +279,10 @@  static int igt_dmabuf_import_same_driver(struct drm_i915_private *i915,
 
 	i915_gem_object_unlock(import_obj);
 
+	err = verify_access(i915, obj, import_obj);
+	if (err)
+		goto out_import;
+
 	/* Now try a fake an importer */
 	import_attach = dma_buf_attach(dmabuf, obj->base.dev->dev);
 	if (IS_ERR(import_attach)) {