On Mon, Jun 28, 2021 at 07:45:31PM +0000, Ruhl, Michael J wrote:
> >-----Original Message-----
> >From: Thomas Hellström <thomas.hellst...@linux.intel.com>
> >Sent: Monday, June 28, 2021 10:46 AM
> >To: intel-...@lists.freedesktop.org; dri-devel@lists.freedesktop.org
> >Cc: Auld, Matthew <matthew.a...@intel.com>;
> >maarten.lankho...@linux.intel.com; Thomas Hellström
> ><thomas.hellst...@linux.intel.com>; Ruhl; Ruhl, Michael J
> ><michael.j.r...@intel.com>
> >Subject: [PATCH v3 4/5] drm/i915/gem: Fix same-driver-another-instance
> >dma-buf export
> >
> >If our exported dma-bufs are imported by another instance of our driver,
> >that instance will typically have the imported dma-bufs locked during
> >map_attachment(). But the exporter also locks the same reservation
> >object in the map_dma_buf() callback, which leads to recursive locking.
> >
> >Add a live selftest to catch this case, and as a workaround until
> >we fully support dynamic import and export, declare the exporter dynamic
> >by providing NOP pin() and unpin() functions. This means our map_dma_buf()
> >callback will *always* get called locked, and by pinning unconditionally
> >in i915_gem_map_dma_buf() we make sure we don't need to use the
> >move_notify() functionality which is not yet implemented.
> 
> An interesting abuse of the interface, but it seems reasonable (for now) to 
> me.

Hm I'm not sure this is the best interface abuse, since if we combine this
with amdgpu it goes boom. Also I thought the dynamic stuff is optional (or
is that only for the importer).

What I discussed a bit with Maarten on irc is to essentially emulate the
rules of what a dynamic exporter would end up with with a non-dynamic
importer: pin/unpin the buffer at attach/detach time. We could fake this
in our attach/detach callbacks.

At least I don't think it's the locking changes that saves us here, but
the caching of the sgt list in attach/detach. As long as we hand-roll that
we should be fine. So hand-rolling that feels like the best option to make
sure we're not making this worse, as long as we haven't fully validated
the true dynamic importer _and_ exporter case.

Cheers, Daniel

> Reviewed-by: Michael J. Ruhl <michael.j.r...@intel.com>
> 
> Mike
> 
> >Reported-by: Ruhl, Michael J <michael.j.r...@intel.com>
> >Cc: Ruhl, Michael J <michael.j.r...@intel.com>
> >Signed-off-by: Thomas Hellström <thomas.hellst...@linux.intel.com>
> >---
> > drivers/gpu/drm/i915/gem/i915_gem_dmabuf.c    | 31 ++++++-
> > .../drm/i915/gem/selftests/i915_gem_dmabuf.c  | 81
> >++++++++++++++++++-
> > 2 files changed, 108 insertions(+), 4 deletions(-)
> >
> >diff --git a/drivers/gpu/drm/i915/gem/i915_gem_dmabuf.c
> >b/drivers/gpu/drm/i915/gem/i915_gem_dmabuf.c
> >index 616c3a2f1baf..1d1eeb167d28 100644
> >--- a/drivers/gpu/drm/i915/gem/i915_gem_dmabuf.c
> >+++ b/drivers/gpu/drm/i915/gem/i915_gem_dmabuf.c
> >@@ -12,6 +12,8 @@
> > #include "i915_gem_object.h"
> > #include "i915_scatterlist.h"
> >
> >+I915_SELFTEST_DECLARE(static bool force_different_devices;)
> >+
> > static struct drm_i915_gem_object *dma_buf_to_obj(struct dma_buf *buf)
> > {
> >     return to_intel_bo(buf->priv);
> >@@ -25,7 +27,9 @@ static struct sg_table *i915_gem_map_dma_buf(struct
> >dma_buf_attachment *attachme
> >     struct scatterlist *src, *dst;
> >     int ret, i;
> >
> >-    ret = i915_gem_object_pin_pages_unlocked(obj);
> >+    assert_object_held(obj);
> >+
> >+    ret = i915_gem_object_pin_pages(obj);
> >     if (ret)
> >             goto err;
> >
> >@@ -168,6 +172,26 @@ static int i915_gem_end_cpu_access(struct dma_buf
> >*dma_buf, enum dma_data_direct
> >     return err;
> > }
> >
> >+/*
> >+ * As a workaround until we fully support dynamic import and export,
> >+ * declare the exporter dynamic by providing NOP pin() and unpin()
> >functions.
> >+ * This means our i915_gem_map_dma_buf() callback will *always* get
> >called
> >+ * locked, and by pinning unconditionally in i915_gem_map_dma_buf() we
> >make
> >+ * sure we don't need to use the move_notify() functionality which is
> >+ * not yet implemented. Typically for the same-driver-another-instance case,
> >+ * i915_gem_map_dma_buf() will be called at importer attach time and the
> >+ * mapped sg_list will be cached by the dma-buf core for the
> >+ * duration of the attachment.
> >+ */
> >+static int i915_gem_dmabuf_pin(struct dma_buf_attachment *attach)
> >+{
> >+    return 0;
> >+}
> >+
> >+static void i915_gem_dmabuf_unpin(struct dma_buf_attachment *attach)
> >+{
> >+}
> >+
> > static const struct dma_buf_ops i915_dmabuf_ops =  {
> >     .map_dma_buf = i915_gem_map_dma_buf,
> >     .unmap_dma_buf = i915_gem_unmap_dma_buf,
> >@@ -177,6 +201,8 @@ static const struct dma_buf_ops i915_dmabuf_ops =  {
> >     .vunmap = i915_gem_dmabuf_vunmap,
> >     .begin_cpu_access = i915_gem_begin_cpu_access,
> >     .end_cpu_access = i915_gem_end_cpu_access,
> >+    .pin = i915_gem_dmabuf_pin,
> >+    .unpin = i915_gem_dmabuf_unpin,
> > };
> >
> > struct dma_buf *i915_gem_prime_export(struct drm_gem_object
> >*gem_obj, int flags)
> >@@ -241,7 +267,8 @@ struct drm_gem_object
> >*i915_gem_prime_import(struct drm_device *dev,
> >     if (dma_buf->ops == &i915_dmabuf_ops) {
> >             obj = dma_buf_to_obj(dma_buf);
> >             /* is it from our device? */
> >-            if (obj->base.dev == dev) {
> >+            if (obj->base.dev == dev &&
> >+                !I915_SELFTEST_ONLY(force_different_devices)) {
> >                     /*
> >                      * Importing dmabuf exported from out own gem
> >increases
> >                      * refcount on gem itself instead of f_count of
> >dmabuf.
> >diff --git a/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
> >b/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
> >index dd74bc09ec88..24735d6c12a2 100644
> >--- a/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
> >+++ b/drivers/gpu/drm/i915/gem/selftests/i915_gem_dmabuf.c
> >@@ -35,7 +35,7 @@ static int igt_dmabuf_export(void *arg)
> > static int igt_dmabuf_import_self(void *arg)
> > {
> >     struct drm_i915_private *i915 = arg;
> >-    struct drm_i915_gem_object *obj;
> >+    struct drm_i915_gem_object *obj, *import_obj;
> >     struct drm_gem_object *import;
> >     struct dma_buf *dmabuf;
> >     int err;
> >@@ -65,14 +65,90 @@ static int igt_dmabuf_import_self(void *arg)
> >             err = -EINVAL;
> >             goto out_import;
> >     }
> >+    import_obj = to_intel_bo(import);
> >+
> >+    i915_gem_object_lock(import_obj, NULL);
> >+    err = ____i915_gem_object_get_pages(import_obj);
> >+    i915_gem_object_unlock(import_obj);
> >+    if (err) {
> >+            pr_err("Same object dma-buf get_pages failed!\n");
> >+            goto out_import;
> >+    }
> >
> >     err = 0;
> > out_import:
> >-    i915_gem_object_put(to_intel_bo(import));
> >+    i915_gem_object_put(import_obj);
> >+out_dmabuf:
> >+    dma_buf_put(dmabuf);
> >+out:
> >+    i915_gem_object_put(obj);
> >+    return err;
> >+}
> >+
> >+static int igt_dmabuf_import_same_driver(void *arg)
> >+{
> >+    struct drm_i915_private *i915 = arg;
> >+    struct drm_i915_gem_object *obj, *import_obj;
> >+    struct drm_gem_object *import;
> >+    struct dma_buf *dmabuf;
> >+    int err;
> >+
> >+    force_different_devices = true;
> >+    obj = i915_gem_object_create_shmem(i915, PAGE_SIZE);
> >+    if (IS_ERR(obj))
> >+            goto out_ret;
> >+
> >+    dmabuf = i915_gem_prime_export(&obj->base, 0);
> >+    if (IS_ERR(dmabuf)) {
> >+            pr_err("i915_gem_prime_export failed with err=%d\n",
> >+                   (int)PTR_ERR(dmabuf));
> >+            err = PTR_ERR(dmabuf);
> >+            goto out;
> >+    }
> >+
> >+    import = i915_gem_prime_import(&i915->drm, dmabuf);
> >+    if (IS_ERR(import)) {
> >+            pr_err("i915_gem_prime_import failed with err=%d\n",
> >+                   (int)PTR_ERR(import));
> >+            err = PTR_ERR(import);
> >+            goto out_dmabuf;
> >+    }
> >+
> >+    if (import == &obj->base) {
> >+            pr_err("i915_gem_prime_import reused gem object!\n");
> >+            err = -EINVAL;
> >+            goto out_import;
> >+    }
> >+
> >+    import_obj = to_intel_bo(import);
> >+
> >+    i915_gem_object_lock(import_obj, NULL);
> >+    err = ____i915_gem_object_get_pages(import_obj);
> >+    if (err) {
> >+            pr_err("Different objects dma-buf get_pages failed!\n");
> >+            i915_gem_object_unlock(import_obj);
> >+            goto out_import;
> >+    }
> >+
> >+    /*
> >+     * If the exported object is not in system memory, something
> >+     * weird is going on. TODO: When p2p is supported, this is no
> >+     * longer considered weird.
> >+     */
> >+    if (obj->mm.region != i915->mm.regions[INTEL_REGION_SMEM]) {
> >+            pr_err("Exported dma-buf is not in system memory\n");
> >+            err = -EINVAL;
> >+    }
> >+    i915_gem_object_unlock(import_obj);
> >+
> >+out_import:
> >+    i915_gem_object_put(import_obj);
> > out_dmabuf:
> >     dma_buf_put(dmabuf);
> > out:
> >     i915_gem_object_put(obj);
> >+out_ret:
> >+    force_different_devices = false;
> >     return err;
> > }
> >
> >@@ -286,6 +362,7 @@ int i915_gem_dmabuf_live_selftests(struct
> >drm_i915_private *i915)
> > {
> >     static const struct i915_subtest tests[] = {
> >             SUBTEST(igt_dmabuf_export),
> >+            SUBTEST(igt_dmabuf_import_same_driver),
> >     };
> >
> >     return i915_subtests(tests, i915);
> >--
> >2.31.1
> 

-- 
Daniel Vetter
Software Engineer, Intel Corporation
http://blog.ffwll.ch

Reply via email to