For our convenience, and to avoid frequent allocations, we placed some
of the lists we use for execbuf inside the common i915_vma struct. As
we look to parallelise execbuf, such fields, currently guarded by the
struct_mutex BKL, must be pulled under local control. So instead of
using the i915_vma as our primary means of tracking the user's list of
objects and their virtual mappings, we now use a local eb_vma that
carries the same lists as before (only now local rather than global).
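
To sketch the before/after (illustrative only, condensed from the diff
below): the transient execbuf state that was stashed in the shared
i915_vma,

	eb->vma[i] = vma;
	eb->flags[i] = entry->flags;
	vma->exec_flags = &eb->flags[i];	/* global, struct_mutex guarded */

becomes a per-execbuf array element owned by this caller alone:

	struct eb_vma *ev = &eb->vma[i];

	ev->vma = vma;			/* the underlying mapping */
	ev->exec = entry;		/* the user's execobj slot */
	ev->flags = entry->flags;	/* execbuf-local, no BKL required */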

Signed-off-by: Chris Wilson <ch...@chris-wilson.co.uk>
Cc: Maarten Lankhorst <maarten.lankho...@linux.intel.com>
---
 .../gpu/drm/i915/gem/i915_gem_execbuffer.c    | 271 +++++++++---------
 drivers/gpu/drm/i915/i915_vma.h               |  11 -
 2 files changed, 130 insertions(+), 152 deletions(-)

diff --git a/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c b/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c
index e4f5c269150a..8eb9c4e17514 100644
--- a/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c
+++ b/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c
@@ -27,6 +27,19 @@
 #include "i915_gem_ioctls.h"
 #include "i915_trace.h"
 
+struct eb_vma {
+       struct i915_vma *vma;
+       unsigned int flags;
+
+       /** This vma's place in the execbuf reservation list */
+       struct drm_i915_gem_exec_object2 *exec;
+       struct list_head bind_link;
+       struct list_head reloc_link;
+
+       struct hlist_node node;
+       u32 handle;
+};
+
 enum {
        FORCE_CPU_RELOC = 1,
        FORCE_GTT_RELOC,
@@ -219,15 +232,14 @@ struct i915_execbuffer {
        struct drm_file *file; /** per-file lookup tables and limits */
        struct drm_i915_gem_execbuffer2 *args; /** ioctl parameters */
        struct drm_i915_gem_exec_object2 *exec; /** ioctl execobj[] */
-       struct i915_vma **vma;
-       unsigned int *flags;
+       struct eb_vma *vma;
 
        struct intel_engine_cs *engine; /** engine to queue the request to */
        struct intel_context *context; /* logical state for the request */
        struct i915_gem_context *gem_context; /** caller's context */
 
        struct i915_request *request; /** our request to build */
-       struct i915_vma *batch; /** identity of the batch obj/vma */
+       struct eb_vma *batch; /** identity of the batch obj/vma */
 
        /** actual size of execobj[] as we may extend it for the cmdparser */
        unsigned int buffer_count;
@@ -275,8 +287,6 @@ struct i915_execbuffer {
        struct hlist_head *buckets; /** ht for relocation handles */
 };
 
-#define exec_entry(EB, VMA) (&(EB)->exec[(VMA)->exec_flags - (EB)->flags])
-
 /*
  * Used to convert any address to canonical form.
  * Starting from gen8, some commands (e.g. STATE_BASE_ADDRESS,
@@ -380,9 +390,9 @@ eb_vma_misplaced(const struct drm_i915_gem_exec_object2 *entry,
 static inline bool
 eb_pin_vma(struct i915_execbuffer *eb,
           const struct drm_i915_gem_exec_object2 *entry,
-          struct i915_vma *vma)
+          struct eb_vma *ev)
 {
-       unsigned int exec_flags = *vma->exec_flags;
+       struct i915_vma *vma = ev->vma;
        u64 pin_flags;
 
        if (vma->node.size)
@@ -391,24 +401,24 @@ eb_pin_vma(struct i915_execbuffer *eb,
                pin_flags = entry->offset & PIN_OFFSET_MASK;
 
        pin_flags |= PIN_USER | PIN_NOEVICT | PIN_OFFSET_FIXED;
-       if (unlikely(exec_flags & EXEC_OBJECT_NEEDS_GTT))
+       if (unlikely(ev->flags & EXEC_OBJECT_NEEDS_GTT))
                pin_flags |= PIN_GLOBAL;
 
        if (unlikely(i915_vma_pin(vma, 0, 0, pin_flags)))
                return false;
 
-       if (unlikely(exec_flags & EXEC_OBJECT_NEEDS_FENCE)) {
+       if (unlikely(ev->flags & EXEC_OBJECT_NEEDS_FENCE)) {
                if (unlikely(i915_vma_pin_fence(vma))) {
                        i915_vma_unpin(vma);
                        return false;
                }
 
                if (vma->fence)
-                       exec_flags |= __EXEC_OBJECT_HAS_FENCE;
+                       ev->flags |= __EXEC_OBJECT_HAS_FENCE;
        }
 
-       *vma->exec_flags = exec_flags | __EXEC_OBJECT_HAS_PIN;
-       return !eb_vma_misplaced(entry, vma, exec_flags);
+       ev->flags |= __EXEC_OBJECT_HAS_PIN;
+       return !eb_vma_misplaced(entry, vma, ev->flags);
 }
 
 static inline void __eb_unreserve_vma(struct i915_vma *vma, unsigned int flags)
@@ -422,13 +432,13 @@ static inline void __eb_unreserve_vma(struct i915_vma *vma, unsigned int flags)
 }
 
 static inline void
-eb_unreserve_vma(struct i915_vma *vma, unsigned int *flags)
+eb_unreserve_vma(struct eb_vma *ev)
 {
-       if (!(*flags & __EXEC_OBJECT_HAS_PIN))
+       if (!(ev->flags & __EXEC_OBJECT_HAS_PIN))
                return;
 
-       __eb_unreserve_vma(vma, *flags);
-       *flags &= ~__EXEC_OBJECT_RESERVED;
+       __eb_unreserve_vma(ev->vma, ev->flags);
+       ev->flags &= ~__EXEC_OBJECT_RESERVED;
 }
 
 static int
@@ -458,12 +468,6 @@ eb_validate_vma(struct i915_execbuffer *eb,
                entry->pad_to_size = 0;
        }
 
-       if (unlikely(vma->exec_flags)) {
-               DRM_DEBUG("Object [handle %d, index %d] appears more than once in object list\n",
-                         entry->handle, (int)(entry - eb->exec));
-               return -EINVAL;
-       }
-
        /*
         * From drm_mm perspective address space is continuous,
         * so from this point we're always using non-canonical
@@ -492,6 +496,7 @@ eb_add_vma(struct i915_execbuffer *eb,
           struct i915_vma *vma)
 {
        struct drm_i915_gem_exec_object2 *entry = &eb->exec[i];
+       struct eb_vma *ev = &eb->vma[i];
        int err;
 
        GEM_BUG_ON(i915_vma_is_closed(vma));
@@ -502,25 +507,19 @@ eb_add_vma(struct i915_execbuffer *eb,
                        return err;
        }
 
+       ev->vma = vma;
+       ev->exec = entry;
+       ev->flags = entry->flags;
+
        if (eb->lut_size > 0) {
-               vma->exec_handle = entry->handle;
-               hlist_add_head(&vma->exec_node,
+               ev->handle = entry->handle;
+               hlist_add_head(&ev->node,
                               &eb->buckets[hash_32(entry->handle,
                                                    eb->lut_size)]);
        }
 
        if (entry->relocation_count)
-               list_add_tail(&vma->reloc_link, &eb->relocs);
-
-       /*
-        * Stash a pointer from the vma to execobj, so we can query its flags,
-        * size, alignment etc as provided by the user. Also we stash a pointer
-        * to the vma inside the execobj so that we can use a direct lookup
-        * to find the right target VMA when doing relocations.
-        */
-       eb->vma[i] = vma;
-       eb->flags[i] = entry->flags;
-       vma->exec_flags = &eb->flags[i];
+               list_add_tail(&ev->reloc_link, &eb->relocs);
 
        /*
         * SNA is doing fancy tricks with compressing batch buffers, which leads
@@ -533,28 +532,26 @@ eb_add_vma(struct i915_execbuffer *eb,
         */
        if (i == batch_idx) {
                if (entry->relocation_count &&
-                   !(eb->flags[i] & EXEC_OBJECT_PINNED))
-                       eb->flags[i] |= __EXEC_OBJECT_NEEDS_BIAS;
+                   !(ev->flags & EXEC_OBJECT_PINNED))
+                       ev->flags |= __EXEC_OBJECT_NEEDS_BIAS;
                if (eb->reloc_cache.has_fence)
-                       eb->flags[i] |= EXEC_OBJECT_NEEDS_FENCE;
+                       ev->flags |= EXEC_OBJECT_NEEDS_FENCE;
 
-               eb->batch = vma;
+               eb->batch = ev;
        }
 
        err = 0;
-       if (eb_pin_vma(eb, entry, vma)) {
+       if (eb_pin_vma(eb, entry, ev)) {
                if (entry->offset != vma->node.start) {
                        entry->offset = vma->node.start | UPDATE;
                        eb->args->flags |= __EXEC_HAS_RELOC;
                }
        } else {
-               eb_unreserve_vma(vma, vma->exec_flags);
+               eb_unreserve_vma(ev);
 
-               list_add_tail(&vma->exec_link, &eb->unbound);
+               list_add_tail(&ev->bind_link, &eb->unbound);
                if (drm_mm_node_allocated(&vma->node))
                        err = i915_vma_unbind(vma);
-               if (unlikely(err))
-                       vma->exec_flags = NULL;
        }
        return err;
 }
@@ -576,11 +573,11 @@ static inline int use_cpu_reloc(const struct reloc_cache *cache,
                obj->cache_level != I915_CACHE_NONE);
 }
 
-static int eb_reserve_vma(const struct i915_execbuffer *eb,
-                         struct i915_vma *vma)
+static int eb_reserve_vma(const struct i915_execbuffer *eb, struct eb_vma *ev)
 {
-       struct drm_i915_gem_exec_object2 *entry = exec_entry(eb, vma);
-       unsigned int exec_flags = *vma->exec_flags;
+       struct drm_i915_gem_exec_object2 *entry = ev->exec;
+       unsigned int exec_flags = ev->flags;
+       struct i915_vma *vma = ev->vma;
        u64 pin_flags;
        int err;
 
@@ -627,8 +624,8 @@ static int eb_reserve_vma(const struct i915_execbuffer *eb,
                        exec_flags |= __EXEC_OBJECT_HAS_FENCE;
        }
 
-       *vma->exec_flags = exec_flags | __EXEC_OBJECT_HAS_PIN;
-       GEM_BUG_ON(eb_vma_misplaced(entry, vma, exec_flags));
+       ev->flags = exec_flags | __EXEC_OBJECT_HAS_PIN;
+       GEM_BUG_ON(eb_vma_misplaced(entry, vma, ev->flags));
 
        return 0;
 }
@@ -637,7 +634,7 @@ static int eb_reserve(struct i915_execbuffer *eb)
 {
        const unsigned int count = eb->buffer_count;
        struct list_head last;
-       struct i915_vma *vma;
+       struct eb_vma *ev;
        unsigned int i, pass;
        int err;
 
@@ -658,8 +655,8 @@ static int eb_reserve(struct i915_execbuffer *eb)
        pass = 0;
        err = 0;
        do {
-               list_for_each_entry(vma, &eb->unbound, exec_link) {
-                       err = eb_reserve_vma(eb, vma);
+               list_for_each_entry(ev, &eb->unbound, bind_link) {
+                       err = eb_reserve_vma(eb, ev);
                        if (err)
                                break;
                }
@@ -670,26 +667,26 @@ static int eb_reserve(struct i915_execbuffer *eb)
                INIT_LIST_HEAD(&eb->unbound);
                INIT_LIST_HEAD(&last);
                for (i = 0; i < count; i++) {
-                       unsigned int flags = eb->flags[i];
-                       struct i915_vma *vma = eb->vma[i];
+                       struct eb_vma *ev = &eb->vma[i];
+                       unsigned int flags = ev->flags;
 
                        if (flags & EXEC_OBJECT_PINNED &&
                            flags & __EXEC_OBJECT_HAS_PIN)
                                continue;
 
-                       eb_unreserve_vma(vma, &eb->flags[i]);
+                       eb_unreserve_vma(ev);
 
                        if (flags & EXEC_OBJECT_PINNED)
                                /* Pinned must have their slot */
-                               list_add(&vma->exec_link, &eb->unbound);
+                               list_add(&ev->bind_link, &eb->unbound);
                        else if (flags & __EXEC_OBJECT_NEEDS_MAP)
                                /* Map require the lowest 256MiB (aperture) */
-                               list_add_tail(&vma->exec_link, &eb->unbound);
+                               list_add_tail(&ev->bind_link, &eb->unbound);
                        else if (!(flags & EXEC_OBJECT_SUPPORTS_48B_ADDRESS))
                                /* Prioritise 4GiB region for restricted bo */
-                               list_add(&vma->exec_link, &last);
+                               list_add(&ev->bind_link, &last);
                        else
-                               list_add_tail(&vma->exec_link, &last);
+                               list_add_tail(&ev->bind_link, &last);
                }
                list_splice_tail(&last, &eb->unbound);
 
@@ -808,10 +805,8 @@ static int eb_lookup_vmas(struct i915_execbuffer *eb)
                if (unlikely(err))
                        goto err_vma;
 
-               GEM_BUG_ON(vma != eb->vma[i]);
-               GEM_BUG_ON(vma->exec_flags != &eb->flags[i]);
                GEM_BUG_ON(drm_mm_node_allocated(&vma->node) &&
-                          eb_vma_misplaced(&eb->exec[i], vma, eb->flags[i]));
+                          eb_vma_misplaced(&eb->exec[i], vma, eb->vma[i].flags));
        }
 
        mutex_unlock(&eb->gem_context->mutex);
@@ -822,27 +817,27 @@ static int eb_lookup_vmas(struct i915_execbuffer *eb)
 err_obj:
        i915_gem_object_put(obj);
 err_vma:
-       eb->vma[i] = NULL;
+       eb->vma[i].vma = NULL;
 err_ctx:
        mutex_unlock(&eb->gem_context->mutex);
        return err;
 }
 
-static struct i915_vma *
+static struct eb_vma *
 eb_get_vma(const struct i915_execbuffer *eb, unsigned long handle)
 {
        if (eb->lut_size < 0) {
                if (handle >= -eb->lut_size)
                        return NULL;
-               return eb->vma[handle];
+               return &eb->vma[handle];
        } else {
                struct hlist_head *head;
-               struct i915_vma *vma;
+               struct eb_vma *ev;
 
                head = &eb->buckets[hash_32(handle, eb->lut_size)];
-               hlist_for_each_entry(vma, head, exec_node) {
-                       if (vma->exec_handle == handle)
-                               return vma;
+               hlist_for_each_entry(ev, head, node) {
+                       if (ev->handle == handle)
+                               return ev;
                }
                return NULL;
        }
@@ -854,20 +849,18 @@ static void eb_release_vmas(const struct i915_execbuffer *eb)
        unsigned int i;
 
        for (i = 0; i < count; i++) {
-               struct i915_vma *vma = eb->vma[i];
-               unsigned int flags = eb->flags[i];
+               struct eb_vma *ev = &eb->vma[i];
+               struct i915_vma *vma = ev->vma;
 
                if (!vma)
                        break;
 
-               GEM_BUG_ON(vma->exec_flags != &eb->flags[i]);
-               vma->exec_flags = NULL;
-               eb->vma[i] = NULL;
+               eb->vma[i].vma = NULL;
 
-               if (flags & __EXEC_OBJECT_HAS_PIN)
-                       __eb_unreserve_vma(vma, flags);
+               if (ev->flags & __EXEC_OBJECT_HAS_PIN)
+                       __eb_unreserve_vma(vma, ev->flags);
 
-               if (flags & __EXEC_OBJECT_HAS_REF)
+               if (ev->flags & __EXEC_OBJECT_HAS_REF)
                        i915_vma_put(vma);
        }
 }
@@ -1377,10 +1370,10 @@ relocate_entry(struct i915_vma *vma,
 
 static u64
 eb_relocate_entry(struct i915_execbuffer *eb,
-                 struct i915_vma *vma,
+                 struct eb_vma *ev,
                  const struct drm_i915_gem_relocation_entry *reloc)
 {
-       struct i915_vma *target;
+       struct eb_vma *target;
        int err;
 
        /* we've already hold a reference to all valid objects */
@@ -1412,7 +1405,7 @@ eb_relocate_entry(struct i915_execbuffer *eb,
        }
 
        if (reloc->write_domain) {
-               *target->exec_flags |= EXEC_OBJECT_WRITE;
+               target->flags |= EXEC_OBJECT_WRITE;
 
                /*
                 * Sandybridge PPGTT errata: We need a global gtt mapping
@@ -1422,7 +1415,8 @@ eb_relocate_entry(struct i915_execbuffer *eb,
                 */
                if (reloc->write_domain == I915_GEM_DOMAIN_INSTRUCTION &&
                    IS_GEN(eb->i915, 6)) {
-                       err = i915_vma_bind(target, target->obj->cache_level,
+                       err = i915_vma_bind(target->vma,
+                                           target->vma->obj->cache_level,
                                            PIN_GLOBAL, NULL);
                        if (WARN_ONCE(err,
                                      "Unexpected failure to bind target VMA!"))
@@ -1435,17 +1429,17 @@ eb_relocate_entry(struct i915_execbuffer *eb,
         * more work needs to be done.
         */
        if (!DBG_FORCE_RELOC &&
-           gen8_canonical_addr(target->node.start) == reloc->presumed_offset)
+           gen8_canonical_addr(target->vma->node.start) == reloc->presumed_offset)
                return 0;
 
        /* Check that the relocation address is valid... */
        if (unlikely(reloc->offset >
-                    vma->size - (eb->reloc_cache.use_64bit_reloc ? 8 : 4))) {
+                    ev->vma->size - (eb->reloc_cache.use_64bit_reloc ? 8 : 4))) {
                DRM_DEBUG("Relocation beyond object bounds: "
                          "target %d offset %d size %d.\n",
                          reloc->target_handle,
                          (int)reloc->offset,
-                         (int)vma->size);
+                         (int)ev->vma->size);
                return -EINVAL;
        }
        if (unlikely(reloc->offset & 3)) {
@@ -1464,18 +1458,18 @@ eb_relocate_entry(struct i915_execbuffer *eb,
         * do relocations we are already stalling, disable the user's opt
         * out of our synchronisation.
         */
-       *vma->exec_flags &= ~EXEC_OBJECT_ASYNC;
+       ev->flags &= ~EXEC_OBJECT_ASYNC;
 
        /* and update the user's relocation entry */
-       return relocate_entry(vma, reloc, eb, target);
+       return relocate_entry(ev->vma, reloc, eb, target->vma);
 }
 
-static int eb_relocate_vma(struct i915_execbuffer *eb, struct i915_vma *vma)
+static int eb_relocate_vma(struct i915_execbuffer *eb, struct eb_vma *ev)
 {
 #define N_RELOC(x) ((x) / sizeof(struct drm_i915_gem_relocation_entry))
        struct drm_i915_gem_relocation_entry stack[N_RELOC(512)];
        struct drm_i915_gem_relocation_entry __user *urelocs;
-       const struct drm_i915_gem_exec_object2 *entry = exec_entry(eb, vma);
+       const struct drm_i915_gem_exec_object2 *entry = ev->exec;
        unsigned int remain;
 
        urelocs = u64_to_user_ptr(entry->relocs_ptr);
@@ -1515,7 +1509,7 @@ static int eb_relocate_vma(struct i915_execbuffer *eb, struct i915_vma *vma)
 
                remain -= count;
                do {
-                       u64 offset = eb_relocate_entry(eb, vma, r);
+                       u64 offset = eb_relocate_entry(eb, ev, r);
 
                        if (likely(offset == 0)) {
                        } else if ((s64)offset < 0) {
@@ -1558,16 +1552,16 @@ static int eb_relocate_vma(struct i915_execbuffer *eb, struct i915_vma *vma)
 }
 
 static int
-eb_relocate_vma_slow(struct i915_execbuffer *eb, struct i915_vma *vma)
+eb_relocate_vma_slow(struct i915_execbuffer *eb, struct eb_vma *ev)
 {
-       const struct drm_i915_gem_exec_object2 *entry = exec_entry(eb, vma);
+       const struct drm_i915_gem_exec_object2 *entry = ev->exec;
        struct drm_i915_gem_relocation_entry *relocs =
                u64_to_ptr(typeof(*relocs), entry->relocs_ptr);
        unsigned int i;
        int err;
 
        for (i = 0; i < entry->relocation_count; i++) {
-               u64 offset = eb_relocate_entry(eb, vma, &relocs[i]);
+               u64 offset = eb_relocate_entry(eb, ev, &relocs[i]);
 
                if ((s64)offset < 0) {
                        err = (int)offset;
@@ -1711,7 +1705,7 @@ static noinline int eb_relocate_slow(struct i915_execbuffer *eb)
 {
        struct drm_device *dev = &eb->i915->drm;
        bool have_copy = false;
-       struct i915_vma *vma;
+       struct eb_vma *ev;
        int err = 0;
 
 repeat:
@@ -1767,15 +1761,15 @@ static noinline int eb_relocate_slow(struct i915_execbuffer *eb)
 
        GEM_BUG_ON(!eb->batch);
 
-       list_for_each_entry(vma, &eb->relocs, reloc_link) {
+       list_for_each_entry(ev, &eb->relocs, reloc_link) {
                if (!have_copy) {
                        pagefault_disable();
-                       err = eb_relocate_vma(eb, vma);
+                       err = eb_relocate_vma(eb, ev);
                        pagefault_enable();
                        if (err)
                                goto repeat;
                } else {
-                       err = eb_relocate_vma_slow(eb, vma);
+                       err = eb_relocate_vma_slow(eb, ev);
                        if (err)
                                goto err;
                }
@@ -1820,10 +1814,10 @@ static int eb_relocate(struct i915_execbuffer *eb)
 
        /* The objects are in their final locations, apply the relocations. */
        if (eb->args->flags & __EXEC_HAS_RELOC) {
-               struct i915_vma *vma;
+               struct eb_vma *ev;
 
-               list_for_each_entry(vma, &eb->relocs, reloc_link) {
-                       if (eb_relocate_vma(eb, vma))
+               list_for_each_entry(ev, &eb->relocs, reloc_link) {
+                       if (eb_relocate_vma(eb, ev))
                                goto slow;
                }
        }
@@ -1844,39 +1838,34 @@ static int eb_move_to_gpu(struct i915_execbuffer *eb)
        ww_acquire_init(&acquire, &reservation_ww_class);
 
        for (i = 0; i < count; i++) {
-               struct i915_vma *vma = eb->vma[i];
+               struct eb_vma *ev = &eb->vma[i];
+               struct i915_vma *vma = ev->vma;
 
                err = ww_mutex_lock_interruptible(&vma->resv->lock, &acquire);
-               if (!err)
-                       continue;
-
-               GEM_BUG_ON(err == -EALREADY); /* No duplicate vma */
-
                if (err == -EDEADLK) {
                        GEM_BUG_ON(i == 0);
                        do {
                                int j = i - 1;
 
-                               ww_mutex_unlock(&eb->vma[j]->resv->lock);
+                               ww_mutex_unlock(&eb->vma[j].vma->resv->lock);
 
-                               swap(eb->flags[i], eb->flags[j]);
                                swap(eb->vma[i],  eb->vma[j]);
-                               eb->vma[i]->exec_flags = &eb->flags[i];
                        } while (--i);
-                       GEM_BUG_ON(vma != eb->vma[0]);
-                       vma->exec_flags = &eb->flags[0];
 
                        err = ww_mutex_lock_slow_interruptible(&vma->resv->lock,
                                                               &acquire);
                }
+               if (err == -EALREADY)
+                       err = 0;
                if (err)
                        break;
        }
        ww_acquire_done(&acquire);
 
        while (i--) {
-               unsigned int flags = eb->flags[i];
-               struct i915_vma *vma = eb->vma[i];
+               struct eb_vma *ev = &eb->vma[i];
+               struct i915_vma *vma = ev->vma;
+               unsigned int flags = ev->flags;
                struct drm_i915_gem_object *obj = vma->obj;
 
                assert_vma_held(vma);
@@ -1920,10 +1909,10 @@ static int eb_move_to_gpu(struct i915_execbuffer *eb)
                i915_vma_unlock(vma);
 
                __eb_unreserve_vma(vma, flags);
-               vma->exec_flags = NULL;
-
                if (unlikely(flags & __EXEC_OBJECT_HAS_REF))
                        i915_vma_put(vma);
+
+               ev->vma = NULL;
        }
        ww_acquire_fini(&acquire);
 
@@ -2001,7 +1990,7 @@ static struct i915_vma *eb_parse(struct i915_execbuffer *eb, bool is_master)
                return ERR_CAST(pool);
 
        err = intel_engine_cmd_parser(eb->engine,
-                                     eb->batch->obj,
+                                     eb->batch->vma->obj,
                                      pool->obj,
                                      eb->batch_start_offset,
                                      eb->batch_len,
@@ -2018,10 +2007,9 @@ static struct i915_vma *eb_parse(struct i915_execbuffer *eb, bool is_master)
        if (IS_ERR(vma))
                goto err;
 
-       eb->vma[eb->buffer_count] = i915_vma_get(vma);
-       eb->flags[eb->buffer_count] =
+       eb->vma[eb->buffer_count].vma = i915_vma_get(vma);
+       eb->vma[eb->buffer_count].flags =
                __EXEC_OBJECT_HAS_PIN | __EXEC_OBJECT_HAS_REF;
-       vma->exec_flags = &eb->flags[eb->buffer_count];
        eb->buffer_count++;
 
        vma->private = pool;
@@ -2044,7 +2032,7 @@ add_to_client(struct i915_request *rq, struct drm_file *file)
        spin_unlock(&file_priv->mm.lock);
 }
 
-static int eb_submit(struct i915_execbuffer *eb)
+static int eb_submit(struct i915_execbuffer *eb, struct i915_vma *batch)
 {
        int err;
 
@@ -2071,7 +2059,7 @@ static int eb_submit(struct i915_execbuffer *eb)
        }
 
        err = eb->engine->emit_bb_start(eb->request,
-                                       eb->batch->node.start +
+                                       batch->node.start +
                                        eb->batch_start_offset,
                                        eb->batch_len,
                                        eb->batch_flags);
@@ -2434,6 +2422,7 @@ i915_gem_do_execbuffer(struct drm_device *dev,
        struct dma_fence *in_fence = NULL;
        struct dma_fence *exec_fence = NULL;
        struct sync_file *out_fence = NULL;
+       struct i915_vma *batch;
        int out_fence_fd = -1;
        int err;
 
@@ -2448,9 +2437,8 @@ i915_gem_do_execbuffer(struct drm_device *dev,
                args->flags |= __EXEC_HAS_RELOC;
 
        eb.exec = exec;
-       eb.vma = (struct i915_vma **)(exec + args->buffer_count + 1);
-       eb.vma[0] = NULL;
-       eb.flags = (unsigned int *)(eb.vma + args->buffer_count + 1);
+       eb.vma = (struct eb_vma *)(exec + args->buffer_count + 1);
+       eb.vma[0].vma = NULL;
 
        eb.invalid_flags = __EXEC_OBJECT_UNKNOWN_FLAGS;
        reloc_cache_init(&eb.reloc_cache, eb.i915);
@@ -2527,13 +2515,16 @@ i915_gem_do_execbuffer(struct drm_device *dev,
                goto err_vma;
        }
 
-       if (unlikely(*eb.batch->exec_flags & EXEC_OBJECT_WRITE)) {
+       if (unlikely(eb.batch->flags & EXEC_OBJECT_WRITE)) {
                DRM_DEBUG("Attempting to use self-modifying batch buffer\n");
                err = -EINVAL;
                goto err_vma;
        }
-       if (eb.batch_start_offset > eb.batch->size ||
-           eb.batch_len > eb.batch->size - eb.batch_start_offset) {
+
+       batch = eb.batch->vma;
+       if (range_overflows_t(u64,
+                             eb.batch_start_offset, eb.batch_len,
+                             batch->size)) {
                DRM_DEBUG("Attempting to use out-of-bounds batch\n");
                err = -EINVAL;
                goto err_vma;
@@ -2560,12 +2551,12 @@ i915_gem_do_execbuffer(struct drm_device *dev,
                         */
                        eb.batch_flags |= I915_DISPATCH_SECURE;
                        eb.batch_start_offset = 0;
-                       eb.batch = vma;
+                       batch = vma;
                }
        }
 
        if (eb.batch_len == 0)
-               eb.batch_len = eb.batch->size - eb.batch_start_offset;
+               eb.batch_len = batch->size - eb.batch_start_offset;
 
        /*
         * snb/ivb/vlv conflate the "batch in ppgtt" bit with the "non-secure
@@ -2584,13 +2575,13 @@ i915_gem_do_execbuffer(struct drm_device *dev,
                 *   fitting due to fragmentation.
                 * So this is actually safe.
                 */
-               vma = i915_gem_object_ggtt_pin(eb.batch->obj, NULL, 0, 0, 0);
+               vma = i915_gem_object_ggtt_pin(batch->obj, NULL, 0, 0, 0);
                if (IS_ERR(vma)) {
                        err = PTR_ERR(vma);
                        goto err_vma;
                }
 
-               eb.batch = vma;
+               batch = vma;
        }
 
        /* All GPU relocation batches must be submitted prior to the user rq */
@@ -2637,12 +2628,12 @@ i915_gem_do_execbuffer(struct drm_device *dev,
         * inactive_list and lose its active reference. Hence we do not need
         * to explicitly hold another reference here.
         */
-       eb.request->batch = eb.batch;
-       if (eb.batch->private)
-               intel_engine_pool_mark_active(eb.batch->private, eb.request);
+       eb.request->batch = batch;
+       if (batch->private)
+               intel_engine_pool_mark_active(batch->private, eb.request);
 
        trace_i915_request_queue(eb.request, eb.batch_flags);
-       err = eb_submit(&eb);
+       err = eb_submit(&eb, batch);
 err_request:
        add_to_client(eb.request, file);
        i915_request_add(eb.request);
@@ -2663,9 +2654,9 @@ i915_gem_do_execbuffer(struct drm_device *dev,
 
 err_batch_unpin:
        if (eb.batch_flags & I915_DISPATCH_SECURE)
-               i915_vma_unpin(eb.batch);
-       if (eb.batch->private)
-               intel_engine_pool_put(eb.batch->private);
+               i915_vma_unpin(batch);
+       if (batch->private)
+               intel_engine_pool_put(batch->private);
 err_vma:
        if (eb.exec)
                eb_release_vmas(&eb);
@@ -2688,9 +2679,7 @@ i915_gem_do_execbuffer(struct drm_device *dev,
 
 static size_t eb_element_size(void)
 {
-       return (sizeof(struct drm_i915_gem_exec_object2) +
-               sizeof(struct i915_vma *) +
-               sizeof(unsigned int));
+       return sizeof(struct drm_i915_gem_exec_object2) + sizeof(struct eb_vma);
 }
 
 static bool check_buffer_count(size_t count)
diff --git a/drivers/gpu/drm/i915/i915_vma.h b/drivers/gpu/drm/i915/i915_vma.h
index 465932813bc5..71402056d846 100644
--- a/drivers/gpu/drm/i915/i915_vma.h
+++ b/drivers/gpu/drm/i915/i915_vma.h
@@ -147,21 +147,10 @@ struct i915_vma {
        struct rb_node obj_node;
        struct hlist_node obj_hash;
 
-       /** This vma's place in the execbuf reservation list */
-       struct list_head exec_link;
-       struct list_head reloc_link;
-
        /** This vma's place in the eviction list */
        struct list_head evict_link;
 
        struct list_head closed_link;
-
-       /**
-        * Used for performing relocations during execbuffer insertion.
-        */
-       unsigned int *exec_flags;
-       struct hlist_node exec_node;
-       u32 exec_handle;
 };
 
 struct i915_vma *
-- 
2.24.0
