On Friday, 11 July 2025 21:11:15 (Central European Summer Time),
Adrian Larumbe wrote:
> Hi Caterina,
>
> On 03.07.2025 15:28, Caterina Shablia wrote:
> > From: Boris Brezillon <boris.brezil...@collabora.com>
> >
> > Move the lock/flush_mem operations around the gpuvm_sm_map() calls so
> > we can implement true atomic page updates, where any access in the
> > locked range done by the GPU has to wait for the page table updates
> > to land before proceeding.
> >
> > This is needed for vkQueueBindSparse(), so we can replace the dummy
> > page mapped over the entire object by actual BO backed pages in an atomic
> > way.
> >
> > Signed-off-by: Boris Brezillon <boris.brezil...@collabora.com>
> > Signed-off-by: Caterina Shablia <caterina.shab...@collabora.com>
> > ---
> >
> > drivers/gpu/drm/panthor/panthor_mmu.c | 65 +++++++++++++++++++++++++--
> > 1 file changed, 62 insertions(+), 3 deletions(-)
> >
> > diff --git a/drivers/gpu/drm/panthor/panthor_mmu.c b/drivers/gpu/drm/panthor/panthor_mmu.c
> > index b39ea6acc6a9..1e58948587a9 100644
> > --- a/drivers/gpu/drm/panthor/panthor_mmu.c
> > +++ b/drivers/gpu/drm/panthor/panthor_mmu.c
> > @@ -387,6 +387,15 @@ struct panthor_vm {
> >
> > * flagged as faulty as a result.
> > */
> >
> > bool unhandled_fault;
> >
> > +
> > + /** @locked_region: Information about the currently locked region currently. */
> Nit: delete second 'current'
>
> > + struct {
> > + /** @locked_region.start: Start of the locked region. */
> > + u64 start;
> > +
> > + /** @locked_region.size: Size of the locked region. */
> > + u64 size;
> > + } locked_region;
> >
> > };
> >
> > /**
> >
> > @@ -775,6 +784,10 @@ int panthor_vm_active(struct panthor_vm *vm)
> >
> > }
> >
> > ret = panthor_mmu_as_enable(vm->ptdev, vm->as.id, transtab, transcfg, vm->memattr);
> > + if (!ret && vm->locked_region.size) {
> > + lock_region(ptdev, vm->as.id, vm->locked_region.start, vm->locked_region.size);
> Why do we need to lock the region after enabling a new AS?
See the explanation further below for what happens in panthor_vm_lock_region().
In short, a vm_bind might lock a region on a vm that's not active. Because the
vm is not active, there's nothing to do to lock the region beyond recording the
region itself. If the vm then becomes active while some region is locked, we
need to inform the MMU about the region that's supposed to be locked.
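To make the ordering concrete, the sequence this hunk handles is roughly the
following (condensed, not the literal patch code):

    /* 1. vm_bind on an inactive VM: panthor_vm_lock_region() only
     *    records locked_region.{start,size}, because vm->as.id < 0. */

    /* 2. The VM gains an AS: panthor_vm_active() replays the
     *    recorded lock (the hunk above). */
    if (!ret && vm->locked_region.size) {
            lock_region(ptdev, vm->as.id, vm->locked_region.start,
                        vm->locked_region.size);
            ret = wait_ready(ptdev, vm->as.id);
    }

    /* 3. The vm_bind completes: panthor_vm_unlock_region() issues
     *    AS_COMMAND_FLUSH_MEM, which flushes and drops the lock. */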
>
> > + ret = wait_ready(ptdev, vm->as.id);
> > + }
> >
> > out_make_active:
> > if (!ret) {
> >
> > @@ -902,6 +915,9 @@ static int panthor_vm_unmap_pages(struct panthor_vm *vm, u64 iova, u64 size)
> > struct io_pgtable_ops *ops = vm->pgtbl_ops;
> > u64 offset = 0;
> >
> > + drm_WARN_ON(&ptdev->base,
> > + (iova < vm->locked_region.start) ||
> > + (iova + size > vm->locked_region.start + vm->locked_region.size));
> >
> > drm_dbg(&ptdev->base, "unmap: as=%d, iova=%llx, len=%llx", vm->as.id, iova, size);
> >
> > while (offset < size) {
> >
> > @@ -915,13 +931,12 @@ static int panthor_vm_unmap_pages(struct panthor_vm *vm, u64 iova, u64 size)
> > iova + offset + unmapped_sz,
> > iova + offset + pgsize * pgcount,
> > iova, iova + size);
> >
> > - panthor_vm_flush_range(vm, iova, offset + unmapped_sz);
>
> We've removed all calls to panthor_vm_flush_range(), but I don't see it
> being done in panthor_vm_exec_op() before the region is unlocked. It's
> effectively become dead code.
>
> However, even if we did 'panthor_vm_flush_range(vm, op->va.addr,
> op->va.range);' in panthor_vm_exec_op() right before we unlock the region,
> we wouldn't be dealing well with the case in which only a partial unmap
> happens, but maybe this isn't a big deal either.
panthor_vm_unlock_region() will do the necessary flushes: the FLUSH_MEM it
issues covers the whole locked range, so a partially completed unmap gets
flushed as well.
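Schematically, the per-op flow after this series is:

    /* panthor_vm_exec_op(), condensed: */
    panthor_vm_lock_region(vm, op->va.addr, op->va.range);

    /* drm_gpuvm_sm_map()/drm_gpuvm_sm_unmap() update the page tables
     * here; no per-range flush anymore. */

    panthor_vm_unlock_region(vm); /* FLUSH_MEM: flush + drop the lock */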
>
> > return -EINVAL;
> >
> > }
> > offset += unmapped_sz;
> >
> > }
> >
> > - return panthor_vm_flush_range(vm, iova, size);
> > + return 0;
> >
> > }
> >
> > static int
> >
> > @@ -938,6 +953,10 @@ panthor_vm_map_pages(struct panthor_vm *vm, u64 iova, int prot,
> > if (!size)
> >
> > return 0;
> >
> > + drm_WARN_ON(&ptdev->base,
> > + (iova < vm->locked_region.start) ||
> > + (iova + size > vm->locked_region.start + vm->locked_region.size));
> > +
> >
> > for_each_sgtable_dma_sg(sgt, sgl, count) {
> >
> > dma_addr_t paddr = sg_dma_address(sgl);
> > size_t len = sg_dma_len(sgl);
> >
> > @@ -985,7 +1004,7 @@ panthor_vm_map_pages(struct panthor_vm *vm, u64 iova, int prot,
> > offset = 0;
> >
> > }
> >
> > - return panthor_vm_flush_range(vm, start_iova, iova - start_iova);
> >
> >
> > + return 0;
> >
> > }
> >
> > static int flags_to_prot(u32 flags)
> >
> > @@ -1654,6 +1673,38 @@ static const char *access_type_name(struct panthor_device *ptdev,
> > }
> >
> > }
> >
> > +static int panthor_vm_lock_region(struct panthor_vm *vm, u64 start, u64 size)
> > +{
> > + struct panthor_device *ptdev = vm->ptdev;
> > + int ret;
> > +
> > + mutex_lock(&ptdev->mmu->as.slots_lock);
> > + drm_WARN_ON(&ptdev->base, vm->locked_region.start || vm->locked_region.size);
> > + vm->locked_region.start = start;
> > + vm->locked_region.size = size;
> > + if (vm->as.id >= 0) {
>
> I guess VM bind operations don't increase the active_cnt of a VM, so we
> might be mapping addresses from UM while no active groups are submitting
> jobs targeting this VM?
vm_bind, beyond locking the region, does not involve the GPU and is performed
entirely on the host. If we vm_bind while active_cnt is 0, we don't poke the
MMU to do any locking. Instead, when panthor_vm_active() is called to make the
vm active, we poke the MMU to actually lock the region that's supposed to
be locked.
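Condensed, the vm_bind side (this function) does the following (slots_lock
and error handling trimmed; the quoted code around this is the real thing):

    /* panthor_vm_lock_region(): record the range unconditionally... */
    vm->locked_region.start = start;
    vm->locked_region.size = size;

    /* ...but only touch the hardware if the VM owns an AS. Otherwise
     * panthor_vm_active() replays the lock once the VM gets one. */
    if (vm->as.id >= 0) {
            lock_region(ptdev, vm->as.id, start, size);
            ret = wait_ready(ptdev, vm->as.id);
    }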
> > + lock_region(ptdev, vm->as.id, start, size);
> > + ret = wait_ready(ptdev, vm->as.id);
>
> I've noticed that in mmu_hw_do_operation_locked() we don't do wait_ready()
> after locking the region. Is it missing there, or is waiting for the AS to
> be locked not actually necessary here?
> > + }
> > + mutex_unlock(&ptdev->mmu->as.slots_lock);
> > +
> > + return ret;
> > +}
> > +
> > +static void panthor_vm_unlock_region(struct panthor_vm *vm)
> > +{
> > + struct panthor_device *ptdev = vm->ptdev;
> > +
> > + mutex_lock(&ptdev->mmu->as.slots_lock);
> > + if (vm->as.id >= 0) {
> > + write_cmd(ptdev, vm->as.id, AS_COMMAND_FLUSH_MEM);
>
> I guess this is why we no longer need to call panthor_vm_flush_range() right
> before this function. Does AS_COMMAND_FLUSH_MEM only flush the locked
> region? Also, why not AS_COMMAND_FLUSH_PT instead?
IIUC FLUSH_MEM is the lighter of the two hammers. The doc says it only
invalidates MMU caches when used without a previous LOCK, so I guess it does
something smarter in this case. FLUSH_PT invalidates MMU caches
unconditionally.
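So the pattern the patch relies on should be (my reading, simplified):

    /* Lock the range: GPU accesses to it stall until the unlock. */
    lock_region(ptdev, as_nr, start, size); /* AS_LOCKADDR + LOCK */
    wait_ready(ptdev, as_nr);

    /* ... io-pgtable map/unmap of the locked range ... */

    /* Flush caches for the locked range and release the lock. */
    write_cmd(ptdev, as_nr, AS_COMMAND_FLUSH_MEM);
    wait_ready(ptdev, as_nr);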
> > + drm_WARN_ON(&ptdev->base, wait_ready(ptdev, vm->as.id));
> > + }
> > + vm->locked_region.start = 0;
> > + vm->locked_region.size = 0;
> > + mutex_unlock(&ptdev->mmu->as.slots_lock);
> > +}
> > +
> >
> > static void panthor_mmu_irq_handler(struct panthor_device *ptdev, u32
> > status) {
> >
> > bool has_unhandled_faults = false;
> >
> > @@ -2179,6 +2230,11 @@ panthor_vm_exec_op(struct panthor_vm *vm, struct panthor_vm_op_ctx *op,
> > mutex_lock(&vm->op_lock);
> > vm->op_ctx = op;
> >
> > +
> > + ret = panthor_vm_lock_region(vm, op->va.addr, op->va.range);
> > + if (ret)
> > + goto out;
> > +
> >
> > switch (op_type) {
> >
> > case DRM_PANTHOR_VM_BIND_OP_TYPE_MAP:
> > if (vm->unusable) {
> >
> > @@ -2199,6 +2255,9 @@ panthor_vm_exec_op(struct panthor_vm *vm, struct panthor_vm_op_ctx *op,
> > break;
> >
> > }
> >
> > + panthor_vm_unlock_region(vm);
> > +
> >
> > +out:
> > if (ret && flag_vm_unusable_on_failure)
> >
> > vm->unusable = true;
> >
> > --
> > 2.47.2
>
> Adrian Larumbe