On 02.04.2025 14:58, Boris Brezillon wrote: > On Wed, 2 Apr 2025 12:54:29 +0100 > Adrián Larumbe <adrian.laru...@collabora.com> wrote: > > > Add a device DebugFS file that displays a complete list of all the DRM > > GEM objects that are exposed to UM through a DRM handle. > > > > Since leaking object identifiers that might belong to a different NS is > > inadmissible, this functionality is only made available in debug builds > > with DEBUGFS support enabled. > > > > File format is that of a table, with each entry displaying a variety of > > fields with information about each GEM object. > > > > Each GEM object entry in the file displays the following information > > fields: Client PID, BO's global name, reference count, BO virtual size, > > BO resize size, VM address in its DRM-managed range, BO label and a flag > > bitmask. > > > > There's also a kflags field for the type of BO. Bit 0 tells us whether > > it's a kernel BO, and bit 1 means the BO is mapped onto the FW's address > > space. > > > > Signed-off-by: Adrián Larumbe <adrian.laru...@collabora.com> > > --- > > drivers/gpu/drm/panthor/panthor_device.c | 5 + > > drivers/gpu/drm/panthor/panthor_device.h | 11 ++ > > drivers/gpu/drm/panthor/panthor_drv.c | 26 ++++ > > drivers/gpu/drm/panthor/panthor_gem.c | 149 +++++++++++++++++++++++ > > drivers/gpu/drm/panthor/panthor_gem.h | 35 ++++++ > > 5 files changed, 226 insertions(+) > > > > diff --git a/drivers/gpu/drm/panthor/panthor_device.c > > b/drivers/gpu/drm/panthor/panthor_device.c > > index a9da1d1eeb70..b776e1a2e4f3 100644 > > --- a/drivers/gpu/drm/panthor/panthor_device.c > > +++ b/drivers/gpu/drm/panthor/panthor_device.c > > @@ -184,6 +184,11 @@ int panthor_device_init(struct panthor_device *ptdev) > > if (ret) > > return ret; > > > > +#ifdef CONFIG_DEBUG_FS > > + drmm_mutex_init(&ptdev->base, &ptdev->gems.lock); > > + INIT_LIST_HEAD(&ptdev->gems.node); > > +#endif > > + > > atomic_set(&ptdev->pm.state, PANTHOR_DEVICE_PM_STATE_SUSPENDED); > > p = alloc_page(GFP_KERNEL | __GFP_ZERO); > > if (!p) > > diff --git a/drivers/gpu/drm/panthor/panthor_device.h > > b/drivers/gpu/drm/panthor/panthor_device.h > > index da6574021664..86206a961b38 100644 > > --- a/drivers/gpu/drm/panthor/panthor_device.h > > +++ b/drivers/gpu/drm/panthor/panthor_device.h > > @@ -205,6 +205,17 @@ struct panthor_device { > > > > /** @fast_rate: Maximum device clock frequency. Set by DVFS */ > > unsigned long fast_rate; > > + > > +#ifdef CONFIG_DEBUG_FS > > + /** @gems: Device-wide list of GEM objects owned by at least one file. > > */ > > + struct { > > + /** @gems.lock: Protects the device-wide list of GEM objects. */ > > + struct mutex lock; > > + > > + /** @node: Used to keep track of all the device's DRM objects */ > > + struct list_head node; > > + } gems; > > +#endif > > }; > > > > struct panthor_gpu_usage { > > diff --git a/drivers/gpu/drm/panthor/panthor_drv.c > > b/drivers/gpu/drm/panthor/panthor_drv.c > > index d5277284fe27..3e870ed2ad90 100644 > > --- a/drivers/gpu/drm/panthor/panthor_drv.c > > +++ b/drivers/gpu/drm/panthor/panthor_drv.c > > @@ -1534,9 +1534,35 @@ static const struct file_operations > > panthor_drm_driver_fops = { > > }; > > > > #ifdef CONFIG_DEBUG_FS > > +static int panthor_gems_show(struct seq_file *m, void *data) > > +{ > > + struct drm_info_node *node = m->private; > > + struct drm_device *dev = node->minor->dev; > > + struct panthor_device *ptdev = container_of(dev, struct panthor_device, > > base); > > + > > + panthor_gem_debugfs_print_bos(ptdev, m); > > + > > + return 0; > > +} > > + > > + > > +static struct drm_info_list panthor_debugfs_list[] = { > > + {"gems", panthor_gems_show, 0, NULL}, > > +}; > > + > > +static int panthor_gems_debugfs_init(struct drm_minor *minor) > > +{ > > + drm_debugfs_create_files(panthor_debugfs_list, > > + ARRAY_SIZE(panthor_debugfs_list), > > + minor->debugfs_root, minor); > > + > > + return 0; > > +} > > + > > static void panthor_debugfs_init(struct drm_minor *minor) > > { > > panthor_mmu_debugfs_init(minor); > > + panthor_gems_debugfs_init(minor); > > } > > #endif > > > > diff --git a/drivers/gpu/drm/panthor/panthor_gem.c > > b/drivers/gpu/drm/panthor/panthor_gem.c > > index 44d027e6d664..2fc87be9b700 100644 > > --- a/drivers/gpu/drm/panthor/panthor_gem.c > > +++ b/drivers/gpu/drm/panthor/panthor_gem.c > > @@ -2,6 +2,7 @@ > > /* Copyright 2019 Linaro, Ltd, Rob Herring <r...@kernel.org> */ > > /* Copyright 2023 Collabora ltd. */ > > > > +#include <linux/cleanup.h> > > #include <linux/dma-buf.h> > > #include <linux/dma-mapping.h> > > #include <linux/err.h> > > @@ -10,14 +11,65 @@ > > #include <drm/panthor_drm.h> > > > > #include "panthor_device.h" > > +#include "panthor_fw.h" > > #include "panthor_gem.h" > > #include "panthor_mmu.h" > > > > +#ifdef CONFIG_DEBUG_FS > > +static void panthor_gem_debugfs_bo_init(struct panthor_gem_object *bo, u32 > > type_mask) > > +{ > > + INIT_LIST_HEAD(&bo->debugfs.node); > > This should be called when the GEM object is created, otherwise the > list_empty() test done in panthor_gem_debugfs_bo_rm() will only work if > panthor_gem_debugfs_bo_add() is called, and depending on when this > happens, or whether it happens at all, the error path will do a NULL > deref.
I'll be moving panthor_gem_debugfs_bo_add() back into panthor_gem_create_object() and inline panthor_gem_debugfs_bo_init() into it. > > + > > + if (!(type_mask & PANTHOR_BO_FW_MAPPED)) { > > + bo->debugfs.creator.tgid = current->group_leader->pid; > > + get_task_comm(bo->debugfs.creator.process_name, > > current->group_leader); > > I don't think that's good to assume that FW-mapped BOs have been > created by the kernel without userspace directly or indirectly asking > for the allocation. For instance, per-group memory allocated for the > USER_CS interfaces are indirectly triggered by a GROUP_CREATE ioctl(), > and should IMO be flagged as being created by the process that > created the group. Don't we have another way to check if we're called > from a kernel thread? True, I completely missed this. I did some research of the kernel API and apparently is_kthread() might do the job. > > + } else { > > + bo->debugfs.creator.tgid = 0; > > + snprintf(bo->debugfs.creator.process_name, > > + sizeof(bo->debugfs.creator.process_name), > > + "kernel"); > > + } > > + > > + bo->debugfs.bo_mask = type_mask; > > Why not do that directly in panthor_gem_debugfs_bo_add()? The only bits > that might be useful to do early is the INIT_LIST_HEAD(), and I think > it can be inlined in panthor_gem_create_object(). I'll be doing in this in the next revision, but because I've no access to the BO type mask from inside Panthor's drm_driver::gem_create_object() binding, then I'll have to assign the mask right after the object has been created. I think this means there might be a short window after the object's been added to the DebugFS GEMs list in which it could be shown with the kernel mask field still set to 0, but I guess that's not too important either. > > +} > > + > > +static void panthor_gem_debugfs_bo_add(struct panthor_gem_object *bo, u32 > > type_mask) > > +{ > > + struct panthor_device *ptdev = container_of(bo->base.base.dev, > > + struct panthor_device, > > base); > > + > > + panthor_gem_debugfs_bo_init(bo, type_mask); > > + > > + mutex_lock(&ptdev->gems.lock); > > + list_add_tail(&bo->debugfs.node, &ptdev->gems.node); > > + mutex_unlock(&ptdev->gems.lock); > > +} > > + > > +static void panthor_gem_debugfs_bo_rm(struct panthor_gem_object *bo) > > +{ > > + struct panthor_device *ptdev = container_of(bo->base.base.dev, > > + struct panthor_device, > > base); > > + > > + if (list_empty(&bo->debugfs.node)) > > + return; > > + > > + mutex_lock(&ptdev->gems.lock); > > + list_del_init(&bo->debugfs.node); > > + mutex_unlock(&ptdev->gems.lock); > > +} > > + > > +#else > > +static void panthor_gem_debugfs_bo_add(struct panthor_gem_object *bo, u32 > > type_mask) {} > > +static void panthor_gem_debugfs_bo_rm(struct panthor_gem_object *bo) {} > > +#endif > > + > > static void panthor_gem_free_object(struct drm_gem_object *obj) > > { > > struct panthor_gem_object *bo = to_panthor_bo(obj); > > struct drm_gem_object *vm_root_gem = bo->exclusive_vm_root_gem; > > > > + panthor_gem_debugfs_bo_rm(bo); > > + > > /* > > * Label might have been allocated with kstrdup_const(), > > * we need to take that into account when freeing the memory > > @@ -86,6 +138,7 @@ panthor_kernel_bo_create(struct panthor_device *ptdev, > > struct panthor_vm *vm, > > struct drm_gem_shmem_object *obj; > > struct panthor_kernel_bo *kbo; > > struct panthor_gem_object *bo; > > + u32 type_mask = PANTHOR_BO_KERNEL; > > int ret; > > > > if (drm_WARN_ON(&ptdev->base, !vm)) > > @@ -105,7 +158,12 @@ panthor_kernel_bo_create(struct panthor_device *ptdev, > > struct panthor_vm *vm, > > kbo->obj = &obj->base; > > bo->flags = bo_flags; > > > > + if (vm == panthor_fw_vm(ptdev)) > > + type_mask |= PANTHOR_BO_FW_MAPPED; > > + > > panthor_gem_kernel_bo_set_label(kbo, name); > > + panthor_gem_debugfs_bo_add(to_panthor_bo(kbo->obj), type_mask); > > + > > /* The system and GPU MMU page size might differ, which becomes a > > * problem for FW sections that need to be mapped at explicit address > > * since our PAGE_SIZE alignment might cover a VA range that's > > @@ -255,6 +313,8 @@ panthor_gem_create_with_handle(struct drm_file *file, > > /* drop reference from allocate - handle holds it now. */ > > drm_gem_object_put(&shmem->base); > > > > + panthor_gem_debugfs_bo_add(bo, 0); > > + > > return ret; > > } > > > > @@ -286,3 +346,92 @@ panthor_gem_kernel_bo_set_label(struct > > panthor_kernel_bo *bo, const char *label) > > > > panthor_gem_bo_set_label(bo->obj, kstrdup_const(str, GFP_KERNEL)); > > } > > + > > +#ifdef CONFIG_DEBUG_FS > > +static bool panfrost_gem_print_flag(const char *name, > > + bool is_set, > > + bool other_flags_printed, > > + struct seq_file *m) > > +{ > > + if (is_set) > > + seq_printf(m, "%s%s", other_flags_printed ? "," : "", name); > > + > > + return is_set | other_flags_printed; > > +} > > + > > +struct gem_size_totals { > > + size_t size; > > + size_t resident; > > + size_t reclaimable; > > +}; > > + > > +static void panthor_gem_debugfs_bo_print(struct panthor_gem_object *bo, > > + struct seq_file *m, > > + struct gem_size_totals *totals) > > +{ > > + unsigned int refcount = kref_read(&bo->base.base.refcount); > > + char creator_info[32] = {}; > > + bool has_flags = false; > > + size_t resident_size; > > + > > + /* Skip BOs being destroyed. */ > > + if (!refcount) > > + return; > > + > > + resident_size = bo->base.pages != NULL ? bo->base.base.size : 0; > > + > > + snprintf(creator_info, sizeof(creator_info), > > + "%s/%d", bo->debugfs.creator.process_name, > > bo->debugfs.creator.tgid); > > + seq_printf(m, "%-32s%-16d%-16d%-16zd%-16zd%-16lx", > > + creator_info, > > + bo->base.base.name, > > + refcount, > > + bo->base.base.size, > > + resident_size, > > + drm_vma_node_start(&bo->base.base.vma_node)); > > + > > + seq_puts(m, "("); > > + has_flags = panfrost_gem_print_flag("imported", > > bo->base.base.import_attach != NULL, > > + has_flags, m); > > + has_flags = panfrost_gem_print_flag("exported", bo->base.base.dma_buf > > != NULL, > > + has_flags, m); > > + if (bo->base.madv < 0) > > + has_flags = panfrost_gem_print_flag("purged", true, has_flags, > > m); > > + else if (bo->base.madv > 0) > > + has_flags = panfrost_gem_print_flag("purgeable", true, > > has_flags, m); > > + if (!has_flags) > > + seq_puts(m, "none"); > > + seq_puts(m, ")"); > > + > > + seq_printf(m, "%-6s0x%-2x", "", bo->debugfs.bo_mask); > > + > > + mutex_lock(&bo->label.lock); > > + seq_printf(m, "%-6s%-60s", "", bo->label.str ? : NULL); > > + mutex_unlock(&bo->label.lock); > > + seq_puts(m, "\n"); > > + > > + totals->size += bo->base.base.size; > > + totals->resident += resident_size; > > + if (bo->base.madv > 0) > > + totals->reclaimable += resident_size; > > +} > > + > > +void panthor_gem_debugfs_print_bos(struct panthor_device *ptdev, > > + struct seq_file *m) > > +{ > > + struct gem_size_totals totals = {0}; > > + struct panthor_gem_object *bo; > > + > > + seq_puts(m, "created-by global-name refcount > > size resident-size file-offset flags kflags > > label\n"); > > + seq_puts(m, > > "------------------------------------------------------------------------------------------------------------------------------------------------\n"); > > + > > + scoped_guard(mutex, &ptdev->gems.lock) { > > + list_for_each_entry(bo, &ptdev->gems.node, debugfs.node) > > + panthor_gem_debugfs_bo_print(bo, m, &totals); > > + } > > + > > + seq_puts(m, > > "==========================================================================================================================================================\n"); > > + seq_printf(m, "Total size: %zd, Total resident: %zd, Total reclaimable: > > %zd\n", > > + totals.size, totals.resident, totals.reclaimable); > > +} > > +#endif > > diff --git a/drivers/gpu/drm/panthor/panthor_gem.h > > b/drivers/gpu/drm/panthor/panthor_gem.h > > index 49daa5088a0d..22ecc0d39d5e 100644 > > --- a/drivers/gpu/drm/panthor/panthor_gem.h > > +++ b/drivers/gpu/drm/panthor/panthor_gem.h > > @@ -15,6 +15,32 @@ struct panthor_vm; > > > > #define PANTHOR_BO_LABEL_MAXLEN PAGE_SIZE > > > > +#define PANTHOR_BO_KERNEL BIT(0) > > +#define PANTHOR_BO_FW_MAPPED BIT(1) > > + > > +/** > > + * struct panthor_gem_debugfs - GEM object's DebugFS list information > > + */ > > +struct panthor_gem_debugfs { > > + /** > > + * @node: Node used to insert the object in the device-wide list of > > + * GEM objects, to display information about it through a DebugFS file. > > + */ > > + struct list_head node; > > + > > + /** @creator: Information about the UM process which created the GEM. */ > > + struct { > > + /** @creator.process_name: Group leader name in owning thread's > > process */ > > + char process_name[TASK_COMM_LEN]; > > + > > + /** @creator.tgid: PID of the thread's group leader within its > > process */ > > + pid_t tgid; > > + } creator; > > + > > + /** @bo_mask: Bitmask encoding BO type as {USER, KERNEL} x {GPU, FW} */ > > + u32 bo_mask; > > +}; > > + > > /** > > * struct panthor_gem_object - Driver specific GEM object. > > */ > > @@ -62,6 +88,10 @@ struct panthor_gem_object { > > /** @lock.str: Protects access to the @label.str field. */ > > struct mutex lock; > > } label; > > + > > +#ifdef CONFIG_DEBUG_FS > > + struct panthor_gem_debugfs debugfs; > > +#endif > > }; > > > > /** > > @@ -157,4 +187,9 @@ panthor_kernel_bo_create(struct panthor_device *ptdev, > > struct panthor_vm *vm, > > > > void panthor_kernel_bo_destroy(struct panthor_kernel_bo *bo); > > > > +#ifdef CONFIG_DEBUG_FS > > +void panthor_gem_debugfs_print_bos(struct panthor_device *pfdev, > > + struct seq_file *m); > > +#endif > > + > > #endif /* __PANTHOR_GEM_H__ */ Adrian Larumbe