A user can invoke mmap_action_map_kernel_pages() to specify that the
mapping should map kernel pages starting from desc->start of a specified
number of pages specified in an array.

In order to implement this, adjust mmap_action_prepare() to be able to
return an error code, as it makes sense to assert that the specified
parameters are valid as quickly as possible as well as updating the VMA
flags to include VMA_MIXEDMAP_BIT as necessary.

This provides an mmap_prepare equivalent of vm_insert_pages().

We additionally update the existing vm_insert_pages() code to use
range_in_vma() and add a new range_in_vma_desc() helper function for the
mmap_prepare case, sharing the code between the two in range_is_subset().

We add both mmap_action_map_kernel_pages() and
mmap_action_map_kernel_pages_full() to allow for both partial and full VMA
mappings.

We also add mmap_action_map_kernel_pages_discontig() to allow for
discontiguous mapping of kernel pages should the need arise.

We update the documentation to reflect the new features.

Finally, we update the VMA tests accordingly to reflect the changes.

Signed-off-by: Lorenzo Stoakes (Oracle) <[email protected]>
---
 Documentation/filesystems/mmap_prepare.rst |  8 ++
 include/linux/mm.h                         | 94 +++++++++++++++++++++-
 include/linux/mm_types.h                   |  7 ++
 mm/memory.c                                | 42 +++++++++-
 mm/util.c                                  |  6 ++
 tools/testing/vma/include/dup.h            |  7 ++
 6 files changed, 159 insertions(+), 5 deletions(-)

diff --git a/Documentation/filesystems/mmap_prepare.rst 
b/Documentation/filesystems/mmap_prepare.rst
index d21406848bca..f89718285869 100644
--- a/Documentation/filesystems/mmap_prepare.rst
+++ b/Documentation/filesystems/mmap_prepare.rst
@@ -129,5 +129,13 @@ pointer. These are:
 * `mmap_action_simple_ioremap()` - Sets up an I/O remap from a specified
   physical address and over a specified length.
 
+* `mmap_action_map_kernel_pages()` - Maps a specified array of `struct page`
+  pointers in the VMA from a specific offset.
+
+* `mmap_action_map_kernel_pages_full()` - Maps a specified array of `struct
+  page` pointers over the entire VMA. The caller must ensure there are
+  sufficient entries in the page array to cover the entire range of the
+  described VMA.
+
 **NOTE:** The 'action' field should never normally be manipulated directly,
 rather you ought to use one of these helpers.
diff --git a/include/linux/mm.h b/include/linux/mm.h
index 88f42faeb377..88ad5649c02d 100644
--- a/include/linux/mm.h
+++ b/include/linux/mm.h
@@ -4160,6 +4160,45 @@ static inline void mmap_action_simple_ioremap(struct 
vm_area_desc *desc,
        action->type = MMAP_SIMPLE_IO_REMAP;
 }
 
+/**
+ * mmap_action_map_kernel_pages - helper for mmap_prepare hook to specify that
+ * @num kernel pages contained in the @pages array should be mapped to userland
+ * starting at virtual address @start.
+ * @desc: The VMA descriptor for the VMA requiring kernel pags to be mapped.
+ * @start: The virtual address from which to map them.
+ * @pages: An array of struct page pointers describing the memory to map.
+ * @nr_pages: The number of entries in the @pages aray.
+ */
+static inline void mmap_action_map_kernel_pages(struct vm_area_desc *desc,
+               unsigned long start, struct page **pages,
+               unsigned long nr_pages)
+{
+       struct mmap_action *action = &desc->action;
+
+       action->type = MMAP_MAP_KERNEL_PAGES;
+       action->map_kernel.start = start;
+       action->map_kernel.pages = pages;
+       action->map_kernel.nr_pages = nr_pages;
+       action->map_kernel.pgoff = desc->pgoff;
+}
+
+/**
+ * mmap_action_map_kernel_pages_full - helper for mmap_prepare hook to specify 
that
+ * kernel pages contained in the @pages array should be mapped to userland
+ * from @desc->start to @desc->end.
+ * @desc: The VMA descriptor for the VMA requiring kernel pags to be mapped.
+ * @pages: An array of struct page pointers describing the memory to map.
+ *
+ * The caller must ensure that @pages contains sufficient entries to cover the
+ * entire range described by @desc.
+ */
+static inline void mmap_action_map_kernel_pages_full(struct vm_area_desc *desc,
+               struct page **pages)
+{
+       mmap_action_map_kernel_pages(desc, desc->start, pages,
+                                    vma_desc_pages(desc));
+}
+
 int mmap_action_prepare(struct vm_area_desc *desc,
                        struct mmap_action *action);
 int mmap_action_complete(struct vm_area_struct *vma,
@@ -4177,10 +4216,59 @@ static inline struct vm_area_struct 
*find_exact_vma(struct mm_struct *mm,
        return vma;
 }
 
+/**
+ * range_is_subset - Is the specified inner range a subset of the outer range?
+ * @outer_start: The start of the outer range.
+ * @outer_end: The exclusive end of the outer range.
+ * @inner_start: The start of the inner range.
+ * @inner_end: The exclusive end of the inner range.
+ *
+ * Returns %true if [inner_start, inner_end) is a subset of [outer_start,
+ * outer_end), otherwise %false.
+ */
+static inline bool range_is_subset(unsigned long outer_start,
+                                  unsigned long outer_end,
+                                  unsigned long inner_start,
+                                  unsigned long inner_end)
+{
+       return outer_start <= inner_start && inner_end <= outer_end;
+}
+
+/**
+ * range_in_vma - is the specified [@start, @end) range a subset of the VMA?
+ * @vma: The VMA against which we want to check [@start, @end).
+ * @start: The start of the range we wish to check.
+ * @end: The exclusive end of the range we wish to check.
+ *
+ * Returns %true if [@start, @end) is a subset of [@vma->vm_start,
+ * @vma->vm_end), %false otherwise.
+ */
 static inline bool range_in_vma(const struct vm_area_struct *vma,
                                unsigned long start, unsigned long end)
 {
-       return (vma && vma->vm_start <= start && end <= vma->vm_end);
+       if (!vma)
+               return false;
+
+       return range_is_subset(vma->vm_start, vma->vm_end, start, end);
+}
+
+/**
+ * range_in_vma_desc - is the specified [@start, @end) range a subset of the 
VMA
+ * described by @desc, a VMA descriptor?
+ * @desc: The VMA descriptor against which we want to check [@start, @end).
+ * @start: The start of the range we wish to check.
+ * @end: The exclusive end of the range we wish to check.
+ *
+ * Returns %true if [@start, @end) is a subset of [@desc->start, @desc->end),
+ * %false otherwise.
+ */
+static inline bool range_in_vma_desc(const struct vm_area_desc *desc,
+                                    unsigned long start, unsigned long end)
+{
+       if (!desc)
+               return false;
+
+       return range_is_subset(desc->start, desc->end, start, end);
 }
 
 #ifdef CONFIG_MMU
@@ -4212,6 +4300,10 @@ int remap_pfn_range(struct vm_area_struct *vma, unsigned 
long addr,
 int vm_insert_page(struct vm_area_struct *, unsigned long addr, struct page *);
 int vm_insert_pages(struct vm_area_struct *vma, unsigned long addr,
                        struct page **pages, unsigned long *num);
+int map_kernel_pages_prepare(struct vm_area_desc *desc,
+                            struct mmap_action *action);
+int map_kernel_pages_complete(struct vm_area_struct *vma,
+                             struct mmap_action *action);
 int vm_map_pages(struct vm_area_struct *vma, struct page **pages,
                                unsigned long num);
 int vm_map_pages_zero(struct vm_area_struct *vma, struct page **pages,
diff --git a/include/linux/mm_types.h b/include/linux/mm_types.h
index 316bb0adf91d..6e7a399f0724 100644
--- a/include/linux/mm_types.h
+++ b/include/linux/mm_types.h
@@ -815,6 +815,7 @@ enum mmap_action_type {
        MMAP_REMAP_PFN,         /* Remap PFN range. */
        MMAP_IO_REMAP_PFN,      /* I/O remap PFN range. */
        MMAP_SIMPLE_IO_REMAP,   /* I/O remap with guardrails. */
+       MMAP_MAP_KERNEL_PAGES,  /* Map kernel page range from array. */
 };
 
 /*
@@ -833,6 +834,12 @@ struct mmap_action {
                        phys_addr_t start_phys_addr;
                        unsigned long size;
                } simple_ioremap;
+               struct {
+                       unsigned long start;
+                       struct page **pages;
+                       unsigned long nr_pages;
+                       pgoff_t pgoff;
+               } map_kernel;
        };
        enum mmap_action_type type;
 
diff --git a/mm/memory.c b/mm/memory.c
index 351cc917b7aa..608a98c4c947 100644
--- a/mm/memory.c
+++ b/mm/memory.c
@@ -2484,13 +2484,14 @@ static int insert_pages(struct vm_area_struct *vma, 
unsigned long addr,
 int vm_insert_pages(struct vm_area_struct *vma, unsigned long addr,
                        struct page **pages, unsigned long *num)
 {
-       const unsigned long end_addr = addr + (*num * PAGE_SIZE) - 1;
+       const unsigned long nr_pages = *num;
+       const unsigned long end = addr + PAGE_SIZE * nr_pages;
 
-       if (addr < vma->vm_start || end_addr >= vma->vm_end)
+       if (!range_in_vma(vma, addr, end))
                return -EFAULT;
        if (!(vma->vm_flags & VM_MIXEDMAP)) {
-               BUG_ON(mmap_read_trylock(vma->vm_mm));
-               BUG_ON(vma->vm_flags & VM_PFNMAP);
+               VM_WARN_ON_ONCE(mmap_read_trylock(vma->vm_mm));
+               VM_WARN_ON_ONCE(vma->vm_flags & VM_PFNMAP);
                vm_flags_set(vma, VM_MIXEDMAP);
        }
        /* Defer page refcount checking till we're about to map that page. */
@@ -2498,6 +2499,39 @@ int vm_insert_pages(struct vm_area_struct *vma, unsigned 
long addr,
 }
 EXPORT_SYMBOL(vm_insert_pages);
 
+int map_kernel_pages_prepare(struct vm_area_desc *desc,
+                            struct mmap_action *action)
+{
+       const unsigned long addr = action->map_kernel.start;
+       unsigned long nr_pages, end;
+
+       if (!vma_desc_test(desc, VMA_MIXEDMAP_BIT)) {
+               VM_WARN_ON_ONCE(mmap_read_trylock(desc->mm));
+               VM_WARN_ON_ONCE(vma_desc_test(desc, VMA_PFNMAP_BIT));
+               vma_desc_set_flags(desc, VMA_MIXEDMAP_BIT);
+       }
+
+       nr_pages = action->map_kernel.nr_pages;
+       end = addr + PAGE_SIZE * nr_pages;
+       if (!range_in_vma_desc(desc, addr, end))
+               return -EFAULT;
+
+       return 0;
+}
+EXPORT_SYMBOL(map_kernel_pages_prepare);
+
+int map_kernel_pages_complete(struct vm_area_struct *vma,
+                             struct mmap_action *action)
+{
+       unsigned long nr_pages;
+
+       nr_pages = action->map_kernel.nr_pages;
+       return insert_pages(vma, action->map_kernel.start,
+                           action->map_kernel.pages,
+                           &nr_pages, vma->vm_page_prot);
+}
+EXPORT_SYMBOL(map_kernel_pages_complete);
+
 /**
  * vm_insert_page - insert single page into user vma
  * @vma: user vma to map to
diff --git a/mm/util.c b/mm/util.c
index e739d7c0311c..7934e303b230 100644
--- a/mm/util.c
+++ b/mm/util.c
@@ -1445,6 +1445,8 @@ int mmap_action_prepare(struct vm_area_desc *desc,
                return io_remap_pfn_range_prepare(desc, action);
        case MMAP_SIMPLE_IO_REMAP:
                return simple_ioremap_prepare(desc, action);
+       case MMAP_MAP_KERNEL_PAGES:
+               return map_kernel_pages_prepare(desc, action);
        }
 }
 EXPORT_SYMBOL(mmap_action_prepare);
@@ -1473,6 +1475,9 @@ int mmap_action_complete(struct vm_area_struct *vma,
        case MMAP_IO_REMAP_PFN:
                err = io_remap_pfn_range_complete(vma, action);
                break;
+       case MMAP_MAP_KERNEL_PAGES:
+               err = map_kernel_pages_complete(vma, action);
+               break;
        case MMAP_SIMPLE_IO_REMAP:
                /*
                 * The simple I/O remap should have been delegated to an I/O
@@ -1496,6 +1501,7 @@ int mmap_action_prepare(struct vm_area_desc *desc,
        case MMAP_REMAP_PFN:
        case MMAP_IO_REMAP_PFN:
        case MMAP_SIMPLE_IO_REMAP:
+       case MMAP_MAP_KERNEL_PAGES:
                WARN_ON_ONCE(1); /* nommu cannot handle these. */
                break;
        }
diff --git a/tools/testing/vma/include/dup.h b/tools/testing/vma/include/dup.h
index 4f2c9bb6b1ea..50ef2f62150d 100644
--- a/tools/testing/vma/include/dup.h
+++ b/tools/testing/vma/include/dup.h
@@ -425,6 +425,7 @@ enum mmap_action_type {
        MMAP_REMAP_PFN,         /* Remap PFN range. */
        MMAP_IO_REMAP_PFN,      /* I/O remap PFN range. */
        MMAP_SIMPLE_IO_REMAP,   /* I/O remap with guardrails. */
+       MMAP_MAP_KERNEL_PAGES,  /* Map kernel page range from an array. */
 };
 
 /*
@@ -443,6 +444,12 @@ struct mmap_action {
                        phys_addr_t start;
                        unsigned long len;
                } simple_ioremap;
+               struct {
+                       unsigned long start;
+                       struct page **pages;
+                       unsigned long num;
+                       pgoff_t pgoff;
+               } map_kernel;
        };
        enum mmap_action_type type;
 
-- 
2.53.0


Reply via email to