Hi Christoph,

On Tue, Sep 01, 2020 at 09:36:23AM +0200, Christoph Hellwig wrote:
> I really don't like all the open coded smarts in the various drivers.
> What do you think about a helper like the one in the untested patch

A helper function will be actually better. I was thinking of
one yet not very sure about the naming and where to put it.

> below (on top of your series).  Also please include the original
> segment boundary patch with the next resend so that the series has
> the full context.

I will use your change instead and resend with the ULONG_MAX
change. But in that case, should I make separate changes for
different files like this series, or just one single change
like yours?

Asking this as I was expecting that those changes would get
applied by different maintainers. But now it feels like you
will merge it to your tree at once?

Thanks
Nic

> diff --git a/arch/alpha/kernel/pci_iommu.c b/arch/alpha/kernel/pci_iommu.c
> index 1ef2c647bd3ec2..6f7de4f4e191e7 100644
> --- a/arch/alpha/kernel/pci_iommu.c
> +++ b/arch/alpha/kernel/pci_iommu.c
> @@ -141,10 +141,7 @@ iommu_arena_find_pages(struct device *dev, struct 
> pci_iommu_arena *arena,
>       unsigned long boundary_size;
>  
>       base = arena->dma_base >> PAGE_SHIFT;
> -
> -     boundary_size = dev ? dma_get_seg_boundary(dev) : U32_MAX;
> -     /* Overflow-free shortcut for: ALIGN(b + 1, 1 << s) >> s */
> -     boundary_size = (boundary_size >> PAGE_SHIFT) + 1;
> +     boundary_size = dma_get_seg_boundary_nr_pages(dev, PAGE_SHIFT);
>  
>       /* Search forward for the first mask-aligned sequence of N free ptes */
>       ptes = arena->ptes;
> diff --git a/arch/ia64/hp/common/sba_iommu.c b/arch/ia64/hp/common/sba_iommu.c
> index 945954903bb0ba..b49b73a95067d2 100644
> --- a/arch/ia64/hp/common/sba_iommu.c
> +++ b/arch/ia64/hp/common/sba_iommu.c
> @@ -485,8 +485,7 @@ sba_search_bitmap(struct ioc *ioc, struct device *dev,
>       ASSERT(((unsigned long) ioc->res_hint & (sizeof(unsigned long) - 1UL)) 
> == 0);
>       ASSERT(res_ptr < res_end);
>  
> -     /* Overflow-free shortcut for: ALIGN(b + 1, 1 << s) >> s */
> -     boundary_size = (dma_get_seg_boundary(dev) >> iovp_shift) + 1;
> +     boundary_size = dma_get_seg_boundary_nr_pages(dev, iovp_shift);
>  
>       BUG_ON(ioc->ibase & ~iovp_mask);
>       shift = ioc->ibase >> iovp_shift;
> diff --git a/arch/powerpc/kernel/iommu.c b/arch/powerpc/kernel/iommu.c
> index c01ccbf8afdd42..cbc2e62db597cf 100644
> --- a/arch/powerpc/kernel/iommu.c
> +++ b/arch/powerpc/kernel/iommu.c
> @@ -236,11 +236,7 @@ static unsigned long iommu_range_alloc(struct device 
> *dev,
>               }
>       }
>  
> -     /* 4GB boundary for iseries_hv_alloc and iseries_hv_map */
> -     boundary_size = dev ? dma_get_seg_boundary(dev) : U32_MAX;
> -
> -     /* Overflow-free shortcut for: ALIGN(b + 1, 1 << s) >> s */
> -     boundary_size = (boundary_size >> tbl->it_page_shift) + 1;
> +     boundary_size = dma_get_seg_boundary_nr_pages(dev, tbl->it_page_shift);
>  
>       n = iommu_area_alloc(tbl->it_map, limit, start, npages, tbl->it_offset,
>                            boundary_size, align_mask);
> diff --git a/arch/s390/pci/pci_dma.c b/arch/s390/pci/pci_dma.c
> index ecb067acc6d532..4a37d8f4de9d9d 100644
> --- a/arch/s390/pci/pci_dma.c
> +++ b/arch/s390/pci/pci_dma.c
> @@ -261,13 +261,11 @@ static unsigned long __dma_alloc_iommu(struct device 
> *dev,
>                                      unsigned long start, int size)
>  {
>       struct zpci_dev *zdev = to_zpci(to_pci_dev(dev));
> -     unsigned long boundary_size;
>  
> -     /* Overflow-free shortcut for: ALIGN(b + 1, 1 << s) >> s */
> -     boundary_size = (dma_get_seg_boundary(dev) >> PAGE_SHIFT) + 1;
>       return iommu_area_alloc(zdev->iommu_bitmap, zdev->iommu_pages,
>                               start, size, zdev->start_dma >> PAGE_SHIFT,
> -                             boundary_size, 0);
> +                             dma_get_seg_boundary_nr_pages(dev, PAGE_SHIFT),
> +                             0);
>  }
>  
>  static dma_addr_t dma_alloc_address(struct device *dev, int size)
> diff --git a/arch/sparc/kernel/iommu-common.c 
> b/arch/sparc/kernel/iommu-common.c
> index 843e71894d0482..e6139c99762e11 100644
> --- a/arch/sparc/kernel/iommu-common.c
> +++ b/arch/sparc/kernel/iommu-common.c
> @@ -166,10 +166,6 @@ unsigned long iommu_tbl_range_alloc(struct device *dev,
>               }
>       }
>  
> -     boundary_size = dev ? dma_get_seg_boundary(dev) : U32_MAX;
> -
> -     /* Overflow-free shortcut for: ALIGN(b + 1, 1 << s) >> s */
> -     boundary_size = (boundary_size >> iommu->table_shift) + 1;
>       /*
>        * if the skip_span_boundary_check had been set during init, we set
>        * things up so that iommu_is_span_boundary() merely checks if the
> @@ -178,7 +174,11 @@ unsigned long iommu_tbl_range_alloc(struct device *dev,
>       if ((iommu->flags & IOMMU_NO_SPAN_BOUND) != 0) {
>               shift = 0;
>               boundary_size = iommu->poolsize * iommu->nr_pools;
> +     } else {
> +             boundary_size = dma_get_seg_boundary_nr_pages(dev,
> +                                     iommu->table_shift);
>       }
> +
>       n = iommu_area_alloc(iommu->map, limit, start, npages, shift,
>                            boundary_size, align_mask);
>       if (n == -1) {
> diff --git a/arch/sparc/kernel/iommu.c b/arch/sparc/kernel/iommu.c
> index d981c37305ae31..c3e4e2df26a8b8 100644
> --- a/arch/sparc/kernel/iommu.c
> +++ b/arch/sparc/kernel/iommu.c
> @@ -472,8 +472,7 @@ static int dma_4u_map_sg(struct device *dev, struct 
> scatterlist *sglist,
>       outs->dma_length = 0;
>  
>       max_seg_size = dma_get_max_seg_size(dev);
> -     /* Overflow-free shortcut for: ALIGN(b + 1, 1 << s) >> s */
> -     seg_boundary_size = (dma_get_seg_boundary(dev) >> IO_PAGE_SHIFT) + 1;
> +     seg_boundary_size = dma_get_seg_boundary_nr_pages(dev, IO_PAGE_SHIFT);
>       base_shift = iommu->tbl.table_map_base >> IO_PAGE_SHIFT;
>       for_each_sg(sglist, s, nelems, i) {
>               unsigned long paddr, npages, entry, out_entry = 0, slen;
> diff --git a/arch/sparc/kernel/pci_sun4v.c b/arch/sparc/kernel/pci_sun4v.c
> index 233fe8a20cec33..6b92dd51c0026f 100644
> --- a/arch/sparc/kernel/pci_sun4v.c
> +++ b/arch/sparc/kernel/pci_sun4v.c
> @@ -508,8 +508,7 @@ static int dma_4v_map_sg(struct device *dev, struct 
> scatterlist *sglist,
>       iommu_batch_start(dev, prot, ~0UL);
>  
>       max_seg_size = dma_get_max_seg_size(dev);
> -     /* Overflow-free shortcut for: ALIGN(b + 1, 1 << s) >> s */
> -     seg_boundary_size = (dma_get_seg_boundary(dev) >> IO_PAGE_SHIFT) + 1;
> +     seg_boundary_size = dma_get_seg_boundary_nr_pages(dev, IO_PAGE_SHIFT);
>  
>       mask = *dev->dma_mask;
>       if (!iommu_use_atu(iommu, mask))
> diff --git a/arch/x86/kernel/amd_gart_64.c b/arch/x86/kernel/amd_gart_64.c
> index 7fa0bb490065a1..bccc5357bffd6c 100644
> --- a/arch/x86/kernel/amd_gart_64.c
> +++ b/arch/x86/kernel/amd_gart_64.c
> @@ -96,8 +96,7 @@ static unsigned long alloc_iommu(struct device *dev, int 
> size,
>  
>       base_index = ALIGN(iommu_bus_base & dma_get_seg_boundary(dev),
>                          PAGE_SIZE) >> PAGE_SHIFT;
> -     /* Overflow-free shortcut for: ALIGN(b + 1, 1 << s) >> s */
> -     boundary_size = (dma_get_seg_boundary(dev) >> PAGE_SHIFT) + 1;
> +     boundary_size = dma_get_seg_boundary_nr_pages(dev, PAGE_SHIFT);
>  
>       spin_lock_irqsave(&iommu_bitmap_lock, flags);
>       offset = iommu_area_alloc(iommu_gart_bitmap, iommu_pages, next_bit,
> diff --git a/drivers/parisc/ccio-dma.c b/drivers/parisc/ccio-dma.c
> index c667d6aba7646e..ba16b7f8f80612 100644
> --- a/drivers/parisc/ccio-dma.c
> +++ b/drivers/parisc/ccio-dma.c
> @@ -356,8 +356,7 @@ ccio_alloc_range(struct ioc *ioc, struct device *dev, 
> size_t size)
>       ** ggg sacrifices another 710 to the computer gods.
>       */
>  
> -     /* Overflow-free shortcut for: ALIGN(b + 1, 1 << s) >> s */
> -     boundary_size = (dma_get_seg_boundary(dev) >> IOVP_SHIFT) + 1;
> +     boundary_size = dma_get_seg_boundary_nr_pages(dev, IOVP_SHIFT);
>  
>       if (pages_needed <= 8) {
>               /*
> diff --git a/drivers/parisc/sba_iommu.c b/drivers/parisc/sba_iommu.c
> index 96bc2c617cbd19..959bda193b9603 100644
> --- a/drivers/parisc/sba_iommu.c
> +++ b/drivers/parisc/sba_iommu.c
> @@ -342,8 +342,7 @@ sba_search_bitmap(struct ioc *ioc, struct device *dev,
>       unsigned long shift;
>       int ret;
>  
> -     /* Overflow-free shortcut for: ALIGN(b + 1, 1 << s) >> s */
> -     boundary_size = (dma_get_seg_boundary(dev) >> IOVP_SHIFT) + 1;
> +     boundary_size = dma_get_seg_boundary_nr_pages(dev, IOVP_SHIFT);
>  
>  #if defined(ZX1_SUPPORT)
>       BUG_ON(ioc->ibase & ~IOVP_MASK);
> diff --git a/include/linux/dma-mapping.h b/include/linux/dma-mapping.h
> index 52635e91143b25..7477a164500adb 100644
> --- a/include/linux/dma-mapping.h
> +++ b/include/linux/dma-mapping.h
> @@ -632,6 +632,25 @@ static inline unsigned long dma_get_seg_boundary(struct 
> device *dev)
>       return DMA_BIT_MASK(32);
>  }
>  
> +/**
> + * dma_get_seg_boundary_nr_pages - return the segment boundary in "page" 
> units
> + * @dev: device to guery the boundary for
> + * @page_shift: ilog() of the the IOMMU page size
> + *
> + * Return the segment boundary in IOMMU page units (which may be different 
> from
> + * the CPU page size) for the passed in device.
> + *
> + * If @dev is NULL a boundary of U32_MAX is assumed, this case is just for
> + * non-DMA API callers.
> + */
> +static inline unsigned long dma_get_seg_boundary_nr_pages(struct device *dev,
> +             unsigned int page_shift)
> +{
> +     if (!dev)
> +             return (U32_MAX >> page_shift) + 1;
> +     return (dma_get_seg_boundary(dev) >> page_shift) + 1;
> +}
> +
>  static inline int dma_set_seg_boundary(struct device *dev, unsigned long 
> mask)
>  {
>       if (dev->dma_parms) {

Reply via email to