Hi Chao,

On 2019/6/21 17:46, Chao Yu wrote:
> On 2019/6/21 0:07, Gao Xiang wrote:
>> This patch adds a new generic decompression framework
>> in order to replace the old LZ4-specific decompression code.
>>
>> Even though LZ4 is still the only supported algorithm, the new
>> framework is cleaner and makes it easier to integrate new algorithms
>> than the old, almost hard-coded decompression backend.
>>
>> Signed-off-by: Gao Xiang <gaoxian...@huawei.com>
>> ---
>>  drivers/staging/erofs/Makefile       |   2 +-
>>  drivers/staging/erofs/compress.h     |  21 ++
>>  drivers/staging/erofs/decompressor.c | 307 +++++++++++++++++++++++++++
>>  3 files changed, 329 insertions(+), 1 deletion(-)
>>  create mode 100644 drivers/staging/erofs/decompressor.c
>>
>> diff --git a/drivers/staging/erofs/Makefile b/drivers/staging/erofs/Makefile
>> index 84b412c7a991..adeb5d6e2668 100644
>> --- a/drivers/staging/erofs/Makefile
>> +++ b/drivers/staging/erofs/Makefile
>> @@ -9,5 +9,5 @@ obj-$(CONFIG_EROFS_FS) += erofs.o
>>  ccflags-y += -I $(srctree)/$(src)/include
>>  erofs-objs := super.o inode.o data.o namei.o dir.o utils.o
>>  erofs-$(CONFIG_EROFS_FS_XATTR) += xattr.o
>> -erofs-$(CONFIG_EROFS_FS_ZIP) += unzip_vle.o unzip_vle_lz4.o zmap.o
>> +erofs-$(CONFIG_EROFS_FS_ZIP) += unzip_vle.o unzip_vle_lz4.o zmap.o 
>> decompressor.o
>>  
>> diff --git a/drivers/staging/erofs/compress.h b/drivers/staging/erofs/compress.h
>> index 1dcfc3b35118..ebeccb1f4eae 100644
>> --- a/drivers/staging/erofs/compress.h
>> +++ b/drivers/staging/erofs/compress.h
>> @@ -9,6 +9,24 @@
>>  #ifndef __EROFS_FS_COMPRESS_H
>>  #define __EROFS_FS_COMPRESS_H
>>  
>> +#include "internal.h"
>> +
>> +enum {
>> +    Z_EROFS_COMPRESSION_SHIFTED = Z_EROFS_COMPRESSION_MAX,
>> +    Z_EROFS_COMPRESSION_RUNTIME_MAX
>> +};
>> +
>> +struct z_erofs_decompress_req {
>> +    struct page **in, **out;
>> +
>> +    unsigned short pageofs_out;
>> +    unsigned int inputsize, outputsize;
>> +
>> +    /* indicate the algorithm will be used for decompression */
>> +    unsigned int alg;
>> +    bool inplace_io, partial_decoding;
>> +};
>> +
>>  /*
>>   * - 0x5A110C8D ('sallocated', Z_EROFS_MAPPING_STAGING) -
>>   * used to mark temporary allocated pages from other
>> @@ -36,5 +54,8 @@ static inline bool z_erofs_put_stagingpage(struct 
>> list_head *pagepool,
>>      return true;
>>  }
>>  
>> +int z_erofs_decompress(struct z_erofs_decompress_req *rq,
>> +                   struct list_head *pagepool);
>> +
>>  #endif
>>  
>> diff --git a/drivers/staging/erofs/decompressor.c b/drivers/staging/erofs/decompressor.c
>> new file mode 100644
>> index 000000000000..c68d17b579e0
>> --- /dev/null
>> +++ b/drivers/staging/erofs/decompressor.c
>> @@ -0,0 +1,307 @@
>> +// SPDX-License-Identifier: GPL-2.0
>> +/*
>> + * linux/drivers/staging/erofs/decompressor.c
>> + *
>> + * Copyright (C) 2019 HUAWEI, Inc.
>> + *             http://www.huawei.com/
>> + * Created by Gao Xiang <gaoxian...@huawei.com>
>> + */
>> +#include "compress.h"
>> +#include <linux/lz4.h>
>> +
>> +#ifndef LZ4_DISTANCE_MAX    /* history window size */
>> +#define LZ4_DISTANCE_MAX 65535      /* set to maximum value by default */
>> +#endif
>> +
>> +#define LZ4_MAX_DISTANCE_PAGES      DIV_ROUND_UP(LZ4_DISTANCE_MAX, 
>> PAGE_SIZE)
>> +
>> +struct z_erofs_decompressor {
>> +    /*
>> +     * if destpages have sparsed pages, fill them with bounce pages.
>> +     * it also check whether destpages indicate continuous physical memory.
>> +     */
>> +    int (*prepare_destpages)(struct z_erofs_decompress_req *rq,
>> +                             struct list_head *pagepool);
>> +    int (*decompress)(struct z_erofs_decompress_req *rq, u8 *out);
>> +    char *name;
>> +};
>> +
>> +static int lz4_prepare_destpages(struct z_erofs_decompress_req *rq,
>> +                             struct list_head *pagepool)
>> +{
>> +    const unsigned int nr =
>> +            PAGE_ALIGN(rq->pageofs_out + rq->outputsize) >> PAGE_SHIFT;
>> +    struct page *availables[LZ4_MAX_DISTANCE_PAGES] = { NULL };
>> +    unsigned long unused[DIV_ROUND_UP(LZ4_MAX_DISTANCE_PAGES,
>> +                                      BITS_PER_LONG)] = { 0 };
>> +    void *kaddr = NULL;
>> +    unsigned int i, j, k;
>> +
>> +    for (i = 0; i < nr; ++i) {
>> +            struct page *const page = rq->out[i];
>> +
>> +            j = i & (LZ4_MAX_DISTANCE_PAGES - 1);
>> +            if (availables[j])
>> +                    __set_bit(j, unused);
>> +
>> +            if (page) {
>> +                    if (kaddr) {
>> +                            if (kaddr + PAGE_SIZE == page_address(page))
>> +                                    kaddr += PAGE_SIZE;
>> +                            else
>> +                                    kaddr = NULL;
>> +                    } else if (!i) {
>> +                            kaddr = page_address(page);
>> +                    }
>> +                    continue;
>> +            }
>> +            kaddr = NULL;
>> +
>> +            k = find_first_bit(unused, LZ4_MAX_DISTANCE_PAGES);
>> +            if (k < LZ4_MAX_DISTANCE_PAGES) {
>> +                    j = k;
>> +                    get_page(availables[j]);
>> +            } else {
>> +                    DBG_BUGON(availables[j]);
>> +
>> +                    if (!list_empty(pagepool)) {
>> +                            availables[j] = lru_to_page(pagepool);
>> +                            list_del(&availables[j]->lru);
>> +                            DBG_BUGON(page_ref_count(availables[j]) != 1);
>> +                    } else {
>> +                            availables[j] = alloc_pages(GFP_KERNEL, 0);
>> +                            if (!availables[j])
>> +                                    return -ENOMEM;
>> +                    }
>> +                    availables[j]->mapping = Z_EROFS_MAPPING_STAGING;
> 
> Could we use __stagingpage_alloc() here instead of open-coding the
> allocation? There are some differences between the two, though.

It was written this way on purpose: currently __stagingpage_alloc()
allocates all of its pages with GFP_NOFAIL, but memory allocation failure
is acceptable here, so I open-coded the allocation as part of introducing
the new decompression backend.

I will submit another patch after this series to clean up all of the
staging page allocation cases; that is already on my to-do list. :)

Thanks,
Gao Xiang

> 
> Reviewed-by: Chao Yu <yuch...@huawei.com>
> 
> Thanks,
> 
>> +            }
>> +            rq->out[i] = availables[j];
>> +            __clear_bit(j, unused);
>> +    }
>> +    return kaddr ? 1 : 0;
>> +}
>> +
>> +static void *generic_copy_inplace_data(struct z_erofs_decompress_req *rq,
>> +                                   u8 *src, unsigned int pageofs_in)
>> +{
>> +    /*
>> +     * if in-place decompression is ongoing, those decompressed
>> +     * pages should be copied in order to avoid being overlapped.
>> +     */
>> +    struct page **in = rq->in;
>> +    u8 *const tmp = erofs_get_pcpubuf(0);
>> +    u8 *tmpp = tmp;
>> +    unsigned int inlen = rq->inputsize - pageofs_in;
>> +    unsigned int count = min_t(uint, inlen, PAGE_SIZE - pageofs_in);
>> +
>> +    while (tmpp < tmp + inlen) {
>> +            if (!src)
>> +                    src = kmap_atomic(*in);
>> +            memcpy(tmpp, src + pageofs_in, count);
>> +            kunmap_atomic(src);
>> +            src = NULL;
>> +            tmpp += count;
>> +            pageofs_in = 0;
>> +            count = PAGE_SIZE;
>> +            ++in;
>> +    }
>> +    return tmp;
>> +}
>> +
>> +static int lz4_decompress(struct z_erofs_decompress_req *rq, u8 *out)
>> +{
>> +    unsigned int inputmargin, inlen;
>> +    u8 *src;
>> +    bool copied;
>> +    int ret;
>> +
>> +    if (rq->inputsize > PAGE_SIZE)
>> +            return -ENOTSUPP;
>> +
>> +    src = kmap_atomic(*rq->in);
>> +    inputmargin = 0;
>> +    while (!src[inputmargin & ~PAGE_MASK])
>> +            if (!(++inputmargin & ~PAGE_MASK))
>> +                    break;
>> +
>> +    if (inputmargin >= rq->inputsize) {
>> +            kunmap_atomic(src);
>> +            return -EIO;
>> +    }
>> +
>> +    copied = false;
>> +    inlen = rq->inputsize - inputmargin;
>> +    if (rq->inplace_io) {
>> +            src = generic_copy_inplace_data(rq, src, inputmargin);
>> +            inputmargin = 0;
>> +            copied = true;
>> +    }
>> +
>> +    ret = LZ4_decompress_safe_partial(src + inputmargin, out,
>> +                                      inlen, rq->outputsize,
>> +                                      rq->outputsize);
>> +    if (ret < 0) {
>> +            errln("%s, failed to decompress, in[%p, %u, %u] out[%p, %u]",
>> +                  __func__, src + inputmargin, inlen, inputmargin,
>> +                  out, rq->outputsize);
>> +            WARN_ON(1);
>> +            print_hex_dump(KERN_DEBUG, "[ in]: ", DUMP_PREFIX_OFFSET,
>> +                           16, 1, src + inputmargin, inlen, true);
>> +            print_hex_dump(KERN_DEBUG, "[out]: ", DUMP_PREFIX_OFFSET,
>> +                           16, 1, out, rq->outputsize, true);
>> +            ret = -EIO;
>> +    }
>> +
>> +    if (copied)
>> +            erofs_put_pcpubuf(src);
>> +    else
>> +            kunmap_atomic(src);
>> +    return ret;
>> +}
>> +
>> +static struct z_erofs_decompressor decompressors[] = {
>> +    [Z_EROFS_COMPRESSION_SHIFTED] = {
>> +            .name = "shifted"
>> +    },
>> +    [Z_EROFS_COMPRESSION_LZ4] = {
>> +            .prepare_destpages = lz4_prepare_destpages,
>> +            .decompress = lz4_decompress,
>> +            .name = "lz4"
>> +    },
>> +};
>> +
>> +static void copy_from_pcpubuf(struct page **out, const char *dst,
>> +                          unsigned short pageofs_out,
>> +                          unsigned int outputsize)
>> +{
>> +    const char *end = dst + outputsize;
>> +    const unsigned int righthalf = PAGE_SIZE - pageofs_out;
>> +    const char *cur = dst - pageofs_out;
>> +
>> +    while (cur < end) {
>> +            struct page *const page = *out++;
>> +
>> +            if (page) {
>> +                    char *buf = kmap_atomic(page);
>> +
>> +                    if (cur >= dst) {
>> +                            memcpy(buf, cur, min_t(uint, PAGE_SIZE,
>> +                                                   end - cur));
>> +                    } else {
>> +                            memcpy(buf + pageofs_out, cur + pageofs_out,
>> +                                   min_t(uint, righthalf, end - cur));
>> +                    }
>> +                    kunmap_atomic(buf);
>> +            }
>> +            cur += PAGE_SIZE;
>> +    }
>> +}
>> +
>> +static int decompress_generic(struct z_erofs_decompress_req *rq,
>> +                          struct list_head *pagepool)
>> +{
>> +    const unsigned int nrpages_out =
>> +            PAGE_ALIGN(rq->pageofs_out + rq->outputsize) >> PAGE_SHIFT;
>> +    const struct z_erofs_decompressor *alg = decompressors + rq->alg;
>> +    unsigned int dst_maptype;
>> +    void *dst;
>> +    int ret;
>> +
>> +    if (nrpages_out == 1 && !rq->inplace_io) {
>> +            DBG_BUGON(!*rq->out);
>> +            dst = kmap_atomic(*rq->out);
>> +            dst_maptype = 0;
>> +            goto dstmap_out;
>> +    }
>> +
>> +    /*
>> +     * For the case of small output size (especially much less
>> +     * than PAGE_SIZE), memcpy the decompressed data rather than
>> +     * compressed data is preferred.
>> +     */
>> +    if (rq->outputsize <= PAGE_SIZE * 7 / 8) {
>> +            dst = erofs_get_pcpubuf(0);
>> +
>> +            rq->inplace_io = false;
>> +            ret = alg->decompress(rq, dst);
>> +            if (!ret)
>> +                    copy_from_pcpubuf(rq->out, dst, rq->pageofs_out,
>> +                                      rq->outputsize);
>> +
>> +            erofs_put_pcpubuf(dst);
>> +            return ret;
>> +    }
>> +
>> +    ret = alg->prepare_destpages(rq, pagepool);
>> +    if (ret < 0) {
>> +            return ret;
>> +    } else if (ret) {
>> +            dst = page_address(*rq->out);
>> +            dst_maptype = 1;
>> +            goto dstmap_out;
>> +    }
>> +
>> +    dst = erofs_vmap(rq->out, nrpages_out);
>> +    if (!dst)
>> +            return -ENOMEM;
>> +    dst_maptype = 2;
>> +
>> +dstmap_out:
>> +    ret = alg->decompress(rq, dst + rq->pageofs_out);
>> +
>> +    if (!dst_maptype)
>> +            kunmap_atomic(dst);
>> +    else if (dst_maptype == 2)
>> +            erofs_vunmap(dst, nrpages_out);
>> +    return ret;
>> +}
>> +
>> +static int shifted_decompress(const struct z_erofs_decompress_req *rq,
>> +                          struct list_head *pagepool)
>> +{
>> +    const unsigned int nrpages_out =
>> +            PAGE_ALIGN(rq->pageofs_out + rq->outputsize) >> PAGE_SHIFT;
>> +    const unsigned int righthalf = PAGE_SIZE - rq->pageofs_out;
>> +    unsigned char *src, *dst;
>> +
>> +    if (nrpages_out > 2) {
>> +            DBG_BUGON(1);
>> +            return -EIO;
>> +    }
>> +
>> +    if (rq->out[0] == *rq->in) {
>> +            DBG_BUGON(nrpages_out != 1);
>> +            return 0;
>> +    }
>> +
>> +    src = kmap_atomic(*rq->in);
>> +    if (!rq->out[0]) {
>> +            dst = NULL;
>> +    } else {
>> +            dst = kmap_atomic(rq->out[0]);
>> +            memcpy(dst + rq->pageofs_out, src, righthalf);
>> +    }
>> +
>> +    if (rq->out[1] == *rq->in) {
>> +            memmove(src, src + righthalf, rq->pageofs_out);
>> +    } else if (nrpages_out == 2) {
>> +            if (dst)
>> +                    kunmap_atomic(dst);
>> +            DBG_BUGON(!rq->out[1]);
>> +            dst = kmap_atomic(rq->out[1]);
>> +            memcpy(dst, src + righthalf, rq->pageofs_out);
>> +    }
>> +    if (dst)
>> +            kunmap_atomic(dst);
>> +    kunmap_atomic(src);
>> +    return 0;
>> +}
>> +
>> +int z_erofs_decompress(struct z_erofs_decompress_req *rq,
>> +                   struct list_head *pagepool)
>> +{
>> +    if (rq->alg == Z_EROFS_COMPRESSION_SHIFTED)
>> +            return shifted_decompress(rq, pagepool);
>> +    return decompress_generic(rq, pagepool);
>> +}
>> +
>>
_______________________________________________
devel mailing list
de...@linuxdriverproject.org
http://driverdev.linuxdriverproject.org/mailman/listinfo/driverdev-devel

Reply via email to