Hi Fengchengwen,

> 
> On 2023/11/3 23:38, Gowrishankar Muthukrishnan wrote:
> > Add scatter-gather copy tests.
> >
> > Signed-off-by: Vidya Sagar Velumuri <vvelum...@marvell.com>
> > Signed-off-by: Gowrishankar Muthukrishnan <gmuthukri...@marvell.com>
> > ---
> >  app/test/test_dmadev.c     | 132 +++++++++++++++++++++++++++++-
> >  app/test/test_dmadev_api.c | 163 ++++++++++++++++++++++++++++++++++-
> --
> >  app/test/test_dmadev_api.h |   2 +
> >  3 files changed, 283 insertions(+), 14 deletions(-)
> >
> > diff --git a/app/test/test_dmadev.c b/app/test/test_dmadev.c index
> > 780941fc1e..a2f3a7f999 100644
> > --- a/app/test/test_dmadev.c
> > +++ b/app/test/test_dmadev.c
> > @@ -19,7 +19,7 @@
> >  #define ERR_RETURN(...) do { print_err(__func__, __LINE__,
> > __VA_ARGS__); return -1; } while (0)
> >
> >  #define TEST_RINGSIZE 512
> > -#define COPY_LEN 1024
> > +#define COPY_LEN 1032
> 
> The test MAX_SG_NUM is limit 4, so it could be 1/2/3/4 segment, and 1032 can
> both div 1/2/3/4, but 1024 couldn't
> 
> I think this is why change 1024->1032.
> Suggest add some comment about it.
>

This change is not required after normalization as done in next patch.
 
> >
> >  static struct rte_mempool *pool;
> >  static int16_t test_dev_id;
> > @@ -396,6 +396,120 @@ test_stop_start(int16_t dev_id, uint16_t vchan)
> >     return 0;
> >  }
> >
> > +static int
> > +test_enqueue_sg_copies(int16_t dev_id, uint16_t vchan) {
> > +   unsigned int src_len, dst_len, n_sge, len, i, j, k;
> > +   char orig_src[COPY_LEN], orig_dst[COPY_LEN];
> > +   struct rte_dma_info info = { 0 };
> > +   enum rte_dma_status_code status;
> > +   uint16_t id, n_src, n_dst;
> > +
> > +   if (rte_dma_info_get(dev_id, &info) < 0)
> > +           ERR_RETURN("Failed to get dev info");
> > +
> > +   n_sge = RTE_MIN(info.max_sges, TEST_SG_MAX);
> > +   len = COPY_LEN;
> > +
> > +   for (n_src = 1; n_src <= n_sge; n_src++) {
> > +           src_len = len / n_src;
> > +           for (n_dst = 1; n_dst <= n_sge; n_dst++) {
> > +                   dst_len = len / n_dst;
> 
> If the len % [1~n_dst] not zero, how to process it ?
> 
> I see, it was ensured by adjust copy_len value. Suggest add comments for it.
> 
> Also suggest extra above to one function.

I have added minor fix here to normalize buffer lengths. Please check in next 
patch version.
> 
> > +
> > +                   struct rte_dma_sge sg_src[n_sge], sg_dst[n_sge];
> > +                   struct rte_mbuf *src[n_sge], *dst[n_sge];
> > +                   char *src_data[n_sge], *dst_data[n_sge];
> > +
> > +                   for (i = 0 ; i < COPY_LEN; i++)
> > +                           orig_src[i] = rte_rand() & 0xFF;
> > +
> > +                   memset(orig_dst, 0, COPY_LEN);
> > +
> > +                   for (i = 0; i < n_src; i++) {
> > +                           src[i] = rte_pktmbuf_alloc(pool);
> > +                           RTE_ASSERT(src[i] != NULL);
> > +                           sg_src[i].addr = rte_pktmbuf_iova(src[i]);
> > +                           sg_src[i].length = src_len;
> > +                           src_data[i] = rte_pktmbuf_mtod(src[i], char *);
> > +                   }
> > +
> > +                   for (k = 0; k < n_dst; k++) {
> > +                           dst[k] = rte_pktmbuf_alloc(pool);
> > +                           RTE_ASSERT(dst[k] != NULL);
> > +                           sg_dst[k].addr = rte_pktmbuf_iova(dst[k]);
> > +                           sg_dst[k].length = dst_len;
> > +                           dst_data[k] = rte_pktmbuf_mtod(dst[k], char
> *);
> > +                   }
> > +
> > +                   for (i = 0; i < n_src; i++) {
> > +                           for (j = 0; j < src_len; j++)
> > +                                   src_data[i][j] = orig_src[i * src_len + 
> > j];
> > +                   }
> > +
> > +                   for (k = 0; k < n_dst; k++)
> > +                           memset(dst_data[k], 0, dst_len);
> > +
> > +                   printf("\tsrc segs: %2d [seg len: %4d] - dst segs: %2d
> [seg len : %4d]\n",
> > +                           n_src, src_len, n_dst, dst_len);
> > +
> > +                   id = rte_dma_copy_sg(dev_id, vchan, sg_src, sg_dst,
> n_src, n_dst,
> > +                                        RTE_DMA_OP_FLAG_SUBMIT);
> > +
> > +                   if (id != id_count)
> > +                           ERR_RETURN("Error with rte_dma_copy_sg,
> got %u, expected %u\n",
> > +                                   id, id_count);
> > +
> > +                   /* Give time for copy to finish, then check it was done
> */
> > +                   await_hw(dev_id, vchan);
> > +
> > +                   for (k = 0; k < n_dst; k++)
> > +                           memcpy((&orig_dst[0] + k * dst_len),
> dst_data[k], dst_len);
> > +
> > +                   if (memcmp(orig_src, orig_dst, COPY_LEN))
> > +                           ERR_RETURN("Data mismatch");
> > +
> > +                   /* Verify completion */
> > +                   id = ~id;
> > +                   if (rte_dma_completed(dev_id, vchan, 1, &id, NULL) !=
> 1)
> > +                           ERR_RETURN("Error with
> rte_dma_completed\n");
> > +
> > +                   /* Verify expected index(id_count) */
> > +                   if (id != id_count)
> > +                           ERR_RETURN("Error:incorrect job id received,
> %u [expected %u]\n",
> > +                                           id, id_count);
> > +
> > +                   /* Check for completed and id when no job done */
> > +                   id = ~id;
> > +                   if (rte_dma_completed(dev_id, vchan, 1, &id, NULL) !=
> 0)
> > +                           ERR_RETURN("Error with rte_dma_completed
> when no job done\n");
> > +
> > +                   if (id != id_count)
> > +                           ERR_RETURN("Error:incorrect job id received
> when no job done, %u [expected %u]\n",
> > +                                      id, id_count);
> > +
> > +                   /* Check for completed_status and id when no job done
> */
> > +                   id = ~id;
> > +                   if (rte_dma_completed_status(dev_id, vchan, 1, &id,
> &status) != 0)
> > +                           ERR_RETURN("Error with
> rte_dma_completed_status when no job done\n");
> > +                   if (id != id_count)
> > +                           ERR_RETURN("Error:incorrect job id received
> when no job done, %u [expected %u]\n",
> > +                                           id, 0);
> > +
> > +                   for (i = 0; i < n_src; i++)
> > +                           rte_pktmbuf_free(src[i]);
> > +                   for (i = 0; i < n_dst; i++)
> > +                           rte_pktmbuf_free(dst[i]);
> > +
> > +                   /* Verify that completion returns nothing more */
> > +                   if (rte_dma_completed(dev_id, 0, 1, NULL, NULL) != 0)
> > +                           ERR_RETURN("Error with rte_dma_completed
> in empty check\n");
> 
> already verify this, no need do more

But this is against empty param check (as it is also done in plain copy test).

> 
> > +
> > +                   id_count++;
> > +           }
> > +   }
> > +   return 0;
> > +}
> > +
> >  /* Failure handling test cases - global macros and variables for those 
> > tests*/
> >  #define COMP_BURST_SZ      16
> >  #define OPT_FENCE(idx) ((fence && idx == 8) ? RTE_DMA_OP_FLAG_FENCE :
> > 0) @@ -1003,7 +1117,7 @@ test_dmadev_setup(void)
> >                     TEST_RINGSIZE * 2, /* n == num elements */
> >                     32,  /* cache size */
> >                     0,   /* priv size */
> > -                   2048, /* data room size */
> > +                   COPY_LEN + RTE_PKTMBUF_HEADROOM, /* data
> room size */
> >                     info.numa_node);
> >     if (pool == NULL)
> >             ERR_RETURN("Error with mempool creation\n"); @@ -1026,6
> +1140,7 @@
> > test_dmadev_instance(int16_t dev_id)
> >  #define CHECK_ERRS    true
> >     enum {
> >               TEST_COPY = 0,
> > +             TEST_COPY_SG,
> >               TEST_START,
> >               TEST_BURST,
> >               TEST_ERR,
> > @@ -1060,6 +1175,13 @@ test_dmadev_instance(int16_t dev_id)
> >     param[TEST_COPY].vchan = vchan;
> >     param[TEST_COPY].check_err_stats = CHECK_ERRS;
> >
> > +   param[TEST_COPY_SG].printable = "copy";
> 
> should be SG copy.

Ack.
> 
> > +   param[TEST_COPY_SG].test_fn = test_enqueue_sg_copies;
> > +   param[TEST_COPY_SG].iterations = 1;
> > +   param[TEST_COPY_SG].dev_id = dev_id;
> > +   param[TEST_COPY_SG].vchan = vchan;
> > +   param[TEST_COPY_SG].check_err_stats = CHECK_ERRS;
> > +
> >     param[TEST_START].printable = "stop-start";
> >     param[TEST_START].test_fn = test_stop_start;
> >     param[TEST_START].iterations = 1;
> > @@ -1122,6 +1244,12 @@ test_dmadev_instance(int16_t dev_id)
> >     /* run tests stopping/starting devices and check jobs still work after
> restart */
> >     ts->unit_test_cases[TEST_START].enabled = 1;
> >
> > +   /* run SG test cases */
> > +   if ((dev_info.dev_capa & RTE_DMA_CAPA_OPS_COPY_SG) == 0)
> > +           printf("DMA Dev %u: No SG support, skipping SG copy tests\n",
> dev_id);
> > +   else
> > +           ts->unit_test_cases[TEST_COPY_SG].enabled = 1;
> 
> suggest wrap it as test_dmadev_sg_copy_setup, just like
> test_dmadev_burst_setup
> 
> > +
> >     /* run some burst capacity tests */
> >     ts->unit_test_cases[TEST_BURST].setup = test_dmadev_burst_setup;
> >     ts->unit_test_cases[TEST_BURST].enabled = 1; diff --git
> > a/app/test/test_dmadev_api.c b/app/test/test_dmadev_api.c index
> > aa07d2b359..37e43c9336 100644
> > --- a/app/test/test_dmadev_api.c
> > +++ b/app/test/test_dmadev_api.c
> > @@ -10,6 +10,7 @@
> >  #include <rte_dmadev.h>
> >
> >  #include "test.h"
> > +#include "test_dmadev_api.h"
> >
> >  extern int test_dma_api(uint16_t dev_id);
> >
> > @@ -21,36 +22,62 @@ static int16_t invalid_dev_id;
> >
> >  static char *src;
> >  static char *dst;
> > +static char *src_sg[TEST_SG_MAX];
> > +static char *dst_sg[TEST_SG_MAX];
> >
> >  static int
> >  testsuite_setup(void)
> >  {
> >     invalid_dev_id = -1;
> > -
> > -   src = rte_malloc("dmadev_test_src", TEST_MEMCPY_SIZE, 0);
> > -   if (src == NULL)
> > -           return -ENOMEM;
> > -   dst = rte_malloc("dmadev_test_dst", TEST_MEMCPY_SIZE, 0);
> > -   if (dst == NULL) {
> > -           rte_free(src);
> > -           src = NULL;
> > -           return -ENOMEM;
> > +   int i, rc = 0;
> > +
> > +   for (i = 0; i < TEST_SG_MAX; i++) {
> > +           src_sg[i] = rte_malloc("dmadev_test_src", TEST_MEMCPY_SIZE,
> 0);
> > +           if (src_sg[i] == NULL) {
> > +                   rc = -ENOMEM;
> > +                   goto exit;
> > +           }
> > +
> > +           dst_sg[i] = rte_malloc("dmadev_test_dst", TEST_MEMCPY_SIZE,
> 0);
> > +           if (dst_sg[i] == NULL) {
> > +                   rte_free(src_sg[i]);
> > +                   src_sg[i] = NULL;
> > +                   rc = -ENOMEM;
> > +                   goto exit;
> > +           }
> >     }
> >
> > +   src = src_sg[0];
> > +   dst = dst_sg[0];
> > +
> >     /* Set dmadev log level to critical to suppress unnecessary output
> >      * during API tests.
> >      */
> >     rte_log_set_level_pattern("lib.dmadev", RTE_LOG_CRIT);
> >
> > -   return 0;
> > +   return rc;
> > +exit:
> > +   while (--i >= 0) {
> > +           rte_free(src_sg[i]);
> > +           rte_free(dst_sg[i]);
> > +   }
> > +
> > +   return rc;
> >  }
> >
> >  static void
> >  testsuite_teardown(void)
> >  {
> > -   rte_free(src);
> > +   int i;
> > +
> > +   for (i = 0; i < TEST_SG_MAX; i++) {
> > +           rte_free(src_sg[i]);
> > +           src_sg[i] = NULL;
> > +           rte_free(dst_sg[i]);
> > +           dst_sg[i] = NULL;
> > +   }
> > +
> >     src = NULL;
> > -   rte_free(dst);
> >     dst = NULL;
> >     /* Ensure the dmadev is stopped. */
> >     rte_dma_stop(test_dev_id);
> > @@ -437,6 +464,37 @@ verify_memory(void)
> >     return 0;
> >  }
> >
> > +static void
> > +sg_memory_setup(int n)
> > +{
> > +   int i, j;
> > +
> > +   for (i = 0; i < n; i++) {
> > +           for (j = 0; j < TEST_MEMCPY_SIZE; j++)
> > +                   src_sg[i][j] = (char)j;
> > +
> > +           memset(dst_sg[i], 0, TEST_MEMCPY_SIZE);
> > +   }
> > +}
> > +
> > +static int
> > +sg_memory_verify(int n)
> > +{
> > +   int i, j;
> > +
> > +   for (i = 0; i < n; i++) {
> > +           for (j = 0; j < TEST_MEMCPY_SIZE; j++) {
> > +                   if (src_sg[i][j] == dst_sg[i][j])
> > +                           continue;
> > +
> > +                   RTE_TEST_ASSERT_EQUAL(src_sg[i][j], dst_sg[i][j],
> "Failed to copy memory, %d %d",
> > +                           src_sg[i][j], dst_sg[i][j]);
> > +           }
> > +   }
> > +
> > +   return 0;
> > +}
> > +
> >  static int
> >  test_dma_completed(void)
> >  {
> > @@ -551,6 +609,86 @@ test_dma_completed_status(void)
> >     return TEST_SUCCESS;
> >  }
> >
> > +static int
> > +test_dma_sg(void)
> > +{
> > +   struct rte_dma_sge src_sge[TEST_SG_MAX], dst_sge[TEST_SG_MAX];
> > +   struct rte_dma_info dev_info = { 0 };
> > +   uint16_t last_idx = -1;
> > +   bool has_error = true;
> > +   int n_sge, i, ret;
> > +   uint16_t cpl_ret;
> > +
> > +   ret = rte_dma_info_get(test_dev_id, &dev_info);
> > +   RTE_TEST_ASSERT_SUCCESS(ret, "Failed to obtain device info, %d",
> > +ret);
> > +
> > +   if ((dev_info.dev_capa & RTE_DMA_CAPA_OPS_COPY_SG) == 0)
> > +           return TEST_SKIPPED;
> > +
> > +   n_sge = RTE_MIN(dev_info.max_sges, TEST_SG_MAX);
> > +
> > +   ret = setup_vchan(1);
> > +   RTE_TEST_ASSERT_SUCCESS(ret, "Failed to setup one vchan, %d", ret);
> > +
> > +   ret = rte_dma_start(test_dev_id);
> > +   RTE_TEST_ASSERT_SUCCESS(ret, "Failed to start, %d", ret);
> > +
> > +   for (i = 0; i < n_sge; i++) {
> > +           src_sge[i].addr = rte_malloc_virt2iova(src_sg[i]);
> > +           src_sge[i].length = TEST_MEMCPY_SIZE;
> > +           dst_sge[i].addr = rte_malloc_virt2iova(dst_sg[i]);
> > +           dst_sge[i].length = TEST_MEMCPY_SIZE;
> > +   }
> > +
> > +   sg_memory_setup(n_sge);
> > +
> > +   /* Check enqueue without submit */
> > +   ret = rte_dma_copy_sg(test_dev_id, 0, src_sge, dst_sge, n_sge, n_sge,
> 0);
> > +   RTE_TEST_ASSERT_EQUAL(ret, 0, "Failed to enqueue copy, %d", ret);
> > +
> > +   rte_delay_us_sleep(TEST_WAIT_US_VAL);
> > +
> > +   cpl_ret = rte_dma_completed(test_dev_id, 0, 1, &last_idx, &has_error);
> > +   RTE_TEST_ASSERT_EQUAL(cpl_ret, 0, "Failed to get completed");
> > +
> > +   /* Check DMA submit */
> > +   ret = rte_dma_submit(test_dev_id, 0);
> > +   RTE_TEST_ASSERT_SUCCESS(ret, "Failed to submit, %d", ret);
> > +
> > +   rte_delay_us_sleep(TEST_WAIT_US_VAL);
> > +
> > +   cpl_ret = rte_dma_completed(test_dev_id, 0, 1, &last_idx, &has_error);
> > +   RTE_TEST_ASSERT_EQUAL(cpl_ret, 1, "Failed to get completed");
> > +   RTE_TEST_ASSERT_EQUAL(last_idx, 0, "Last idx should be zero, %u",
> last_idx);
> > +   RTE_TEST_ASSERT_EQUAL(has_error, false, "Should have no error");
> > +
> > +   ret = sg_memory_verify(n_sge);
> > +   RTE_TEST_ASSERT_SUCCESS(ret, "Failed to verify memory");
> > +
> > +   sg_memory_setup(n_sge);
> > +
> > +   /* Check for enqueue with submit */
> > +   ret = rte_dma_copy_sg(test_dev_id, 0, src_sge, dst_sge, n_sge, n_sge,
> > +                         RTE_DMA_OP_FLAG_SUBMIT);
> > +   RTE_TEST_ASSERT_EQUAL(ret, 1, "Failed to enqueue copy, %d", ret);
> > +
> > +   rte_delay_us_sleep(TEST_WAIT_US_VAL);
> > +
> > +   cpl_ret = rte_dma_completed(test_dev_id, 0, 1, &last_idx, &has_error);
> > +   RTE_TEST_ASSERT_EQUAL(cpl_ret, 1, "Failed to get completed");
> > +   RTE_TEST_ASSERT_EQUAL(last_idx, 1, "Last idx should be 1, %u",
> last_idx);
> > +   RTE_TEST_ASSERT_EQUAL(has_error, false, "Should have no error");
> > +
> > +   ret = sg_memory_verify(n_sge);
> > +   RTE_TEST_ASSERT_SUCCESS(ret, "Failed to verify memory");
> > +
> > +   /* Stop dmadev to make sure dmadev to a known state */
> > +   ret = rte_dma_stop(test_dev_id);
> > +   RTE_TEST_ASSERT_SUCCESS(ret, "Failed to stop, %d", ret);
> > +
> > +   return TEST_SUCCESS;
> > +}
> > +
> >  static struct unit_test_suite dma_api_testsuite = {
> >     .suite_name = "DMA API Test Suite",
> >     .setup = testsuite_setup,
> > @@ -568,6 +706,7 @@ static struct unit_test_suite dma_api_testsuite = {
> >             TEST_CASE(test_dma_dump),
> >             TEST_CASE(test_dma_completed),
> >             TEST_CASE(test_dma_completed_status),
> > +           TEST_CASE(test_dma_sg),
> >             TEST_CASES_END()
> >     }
> >  };
> > diff --git a/app/test/test_dmadev_api.h b/app/test/test_dmadev_api.h
> > index 33fbc5bd41..10ab925f80 100644
> > --- a/app/test/test_dmadev_api.h
> > +++ b/app/test/test_dmadev_api.h
> > @@ -2,4 +2,6 @@
> >   * Copyright(c) 2021 HiSilicon Limited
> >   */
> >
> > +#define TEST_SG_MAX 4
> 
> suggest TEST_MAX_SGES which corresponding dev_info.max_sges

Ok, I have fixed API test to validate against max_ages.

Thanks,
Gowrishankar
> 
> Thanks
> Chengwen
> 
> > +
> >  int test_dma_api(uint16_t dev_id);
> >

Reply via email to