Hi Amit, There are many commit for dma-perf, I've done a re-review and have a few comments, pls see below:
On 2023/11/22 19:06, Gowrishankar Muthukrishnan wrote: > From: Amit Prakash Shukla <amitpraka...@marvell.com> > > Add support to test performance for "device to memory" and > "memory to device" data transfer. > > Signed-off-by: Amit Prakash Shukla <amitpraka...@marvell.com> > Acked-by: Anoob Joseph <ano...@marvell.com> > --- > app/test-dma-perf/benchmark.c | 108 +++++++++++++++++++++++++++++++--- > app/test-dma-perf/config.ini | 37 ++++++++++++ > app/test-dma-perf/main.c | 67 +++++++++++++++++++++ > app/test-dma-perf/main.h | 6 ++ > 4 files changed, 209 insertions(+), 9 deletions(-) > > diff --git a/app/test-dma-perf/benchmark.c b/app/test-dma-perf/benchmark.c > index 9b1f58c78c..eaed224c67 100644 > --- a/app/test-dma-perf/benchmark.c > +++ b/app/test-dma-perf/benchmark.c > @@ -127,17 +127,54 @@ cache_flush_buf(__rte_unused struct rte_mbuf **array, > #endif > } > > +static int > +vchan_data_populate(uint32_t dev_id, struct rte_dma_vchan_conf *qconf, > + struct test_configure *cfg) > +{ > + struct rte_dma_info info; > + > + qconf->direction = cfg->transfer_dir; > + > + rte_dma_info_get(dev_id, &info); > + if (!(RTE_BIT64(qconf->direction) & info.dev_capa)) > + return -1; > + > + qconf->nb_desc = cfg->ring_size.cur; > + > + switch (qconf->direction) { > + case RTE_DMA_DIR_MEM_TO_DEV: > + qconf->dst_port.pcie.vfen = 1; > + qconf->dst_port.port_type = RTE_DMA_PORT_PCIE; > + qconf->dst_port.pcie.coreid = cfg->dcoreid; > + qconf->dst_port.pcie.vfid = cfg->vfid; > + qconf->dst_port.pcie.pfid = cfg->pfid; > + break; > + case RTE_DMA_DIR_DEV_TO_MEM: > + qconf->src_port.pcie.vfen = 1; > + qconf->src_port.port_type = RTE_DMA_PORT_PCIE; > + qconf->src_port.pcie.coreid = cfg->scoreid; > + qconf->src_port.pcie.vfid = cfg->vfid; > + qconf->src_port.pcie.pfid = cfg->pfid; > + break; > + case RTE_DMA_DIR_MEM_TO_MEM: > + case RTE_DMA_DIR_DEV_TO_DEV: > + break; > + } > + > + return 0; > +} > + > /* Configuration of device. */ > static void > -configure_dmadev_queue(uint32_t dev_id, uint32_t ring_size) > +configure_dmadev_queue(uint32_t dev_id, struct test_configure *cfg) > { > uint16_t vchan = 0; > struct rte_dma_info info; > struct rte_dma_conf dev_config = { .nb_vchans = 1 }; > - struct rte_dma_vchan_conf qconf = { > - .direction = RTE_DMA_DIR_MEM_TO_MEM, > - .nb_desc = ring_size > - }; > + struct rte_dma_vchan_conf qconf = { 0 }; > + > + if (vchan_data_populate(dev_id, &qconf, cfg) != 0) > + rte_exit(EXIT_FAILURE, "Error with vchan data populate.\n"); > > if (rte_dma_configure(dev_id, &dev_config) != 0) > rte_exit(EXIT_FAILURE, "Error with dma configure.\n"); > @@ -159,7 +196,6 @@ configure_dmadev_queue(uint32_t dev_id, uint32_t > ring_size) > static int > config_dmadevs(struct test_configure *cfg) > { > - uint32_t ring_size = cfg->ring_size.cur; > struct lcore_dma_map_t *ldm = &cfg->lcore_dma_map; > uint32_t nb_workers = ldm->cnt; > uint32_t i; > @@ -176,7 +212,7 @@ config_dmadevs(struct test_configure *cfg) > } > > ldm->dma_ids[i] = dev_id; > - configure_dmadev_queue(dev_id, ring_size); > + configure_dmadev_queue(dev_id, cfg); > ++nb_dmadevs; > } > > @@ -302,13 +338,22 @@ do_cpu_mem_copy(void *p) > return 0; > } > > +static void > +dummy_free_ext_buf(void *addr, void *opaque) > +{ > + RTE_SET_USED(addr); > + RTE_SET_USED(opaque); > +} > + > static int > setup_memory_env(struct test_configure *cfg, struct rte_mbuf ***srcs, > struct rte_mbuf ***dsts) > { > + static struct rte_mbuf_ext_shared_info *ext_buf_info; > unsigned int buf_size = cfg->buf_size.cur; > unsigned int nr_sockets; > uint32_t nr_buf = cfg->nr_buf; > + uint32_t i; > > nr_sockets = rte_socket_count(); > if (cfg->src_numa_node >= nr_sockets || > @@ -361,16 +406,47 @@ setup_memory_env(struct test_configure *cfg, struct > rte_mbuf ***srcs, > return -1; > } > > + if (cfg->transfer_dir == RTE_DMA_DIR_DEV_TO_MEM || > + cfg->transfer_dir == RTE_DMA_DIR_MEM_TO_DEV) { > + ext_buf_info = rte_malloc(NULL, sizeof(struct > rte_mbuf_ext_shared_info), 0); > + if (ext_buf_info == NULL) { > + printf("Error: ext_buf_info malloc failed.\n"); > + return -1; > + } > + } > + > + if (cfg->transfer_dir == RTE_DMA_DIR_DEV_TO_MEM) { > + ext_buf_info->free_cb = dummy_free_ext_buf; > + ext_buf_info->fcb_opaque = NULL; > + for (i = 0; i < nr_buf; i++) { > + /* Using mbuf structure to hold remote iova address. */ > + rte_pktmbuf_attach_extbuf((*srcs)[i], (void > *)cfg->raddr, > + (rte_iova_t)cfg->raddr, 0, > ext_buf_info); > + rte_mbuf_ext_refcnt_update(ext_buf_info, 1); > + } > + } > + > + if (cfg->transfer_dir == RTE_DMA_DIR_MEM_TO_DEV) { > + ext_buf_info->free_cb = dummy_free_ext_buf; > + ext_buf_info->fcb_opaque = NULL; > + for (i = 0; i < nr_buf; i++) { > + /* Using mbuf structure to hold remote iova address. */ > + rte_pktmbuf_attach_extbuf((*dsts)[i], (void > *)cfg->raddr, > + (rte_iova_t)cfg->raddr, 0, > ext_buf_info); > + rte_mbuf_ext_refcnt_update(ext_buf_info, 1); > + } > + } > + > return 0; > } > > void > mem_copy_benchmark(struct test_configure *cfg, bool is_dma) > { > - uint16_t i; > + uint32_t i; > uint32_t offset; > unsigned int lcore_id = 0; > - struct rte_mbuf **srcs = NULL, **dsts = NULL; > + struct rte_mbuf **srcs = NULL, **dsts = NULL, **m = NULL; > struct lcore_dma_map_t *ldm = &cfg->lcore_dma_map; > unsigned int buf_size = cfg->buf_size.cur; > uint16_t kick_batch = cfg->kick_batch.cur; > @@ -476,6 +552,20 @@ mem_copy_benchmark(struct test_configure *cfg, bool > is_dma) > avg_cycles_total / nb_workers, bandwidth_total, > mops_total); > > out: > + > + if (cfg->transfer_dir == RTE_DMA_DIR_DEV_TO_MEM) > + m = srcs; > + else if (cfg->transfer_dir == RTE_DMA_DIR_MEM_TO_DEV) > + m = dsts; > + > + if (m) { > + for (i = 0; i < nr_buf; i++) > + rte_pktmbuf_detach_extbuf(m[i]); > + > + if (m[0]->shinfo && rte_mbuf_ext_refcnt_read(m[0]->shinfo) == 0) > + rte_free(m[0]->shinfo); > + } > + > /* free mbufs used in the test */ > if (srcs != NULL) > rte_pktmbuf_free_bulk(srcs, nr_buf); > diff --git a/app/test-dma-perf/config.ini b/app/test-dma-perf/config.ini > index 4d59234b2a..cddcf93c6e 100644 > --- a/app/test-dma-perf/config.ini > +++ b/app/test-dma-perf/config.ini > @@ -38,6 +38,23 @@ > > ; "skip" To skip a test-case set skip to 1. > > +; Parameters to be configured for data transfers from "mem to dev" and "dev > to mem": > +; > ================================================================================== > +; "direction" denotes the direction of data transfer. It can take 3 values: > +; 0 - mem to mem transfer > +; 1 - mem to dev transfer > +; 2 - dev to mem transfer I prefer readable string not number, for examples: mem2mem mem2dev dev2mem > +; If not specified the default value is 0 (mem to mem transfer). > + > +; "raddr" remote iova address for "mem to dev" and "dev to mem" transfer. > + > +; "scoreid" denotes source PCIe core index. > +; "dcoreid" denotes destination PCIe core index. > +; "pfid" denotes PF-id to be used for data transfer > +; "vfid" denotes VF-id of PF-id to be used for data transfer. too many entries, and it all about pcie, the 'struct rte_dma_port_param' future may support other bus. Suggest the entry is vchan_dev, user could input some thing like 1. vchan_dev=bus=pcie,coreid=1,pfid=0,vfid=1,addr=xxx add add descriptor, only valid when direction is one of mem2dev or dev2mem It could use kvargs library to parse the value of entry vchan_dev > + > +; =========== End of "mem to dev" and "dev to mem" config parameters. > ============== > + > [case1] > type=DMA_MEM_COPY > mem_size=10 > @@ -52,6 +69,26 @@ lcore_dma=lcore10@0000:00:04.2, lcore11@0000:00:04.3 > eal_args=--in-memory --file-prefix=test > > [case2] > +skip=1 > +type=DMA_MEM_COPY > +direction=2 > +raddr=0x200000000 > +scoreid=0 > +dcoreid=0 > +pfid=0 > +vfid=0 > +mem_size=10 > +buf_size=64,4096,2,MUL > +dma_ring_size=1024 > +kick_batch=32 > +src_numa_node=0 > +dst_numa_node=0 > +cache_flush=0 > +test_seconds=2 > +lcore_dma=lcore10@0000:00:04.2, lcore11@0000:00:04.3 > +eal_args=--in-memory --file-prefix=test > + > +[case3] > type=CPU_MEM_COPY > mem_size=10 > buf_size=64,8192,2,MUL > diff --git a/app/test-dma-perf/main.c b/app/test-dma-perf/main.c > index 33c3750bb1..3eddf2e40a 100644 > --- a/app/test-dma-perf/main.c > +++ b/app/test-dma-perf/main.c > @@ -16,6 +16,7 @@ > #include <rte_cfgfile.h> > #include <rte_string_fns.h> > #include <rte_lcore.h> > +#include <rte_dmadev.h> > > #include "main.h" > > @@ -331,9 +332,11 @@ load_configs(const char *path) > struct test_configure *test_case; > char section_name[CFG_NAME_LEN]; > const char *case_type; > + const char *transfer_dir; > const char *lcore_dma; > const char *mem_size_str, *buf_size_str, *ring_size_str, > *kick_batch_str; > const char *skip; > + const char *raddr, *scoreid, *dcoreid, *vfid, *pfid; > int args_nr, nb_vp; > bool is_dma; > > @@ -371,6 +374,20 @@ load_configs(const char *path) > if (strcmp(case_type, DMA_MEM_COPY) == 0) { > test_case->test_type = TEST_TYPE_DMA_MEM_COPY; > test_case->test_type_str = DMA_MEM_COPY; > + > + transfer_dir = rte_cfgfile_get_entry(cfgfile, > section_name, "direction"); > + if (transfer_dir == NULL) { > + printf("Transfer direction not configured." > + " Defaulting it to MEM to MEM > transfer.\n"); > + test_case->transfer_dir = > RTE_DMA_DIR_MEM_TO_MEM; > + } else > + test_case->transfer_dir = > (uint8_t)atoi(transfer_dir); > + > + if (test_case->transfer_dir >= RTE_DMA_DIR_DEV_TO_DEV) { > + printf("Error: Invalid transfer direction > configured.\n"); > + test_case->is_valid = false; > + continue; > + } > is_dma = true; > } else if (strcmp(case_type, CPU_MEM_COPY) == 0) { > test_case->test_type = TEST_TYPE_CPU_MEM_COPY; > @@ -382,6 +399,56 @@ load_configs(const char *path) > continue; > } > > + if (test_case->transfer_dir == RTE_DMA_DIR_MEM_TO_DEV || > + test_case->transfer_dir == RTE_DMA_DIR_DEV_TO_MEM) { > + char *endptr; > + > + raddr = rte_cfgfile_get_entry(cfgfile, section_name, > "raddr"); > + if (raddr == NULL) { > + printf("Error: No raddr configured for > case%d.\n", i + 1); > + test_case->is_valid = false; > + continue; > + } > + test_case->raddr = strtoull(raddr, &endptr, 16); > + > + vfid = rte_cfgfile_get_entry(cfgfile, section_name, > "vfid"); > + if (vfid == NULL) { > + printf("Error: No vfid configured for > case%d.\n", i + 1); > + test_case->is_valid = false; > + continue; > + } > + test_case->vfid = (uint16_t)atoi(vfid); > + > + pfid = rte_cfgfile_get_entry(cfgfile, section_name, > "pfid"); > + if (pfid == NULL) { > + printf("Error: No pfid configured for > case%d.\n", i + 1); > + test_case->is_valid = false; > + continue; > + } > + test_case->pfid = (uint8_t)atoi(pfid); > + > + } > + > + if (test_case->transfer_dir == RTE_DMA_DIR_DEV_TO_MEM) { > + scoreid = rte_cfgfile_get_entry(cfgfile, section_name, > "scoreid"); > + if (scoreid == NULL) { > + printf("Error: No scoreid configured for > case%d.\n", i + 1); > + test_case->is_valid = false; > + continue; > + } > + test_case->scoreid = (uint8_t)atoi(scoreid); > + } > + > + if (test_case->transfer_dir == RTE_DMA_DIR_MEM_TO_DEV) { > + dcoreid = rte_cfgfile_get_entry(cfgfile, section_name, > "dcoreid"); > + if (dcoreid == NULL) { > + printf("Error: No dcoreid configured for > case%d.\n", i + 1); > + test_case->is_valid = false; > + continue; > + } > + test_case->dcoreid = (uint8_t)atoi(dcoreid); > + } > + suggest add a subfunction to wrap parsing device's config. > test_case->src_numa_node = > (int)atoi(rte_cfgfile_get_entry(cfgfile, > section_name, > "src_numa_node")); > test_case->dst_numa_node = > (int)atoi(rte_cfgfile_get_entry(cfgfile, > diff --git a/app/test-dma-perf/main.h b/app/test-dma-perf/main.h > index 32670151af..8ac3270fba 100644 > --- a/app/test-dma-perf/main.h > +++ b/app/test-dma-perf/main.h > @@ -42,6 +42,7 @@ struct test_configure { > bool is_valid; > bool is_skip; > uint8_t test_type; > + uint8_t transfer_dir; > const char *test_type_str; > uint16_t src_numa_node; > uint16_t dst_numa_node; > @@ -57,6 +58,11 @@ struct test_configure { > uint16_t test_secs; > const char *eal_args; > uint8_t scenario_id; > + uint8_t scoreid; > + uint8_t dcoreid; > + uint8_t pfid; > + uint16_t vfid; > + uintptr_t raddr; suggest create new struct: struct test_vchan_dev_config { struct rte_dma_port_param port; uintptr_t addr; }; So defined as: struct test_vchan_dev_config vchan_dev; Thanks > }; > > void mem_copy_benchmark(struct test_configure *cfg, bool is_dma); >