On 10/23/20 4:42 PM, Nicolas Chautru wrote:
> Run preloading explicitly for unit tests. Load each code block
> by reusing existing input op then restore for the actual test.
>
> Signed-off-by: Nicolas Chautru <nicolas.chau...@intel.com>
> Acked-by: Liu Tianjiao <tianjiao....@intel.com>
> ---
>  app/test-bbdev/main.h            |  1 +
>  app/test-bbdev/test_bbdev_perf.c | 51 
> +++++++++++++++++++++-------------------
>  2 files changed, 28 insertions(+), 24 deletions(-)
>
> diff --git a/app/test-bbdev/main.h b/app/test-bbdev/main.h
> index fb3dec8..dc10a50 100644
> --- a/app/test-bbdev/main.h
> +++ b/app/test-bbdev/main.h
> @@ -17,6 +17,7 @@
>  #define TEST_SKIPPED    1
>  
>  #define MAX_BURST 512U
> +#define MAX_OPS 1024U

This #define is not consistently used.

ex/ see retrieve_harq_ddr, the old 1024 is still being used.

>  #define DEFAULT_BURST 32U
>  #define DEFAULT_OPS 64U
>  #define DEFAULT_ITER 6U
> diff --git a/app/test-bbdev/test_bbdev_perf.c 
> b/app/test-bbdev/test_bbdev_perf.c
> index b62848e..f30cbdb 100644
> --- a/app/test-bbdev/test_bbdev_perf.c
> +++ b/app/test-bbdev/test_bbdev_perf.c
> @@ -2513,20 +2513,20 @@ typedef int (test_case_function)(struct active_device 
> *ad,
>               bool preload)
>  {
>       uint16_t j;
> -     int ret;
> -     uint32_t harq_offset = (uint32_t) queue_id * HARQ_INCR * 1024;
> -     struct rte_bbdev_op_data save_hc_in, save_hc_out;
> -     struct rte_bbdev_dec_op *ops_deq[MAX_BURST];
> +     int deq;
> +     uint32_t harq_offset = (uint32_t) queue_id * HARQ_INCR * MAX_OPS;
> +     struct rte_bbdev_op_data save_hc_in[MAX_OPS], save_hc_out[MAX_OPS];
> +     struct rte_bbdev_dec_op *ops_deq[MAX_OPS];
>       uint32_t flags = ops[0]->ldpc_dec.op_flags;
>       bool mem_in = flags & RTE_BBDEV_LDPC_INTERNAL_HARQ_MEMORY_IN_ENABLE;
>       bool hc_in = flags & RTE_BBDEV_LDPC_HQ_COMBINE_IN_ENABLE;
>       bool mem_out = flags & RTE_BBDEV_LDPC_INTERNAL_HARQ_MEMORY_OUT_ENABLE;
>       bool hc_out = flags & RTE_BBDEV_LDPC_HQ_COMBINE_OUT_ENABLE;
>       bool h_comp = flags & RTE_BBDEV_LDPC_HARQ_6BIT_COMPRESSION;
> -     for (j = 0; j < n; ++j) {
> -             if ((mem_in || hc_in) && preload) {
> -                     save_hc_in = ops[j]->ldpc_dec.harq_combined_input;
> -                     save_hc_out = ops[j]->ldpc_dec.harq_combined_output;
> +     if ((mem_in || hc_in) && preload) {
> +             for (j = 0; j < n; ++j) {
> +                     save_hc_in[j] = ops[j]->ldpc_dec.harq_combined_input;
> +                     save_hc_out[j] = ops[j]->ldpc_dec.harq_combined_output;
>                       ops[j]->ldpc_dec.op_flags =
>                               RTE_BBDEV_LDPC_INTERNAL_HARQ_MEMORY_LOOPBACK +
>                               RTE_BBDEV_LDPC_INTERNAL_HARQ_MEMORY_OUT_ENABLE;

flags are usually handled with bit operators, not arithmetic.

this seems to be a general issue.

> @@ -2536,16 +2536,23 @@ typedef int (test_case_function)(struct active_device 
> *ad,
>                       ops[j]->ldpc_dec.harq_combined_output.offset =
>                                       harq_offset;
>                       ops[j]->ldpc_dec.harq_combined_input.offset = 0;
> -                     rte_bbdev_enqueue_ldpc_dec_ops(dev_id, queue_id,
> -                                     &ops[j], 1);
> -                     ret = 0;
> -                     while (ret == 0)
> -                             ret = rte_bbdev_dequeue_ldpc_dec_ops(
> -                                     dev_id, queue_id, &ops_deq[j], 1);
> +                     harq_offset += HARQ_INCR;
> +             }
> +             rte_bbdev_enqueue_ldpc_dec_ops(dev_id, queue_id, &ops[0], n);
Add check the return is 'n'
> +             deq = 0;
> +             while (deq != n)
> +                     deq += rte_bbdev_dequeue_ldpc_dec_ops(
> +                                     dev_id, queue_id, &ops_deq[deq],
> +                                     n - deq);

Add check the return >= 0

Tom

> +             /* Restore the operations */
> +             for (j = 0; j < n; ++j) {
>                       ops[j]->ldpc_dec.op_flags = flags;
> -                     ops[j]->ldpc_dec.harq_combined_input = save_hc_in;
> -                     ops[j]->ldpc_dec.harq_combined_output = save_hc_out;
> +                     ops[j]->ldpc_dec.harq_combined_input = save_hc_in[j];
> +                     ops[j]->ldpc_dec.harq_combined_output = save_hc_out[j];
>               }
> +     }
> +     harq_offset = (uint32_t) queue_id * HARQ_INCR * MAX_OPS;
> +     for (j = 0; j < n; ++j) {
>               /* Adjust HARQ offset when we reach external DDR */
>               if (mem_in || hc_in)
>                       ops[j]->ldpc_dec.harq_combined_input.offset
> @@ -3231,11 +3238,9 @@ typedef int (test_case_function)(struct active_device 
> *ad,
>                               mbuf_reset(
>                               ops_enq[j]->ldpc_dec.harq_combined_output.data);
>               }
> -             if (extDdr) {
> -                     bool preload = i == (TEST_REPETITIONS - 1);
> +             if (extDdr)
>                       preload_harq_ddr(tp->dev_id, queue_id, ops_enq,
> -                                     num_ops, preload);
> -             }
> +                                     num_ops, true);
>               start_time = rte_rdtsc_precise();
>  
>               for (enq = 0, deq = 0; enq < num_ops;) {
> @@ -3362,11 +3367,9 @@ typedef int (test_case_function)(struct active_device 
> *ad,
>                               mbuf_reset(
>                               ops_enq[j]->ldpc_dec.harq_combined_output.data);
>               }
> -             if (extDdr) {
> -                     bool preload = i == (TEST_REPETITIONS - 1);
> +             if (extDdr)
>                       preload_harq_ddr(tp->dev_id, queue_id, ops_enq,
> -                                     num_ops, preload);
> -             }
> +                                     num_ops, true);
>               start_time = rte_rdtsc_precise();
>  
>               for (enq = 0, deq = 0; enq < num_ops;) {

Reply via email to