On Thu, Dec 07, 2023 at 04:18:16PM +0000, Euan Bourke wrote:
> Two new functions, the first is a 'heuristic parser' which examines a
> string describing a set of cores and determines based off heuristics
> whether its a coremask or a corelist.
> 
> Second is a 'combined parser' which calls the first function and then
> based off the returned value will call the relevant core string parser.
> This function also takes a 'default_type' int which corresponds to
> which parser should be used in the case of an ambiguous string.
> 
> Signed-off-by: Euan Bourke <euan.bou...@intel.com>
> ---
>  lib/arg_parser/arg_parser.c     | 68 +++++++++++++++++++++++++++++++++
>  lib/arg_parser/rte_arg_parser.h | 60 +++++++++++++++++++++++++++++
>  lib/arg_parser/version.map      |  2 +
>  3 files changed, 130 insertions(+)
> 
> diff --git a/lib/arg_parser/arg_parser.c b/lib/arg_parser/arg_parser.c
> index cebab9e2f8..95cbc50c13 100644
> --- a/lib/arg_parser/arg_parser.c
> +++ b/lib/arg_parser/arg_parser.c
> @@ -7,10 +7,15 @@
>  #include "ctype.h"
>  #include "string.h"
>  #include "stdbool.h"
> +#include "stdio.h"
>  
>  #include <rte_arg_parser.h>
>  #include <rte_common.h>
>  
> +#define RTE_ARG_PARSE_TYPE_COREMASK 0
> +#define RTE_ARG_PARSE_TYPE_CORELIST 1
> +#define RTE_ARG_PARSE_TYPE_UNKNOWN 2
> +

As these are used as return values, they need to be defined in the header
file so that applications can use them.

>  #define BITS_PER_HEX 4
>  #define MAX_COREMASK_SIZE ((UINT16_MAX + 1) / BITS_PER_HEX)
>  
> @@ -22,6 +27,7 @@ struct core_bits {
>       uint32_t total_bits_set;
>  };
>  
> +

Stray newline added to patch.

>  static inline bool
>  get_core_bit(struct core_bits *mask, uint16_t idx)
>  {
> @@ -159,3 +165,65 @@ rte_arg_parse_coremask(const char *coremask, uint16_t 
> *cores, uint32_t cores_len
>  
>       return total_count;
>  }
> +
> +int
> +rte_arg_parse_arg_type(const char *core_string)
> +{
> +     /* Remove leading whitespace */
> +     while (isblank(*core_string))
> +             core_string++;
> +
> +     /* Check for 0x prefix */
> +     if (core_string[0] == '0' && tolower(core_string[1]) == 'x') {
> +             if (core_string[2] != '\0')
> +                     return RTE_ARG_PARSE_TYPE_COREMASK;
> +             return -1;
> +     }
> +
> +     int i = 0, idx = 0;
> +     /* Check for ',' and '-' and check for A-F */
> +     do {
> +             while (isblank(core_string[idx]))
> +                     idx++;
> +
> +             if (core_string[idx] == ',' || core_string[idx] == '-')
> +                     return RTE_ARG_PARSE_TYPE_CORELIST;
> +
> +             if (isalpha(core_string[idx])) {
> +                     if (isxdigit(core_string[idx]))
> +                             return RTE_ARG_PARSE_TYPE_COREMASK;
> +                     return -1;
> +             }
> +             idx++;
> +             i++;
> +     } while (core_string[idx] != '\0');
> +
> +     /* Check length of core_string if ambiguous as max length of a uint16_t 
> is 5 digits
> +      * implying its a coremask.
> +      */
> +     if (i > 5)
> +             return RTE_ARG_PARSE_TYPE_COREMASK;
> +
> +     return -1;

Rather than returning -1, I think in most/all cases above, the function
should return -EINVAL as error code, since it's invalid input passed.

> +}
> +
> +int
> +rte_arg_parse_core_string(const char *core_string, uint16_t *cores, uint32_t 
> cores_len,
> +             int default_type)
> +{
> +     if (default_type != RTE_ARG_PARSE_TYPE_COREMASK &&
> +                     default_type != RTE_ARG_PARSE_TYPE_CORELIST) {
> +             return -1;
> +     }
> +     switch (rte_arg_parse_arg_type(core_string)) {
> +     case RTE_ARG_PARSE_TYPE_COREMASK:
> +             return rte_arg_parse_coremask(core_string, cores, cores_len);
> +     case RTE_ARG_PARSE_TYPE_CORELIST:
> +             return rte_arg_parse_corelist(core_string, cores, cores_len);
> +     default:
> +             return default_type == RTE_ARG_PARSE_TYPE_COREMASK ?
> +                     rte_arg_parse_coremask(core_string, cores, cores_len) :
> +                     rte_arg_parse_corelist(core_string, cores, cores_len);
> +             return -1;
> +     }
> +}
> diff --git a/lib/arg_parser/rte_arg_parser.h b/lib/arg_parser/rte_arg_parser.h
> index 359d40e305..125ca9524c 100644
> --- a/lib/arg_parser/rte_arg_parser.h
> +++ b/lib/arg_parser/rte_arg_parser.h
> @@ -92,6 +92,66 @@ __rte_experimental
>  int
>  rte_arg_parse_coremask(const char *coremask, uint16_t *cores, uint32_t 
> cores_len);
>  
> +/**
> + * Use heuristics to determine if a string contains a coremask or a corelist.
> + *
> + * This function will check a series of conditions and return an int 
> representing which
> + * core type (mask or list) the string represents or UNKNOWN if the string 
> is ambiguous.

"or report the type as unknown if it is ambiguous"

> + *
> + * @param core_string
> + *   A string describing the intended cores to be parsed
> + * @return
> + *   int representing the core type
> + *   -1: error.

Suggest "negative error code on error". We should also list out the error
codes at the end, though I think right now -EINVAL is the only one we need.

> + *   0: coremask.
> + *   1: corelist.
> + *   2: unknown (ambiguous).

Move the #defines from the C file to the header, and use them here rather
than magic numbers.

> + */
> +__rte_experimental
> +int
> +rte_arg_parse_arg_type(const char *core_string);
> +
> +/**
> + * Convert a string describing either a corelist or coremask into an array 
> of core ids.
> + *
> + * This function will fill the "cores" array up to "cores_len" with the core 
> ids described
> + * in the "core_string". The string can either describe a corelist or a 
> coremask, and
> + * will be parsed accordingly. The number of unique core ids in the string 
> is then returned.
> + * For example:
> + * "1-4" is treated as a corelist and results in an array of [1,2,3,4] with 
> 4 being returned
> + * "0xA1" is treated as a coremask and results in an array of [0,5,7] with 3 
> being returned
> + *
> + * In the case of an ambiguous string, the function will use the 
> default_type parameter to
> + * decide.
> + *
> + * NOTE: if the length of the input array is insufficient to hold the number 
> of core ids
> + * in "core_string" the input array is filled to capacity but the return 
> value is the
> + * number of elements which would have been written to the array, had enough 
> space been
> + * available. [This is similar to the behaviour of the snprintf function]. 
> Because of
> + * this, the number of core values in the "core_string" may be determined by 
> calling the
> + * function with a NULL array pointer and array length given as 0.
> + *
> + * @param core_string
> + *   A string describing the intended cores to be parsed.
> + * @param cores
> + *   An array where to store the core ids.
> + *   Array can be NULL if "cores_len" is 0.
> + * @param cores_len
> + *   The length of the "cores" array.
> + *   If the size is smaller than that needed to hold all cores from 
> "core_string"
> + * @param default_type
> + *   How to treat ambiguous cases (e.g. '4' could be mask or list).
> + *   0: mask.
> + *   1: list.

Again, use the defines.

> + * @return
> + *   n: the number of unique cores present in "core_string".
> + *   -1 if the string was invalid.
> + *   NOTE: if n > "cores_len", then only "cores_len" elements in the "cores" 
> array are valid.
> + */
> +__rte_experimental
> +int
> +rte_arg_parse_core_string(const char *core_string, uint16_t *cores, uint32_t 
> cores_len,
> +             int default_type);
>  
>  #ifdef __cplusplus
>  }
> diff --git a/lib/arg_parser/version.map b/lib/arg_parser/version.map
> index b44d4b02b7..383b6bd0e9 100644
> --- a/lib/arg_parser/version.map
> +++ b/lib/arg_parser/version.map
> @@ -8,4 +8,6 @@ EXPERIMENTAL {
>       # added in 24.03
>       rte_arg_parse_corelist;
>       rte_arg_parse_coremask;
> +     rte_arg_parse_arg_type;
> +     rte_arg_parse_core_string;


The version.map lists are kept alphabetical, so the new entries need to be
moved up.

>  };
> -- 
> 2.34.1
> 

Reply via email to