Both lexer and parser reject invalid interpolation specifications. The parser's check is useless.
The lexer ends the token right after the first bad character. This tends to lead to suboptimal error reporting. For instance, input [ %11d ] produces the tokens JSON_LSQUARE [ JSON_ERROR %1 JSON_INTEGER 1 JSON_KEYWORD d JSON_RSQUARE ] The parser then yields an error, an object and two more errors: error: Invalid JSON syntax object: 1 error: JSON parse error, invalid keyword error: JSON parse error, expecting value Change the lexer to accept [A-Za-z0-9]*. It now produces JSON_LSQUARE [ JSON_INTERPOL %11d JSON_RSQUARE ] and the parser reports just JSON parse error, invalid interpolation '%11d' Signed-off-by: Markus Armbruster <arm...@redhat.com> --- qobject/json-lexer.c | 52 +++++++++---------------------------------- qobject/json-parser.c | 1 + 2 files changed, 11 insertions(+), 42 deletions(-) diff --git a/qobject/json-lexer.c b/qobject/json-lexer.c index 0ea1eae4aa..7a82aab88b 100644 --- a/qobject/json-lexer.c +++ b/qobject/json-lexer.c @@ -93,7 +93,8 @@ * (apostrophe) instead of %x22 (quotation mark), and can't contain * unescaped apostrophe, but can contain unescaped quotation mark. * - Interpolation: - * interpolation = %((l|ll|I64)[du]|[ipsf]) + * The lexer accepts [A-Za-z0-9]*, and leaves rejecting invalid ones + * to the parser. * * Note: * - Input must be encoded in modified UTF-8. 
@@ -116,11 +117,6 @@ enum json_lexer_state { IN_NEG_NONZERO_NUMBER, IN_KEYWORD, IN_INTERPOL, - IN_INTERPOL_L, - IN_INTERPOL_LL, - IN_INTERPOL_I, - IN_INTERPOL_I6, - IN_INTERPOL_I64, IN_WHITESPACE, IN_START_INTERPOL, IN_START, @@ -222,42 +218,6 @@ static const uint8_t json_lexer[][256] = { ['\n'] = IN_WHITESPACE, }, - /* interpolation */ - [IN_INTERPOL_LL] = { - ['d'] = JSON_INTERPOL, - ['u'] = JSON_INTERPOL, - }, - - [IN_INTERPOL_L] = { - ['d'] = JSON_INTERPOL, - ['l'] = IN_INTERPOL_LL, - ['u'] = JSON_INTERPOL, - }, - - [IN_INTERPOL_I64] = { - ['d'] = JSON_INTERPOL, - ['u'] = JSON_INTERPOL, - }, - - [IN_INTERPOL_I6] = { - ['4'] = IN_INTERPOL_I64, - }, - - [IN_INTERPOL_I] = { - ['6'] = IN_INTERPOL_I6, - }, - - [IN_INTERPOL] = { - ['d'] = JSON_INTERPOL, - ['i'] = JSON_INTERPOL, - ['p'] = JSON_INTERPOL, - ['s'] = JSON_INTERPOL, - ['u'] = JSON_INTERPOL, - ['f'] = JSON_INTERPOL, - ['l'] = IN_INTERPOL_L, - ['I'] = IN_INTERPOL_I, - }, - /* top level rule */ [IN_START] = { ['"'] = IN_DQ_STRING, @@ -278,6 +238,14 @@ static const uint8_t json_lexer[][256] = { ['\n'] = IN_WHITESPACE, }, + /* interpolation */ + [IN_INTERPOL] = { + TERMINAL(JSON_INTERPOL), + ['A' ... 'Z'] = IN_INTERPOL, + ['a' ... 'z'] = IN_INTERPOL, + ['0' ... '9'] = IN_INTERPOL, + }, + [IN_START_INTERPOL] = { ['"'] = IN_DQ_STRING, ['\''] = IN_SQ_STRING, diff --git a/qobject/json-parser.c b/qobject/json-parser.c index 848d469b2a..bd137399e5 100644 --- a/qobject/json-parser.c +++ b/qobject/json-parser.c @@ -448,6 +448,7 @@ static QObject *parse_interpolation(JSONParserContext *ctxt, va_list *ap) } else if (!strcmp(token->str, "%f")) { return QOBJECT(qnum_from_double(va_arg(*ap, double))); } + parse_error(ctxt, token, "invalid interpolation '%s'", token->str); return NULL; } -- 2.17.1