Both lexer and parser reject invalid interpolation specifications. Because the lexer rejects them first, the parser's check is never reached and is therefore useless.
The lexer ends the token right after the first bad character. This tends to lead to suboptimal error reporting. For instance, input

    [ %04d ]

produces the tokens

    JSON_LSQUARE  [
    JSON_ERROR    %0
    JSON_INTEGER  4
    JSON_KEYWORD  d
    JSON_RSQUARE  ]

The parser then yields an error, an object and two more errors:

    error: Invalid JSON syntax
    object: 4
    error: JSON parse error, invalid keyword
    error: JSON parse error, expecting value

Dumb down the lexer to accept %[A-Za-z0-9]*. The parser's check is now used. Emit a proper error there.

The lexer now produces

    JSON_LSQUARE  [
    JSON_INTERPOLATION %04d
    JSON_RSQUARE  ]

and the parser reports just

    JSON parse error, invalid interpolation '%04d'

Signed-off-by: Markus Armbruster <arm...@redhat.com>
Reviewed-by: Eric Blake <ebl...@redhat.com>
---
 qobject/json-lexer.c  | 44 ++++++-------------------------------------
 qobject/json-parser.c |  1 +
 tests/check-qjson.c   |  3 ++-
 3 files changed, 9 insertions(+), 39 deletions(-)

diff --git a/qobject/json-lexer.c b/qobject/json-lexer.c index cf15266cbe..ab2453a1e1 100644 --- a/qobject/json-lexer.c +++ b/qobject/json-lexer.c @@ -93,7 +93,8 @@ * (apostrophe) instead of %x22 (quotation mark), and can't contain * unescaped apostrophe, but can contain unescaped quotation mark. * - Interpolation, if enabled: - * interpolation = %((l|ll|I64)[du]|[ipsf]) + * The lexer accepts %[A-Za-z0-9]*, and leaves rejecting invalid + * ones to the parser. * * Note: * - Input must be encoded in modified UTF-8. 
@@ -116,11 +117,6 @@ enum json_lexer_state { IN_NEG_NONZERO_NUMBER, IN_KEYWORD, IN_INTERPOL, - IN_INTERPOL_L, - IN_INTERPOL_LL, - IN_INTERPOL_I, - IN_INTERPOL_I6, - IN_INTERPOL_I64, IN_WHITESPACE, IN_START, IN_START_INTERPOL, /* must be IN_START + 1 */ @@ -224,39 +220,11 @@ static const uint8_t json_lexer[][256] = { }, /* interpolation */ - [IN_INTERPOL_LL] = { - ['d'] = JSON_INTERPOL, - ['u'] = JSON_INTERPOL, - }, - - [IN_INTERPOL_L] = { - ['d'] = JSON_INTERPOL, - ['l'] = IN_INTERPOL_LL, - ['u'] = JSON_INTERPOL, - }, - - [IN_INTERPOL_I64] = { - ['d'] = JSON_INTERPOL, - ['u'] = JSON_INTERPOL, - }, - - [IN_INTERPOL_I6] = { - ['4'] = IN_INTERPOL_I64, - }, - - [IN_INTERPOL_I] = { - ['6'] = IN_INTERPOL_I6, - }, - [IN_INTERPOL] = { - ['d'] = JSON_INTERPOL, - ['i'] = JSON_INTERPOL, - ['p'] = JSON_INTERPOL, - ['s'] = JSON_INTERPOL, - ['u'] = JSON_INTERPOL, - ['f'] = JSON_INTERPOL, - ['l'] = IN_INTERPOL_L, - ['I'] = IN_INTERPOL_I, + TERMINAL(JSON_INTERPOL), + ['A' ... 'Z'] = IN_INTERPOL, + ['a' ... 'z'] = IN_INTERPOL, + ['0' ... '9'] = IN_INTERPOL, }, /* diff --git a/qobject/json-parser.c b/qobject/json-parser.c index 56bbfe6810..32131c08d5 100644 --- a/qobject/json-parser.c +++ b/qobject/json-parser.c @@ -453,6 +453,7 @@ static QObject *parse_interpolation(JSONParserContext *ctxt, va_list *ap) } else if (!strcmp(token->str, "%f")) { return QOBJECT(qnum_from_double(va_arg(*ap, double))); } + parse_error(ctxt, token, "invalid interpolation '%s'", token->str); return NULL; } diff --git a/tests/check-qjson.c b/tests/check-qjson.c index 3bd216f357..6a1dbbae43 100644 --- a/tests/check-qjson.c +++ b/tests/check-qjson.c @@ -1021,7 +1021,8 @@ static void interpolation_unknown(void) } g_test_trap_subprocess(NULL, 0, 0); g_test_trap_assert_failed(); - g_test_trap_assert_stderr("*Unexpected error*stray '%x'*"); + g_test_trap_assert_stderr("*Unexpected error*" + "invalid interpolation '%x'*"); } static void interpolation_string(void) -- 2.17.1