Hi! The libcpp left shift handling implements (partially) the C99-C23 wording where shifts are UB if shift count is negative, or too large, or shifting left a negative value or shifting left non-negative value results in something not representable in the result type (in the preprocessor case that is intmax_t). libcpp actually implements left shift by negative count as right shifts by negation of the count and similarly right shifts by negative count as left shifts by negation (not ok), sets overflow for too large shift count (ok), doesn't check for negative values on left shift (not ok) and checks correctly for the non-representable ones otherwise (ok).
Now, C++11 to C++17 has different behavior, whereas in C99-C23 1 << 63 in preprocessor is invalid, in C++11-17 it is valid, but 3 << 63 is not. The wording is that left shift of negative value is UB (like in C) and signed non-negative left shift is UB if the result isn't representable in corresponding unsigned type (so uintmax_t for libcpp). And then C++20 and newer says all left shifts are well defined with the exception of bad shift counts. In -fsanitize=undefined we handle these by /* For signed x << y, in C99 and later, the following: (unsigned) x >> (uprecm1 - y) if non-zero, is undefined. */ and /* For signed x << y, in C++11 to C++17, the following: x < 0 || ((unsigned) x >> (uprecm1 - y)) if > 1, is undefined. */ Now, we are late in GCC 15 development, so I think making the preprocessor more strict than it is now is undesirable, so will defer setting overflow flag for the shifts by negative count, or shifts by negative value left. The following patch just makes some previously incorrectly rejected or warned cases valid for C++11-17 and even more for C++20 and later. Bootstrapped/regtested on x86_64-linux and i686-linux, ok for trunk? 2025-03-22 Jakub Jelinek <ja...@redhat.com> PR preprocessor/119391 * expr.cc (num_lshift): Add pfile argument. Don't set num.overflow for !num.unsignedp in C++20 or later unless n >= precision. For C++11 to C++17 set it if orig >> (precision - 1 - n) as logical shift results in value > 1. (num_binary_op): Pass pfile to num_lshift. (num_div_op): Likewise. * g++.dg/cpp/pr119391.C: New test. --- libcpp/expr.cc.jj 2025-01-02 11:47:49.292955988 +0100 +++ libcpp/expr.cc 2025-03-21 17:03:28.790005969 +0100 @@ -53,7 +53,7 @@ static cpp_num num_equality_op (cpp_read static cpp_num num_mul (cpp_reader *, cpp_num, cpp_num); static cpp_num num_div_op (cpp_reader *, cpp_num, cpp_num, enum cpp_ttype, location_t); -static cpp_num num_lshift (cpp_num, size_t, size_t); +static cpp_num num_lshift (cpp_reader *, cpp_num, size_t, size_t); static cpp_num num_rshift (cpp_num, size_t, size_t); static cpp_num append_digit (cpp_num, int, int, size_t); @@ -2049,7 +2049,7 @@ num_rshift (cpp_num num, size_t precisio /* Shift NUM, of width PRECISION, left by N bits. */ static cpp_num -num_lshift (cpp_num num, size_t precision, size_t n) +num_lshift (cpp_reader *pfile, cpp_num num, size_t precision, size_t n) { if (n >= precision) { @@ -2075,8 +2075,26 @@ num_lshift (cpp_num num, size_t precisio } num = num_trim (num, precision); - if (num.unsignedp) + if (num.unsignedp + /* For C++20 or later, there is no overflow for signed left + shifts, it is as if the shift was in uintmax_t and cast + back to intmax_t afterwards. */ + || (CPP_OPTION (pfile, cplusplus) + && CPP_OPTION (pfile, lang) >= CLK_GNUCXX20)) num.overflow = false; + else if (CPP_OPTION (pfile, cplusplus) + && CPP_OPTION (pfile, lang) >= CLK_GNUCXX11 + && num_positive (orig, precision)) + { + /* For C++11 - C++17, 1 << 63 is allowed because it is + representable in uintmax_t, but 3 << 63 is not. + Test whether num >> (precision - 1 - n) as logical + shift is > 1. */ + maybe_orig = orig; + maybe_orig.unsignedp = true; + maybe_orig = num_rshift (maybe_orig, precision, precision - 1 - n); + num.overflow = maybe_orig.high || maybe_orig.low > 1; + } else { maybe_orig = num_rshift (num, precision, n); @@ -2149,7 +2167,7 @@ num_binary_op (cpp_reader *pfile, cpp_nu else n = rhs.low; if (op == CPP_LSHIFT) - lhs = num_lshift (lhs, precision, n); + lhs = num_lshift (pfile, lhs, precision, n); else lhs = num_rshift (lhs, precision, n); break; @@ -2347,7 +2365,7 @@ num_div_op (cpp_reader *pfile, cpp_num l rhs.unsignedp = true; lhs.unsignedp = true; i = precision - i - 1; - sub = num_lshift (rhs, precision, i); + sub = num_lshift (pfile, rhs, precision, i); result.high = result.low = 0; for (;;) --- gcc/testsuite/g++.dg/cpp/pr119391.C.jj 2025-03-21 17:13:12.792074937 +0100 +++ gcc/testsuite/g++.dg/cpp/pr119391.C 2025-03-21 17:12:38.677537621 +0100 @@ -0,0 +1,15 @@ +// PR preprocessor/119391 +// { dg-do preprocess } +// { dg-options "" } + +#if (1 << 63) != -9223372036854775807 - 1 // { dg-warning "integer overflow in preprocessor expression" "" { target c++98_only } } +#warning "Unexpected value" +#endif +#if (3 << 62) != -4611686018427387904 // { dg-warning "integer overflow in preprocessor expression" "" { target c++98_only } } +#warning "Unexpected value" +#endif +#if 1 << 64 // { dg-warning "integer overflow in preprocessor expression" } +#endif +#if (3 << 63) != -9223372036854775807 - 1 // { dg-warning "integer overflow in preprocessor expression" "" { target c++17_down } } +#warning "Unexpected value" +#endif Jakub