aboutsummaryrefslogtreecommitdiff
path: root/libcpp
diff options
context:
space:
mode:
authorJoseph Myers <joseph@codesourcery.com>2021-05-06 23:20:35 +0000
committerJoseph Myers <joseph@codesourcery.com>2021-05-06 23:20:35 +0000
commit8f51cf38bb9628546effe66c070188d10f80b5ca (patch)
tree2b3b9f76f52b7e5b6a21d2dd4426c4d8352051e9 /libcpp
parent07dd185755a791ab19e6a63274cf2cb69f087a6c (diff)
downloadgcc-8f51cf38bb9628546effe66c070188d10f80b5ca.zip
gcc-8f51cf38bb9628546effe66c070188d10f80b5ca.tar.gz
gcc-8f51cf38bb9628546effe66c070188d10f80b5ca.tar.bz2
preprocessor: Fix pp-number lexing of digit separators [PR83873, PR97604]
When the preprocessor lexes preprocessing numbers in lex_number, it accepts digit separators in more cases than actually permitted in pp-numbers by the standard syntax. One thing this accepts is adjacent digit separators; there is some code to reject those later, but as noted in bug 83873 it fails to cover the case of adjacent digit separators within a floating-point exponent. Accepting adjacent digit separators only results in a missing diagnostic, not in valid code being rejected or being accepted with incorrect semantics, because the correct lexing in such a case would have '' start the following preprocessing tokens, and no valid preprocessing token starts '' while ' isn't valid on its own as a preprocessing token either. So this patch fixes that case by moving the error for adjacent digit separators to lex_number (allowing a more specific diagnostic than if '' were excluded from the pp-number completely). Other cases inappropriately accepted involve digit separators before '.', 'e+', 'e-', 'p+' or 'p-' (or corresponding uppercase variants). In those cases, as shown by the test digit-sep-pp-number.C added, this can result in valid code being wrongly rejected as a result of too many characters being included in the pp-number. So this case is fixed by terminating the pp-number at the correct character according to the standard. That test also covers the case where a digit separator was followed by an identifier-nondigit that is not a nondigit (e.g. a UCN); that case was already handled correctly. Bootstrapped with no regressions for x86_64-pc-linux-gnu. libcpp/ PR c++/83873 PR preprocessor/97604 * lex.c (lex_number): Reject adjacent digit separators here. Do not allow digit separators before '.' or an exponent with sign. * expr.c (cpp_classify_number): Do not check for adjacent digit separators here. gcc/testsuite/ PR c++/83873 PR preprocessor/97604 * g++.dg/cpp1y/digit-sep-neg-2.C, g++.dg/cpp1y/digit-sep-pp-number.C: New tests. * g++.dg/cpp1y/digit-sep-line-neg.C, g++.dg/cpp1y/digit-sep-neg.C: Adjust expected messages.
Diffstat (limited to 'libcpp')
-rw-r--r--libcpp/expr.c6
-rw-r--r--libcpp/lex.c14
2 files changed, 13 insertions, 7 deletions
diff --git a/libcpp/expr.c b/libcpp/expr.c
index dd5611d..ab4a260 100644
--- a/libcpp/expr.c
+++ b/libcpp/expr.c
@@ -582,11 +582,7 @@ cpp_classify_number (cpp_reader *pfile, const cpp_token *token,
max_digit = c;
}
else if (DIGIT_SEP (c))
- {
- if (seen_digit_sep)
- SYNTAX_ERROR_AT (virtual_location, "adjacent digit separators");
- seen_digit_sep = true;
- }
+ seen_digit_sep = true;
else if (c == '.')
{
if (seen_digit_sep || DIGIT_SEP (*str))
diff --git a/libcpp/lex.c b/libcpp/lex.c
index 06bcc31..9662f1b 100644
--- a/libcpp/lex.c
+++ b/libcpp/lex.c
@@ -1548,18 +1548,28 @@ lex_number (cpp_reader *pfile, cpp_string *number,
base = pfile->buffer->cur - 1;
do
{
+ const uchar *adj_digit_sep = NULL;
cur = pfile->buffer->cur;
/* N.B. ISIDNUM does not include $. */
- while (ISIDNUM (*cur) || *cur == '.' || DIGIT_SEP (*cur)
- || VALID_SIGN (*cur, cur[-1]))
+ while (ISIDNUM (*cur)
+ || (*cur == '.' && !DIGIT_SEP (cur[-1]))
+ || DIGIT_SEP (*cur)
+ || (VALID_SIGN (*cur, cur[-1]) && !DIGIT_SEP (cur[-2])))
{
NORMALIZE_STATE_UPDATE_IDNUM (nst, *cur);
+ /* Adjacent digit separators do not form part of the pp-number syntax.
+ However, they can safely be diagnosed here as an error, since '' is
+ not a valid preprocessing token. */
+ if (DIGIT_SEP (*cur) && DIGIT_SEP (cur[-1]) && !adj_digit_sep)
+ adj_digit_sep = cur;
cur++;
}
/* A number can't end with a digit separator. */
while (cur > pfile->buffer->cur && DIGIT_SEP (cur[-1]))
--cur;
+ if (adj_digit_sep && adj_digit_sep < cur)
+ cpp_error (pfile, CPP_DL_ERROR, "adjacent digit separators");
pfile->buffer->cur = cur;
}