diff options
| author | Alex Lorenz <arphaman@gmail.com> | 2021-12-20 12:26:50 -0800 |
|---|---|---|
| committer | Alex Lorenz <arphaman@gmail.com> | 2022-02-02 11:16:11 -0800 |
| commit | 979d0ee8ab30a175220af3b39a6df7d56de9d2c8 (patch) | |
| tree | 4459753a3ce9aa911ed306c323736f3d84bbb054 | |
| parent | aee705661fe8c2ecbf0e1766ee93dbad286a6b8c (diff) | |
| download | llvm-979d0ee8ab30a175220af3b39a6df7d56de9d2c8.zip llvm-979d0ee8ab30a175220af3b39a6df7d56de9d2c8.tar.gz llvm-979d0ee8ab30a175220af3b39a6df7d56de9d2c8.tar.bz2 | |
[clang] fix out of bounds access in an empty string when lexing a _Pragma with missing string token
The lexer can attempt to lex a _Pragma and crash with an out of bounds string access when it's
lexing a _Pragma whose string token is an invalid buffer, e.g. when a module header file from which the macro
expansion for that token was deleted from the file system.
Differential Revision: https://reviews.llvm.org/D116052
| -rw-r--r-- | clang/lib/Frontend/PrintPreprocessedOutput.cpp | 3 | ||||
| -rw-r--r-- | clang/lib/Lex/Pragma.cpp | 7 | ||||
| -rw-r--r-- | clang/test/Preprocessor/pragma-missing-string-token.c | 27 |
3 files changed, 35 insertions, 2 deletions
diff --git a/clang/lib/Frontend/PrintPreprocessedOutput.cpp b/clang/lib/Frontend/PrintPreprocessedOutput.cpp index 1d0022b..e2fc862 100644 --- a/clang/lib/Frontend/PrintPreprocessedOutput.cpp +++ b/clang/lib/Frontend/PrintPreprocessedOutput.cpp @@ -189,7 +189,8 @@ public: bool MoveToLine(const Token &Tok, bool RequireStartOfLine) { PresumedLoc PLoc = SM.getPresumedLoc(Tok.getLocation()); unsigned TargetLine = PLoc.isValid() ? PLoc.getLine() : CurLine; - bool IsFirstInFile = Tok.isAtStartOfLine() && PLoc.getLine() == 1; + bool IsFirstInFile = + Tok.isAtStartOfLine() && PLoc.isValid() && PLoc.getLine() == 1; return MoveToLine(TargetLine, RequireStartOfLine) || IsFirstInFile; } diff --git a/clang/lib/Lex/Pragma.cpp b/clang/lib/Lex/Pragma.cpp index eb7e7cb..eb370e8 100644 --- a/clang/lib/Lex/Pragma.cpp +++ b/clang/lib/Lex/Pragma.cpp @@ -263,7 +263,12 @@ void Preprocessor::Handle_Pragma(Token &Tok) { } SourceLocation RParenLoc = Tok.getLocation(); - std::string StrVal = getSpelling(StrTok); + bool Invalid = false; + std::string StrVal = getSpelling(StrTok, &Invalid); + if (Invalid) { + Diag(PragmaLoc, diag::err__Pragma_malformed); + return; + } // The _Pragma is lexically sound. Destringize according to C11 6.10.9.1: // "The string literal is destringized by deleting any encoding prefix, diff --git a/clang/test/Preprocessor/pragma-missing-string-token.c b/clang/test/Preprocessor/pragma-missing-string-token.c new file mode 100644 index 0000000..5f40b2f --- /dev/null +++ b/clang/test/Preprocessor/pragma-missing-string-token.c @@ -0,0 +1,27 @@ +// RUN: rm -rf %t +// RUN: split-file %s %t + +// RUN: %clang_cc1 -emit-module -x c -fmodules -I %t/Inputs -fmodule-name=aa %t/Inputs/module.modulemap -o %t/aa.pcm +// RUN: rm %t/Inputs/b.h +// RUN: not %clang_cc1 -E -fmodules -I %t/Inputs -fmodule-file=%t/aa.pcm %s -o - -fallow-pcm-with-compiler-errors 2>&1 | FileCheck %s + +//--- Inputs/module.modulemap +module aa { + header "a.h" + header "b.h" +} + +//--- Inputs/a.h +#define TEST(x) x + +//--- Inputs/b.h +#define SUB "mypragma" + +//--- test.c +#include "a.h" + +_Pragma(SUB); +int a = TEST(SUB); + +// CHECK: int a +// CHECK: 1 error generated |
