Merging r322390:

author Hans Wennborg <hans@hanshq.net>

Wed, 17 Jan 2018 13:24:15 +0000 (13:24 +0000)

committer Hans Wennborg <hans@hanshq.net>

Wed, 17 Jan 2018 13:24:15 +0000 (13:24 +0000)
author Hans Wennborg <hans@hanshq.net>
Wed, 17 Jan 2018 13:24:15 +0000 (13:24 +0000)
committer Hans Wennborg <hans@hanshq.net>
Wed, 17 Jan 2018 13:24:15 +0000 (13:24 +0000)
diff --git a/lib/Lex/Lexer.cpp b/lib/Lex/Lexer.cpp

index 830354ab23f0d73a04b47ce7ccf0974d9480c541..8bd4ab0ff9caf2b74e0e7ac76033f8dac1733027 100644 (file)
--- a/lib/Lex/Lexer.cpp
+++ b/lib/Lex/Lexer.cpp
@@ -2009,18 +2009,21 @@ bool Lexer::LexAngledStringLiteral(Token &Result, const char *CurPtr) {
    const char *AfterLessPos = CurPtr;
    char C = getAndAdvanceChar(CurPtr, Result);
    while (C != '>') {
-    // Skip escaped characters.
-    if (C == '\\' && CurPtr < BufferEnd) {
-      // Skip the escaped character.
-      getAndAdvanceChar(CurPtr, Result);
-    } else if (C == '\n' || C == '\r' ||             // Newline.
-               (C == 0 && (CurPtr-1 == BufferEnd ||  // End of file.
-                           isCodeCompletionPoint(CurPtr-1)))) {
+    // Skip escaped characters.  Escaped newlines will already be processed by
+    // getAndAdvanceChar.
+    if (C == '\\')
+      C = getAndAdvanceChar(CurPtr, Result);
+
+    if (C == '\n' || C == '\r' ||             // Newline.
+        (C == 0 && (CurPtr-1 == BufferEnd ||  // End of file.
+                    isCodeCompletionPoint(CurPtr-1)))) {
        // If the filename is unterminated, then it must just be a lone <
        // character.  Return this as such.
        FormTokenWithChars(Result, AfterLessPos, tok::less);
        return true;
-    } else if (C == 0) {
+    }
+
+    if (C == 0) {
        NulCharacter = CurPtr-1;
      }
      C = getAndAdvanceChar(CurPtr, Result);
diff --git a/test/Lexer/null-character-in-literal.c b/test/Lexer/null-character-in-literal.c

new file mode 100644 (file)

index 0000000..a479547

Binary files /dev/null and b/test/Lexer/null-character-in-literal.c differ
diff --git a/unittests/Lex/LexerTest.cpp b/unittests/Lex/LexerTest.cpp

index d699a44b13fdb376db778cb37ee99389fef6b5c9..317e2c836335f8411fd18ad6e016323ccd55b1c4 100644 (file)
--- a/unittests/Lex/LexerTest.cpp
+++ b/unittests/Lex/LexerTest.cpp
@@ -476,6 +476,8 @@ TEST_F(LexerTest, GetBeginningOfTokenWithEscapedNewLine) {
  TEST_F(LexerTest, AvoidPastEndOfStringDereference) {
    std::vector<Token> LexedTokens = Lex("  //  \\\n");
    EXPECT_TRUE(LexedTokens.empty());
+  EXPECT_TRUE(Lex("#include <\\\\").empty());
+  EXPECT_TRUE(Lex("#include <\\\\\n").empty());
  }
  
  TEST_F(LexerTest, StringizingRasString) {
author	Hans Wennborg <hans@hanshq.net>
	Wed, 17 Jan 2018 13:24:15 +0000 (13:24 +0000)
committer	Hans Wennborg <hans@hanshq.net>
	Wed, 17 Jan 2018 13:24:15 +0000 (13:24 +0000)
lib/Lex/Lexer.cpp		patch | blob | history
test/Lexer/null-character-in-literal.c	[new file with mode: 0644]	patch | blob
unittests/Lex/LexerTest.cpp		patch | blob | history