[MC] Prevent out of order HashDirective lexing in AsmLexer.

author Nirav Dave <niravd@google.com>

Sat, 1 Oct 2016 00:42:32 +0000 (00:42 +0000)

committer Nirav Dave <niravd@google.com>

Sat, 1 Oct 2016 00:42:32 +0000 (00:42 +0000)
author Nirav Dave <niravd@google.com>
Sat, 1 Oct 2016 00:42:32 +0000 (00:42 +0000)
committer Nirav Dave <niravd@google.com>
Sat, 1 Oct 2016 00:42:32 +0000 (00:42 +0000)
diff --git a/include/llvm/MC/MCParser/AsmLexer.h b/include/llvm/MC/MCParser/AsmLexer.h

index 06937e25f59ef61dd92be3683025560f9bd6d3f1..029598c013d3570c0ed226017006d67dc5eabbbb 100644 (file)
--- a/include/llvm/MC/MCParser/AsmLexer.h
+++ b/include/llvm/MC/MCParser/AsmLexer.h
@@ -32,7 +32,7 @@ class AsmLexer : public MCAsmLexer {
    bool IsAtStartOfLine;
    bool IsAtStartOfStatement;
    bool IsParsingMSInlineAsm;
-
+  bool IsPeeking;
    void operator=(const AsmLexer&) = delete;
    AsmLexer(const AsmLexer&) = delete;
  
diff --git a/lib/MC/MCParser/AsmLexer.cpp b/lib/MC/MCParser/AsmLexer.cpp

index c1f71bcc36810b9ac1eba22665eef9f2e8252e99..d0c8bce0382660f274ede3c89af5d986020b7041 100644 (file)
--- a/lib/MC/MCParser/AsmLexer.cpp
+++ b/lib/MC/MCParser/AsmLexer.cpp
@@ -11,29 +11,29 @@
  //
  //===----------------------------------------------------------------------===//
  
+#include "llvm/MC/MCParser/AsmLexer.h"
  #include "llvm/ADT/APInt.h"
  #include "llvm/ADT/ArrayRef.h"
-#include "llvm/ADT/StringSwitch.h"
  #include "llvm/ADT/StringRef.h"
-#include "llvm/MC/MCParser/AsmLexer.h"
-#include "llvm/MC/MCParser/MCAsmLexer.h"
+#include "llvm/ADT/StringSwitch.h"
  #include "llvm/MC/MCAsmInfo.h"
+#include "llvm/MC/MCParser/MCAsmLexer.h"
  #include "llvm/Support/SMLoc.h"
+#include "llvm/Support/SaveAndRestore.h"
  #include <cassert>
  #include <cctype>
  #include <cstdio>
  #include <cstring>
-#include <tuple>
  #include <string>
+#include <tuple>
  #include <utility>
  
  using namespace llvm;
  
-AsmLexer::AsmLexer(const MCAsmInfo &MAI) : MAI(MAI) {
-  CurPtr = nullptr;
-  IsAtStartOfLine = true;
-  IsAtStartOfStatement = true;
-  IsParsingMSInlineAsm = false;
+AsmLexer::AsmLexer(const MCAsmInfo &MAI)
+    : MAI(MAI), CurPtr(nullptr), IsAtStartOfLine(true),
+      IsAtStartOfStatement(true), IsParsingMSInlineAsm(false),
+      IsPeeking(false) {
    AllowAtInIdentifier = !StringRef(MAI.getCommentString()).startswith("@");
  }
  
@@ -487,17 +487,15 @@ StringRef AsmLexer::LexUntilEndOfLine() {
  
  size_t AsmLexer::peekTokens(MutableArrayRef<AsmToken> Buf,
                              bool ShouldSkipSpace) {
-  const char *SavedTokStart = TokStart;
-  const char *SavedCurPtr = CurPtr;
-  bool SavedAtStartOfLine = IsAtStartOfLine;
-  bool SavedAtStartOfStatement = IsAtStartOfStatement;
-  bool SavedSkipSpace = SkipSpace;
-
+  SaveAndRestore<const char *> SavedTokenStart(TokStart);
+  SaveAndRestore<const char *> SavedCurPtr(CurPtr);
+  SaveAndRestore<bool> SavedAtStartOfLine(IsAtStartOfLine);
+  SaveAndRestore<bool> SavedAtStartOfStatement(IsAtStartOfStatement);
+  SaveAndRestore<bool> SavedSkipSpace(SkipSpace, ShouldSkipSpace);
+  SaveAndRestore<bool> SavedIsPeeking(IsPeeking, true);
    std::string SavedErr = getErr();
    SMLoc SavedErrLoc = getErrLoc();
  
-  SkipSpace = ShouldSkipSpace;
-
    size_t ReadCount;
    for (ReadCount = 0; ReadCount < Buf.size(); ++ReadCount) {
      AsmToken Token = LexToken();
@@ -509,13 +507,6 @@ size_t AsmLexer::peekTokens(MutableArrayRef<AsmToken> Buf,
    }
  
    SetError(SavedErrLoc, SavedErr);
-
-  SkipSpace = SavedSkipSpace;
-  IsAtStartOfLine = SavedAtStartOfLine;
-  IsAtStartOfStatement = SavedAtStartOfStatement;
-  CurPtr = SavedCurPtr;
-  TokStart = SavedTokStart;
-
    return ReadCount;
  }
  
@@ -525,7 +516,7 @@ bool AsmLexer::isAtStartOfComment(const char *Ptr) {
    if (CommentString[1] == '\0')
      return CommentString[0] == Ptr[0];
  
-  // FIXME: special case for the bogus "##" comment string in X86MCAsmInfoDarwin
+  // Allow # preprocessor commments also be counted as comments for "##" cases
    if (CommentString[1] == '#')
      return CommentString[0] == Ptr[0];
  
@@ -542,7 +533,7 @@ AsmToken AsmLexer::LexToken() {
    // This always consumes at least one character.
    int CurChar = getNextChar();
  
-  if (CurChar == '#' && IsAtStartOfStatement) {
+  if (!IsPeeking && CurChar == '#' && IsAtStartOfStatement) {
      // If this starts with a '#', this may be a cpp
      // hash directive and otherwise a line comment.
      AsmToken TokenBuf[2];
diff --git a/test/MC/AsmParser/pr28921.s b/test/MC/AsmParser/pr28921.s

new file mode 100644 (file)

index 0000000..2fbb555
--- /dev/null
+++ b/test/MC/AsmParser/pr28921.s
@@ -0,0 +1,8 @@
+// RUN: llvm-mc -triple i386-unknown-unknown %s
+
+# 1 "kernel.S"
+# 1 "<built-in>" 1
+# 1 "kernel.S" 2
+##
+# 10 "kernel.S"
+##
author	Nirav Dave <niravd@google.com>
	Sat, 1 Oct 2016 00:42:32 +0000 (00:42 +0000)
committer	Nirav Dave <niravd@google.com>
	Sat, 1 Oct 2016 00:42:32 +0000 (00:42 +0000)
include/llvm/MC/MCParser/AsmLexer.h		patch \| blob \| history
lib/MC/MCParser/AsmLexer.cpp		patch \| blob \| history
test/MC/AsmParser/pr28921.s	[new file with mode: 0644]	patch \| blob