Move token length calculation out of the diagnostics machinery into the lexer (Lexer::MeasureTokenLength).

author Chris Lattner <sabre@nondot.org>

Wed, 17 Oct 2007 21:18:47 +0000 (21:18 +0000)

committer Chris Lattner <sabre@nondot.org>

Wed, 17 Oct 2007 21:18:47 +0000 (21:18 +0000)
author Chris Lattner <sabre@nondot.org>
Wed, 17 Oct 2007 21:18:47 +0000 (21:18 +0000)
committer Chris Lattner <sabre@nondot.org>
Wed, 17 Oct 2007 21:18:47 +0000 (21:18 +0000)
diff --git a/Driver/TextDiagnosticPrinter.cpp b/Driver/TextDiagnosticPrinter.cpp

index 76809d7dea9021528c39f6ae44ba19f44cab5ffa..81c73fd533fde7d3efa270411cae40eaf544a3bb 100644 (file)
--- a/Driver/TextDiagnosticPrinter.cpp
+++ b/Driver/TextDiagnosticPrinter.cpp
@@ -80,7 +80,7 @@ void TextDiagnosticPrinter::HighlightRange(const SourceRange &R,
        --EndColNo;  // Zero base the col #.
        
        // Add in the length of the token, so that we cover multi-char tokens.
-      EndColNo += GetTokenLength(R.getEnd());
+      EndColNo += Lexer::MeasureTokenLength(R.getEnd(), SourceMgr);
      } else {
        EndColNo = CaratLine.size();
      }
@@ -97,31 +97,6 @@ void TextDiagnosticPrinter::HighlightRange(const SourceRange &R,
      CaratLine[i] = '~';
  }
  
-/// GetTokenLength - Given the source location of a token, determine its length.
-/// This is a fully general function that uses a lexer to relex the token.
-unsigned TextDiagnosticPrinter::GetTokenLength(SourceLocation Loc) {
-  // If this comes from a macro expansion, we really do want the macro name, not
-  // the token this macro expanded to.
-  Loc = SourceMgr.getLogicalLoc(Loc);
-  const char *StrData = SourceMgr.getCharacterData(Loc);
-  const char *BufEnd = SourceMgr.getBufferData(Loc.getFileID()).second;
-  
-  // TODO: this could be special cased for common tokens like identifiers, ')',
-  // etc to make this faster, if it mattered.  This could use 
-  // Lexer::isObviouslySimpleCharacter for example.
-  
-  // Create a langops struct and enable trigraphs.  This is sufficient for
-  // measuring tokens.
-  LangOptions LangOpts;
-  LangOpts.Trigraphs = true;
-  
-  // Create a lexer starting at the beginning of this token.
-  Lexer TheLexer(Loc, LangOpts, StrData, BufEnd);
-  Token TheTok;
-  TheLexer.LexRawToken(TheTok);
-  return TheTok.getLength();
-}
-
  void TextDiagnosticPrinter::HandleDiagnostic(Diagnostic::Level Level, 
                                               SourceLocation Pos,
                                               diag::kind ID,
diff --git a/Driver/TextDiagnosticPrinter.h b/Driver/TextDiagnosticPrinter.h

index 71e584ebf4a88d1f29cdbcaab1398d465f376382..3df38c9d42f04e9914c5f000bef57c67539899e9 100644 (file)
--- a/Driver/TextDiagnosticPrinter.h
+++ b/Driver/TextDiagnosticPrinter.h
@@ -31,7 +31,6 @@ public:
    void HighlightRange(const SourceRange &R, unsigned LineNo,
                        std::string &CaratLine,
                        const std::string &SourceLine);
-  unsigned GetTokenLength(SourceLocation Loc);
  
    virtual void HandleDiagnostic(Diagnostic::Level DiagLevel,
                                  SourceLocation Pos,
diff --git a/Lex/Lexer.cpp b/Lex/Lexer.cpp

index c7f54ca8ff3c9cd0f2b9d0000ece4b8120c8938f..19dcfe2f0c6473815652783913bb0eddc433f82a 100644 (file)
--- a/Lex/Lexer.cpp
+++ b/Lex/Lexer.cpp
@@ -163,6 +163,39 @@ void Lexer::Stringify(llvm::SmallVectorImpl<char> &Str) {
  }
  
  
+/// MeasureTokenLength - Relex the token at the specified location and return
+/// its length in bytes in the input file.  If the token needs cleaning (e.g.
+/// includes a trigraph or an escaped newline) then this count includes bytes
+/// that are part of that.
+unsigned Lexer::MeasureTokenLength(SourceLocation Loc,
+                                   const SourceManager &SM) {
+  // If this comes from a macro expansion, measure the macro name rather than
+  // the token the macro expanded to, so map Loc to its logical location first.
+  Loc = SM.getLogicalLoc(Loc);
+  
+  const char *StrData = SM.getCharacterData(Loc);
+  
+  // TODO: this could be special cased for common tokens like identifiers, ')',
+  // etc. to make it faster, if it mattered.  Looking at StrData[0] alone would
+  // handle all obviously single-char tokens, and something like
+  // Lexer::isObviouslySimpleCharacter could be used to handle identifiers.
+  
+  // The second member of the getBufferData result is handed to the lexer below
+  // as the end of the buffer to lex from.
+  const char *BufEnd = SM.getBufferData(Loc.getFileID()).second;
+  
+  // Create a LangOptions struct and enable trigraphs.  This is sufficient for
+  // measuring tokens.
+  LangOptions LangOpts;
+  LangOpts.Trigraphs = true;
+  
+  // Relex a single raw token starting at Loc; its length is the result.
+  Lexer TheLexer(Loc, LangOpts, StrData, BufEnd);
+  Token TheTok;
+  TheLexer.LexRawToken(TheTok);
+  return TheTok.getLength();
+}
+
  //===----------------------------------------------------------------------===//
  // Character information.
  //===----------------------------------------------------------------------===//
diff --git a/include/clang/Lex/Lexer.h b/include/clang/Lex/Lexer.h

index 5954150c092844e637ccbc5825cd7e2fd202f027..eda50382ad8afbecd88ba4d20e0d68ae11dda46c 100644 (file)
--- a/include/clang/Lex/Lexer.h
+++ b/include/clang/Lex/Lexer.h
@@ -24,6 +24,7 @@
  
  namespace clang {
  class Diagnostic;
+class SourceManager;
  class Preprocessor;
  
  /// Lexer - This provides a simple interface that turns a text buffer into a
@@ -178,6 +179,13 @@ public:
    /// and " characters.  This does not add surrounding ""'s to the string.
    static void Stringify(llvm::SmallVectorImpl<char> &Str);
    
+  /// MeasureTokenLength - Relex the token at the specified location and return
+  /// its length in bytes in the input file.  If the token needs cleaning (e.g.
+  /// includes a trigraph or an escaped newline) then this count includes bytes
+  /// that are part of that.
+  static unsigned MeasureTokenLength(SourceLocation Loc,
+                                     const SourceManager &SM);
+  
    //===--------------------------------------------------------------------===//
    // Internal implementation interfaces.
  private:
author	Chris Lattner <sabre@nondot.org>
	Wed, 17 Oct 2007 21:18:47 +0000 (21:18 +0000)
committer	Chris Lattner <sabre@nondot.org>
	Wed, 17 Oct 2007 21:18:47 +0000 (21:18 +0000)
Driver/TextDiagnosticPrinter.cpp		patch \| blob \| history
Driver/TextDiagnosticPrinter.h		patch \| blob \| history
Lex/Lexer.cpp		patch \| blob \| history
include/clang/Lex/Lexer.h		patch \| blob \| history