Improve performance during cursor traversal when a region of interest

is present. Rather than using clang_getCursorExtent(), which requires us to lex the token at the ending position to determine its length. Then, we'd be comparing [a, b) source ranges that cover the characters in the range rather than the normal behavior for Clang's source ranges, which covers the tokens in the range. However, relexing causes us to read the source file (which may come from a precompiled header), which is rather unfortunate and affects performance. In the new scheme, we only use Clang-style source ranges that cover the tokens in the range. At the entry points where this matters (clang_annotateTokens, clang_getCursor), we make sure to move source locations to the start of the token. Addresses most of <rdar://problem/8049381>. llvm-svn: 109134
author: Douglas Gregor <dgregor@apple.com> 2010-07-22 20:22:31 +0000
committer: Douglas Gregor <dgregor@apple.com> 2010-07-22 20:22:31 +0000
commit: cd8bdd025fe37fc395801cb41a50c60d7fab63b6 (patch)
tree: 5802cd70238acbfb06af5a8d9c96a8edc2ed787a /clang/lib/Lex
parent: 5fa3813329d93ed4f1aa2e74dbb54b2bd650d034 (diff)
download: bcm5719-llvm-cd8bdd025fe37fc395801cb41a50c60d7fab63b6.tar.gz
bcm5719-llvm-cd8bdd025fe37fc395801cb41a50c60d7fab63b6.zip
1 files changed, 53 insertions, 0 deletions
diff --git a/clang/lib/Lex/Lexer.cpp b/clang/lib/Lex/Lexer.cpp
index 2f11c37e657..b23122cbcc5 100644
--- a/clang/lib/Lex/Lexer.cpp
+++ b/clang/lib/Lex/Lexer.cpp
@@ -248,6 +248,59 @@ unsigned Lexer::MeasureTokenLength(SourceLocation Loc,
   return TheTok.getLength();
 }
 
+SourceLocation Lexer::GetBeginningOfToken(SourceLocation Loc,
+                                          const SourceManager &SM,
+                                          const LangOptions &LangOpts) {
+  std::pair<FileID, unsigned> LocInfo = SM.getDecomposedLoc(Loc);
+  bool Invalid = false;
+  llvm::StringRef Buffer = SM.getBufferData(LocInfo.first, &Invalid);
+  if (Invalid)
+    return Loc;
+
+  // Back up from the current location until we hit the beginning of a line
+  // (or the buffer). We'll relex from that point.
+  const char *BufStart = Buffer.data();
+  const char *StrData = BufStart+LocInfo.second;
+  if (StrData[0] == '\n' || StrData[0] == '\r')
+    return Loc;
+
+  const char *LexStart = StrData;
+  while (LexStart != BufStart) {
+    if (LexStart[0] == '\n' || LexStart[0] == '\r') {
+      ++LexStart;
+      break;
+    }
+
+    --LexStart;
+  }
+  
+  // Create a lexer starting at the beginning of this token.
+  SourceLocation LexerStartLoc = Loc.getFileLocWithOffset(-LocInfo.second);
+  Lexer TheLexer(LexerStartLoc, LangOpts, BufStart, LexStart, Buffer.end());
+  TheLexer.SetCommentRetentionState(true);
+  
+  // Lex tokens until we find the token that contains the source location.
+  Token TheTok;
+  do {
+    TheLexer.LexFromRawLexer(TheTok);
+    
+    if (TheLexer.getBufferLocation() > StrData) {
+      // Lexing this token has taken the lexer past the source location we're
+      // looking for. If the current token encompasses our source location,
+      // return the beginning of that token.
+      if (TheLexer.getBufferLocation() - TheTok.getLength() <= StrData)
+        return TheTok.getLocation();
+      
+      // We ended up skipping over the source location entirely, which means
+      // that it points into whitespace. We're done here.
+      break;
+    }
+  } while (TheTok.getKind() != tok::eof);
+  
+  // We've passed our source location; just return the original source location.
+  return Loc;
+}
+
 namespace {
   enum PreambleDirectiveKind {
     PDK_Skipped,
author	Douglas Gregor <dgregor@apple.com>	2010-07-22 20:22:31 +0000
committer	Douglas Gregor <dgregor@apple.com>	2010-07-22 20:22:31 +0000
commit	cd8bdd025fe37fc395801cb41a50c60d7fab63b6 (patch)
tree	5802cd70238acbfb06af5a8d9c96a8edc2ed787a /clang/lib/Lex
parent	5fa3813329d93ed4f1aa2e74dbb54b2bd650d034 (diff)
download	bcm5719-llvm-cd8bdd025fe37fc395801cb41a50c60d7fab63b6.tar.gz bcm5719-llvm-cd8bdd025fe37fc395801cb41a50c60d7fab63b6.zip