Skip to content
This repository was archived by the owner on Nov 1, 2021. It is now read-only.

Commit cff9cc9

Browse files
committed
start implementing a token rewriter. At this point, it just reads in a file
and lets a client iterate over it. git-svn-id: https://llvm.org/svn/llvm-project/cfe/trunk@57407 91177308-0d34-0410-b5e6-96231b3b80d8
1 parent b13c5ee commit cff9cc9

File tree

5 files changed

+131
-1
lines changed

5 files changed

+131
-1
lines changed

Driver/RewriteTest.cpp

+9-1
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,12 @@ void clang::DoRewriteTest(Preprocessor &PP, const std::string &InFileName,
2121
SourceManager &SM = PP.getSourceManager();
2222
const LangOptions &LangOpts = PP.getLangOptions();
2323

24+
TokenRewriter Rewriter(SM.getMainFileID(), SM, LangOpts);
25+
26+
27+
28+
29+
2430
std::pair<const char*,const char*> File =SM.getBufferData(SM.getMainFileID());
2531

2632
// Create a lexer to lex all the tokens of the main file in raw mode. Even
@@ -37,5 +43,7 @@ void clang::DoRewriteTest(Preprocessor &PP, const std::string &InFileName,
3743
RawLex.LexFromRawLexer(RawTok);
3844
}
3945

40-
46+
for (TokenRewriter::token_iterator I = Rewriter.token_begin(),
47+
E = Rewriter.token_end(); I != E; ++I)
48+
std::cout << PP.getSpelling(*I);
4149
}

clang.xcodeproj/project.pbxproj

+4
Original file line numberDiff line numberDiff line change
@@ -123,6 +123,7 @@
123123
DE4772FC0C10EAEC002239E8 /* CGExpr.cpp in Sources */ = {isa = PBXBuildFile; fileRef = DE4772FB0C10EAEC002239E8 /* CGExpr.cpp */; };
124124
DE47999C0D2EBE1A00706D2D /* SemaExprObjC.cpp in Sources */ = {isa = PBXBuildFile; fileRef = DE47999B0D2EBE1A00706D2D /* SemaExprObjC.cpp */; };
125125
DE4DC79E0EA1C09E00069E5A /* RewriteTest.cpp in Sources */ = {isa = PBXBuildFile; fileRef = DE4DC79D0EA1C09E00069E5A /* RewriteTest.cpp */; };
126+
DE4DC7A30EA1C33E00069E5A /* TokenRewriter.cpp in Sources */ = {isa = PBXBuildFile; fileRef = DE4DC7A20EA1C33E00069E5A /* TokenRewriter.cpp */; };
126127
DE5932D10AD60FF400BC794C /* clang.cpp in Sources */ = {isa = PBXBuildFile; fileRef = DE5932CD0AD60FF400BC794C /* clang.cpp */; };
127128
DE5932D20AD60FF400BC794C /* clang.h in CopyFiles */ = {isa = PBXBuildFile; fileRef = DE5932CE0AD60FF400BC794C /* clang.h */; };
128129
DE5932D30AD60FF400BC794C /* PrintParserCallbacks.cpp in Sources */ = {isa = PBXBuildFile; fileRef = DE5932CF0AD60FF400BC794C /* PrintParserCallbacks.cpp */; };
@@ -446,6 +447,7 @@
446447
DE47999B0D2EBE1A00706D2D /* SemaExprObjC.cpp */ = {isa = PBXFileReference; fileEncoding = 4; indentWidth = 2; lastKnownFileType = sourcecode.cpp.cpp; name = SemaExprObjC.cpp; path = lib/Sema/SemaExprObjC.cpp; sourceTree = "<group>"; tabWidth = 2; };
447448
DE4DC7980EA1BE4400069E5A /* TokenRewriter.h */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.h; name = TokenRewriter.h; path = clang/Rewrite/TokenRewriter.h; sourceTree = "<group>"; };
448449
DE4DC79D0EA1C09E00069E5A /* RewriteTest.cpp */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.cpp.cpp; name = RewriteTest.cpp; path = Driver/RewriteTest.cpp; sourceTree = "<group>"; };
450+
DE4DC7A20EA1C33E00069E5A /* TokenRewriter.cpp */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.cpp.cpp; name = TokenRewriter.cpp; path = lib/Rewrite/TokenRewriter.cpp; sourceTree = "<group>"; };
449451
DE53370B0CE2D96F00D9A028 /* RewriteRope.h */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.h; name = RewriteRope.h; path = clang/Rewrite/RewriteRope.h; sourceTree = "<group>"; };
450452
DE5932CD0AD60FF400BC794C /* clang.cpp */ = {isa = PBXFileReference; fileEncoding = 30; lastKnownFileType = sourcecode.cpp.cpp; name = clang.cpp; path = Driver/clang.cpp; sourceTree = "<group>"; };
451453
DE5932CE0AD60FF400BC794C /* clang.h */ = {isa = PBXFileReference; fileEncoding = 30; lastKnownFileType = sourcecode.c.h; name = clang.h; path = Driver/clang.h; sourceTree = "<group>"; };
@@ -1073,6 +1075,7 @@
10731075
72D16C1E0D9975C400E6DA4A /* HTMLRewrite.cpp */,
10741076
DEF7D9F80C9C8B1D0001F598 /* Rewriter.cpp */,
10751077
DECAB0CF0DB3C84200E13CCB /* RewriteRope.cpp */,
1078+
DE4DC7A20EA1C33E00069E5A /* TokenRewriter.cpp */,
10761079
);
10771080
name = Rewrite;
10781081
sourceTree = "<group>";
@@ -1259,6 +1262,7 @@
12591262
3551068C0E9A8546006A4E44 /* ParsePragma.cpp in Sources */,
12601263
3551068D0E9A8546006A4E44 /* ParseTentative.cpp in Sources */,
12611264
DE4DC79E0EA1C09E00069E5A /* RewriteTest.cpp in Sources */,
1265+
DE4DC7A30EA1C33E00069E5A /* TokenRewriter.cpp in Sources */,
12621266
);
12631267
runOnlyForDeploymentPostprocessing = 0;
12641268
};

include/clang/Basic/SourceLocation.h

+5
Original file line numberDiff line numberDiff line change
@@ -155,6 +155,11 @@ class SourceLocation {
155155
/// directly.
156156
unsigned getRawEncoding() const { return ID; }
157157

158+
159+
bool operator<(const SourceLocation &RHS) const {
160+
return ID < RHS.ID;
161+
}
162+
158163
/// getFromRawEncoding - Turn a raw encoding of a SourceLocation object into
159164
/// a real SourceLocation.
160165
static SourceLocation getFromRawEncoding(unsigned Encoding) {

include/clang/Rewrite/TokenRewriter.h

+60
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,60 @@
1+
//===--- TokenRewriter.h - Token-based Rewriter -----------------*- C++ -*-===//
2+
//
3+
// The LLVM Compiler Infrastructure
4+
//
5+
// This file is distributed under the University of Illinois Open Source
6+
// License. See LICENSE.TXT for details.
7+
//
8+
//===----------------------------------------------------------------------===//
9+
//
10+
// This file defines the TokenRewriter class, which is used for code
11+
// transformations.
12+
//
13+
//===----------------------------------------------------------------------===//
14+
15+
#ifndef LLVM_CLANG_TOKENREWRITER_H
16+
#define LLVM_CLANG_TOKENREWRITER_H
17+
18+
#include "clang/Basic/SourceLocation.h"
19+
#include <list>
20+
#include <map>
21+
22+
namespace clang {
23+
class Token;
24+
class LangOptions;
25+
26+
class TokenRewriter {
27+
/// TokenList - This is the list of raw tokens that make up this file. Each
28+
/// of these tokens has a unique SourceLocation, which is a FileID.
29+
std::list<Token> TokenList;
30+
31+
/// TokenRefTy - This is the type used to refer to a token in the TokenList.
32+
typedef std::list<Token>::iterator TokenRefTy;
33+
34+
/// TokenAtLoc - This map indicates which token exists at a specific
35+
/// SourceLocation. Since each token has a unique SourceLocation, this is a
36+
/// one to one map. The token can return its own location directly, to map
37+
/// backwards.
38+
std::map<SourceLocation, TokenRefTy> TokenAtLoc;
39+
40+
public:
41+
/// TokenRewriter - This creates a TokenRewriter for the file with the
42+
/// specified FileID.
43+
TokenRewriter(unsigned FileID, SourceManager &SM, const LangOptions &LO);
44+
45+
46+
typedef std::list<Token>::const_iterator token_iterator;
47+
token_iterator token_begin() const { return TokenList.begin(); }
48+
token_iterator token_end() const { return TokenList.end(); }
49+
50+
private:
51+
/// AddToken - Add the specified token into the Rewriter before the other
52+
/// position.
53+
void AddToken(const Token &T, TokenRefTy Where);
54+
};
55+
56+
57+
58+
} // end namespace clang
59+
60+
#endif

lib/Rewrite/TokenRewriter.cpp

+53
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,53 @@
1+
//===--- TokenRewriter.cpp - Token-based code rewriting interface ---------===//
2+
//
3+
// The LLVM Compiler Infrastructure
4+
//
5+
// This file is distributed under the University of Illinois Open Source
6+
// License. See LICENSE.TXT for details.
7+
//
8+
//===----------------------------------------------------------------------===//
9+
//
10+
// This file implements the TokenRewriter class, which is used for code
11+
// transformations.
12+
//
13+
//===----------------------------------------------------------------------===//
14+
15+
#include "clang/Rewrite/TokenRewriter.h"
16+
#include "clang/Lex/Lexer.h"
17+
#include "clang/Basic/SourceManager.h"
18+
using namespace clang;
19+
20+
TokenRewriter::TokenRewriter(unsigned FileID, SourceManager &SM,
21+
const LangOptions &LangOpts) {
22+
23+
std::pair<const char*,const char*> File = SM.getBufferData(FileID);
24+
25+
// Create a lexer to lex all the tokens of the main file in raw mode.
26+
Lexer RawLex(SourceLocation::getFileLoc(FileID, 0),
27+
LangOpts, File.first, File.second);
28+
29+
// Return all comments and whitespace as tokens.
30+
RawLex.SetKeepWhitespaceMode(true);
31+
32+
// Lex the file, populating our datastructures.
33+
Token RawTok;
34+
RawLex.LexFromRawLexer(RawTok);
35+
while (RawTok.isNot(tok::eof)) {
36+
AddToken(RawTok, TokenList.end());
37+
RawLex.LexFromRawLexer(RawTok);
38+
}
39+
40+
41+
}
42+
43+
/// AddToken - Add the specified token into the Rewriter before the other
44+
/// position.
45+
void TokenRewriter::AddToken(const Token &T, TokenRefTy Where) {
46+
Where = TokenList.insert(Where, T);
47+
48+
bool InsertSuccess = TokenAtLoc.insert(std::make_pair(T.getLocation(),
49+
Where)).second;
50+
assert(InsertSuccess && "Token location already in rewriter!");
51+
InsertSuccess = InsertSuccess;
52+
}
53+

0 commit comments

Comments
 (0)