//===--- TokenRewriter.cpp - Token-based code rewriting interface ---------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
//  This file implements the TokenRewriter class, which is used for code
//  transformations.
//
//===----------------------------------------------------------------------===//
14*67e74705SXin Li
15*67e74705SXin Li #include "clang/Rewrite/Core/TokenRewriter.h"
16*67e74705SXin Li #include "clang/Basic/SourceManager.h"
17*67e74705SXin Li #include "clang/Lex/Lexer.h"
18*67e74705SXin Li #include "clang/Lex/ScratchBuffer.h"
19*67e74705SXin Li using namespace clang;
20*67e74705SXin Li
TokenRewriter(FileID FID,SourceManager & SM,const LangOptions & LangOpts)21*67e74705SXin Li TokenRewriter::TokenRewriter(FileID FID, SourceManager &SM,
22*67e74705SXin Li const LangOptions &LangOpts) {
23*67e74705SXin Li ScratchBuf.reset(new ScratchBuffer(SM));
24*67e74705SXin Li
25*67e74705SXin Li // Create a lexer to lex all the tokens of the main file in raw mode.
26*67e74705SXin Li const llvm::MemoryBuffer *FromFile = SM.getBuffer(FID);
27*67e74705SXin Li Lexer RawLex(FID, FromFile, SM, LangOpts);
28*67e74705SXin Li
29*67e74705SXin Li // Return all comments and whitespace as tokens.
30*67e74705SXin Li RawLex.SetKeepWhitespaceMode(true);
31*67e74705SXin Li
32*67e74705SXin Li // Lex the file, populating our datastructures.
33*67e74705SXin Li Token RawTok;
34*67e74705SXin Li RawLex.LexFromRawLexer(RawTok);
35*67e74705SXin Li while (RawTok.isNot(tok::eof)) {
36*67e74705SXin Li #if 0
37*67e74705SXin Li if (Tok.is(tok::raw_identifier)) {
38*67e74705SXin Li // Look up the identifier info for the token. This should use
39*67e74705SXin Li // IdentifierTable directly instead of PP.
40*67e74705SXin Li PP.LookUpIdentifierInfo(Tok);
41*67e74705SXin Li }
42*67e74705SXin Li #endif
43*67e74705SXin Li
44*67e74705SXin Li AddToken(RawTok, TokenList.end());
45*67e74705SXin Li RawLex.LexFromRawLexer(RawTok);
46*67e74705SXin Li }
47*67e74705SXin Li }
48*67e74705SXin Li
~TokenRewriter()49*67e74705SXin Li TokenRewriter::~TokenRewriter() {
50*67e74705SXin Li }
51*67e74705SXin Li
52*67e74705SXin Li
53*67e74705SXin Li /// RemapIterator - Convert from token_iterator (a const iterator) to
54*67e74705SXin Li /// TokenRefTy (a non-const iterator).
RemapIterator(token_iterator I)55*67e74705SXin Li TokenRewriter::TokenRefTy TokenRewriter::RemapIterator(token_iterator I) {
56*67e74705SXin Li if (I == token_end()) return TokenList.end();
57*67e74705SXin Li
58*67e74705SXin Li // FIXME: This is horrible, we should use our own list or something to avoid
59*67e74705SXin Li // this.
60*67e74705SXin Li std::map<SourceLocation, TokenRefTy>::iterator MapIt =
61*67e74705SXin Li TokenAtLoc.find(I->getLocation());
62*67e74705SXin Li assert(MapIt != TokenAtLoc.end() && "iterator not in rewriter?");
63*67e74705SXin Li return MapIt->second;
64*67e74705SXin Li }
65*67e74705SXin Li
66*67e74705SXin Li
67*67e74705SXin Li /// AddToken - Add the specified token into the Rewriter before the other
68*67e74705SXin Li /// position.
69*67e74705SXin Li TokenRewriter::TokenRefTy
AddToken(const Token & T,TokenRefTy Where)70*67e74705SXin Li TokenRewriter::AddToken(const Token &T, TokenRefTy Where) {
71*67e74705SXin Li Where = TokenList.insert(Where, T);
72*67e74705SXin Li
73*67e74705SXin Li bool InsertSuccess = TokenAtLoc.insert(std::make_pair(T.getLocation(),
74*67e74705SXin Li Where)).second;
75*67e74705SXin Li assert(InsertSuccess && "Token location already in rewriter!");
76*67e74705SXin Li (void)InsertSuccess;
77*67e74705SXin Li return Where;
78*67e74705SXin Li }
79*67e74705SXin Li
80*67e74705SXin Li
81*67e74705SXin Li TokenRewriter::token_iterator
AddTokenBefore(token_iterator I,const char * Val)82*67e74705SXin Li TokenRewriter::AddTokenBefore(token_iterator I, const char *Val) {
83*67e74705SXin Li unsigned Len = strlen(Val);
84*67e74705SXin Li
85*67e74705SXin Li // Plop the string into the scratch buffer, then create a token for this
86*67e74705SXin Li // string.
87*67e74705SXin Li Token Tok;
88*67e74705SXin Li Tok.startToken();
89*67e74705SXin Li const char *Spelling;
90*67e74705SXin Li Tok.setLocation(ScratchBuf->getToken(Val, Len, Spelling));
91*67e74705SXin Li Tok.setLength(Len);
92*67e74705SXin Li
93*67e74705SXin Li // TODO: Form a whole lexer around this and relex the token! For now, just
94*67e74705SXin Li // set kind to tok::unknown.
95*67e74705SXin Li Tok.setKind(tok::unknown);
96*67e74705SXin Li
97*67e74705SXin Li return AddToken(Tok, RemapIterator(I));
98*67e74705SXin Li }
99*67e74705SXin Li
100