lib/Rewrite/TokenRewriter.cpp

//===- TokenRewriter.cpp - Token-based code rewriting interface -----------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
//  This file implements the TokenRewriter class, which is used for code
//  transformations.
//
//===----------------------------------------------------------------------===//
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric#include "clang/Rewrite/Core/TokenRewriter.h"
0b57cec5SDimitry Andric#include "clang/Basic/SourceManager.h"
0b57cec5SDimitry Andric#include "clang/Lex/Lexer.h"
0b57cec5SDimitry Andric#include "clang/Lex/ScratchBuffer.h"
0b57cec5SDimitry Andric#include "clang/Lex/Token.h"
0b57cec5SDimitry Andric#include <cassert>
0b57cec5SDimitry Andric#include <cstring>
0b57cec5SDimitry Andric#include <map>
0b57cec5SDimitry Andric#include <utility>
0b57cec5SDimitry Andric
0b57cec5SDimitry Andricusing namespace clang;
0b57cec5SDimitry Andric
0b57cec5SDimitry AndricTokenRewriter::TokenRewriter(FileID FID, SourceManager &SM,
0b57cec5SDimitry Andric                             const LangOptions &LangOpts) {
0b57cec5SDimitry Andric  ScratchBuf.reset(new ScratchBuffer(SM));
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  // Create a lexer to lex all the tokens of the main file in raw mode.
*e8d8bef9SDimitry Andric  llvm::MemoryBufferRef FromFile = SM.getBufferOrFake(FID);
0b57cec5SDimitry Andric  Lexer RawLex(FID, FromFile, SM, LangOpts);
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  // Return all comments and whitespace as tokens.
0b57cec5SDimitry Andric  RawLex.SetKeepWhitespaceMode(true);
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  // Lex the file, populating our datastructures.
0b57cec5SDimitry Andric  Token RawTok;
0b57cec5SDimitry Andric  RawLex.LexFromRawLexer(RawTok);
0b57cec5SDimitry Andric  while (RawTok.isNot(tok::eof)) {
0b57cec5SDimitry Andric#if 0
0b57cec5SDimitry Andric    if (Tok.is(tok::raw_identifier)) {
0b57cec5SDimitry Andric      // Look up the identifier info for the token.  This should use
0b57cec5SDimitry Andric      // IdentifierTable directly instead of PP.
0b57cec5SDimitry Andric      PP.LookUpIdentifierInfo(Tok);
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric#endif
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    AddToken(RawTok, TokenList.end());
0b57cec5SDimitry Andric    RawLex.LexFromRawLexer(RawTok);
0b57cec5SDimitry Andric  }
0b57cec5SDimitry Andric}
0b57cec5SDimitry Andric
0b57cec5SDimitry AndricTokenRewriter::~TokenRewriter() = default;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric/// RemapIterator - Convert from token_iterator (a const iterator) to
0b57cec5SDimitry Andric/// TokenRefTy (a non-const iterator).
0b57cec5SDimitry AndricTokenRewriter::TokenRefTy TokenRewriter::RemapIterator(token_iterator I) {
0b57cec5SDimitry Andric  if (I == token_end()) return TokenList.end();
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  // FIXME: This is horrible, we should use our own list or something to avoid
0b57cec5SDimitry Andric  // this.
0b57cec5SDimitry Andric  std::map<SourceLocation, TokenRefTy>::iterator MapIt =
0b57cec5SDimitry Andric    TokenAtLoc.find(I->getLocation());
0b57cec5SDimitry Andric  assert(MapIt != TokenAtLoc.end() && "iterator not in rewriter?");
0b57cec5SDimitry Andric  return MapIt->second;
0b57cec5SDimitry Andric}
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric/// AddToken - Add the specified token into the Rewriter before the other
0b57cec5SDimitry Andric/// position.
0b57cec5SDimitry AndricTokenRewriter::TokenRefTy
0b57cec5SDimitry AndricTokenRewriter::AddToken(const Token &T, TokenRefTy Where) {
0b57cec5SDimitry Andric  Where = TokenList.insert(Where, T);
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  bool InsertSuccess = TokenAtLoc.insert(std::make_pair(T.getLocation(),
0b57cec5SDimitry Andric                                                        Where)).second;
0b57cec5SDimitry Andric  assert(InsertSuccess && "Token location already in rewriter!");
0b57cec5SDimitry Andric  (void)InsertSuccess;
0b57cec5SDimitry Andric  return Where;
0b57cec5SDimitry Andric}
0b57cec5SDimitry Andric
0b57cec5SDimitry AndricTokenRewriter::token_iterator
0b57cec5SDimitry AndricTokenRewriter::AddTokenBefore(token_iterator I, const char *Val) {
0b57cec5SDimitry Andric  unsigned Len = strlen(Val);
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  // Plop the string into the scratch buffer, then create a token for this
0b57cec5SDimitry Andric  // string.
0b57cec5SDimitry Andric  Token Tok;
0b57cec5SDimitry Andric  Tok.startToken();
0b57cec5SDimitry Andric  const char *Spelling;
0b57cec5SDimitry Andric  Tok.setLocation(ScratchBuf->getToken(Val, Len, Spelling));
0b57cec5SDimitry Andric  Tok.setLength(Len);
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  // TODO: Form a whole lexer around this and relex the token!  For now, just
0b57cec5SDimitry Andric  // set kind to tok::unknown.
0b57cec5SDimitry Andric  Tok.setKind(tok::unknown);
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  return AddToken(Tok, RemapIterator(I));
0b57cec5SDimitry Andric}