1 //===--- Transformer.cpp - Transformer library implementation ---*- C++ -*-===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 9 #include "clang/Tooling/Transformer/RewriteRule.h" 10 #include "clang/AST/ASTTypeTraits.h" 11 #include "clang/AST/Stmt.h" 12 #include "clang/ASTMatchers/ASTMatchFinder.h" 13 #include "clang/ASTMatchers/ASTMatchers.h" 14 #include "clang/Basic/SourceLocation.h" 15 #include "clang/Tooling/Transformer/SourceCode.h" 16 #include "llvm/ADT/StringRef.h" 17 #include "llvm/Support/Errc.h" 18 #include "llvm/Support/Error.h" 19 #include <map> 20 #include <string> 21 #include <utility> 22 #include <vector> 23 24 using namespace clang; 25 using namespace transformer; 26 27 using ast_matchers::MatchFinder; 28 using ast_matchers::internal::DynTypedMatcher; 29 30 using MatchResult = MatchFinder::MatchResult; 31 32 const char transformer::RootID[] = "___root___"; 33 34 static Expected<SmallVector<transformer::Edit, 1>> 35 translateEdits(const MatchResult &Result, ArrayRef<ASTEdit> ASTEdits) { 36 SmallVector<transformer::Edit, 1> Edits; 37 for (const auto &E : ASTEdits) { 38 Expected<CharSourceRange> Range = E.TargetRange(Result); 39 if (!Range) 40 return Range.takeError(); 41 std::optional<CharSourceRange> EditRange = 42 tooling::getFileRangeForEdit(*Range, *Result.Context); 43 // FIXME: let user specify whether to treat this case as an error or ignore 44 // it as is currently done. This behavior is problematic in that it hides 45 // failures from bad ranges. Also, the behavior here differs from 46 // `flatten`. Here, we abort (without error), whereas flatten, if it hits an 47 // empty list, does not abort. As a result, `editList({A,B})` is not 48 // equivalent to `flatten(edit(A), edit(B))`. The former will abort if `A` 49 // produces a bad range, whereas the latter will simply ignore A. 50 if (!EditRange) 51 return SmallVector<Edit, 0>(); 52 transformer::Edit T; 53 T.Kind = E.Kind; 54 T.Range = *EditRange; 55 if (E.Replacement) { 56 auto Replacement = E.Replacement->eval(Result); 57 if (!Replacement) 58 return Replacement.takeError(); 59 T.Replacement = std::move(*Replacement); 60 } 61 if (E.Note) { 62 auto Note = E.Note->eval(Result); 63 if (!Note) 64 return Note.takeError(); 65 T.Note = std::move(*Note); 66 } 67 if (E.Metadata) { 68 auto Metadata = E.Metadata(Result); 69 if (!Metadata) 70 return Metadata.takeError(); 71 T.Metadata = std::move(*Metadata); 72 } 73 Edits.push_back(std::move(T)); 74 } 75 return Edits; 76 } 77 78 EditGenerator transformer::editList(SmallVector<ASTEdit, 1> Edits) { 79 return [Edits = std::move(Edits)](const MatchResult &Result) { 80 return translateEdits(Result, Edits); 81 }; 82 } 83 84 EditGenerator transformer::edit(ASTEdit Edit) { 85 return [Edit = std::move(Edit)](const MatchResult &Result) { 86 return translateEdits(Result, {Edit}); 87 }; 88 } 89 90 EditGenerator transformer::noopEdit(RangeSelector Anchor) { 91 return [Anchor = std::move(Anchor)](const MatchResult &Result) 92 -> Expected<SmallVector<transformer::Edit, 1>> { 93 Expected<CharSourceRange> Range = Anchor(Result); 94 if (!Range) 95 return Range.takeError(); 96 // In case the range is inside a macro expansion, map the location back to a 97 // "real" source location. 98 SourceLocation Begin = 99 Result.SourceManager->getSpellingLoc(Range->getBegin()); 100 Edit E; 101 // Implicitly, leave `E.Replacement` as the empty string. 102 E.Kind = EditKind::Range; 103 E.Range = CharSourceRange::getCharRange(Begin, Begin); 104 return SmallVector<Edit, 1>{E}; 105 }; 106 } 107 108 EditGenerator 109 transformer::flattenVector(SmallVector<EditGenerator, 2> Generators) { 110 if (Generators.size() == 1) 111 return std::move(Generators[0]); 112 return 113 [Gs = std::move(Generators)]( 114 const MatchResult &Result) -> llvm::Expected<SmallVector<Edit, 1>> { 115 SmallVector<Edit, 1> AllEdits; 116 for (const auto &G : Gs) { 117 llvm::Expected<SmallVector<Edit, 1>> Edits = G(Result); 118 if (!Edits) 119 return Edits.takeError(); 120 AllEdits.append(Edits->begin(), Edits->end()); 121 } 122 return AllEdits; 123 }; 124 } 125 126 ASTEdit transformer::changeTo(RangeSelector Target, TextGenerator Replacement) { 127 ASTEdit E; 128 E.TargetRange = std::move(Target); 129 E.Replacement = std::move(Replacement); 130 return E; 131 } 132 133 ASTEdit transformer::note(RangeSelector Anchor, TextGenerator Note) { 134 ASTEdit E; 135 E.TargetRange = transformer::before(Anchor); 136 E.Note = std::move(Note); 137 return E; 138 } 139 140 namespace { 141 /// A \c TextGenerator that always returns a fixed string. 142 class SimpleTextGenerator : public MatchComputation<std::string> { 143 std::string S; 144 145 public: 146 SimpleTextGenerator(std::string S) : S(std::move(S)) {} 147 llvm::Error eval(const ast_matchers::MatchFinder::MatchResult &, 148 std::string *Result) const override { 149 Result->append(S); 150 return llvm::Error::success(); 151 } 152 std::string toString() const override { 153 return (llvm::Twine("text(\"") + S + "\")").str(); 154 } 155 }; 156 } // namespace 157 158 static TextGenerator makeText(std::string S) { 159 return std::make_shared<SimpleTextGenerator>(std::move(S)); 160 } 161 162 ASTEdit transformer::remove(RangeSelector S) { 163 return change(std::move(S), makeText("")); 164 } 165 166 static std::string formatHeaderPath(StringRef Header, IncludeFormat Format) { 167 switch (Format) { 168 case transformer::IncludeFormat::Quoted: 169 return Header.str(); 170 case transformer::IncludeFormat::Angled: 171 return ("<" + Header + ">").str(); 172 } 173 llvm_unreachable("Unknown transformer::IncludeFormat enum"); 174 } 175 176 ASTEdit transformer::addInclude(RangeSelector Target, StringRef Header, 177 IncludeFormat Format) { 178 ASTEdit E; 179 E.Kind = EditKind::AddInclude; 180 E.TargetRange = Target; 181 E.Replacement = makeText(formatHeaderPath(Header, Format)); 182 return E; 183 } 184 185 EditGenerator 186 transformer::detail::makeEditGenerator(llvm::SmallVector<ASTEdit, 1> Edits) { 187 return editList(std::move(Edits)); 188 } 189 190 EditGenerator transformer::detail::makeEditGenerator(ASTEdit Edit) { 191 return edit(std::move(Edit)); 192 } 193 194 RewriteRule transformer::detail::makeRule(DynTypedMatcher M, 195 EditGenerator Edits) { 196 RewriteRule R; 197 R.Cases = {{std::move(M), std::move(Edits)}}; 198 return R; 199 } 200 201 RewriteRule transformer::makeRule(ast_matchers::internal::DynTypedMatcher M, 202 std::initializer_list<ASTEdit> Edits) { 203 return detail::makeRule(std::move(M), 204 detail::makeEditGenerator(std::move(Edits))); 205 } 206 207 namespace { 208 209 /// Unconditionally binds the given node set before trying `InnerMatcher` and 210 /// keeps the bound nodes on a successful match. 211 template <typename T> 212 class BindingsMatcher : public ast_matchers::internal::MatcherInterface<T> { 213 ast_matchers::BoundNodes Nodes; 214 const ast_matchers::internal::Matcher<T> InnerMatcher; 215 216 public: 217 explicit BindingsMatcher(ast_matchers::BoundNodes Nodes, 218 ast_matchers::internal::Matcher<T> InnerMatcher) 219 : Nodes(std::move(Nodes)), InnerMatcher(std::move(InnerMatcher)) {} 220 221 bool matches( 222 const T &Node, ast_matchers::internal::ASTMatchFinder *Finder, 223 ast_matchers::internal::BoundNodesTreeBuilder *Builder) const override { 224 ast_matchers::internal::BoundNodesTreeBuilder Result(*Builder); 225 for (const auto &N : Nodes.getMap()) 226 Result.setBinding(N.first, N.second); 227 if (InnerMatcher.matches(Node, Finder, &Result)) { 228 *Builder = std::move(Result); 229 return true; 230 } 231 return false; 232 } 233 }; 234 235 /// Matches nodes of type T that have at least one descendant node for which the 236 /// given inner matcher matches. Will match for each descendant node that 237 /// matches. Based on ForEachDescendantMatcher, but takes a dynamic matcher, 238 /// instead of a static one, because it is used by RewriteRule, which carries 239 /// (only top-level) dynamic matchers. 240 template <typename T> 241 class DynamicForEachDescendantMatcher 242 : public ast_matchers::internal::MatcherInterface<T> { 243 const DynTypedMatcher DescendantMatcher; 244 245 public: 246 explicit DynamicForEachDescendantMatcher(DynTypedMatcher DescendantMatcher) 247 : DescendantMatcher(std::move(DescendantMatcher)) {} 248 249 bool matches( 250 const T &Node, ast_matchers::internal::ASTMatchFinder *Finder, 251 ast_matchers::internal::BoundNodesTreeBuilder *Builder) const override { 252 return Finder->matchesDescendantOf( 253 Node, this->DescendantMatcher, Builder, 254 ast_matchers::internal::ASTMatchFinder::BK_All); 255 } 256 }; 257 258 template <typename T> 259 ast_matchers::internal::Matcher<T> 260 forEachDescendantDynamically(ast_matchers::BoundNodes Nodes, 261 DynTypedMatcher M) { 262 return ast_matchers::internal::makeMatcher(new BindingsMatcher<T>( 263 std::move(Nodes), 264 ast_matchers::internal::makeMatcher( 265 new DynamicForEachDescendantMatcher<T>(std::move(M))))); 266 } 267 268 class ApplyRuleCallback : public MatchFinder::MatchCallback { 269 public: 270 ApplyRuleCallback(RewriteRule Rule) : Rule(std::move(Rule)) {} 271 272 template <typename T> 273 void registerMatchers(const ast_matchers::BoundNodes &Nodes, 274 MatchFinder *MF) { 275 for (auto &Matcher : transformer::detail::buildMatchers(Rule)) 276 MF->addMatcher(forEachDescendantDynamically<T>(Nodes, Matcher), this); 277 } 278 279 void run(const MatchFinder::MatchResult &Result) override { 280 if (!Edits) 281 return; 282 size_t I = transformer::detail::findSelectedCase(Result, Rule); 283 auto Transformations = Rule.Cases[I].Edits(Result); 284 if (!Transformations) { 285 Edits = Transformations.takeError(); 286 return; 287 } 288 Edits->append(Transformations->begin(), Transformations->end()); 289 } 290 291 RewriteRule Rule; 292 293 // Initialize to a non-error state. 294 Expected<SmallVector<Edit, 1>> Edits = SmallVector<Edit, 1>(); 295 }; 296 } // namespace 297 298 template <typename T> 299 llvm::Expected<SmallVector<clang::transformer::Edit, 1>> 300 rewriteDescendantsImpl(const T &Node, RewriteRule Rule, 301 const MatchResult &Result) { 302 ApplyRuleCallback Callback(std::move(Rule)); 303 MatchFinder Finder; 304 Callback.registerMatchers<T>(Result.Nodes, &Finder); 305 Finder.match(Node, *Result.Context); 306 return std::move(Callback.Edits); 307 } 308 309 llvm::Expected<SmallVector<clang::transformer::Edit, 1>> 310 transformer::detail::rewriteDescendants(const Decl &Node, RewriteRule Rule, 311 const MatchResult &Result) { 312 return rewriteDescendantsImpl(Node, std::move(Rule), Result); 313 } 314 315 llvm::Expected<SmallVector<clang::transformer::Edit, 1>> 316 transformer::detail::rewriteDescendants(const Stmt &Node, RewriteRule Rule, 317 const MatchResult &Result) { 318 return rewriteDescendantsImpl(Node, std::move(Rule), Result); 319 } 320 321 llvm::Expected<SmallVector<clang::transformer::Edit, 1>> 322 transformer::detail::rewriteDescendants(const TypeLoc &Node, RewriteRule Rule, 323 const MatchResult &Result) { 324 return rewriteDescendantsImpl(Node, std::move(Rule), Result); 325 } 326 327 llvm::Expected<SmallVector<clang::transformer::Edit, 1>> 328 transformer::detail::rewriteDescendants(const DynTypedNode &DNode, 329 RewriteRule Rule, 330 const MatchResult &Result) { 331 if (const auto *Node = DNode.get<Decl>()) 332 return rewriteDescendantsImpl(*Node, std::move(Rule), Result); 333 if (const auto *Node = DNode.get<Stmt>()) 334 return rewriteDescendantsImpl(*Node, std::move(Rule), Result); 335 if (const auto *Node = DNode.get<TypeLoc>()) 336 return rewriteDescendantsImpl(*Node, std::move(Rule), Result); 337 338 return llvm::make_error<llvm::StringError>( 339 llvm::errc::invalid_argument, 340 "type unsupported for recursive rewriting, Kind=" + 341 DNode.getNodeKind().asStringRef()); 342 } 343 344 EditGenerator transformer::rewriteDescendants(std::string NodeId, 345 RewriteRule Rule) { 346 return [NodeId = std::move(NodeId), 347 Rule = std::move(Rule)](const MatchResult &Result) 348 -> llvm::Expected<SmallVector<clang::transformer::Edit, 1>> { 349 const ast_matchers::BoundNodes::IDToNodeMap &NodesMap = 350 Result.Nodes.getMap(); 351 auto It = NodesMap.find(NodeId); 352 if (It == NodesMap.end()) 353 return llvm::make_error<llvm::StringError>(llvm::errc::invalid_argument, 354 "ID not bound: " + NodeId); 355 return detail::rewriteDescendants(It->second, std::move(Rule), Result); 356 }; 357 } 358 359 void transformer::addInclude(RewriteRuleBase &Rule, StringRef Header, 360 IncludeFormat Format) { 361 for (auto &Case : Rule.Cases) 362 Case.Edits = flatten(std::move(Case.Edits), addInclude(Header, Format)); 363 } 364 365 #ifndef NDEBUG 366 // Filters for supported matcher kinds. FIXME: Explicitly list the allowed kinds 367 // (all node matcher types except for `QualType` and `Type`), rather than just 368 // banning `QualType` and `Type`. 369 static bool hasValidKind(const DynTypedMatcher &M) { 370 return !M.canConvertTo<QualType>(); 371 } 372 #endif 373 374 // Binds each rule's matcher to a unique (and deterministic) tag based on 375 // `TagBase` and the id paired with the case. All of the returned matchers have 376 // their traversal kind explicitly set, either based on a pre-set kind or to the 377 // provided `DefaultTraversalKind`. 378 static std::vector<DynTypedMatcher> taggedMatchers( 379 StringRef TagBase, 380 const SmallVectorImpl<std::pair<size_t, RewriteRule::Case>> &Cases, 381 TraversalKind DefaultTraversalKind) { 382 std::vector<DynTypedMatcher> Matchers; 383 Matchers.reserve(Cases.size()); 384 for (const auto &Case : Cases) { 385 std::string Tag = (TagBase + Twine(Case.first)).str(); 386 // HACK: Many matchers are not bindable, so ensure that tryBind will work. 387 DynTypedMatcher BoundMatcher(Case.second.Matcher); 388 BoundMatcher.setAllowBind(true); 389 auto M = *BoundMatcher.tryBind(Tag); 390 Matchers.push_back(!M.getTraversalKind() 391 ? M.withTraversalKind(DefaultTraversalKind) 392 : std::move(M)); 393 } 394 return Matchers; 395 } 396 397 // Simply gathers the contents of the various rules into a single rule. The 398 // actual work to combine these into an ordered choice is deferred to matcher 399 // registration. 400 template <> 401 RewriteRuleWith<void> 402 transformer::applyFirst(ArrayRef<RewriteRuleWith<void>> Rules) { 403 RewriteRule R; 404 for (auto &Rule : Rules) 405 R.Cases.append(Rule.Cases.begin(), Rule.Cases.end()); 406 return R; 407 } 408 409 std::vector<DynTypedMatcher> 410 transformer::detail::buildMatchers(const RewriteRuleBase &Rule) { 411 // Map the cases into buckets of matchers -- one for each "root" AST kind, 412 // which guarantees that they can be combined in a single anyOf matcher. Each 413 // case is paired with an identifying number that is converted to a string id 414 // in `taggedMatchers`. 415 std::map<ASTNodeKind, 416 SmallVector<std::pair<size_t, RewriteRuleBase::Case>, 1>> 417 Buckets; 418 const SmallVectorImpl<RewriteRule::Case> &Cases = Rule.Cases; 419 for (int I = 0, N = Cases.size(); I < N; ++I) { 420 assert(hasValidKind(Cases[I].Matcher) && 421 "Matcher must be non-(Qual)Type node matcher"); 422 Buckets[Cases[I].Matcher.getSupportedKind()].emplace_back(I, Cases[I]); 423 } 424 425 // Each anyOf explicitly controls the traversal kind. The anyOf itself is set 426 // to `TK_AsIs` to ensure no nodes are skipped, thereby deferring to the kind 427 // of the branches. Then, each branch is either left as is, if the kind is 428 // already set, or explicitly set to `TK_AsIs`. We choose this setting because 429 // it is the default interpretation of matchers. 430 std::vector<DynTypedMatcher> Matchers; 431 for (const auto &Bucket : Buckets) { 432 DynTypedMatcher M = DynTypedMatcher::constructVariadic( 433 DynTypedMatcher::VO_AnyOf, Bucket.first, 434 taggedMatchers("Tag", Bucket.second, TK_AsIs)); 435 M.setAllowBind(true); 436 // `tryBind` is guaranteed to succeed, because `AllowBind` was set to true. 437 Matchers.push_back(M.tryBind(RootID)->withTraversalKind(TK_AsIs)); 438 } 439 return Matchers; 440 } 441 442 DynTypedMatcher transformer::detail::buildMatcher(const RewriteRuleBase &Rule) { 443 std::vector<DynTypedMatcher> Ms = buildMatchers(Rule); 444 assert(Ms.size() == 1 && "Cases must have compatible matchers."); 445 return Ms[0]; 446 } 447 448 SourceLocation transformer::detail::getRuleMatchLoc(const MatchResult &Result) { 449 auto &NodesMap = Result.Nodes.getMap(); 450 auto Root = NodesMap.find(RootID); 451 assert(Root != NodesMap.end() && "Transformation failed: missing root node."); 452 std::optional<CharSourceRange> RootRange = tooling::getFileRangeForEdit( 453 CharSourceRange::getTokenRange(Root->second.getSourceRange()), 454 *Result.Context); 455 if (RootRange) 456 return RootRange->getBegin(); 457 // The match doesn't have a coherent range, so fall back to the expansion 458 // location as the "beginning" of the match. 459 return Result.SourceManager->getExpansionLoc( 460 Root->second.getSourceRange().getBegin()); 461 } 462 463 // Finds the case that was "selected" -- that is, whose matcher triggered the 464 // `MatchResult`. 465 size_t transformer::detail::findSelectedCase(const MatchResult &Result, 466 const RewriteRuleBase &Rule) { 467 if (Rule.Cases.size() == 1) 468 return 0; 469 470 auto &NodesMap = Result.Nodes.getMap(); 471 for (size_t i = 0, N = Rule.Cases.size(); i < N; ++i) { 472 std::string Tag = ("Tag" + Twine(i)).str(); 473 if (NodesMap.find(Tag) != NodesMap.end()) 474 return i; 475 } 476 llvm_unreachable("No tag found for this rule."); 477 } 478