1 //===--- Transformer.cpp - Transformer library implementation ---*- C++ -*-===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 9 #include "clang/Tooling/Transformer/RewriteRule.h" 10 #include "clang/AST/ASTTypeTraits.h" 11 #include "clang/AST/Stmt.h" 12 #include "clang/ASTMatchers/ASTMatchFinder.h" 13 #include "clang/ASTMatchers/ASTMatchers.h" 14 #include "clang/Basic/SourceLocation.h" 15 #include "clang/Tooling/Transformer/SourceCode.h" 16 #include "llvm/ADT/Optional.h" 17 #include "llvm/ADT/StringRef.h" 18 #include "llvm/Support/Errc.h" 19 #include "llvm/Support/Error.h" 20 #include <map> 21 #include <string> 22 #include <utility> 23 #include <vector> 24 25 using namespace clang; 26 using namespace transformer; 27 28 using ast_matchers::MatchFinder; 29 using ast_matchers::internal::DynTypedMatcher; 30 31 using MatchResult = MatchFinder::MatchResult; 32 33 const char transformer::RootID[] = "___root___"; 34 35 static Expected<SmallVector<transformer::Edit, 1>> 36 translateEdits(const MatchResult &Result, ArrayRef<ASTEdit> ASTEdits) { 37 SmallVector<transformer::Edit, 1> Edits; 38 for (const auto &E : ASTEdits) { 39 Expected<CharSourceRange> Range = E.TargetRange(Result); 40 if (!Range) 41 return Range.takeError(); 42 llvm::Optional<CharSourceRange> EditRange = 43 tooling::getRangeForEdit(*Range, *Result.Context); 44 // FIXME: let user specify whether to treat this case as an error or ignore 45 // it as is currently done. 46 if (!EditRange) 47 return SmallVector<Edit, 0>(); 48 auto Replacement = E.Replacement->eval(Result); 49 if (!Replacement) 50 return Replacement.takeError(); 51 auto Metadata = E.Metadata(Result); 52 if (!Metadata) 53 return Metadata.takeError(); 54 transformer::Edit T; 55 T.Kind = E.Kind; 56 T.Range = *EditRange; 57 T.Replacement = std::move(*Replacement); 58 T.Metadata = std::move(*Metadata); 59 Edits.push_back(std::move(T)); 60 } 61 return Edits; 62 } 63 64 EditGenerator transformer::editList(SmallVector<ASTEdit, 1> Edits) { 65 return [Edits = std::move(Edits)](const MatchResult &Result) { 66 return translateEdits(Result, Edits); 67 }; 68 } 69 70 EditGenerator transformer::edit(ASTEdit Edit) { 71 return [Edit = std::move(Edit)](const MatchResult &Result) { 72 return translateEdits(Result, {Edit}); 73 }; 74 } 75 76 EditGenerator transformer::noopEdit(RangeSelector Anchor) { 77 return [Anchor = std::move(Anchor)](const MatchResult &Result) 78 -> Expected<SmallVector<transformer::Edit, 1>> { 79 Expected<CharSourceRange> Range = Anchor(Result); 80 if (!Range) 81 return Range.takeError(); 82 // In case the range is inside a macro expansion, map the location back to a 83 // "real" source location. 84 SourceLocation Begin = 85 Result.SourceManager->getSpellingLoc(Range->getBegin()); 86 Edit E; 87 // Implicitly, leave `E.Replacement` as the empty string. 88 E.Kind = EditKind::Range; 89 E.Range = CharSourceRange::getCharRange(Begin, Begin); 90 return SmallVector<Edit, 1>{E}; 91 }; 92 } 93 94 EditGenerator 95 transformer::flattenVector(SmallVector<EditGenerator, 2> Generators) { 96 if (Generators.size() == 1) 97 return std::move(Generators[0]); 98 return 99 [Gs = std::move(Generators)]( 100 const MatchResult &Result) -> llvm::Expected<SmallVector<Edit, 1>> { 101 SmallVector<Edit, 1> AllEdits; 102 for (const auto &G : Gs) { 103 llvm::Expected<SmallVector<Edit, 1>> Edits = G(Result); 104 if (!Edits) 105 return Edits.takeError(); 106 AllEdits.append(Edits->begin(), Edits->end()); 107 } 108 return AllEdits; 109 }; 110 } 111 112 ASTEdit transformer::changeTo(RangeSelector Target, TextGenerator Replacement) { 113 ASTEdit E; 114 E.TargetRange = std::move(Target); 115 E.Replacement = std::move(Replacement); 116 return E; 117 } 118 119 namespace { 120 /// A \c TextGenerator that always returns a fixed string. 121 class SimpleTextGenerator : public MatchComputation<std::string> { 122 std::string S; 123 124 public: 125 SimpleTextGenerator(std::string S) : S(std::move(S)) {} 126 llvm::Error eval(const ast_matchers::MatchFinder::MatchResult &, 127 std::string *Result) const override { 128 Result->append(S); 129 return llvm::Error::success(); 130 } 131 std::string toString() const override { 132 return (llvm::Twine("text(\"") + S + "\")").str(); 133 } 134 }; 135 } // namespace 136 137 static TextGenerator makeText(std::string S) { 138 return std::make_shared<SimpleTextGenerator>(std::move(S)); 139 } 140 141 ASTEdit transformer::remove(RangeSelector S) { 142 return change(std::move(S), makeText("")); 143 } 144 145 static std::string formatHeaderPath(StringRef Header, IncludeFormat Format) { 146 switch (Format) { 147 case transformer::IncludeFormat::Quoted: 148 return Header.str(); 149 case transformer::IncludeFormat::Angled: 150 return ("<" + Header + ">").str(); 151 } 152 llvm_unreachable("Unknown transformer::IncludeFormat enum"); 153 } 154 155 ASTEdit transformer::addInclude(RangeSelector Target, StringRef Header, 156 IncludeFormat Format) { 157 ASTEdit E; 158 E.Kind = EditKind::AddInclude; 159 E.TargetRange = Target; 160 E.Replacement = makeText(formatHeaderPath(Header, Format)); 161 return E; 162 } 163 164 RewriteRule transformer::makeRule(DynTypedMatcher M, EditGenerator Edits, 165 TextGenerator Explanation) { 166 return RewriteRule{{RewriteRule::Case{std::move(M), std::move(Edits), 167 std::move(Explanation)}}}; 168 } 169 170 namespace { 171 172 /// Unconditionally binds the given node set before trying `InnerMatcher` and 173 /// keeps the bound nodes on a successful match. 174 template <typename T> 175 class BindingsMatcher : public ast_matchers::internal::MatcherInterface<T> { 176 ast_matchers::BoundNodes Nodes; 177 const ast_matchers::internal::Matcher<T> InnerMatcher; 178 179 public: 180 explicit BindingsMatcher(ast_matchers::BoundNodes Nodes, 181 ast_matchers::internal::Matcher<T> InnerMatcher) 182 : Nodes(std::move(Nodes)), InnerMatcher(std::move(InnerMatcher)) {} 183 184 bool matches( 185 const T &Node, ast_matchers::internal::ASTMatchFinder *Finder, 186 ast_matchers::internal::BoundNodesTreeBuilder *Builder) const override { 187 ast_matchers::internal::BoundNodesTreeBuilder Result(*Builder); 188 for (const auto &N : Nodes.getMap()) 189 Result.setBinding(N.first, N.second); 190 if (InnerMatcher.matches(Node, Finder, &Result)) { 191 *Builder = std::move(Result); 192 return true; 193 } 194 return false; 195 } 196 }; 197 198 /// Matches nodes of type T that have at least one descendant node for which the 199 /// given inner matcher matches. Will match for each descendant node that 200 /// matches. Based on ForEachDescendantMatcher, but takes a dynamic matcher, 201 /// instead of a static one, because it is used by RewriteRule, which carries 202 /// (only top-level) dynamic matchers. 203 template <typename T> 204 class DynamicForEachDescendantMatcher 205 : public ast_matchers::internal::MatcherInterface<T> { 206 const DynTypedMatcher DescendantMatcher; 207 208 public: 209 explicit DynamicForEachDescendantMatcher(DynTypedMatcher DescendantMatcher) 210 : DescendantMatcher(std::move(DescendantMatcher)) {} 211 212 bool matches( 213 const T &Node, ast_matchers::internal::ASTMatchFinder *Finder, 214 ast_matchers::internal::BoundNodesTreeBuilder *Builder) const override { 215 return Finder->matchesDescendantOf( 216 Node, this->DescendantMatcher, Builder, 217 ast_matchers::internal::ASTMatchFinder::BK_All); 218 } 219 }; 220 221 template <typename T> 222 ast_matchers::internal::Matcher<T> 223 forEachDescendantDynamically(ast_matchers::BoundNodes Nodes, 224 DynTypedMatcher M) { 225 return ast_matchers::internal::makeMatcher(new BindingsMatcher<T>( 226 std::move(Nodes), 227 ast_matchers::internal::makeMatcher( 228 new DynamicForEachDescendantMatcher<T>(std::move(M))))); 229 } 230 231 class ApplyRuleCallback : public MatchFinder::MatchCallback { 232 public: 233 ApplyRuleCallback(RewriteRule Rule) : Rule(std::move(Rule)) {} 234 235 template <typename T> 236 void registerMatchers(const ast_matchers::BoundNodes &Nodes, 237 MatchFinder *MF) { 238 for (auto &Matcher : transformer::detail::buildMatchers(Rule)) 239 MF->addMatcher(forEachDescendantDynamically<T>(Nodes, Matcher), this); 240 } 241 242 void run(const MatchFinder::MatchResult &Result) override { 243 if (!Edits) 244 return; 245 transformer::RewriteRule::Case Case = 246 transformer::detail::findSelectedCase(Result, Rule); 247 auto Transformations = Case.Edits(Result); 248 if (!Transformations) { 249 Edits = Transformations.takeError(); 250 return; 251 } 252 Edits->append(Transformations->begin(), Transformations->end()); 253 } 254 255 RewriteRule Rule; 256 257 // Initialize to a non-error state. 258 Expected<SmallVector<Edit, 1>> Edits = SmallVector<Edit, 1>(); 259 }; 260 } // namespace 261 262 template <typename T> 263 llvm::Expected<SmallVector<clang::transformer::Edit, 1>> 264 rewriteDescendantsImpl(const T &Node, RewriteRule Rule, 265 const MatchResult &Result) { 266 ApplyRuleCallback Callback(std::move(Rule)); 267 MatchFinder Finder; 268 Callback.registerMatchers<T>(Result.Nodes, &Finder); 269 Finder.match(Node, *Result.Context); 270 return std::move(Callback.Edits); 271 } 272 273 llvm::Expected<SmallVector<clang::transformer::Edit, 1>> 274 transformer::detail::rewriteDescendants(const Decl &Node, RewriteRule Rule, 275 const MatchResult &Result) { 276 return rewriteDescendantsImpl(Node, std::move(Rule), Result); 277 } 278 279 llvm::Expected<SmallVector<clang::transformer::Edit, 1>> 280 transformer::detail::rewriteDescendants(const Stmt &Node, RewriteRule Rule, 281 const MatchResult &Result) { 282 return rewriteDescendantsImpl(Node, std::move(Rule), Result); 283 } 284 285 llvm::Expected<SmallVector<clang::transformer::Edit, 1>> 286 transformer::detail::rewriteDescendants(const TypeLoc &Node, RewriteRule Rule, 287 const MatchResult &Result) { 288 return rewriteDescendantsImpl(Node, std::move(Rule), Result); 289 } 290 291 llvm::Expected<SmallVector<clang::transformer::Edit, 1>> 292 transformer::detail::rewriteDescendants(const DynTypedNode &DNode, 293 RewriteRule Rule, 294 const MatchResult &Result) { 295 if (const auto *Node = DNode.get<Decl>()) 296 return rewriteDescendantsImpl(*Node, std::move(Rule), Result); 297 if (const auto *Node = DNode.get<Stmt>()) 298 return rewriteDescendantsImpl(*Node, std::move(Rule), Result); 299 if (const auto *Node = DNode.get<TypeLoc>()) 300 return rewriteDescendantsImpl(*Node, std::move(Rule), Result); 301 302 return llvm::make_error<llvm::StringError>( 303 llvm::errc::invalid_argument, 304 "type unsupported for recursive rewriting, Kind=" + 305 DNode.getNodeKind().asStringRef()); 306 } 307 308 EditGenerator transformer::rewriteDescendants(std::string NodeId, 309 RewriteRule Rule) { 310 return [NodeId = std::move(NodeId), 311 Rule = std::move(Rule)](const MatchResult &Result) 312 -> llvm::Expected<SmallVector<clang::transformer::Edit, 1>> { 313 const ast_matchers::BoundNodes::IDToNodeMap &NodesMap = 314 Result.Nodes.getMap(); 315 auto It = NodesMap.find(NodeId); 316 if (It == NodesMap.end()) 317 return llvm::make_error<llvm::StringError>(llvm::errc::invalid_argument, 318 "ID not bound: " + NodeId); 319 return detail::rewriteDescendants(It->second, std::move(Rule), Result); 320 }; 321 } 322 323 void transformer::addInclude(RewriteRule &Rule, StringRef Header, 324 IncludeFormat Format) { 325 for (auto &Case : Rule.Cases) 326 Case.Edits = flatten(std::move(Case.Edits), addInclude(Header, Format)); 327 } 328 329 #ifndef NDEBUG 330 // Filters for supported matcher kinds. FIXME: Explicitly list the allowed kinds 331 // (all node matcher types except for `QualType` and `Type`), rather than just 332 // banning `QualType` and `Type`. 333 static bool hasValidKind(const DynTypedMatcher &M) { 334 return !M.canConvertTo<QualType>(); 335 } 336 #endif 337 338 // Binds each rule's matcher to a unique (and deterministic) tag based on 339 // `TagBase` and the id paired with the case. All of the returned matchers have 340 // their traversal kind explicitly set, either based on a pre-set kind or to the 341 // provided `DefaultTraversalKind`. 342 static std::vector<DynTypedMatcher> taggedMatchers( 343 StringRef TagBase, 344 const SmallVectorImpl<std::pair<size_t, RewriteRule::Case>> &Cases, 345 ast_type_traits::TraversalKind DefaultTraversalKind) { 346 std::vector<DynTypedMatcher> Matchers; 347 Matchers.reserve(Cases.size()); 348 for (const auto &Case : Cases) { 349 std::string Tag = (TagBase + Twine(Case.first)).str(); 350 // HACK: Many matchers are not bindable, so ensure that tryBind will work. 351 DynTypedMatcher BoundMatcher(Case.second.Matcher); 352 BoundMatcher.setAllowBind(true); 353 auto M = *BoundMatcher.tryBind(Tag); 354 Matchers.push_back(!M.getTraversalKind() 355 ? M.withTraversalKind(DefaultTraversalKind) 356 : std::move(M)); 357 } 358 return Matchers; 359 } 360 361 // Simply gathers the contents of the various rules into a single rule. The 362 // actual work to combine these into an ordered choice is deferred to matcher 363 // registration. 364 RewriteRule transformer::applyFirst(ArrayRef<RewriteRule> Rules) { 365 RewriteRule R; 366 for (auto &Rule : Rules) 367 R.Cases.append(Rule.Cases.begin(), Rule.Cases.end()); 368 return R; 369 } 370 371 std::vector<DynTypedMatcher> 372 transformer::detail::buildMatchers(const RewriteRule &Rule) { 373 // Map the cases into buckets of matchers -- one for each "root" AST kind, 374 // which guarantees that they can be combined in a single anyOf matcher. Each 375 // case is paired with an identifying number that is converted to a string id 376 // in `taggedMatchers`. 377 std::map<ASTNodeKind, SmallVector<std::pair<size_t, RewriteRule::Case>, 1>> 378 Buckets; 379 const SmallVectorImpl<RewriteRule::Case> &Cases = Rule.Cases; 380 for (int I = 0, N = Cases.size(); I < N; ++I) { 381 assert(hasValidKind(Cases[I].Matcher) && 382 "Matcher must be non-(Qual)Type node matcher"); 383 Buckets[Cases[I].Matcher.getSupportedKind()].emplace_back(I, Cases[I]); 384 } 385 386 // Each anyOf explicitly controls the traversal kind. The anyOf itself is set 387 // to `TK_AsIs` to ensure no nodes are skipped, thereby deferring to the kind 388 // of the branches. Then, each branch is either left as is, if the kind is 389 // already set, or explicitly set to `TK_AsIs`. We choose this setting because 390 // it is the default interpretation of matchers. 391 std::vector<DynTypedMatcher> Matchers; 392 for (const auto &Bucket : Buckets) { 393 DynTypedMatcher M = DynTypedMatcher::constructVariadic( 394 DynTypedMatcher::VO_AnyOf, Bucket.first, 395 taggedMatchers("Tag", Bucket.second, TK_AsIs)); 396 M.setAllowBind(true); 397 // `tryBind` is guaranteed to succeed, because `AllowBind` was set to true. 398 Matchers.push_back(M.tryBind(RootID)->withTraversalKind(TK_AsIs)); 399 } 400 return Matchers; 401 } 402 403 DynTypedMatcher transformer::detail::buildMatcher(const RewriteRule &Rule) { 404 std::vector<DynTypedMatcher> Ms = buildMatchers(Rule); 405 assert(Ms.size() == 1 && "Cases must have compatible matchers."); 406 return Ms[0]; 407 } 408 409 SourceLocation transformer::detail::getRuleMatchLoc(const MatchResult &Result) { 410 auto &NodesMap = Result.Nodes.getMap(); 411 auto Root = NodesMap.find(RootID); 412 assert(Root != NodesMap.end() && "Transformation failed: missing root node."); 413 llvm::Optional<CharSourceRange> RootRange = tooling::getRangeForEdit( 414 CharSourceRange::getTokenRange(Root->second.getSourceRange()), 415 *Result.Context); 416 if (RootRange) 417 return RootRange->getBegin(); 418 // The match doesn't have a coherent range, so fall back to the expansion 419 // location as the "beginning" of the match. 420 return Result.SourceManager->getExpansionLoc( 421 Root->second.getSourceRange().getBegin()); 422 } 423 424 // Finds the case that was "selected" -- that is, whose matcher triggered the 425 // `MatchResult`. 426 const RewriteRule::Case & 427 transformer::detail::findSelectedCase(const MatchResult &Result, 428 const RewriteRule &Rule) { 429 if (Rule.Cases.size() == 1) 430 return Rule.Cases[0]; 431 432 auto &NodesMap = Result.Nodes.getMap(); 433 for (size_t i = 0, N = Rule.Cases.size(); i < N; ++i) { 434 std::string Tag = ("Tag" + Twine(i)).str(); 435 if (NodesMap.find(Tag) != NodesMap.end()) 436 return Rule.Cases[i]; 437 } 438 llvm_unreachable("No tag found for this rule."); 439 } 440 441 const llvm::StringRef RewriteRule::RootID = ::clang::transformer::RootID; 442