19b3f38f9SIlya Biryukov //===- BuildTree.cpp ------------------------------------------*- C++ -*-=====// 29b3f38f9SIlya Biryukov // 39b3f38f9SIlya Biryukov // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 49b3f38f9SIlya Biryukov // See https://llvm.org/LICENSE.txt for license information. 59b3f38f9SIlya Biryukov // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 69b3f38f9SIlya Biryukov // 79b3f38f9SIlya Biryukov //===----------------------------------------------------------------------===// 89b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/BuildTree.h" 97d382dcdSMarcel Hlopko #include "clang/AST/ASTFwd.h" 10e702bdb8SIlya Biryukov #include "clang/AST/Decl.h" 11e702bdb8SIlya Biryukov #include "clang/AST/DeclBase.h" 127d382dcdSMarcel Hlopko #include "clang/AST/DeclCXX.h" 137d382dcdSMarcel Hlopko #include "clang/AST/DeclarationName.h" 149b3f38f9SIlya Biryukov #include "clang/AST/RecursiveASTVisitor.h" 159b3f38f9SIlya Biryukov #include "clang/AST/Stmt.h" 167d382dcdSMarcel Hlopko #include "clang/AST/TypeLoc.h" 177d382dcdSMarcel Hlopko #include "clang/AST/TypeLocVisitor.h" 189b3f38f9SIlya Biryukov #include "clang/Basic/LLVM.h" 199b3f38f9SIlya Biryukov #include "clang/Basic/SourceLocation.h" 209b3f38f9SIlya Biryukov #include "clang/Basic/SourceManager.h" 2188bf9b3dSMarcel Hlopko #include "clang/Basic/Specifiers.h" 229b3f38f9SIlya Biryukov #include "clang/Basic/TokenKinds.h" 239b3f38f9SIlya Biryukov #include "clang/Lex/Lexer.h" 249b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/Nodes.h" 259b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/Tokens.h" 269b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/Tree.h" 279b3f38f9SIlya Biryukov #include "llvm/ADT/ArrayRef.h" 28a711a3a4SMarcel Hlopko #include "llvm/ADT/DenseMap.h" 29a711a3a4SMarcel Hlopko #include "llvm/ADT/PointerUnion.h" 309b3f38f9SIlya Biryukov #include "llvm/ADT/STLExtras.h" 317d382dcdSMarcel Hlopko #include "llvm/ADT/ScopeExit.h" 329b3f38f9SIlya Biryukov 
#include "llvm/ADT/SmallVector.h"
#include "llvm/Support/Allocator.h"
#include "llvm/Support/Casting.h"
#include "llvm/Support/Compiler.h"
#include "llvm/Support/FormatVariadic.h"
#include "llvm/Support/MemoryBuffer.h"
#include "llvm/Support/raw_ostream.h"
#include <cstddef>
#include <map>

using namespace clang;

/// Returns true when stripping implicit nodes from \p E yields a different
/// expression, i.e. when E->IgnoreImplicit() is not \p E itself.
LLVM_ATTRIBUTE_UNUSED
static bool isImplicitExpr(clang::Expr *E) {
  clang::Expr *Unwrapped = E->IgnoreImplicit();
  return Unwrapped != E;
}

namespace {
/// Computes the location at which a declarator starts, given its TypeLoc.
/// Examples:
///     loc of `(` in `int (a)`
///     loc of `*` in `int *(a)`
///     loc of the first `(` in `int (*a)(int)`
///     loc of the `*` in `int *(a)(int)`
///     loc of the first `*` in `const int *const *volatile a;`
///
/// The computation is not trivial because TypeLocs are stored inside out: in
/// the last example `*volatile` is the TypeLoc returned by
/// `Decl.getTypeSourceInfo()`, and `*const` is what `.getPointeeLoc()`
/// returns. An invalid SourceLocation is returned when no part of the type
/// starts the declarator.
struct GetStartLoc : TypeLocVisitor<GetStartLoc, SourceLocation> {
  /// Prefers a start found inside the parentheses; otherwise the `(` itself
  /// starts the declarator.
  SourceLocation VisitParenTypeLoc(ParenTypeLoc T) {
    const SourceLocation InnerStart = Visit(T.getInnerLoc());
    return InnerStart.isValid() ? InnerStart : T.getLParenLoc();
  }

  // Types spelled in the prefix part of the declarator. All of them share the
  // same logic, see HandlePointer().
  SourceLocation VisitPointerTypeLoc(PointerTypeLoc T) {
    return HandlePointer(T);
  }

  SourceLocation VisitMemberPointerTypeLoc(MemberPointerTypeLoc T) {
    return HandlePointer(T);
  }

  SourceLocation VisitBlockPointerTypeLoc(BlockPointerTypeLoc T) {
    return HandlePointer(T);
  }

  SourceLocation VisitReferenceTypeLoc(ReferenceTypeLoc T) {
    return HandlePointer(T);
  }

  SourceLocation VisitObjCObjectPointerTypeLoc(ObjCObjectPointerTypeLoc T) {
    return HandlePointer(T);
  }

  // Every remaining kind of TypeLoc is either part of the declaration
  // specifiers (e.g. inheritors of TypeSpecTypeLoc) or adds modifiers to an
  // existing declarator (e.g. QualifiedTypeLoc). Such a TypeLoc cannot start
  // the declarator itself, but its underlying type can, so keep descending.
  SourceLocation VisitTypeLoc(TypeLoc T) {
    TypeLoc Next = T.getNextTypeLoc();
    return Next ? Visit(Next) : SourceLocation();
  }

  SourceLocation VisitFunctionProtoTypeLoc(FunctionProtoTypeLoc T) {
    // With a trailing return type we must not recurse: that would walk into
    // the suffix of the declarator.
    return T.getTypePtr()->hasTrailingReturn() ? SourceLocation()
                                               : VisitTypeLoc(T);
  }

private:
  /// Shared logic for pointer-like TypeLocs: a start found in the pointee
  /// wins, otherwise the pointer-like TypeLoc's own local range begins the
  /// declarator.
  template <class PtrLoc> SourceLocation HandlePointer(PtrLoc T) {
    const SourceLocation PointeeStart = Visit(T.getPointeeLoc());
    return PointeeStart.isValid() ? PointeeStart
                                  : T.getLocalSourceRange().getBegin();
  }
};
} // namespace

/// Gets the range of declarator as defined by the C++ grammar. E.g.
///     `int a;` -> range of `a`,
///     `int *a;` -> range of `*a`,
///     `int a[10];` -> range of `a[10]`,
///     `int a[1][2][3];` -> range of `a[1][2][3]`,
///     `int *a = nullptr` -> range of `*a = nullptr`.
/// FIXME: \p Name must be a source range, e.g. for `operator+`.
1237d382dcdSMarcel Hlopko static SourceRange getDeclaratorRange(const SourceManager &SM, TypeLoc T, 1247d382dcdSMarcel Hlopko SourceLocation Name, 1257d382dcdSMarcel Hlopko SourceRange Initializer) { 1267d382dcdSMarcel Hlopko SourceLocation Start = GetStartLoc().Visit(T); 1277d382dcdSMarcel Hlopko SourceLocation End = T.getSourceRange().getEnd(); 1287d382dcdSMarcel Hlopko assert(End.isValid()); 1297d382dcdSMarcel Hlopko if (Name.isValid()) { 1307d382dcdSMarcel Hlopko if (Start.isInvalid()) 1317d382dcdSMarcel Hlopko Start = Name; 1327d382dcdSMarcel Hlopko if (SM.isBeforeInTranslationUnit(End, Name)) 1337d382dcdSMarcel Hlopko End = Name; 1347d382dcdSMarcel Hlopko } 1357d382dcdSMarcel Hlopko if (Initializer.isValid()) { 136*cdce2fe5SMarcel Hlopko auto InitializerEnd = Initializer.getEnd(); 137*cdce2fe5SMarcel Hlopko assert(SM.isBeforeInTranslationUnit(End, InitializerEnd) || End == InitializerEnd); 138*cdce2fe5SMarcel Hlopko End = InitializerEnd; 1397d382dcdSMarcel Hlopko } 1407d382dcdSMarcel Hlopko return SourceRange(Start, End); 1417d382dcdSMarcel Hlopko } 1427d382dcdSMarcel Hlopko 143a711a3a4SMarcel Hlopko namespace { 144a711a3a4SMarcel Hlopko /// All AST hierarchy roots that can be represented as pointers. 145a711a3a4SMarcel Hlopko using ASTPtr = llvm::PointerUnion<Stmt *, Decl *>; 146a711a3a4SMarcel Hlopko /// Maintains a mapping from AST to syntax tree nodes. This class will get more 147a711a3a4SMarcel Hlopko /// complicated as we support more kinds of AST nodes, e.g. TypeLocs. 148a711a3a4SMarcel Hlopko /// FIXME: expose this as public API. 
149a711a3a4SMarcel Hlopko class ASTToSyntaxMapping { 150a711a3a4SMarcel Hlopko public: 151a711a3a4SMarcel Hlopko void add(ASTPtr From, syntax::Tree *To) { 152a711a3a4SMarcel Hlopko assert(To != nullptr); 153a711a3a4SMarcel Hlopko assert(!From.isNull()); 154a711a3a4SMarcel Hlopko 155a711a3a4SMarcel Hlopko bool Added = Nodes.insert({From, To}).second; 156a711a3a4SMarcel Hlopko (void)Added; 157a711a3a4SMarcel Hlopko assert(Added && "mapping added twice"); 158a711a3a4SMarcel Hlopko } 159a711a3a4SMarcel Hlopko 160a711a3a4SMarcel Hlopko syntax::Tree *find(ASTPtr P) const { return Nodes.lookup(P); } 161a711a3a4SMarcel Hlopko 162a711a3a4SMarcel Hlopko private: 163a711a3a4SMarcel Hlopko llvm::DenseMap<ASTPtr, syntax::Tree *> Nodes; 164a711a3a4SMarcel Hlopko }; 165a711a3a4SMarcel Hlopko } // namespace 166a711a3a4SMarcel Hlopko 1679b3f38f9SIlya Biryukov /// A helper class for constructing the syntax tree while traversing a clang 1689b3f38f9SIlya Biryukov /// AST. 1699b3f38f9SIlya Biryukov /// 1709b3f38f9SIlya Biryukov /// At each point of the traversal we maintain a list of pending nodes. 1719b3f38f9SIlya Biryukov /// Initially all tokens are added as pending nodes. When processing a clang AST 1729b3f38f9SIlya Biryukov /// node, the clients need to: 1739b3f38f9SIlya Biryukov /// - create a corresponding syntax node, 1749b3f38f9SIlya Biryukov /// - assign roles to all pending child nodes with 'markChild' and 1759b3f38f9SIlya Biryukov /// 'markChildToken', 1769b3f38f9SIlya Biryukov /// - replace the child nodes with the new syntax node in the pending list 1779b3f38f9SIlya Biryukov /// with 'foldNode'. 1789b3f38f9SIlya Biryukov /// 1799b3f38f9SIlya Biryukov /// Note that all children are expected to be processed when building a node. 1809b3f38f9SIlya Biryukov /// 1819b3f38f9SIlya Biryukov /// Call finalize() to finish building the tree and consume the root node. 
1829b3f38f9SIlya Biryukov class syntax::TreeBuilder { 1839b3f38f9SIlya Biryukov public: 184c1bbefefSIlya Biryukov TreeBuilder(syntax::Arena &Arena) : Arena(Arena), Pending(Arena) { 185c1bbefefSIlya Biryukov for (const auto &T : Arena.tokenBuffer().expandedTokens()) 186c1bbefefSIlya Biryukov LocationToToken.insert({T.location().getRawEncoding(), &T}); 187c1bbefefSIlya Biryukov } 1889b3f38f9SIlya Biryukov 1899b3f38f9SIlya Biryukov llvm::BumpPtrAllocator &allocator() { return Arena.allocator(); } 1907d382dcdSMarcel Hlopko const SourceManager &sourceManager() const { return Arena.sourceManager(); } 1919b3f38f9SIlya Biryukov 1929b3f38f9SIlya Biryukov /// Populate children for \p New node, assuming it covers tokens from \p 1939b3f38f9SIlya Biryukov /// Range. 194a711a3a4SMarcel Hlopko void foldNode(llvm::ArrayRef<syntax::Token> Range, syntax::Tree *New, 195a711a3a4SMarcel Hlopko ASTPtr From) { 196a711a3a4SMarcel Hlopko assert(New); 197a711a3a4SMarcel Hlopko Pending.foldChildren(Arena, Range, New); 198a711a3a4SMarcel Hlopko if (From) 199a711a3a4SMarcel Hlopko Mapping.add(From, New); 200a711a3a4SMarcel Hlopko } 201a711a3a4SMarcel Hlopko void foldNode(llvm::ArrayRef<syntax::Token> Range, syntax::Tree *New, 202a711a3a4SMarcel Hlopko TypeLoc L) { 203a711a3a4SMarcel Hlopko // FIXME: add mapping for TypeLocs 204a711a3a4SMarcel Hlopko foldNode(Range, New, nullptr); 205a711a3a4SMarcel Hlopko } 2069b3f38f9SIlya Biryukov 207e702bdb8SIlya Biryukov /// Notifies that we should not consume trailing semicolon when computing 208e702bdb8SIlya Biryukov /// token range of \p D. 2097d382dcdSMarcel Hlopko void noticeDeclWithoutSemicolon(Decl *D); 210e702bdb8SIlya Biryukov 21158fa50f4SIlya Biryukov /// Mark the \p Child node with a corresponding \p Role. All marked children 21258fa50f4SIlya Biryukov /// should be consumed by foldNode. 
2137d382dcdSMarcel Hlopko /// When called on expressions (clang::Expr is derived from clang::Stmt), 21458fa50f4SIlya Biryukov /// wraps expressions into expression statement. 21558fa50f4SIlya Biryukov void markStmtChild(Stmt *Child, NodeRole Role); 21658fa50f4SIlya Biryukov /// Should be called for expressions in non-statement position to avoid 21758fa50f4SIlya Biryukov /// wrapping into expression statement. 21858fa50f4SIlya Biryukov void markExprChild(Expr *Child, NodeRole Role); 2199b3f38f9SIlya Biryukov /// Set role for a token starting at \p Loc. 220def65bb4SIlya Biryukov void markChildToken(SourceLocation Loc, NodeRole R); 2217d382dcdSMarcel Hlopko /// Set role for \p T. 2227d382dcdSMarcel Hlopko void markChildToken(const syntax::Token *T, NodeRole R); 2237d382dcdSMarcel Hlopko 224a711a3a4SMarcel Hlopko /// Set role for \p N. 225a711a3a4SMarcel Hlopko void markChild(syntax::Node *N, NodeRole R); 226a711a3a4SMarcel Hlopko /// Set role for the syntax node matching \p N. 227a711a3a4SMarcel Hlopko void markChild(ASTPtr N, NodeRole R); 2289b3f38f9SIlya Biryukov 2299b3f38f9SIlya Biryukov /// Finish building the tree and consume the root node. 2309b3f38f9SIlya Biryukov syntax::TranslationUnit *finalize() && { 2319b3f38f9SIlya Biryukov auto Tokens = Arena.tokenBuffer().expandedTokens(); 232bfbf6b6cSIlya Biryukov assert(!Tokens.empty()); 233bfbf6b6cSIlya Biryukov assert(Tokens.back().kind() == tok::eof); 234bfbf6b6cSIlya Biryukov 2359b3f38f9SIlya Biryukov // Build the root of the tree, consuming all the children. 
2361ad15046SIlya Biryukov Pending.foldChildren(Arena, Tokens.drop_back(), 2379b3f38f9SIlya Biryukov new (Arena.allocator()) syntax::TranslationUnit); 2389b3f38f9SIlya Biryukov 2393b929fe7SIlya Biryukov auto *TU = cast<syntax::TranslationUnit>(std::move(Pending).finalize()); 2403b929fe7SIlya Biryukov TU->assertInvariantsRecursive(); 2413b929fe7SIlya Biryukov return TU; 2429b3f38f9SIlya Biryukov } 2439b3f38f9SIlya Biryukov 24488bf9b3dSMarcel Hlopko /// Finds a token starting at \p L. The token must exist if \p L is valid. 24588bf9b3dSMarcel Hlopko const syntax::Token *findToken(SourceLocation L) const; 24688bf9b3dSMarcel Hlopko 247a711a3a4SMarcel Hlopko /// Finds the syntax tokens corresponding to the \p SourceRange. 248a711a3a4SMarcel Hlopko llvm::ArrayRef<syntax::Token> getRange(SourceRange Range) const { 249a711a3a4SMarcel Hlopko assert(Range.isValid()); 250a711a3a4SMarcel Hlopko return getRange(Range.getBegin(), Range.getEnd()); 251a711a3a4SMarcel Hlopko } 252a711a3a4SMarcel Hlopko 253a711a3a4SMarcel Hlopko /// Finds the syntax tokens corresponding to the passed source locations. 2549b3f38f9SIlya Biryukov /// \p First is the start position of the first token and \p Last is the start 2559b3f38f9SIlya Biryukov /// position of the last token. 
2569b3f38f9SIlya Biryukov llvm::ArrayRef<syntax::Token> getRange(SourceLocation First, 2579b3f38f9SIlya Biryukov SourceLocation Last) const { 2589b3f38f9SIlya Biryukov assert(First.isValid()); 2599b3f38f9SIlya Biryukov assert(Last.isValid()); 2609b3f38f9SIlya Biryukov assert(First == Last || 2619b3f38f9SIlya Biryukov Arena.sourceManager().isBeforeInTranslationUnit(First, Last)); 2629b3f38f9SIlya Biryukov return llvm::makeArrayRef(findToken(First), std::next(findToken(Last))); 2639b3f38f9SIlya Biryukov } 26488bf9b3dSMarcel Hlopko 26588bf9b3dSMarcel Hlopko llvm::ArrayRef<syntax::Token> 26688bf9b3dSMarcel Hlopko getTemplateRange(const ClassTemplateSpecializationDecl *D) const { 267a711a3a4SMarcel Hlopko auto Tokens = getRange(D->getSourceRange()); 26888bf9b3dSMarcel Hlopko return maybeAppendSemicolon(Tokens, D); 26988bf9b3dSMarcel Hlopko } 27088bf9b3dSMarcel Hlopko 271*cdce2fe5SMarcel Hlopko /// Returns true if \p D is the last declarator in a chain and is thus 272*cdce2fe5SMarcel Hlopko /// reponsible for creating SimpleDeclaration for the whole chain. 273*cdce2fe5SMarcel Hlopko template <class T> 274*cdce2fe5SMarcel Hlopko bool isResponsibleForCreatingDeclaration(const T *D) const { 275*cdce2fe5SMarcel Hlopko static_assert((std::is_base_of<DeclaratorDecl, T>::value || 276*cdce2fe5SMarcel Hlopko std::is_base_of<TypedefNameDecl, T>::value), 277*cdce2fe5SMarcel Hlopko "only DeclaratorDecl and TypedefNameDecl are supported."); 278*cdce2fe5SMarcel Hlopko 279*cdce2fe5SMarcel Hlopko const Decl *Next = D->getNextDeclInContext(); 280*cdce2fe5SMarcel Hlopko 281*cdce2fe5SMarcel Hlopko // There's no next sibling, this one is responsible. 282*cdce2fe5SMarcel Hlopko if (Next == nullptr) { 283*cdce2fe5SMarcel Hlopko return true; 284*cdce2fe5SMarcel Hlopko } 285*cdce2fe5SMarcel Hlopko const auto *NextT = llvm::dyn_cast<T>(Next); 286*cdce2fe5SMarcel Hlopko 287*cdce2fe5SMarcel Hlopko // Next sibling is not the same type, this one is responsible. 
288*cdce2fe5SMarcel Hlopko if (NextT == nullptr) { 289*cdce2fe5SMarcel Hlopko return true; 290*cdce2fe5SMarcel Hlopko } 291*cdce2fe5SMarcel Hlopko // Next sibling doesn't begin at the same loc, it must be a different 292*cdce2fe5SMarcel Hlopko // declaration, so this declarator is responsible. 293*cdce2fe5SMarcel Hlopko if (NextT->getBeginLoc() != D->getBeginLoc()) { 294*cdce2fe5SMarcel Hlopko return true; 295*cdce2fe5SMarcel Hlopko } 296*cdce2fe5SMarcel Hlopko 297*cdce2fe5SMarcel Hlopko // NextT is a member of the same declaration, and we need the last member to 298*cdce2fe5SMarcel Hlopko // create declaration. This one is not responsible. 299*cdce2fe5SMarcel Hlopko return false; 300*cdce2fe5SMarcel Hlopko } 301*cdce2fe5SMarcel Hlopko 302*cdce2fe5SMarcel Hlopko llvm::ArrayRef<syntax::Token> getDeclarationRange(Decl *D) { 30388bf9b3dSMarcel Hlopko llvm::ArrayRef<clang::syntax::Token> Tokens; 30488bf9b3dSMarcel Hlopko // We want to drop the template parameters for specializations. 30588bf9b3dSMarcel Hlopko if (const auto *S = llvm::dyn_cast<TagDecl>(D)) 30688bf9b3dSMarcel Hlopko Tokens = getRange(S->TypeDecl::getBeginLoc(), S->getEndLoc()); 30788bf9b3dSMarcel Hlopko else 308a711a3a4SMarcel Hlopko Tokens = getRange(D->getSourceRange()); 30988bf9b3dSMarcel Hlopko return maybeAppendSemicolon(Tokens, D); 3109b3f38f9SIlya Biryukov } 311*cdce2fe5SMarcel Hlopko 31258fa50f4SIlya Biryukov llvm::ArrayRef<syntax::Token> getExprRange(const Expr *E) const { 313a711a3a4SMarcel Hlopko return getRange(E->getSourceRange()); 31458fa50f4SIlya Biryukov } 315*cdce2fe5SMarcel Hlopko 31658fa50f4SIlya Biryukov /// Find the adjusted range for the statement, consuming the trailing 31758fa50f4SIlya Biryukov /// semicolon when needed. 
31858fa50f4SIlya Biryukov llvm::ArrayRef<syntax::Token> getStmtRange(const Stmt *S) const { 319a711a3a4SMarcel Hlopko auto Tokens = getRange(S->getSourceRange()); 32058fa50f4SIlya Biryukov if (isa<CompoundStmt>(S)) 32158fa50f4SIlya Biryukov return Tokens; 32258fa50f4SIlya Biryukov 32358fa50f4SIlya Biryukov // Some statements miss a trailing semicolon, e.g. 'return', 'continue' and 32458fa50f4SIlya Biryukov // all statements that end with those. Consume this semicolon here. 325e702bdb8SIlya Biryukov if (Tokens.back().kind() == tok::semi) 326e702bdb8SIlya Biryukov return Tokens; 327e702bdb8SIlya Biryukov return withTrailingSemicolon(Tokens); 328e702bdb8SIlya Biryukov } 329e702bdb8SIlya Biryukov 330e702bdb8SIlya Biryukov private: 331e702bdb8SIlya Biryukov llvm::ArrayRef<syntax::Token> 33288bf9b3dSMarcel Hlopko maybeAppendSemicolon(llvm::ArrayRef<syntax::Token> Tokens, 33388bf9b3dSMarcel Hlopko const Decl *D) const { 33488bf9b3dSMarcel Hlopko if (llvm::isa<NamespaceDecl>(D)) 33588bf9b3dSMarcel Hlopko return Tokens; 33688bf9b3dSMarcel Hlopko if (DeclsWithoutSemicolons.count(D)) 33788bf9b3dSMarcel Hlopko return Tokens; 33888bf9b3dSMarcel Hlopko // FIXME: do not consume trailing semicolon on function definitions. 33988bf9b3dSMarcel Hlopko // Most declarations own a semicolon in syntax trees, but not in clang AST. 34088bf9b3dSMarcel Hlopko return withTrailingSemicolon(Tokens); 34188bf9b3dSMarcel Hlopko } 34288bf9b3dSMarcel Hlopko 34388bf9b3dSMarcel Hlopko llvm::ArrayRef<syntax::Token> 344e702bdb8SIlya Biryukov withTrailingSemicolon(llvm::ArrayRef<syntax::Token> Tokens) const { 345e702bdb8SIlya Biryukov assert(!Tokens.empty()); 346e702bdb8SIlya Biryukov assert(Tokens.back().kind() != tok::eof); 3477d382dcdSMarcel Hlopko // We never consume 'eof', so looking at the next token is ok. 
34858fa50f4SIlya Biryukov if (Tokens.back().kind() != tok::semi && Tokens.end()->kind() == tok::semi) 34958fa50f4SIlya Biryukov return llvm::makeArrayRef(Tokens.begin(), Tokens.end() + 1); 35058fa50f4SIlya Biryukov return Tokens; 3519b3f38f9SIlya Biryukov } 3529b3f38f9SIlya Biryukov 353a711a3a4SMarcel Hlopko void setRole(syntax::Node *N, NodeRole R) { 354a711a3a4SMarcel Hlopko assert(N->role() == NodeRole::Detached); 355a711a3a4SMarcel Hlopko N->setRole(R); 356a711a3a4SMarcel Hlopko } 357a711a3a4SMarcel Hlopko 3589b3f38f9SIlya Biryukov /// A collection of trees covering the input tokens. 3599b3f38f9SIlya Biryukov /// When created, each tree corresponds to a single token in the file. 3609b3f38f9SIlya Biryukov /// Clients call 'foldChildren' to attach one or more subtrees to a parent 3619b3f38f9SIlya Biryukov /// node and update the list of trees accordingly. 3629b3f38f9SIlya Biryukov /// 3639b3f38f9SIlya Biryukov /// Ensures that added nodes properly nest and cover the whole token stream. 3649b3f38f9SIlya Biryukov struct Forest { 3659b3f38f9SIlya Biryukov Forest(syntax::Arena &A) { 366bfbf6b6cSIlya Biryukov assert(!A.tokenBuffer().expandedTokens().empty()); 367bfbf6b6cSIlya Biryukov assert(A.tokenBuffer().expandedTokens().back().kind() == tok::eof); 3689b3f38f9SIlya Biryukov // Create all leaf nodes. 369bfbf6b6cSIlya Biryukov // Note that we do not have 'eof' in the tree. 
3701ad15046SIlya Biryukov for (auto &T : A.tokenBuffer().expandedTokens().drop_back()) { 3711ad15046SIlya Biryukov auto *L = new (A.allocator()) syntax::Leaf(&T); 3721ad15046SIlya Biryukov L->Original = true; 3731ad15046SIlya Biryukov L->CanModify = A.tokenBuffer().spelledForExpanded(T).hasValue(); 374a711a3a4SMarcel Hlopko Trees.insert(Trees.end(), {&T, L}); 3751ad15046SIlya Biryukov } 3769b3f38f9SIlya Biryukov } 3779b3f38f9SIlya Biryukov 3789b3f38f9SIlya Biryukov void assignRole(llvm::ArrayRef<syntax::Token> Range, 3799b3f38f9SIlya Biryukov syntax::NodeRole Role) { 3809b3f38f9SIlya Biryukov assert(!Range.empty()); 3819b3f38f9SIlya Biryukov auto It = Trees.lower_bound(Range.begin()); 3829b3f38f9SIlya Biryukov assert(It != Trees.end() && "no node found"); 3839b3f38f9SIlya Biryukov assert(It->first == Range.begin() && "no child with the specified range"); 3849b3f38f9SIlya Biryukov assert((std::next(It) == Trees.end() || 3859b3f38f9SIlya Biryukov std::next(It)->first == Range.end()) && 3869b3f38f9SIlya Biryukov "no child with the specified range"); 387a711a3a4SMarcel Hlopko assert(It->second->role() == NodeRole::Detached && 388a711a3a4SMarcel Hlopko "re-assigning role for a child"); 389a711a3a4SMarcel Hlopko It->second->setRole(Role); 3909b3f38f9SIlya Biryukov } 3919b3f38f9SIlya Biryukov 392e702bdb8SIlya Biryukov /// Add \p Node to the forest and attach child nodes based on \p Tokens. 3931ad15046SIlya Biryukov void foldChildren(const syntax::Arena &A, 3941ad15046SIlya Biryukov llvm::ArrayRef<syntax::Token> Tokens, 3959b3f38f9SIlya Biryukov syntax::Tree *Node) { 396e702bdb8SIlya Biryukov // Attach children to `Node`. 
397*cdce2fe5SMarcel Hlopko assert(Node->firstChild() == nullptr && "node already has children"); 398*cdce2fe5SMarcel Hlopko 399*cdce2fe5SMarcel Hlopko auto *FirstToken = Tokens.begin(); 400*cdce2fe5SMarcel Hlopko auto BeginChildren = Trees.lower_bound(FirstToken); 401*cdce2fe5SMarcel Hlopko 402*cdce2fe5SMarcel Hlopko assert((BeginChildren == Trees.end() || 403*cdce2fe5SMarcel Hlopko BeginChildren->first == FirstToken) && 404*cdce2fe5SMarcel Hlopko "fold crosses boundaries of existing subtrees"); 405*cdce2fe5SMarcel Hlopko auto EndChildren = Trees.lower_bound(Tokens.end()); 406*cdce2fe5SMarcel Hlopko assert( 407*cdce2fe5SMarcel Hlopko (EndChildren == Trees.end() || EndChildren->first == Tokens.end()) && 408*cdce2fe5SMarcel Hlopko "fold crosses boundaries of existing subtrees"); 409*cdce2fe5SMarcel Hlopko 410*cdce2fe5SMarcel Hlopko // We need to go in reverse order, because we can only prepend. 411*cdce2fe5SMarcel Hlopko for (auto It = EndChildren; It != BeginChildren; --It) { 412*cdce2fe5SMarcel Hlopko auto *C = std::prev(It)->second; 413*cdce2fe5SMarcel Hlopko if (C->role() == NodeRole::Detached) 414*cdce2fe5SMarcel Hlopko C->setRole(NodeRole::Unknown); 415*cdce2fe5SMarcel Hlopko Node->prependChildLowLevel(C); 416e702bdb8SIlya Biryukov } 4179b3f38f9SIlya Biryukov 418*cdce2fe5SMarcel Hlopko // Mark that this node came from the AST and is backed by the source code. 419*cdce2fe5SMarcel Hlopko Node->Original = true; 420*cdce2fe5SMarcel Hlopko Node->CanModify = A.tokenBuffer().spelledForExpanded(Tokens).hasValue(); 4219b3f38f9SIlya Biryukov 422*cdce2fe5SMarcel Hlopko Trees.erase(BeginChildren, EndChildren); 423*cdce2fe5SMarcel Hlopko Trees.insert({FirstToken, Node}); 4249b3f38f9SIlya Biryukov } 4259b3f38f9SIlya Biryukov 4269b3f38f9SIlya Biryukov // EXPECTS: all tokens were consumed and are owned by a single root node. 
4279b3f38f9SIlya Biryukov syntax::Node *finalize() && { 4289b3f38f9SIlya Biryukov assert(Trees.size() == 1); 429a711a3a4SMarcel Hlopko auto *Root = Trees.begin()->second; 4309b3f38f9SIlya Biryukov Trees = {}; 4319b3f38f9SIlya Biryukov return Root; 4329b3f38f9SIlya Biryukov } 4339b3f38f9SIlya Biryukov 4349b3f38f9SIlya Biryukov std::string str(const syntax::Arena &A) const { 4359b3f38f9SIlya Biryukov std::string R; 4369b3f38f9SIlya Biryukov for (auto It = Trees.begin(); It != Trees.end(); ++It) { 4379b3f38f9SIlya Biryukov unsigned CoveredTokens = 4389b3f38f9SIlya Biryukov It != Trees.end() 4399b3f38f9SIlya Biryukov ? (std::next(It)->first - It->first) 4409b3f38f9SIlya Biryukov : A.tokenBuffer().expandedTokens().end() - It->first; 4419b3f38f9SIlya Biryukov 442adcd0268SBenjamin Kramer R += std::string(llvm::formatv( 443a711a3a4SMarcel Hlopko "- '{0}' covers '{1}'+{2} tokens\n", It->second->kind(), 444adcd0268SBenjamin Kramer It->first->text(A.sourceManager()), CoveredTokens)); 445a711a3a4SMarcel Hlopko R += It->second->dump(A); 4469b3f38f9SIlya Biryukov } 4479b3f38f9SIlya Biryukov return R; 4489b3f38f9SIlya Biryukov } 4499b3f38f9SIlya Biryukov 4509b3f38f9SIlya Biryukov private: 4519b3f38f9SIlya Biryukov /// Maps from the start token to a subtree starting at that token. 452302cb3bcSIlya Biryukov /// Keys in the map are pointers into the array of expanded tokens, so 453302cb3bcSIlya Biryukov /// pointer order corresponds to the order of preprocessor tokens. 454a711a3a4SMarcel Hlopko std::map<const syntax::Token *, syntax::Node *> Trees; 4559b3f38f9SIlya Biryukov }; 4569b3f38f9SIlya Biryukov 4579b3f38f9SIlya Biryukov /// For debugging purposes. 4589b3f38f9SIlya Biryukov std::string str() { return Pending.str(Arena); } 4599b3f38f9SIlya Biryukov 4609b3f38f9SIlya Biryukov syntax::Arena &Arena; 461c1bbefefSIlya Biryukov /// To quickly find tokens by their start location. 
462c1bbefefSIlya Biryukov llvm::DenseMap</*SourceLocation*/ unsigned, const syntax::Token *> 463c1bbefefSIlya Biryukov LocationToToken; 4649b3f38f9SIlya Biryukov Forest Pending; 465e702bdb8SIlya Biryukov llvm::DenseSet<Decl *> DeclsWithoutSemicolons; 466a711a3a4SMarcel Hlopko ASTToSyntaxMapping Mapping; 4679b3f38f9SIlya Biryukov }; 4689b3f38f9SIlya Biryukov 4699b3f38f9SIlya Biryukov namespace { 4709b3f38f9SIlya Biryukov class BuildTreeVisitor : public RecursiveASTVisitor<BuildTreeVisitor> { 4719b3f38f9SIlya Biryukov public: 4729b3f38f9SIlya Biryukov explicit BuildTreeVisitor(ASTContext &Ctx, syntax::TreeBuilder &Builder) 4739b3f38f9SIlya Biryukov : Builder(Builder), LangOpts(Ctx.getLangOpts()) {} 4749b3f38f9SIlya Biryukov 4759b3f38f9SIlya Biryukov bool shouldTraversePostOrder() const { return true; } 4769b3f38f9SIlya Biryukov 4777d382dcdSMarcel Hlopko bool WalkUpFromDeclaratorDecl(DeclaratorDecl *DD) { 478*cdce2fe5SMarcel Hlopko return processDeclaratorAndDeclaration(DD); 4797d382dcdSMarcel Hlopko } 4807d382dcdSMarcel Hlopko 481*cdce2fe5SMarcel Hlopko bool WalkUpFromTypedefNameDecl(TypedefNameDecl *TD) { 482*cdce2fe5SMarcel Hlopko return processDeclaratorAndDeclaration(TD); 4839b3f38f9SIlya Biryukov } 4849b3f38f9SIlya Biryukov 4859b3f38f9SIlya Biryukov bool VisitDecl(Decl *D) { 4869b3f38f9SIlya Biryukov assert(!D->isImplicit()); 487*cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(D), 488a711a3a4SMarcel Hlopko new (allocator()) syntax::UnknownDeclaration(), D); 489e702bdb8SIlya Biryukov return true; 490e702bdb8SIlya Biryukov } 491e702bdb8SIlya Biryukov 49288bf9b3dSMarcel Hlopko // RAV does not call WalkUpFrom* on explicit instantiations, so we have to 49388bf9b3dSMarcel Hlopko // override Traverse. 49488bf9b3dSMarcel Hlopko // FIXME: make RAV call WalkUpFrom* instead. 
49588bf9b3dSMarcel Hlopko bool 49688bf9b3dSMarcel Hlopko TraverseClassTemplateSpecializationDecl(ClassTemplateSpecializationDecl *C) { 49788bf9b3dSMarcel Hlopko if (!RecursiveASTVisitor::TraverseClassTemplateSpecializationDecl(C)) 49888bf9b3dSMarcel Hlopko return false; 49988bf9b3dSMarcel Hlopko if (C->isExplicitSpecialization()) 50088bf9b3dSMarcel Hlopko return true; // we are only interested in explicit instantiations. 501a711a3a4SMarcel Hlopko auto *Declaration = 502a711a3a4SMarcel Hlopko cast<syntax::SimpleDeclaration>(handleFreeStandingTagDecl(C)); 50388bf9b3dSMarcel Hlopko foldExplicitTemplateInstantiation( 50488bf9b3dSMarcel Hlopko Builder.getTemplateRange(C), Builder.findToken(C->getExternLoc()), 505a711a3a4SMarcel Hlopko Builder.findToken(C->getTemplateKeywordLoc()), Declaration, C); 50688bf9b3dSMarcel Hlopko return true; 50788bf9b3dSMarcel Hlopko } 50888bf9b3dSMarcel Hlopko 50988bf9b3dSMarcel Hlopko bool WalkUpFromTemplateDecl(TemplateDecl *S) { 51088bf9b3dSMarcel Hlopko foldTemplateDeclaration( 511*cdce2fe5SMarcel Hlopko Builder.getDeclarationRange(S), 51288bf9b3dSMarcel Hlopko Builder.findToken(S->getTemplateParameters()->getTemplateLoc()), 513*cdce2fe5SMarcel Hlopko Builder.getDeclarationRange(S->getTemplatedDecl()), S); 51488bf9b3dSMarcel Hlopko return true; 51588bf9b3dSMarcel Hlopko } 51688bf9b3dSMarcel Hlopko 517e702bdb8SIlya Biryukov bool WalkUpFromTagDecl(TagDecl *C) { 51804f627f6SIlya Biryukov // FIXME: build the ClassSpecifier node. 
51988bf9b3dSMarcel Hlopko if (!C->isFreeStanding()) { 52088bf9b3dSMarcel Hlopko assert(C->getNumTemplateParameterLists() == 0); 52104f627f6SIlya Biryukov return true; 52204f627f6SIlya Biryukov } 523a711a3a4SMarcel Hlopko handleFreeStandingTagDecl(C); 524a711a3a4SMarcel Hlopko return true; 525a711a3a4SMarcel Hlopko } 526a711a3a4SMarcel Hlopko 527a711a3a4SMarcel Hlopko syntax::Declaration *handleFreeStandingTagDecl(TagDecl *C) { 528a711a3a4SMarcel Hlopko assert(C->isFreeStanding()); 52988bf9b3dSMarcel Hlopko // Class is a declaration specifier and needs a spanning declaration node. 530*cdce2fe5SMarcel Hlopko auto DeclarationRange = Builder.getDeclarationRange(C); 531a711a3a4SMarcel Hlopko syntax::Declaration *Result = new (allocator()) syntax::SimpleDeclaration; 532a711a3a4SMarcel Hlopko Builder.foldNode(DeclarationRange, Result, nullptr); 53388bf9b3dSMarcel Hlopko 53488bf9b3dSMarcel Hlopko // Build TemplateDeclaration nodes if we had template parameters. 53588bf9b3dSMarcel Hlopko auto ConsumeTemplateParameters = [&](const TemplateParameterList &L) { 53688bf9b3dSMarcel Hlopko const auto *TemplateKW = Builder.findToken(L.getTemplateLoc()); 53788bf9b3dSMarcel Hlopko auto R = llvm::makeArrayRef(TemplateKW, DeclarationRange.end()); 538a711a3a4SMarcel Hlopko Result = 539a711a3a4SMarcel Hlopko foldTemplateDeclaration(R, TemplateKW, DeclarationRange, nullptr); 54088bf9b3dSMarcel Hlopko DeclarationRange = R; 54188bf9b3dSMarcel Hlopko }; 54288bf9b3dSMarcel Hlopko if (auto *S = llvm::dyn_cast<ClassTemplatePartialSpecializationDecl>(C)) 54388bf9b3dSMarcel Hlopko ConsumeTemplateParameters(*S->getTemplateParameters()); 54488bf9b3dSMarcel Hlopko for (unsigned I = C->getNumTemplateParameterLists(); 0 < I; --I) 54588bf9b3dSMarcel Hlopko ConsumeTemplateParameters(*C->getTemplateParameterList(I - 1)); 546a711a3a4SMarcel Hlopko return Result; 5479b3f38f9SIlya Biryukov } 5489b3f38f9SIlya Biryukov 5499b3f38f9SIlya Biryukov bool WalkUpFromTranslationUnitDecl(TranslationUnitDecl *TU) { 
5507d382dcdSMarcel Hlopko // We do not want to call VisitDecl(), the declaration for translation 5519b3f38f9SIlya Biryukov // unit is built by finalize(). 5529b3f38f9SIlya Biryukov return true; 5539b3f38f9SIlya Biryukov } 5549b3f38f9SIlya Biryukov 5559b3f38f9SIlya Biryukov bool WalkUpFromCompoundStmt(CompoundStmt *S) { 55651dad419SIlya Biryukov using NodeRole = syntax::NodeRole; 5579b3f38f9SIlya Biryukov 558def65bb4SIlya Biryukov Builder.markChildToken(S->getLBracLoc(), NodeRole::OpenParen); 55958fa50f4SIlya Biryukov for (auto *Child : S->body()) 56058fa50f4SIlya Biryukov Builder.markStmtChild(Child, NodeRole::CompoundStatement_statement); 561def65bb4SIlya Biryukov Builder.markChildToken(S->getRBracLoc(), NodeRole::CloseParen); 5629b3f38f9SIlya Biryukov 56358fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 564a711a3a4SMarcel Hlopko new (allocator()) syntax::CompoundStatement, S); 5659b3f38f9SIlya Biryukov return true; 5669b3f38f9SIlya Biryukov } 5679b3f38f9SIlya Biryukov 56858fa50f4SIlya Biryukov // Some statements are not yet handled by syntax trees. 56958fa50f4SIlya Biryukov bool WalkUpFromStmt(Stmt *S) { 57058fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 571a711a3a4SMarcel Hlopko new (allocator()) syntax::UnknownStatement, S); 57258fa50f4SIlya Biryukov return true; 57358fa50f4SIlya Biryukov } 57458fa50f4SIlya Biryukov 57558fa50f4SIlya Biryukov bool TraverseCXXForRangeStmt(CXXForRangeStmt *S) { 57658fa50f4SIlya Biryukov // We override to traverse range initializer as VarDecl. 57758fa50f4SIlya Biryukov // RAV traverses it as a statement, we produce invalid node kinds in that 57858fa50f4SIlya Biryukov // case. 57958fa50f4SIlya Biryukov // FIXME: should do this in RAV instead? 
58058fa50f4SIlya Biryukov if (S->getInit() && !TraverseStmt(S->getInit())) 58158fa50f4SIlya Biryukov return false; 58258fa50f4SIlya Biryukov if (S->getLoopVariable() && !TraverseDecl(S->getLoopVariable())) 58358fa50f4SIlya Biryukov return false; 58458fa50f4SIlya Biryukov if (S->getRangeInit() && !TraverseStmt(S->getRangeInit())) 58558fa50f4SIlya Biryukov return false; 58658fa50f4SIlya Biryukov if (S->getBody() && !TraverseStmt(S->getBody())) 58758fa50f4SIlya Biryukov return false; 58858fa50f4SIlya Biryukov return true; 58958fa50f4SIlya Biryukov } 59058fa50f4SIlya Biryukov 59158fa50f4SIlya Biryukov bool TraverseStmt(Stmt *S) { 592e702bdb8SIlya Biryukov if (auto *DS = llvm::dyn_cast_or_null<DeclStmt>(S)) { 593e702bdb8SIlya Biryukov // We want to consume the semicolon, make sure SimpleDeclaration does not. 594e702bdb8SIlya Biryukov for (auto *D : DS->decls()) 5957d382dcdSMarcel Hlopko Builder.noticeDeclWithoutSemicolon(D); 596e702bdb8SIlya Biryukov } else if (auto *E = llvm::dyn_cast_or_null<Expr>(S)) { 5977d382dcdSMarcel Hlopko // Do not recurse into subexpressions. 5987d382dcdSMarcel Hlopko // We do not have syntax trees for expressions yet, so we only want to see 59958fa50f4SIlya Biryukov // the first top-level expression. 60058fa50f4SIlya Biryukov return WalkUpFromExpr(E->IgnoreImplicit()); 60158fa50f4SIlya Biryukov } 60258fa50f4SIlya Biryukov return RecursiveASTVisitor::TraverseStmt(S); 60358fa50f4SIlya Biryukov } 60458fa50f4SIlya Biryukov 60558fa50f4SIlya Biryukov // Some expressions are not yet handled by syntax trees. 
60658fa50f4SIlya Biryukov bool WalkUpFromExpr(Expr *E) { 60758fa50f4SIlya Biryukov assert(!isImplicitExpr(E) && "should be handled by TraverseStmt"); 60858fa50f4SIlya Biryukov Builder.foldNode(Builder.getExprRange(E), 609a711a3a4SMarcel Hlopko new (allocator()) syntax::UnknownExpression, E); 61058fa50f4SIlya Biryukov return true; 61158fa50f4SIlya Biryukov } 61258fa50f4SIlya Biryukov 613be14a22bSIlya Biryukov bool WalkUpFromNamespaceDecl(NamespaceDecl *S) { 614*cdce2fe5SMarcel Hlopko auto Tokens = Builder.getDeclarationRange(S); 615be14a22bSIlya Biryukov if (Tokens.front().kind() == tok::coloncolon) { 616be14a22bSIlya Biryukov // Handle nested namespace definitions. Those start at '::' token, e.g. 617be14a22bSIlya Biryukov // namespace a^::b {} 618be14a22bSIlya Biryukov // FIXME: build corresponding nodes for the name of this namespace. 619be14a22bSIlya Biryukov return true; 620be14a22bSIlya Biryukov } 621a711a3a4SMarcel Hlopko Builder.foldNode(Tokens, new (allocator()) syntax::NamespaceDefinition, S); 622be14a22bSIlya Biryukov return true; 623be14a22bSIlya Biryukov } 624be14a22bSIlya Biryukov 6257d382dcdSMarcel Hlopko bool TraverseParenTypeLoc(ParenTypeLoc L) { 6267d382dcdSMarcel Hlopko // We reverse order of traversal to get the proper syntax structure. 
6277d382dcdSMarcel Hlopko if (!WalkUpFromParenTypeLoc(L)) 6287d382dcdSMarcel Hlopko return false; 6297d382dcdSMarcel Hlopko return TraverseTypeLoc(L.getInnerLoc()); 6307d382dcdSMarcel Hlopko } 6317d382dcdSMarcel Hlopko 6327d382dcdSMarcel Hlopko bool WalkUpFromParenTypeLoc(ParenTypeLoc L) { 6337d382dcdSMarcel Hlopko Builder.markChildToken(L.getLParenLoc(), syntax::NodeRole::OpenParen); 6347d382dcdSMarcel Hlopko Builder.markChildToken(L.getRParenLoc(), syntax::NodeRole::CloseParen); 6357d382dcdSMarcel Hlopko Builder.foldNode(Builder.getRange(L.getLParenLoc(), L.getRParenLoc()), 636a711a3a4SMarcel Hlopko new (allocator()) syntax::ParenDeclarator, L); 6377d382dcdSMarcel Hlopko return true; 6387d382dcdSMarcel Hlopko } 6397d382dcdSMarcel Hlopko 6407d382dcdSMarcel Hlopko // Declarator chunks, they are produced by type locs and some clang::Decls. 6417d382dcdSMarcel Hlopko bool WalkUpFromArrayTypeLoc(ArrayTypeLoc L) { 6427d382dcdSMarcel Hlopko Builder.markChildToken(L.getLBracketLoc(), syntax::NodeRole::OpenParen); 6437d382dcdSMarcel Hlopko Builder.markExprChild(L.getSizeExpr(), 6447d382dcdSMarcel Hlopko syntax::NodeRole::ArraySubscript_sizeExpression); 6457d382dcdSMarcel Hlopko Builder.markChildToken(L.getRBracketLoc(), syntax::NodeRole::CloseParen); 6467d382dcdSMarcel Hlopko Builder.foldNode(Builder.getRange(L.getLBracketLoc(), L.getRBracketLoc()), 647a711a3a4SMarcel Hlopko new (allocator()) syntax::ArraySubscript, L); 6487d382dcdSMarcel Hlopko return true; 6497d382dcdSMarcel Hlopko } 6507d382dcdSMarcel Hlopko 6517d382dcdSMarcel Hlopko bool WalkUpFromFunctionTypeLoc(FunctionTypeLoc L) { 6527d382dcdSMarcel Hlopko Builder.markChildToken(L.getLParenLoc(), syntax::NodeRole::OpenParen); 653*cdce2fe5SMarcel Hlopko for (auto *P : L.getParams()) { 654*cdce2fe5SMarcel Hlopko Builder.markChild(P, syntax::NodeRole::ParametersAndQualifiers_parameter); 655*cdce2fe5SMarcel Hlopko } 6567d382dcdSMarcel Hlopko Builder.markChildToken(L.getRParenLoc(), syntax::NodeRole::CloseParen); 
6577d382dcdSMarcel Hlopko Builder.foldNode(Builder.getRange(L.getLParenLoc(), L.getEndLoc()), 658a711a3a4SMarcel Hlopko new (allocator()) syntax::ParametersAndQualifiers, L); 6597d382dcdSMarcel Hlopko return true; 6607d382dcdSMarcel Hlopko } 6617d382dcdSMarcel Hlopko 6627d382dcdSMarcel Hlopko bool WalkUpFromFunctionProtoTypeLoc(FunctionProtoTypeLoc L) { 6637d382dcdSMarcel Hlopko if (!L.getTypePtr()->hasTrailingReturn()) 6647d382dcdSMarcel Hlopko return WalkUpFromFunctionTypeLoc(L); 6657d382dcdSMarcel Hlopko 666*cdce2fe5SMarcel Hlopko auto *TrailingReturnTokens = BuildTrailingReturn(L); 6677d382dcdSMarcel Hlopko // Finish building the node for parameters. 6687d382dcdSMarcel Hlopko Builder.markChild(TrailingReturnTokens, 6697d382dcdSMarcel Hlopko syntax::NodeRole::ParametersAndQualifiers_trailingReturn); 6707d382dcdSMarcel Hlopko return WalkUpFromFunctionTypeLoc(L); 6717d382dcdSMarcel Hlopko } 6727d382dcdSMarcel Hlopko 6737d382dcdSMarcel Hlopko bool WalkUpFromMemberPointerTypeLoc(MemberPointerTypeLoc L) { 6747d382dcdSMarcel Hlopko auto SR = L.getLocalSourceRange(); 675a711a3a4SMarcel Hlopko Builder.foldNode(Builder.getRange(SR), 676a711a3a4SMarcel Hlopko new (allocator()) syntax::MemberPointer, L); 6777d382dcdSMarcel Hlopko return true; 6787d382dcdSMarcel Hlopko } 6797d382dcdSMarcel Hlopko 68058fa50f4SIlya Biryukov // The code below is very regular, it could even be generated with some 68158fa50f4SIlya Biryukov // preprocessor magic. We merely assign roles to the corresponding children 68258fa50f4SIlya Biryukov // and fold resulting nodes. 
68358fa50f4SIlya Biryukov bool WalkUpFromDeclStmt(DeclStmt *S) { 68458fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 685a711a3a4SMarcel Hlopko new (allocator()) syntax::DeclarationStatement, S); 68658fa50f4SIlya Biryukov return true; 68758fa50f4SIlya Biryukov } 68858fa50f4SIlya Biryukov 68958fa50f4SIlya Biryukov bool WalkUpFromNullStmt(NullStmt *S) { 69058fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 691a711a3a4SMarcel Hlopko new (allocator()) syntax::EmptyStatement, S); 69258fa50f4SIlya Biryukov return true; 69358fa50f4SIlya Biryukov } 69458fa50f4SIlya Biryukov 69558fa50f4SIlya Biryukov bool WalkUpFromSwitchStmt(SwitchStmt *S) { 696def65bb4SIlya Biryukov Builder.markChildToken(S->getSwitchLoc(), 69758fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 69858fa50f4SIlya Biryukov Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement); 69958fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 700a711a3a4SMarcel Hlopko new (allocator()) syntax::SwitchStatement, S); 70158fa50f4SIlya Biryukov return true; 70258fa50f4SIlya Biryukov } 70358fa50f4SIlya Biryukov 70458fa50f4SIlya Biryukov bool WalkUpFromCaseStmt(CaseStmt *S) { 705def65bb4SIlya Biryukov Builder.markChildToken(S->getKeywordLoc(), 70658fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 70758fa50f4SIlya Biryukov Builder.markExprChild(S->getLHS(), syntax::NodeRole::CaseStatement_value); 70858fa50f4SIlya Biryukov Builder.markStmtChild(S->getSubStmt(), syntax::NodeRole::BodyStatement); 70958fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 710a711a3a4SMarcel Hlopko new (allocator()) syntax::CaseStatement, S); 71158fa50f4SIlya Biryukov return true; 71258fa50f4SIlya Biryukov } 71358fa50f4SIlya Biryukov 71458fa50f4SIlya Biryukov bool WalkUpFromDefaultStmt(DefaultStmt *S) { 715def65bb4SIlya Biryukov Builder.markChildToken(S->getKeywordLoc(), 71658fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 71758fa50f4SIlya Biryukov 
Builder.markStmtChild(S->getSubStmt(), syntax::NodeRole::BodyStatement); 71858fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 719a711a3a4SMarcel Hlopko new (allocator()) syntax::DefaultStatement, S); 72058fa50f4SIlya Biryukov return true; 72158fa50f4SIlya Biryukov } 72258fa50f4SIlya Biryukov 72358fa50f4SIlya Biryukov bool WalkUpFromIfStmt(IfStmt *S) { 724def65bb4SIlya Biryukov Builder.markChildToken(S->getIfLoc(), syntax::NodeRole::IntroducerKeyword); 72558fa50f4SIlya Biryukov Builder.markStmtChild(S->getThen(), 72658fa50f4SIlya Biryukov syntax::NodeRole::IfStatement_thenStatement); 727def65bb4SIlya Biryukov Builder.markChildToken(S->getElseLoc(), 72858fa50f4SIlya Biryukov syntax::NodeRole::IfStatement_elseKeyword); 72958fa50f4SIlya Biryukov Builder.markStmtChild(S->getElse(), 73058fa50f4SIlya Biryukov syntax::NodeRole::IfStatement_elseStatement); 73158fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 732a711a3a4SMarcel Hlopko new (allocator()) syntax::IfStatement, S); 73358fa50f4SIlya Biryukov return true; 73458fa50f4SIlya Biryukov } 73558fa50f4SIlya Biryukov 73658fa50f4SIlya Biryukov bool WalkUpFromForStmt(ForStmt *S) { 737def65bb4SIlya Biryukov Builder.markChildToken(S->getForLoc(), syntax::NodeRole::IntroducerKeyword); 73858fa50f4SIlya Biryukov Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement); 73958fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 740a711a3a4SMarcel Hlopko new (allocator()) syntax::ForStatement, S); 74158fa50f4SIlya Biryukov return true; 74258fa50f4SIlya Biryukov } 74358fa50f4SIlya Biryukov 74458fa50f4SIlya Biryukov bool WalkUpFromWhileStmt(WhileStmt *S) { 745def65bb4SIlya Biryukov Builder.markChildToken(S->getWhileLoc(), 74658fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 74758fa50f4SIlya Biryukov Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement); 74858fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 749a711a3a4SMarcel Hlopko new 
(allocator()) syntax::WhileStatement, S); 75058fa50f4SIlya Biryukov return true; 75158fa50f4SIlya Biryukov } 75258fa50f4SIlya Biryukov 75358fa50f4SIlya Biryukov bool WalkUpFromContinueStmt(ContinueStmt *S) { 754def65bb4SIlya Biryukov Builder.markChildToken(S->getContinueLoc(), 75558fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 75658fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 757a711a3a4SMarcel Hlopko new (allocator()) syntax::ContinueStatement, S); 75858fa50f4SIlya Biryukov return true; 75958fa50f4SIlya Biryukov } 76058fa50f4SIlya Biryukov 76158fa50f4SIlya Biryukov bool WalkUpFromBreakStmt(BreakStmt *S) { 762def65bb4SIlya Biryukov Builder.markChildToken(S->getBreakLoc(), 76358fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 76458fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 765a711a3a4SMarcel Hlopko new (allocator()) syntax::BreakStatement, S); 76658fa50f4SIlya Biryukov return true; 76758fa50f4SIlya Biryukov } 76858fa50f4SIlya Biryukov 76958fa50f4SIlya Biryukov bool WalkUpFromReturnStmt(ReturnStmt *S) { 770def65bb4SIlya Biryukov Builder.markChildToken(S->getReturnLoc(), 77158fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 77258fa50f4SIlya Biryukov Builder.markExprChild(S->getRetValue(), 77358fa50f4SIlya Biryukov syntax::NodeRole::ReturnStatement_value); 77458fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 775a711a3a4SMarcel Hlopko new (allocator()) syntax::ReturnStatement, S); 77658fa50f4SIlya Biryukov return true; 77758fa50f4SIlya Biryukov } 77858fa50f4SIlya Biryukov 77958fa50f4SIlya Biryukov bool WalkUpFromCXXForRangeStmt(CXXForRangeStmt *S) { 780def65bb4SIlya Biryukov Builder.markChildToken(S->getForLoc(), syntax::NodeRole::IntroducerKeyword); 78158fa50f4SIlya Biryukov Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement); 78258fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 783a711a3a4SMarcel Hlopko new (allocator()) syntax::RangeBasedForStatement, 
S); 78458fa50f4SIlya Biryukov return true; 78558fa50f4SIlya Biryukov } 78658fa50f4SIlya Biryukov 787be14a22bSIlya Biryukov bool WalkUpFromEmptyDecl(EmptyDecl *S) { 788*cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 789a711a3a4SMarcel Hlopko new (allocator()) syntax::EmptyDeclaration, S); 790be14a22bSIlya Biryukov return true; 791be14a22bSIlya Biryukov } 792be14a22bSIlya Biryukov 793be14a22bSIlya Biryukov bool WalkUpFromStaticAssertDecl(StaticAssertDecl *S) { 794be14a22bSIlya Biryukov Builder.markExprChild(S->getAssertExpr(), 795be14a22bSIlya Biryukov syntax::NodeRole::StaticAssertDeclaration_condition); 796be14a22bSIlya Biryukov Builder.markExprChild(S->getMessage(), 797be14a22bSIlya Biryukov syntax::NodeRole::StaticAssertDeclaration_message); 798*cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 799a711a3a4SMarcel Hlopko new (allocator()) syntax::StaticAssertDeclaration, S); 800be14a22bSIlya Biryukov return true; 801be14a22bSIlya Biryukov } 802be14a22bSIlya Biryukov 803be14a22bSIlya Biryukov bool WalkUpFromLinkageSpecDecl(LinkageSpecDecl *S) { 804*cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 805a711a3a4SMarcel Hlopko new (allocator()) syntax::LinkageSpecificationDeclaration, 806a711a3a4SMarcel Hlopko S); 807be14a22bSIlya Biryukov return true; 808be14a22bSIlya Biryukov } 809be14a22bSIlya Biryukov 810be14a22bSIlya Biryukov bool WalkUpFromNamespaceAliasDecl(NamespaceAliasDecl *S) { 811*cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 812a711a3a4SMarcel Hlopko new (allocator()) syntax::NamespaceAliasDefinition, S); 813be14a22bSIlya Biryukov return true; 814be14a22bSIlya Biryukov } 815be14a22bSIlya Biryukov 816be14a22bSIlya Biryukov bool WalkUpFromUsingDirectiveDecl(UsingDirectiveDecl *S) { 817*cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 818a711a3a4SMarcel Hlopko new (allocator()) syntax::UsingNamespaceDirective, S); 819be14a22bSIlya Biryukov 
return true; 820be14a22bSIlya Biryukov } 821be14a22bSIlya Biryukov 822be14a22bSIlya Biryukov bool WalkUpFromUsingDecl(UsingDecl *S) { 823*cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 824a711a3a4SMarcel Hlopko new (allocator()) syntax::UsingDeclaration, S); 825be14a22bSIlya Biryukov return true; 826be14a22bSIlya Biryukov } 827be14a22bSIlya Biryukov 828be14a22bSIlya Biryukov bool WalkUpFromUnresolvedUsingValueDecl(UnresolvedUsingValueDecl *S) { 829*cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 830a711a3a4SMarcel Hlopko new (allocator()) syntax::UsingDeclaration, S); 831be14a22bSIlya Biryukov return true; 832be14a22bSIlya Biryukov } 833be14a22bSIlya Biryukov 834be14a22bSIlya Biryukov bool WalkUpFromUnresolvedUsingTypenameDecl(UnresolvedUsingTypenameDecl *S) { 835*cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 836a711a3a4SMarcel Hlopko new (allocator()) syntax::UsingDeclaration, S); 837be14a22bSIlya Biryukov return true; 838be14a22bSIlya Biryukov } 839be14a22bSIlya Biryukov 840be14a22bSIlya Biryukov bool WalkUpFromTypeAliasDecl(TypeAliasDecl *S) { 841*cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 842a711a3a4SMarcel Hlopko new (allocator()) syntax::TypeAliasDeclaration, S); 843be14a22bSIlya Biryukov return true; 844be14a22bSIlya Biryukov } 845be14a22bSIlya Biryukov 8469b3f38f9SIlya Biryukov private: 847*cdce2fe5SMarcel Hlopko template <class T> SourceLocation getQualifiedNameStart(T *D) { 848*cdce2fe5SMarcel Hlopko static_assert((std::is_base_of<DeclaratorDecl, T>::value || 849*cdce2fe5SMarcel Hlopko std::is_base_of<TypedefNameDecl, T>::value), 850*cdce2fe5SMarcel Hlopko "only DeclaratorDecl and TypedefNameDecl are supported."); 851*cdce2fe5SMarcel Hlopko 852*cdce2fe5SMarcel Hlopko auto DN = D->getDeclName(); 853*cdce2fe5SMarcel Hlopko bool IsAnonymous = DN.isIdentifier() && !DN.getAsIdentifierInfo(); 854*cdce2fe5SMarcel Hlopko if (IsAnonymous) 855*cdce2fe5SMarcel 
Hlopko return SourceLocation(); 856*cdce2fe5SMarcel Hlopko 857*cdce2fe5SMarcel Hlopko if (const auto *DD = llvm::dyn_cast<DeclaratorDecl>(D)) { 858*cdce2fe5SMarcel Hlopko if (DD->getQualifierLoc()) { 859*cdce2fe5SMarcel Hlopko return DD->getQualifierLoc().getBeginLoc(); 860*cdce2fe5SMarcel Hlopko } 861*cdce2fe5SMarcel Hlopko } 862*cdce2fe5SMarcel Hlopko 863*cdce2fe5SMarcel Hlopko return D->getLocation(); 864*cdce2fe5SMarcel Hlopko } 865*cdce2fe5SMarcel Hlopko 866*cdce2fe5SMarcel Hlopko SourceRange getInitializerRange(Decl *D) { 867*cdce2fe5SMarcel Hlopko if (auto *V = llvm::dyn_cast<VarDecl>(D)) { 868*cdce2fe5SMarcel Hlopko auto *I = V->getInit(); 869*cdce2fe5SMarcel Hlopko // Initializers in range-based-for are not part of the declarator 870*cdce2fe5SMarcel Hlopko if (I && !V->isCXXForRangeDecl()) 871*cdce2fe5SMarcel Hlopko return I->getSourceRange(); 872*cdce2fe5SMarcel Hlopko } 873*cdce2fe5SMarcel Hlopko 874*cdce2fe5SMarcel Hlopko return SourceRange(); 875*cdce2fe5SMarcel Hlopko } 876*cdce2fe5SMarcel Hlopko 877*cdce2fe5SMarcel Hlopko /// Folds SimpleDeclarator node (if present) and in case this is the last 878*cdce2fe5SMarcel Hlopko /// declarator in the chain it also folds SimpleDeclaration node. 879*cdce2fe5SMarcel Hlopko template <class T> bool processDeclaratorAndDeclaration(T *D) { 880*cdce2fe5SMarcel Hlopko SourceRange Initializer = getInitializerRange(D); 881*cdce2fe5SMarcel Hlopko auto Range = getDeclaratorRange(Builder.sourceManager(), 882*cdce2fe5SMarcel Hlopko D->getTypeSourceInfo()->getTypeLoc(), 883*cdce2fe5SMarcel Hlopko getQualifiedNameStart(D), Initializer); 884*cdce2fe5SMarcel Hlopko 885*cdce2fe5SMarcel Hlopko // There doesn't have to be a declarator (e.g. `void foo(int)` only has 886*cdce2fe5SMarcel Hlopko // declaration, but no declarator). 
887*cdce2fe5SMarcel Hlopko if (Range.getBegin().isValid()) { 888*cdce2fe5SMarcel Hlopko auto *N = new (allocator()) syntax::SimpleDeclarator; 889*cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getRange(Range), N, nullptr); 890*cdce2fe5SMarcel Hlopko Builder.markChild(N, syntax::NodeRole::SimpleDeclaration_declarator); 891*cdce2fe5SMarcel Hlopko } 892*cdce2fe5SMarcel Hlopko 893*cdce2fe5SMarcel Hlopko if (Builder.isResponsibleForCreatingDeclaration(D)) { 894*cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(D), 895*cdce2fe5SMarcel Hlopko new (allocator()) syntax::SimpleDeclaration, D); 896*cdce2fe5SMarcel Hlopko } 897*cdce2fe5SMarcel Hlopko return true; 898*cdce2fe5SMarcel Hlopko } 899*cdce2fe5SMarcel Hlopko 9007d382dcdSMarcel Hlopko /// Returns the range of the built node. 901a711a3a4SMarcel Hlopko syntax::TrailingReturnType *BuildTrailingReturn(FunctionProtoTypeLoc L) { 9027d382dcdSMarcel Hlopko assert(L.getTypePtr()->hasTrailingReturn()); 9037d382dcdSMarcel Hlopko 9047d382dcdSMarcel Hlopko auto ReturnedType = L.getReturnLoc(); 9057d382dcdSMarcel Hlopko // Build node for the declarator, if any. 9067d382dcdSMarcel Hlopko auto ReturnDeclaratorRange = 9077d382dcdSMarcel Hlopko getDeclaratorRange(this->Builder.sourceManager(), ReturnedType, 9087d382dcdSMarcel Hlopko /*Name=*/SourceLocation(), 9097d382dcdSMarcel Hlopko /*Initializer=*/SourceLocation()); 910a711a3a4SMarcel Hlopko syntax::SimpleDeclarator *ReturnDeclarator = nullptr; 9117d382dcdSMarcel Hlopko if (ReturnDeclaratorRange.isValid()) { 912a711a3a4SMarcel Hlopko ReturnDeclarator = new (allocator()) syntax::SimpleDeclarator; 913a711a3a4SMarcel Hlopko Builder.foldNode(Builder.getRange(ReturnDeclaratorRange), 914a711a3a4SMarcel Hlopko ReturnDeclarator, nullptr); 9157d382dcdSMarcel Hlopko } 9167d382dcdSMarcel Hlopko 9177d382dcdSMarcel Hlopko // Build node for trailing return type. 
918a711a3a4SMarcel Hlopko auto Return = Builder.getRange(ReturnedType.getSourceRange()); 9197d382dcdSMarcel Hlopko const auto *Arrow = Return.begin() - 1; 9207d382dcdSMarcel Hlopko assert(Arrow->kind() == tok::arrow); 9217d382dcdSMarcel Hlopko auto Tokens = llvm::makeArrayRef(Arrow, Return.end()); 9227d382dcdSMarcel Hlopko Builder.markChildToken(Arrow, syntax::NodeRole::TrailingReturnType_arrow); 923a711a3a4SMarcel Hlopko if (ReturnDeclarator) 924a711a3a4SMarcel Hlopko Builder.markChild(ReturnDeclarator, 9257d382dcdSMarcel Hlopko syntax::NodeRole::TrailingReturnType_declarator); 926a711a3a4SMarcel Hlopko auto *R = new (allocator()) syntax::TrailingReturnType; 927*cdce2fe5SMarcel Hlopko Builder.foldNode(Tokens, R, L); 928a711a3a4SMarcel Hlopko return R; 9297d382dcdSMarcel Hlopko } 93088bf9b3dSMarcel Hlopko 931a711a3a4SMarcel Hlopko void foldExplicitTemplateInstantiation( 932a711a3a4SMarcel Hlopko ArrayRef<syntax::Token> Range, const syntax::Token *ExternKW, 93388bf9b3dSMarcel Hlopko const syntax::Token *TemplateKW, 934a711a3a4SMarcel Hlopko syntax::SimpleDeclaration *InnerDeclaration, Decl *From) { 93588bf9b3dSMarcel Hlopko assert(!ExternKW || ExternKW->kind() == tok::kw_extern); 93688bf9b3dSMarcel Hlopko assert(TemplateKW && TemplateKW->kind() == tok::kw_template); 93788bf9b3dSMarcel Hlopko Builder.markChildToken( 93888bf9b3dSMarcel Hlopko ExternKW, 93988bf9b3dSMarcel Hlopko syntax::NodeRole::ExplicitTemplateInstantiation_externKeyword); 94088bf9b3dSMarcel Hlopko Builder.markChildToken(TemplateKW, syntax::NodeRole::IntroducerKeyword); 94188bf9b3dSMarcel Hlopko Builder.markChild( 94288bf9b3dSMarcel Hlopko InnerDeclaration, 94388bf9b3dSMarcel Hlopko syntax::NodeRole::ExplicitTemplateInstantiation_declaration); 944a711a3a4SMarcel Hlopko Builder.foldNode( 945a711a3a4SMarcel Hlopko Range, new (allocator()) syntax::ExplicitTemplateInstantiation, From); 94688bf9b3dSMarcel Hlopko } 94788bf9b3dSMarcel Hlopko 948a711a3a4SMarcel Hlopko syntax::TemplateDeclaration 
*foldTemplateDeclaration( 949a711a3a4SMarcel Hlopko ArrayRef<syntax::Token> Range, const syntax::Token *TemplateKW, 950a711a3a4SMarcel Hlopko ArrayRef<syntax::Token> TemplatedDeclaration, Decl *From) { 95188bf9b3dSMarcel Hlopko assert(TemplateKW && TemplateKW->kind() == tok::kw_template); 95288bf9b3dSMarcel Hlopko Builder.markChildToken(TemplateKW, syntax::NodeRole::IntroducerKeyword); 953a711a3a4SMarcel Hlopko 954a711a3a4SMarcel Hlopko auto *N = new (allocator()) syntax::TemplateDeclaration; 955a711a3a4SMarcel Hlopko Builder.foldNode(Range, N, From); 956*cdce2fe5SMarcel Hlopko Builder.markChild(N, syntax::NodeRole::TemplateDeclaration_declaration); 957a711a3a4SMarcel Hlopko return N; 95888bf9b3dSMarcel Hlopko } 95988bf9b3dSMarcel Hlopko 9609b3f38f9SIlya Biryukov /// A small helper to save some typing. 9619b3f38f9SIlya Biryukov llvm::BumpPtrAllocator &allocator() { return Builder.allocator(); } 9629b3f38f9SIlya Biryukov 9639b3f38f9SIlya Biryukov syntax::TreeBuilder &Builder; 9649b3f38f9SIlya Biryukov const LangOptions &LangOpts; 9659b3f38f9SIlya Biryukov }; 9669b3f38f9SIlya Biryukov } // namespace 9679b3f38f9SIlya Biryukov 9687d382dcdSMarcel Hlopko void syntax::TreeBuilder::noticeDeclWithoutSemicolon(Decl *D) { 969e702bdb8SIlya Biryukov DeclsWithoutSemicolons.insert(D); 970e702bdb8SIlya Biryukov } 971e702bdb8SIlya Biryukov 972def65bb4SIlya Biryukov void syntax::TreeBuilder::markChildToken(SourceLocation Loc, NodeRole Role) { 9739b3f38f9SIlya Biryukov if (Loc.isInvalid()) 9749b3f38f9SIlya Biryukov return; 9759b3f38f9SIlya Biryukov Pending.assignRole(*findToken(Loc), Role); 9769b3f38f9SIlya Biryukov } 9779b3f38f9SIlya Biryukov 9787d382dcdSMarcel Hlopko void syntax::TreeBuilder::markChildToken(const syntax::Token *T, NodeRole R) { 9797d382dcdSMarcel Hlopko if (!T) 9807d382dcdSMarcel Hlopko return; 9817d382dcdSMarcel Hlopko Pending.assignRole(*T, R); 9827d382dcdSMarcel Hlopko } 9837d382dcdSMarcel Hlopko 984a711a3a4SMarcel Hlopko void 
syntax::TreeBuilder::markChild(syntax::Node *N, NodeRole R) { 985a711a3a4SMarcel Hlopko assert(N); 986a711a3a4SMarcel Hlopko setRole(N, R); 987a711a3a4SMarcel Hlopko } 988a711a3a4SMarcel Hlopko 989a711a3a4SMarcel Hlopko void syntax::TreeBuilder::markChild(ASTPtr N, NodeRole R) { 990a711a3a4SMarcel Hlopko auto *SN = Mapping.find(N); 991a711a3a4SMarcel Hlopko assert(SN != nullptr); 992a711a3a4SMarcel Hlopko setRole(SN, R); 9937d382dcdSMarcel Hlopko } 9947d382dcdSMarcel Hlopko 99558fa50f4SIlya Biryukov void syntax::TreeBuilder::markStmtChild(Stmt *Child, NodeRole Role) { 99658fa50f4SIlya Biryukov if (!Child) 99758fa50f4SIlya Biryukov return; 99858fa50f4SIlya Biryukov 999a711a3a4SMarcel Hlopko syntax::Tree *ChildNode = Mapping.find(Child); 1000a711a3a4SMarcel Hlopko assert(ChildNode != nullptr); 1001a711a3a4SMarcel Hlopko 100258fa50f4SIlya Biryukov // This is an expression in a statement position, consume the trailing 100358fa50f4SIlya Biryukov // semicolon and form an 'ExpressionStatement' node. 1004896fa30fSSimon Pilgrim if (isa<Expr>(Child)) { 1005a711a3a4SMarcel Hlopko setRole(ChildNode, NodeRole::ExpressionStatement_expression); 1006a711a3a4SMarcel Hlopko ChildNode = new (allocator()) syntax::ExpressionStatement; 1007a711a3a4SMarcel Hlopko // (!) 'getStmtRange()' ensures this covers a trailing semicolon. 
1008a711a3a4SMarcel Hlopko Pending.foldChildren(Arena, getStmtRange(Child), ChildNode); 100958fa50f4SIlya Biryukov } 1010a711a3a4SMarcel Hlopko setRole(ChildNode, Role); 101158fa50f4SIlya Biryukov } 101258fa50f4SIlya Biryukov 101358fa50f4SIlya Biryukov void syntax::TreeBuilder::markExprChild(Expr *Child, NodeRole Role) { 1014be14a22bSIlya Biryukov if (!Child) 1015be14a22bSIlya Biryukov return; 1016a711a3a4SMarcel Hlopko Child = Child->IgnoreImplicit(); 1017be14a22bSIlya Biryukov 1018a711a3a4SMarcel Hlopko syntax::Tree *ChildNode = Mapping.find(Child); 1019a711a3a4SMarcel Hlopko assert(ChildNode != nullptr); 1020a711a3a4SMarcel Hlopko setRole(ChildNode, Role); 102158fa50f4SIlya Biryukov } 102258fa50f4SIlya Biryukov 10239b3f38f9SIlya Biryukov const syntax::Token *syntax::TreeBuilder::findToken(SourceLocation L) const { 102488bf9b3dSMarcel Hlopko if (L.isInvalid()) 102588bf9b3dSMarcel Hlopko return nullptr; 1026c1bbefefSIlya Biryukov auto It = LocationToToken.find(L.getRawEncoding()); 1027c1bbefefSIlya Biryukov assert(It != LocationToToken.end()); 1028c1bbefefSIlya Biryukov return It->second; 10299b3f38f9SIlya Biryukov } 10309b3f38f9SIlya Biryukov 10319b3f38f9SIlya Biryukov syntax::TranslationUnit * 10329b3f38f9SIlya Biryukov syntax::buildSyntaxTree(Arena &A, const TranslationUnitDecl &TU) { 10339b3f38f9SIlya Biryukov TreeBuilder Builder(A); 10349b3f38f9SIlya Biryukov BuildTreeVisitor(TU.getASTContext(), Builder).TraverseAST(TU.getASTContext()); 10359b3f38f9SIlya Biryukov return std::move(Builder).finalize(); 10369b3f38f9SIlya Biryukov } 1037