19b3f38f9SIlya Biryukov //===- BuildTree.cpp ------------------------------------------*- C++ -*-=====// 29b3f38f9SIlya Biryukov // 39b3f38f9SIlya Biryukov // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 49b3f38f9SIlya Biryukov // See https://llvm.org/LICENSE.txt for license information. 59b3f38f9SIlya Biryukov // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 69b3f38f9SIlya Biryukov // 79b3f38f9SIlya Biryukov //===----------------------------------------------------------------------===// 89b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/BuildTree.h" 97d382dcdSMarcel Hlopko #include "clang/AST/ASTFwd.h" 10e702bdb8SIlya Biryukov #include "clang/AST/Decl.h" 11e702bdb8SIlya Biryukov #include "clang/AST/DeclBase.h" 127d382dcdSMarcel Hlopko #include "clang/AST/DeclCXX.h" 137d382dcdSMarcel Hlopko #include "clang/AST/DeclarationName.h" 143785eb83SEduardo Caldas #include "clang/AST/Expr.h" 159b3f38f9SIlya Biryukov #include "clang/AST/RecursiveASTVisitor.h" 169b3f38f9SIlya Biryukov #include "clang/AST/Stmt.h" 177d382dcdSMarcel Hlopko #include "clang/AST/TypeLoc.h" 187d382dcdSMarcel Hlopko #include "clang/AST/TypeLocVisitor.h" 199b3f38f9SIlya Biryukov #include "clang/Basic/LLVM.h" 209b3f38f9SIlya Biryukov #include "clang/Basic/SourceLocation.h" 219b3f38f9SIlya Biryukov #include "clang/Basic/SourceManager.h" 2288bf9b3dSMarcel Hlopko #include "clang/Basic/Specifiers.h" 239b3f38f9SIlya Biryukov #include "clang/Basic/TokenKinds.h" 249b3f38f9SIlya Biryukov #include "clang/Lex/Lexer.h" 259b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/Nodes.h" 269b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/Tokens.h" 279b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/Tree.h" 289b3f38f9SIlya Biryukov #include "llvm/ADT/ArrayRef.h" 29a711a3a4SMarcel Hlopko #include "llvm/ADT/DenseMap.h" 30a711a3a4SMarcel Hlopko #include "llvm/ADT/PointerUnion.h" 319b3f38f9SIlya Biryukov #include "llvm/ADT/STLExtras.h" 327d382dcdSMarcel Hlopko #include "llvm/ADT/ScopeExit.h" 339b3f38f9SIlya Biryukov #include "llvm/ADT/SmallVector.h" 349b3f38f9SIlya Biryukov #include "llvm/Support/Allocator.h" 359b3f38f9SIlya Biryukov #include "llvm/Support/Casting.h" 3696065cf7SIlya Biryukov #include "llvm/Support/Compiler.h" 379b3f38f9SIlya Biryukov #include "llvm/Support/FormatVariadic.h" 381ad15046SIlya Biryukov #include "llvm/Support/MemoryBuffer.h" 399b3f38f9SIlya Biryukov #include "llvm/Support/raw_ostream.h" 40a711a3a4SMarcel Hlopko #include <cstddef> 419b3f38f9SIlya Biryukov #include <map> 429b3f38f9SIlya Biryukov 439b3f38f9SIlya Biryukov using namespace clang; 449b3f38f9SIlya Biryukov 4596065cf7SIlya Biryukov LLVM_ATTRIBUTE_UNUSED 4658fa50f4SIlya Biryukov static bool isImplicitExpr(clang::Expr *E) { return E->IgnoreImplicit() != E; } 4758fa50f4SIlya Biryukov 487d382dcdSMarcel Hlopko namespace { 497d382dcdSMarcel Hlopko /// Get start location of the Declarator from the TypeLoc. 507d382dcdSMarcel Hlopko /// E.g.: 517d382dcdSMarcel Hlopko /// loc of `(` in `int (a)` 527d382dcdSMarcel Hlopko /// loc of `*` in `int *(a)` 537d382dcdSMarcel Hlopko /// loc of the first `(` in `int (*a)(int)` 547d382dcdSMarcel Hlopko /// loc of the `*` in `int *(a)(int)` 557d382dcdSMarcel Hlopko /// loc of the first `*` in `const int *const *volatile a;` 567d382dcdSMarcel Hlopko /// 577d382dcdSMarcel Hlopko /// It is non-trivial to get the start location because TypeLocs are stored 587d382dcdSMarcel Hlopko /// inside out. In the example above `*volatile` is the TypeLoc returned 597d382dcdSMarcel Hlopko /// by `Decl.getTypeSourceInfo()`, and `*const` is what `.getPointeeLoc()` 607d382dcdSMarcel Hlopko /// returns. 617d382dcdSMarcel Hlopko struct GetStartLoc : TypeLocVisitor<GetStartLoc, SourceLocation> { 627d382dcdSMarcel Hlopko SourceLocation VisitParenTypeLoc(ParenTypeLoc T) { 637d382dcdSMarcel Hlopko auto L = Visit(T.getInnerLoc()); 647d382dcdSMarcel Hlopko if (L.isValid()) 657d382dcdSMarcel Hlopko return L; 667d382dcdSMarcel Hlopko return T.getLParenLoc(); 677d382dcdSMarcel Hlopko } 687d382dcdSMarcel Hlopko 697d382dcdSMarcel Hlopko // Types spelled in the prefix part of the declarator. 707d382dcdSMarcel Hlopko SourceLocation VisitPointerTypeLoc(PointerTypeLoc T) { 717d382dcdSMarcel Hlopko return HandlePointer(T); 727d382dcdSMarcel Hlopko } 737d382dcdSMarcel Hlopko 747d382dcdSMarcel Hlopko SourceLocation VisitMemberPointerTypeLoc(MemberPointerTypeLoc T) { 757d382dcdSMarcel Hlopko return HandlePointer(T); 767d382dcdSMarcel Hlopko } 777d382dcdSMarcel Hlopko 787d382dcdSMarcel Hlopko SourceLocation VisitBlockPointerTypeLoc(BlockPointerTypeLoc T) { 797d382dcdSMarcel Hlopko return HandlePointer(T); 807d382dcdSMarcel Hlopko } 817d382dcdSMarcel Hlopko 827d382dcdSMarcel Hlopko SourceLocation VisitReferenceTypeLoc(ReferenceTypeLoc T) { 837d382dcdSMarcel Hlopko return HandlePointer(T); 847d382dcdSMarcel Hlopko } 857d382dcdSMarcel Hlopko 867d382dcdSMarcel Hlopko SourceLocation VisitObjCObjectPointerTypeLoc(ObjCObjectPointerTypeLoc T) { 877d382dcdSMarcel Hlopko return HandlePointer(T); 887d382dcdSMarcel Hlopko } 897d382dcdSMarcel Hlopko 907d382dcdSMarcel Hlopko // All other cases are not important, as they are either part of declaration 917d382dcdSMarcel Hlopko // specifiers (e.g. inheritors of TypeSpecTypeLoc) or introduce modifiers on 927d382dcdSMarcel Hlopko // existing declarators (e.g. QualifiedTypeLoc). They cannot start the 937d382dcdSMarcel Hlopko // declarator themselves, but their underlying type can. 947d382dcdSMarcel Hlopko SourceLocation VisitTypeLoc(TypeLoc T) { 957d382dcdSMarcel Hlopko auto N = T.getNextTypeLoc(); 967d382dcdSMarcel Hlopko if (!N) 977d382dcdSMarcel Hlopko return SourceLocation(); 987d382dcdSMarcel Hlopko return Visit(N); 997d382dcdSMarcel Hlopko } 1007d382dcdSMarcel Hlopko 1017d382dcdSMarcel Hlopko SourceLocation VisitFunctionProtoTypeLoc(FunctionProtoTypeLoc T) { 1027d382dcdSMarcel Hlopko if (T.getTypePtr()->hasTrailingReturn()) 1037d382dcdSMarcel Hlopko return SourceLocation(); // avoid recursing into the suffix of declarator. 1047d382dcdSMarcel Hlopko return VisitTypeLoc(T); 1057d382dcdSMarcel Hlopko } 1067d382dcdSMarcel Hlopko 1077d382dcdSMarcel Hlopko private: 1087d382dcdSMarcel Hlopko template <class PtrLoc> SourceLocation HandlePointer(PtrLoc T) { 1097d382dcdSMarcel Hlopko auto L = Visit(T.getPointeeLoc()); 1107d382dcdSMarcel Hlopko if (L.isValid()) 1117d382dcdSMarcel Hlopko return L; 1127d382dcdSMarcel Hlopko return T.getLocalSourceRange().getBegin(); 1137d382dcdSMarcel Hlopko } 1147d382dcdSMarcel Hlopko }; 1157d382dcdSMarcel Hlopko } // namespace 1167d382dcdSMarcel Hlopko 1177d382dcdSMarcel Hlopko /// Gets the range of declarator as defined by the C++ grammar. E.g. 1187d382dcdSMarcel Hlopko /// `int a;` -> range of `a`, 1197d382dcdSMarcel Hlopko /// `int *a;` -> range of `*a`, 1207d382dcdSMarcel Hlopko /// `int a[10];` -> range of `a[10]`, 1217d382dcdSMarcel Hlopko /// `int a[1][2][3];` -> range of `a[1][2][3]`, 1227d382dcdSMarcel Hlopko /// `int *a = nullptr` -> range of `*a = nullptr`. 1237d382dcdSMarcel Hlopko /// FIMXE: \p Name must be a source range, e.g. for `operator+`. 1247d382dcdSMarcel Hlopko static SourceRange getDeclaratorRange(const SourceManager &SM, TypeLoc T, 1257d382dcdSMarcel Hlopko SourceLocation Name, 1267d382dcdSMarcel Hlopko SourceRange Initializer) { 1277d382dcdSMarcel Hlopko SourceLocation Start = GetStartLoc().Visit(T); 1287d382dcdSMarcel Hlopko SourceLocation End = T.getSourceRange().getEnd(); 1297d382dcdSMarcel Hlopko assert(End.isValid()); 1307d382dcdSMarcel Hlopko if (Name.isValid()) { 1317d382dcdSMarcel Hlopko if (Start.isInvalid()) 1327d382dcdSMarcel Hlopko Start = Name; 1337d382dcdSMarcel Hlopko if (SM.isBeforeInTranslationUnit(End, Name)) 1347d382dcdSMarcel Hlopko End = Name; 1357d382dcdSMarcel Hlopko } 1367d382dcdSMarcel Hlopko if (Initializer.isValid()) { 137cdce2fe5SMarcel Hlopko auto InitializerEnd = Initializer.getEnd(); 138cdce2fe5SMarcel Hlopko assert(SM.isBeforeInTranslationUnit(End, InitializerEnd) || End == InitializerEnd); 139cdce2fe5SMarcel Hlopko End = InitializerEnd; 1407d382dcdSMarcel Hlopko } 1417d382dcdSMarcel Hlopko return SourceRange(Start, End); 1427d382dcdSMarcel Hlopko } 1437d382dcdSMarcel Hlopko 144a711a3a4SMarcel Hlopko namespace { 145a711a3a4SMarcel Hlopko /// All AST hierarchy roots that can be represented as pointers. 146a711a3a4SMarcel Hlopko using ASTPtr = llvm::PointerUnion<Stmt *, Decl *>; 147a711a3a4SMarcel Hlopko /// Maintains a mapping from AST to syntax tree nodes. This class will get more 148a711a3a4SMarcel Hlopko /// complicated as we support more kinds of AST nodes, e.g. TypeLocs. 149a711a3a4SMarcel Hlopko /// FIXME: expose this as public API. 150a711a3a4SMarcel Hlopko class ASTToSyntaxMapping { 151a711a3a4SMarcel Hlopko public: 152a711a3a4SMarcel Hlopko void add(ASTPtr From, syntax::Tree *To) { 153a711a3a4SMarcel Hlopko assert(To != nullptr); 154a711a3a4SMarcel Hlopko assert(!From.isNull()); 155a711a3a4SMarcel Hlopko 156a711a3a4SMarcel Hlopko bool Added = Nodes.insert({From, To}).second; 157a711a3a4SMarcel Hlopko (void)Added; 158a711a3a4SMarcel Hlopko assert(Added && "mapping added twice"); 159a711a3a4SMarcel Hlopko } 160a711a3a4SMarcel Hlopko 161a711a3a4SMarcel Hlopko syntax::Tree *find(ASTPtr P) const { return Nodes.lookup(P); } 162a711a3a4SMarcel Hlopko 163a711a3a4SMarcel Hlopko private: 164a711a3a4SMarcel Hlopko llvm::DenseMap<ASTPtr, syntax::Tree *> Nodes; 165a711a3a4SMarcel Hlopko }; 166a711a3a4SMarcel Hlopko } // namespace 167a711a3a4SMarcel Hlopko 1689b3f38f9SIlya Biryukov /// A helper class for constructing the syntax tree while traversing a clang 1699b3f38f9SIlya Biryukov /// AST. 1709b3f38f9SIlya Biryukov /// 1719b3f38f9SIlya Biryukov /// At each point of the traversal we maintain a list of pending nodes. 1729b3f38f9SIlya Biryukov /// Initially all tokens are added as pending nodes. When processing a clang AST 1739b3f38f9SIlya Biryukov /// node, the clients need to: 1749b3f38f9SIlya Biryukov /// - create a corresponding syntax node, 1759b3f38f9SIlya Biryukov /// - assign roles to all pending child nodes with 'markChild' and 1769b3f38f9SIlya Biryukov /// 'markChildToken', 1779b3f38f9SIlya Biryukov /// - replace the child nodes with the new syntax node in the pending list 1789b3f38f9SIlya Biryukov /// with 'foldNode'. 1799b3f38f9SIlya Biryukov /// 1809b3f38f9SIlya Biryukov /// Note that all children are expected to be processed when building a node. 1819b3f38f9SIlya Biryukov /// 1829b3f38f9SIlya Biryukov /// Call finalize() to finish building the tree and consume the root node. 1839b3f38f9SIlya Biryukov class syntax::TreeBuilder { 1849b3f38f9SIlya Biryukov public: 185c1bbefefSIlya Biryukov TreeBuilder(syntax::Arena &Arena) : Arena(Arena), Pending(Arena) { 186c1bbefefSIlya Biryukov for (const auto &T : Arena.tokenBuffer().expandedTokens()) 187c1bbefefSIlya Biryukov LocationToToken.insert({T.location().getRawEncoding(), &T}); 188c1bbefefSIlya Biryukov } 1899b3f38f9SIlya Biryukov 1909b3f38f9SIlya Biryukov llvm::BumpPtrAllocator &allocator() { return Arena.allocator(); } 1917d382dcdSMarcel Hlopko const SourceManager &sourceManager() const { return Arena.sourceManager(); } 1929b3f38f9SIlya Biryukov 1939b3f38f9SIlya Biryukov /// Populate children for \p New node, assuming it covers tokens from \p 1949b3f38f9SIlya Biryukov /// Range. 195a711a3a4SMarcel Hlopko void foldNode(llvm::ArrayRef<syntax::Token> Range, syntax::Tree *New, 196a711a3a4SMarcel Hlopko ASTPtr From) { 197a711a3a4SMarcel Hlopko assert(New); 198a711a3a4SMarcel Hlopko Pending.foldChildren(Arena, Range, New); 199a711a3a4SMarcel Hlopko if (From) 200a711a3a4SMarcel Hlopko Mapping.add(From, New); 201a711a3a4SMarcel Hlopko } 202a711a3a4SMarcel Hlopko void foldNode(llvm::ArrayRef<syntax::Token> Range, syntax::Tree *New, 203a711a3a4SMarcel Hlopko TypeLoc L) { 204a711a3a4SMarcel Hlopko // FIXME: add mapping for TypeLocs 205a711a3a4SMarcel Hlopko foldNode(Range, New, nullptr); 206a711a3a4SMarcel Hlopko } 2079b3f38f9SIlya Biryukov 208e702bdb8SIlya Biryukov /// Notifies that we should not consume trailing semicolon when computing 209e702bdb8SIlya Biryukov /// token range of \p D. 2107d382dcdSMarcel Hlopko void noticeDeclWithoutSemicolon(Decl *D); 211e702bdb8SIlya Biryukov 21258fa50f4SIlya Biryukov /// Mark the \p Child node with a corresponding \p Role. All marked children 21358fa50f4SIlya Biryukov /// should be consumed by foldNode. 2147d382dcdSMarcel Hlopko /// When called on expressions (clang::Expr is derived from clang::Stmt), 21558fa50f4SIlya Biryukov /// wraps expressions into expression statement. 21658fa50f4SIlya Biryukov void markStmtChild(Stmt *Child, NodeRole Role); 21758fa50f4SIlya Biryukov /// Should be called for expressions in non-statement position to avoid 21858fa50f4SIlya Biryukov /// wrapping into expression statement. 21958fa50f4SIlya Biryukov void markExprChild(Expr *Child, NodeRole Role); 2209b3f38f9SIlya Biryukov /// Set role for a token starting at \p Loc. 221def65bb4SIlya Biryukov void markChildToken(SourceLocation Loc, NodeRole R); 2227d382dcdSMarcel Hlopko /// Set role for \p T. 2237d382dcdSMarcel Hlopko void markChildToken(const syntax::Token *T, NodeRole R); 2247d382dcdSMarcel Hlopko 225a711a3a4SMarcel Hlopko /// Set role for \p N. 226a711a3a4SMarcel Hlopko void markChild(syntax::Node *N, NodeRole R); 227a711a3a4SMarcel Hlopko /// Set role for the syntax node matching \p N. 228a711a3a4SMarcel Hlopko void markChild(ASTPtr N, NodeRole R); 2299b3f38f9SIlya Biryukov 2309b3f38f9SIlya Biryukov /// Finish building the tree and consume the root node. 2319b3f38f9SIlya Biryukov syntax::TranslationUnit *finalize() && { 2329b3f38f9SIlya Biryukov auto Tokens = Arena.tokenBuffer().expandedTokens(); 233bfbf6b6cSIlya Biryukov assert(!Tokens.empty()); 234bfbf6b6cSIlya Biryukov assert(Tokens.back().kind() == tok::eof); 235bfbf6b6cSIlya Biryukov 2369b3f38f9SIlya Biryukov // Build the root of the tree, consuming all the children. 2371ad15046SIlya Biryukov Pending.foldChildren(Arena, Tokens.drop_back(), 2389b3f38f9SIlya Biryukov new (Arena.allocator()) syntax::TranslationUnit); 2399b3f38f9SIlya Biryukov 2403b929fe7SIlya Biryukov auto *TU = cast<syntax::TranslationUnit>(std::move(Pending).finalize()); 2413b929fe7SIlya Biryukov TU->assertInvariantsRecursive(); 2423b929fe7SIlya Biryukov return TU; 2439b3f38f9SIlya Biryukov } 2449b3f38f9SIlya Biryukov 24588bf9b3dSMarcel Hlopko /// Finds a token starting at \p L. The token must exist if \p L is valid. 24688bf9b3dSMarcel Hlopko const syntax::Token *findToken(SourceLocation L) const; 24788bf9b3dSMarcel Hlopko 248a711a3a4SMarcel Hlopko /// Finds the syntax tokens corresponding to the \p SourceRange. 249a711a3a4SMarcel Hlopko llvm::ArrayRef<syntax::Token> getRange(SourceRange Range) const { 250a711a3a4SMarcel Hlopko assert(Range.isValid()); 251a711a3a4SMarcel Hlopko return getRange(Range.getBegin(), Range.getEnd()); 252a711a3a4SMarcel Hlopko } 253a711a3a4SMarcel Hlopko 254a711a3a4SMarcel Hlopko /// Finds the syntax tokens corresponding to the passed source locations. 2559b3f38f9SIlya Biryukov /// \p First is the start position of the first token and \p Last is the start 2569b3f38f9SIlya Biryukov /// position of the last token. 2579b3f38f9SIlya Biryukov llvm::ArrayRef<syntax::Token> getRange(SourceLocation First, 2589b3f38f9SIlya Biryukov SourceLocation Last) const { 2599b3f38f9SIlya Biryukov assert(First.isValid()); 2609b3f38f9SIlya Biryukov assert(Last.isValid()); 2619b3f38f9SIlya Biryukov assert(First == Last || 2629b3f38f9SIlya Biryukov Arena.sourceManager().isBeforeInTranslationUnit(First, Last)); 2639b3f38f9SIlya Biryukov return llvm::makeArrayRef(findToken(First), std::next(findToken(Last))); 2649b3f38f9SIlya Biryukov } 26588bf9b3dSMarcel Hlopko 26688bf9b3dSMarcel Hlopko llvm::ArrayRef<syntax::Token> 26788bf9b3dSMarcel Hlopko getTemplateRange(const ClassTemplateSpecializationDecl *D) const { 268a711a3a4SMarcel Hlopko auto Tokens = getRange(D->getSourceRange()); 26988bf9b3dSMarcel Hlopko return maybeAppendSemicolon(Tokens, D); 27088bf9b3dSMarcel Hlopko } 27188bf9b3dSMarcel Hlopko 272cdce2fe5SMarcel Hlopko /// Returns true if \p D is the last declarator in a chain and is thus 273cdce2fe5SMarcel Hlopko /// reponsible for creating SimpleDeclaration for the whole chain. 274cdce2fe5SMarcel Hlopko template <class T> 275cdce2fe5SMarcel Hlopko bool isResponsibleForCreatingDeclaration(const T *D) const { 276cdce2fe5SMarcel Hlopko static_assert((std::is_base_of<DeclaratorDecl, T>::value || 277cdce2fe5SMarcel Hlopko std::is_base_of<TypedefNameDecl, T>::value), 278cdce2fe5SMarcel Hlopko "only DeclaratorDecl and TypedefNameDecl are supported."); 279cdce2fe5SMarcel Hlopko 280cdce2fe5SMarcel Hlopko const Decl *Next = D->getNextDeclInContext(); 281cdce2fe5SMarcel Hlopko 282cdce2fe5SMarcel Hlopko // There's no next sibling, this one is responsible. 283cdce2fe5SMarcel Hlopko if (Next == nullptr) { 284cdce2fe5SMarcel Hlopko return true; 285cdce2fe5SMarcel Hlopko } 286cdce2fe5SMarcel Hlopko const auto *NextT = llvm::dyn_cast<T>(Next); 287cdce2fe5SMarcel Hlopko 288cdce2fe5SMarcel Hlopko // Next sibling is not the same type, this one is responsible. 289cdce2fe5SMarcel Hlopko if (NextT == nullptr) { 290cdce2fe5SMarcel Hlopko return true; 291cdce2fe5SMarcel Hlopko } 292cdce2fe5SMarcel Hlopko // Next sibling doesn't begin at the same loc, it must be a different 293cdce2fe5SMarcel Hlopko // declaration, so this declarator is responsible. 294cdce2fe5SMarcel Hlopko if (NextT->getBeginLoc() != D->getBeginLoc()) { 295cdce2fe5SMarcel Hlopko return true; 296cdce2fe5SMarcel Hlopko } 297cdce2fe5SMarcel Hlopko 298cdce2fe5SMarcel Hlopko // NextT is a member of the same declaration, and we need the last member to 299cdce2fe5SMarcel Hlopko // create declaration. This one is not responsible. 300cdce2fe5SMarcel Hlopko return false; 301cdce2fe5SMarcel Hlopko } 302cdce2fe5SMarcel Hlopko 303cdce2fe5SMarcel Hlopko llvm::ArrayRef<syntax::Token> getDeclarationRange(Decl *D) { 30488bf9b3dSMarcel Hlopko llvm::ArrayRef<clang::syntax::Token> Tokens; 30588bf9b3dSMarcel Hlopko // We want to drop the template parameters for specializations. 30688bf9b3dSMarcel Hlopko if (const auto *S = llvm::dyn_cast<TagDecl>(D)) 30788bf9b3dSMarcel Hlopko Tokens = getRange(S->TypeDecl::getBeginLoc(), S->getEndLoc()); 30888bf9b3dSMarcel Hlopko else 309a711a3a4SMarcel Hlopko Tokens = getRange(D->getSourceRange()); 31088bf9b3dSMarcel Hlopko return maybeAppendSemicolon(Tokens, D); 3119b3f38f9SIlya Biryukov } 312cdce2fe5SMarcel Hlopko 31358fa50f4SIlya Biryukov llvm::ArrayRef<syntax::Token> getExprRange(const Expr *E) const { 314a711a3a4SMarcel Hlopko return getRange(E->getSourceRange()); 31558fa50f4SIlya Biryukov } 316cdce2fe5SMarcel Hlopko 31758fa50f4SIlya Biryukov /// Find the adjusted range for the statement, consuming the trailing 31858fa50f4SIlya Biryukov /// semicolon when needed. 31958fa50f4SIlya Biryukov llvm::ArrayRef<syntax::Token> getStmtRange(const Stmt *S) const { 320a711a3a4SMarcel Hlopko auto Tokens = getRange(S->getSourceRange()); 32158fa50f4SIlya Biryukov if (isa<CompoundStmt>(S)) 32258fa50f4SIlya Biryukov return Tokens; 32358fa50f4SIlya Biryukov 32458fa50f4SIlya Biryukov // Some statements miss a trailing semicolon, e.g. 'return', 'continue' and 32558fa50f4SIlya Biryukov // all statements that end with those. Consume this semicolon here. 326e702bdb8SIlya Biryukov if (Tokens.back().kind() == tok::semi) 327e702bdb8SIlya Biryukov return Tokens; 328e702bdb8SIlya Biryukov return withTrailingSemicolon(Tokens); 329e702bdb8SIlya Biryukov } 330e702bdb8SIlya Biryukov 331e702bdb8SIlya Biryukov private: 332e702bdb8SIlya Biryukov llvm::ArrayRef<syntax::Token> 33388bf9b3dSMarcel Hlopko maybeAppendSemicolon(llvm::ArrayRef<syntax::Token> Tokens, 33488bf9b3dSMarcel Hlopko const Decl *D) const { 33588bf9b3dSMarcel Hlopko if (llvm::isa<NamespaceDecl>(D)) 33688bf9b3dSMarcel Hlopko return Tokens; 33788bf9b3dSMarcel Hlopko if (DeclsWithoutSemicolons.count(D)) 33888bf9b3dSMarcel Hlopko return Tokens; 33988bf9b3dSMarcel Hlopko // FIXME: do not consume trailing semicolon on function definitions. 34088bf9b3dSMarcel Hlopko // Most declarations own a semicolon in syntax trees, but not in clang AST. 34188bf9b3dSMarcel Hlopko return withTrailingSemicolon(Tokens); 34288bf9b3dSMarcel Hlopko } 34388bf9b3dSMarcel Hlopko 34488bf9b3dSMarcel Hlopko llvm::ArrayRef<syntax::Token> 345e702bdb8SIlya Biryukov withTrailingSemicolon(llvm::ArrayRef<syntax::Token> Tokens) const { 346e702bdb8SIlya Biryukov assert(!Tokens.empty()); 347e702bdb8SIlya Biryukov assert(Tokens.back().kind() != tok::eof); 3487d382dcdSMarcel Hlopko // We never consume 'eof', so looking at the next token is ok. 34958fa50f4SIlya Biryukov if (Tokens.back().kind() != tok::semi && Tokens.end()->kind() == tok::semi) 35058fa50f4SIlya Biryukov return llvm::makeArrayRef(Tokens.begin(), Tokens.end() + 1); 35158fa50f4SIlya Biryukov return Tokens; 3529b3f38f9SIlya Biryukov } 3539b3f38f9SIlya Biryukov 354a711a3a4SMarcel Hlopko void setRole(syntax::Node *N, NodeRole R) { 355a711a3a4SMarcel Hlopko assert(N->role() == NodeRole::Detached); 356a711a3a4SMarcel Hlopko N->setRole(R); 357a711a3a4SMarcel Hlopko } 358a711a3a4SMarcel Hlopko 3599b3f38f9SIlya Biryukov /// A collection of trees covering the input tokens. 3609b3f38f9SIlya Biryukov /// When created, each tree corresponds to a single token in the file. 3619b3f38f9SIlya Biryukov /// Clients call 'foldChildren' to attach one or more subtrees to a parent 3629b3f38f9SIlya Biryukov /// node and update the list of trees accordingly. 3639b3f38f9SIlya Biryukov /// 3649b3f38f9SIlya Biryukov /// Ensures that added nodes properly nest and cover the whole token stream. 3659b3f38f9SIlya Biryukov struct Forest { 3669b3f38f9SIlya Biryukov Forest(syntax::Arena &A) { 367bfbf6b6cSIlya Biryukov assert(!A.tokenBuffer().expandedTokens().empty()); 368bfbf6b6cSIlya Biryukov assert(A.tokenBuffer().expandedTokens().back().kind() == tok::eof); 3699b3f38f9SIlya Biryukov // Create all leaf nodes. 370bfbf6b6cSIlya Biryukov // Note that we do not have 'eof' in the tree. 3711ad15046SIlya Biryukov for (auto &T : A.tokenBuffer().expandedTokens().drop_back()) { 3721ad15046SIlya Biryukov auto *L = new (A.allocator()) syntax::Leaf(&T); 3731ad15046SIlya Biryukov L->Original = true; 3741ad15046SIlya Biryukov L->CanModify = A.tokenBuffer().spelledForExpanded(T).hasValue(); 375a711a3a4SMarcel Hlopko Trees.insert(Trees.end(), {&T, L}); 3761ad15046SIlya Biryukov } 3779b3f38f9SIlya Biryukov } 3789b3f38f9SIlya Biryukov 3799b3f38f9SIlya Biryukov void assignRole(llvm::ArrayRef<syntax::Token> Range, 3809b3f38f9SIlya Biryukov syntax::NodeRole Role) { 3819b3f38f9SIlya Biryukov assert(!Range.empty()); 3829b3f38f9SIlya Biryukov auto It = Trees.lower_bound(Range.begin()); 3839b3f38f9SIlya Biryukov assert(It != Trees.end() && "no node found"); 3849b3f38f9SIlya Biryukov assert(It->first == Range.begin() && "no child with the specified range"); 3859b3f38f9SIlya Biryukov assert((std::next(It) == Trees.end() || 3869b3f38f9SIlya Biryukov std::next(It)->first == Range.end()) && 3879b3f38f9SIlya Biryukov "no child with the specified range"); 388a711a3a4SMarcel Hlopko assert(It->second->role() == NodeRole::Detached && 389a711a3a4SMarcel Hlopko "re-assigning role for a child"); 390a711a3a4SMarcel Hlopko It->second->setRole(Role); 3919b3f38f9SIlya Biryukov } 3929b3f38f9SIlya Biryukov 393e702bdb8SIlya Biryukov /// Add \p Node to the forest and attach child nodes based on \p Tokens. 3941ad15046SIlya Biryukov void foldChildren(const syntax::Arena &A, 3951ad15046SIlya Biryukov llvm::ArrayRef<syntax::Token> Tokens, 3969b3f38f9SIlya Biryukov syntax::Tree *Node) { 397e702bdb8SIlya Biryukov // Attach children to `Node`. 398cdce2fe5SMarcel Hlopko assert(Node->firstChild() == nullptr && "node already has children"); 399cdce2fe5SMarcel Hlopko 400cdce2fe5SMarcel Hlopko auto *FirstToken = Tokens.begin(); 401cdce2fe5SMarcel Hlopko auto BeginChildren = Trees.lower_bound(FirstToken); 402cdce2fe5SMarcel Hlopko 403cdce2fe5SMarcel Hlopko assert((BeginChildren == Trees.end() || 404cdce2fe5SMarcel Hlopko BeginChildren->first == FirstToken) && 405cdce2fe5SMarcel Hlopko "fold crosses boundaries of existing subtrees"); 406cdce2fe5SMarcel Hlopko auto EndChildren = Trees.lower_bound(Tokens.end()); 407cdce2fe5SMarcel Hlopko assert( 408cdce2fe5SMarcel Hlopko (EndChildren == Trees.end() || EndChildren->first == Tokens.end()) && 409cdce2fe5SMarcel Hlopko "fold crosses boundaries of existing subtrees"); 410cdce2fe5SMarcel Hlopko 411cdce2fe5SMarcel Hlopko // We need to go in reverse order, because we can only prepend. 412cdce2fe5SMarcel Hlopko for (auto It = EndChildren; It != BeginChildren; --It) { 413cdce2fe5SMarcel Hlopko auto *C = std::prev(It)->second; 414cdce2fe5SMarcel Hlopko if (C->role() == NodeRole::Detached) 415cdce2fe5SMarcel Hlopko C->setRole(NodeRole::Unknown); 416cdce2fe5SMarcel Hlopko Node->prependChildLowLevel(C); 417e702bdb8SIlya Biryukov } 4189b3f38f9SIlya Biryukov 419cdce2fe5SMarcel Hlopko // Mark that this node came from the AST and is backed by the source code. 420cdce2fe5SMarcel Hlopko Node->Original = true; 421cdce2fe5SMarcel Hlopko Node->CanModify = A.tokenBuffer().spelledForExpanded(Tokens).hasValue(); 4229b3f38f9SIlya Biryukov 423cdce2fe5SMarcel Hlopko Trees.erase(BeginChildren, EndChildren); 424cdce2fe5SMarcel Hlopko Trees.insert({FirstToken, Node}); 4259b3f38f9SIlya Biryukov } 4269b3f38f9SIlya Biryukov 4279b3f38f9SIlya Biryukov // EXPECTS: all tokens were consumed and are owned by a single root node. 4289b3f38f9SIlya Biryukov syntax::Node *finalize() && { 4299b3f38f9SIlya Biryukov assert(Trees.size() == 1); 430a711a3a4SMarcel Hlopko auto *Root = Trees.begin()->second; 4319b3f38f9SIlya Biryukov Trees = {}; 4329b3f38f9SIlya Biryukov return Root; 4339b3f38f9SIlya Biryukov } 4349b3f38f9SIlya Biryukov 4359b3f38f9SIlya Biryukov std::string str(const syntax::Arena &A) const { 4369b3f38f9SIlya Biryukov std::string R; 4379b3f38f9SIlya Biryukov for (auto It = Trees.begin(); It != Trees.end(); ++It) { 4389b3f38f9SIlya Biryukov unsigned CoveredTokens = 4399b3f38f9SIlya Biryukov It != Trees.end() 4409b3f38f9SIlya Biryukov ? (std::next(It)->first - It->first) 4419b3f38f9SIlya Biryukov : A.tokenBuffer().expandedTokens().end() - It->first; 4429b3f38f9SIlya Biryukov 443adcd0268SBenjamin Kramer R += std::string(llvm::formatv( 444a711a3a4SMarcel Hlopko "- '{0}' covers '{1}'+{2} tokens\n", It->second->kind(), 445adcd0268SBenjamin Kramer It->first->text(A.sourceManager()), CoveredTokens)); 446a711a3a4SMarcel Hlopko R += It->second->dump(A); 4479b3f38f9SIlya Biryukov } 4489b3f38f9SIlya Biryukov return R; 4499b3f38f9SIlya Biryukov } 4509b3f38f9SIlya Biryukov 4519b3f38f9SIlya Biryukov private: 4529b3f38f9SIlya Biryukov /// Maps from the start token to a subtree starting at that token. 453302cb3bcSIlya Biryukov /// Keys in the map are pointers into the array of expanded tokens, so 454302cb3bcSIlya Biryukov /// pointer order corresponds to the order of preprocessor tokens. 455a711a3a4SMarcel Hlopko std::map<const syntax::Token *, syntax::Node *> Trees; 4569b3f38f9SIlya Biryukov }; 4579b3f38f9SIlya Biryukov 4589b3f38f9SIlya Biryukov /// For debugging purposes. 4599b3f38f9SIlya Biryukov std::string str() { return Pending.str(Arena); } 4609b3f38f9SIlya Biryukov 4619b3f38f9SIlya Biryukov syntax::Arena &Arena; 462c1bbefefSIlya Biryukov /// To quickly find tokens by their start location. 463c1bbefefSIlya Biryukov llvm::DenseMap</*SourceLocation*/ unsigned, const syntax::Token *> 464c1bbefefSIlya Biryukov LocationToToken; 4659b3f38f9SIlya Biryukov Forest Pending; 466e702bdb8SIlya Biryukov llvm::DenseSet<Decl *> DeclsWithoutSemicolons; 467a711a3a4SMarcel Hlopko ASTToSyntaxMapping Mapping; 4689b3f38f9SIlya Biryukov }; 4699b3f38f9SIlya Biryukov 4709b3f38f9SIlya Biryukov namespace { 4719b3f38f9SIlya Biryukov class BuildTreeVisitor : public RecursiveASTVisitor<BuildTreeVisitor> { 4729b3f38f9SIlya Biryukov public: 4739b3f38f9SIlya Biryukov explicit BuildTreeVisitor(ASTContext &Ctx, syntax::TreeBuilder &Builder) 4749b3f38f9SIlya Biryukov : Builder(Builder), LangOpts(Ctx.getLangOpts()) {} 4759b3f38f9SIlya Biryukov 4769b3f38f9SIlya Biryukov bool shouldTraversePostOrder() const { return true; } 4779b3f38f9SIlya Biryukov 4787d382dcdSMarcel Hlopko bool WalkUpFromDeclaratorDecl(DeclaratorDecl *DD) { 479cdce2fe5SMarcel Hlopko return processDeclaratorAndDeclaration(DD); 4807d382dcdSMarcel Hlopko } 4817d382dcdSMarcel Hlopko 482cdce2fe5SMarcel Hlopko bool WalkUpFromTypedefNameDecl(TypedefNameDecl *TD) { 483cdce2fe5SMarcel Hlopko return processDeclaratorAndDeclaration(TD); 4849b3f38f9SIlya Biryukov } 4859b3f38f9SIlya Biryukov 4869b3f38f9SIlya Biryukov bool VisitDecl(Decl *D) { 4879b3f38f9SIlya Biryukov assert(!D->isImplicit()); 488cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(D), 489a711a3a4SMarcel Hlopko new (allocator()) syntax::UnknownDeclaration(), D); 490e702bdb8SIlya Biryukov return true; 491e702bdb8SIlya Biryukov } 492e702bdb8SIlya Biryukov 49388bf9b3dSMarcel Hlopko // RAV does not call WalkUpFrom* on explicit instantiations, so we have to 49488bf9b3dSMarcel Hlopko // override Traverse. 49588bf9b3dSMarcel Hlopko // FIXME: make RAV call WalkUpFrom* instead. 49688bf9b3dSMarcel Hlopko bool 49788bf9b3dSMarcel Hlopko TraverseClassTemplateSpecializationDecl(ClassTemplateSpecializationDecl *C) { 49888bf9b3dSMarcel Hlopko if (!RecursiveASTVisitor::TraverseClassTemplateSpecializationDecl(C)) 49988bf9b3dSMarcel Hlopko return false; 50088bf9b3dSMarcel Hlopko if (C->isExplicitSpecialization()) 50188bf9b3dSMarcel Hlopko return true; // we are only interested in explicit instantiations. 502a711a3a4SMarcel Hlopko auto *Declaration = 503a711a3a4SMarcel Hlopko cast<syntax::SimpleDeclaration>(handleFreeStandingTagDecl(C)); 50488bf9b3dSMarcel Hlopko foldExplicitTemplateInstantiation( 50588bf9b3dSMarcel Hlopko Builder.getTemplateRange(C), Builder.findToken(C->getExternLoc()), 506a711a3a4SMarcel Hlopko Builder.findToken(C->getTemplateKeywordLoc()), Declaration, C); 50788bf9b3dSMarcel Hlopko return true; 50888bf9b3dSMarcel Hlopko } 50988bf9b3dSMarcel Hlopko 51088bf9b3dSMarcel Hlopko bool WalkUpFromTemplateDecl(TemplateDecl *S) { 51188bf9b3dSMarcel Hlopko foldTemplateDeclaration( 512cdce2fe5SMarcel Hlopko Builder.getDeclarationRange(S), 51388bf9b3dSMarcel Hlopko Builder.findToken(S->getTemplateParameters()->getTemplateLoc()), 514cdce2fe5SMarcel Hlopko Builder.getDeclarationRange(S->getTemplatedDecl()), S); 51588bf9b3dSMarcel Hlopko return true; 51688bf9b3dSMarcel Hlopko } 51788bf9b3dSMarcel Hlopko 518e702bdb8SIlya Biryukov bool WalkUpFromTagDecl(TagDecl *C) { 51904f627f6SIlya Biryukov // FIXME: build the ClassSpecifier node. 52088bf9b3dSMarcel Hlopko if (!C->isFreeStanding()) { 52188bf9b3dSMarcel Hlopko assert(C->getNumTemplateParameterLists() == 0); 52204f627f6SIlya Biryukov return true; 52304f627f6SIlya Biryukov } 524a711a3a4SMarcel Hlopko handleFreeStandingTagDecl(C); 525a711a3a4SMarcel Hlopko return true; 526a711a3a4SMarcel Hlopko } 527a711a3a4SMarcel Hlopko 528a711a3a4SMarcel Hlopko syntax::Declaration *handleFreeStandingTagDecl(TagDecl *C) { 529a711a3a4SMarcel Hlopko assert(C->isFreeStanding()); 53088bf9b3dSMarcel Hlopko // Class is a declaration specifier and needs a spanning declaration node. 531cdce2fe5SMarcel Hlopko auto DeclarationRange = Builder.getDeclarationRange(C); 532a711a3a4SMarcel Hlopko syntax::Declaration *Result = new (allocator()) syntax::SimpleDeclaration; 533a711a3a4SMarcel Hlopko Builder.foldNode(DeclarationRange, Result, nullptr); 53488bf9b3dSMarcel Hlopko 53588bf9b3dSMarcel Hlopko // Build TemplateDeclaration nodes if we had template parameters. 53688bf9b3dSMarcel Hlopko auto ConsumeTemplateParameters = [&](const TemplateParameterList &L) { 53788bf9b3dSMarcel Hlopko const auto *TemplateKW = Builder.findToken(L.getTemplateLoc()); 53888bf9b3dSMarcel Hlopko auto R = llvm::makeArrayRef(TemplateKW, DeclarationRange.end()); 539a711a3a4SMarcel Hlopko Result = 540a711a3a4SMarcel Hlopko foldTemplateDeclaration(R, TemplateKW, DeclarationRange, nullptr); 54188bf9b3dSMarcel Hlopko DeclarationRange = R; 54288bf9b3dSMarcel Hlopko }; 54388bf9b3dSMarcel Hlopko if (auto *S = llvm::dyn_cast<ClassTemplatePartialSpecializationDecl>(C)) 54488bf9b3dSMarcel Hlopko ConsumeTemplateParameters(*S->getTemplateParameters()); 54588bf9b3dSMarcel Hlopko for (unsigned I = C->getNumTemplateParameterLists(); 0 < I; --I) 54688bf9b3dSMarcel Hlopko ConsumeTemplateParameters(*C->getTemplateParameterList(I - 1)); 547a711a3a4SMarcel Hlopko return Result; 5489b3f38f9SIlya Biryukov } 5499b3f38f9SIlya Biryukov 5509b3f38f9SIlya Biryukov bool WalkUpFromTranslationUnitDecl(TranslationUnitDecl *TU) { 5517d382dcdSMarcel Hlopko // We do not want to call VisitDecl(), the declaration for translation 5529b3f38f9SIlya Biryukov // unit is built by finalize(). 5539b3f38f9SIlya Biryukov return true; 5549b3f38f9SIlya Biryukov } 5559b3f38f9SIlya Biryukov 5569b3f38f9SIlya Biryukov bool WalkUpFromCompoundStmt(CompoundStmt *S) { 55751dad419SIlya Biryukov using NodeRole = syntax::NodeRole; 5589b3f38f9SIlya Biryukov 559def65bb4SIlya Biryukov Builder.markChildToken(S->getLBracLoc(), NodeRole::OpenParen); 56058fa50f4SIlya Biryukov for (auto *Child : S->body()) 56158fa50f4SIlya Biryukov Builder.markStmtChild(Child, NodeRole::CompoundStatement_statement); 562def65bb4SIlya Biryukov Builder.markChildToken(S->getRBracLoc(), NodeRole::CloseParen); 5639b3f38f9SIlya Biryukov 56458fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 565a711a3a4SMarcel Hlopko new (allocator()) syntax::CompoundStatement, S); 5669b3f38f9SIlya Biryukov return true; 5679b3f38f9SIlya Biryukov } 5689b3f38f9SIlya Biryukov 56958fa50f4SIlya Biryukov // Some statements are not yet handled by syntax trees. 57058fa50f4SIlya Biryukov bool WalkUpFromStmt(Stmt *S) { 57158fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 572a711a3a4SMarcel Hlopko new (allocator()) syntax::UnknownStatement, S); 57358fa50f4SIlya Biryukov return true; 57458fa50f4SIlya Biryukov } 57558fa50f4SIlya Biryukov 57658fa50f4SIlya Biryukov bool TraverseCXXForRangeStmt(CXXForRangeStmt *S) { 57758fa50f4SIlya Biryukov // We override to traverse range initializer as VarDecl. 57858fa50f4SIlya Biryukov // RAV traverses it as a statement, we produce invalid node kinds in that 57958fa50f4SIlya Biryukov // case. 58058fa50f4SIlya Biryukov // FIXME: should do this in RAV instead? 58158fa50f4SIlya Biryukov if (S->getInit() && !TraverseStmt(S->getInit())) 58258fa50f4SIlya Biryukov return false; 58358fa50f4SIlya Biryukov if (S->getLoopVariable() && !TraverseDecl(S->getLoopVariable())) 58458fa50f4SIlya Biryukov return false; 58558fa50f4SIlya Biryukov if (S->getRangeInit() && !TraverseStmt(S->getRangeInit())) 58658fa50f4SIlya Biryukov return false; 58758fa50f4SIlya Biryukov if (S->getBody() && !TraverseStmt(S->getBody())) 58858fa50f4SIlya Biryukov return false; 58958fa50f4SIlya Biryukov return true; 59058fa50f4SIlya Biryukov } 59158fa50f4SIlya Biryukov 59258fa50f4SIlya Biryukov bool TraverseStmt(Stmt *S) { 593e702bdb8SIlya Biryukov if (auto *DS = llvm::dyn_cast_or_null<DeclStmt>(S)) { 594e702bdb8SIlya Biryukov // We want to consume the semicolon, make sure SimpleDeclaration does not. 595e702bdb8SIlya Biryukov for (auto *D : DS->decls()) 5967d382dcdSMarcel Hlopko Builder.noticeDeclWithoutSemicolon(D); 597e702bdb8SIlya Biryukov } else if (auto *E = llvm::dyn_cast_or_null<Expr>(S)) { 5983785eb83SEduardo Caldas return RecursiveASTVisitor::TraverseStmt(E->IgnoreImplicit()); 59958fa50f4SIlya Biryukov } 60058fa50f4SIlya Biryukov return RecursiveASTVisitor::TraverseStmt(S); 60158fa50f4SIlya Biryukov } 60258fa50f4SIlya Biryukov 60358fa50f4SIlya Biryukov // Some expressions are not yet handled by syntax trees. 60458fa50f4SIlya Biryukov bool WalkUpFromExpr(Expr *E) { 60558fa50f4SIlya Biryukov assert(!isImplicitExpr(E) && "should be handled by TraverseStmt"); 60658fa50f4SIlya Biryukov Builder.foldNode(Builder.getExprRange(E), 607a711a3a4SMarcel Hlopko new (allocator()) syntax::UnknownExpression, E); 60858fa50f4SIlya Biryukov return true; 60958fa50f4SIlya Biryukov } 61058fa50f4SIlya Biryukov 6111b2f6b4aSEduardo Caldas syntax::NestedNameSpecifier * 6121b2f6b4aSEduardo Caldas BuildNestedNameSpecifier(NestedNameSpecifierLoc QualifierLoc) { 6131b2f6b4aSEduardo Caldas if (!QualifierLoc) 6141b2f6b4aSEduardo Caldas return nullptr; 6151b2f6b4aSEduardo Caldas for (auto it = QualifierLoc; it; it = it.getPrefix()) { 6161b2f6b4aSEduardo Caldas auto *NS = new (allocator()) syntax::NameSpecifier; 6171b2f6b4aSEduardo Caldas Builder.foldNode(Builder.getRange(it.getLocalSourceRange()), NS, nullptr); 6181b2f6b4aSEduardo Caldas Builder.markChild(NS, syntax::NodeRole::NestedNameSpecifier_specifier); 6191b2f6b4aSEduardo Caldas } 6201b2f6b4aSEduardo Caldas auto *NNS = new (allocator()) syntax::NestedNameSpecifier; 6211b2f6b4aSEduardo Caldas Builder.foldNode(Builder.getRange(QualifierLoc.getSourceRange()), NNS, 6221b2f6b4aSEduardo Caldas nullptr); 6231b2f6b4aSEduardo Caldas return NNS; 6241b2f6b4aSEduardo Caldas } 6251b2f6b4aSEduardo Caldas 6261b2f6b4aSEduardo Caldas bool WalkUpFromDeclRefExpr(DeclRefExpr *S) { 6271b2f6b4aSEduardo Caldas if (auto *NNS = BuildNestedNameSpecifier(S->getQualifierLoc())) 6281b2f6b4aSEduardo Caldas Builder.markChild(NNS, syntax::NodeRole::IdExpression_qualifier); 6291b2f6b4aSEduardo Caldas 6301b2f6b4aSEduardo Caldas auto *unqualifiedId = new (allocator()) syntax::UnqualifiedId; 6311b2f6b4aSEduardo Caldas // Get `UnqualifiedId` from `DeclRefExpr`. 6321b2f6b4aSEduardo Caldas // FIXME: Extract this logic so that it can be used by `MemberExpr`, 6331b2f6b4aSEduardo Caldas // and other semantic constructs, now it is tied to `DeclRefExpr`. 6341b2f6b4aSEduardo Caldas if (!S->hasExplicitTemplateArgs()) { 6351b2f6b4aSEduardo Caldas Builder.foldNode(Builder.getRange(S->getNameInfo().getSourceRange()), 6361b2f6b4aSEduardo Caldas unqualifiedId, nullptr); 6371b2f6b4aSEduardo Caldas } else { 6381b2f6b4aSEduardo Caldas auto templateIdSourceRange = 6391b2f6b4aSEduardo Caldas SourceRange(S->getNameInfo().getBeginLoc(), S->getRAngleLoc()); 6401b2f6b4aSEduardo Caldas Builder.foldNode(Builder.getRange(templateIdSourceRange), unqualifiedId, 6411b2f6b4aSEduardo Caldas nullptr); 6421b2f6b4aSEduardo Caldas } 6431b2f6b4aSEduardo Caldas Builder.markChild(unqualifiedId, syntax::NodeRole::IdExpression_id); 6441b2f6b4aSEduardo Caldas 6451b2f6b4aSEduardo Caldas Builder.foldNode(Builder.getExprRange(S), 6461b2f6b4aSEduardo Caldas new (allocator()) syntax::IdExpression, S); 6471b2f6b4aSEduardo Caldas return true; 6481b2f6b4aSEduardo Caldas } 6491b2f6b4aSEduardo Caldas 6503b739690SEduardo Caldas bool WalkUpFromIntegerLiteral(IntegerLiteral *S) { 65142f6fec3SEduardo Caldas Builder.markChildToken(S->getLocation(), syntax::NodeRole::LiteralToken); 6523b739690SEduardo Caldas Builder.foldNode(Builder.getExprRange(S), 6533b739690SEduardo Caldas new (allocator()) syntax::IntegerLiteralExpression, S); 6543b739690SEduardo Caldas return true; 6553b739690SEduardo Caldas } 6563b739690SEduardo Caldas 6577f7f8564SEduardo Caldas bool WalkUpFromCXXBoolLiteralExpr(CXXBoolLiteralExpr *S) { 6587f7f8564SEduardo Caldas Builder.markChildToken(S->getLocation(), syntax::NodeRole::LiteralToken); 6597f7f8564SEduardo Caldas Builder.foldNode(Builder.getExprRange(S), 6607f7f8564SEduardo Caldas new (allocator()) syntax::BoolLiteralExpression, S); 6617f7f8564SEduardo Caldas return true; 6627f7f8564SEduardo Caldas } 6637f7f8564SEduardo Caldas 664*221d7bbeSEduardo Caldas bool WalkUpFromCharacterLiteral(CharacterLiteral *S) { 665*221d7bbeSEduardo Caldas Builder.markChildToken(S->getLocation(), syntax::NodeRole::LiteralToken); 666*221d7bbeSEduardo Caldas Builder.foldNode(Builder.getExprRange(S), 667*221d7bbeSEduardo Caldas new (allocator()) syntax::CharacterLiteralExpression, S); 668*221d7bbeSEduardo Caldas return true; 669*221d7bbeSEduardo Caldas } 670*221d7bbeSEduardo Caldas 671007098d7SEduardo Caldas bool WalkUpFromCXXNullPtrLiteralExpr(CXXNullPtrLiteralExpr *S) { 67242f6fec3SEduardo Caldas Builder.markChildToken(S->getLocation(), syntax::NodeRole::LiteralToken); 673007098d7SEduardo Caldas Builder.foldNode(Builder.getExprRange(S), 674007098d7SEduardo Caldas new (allocator()) syntax::CxxNullPtrExpression, S); 675007098d7SEduardo Caldas return true; 676007098d7SEduardo Caldas } 677007098d7SEduardo Caldas 678461af57dSEduardo Caldas bool WalkUpFromUnaryOperator(UnaryOperator *S) { 67942f6fec3SEduardo Caldas Builder.markChildToken(S->getOperatorLoc(), 68042f6fec3SEduardo Caldas syntax::NodeRole::OperatorExpression_operatorToken); 681461af57dSEduardo Caldas Builder.markExprChild(S->getSubExpr(), 682461af57dSEduardo Caldas syntax::NodeRole::UnaryOperatorExpression_operand); 683461af57dSEduardo Caldas 684461af57dSEduardo Caldas if (S->isPostfix()) 685461af57dSEduardo Caldas Builder.foldNode(Builder.getExprRange(S), 686461af57dSEduardo Caldas new (allocator()) syntax::PostfixUnaryOperatorExpression, 687461af57dSEduardo Caldas S); 688461af57dSEduardo Caldas else 689461af57dSEduardo Caldas Builder.foldNode(Builder.getExprRange(S), 690461af57dSEduardo Caldas new (allocator()) syntax::PrefixUnaryOperatorExpression, 691461af57dSEduardo Caldas S); 692461af57dSEduardo Caldas 693461af57dSEduardo Caldas return true; 694461af57dSEduardo Caldas } 695461af57dSEduardo Caldas 6963785eb83SEduardo Caldas bool WalkUpFromBinaryOperator(BinaryOperator *S) { 6973785eb83SEduardo Caldas Builder.markExprChild( 6983785eb83SEduardo Caldas S->getLHS(), syntax::NodeRole::BinaryOperatorExpression_leftHandSide); 69942f6fec3SEduardo Caldas Builder.markChildToken(S->getOperatorLoc(), 70042f6fec3SEduardo Caldas syntax::NodeRole::OperatorExpression_operatorToken); 7013785eb83SEduardo Caldas Builder.markExprChild( 7023785eb83SEduardo Caldas S->getRHS(), syntax::NodeRole::BinaryOperatorExpression_rightHandSide); 7033785eb83SEduardo Caldas Builder.foldNode(Builder.getExprRange(S), 7043785eb83SEduardo Caldas new (allocator()) syntax::BinaryOperatorExpression, S); 7053785eb83SEduardo Caldas return true; 7063785eb83SEduardo Caldas } 7073785eb83SEduardo Caldas 7083a574a6cSEduardo Caldas bool WalkUpFromCXXOperatorCallExpr(CXXOperatorCallExpr *S) { 7093a574a6cSEduardo Caldas if (S->isInfixBinaryOp()) { 7103a574a6cSEduardo Caldas Builder.markExprChild( 7113a574a6cSEduardo Caldas S->getArg(0), 7123a574a6cSEduardo Caldas syntax::NodeRole::BinaryOperatorExpression_leftHandSide); 7133a574a6cSEduardo Caldas Builder.markChildToken( 7143a574a6cSEduardo Caldas S->getOperatorLoc(), 71542f6fec3SEduardo Caldas syntax::NodeRole::OperatorExpression_operatorToken); 7163a574a6cSEduardo Caldas Builder.markExprChild( 7173a574a6cSEduardo Caldas S->getArg(1), 7183a574a6cSEduardo Caldas syntax::NodeRole::BinaryOperatorExpression_rightHandSide); 7193a574a6cSEduardo Caldas Builder.foldNode(Builder.getExprRange(S), 7203a574a6cSEduardo Caldas new (allocator()) syntax::BinaryOperatorExpression, S); 7213a574a6cSEduardo Caldas return true; 7223a574a6cSEduardo Caldas } 7233a574a6cSEduardo Caldas return RecursiveASTVisitor::WalkUpFromCXXOperatorCallExpr(S); 7243a574a6cSEduardo Caldas } 7253a574a6cSEduardo Caldas 726be14a22bSIlya Biryukov bool WalkUpFromNamespaceDecl(NamespaceDecl *S) { 727cdce2fe5SMarcel Hlopko auto Tokens = Builder.getDeclarationRange(S); 728be14a22bSIlya Biryukov if (Tokens.front().kind() == tok::coloncolon) { 729be14a22bSIlya Biryukov // Handle nested namespace definitions. Those start at '::' token, e.g. 730be14a22bSIlya Biryukov // namespace a^::b {} 731be14a22bSIlya Biryukov // FIXME: build corresponding nodes for the name of this namespace. 732be14a22bSIlya Biryukov return true; 733be14a22bSIlya Biryukov } 734a711a3a4SMarcel Hlopko Builder.foldNode(Tokens, new (allocator()) syntax::NamespaceDefinition, S); 735be14a22bSIlya Biryukov return true; 736be14a22bSIlya Biryukov } 737be14a22bSIlya Biryukov 7387d382dcdSMarcel Hlopko bool TraverseParenTypeLoc(ParenTypeLoc L) { 7397d382dcdSMarcel Hlopko // We reverse order of traversal to get the proper syntax structure. 7407d382dcdSMarcel Hlopko if (!WalkUpFromParenTypeLoc(L)) 7417d382dcdSMarcel Hlopko return false; 7427d382dcdSMarcel Hlopko return TraverseTypeLoc(L.getInnerLoc()); 7437d382dcdSMarcel Hlopko } 7447d382dcdSMarcel Hlopko 7457d382dcdSMarcel Hlopko bool WalkUpFromParenTypeLoc(ParenTypeLoc L) { 7467d382dcdSMarcel Hlopko Builder.markChildToken(L.getLParenLoc(), syntax::NodeRole::OpenParen); 7477d382dcdSMarcel Hlopko Builder.markChildToken(L.getRParenLoc(), syntax::NodeRole::CloseParen); 7487d382dcdSMarcel Hlopko Builder.foldNode(Builder.getRange(L.getLParenLoc(), L.getRParenLoc()), 749a711a3a4SMarcel Hlopko new (allocator()) syntax::ParenDeclarator, L); 7507d382dcdSMarcel Hlopko return true; 7517d382dcdSMarcel Hlopko } 7527d382dcdSMarcel Hlopko 7537d382dcdSMarcel Hlopko // Declarator chunks, they are produced by type locs and some clang::Decls. 7547d382dcdSMarcel Hlopko bool WalkUpFromArrayTypeLoc(ArrayTypeLoc L) { 7557d382dcdSMarcel Hlopko Builder.markChildToken(L.getLBracketLoc(), syntax::NodeRole::OpenParen); 7567d382dcdSMarcel Hlopko Builder.markExprChild(L.getSizeExpr(), 7577d382dcdSMarcel Hlopko syntax::NodeRole::ArraySubscript_sizeExpression); 7587d382dcdSMarcel Hlopko Builder.markChildToken(L.getRBracketLoc(), syntax::NodeRole::CloseParen); 7597d382dcdSMarcel Hlopko Builder.foldNode(Builder.getRange(L.getLBracketLoc(), L.getRBracketLoc()), 760a711a3a4SMarcel Hlopko new (allocator()) syntax::ArraySubscript, L); 7617d382dcdSMarcel Hlopko return true; 7627d382dcdSMarcel Hlopko } 7637d382dcdSMarcel Hlopko 7647d382dcdSMarcel Hlopko bool WalkUpFromFunctionTypeLoc(FunctionTypeLoc L) { 7657d382dcdSMarcel Hlopko Builder.markChildToken(L.getLParenLoc(), syntax::NodeRole::OpenParen); 766cdce2fe5SMarcel Hlopko for (auto *P : L.getParams()) { 767cdce2fe5SMarcel Hlopko Builder.markChild(P, syntax::NodeRole::ParametersAndQualifiers_parameter); 768cdce2fe5SMarcel Hlopko } 7697d382dcdSMarcel Hlopko Builder.markChildToken(L.getRParenLoc(), syntax::NodeRole::CloseParen); 7707d382dcdSMarcel Hlopko Builder.foldNode(Builder.getRange(L.getLParenLoc(), L.getEndLoc()), 771a711a3a4SMarcel Hlopko new (allocator()) syntax::ParametersAndQualifiers, L); 7727d382dcdSMarcel Hlopko return true; 7737d382dcdSMarcel Hlopko } 7747d382dcdSMarcel Hlopko 7757d382dcdSMarcel Hlopko bool WalkUpFromFunctionProtoTypeLoc(FunctionProtoTypeLoc L) { 7767d382dcdSMarcel Hlopko if (!L.getTypePtr()->hasTrailingReturn()) 7777d382dcdSMarcel Hlopko return WalkUpFromFunctionTypeLoc(L); 7787d382dcdSMarcel Hlopko 779cdce2fe5SMarcel Hlopko auto *TrailingReturnTokens = BuildTrailingReturn(L); 7807d382dcdSMarcel Hlopko // Finish building the node for parameters. 7817d382dcdSMarcel Hlopko Builder.markChild(TrailingReturnTokens, 7827d382dcdSMarcel Hlopko syntax::NodeRole::ParametersAndQualifiers_trailingReturn); 7837d382dcdSMarcel Hlopko return WalkUpFromFunctionTypeLoc(L); 7847d382dcdSMarcel Hlopko } 7857d382dcdSMarcel Hlopko 7867d382dcdSMarcel Hlopko bool WalkUpFromMemberPointerTypeLoc(MemberPointerTypeLoc L) { 7877d382dcdSMarcel Hlopko auto SR = L.getLocalSourceRange(); 788a711a3a4SMarcel Hlopko Builder.foldNode(Builder.getRange(SR), 789a711a3a4SMarcel Hlopko new (allocator()) syntax::MemberPointer, L); 7907d382dcdSMarcel Hlopko return true; 7917d382dcdSMarcel Hlopko } 7927d382dcdSMarcel Hlopko 79358fa50f4SIlya Biryukov // The code below is very regular, it could even be generated with some 79458fa50f4SIlya Biryukov // preprocessor magic. We merely assign roles to the corresponding children 79558fa50f4SIlya Biryukov // and fold resulting nodes. 79658fa50f4SIlya Biryukov bool WalkUpFromDeclStmt(DeclStmt *S) { 79758fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 798a711a3a4SMarcel Hlopko new (allocator()) syntax::DeclarationStatement, S); 79958fa50f4SIlya Biryukov return true; 80058fa50f4SIlya Biryukov } 80158fa50f4SIlya Biryukov 80258fa50f4SIlya Biryukov bool WalkUpFromNullStmt(NullStmt *S) { 80358fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 804a711a3a4SMarcel Hlopko new (allocator()) syntax::EmptyStatement, S); 80558fa50f4SIlya Biryukov return true; 80658fa50f4SIlya Biryukov } 80758fa50f4SIlya Biryukov 80858fa50f4SIlya Biryukov bool WalkUpFromSwitchStmt(SwitchStmt *S) { 809def65bb4SIlya Biryukov Builder.markChildToken(S->getSwitchLoc(), 81058fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 81158fa50f4SIlya Biryukov Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement); 81258fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 813a711a3a4SMarcel Hlopko new (allocator()) syntax::SwitchStatement, S); 81458fa50f4SIlya Biryukov return true; 81558fa50f4SIlya Biryukov } 81658fa50f4SIlya Biryukov 81758fa50f4SIlya Biryukov bool WalkUpFromCaseStmt(CaseStmt *S) { 818def65bb4SIlya Biryukov Builder.markChildToken(S->getKeywordLoc(), 81958fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 82058fa50f4SIlya Biryukov Builder.markExprChild(S->getLHS(), syntax::NodeRole::CaseStatement_value); 82158fa50f4SIlya Biryukov Builder.markStmtChild(S->getSubStmt(), syntax::NodeRole::BodyStatement); 82258fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 823a711a3a4SMarcel Hlopko new (allocator()) syntax::CaseStatement, S); 82458fa50f4SIlya Biryukov return true; 82558fa50f4SIlya Biryukov } 82658fa50f4SIlya Biryukov 82758fa50f4SIlya Biryukov bool WalkUpFromDefaultStmt(DefaultStmt *S) { 828def65bb4SIlya Biryukov Builder.markChildToken(S->getKeywordLoc(), 82958fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 83058fa50f4SIlya Biryukov Builder.markStmtChild(S->getSubStmt(), syntax::NodeRole::BodyStatement); 83158fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 832a711a3a4SMarcel Hlopko new (allocator()) syntax::DefaultStatement, S); 83358fa50f4SIlya Biryukov return true; 83458fa50f4SIlya Biryukov } 83558fa50f4SIlya Biryukov 83658fa50f4SIlya Biryukov bool WalkUpFromIfStmt(IfStmt *S) { 837def65bb4SIlya Biryukov Builder.markChildToken(S->getIfLoc(), syntax::NodeRole::IntroducerKeyword); 83858fa50f4SIlya Biryukov Builder.markStmtChild(S->getThen(), 83958fa50f4SIlya Biryukov syntax::NodeRole::IfStatement_thenStatement); 840def65bb4SIlya Biryukov Builder.markChildToken(S->getElseLoc(), 84158fa50f4SIlya Biryukov syntax::NodeRole::IfStatement_elseKeyword); 84258fa50f4SIlya Biryukov Builder.markStmtChild(S->getElse(), 84358fa50f4SIlya Biryukov syntax::NodeRole::IfStatement_elseStatement); 84458fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 845a711a3a4SMarcel Hlopko new (allocator()) syntax::IfStatement, S); 84658fa50f4SIlya Biryukov return true; 84758fa50f4SIlya Biryukov } 84858fa50f4SIlya Biryukov 84958fa50f4SIlya Biryukov bool WalkUpFromForStmt(ForStmt *S) { 850def65bb4SIlya Biryukov Builder.markChildToken(S->getForLoc(), syntax::NodeRole::IntroducerKeyword); 85158fa50f4SIlya Biryukov Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement); 85258fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 853a711a3a4SMarcel Hlopko new (allocator()) syntax::ForStatement, S); 85458fa50f4SIlya Biryukov return true; 85558fa50f4SIlya Biryukov } 85658fa50f4SIlya Biryukov 85758fa50f4SIlya Biryukov bool WalkUpFromWhileStmt(WhileStmt *S) { 858def65bb4SIlya Biryukov Builder.markChildToken(S->getWhileLoc(), 85958fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 86058fa50f4SIlya Biryukov Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement); 86158fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 862a711a3a4SMarcel Hlopko new (allocator()) syntax::WhileStatement, S); 86358fa50f4SIlya Biryukov return true; 86458fa50f4SIlya Biryukov } 86558fa50f4SIlya Biryukov 86658fa50f4SIlya Biryukov bool WalkUpFromContinueStmt(ContinueStmt *S) { 867def65bb4SIlya Biryukov Builder.markChildToken(S->getContinueLoc(), 86858fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 86958fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 870a711a3a4SMarcel Hlopko new (allocator()) syntax::ContinueStatement, S); 87158fa50f4SIlya Biryukov return true; 87258fa50f4SIlya Biryukov } 87358fa50f4SIlya Biryukov 87458fa50f4SIlya Biryukov bool WalkUpFromBreakStmt(BreakStmt *S) { 875def65bb4SIlya Biryukov Builder.markChildToken(S->getBreakLoc(), 87658fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 87758fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 878a711a3a4SMarcel Hlopko new (allocator()) syntax::BreakStatement, S); 87958fa50f4SIlya Biryukov return true; 88058fa50f4SIlya Biryukov } 88158fa50f4SIlya Biryukov 88258fa50f4SIlya Biryukov bool WalkUpFromReturnStmt(ReturnStmt *S) { 883def65bb4SIlya Biryukov Builder.markChildToken(S->getReturnLoc(), 88458fa50f4SIlya Biryukov syntax::NodeRole::IntroducerKeyword); 88558fa50f4SIlya Biryukov Builder.markExprChild(S->getRetValue(), 88658fa50f4SIlya Biryukov syntax::NodeRole::ReturnStatement_value); 88758fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 888a711a3a4SMarcel Hlopko new (allocator()) syntax::ReturnStatement, S); 88958fa50f4SIlya Biryukov return true; 89058fa50f4SIlya Biryukov } 89158fa50f4SIlya Biryukov 89258fa50f4SIlya Biryukov bool WalkUpFromCXXForRangeStmt(CXXForRangeStmt *S) { 893def65bb4SIlya Biryukov Builder.markChildToken(S->getForLoc(), syntax::NodeRole::IntroducerKeyword); 89458fa50f4SIlya Biryukov Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement); 89558fa50f4SIlya Biryukov Builder.foldNode(Builder.getStmtRange(S), 896a711a3a4SMarcel Hlopko new (allocator()) syntax::RangeBasedForStatement, S); 89758fa50f4SIlya Biryukov return true; 89858fa50f4SIlya Biryukov } 89958fa50f4SIlya Biryukov 900be14a22bSIlya Biryukov bool WalkUpFromEmptyDecl(EmptyDecl *S) { 901cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 902a711a3a4SMarcel Hlopko new (allocator()) syntax::EmptyDeclaration, S); 903be14a22bSIlya Biryukov return true; 904be14a22bSIlya Biryukov } 905be14a22bSIlya Biryukov 906be14a22bSIlya Biryukov bool WalkUpFromStaticAssertDecl(StaticAssertDecl *S) { 907be14a22bSIlya Biryukov Builder.markExprChild(S->getAssertExpr(), 908be14a22bSIlya Biryukov syntax::NodeRole::StaticAssertDeclaration_condition); 909be14a22bSIlya Biryukov Builder.markExprChild(S->getMessage(), 910be14a22bSIlya Biryukov syntax::NodeRole::StaticAssertDeclaration_message); 911cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 912a711a3a4SMarcel Hlopko new (allocator()) syntax::StaticAssertDeclaration, S); 913be14a22bSIlya Biryukov return true; 914be14a22bSIlya Biryukov } 915be14a22bSIlya Biryukov 916be14a22bSIlya Biryukov bool WalkUpFromLinkageSpecDecl(LinkageSpecDecl *S) { 917cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 918a711a3a4SMarcel Hlopko new (allocator()) syntax::LinkageSpecificationDeclaration, 919a711a3a4SMarcel Hlopko S); 920be14a22bSIlya Biryukov return true; 921be14a22bSIlya Biryukov } 922be14a22bSIlya Biryukov 923be14a22bSIlya Biryukov bool WalkUpFromNamespaceAliasDecl(NamespaceAliasDecl *S) { 924cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 925a711a3a4SMarcel Hlopko new (allocator()) syntax::NamespaceAliasDefinition, S); 926be14a22bSIlya Biryukov return true; 927be14a22bSIlya Biryukov } 928be14a22bSIlya Biryukov 929be14a22bSIlya Biryukov bool WalkUpFromUsingDirectiveDecl(UsingDirectiveDecl *S) { 930cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 931a711a3a4SMarcel Hlopko new (allocator()) syntax::UsingNamespaceDirective, S); 932be14a22bSIlya Biryukov return true; 933be14a22bSIlya Biryukov } 934be14a22bSIlya Biryukov 935be14a22bSIlya Biryukov bool WalkUpFromUsingDecl(UsingDecl *S) { 936cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 937a711a3a4SMarcel Hlopko new (allocator()) syntax::UsingDeclaration, S); 938be14a22bSIlya Biryukov return true; 939be14a22bSIlya Biryukov } 940be14a22bSIlya Biryukov 941be14a22bSIlya Biryukov bool WalkUpFromUnresolvedUsingValueDecl(UnresolvedUsingValueDecl *S) { 942cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 943a711a3a4SMarcel Hlopko new (allocator()) syntax::UsingDeclaration, S); 944be14a22bSIlya Biryukov return true; 945be14a22bSIlya Biryukov } 946be14a22bSIlya Biryukov 947be14a22bSIlya Biryukov bool WalkUpFromUnresolvedUsingTypenameDecl(UnresolvedUsingTypenameDecl *S) { 948cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 949a711a3a4SMarcel Hlopko new (allocator()) syntax::UsingDeclaration, S); 950be14a22bSIlya Biryukov return true; 951be14a22bSIlya Biryukov } 952be14a22bSIlya Biryukov 953be14a22bSIlya Biryukov bool WalkUpFromTypeAliasDecl(TypeAliasDecl *S) { 954cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(S), 955a711a3a4SMarcel Hlopko new (allocator()) syntax::TypeAliasDeclaration, S); 956be14a22bSIlya Biryukov return true; 957be14a22bSIlya Biryukov } 958be14a22bSIlya Biryukov 9599b3f38f9SIlya Biryukov private: 960cdce2fe5SMarcel Hlopko template <class T> SourceLocation getQualifiedNameStart(T *D) { 961cdce2fe5SMarcel Hlopko static_assert((std::is_base_of<DeclaratorDecl, T>::value || 962cdce2fe5SMarcel Hlopko std::is_base_of<TypedefNameDecl, T>::value), 963cdce2fe5SMarcel Hlopko "only DeclaratorDecl and TypedefNameDecl are supported."); 964cdce2fe5SMarcel Hlopko 965cdce2fe5SMarcel Hlopko auto DN = D->getDeclName(); 966cdce2fe5SMarcel Hlopko bool IsAnonymous = DN.isIdentifier() && !DN.getAsIdentifierInfo(); 967cdce2fe5SMarcel Hlopko if (IsAnonymous) 968cdce2fe5SMarcel Hlopko return SourceLocation(); 969cdce2fe5SMarcel Hlopko 970cdce2fe5SMarcel Hlopko if (const auto *DD = llvm::dyn_cast<DeclaratorDecl>(D)) { 971cdce2fe5SMarcel Hlopko if (DD->getQualifierLoc()) { 972cdce2fe5SMarcel Hlopko return DD->getQualifierLoc().getBeginLoc(); 973cdce2fe5SMarcel Hlopko } 974cdce2fe5SMarcel Hlopko } 975cdce2fe5SMarcel Hlopko 976cdce2fe5SMarcel Hlopko return D->getLocation(); 977cdce2fe5SMarcel Hlopko } 978cdce2fe5SMarcel Hlopko 979cdce2fe5SMarcel Hlopko SourceRange getInitializerRange(Decl *D) { 980cdce2fe5SMarcel Hlopko if (auto *V = llvm::dyn_cast<VarDecl>(D)) { 981cdce2fe5SMarcel Hlopko auto *I = V->getInit(); 982cdce2fe5SMarcel Hlopko // Initializers in range-based-for are not part of the declarator 983cdce2fe5SMarcel Hlopko if (I && !V->isCXXForRangeDecl()) 984cdce2fe5SMarcel Hlopko return I->getSourceRange(); 985cdce2fe5SMarcel Hlopko } 986cdce2fe5SMarcel Hlopko 987cdce2fe5SMarcel Hlopko return SourceRange(); 988cdce2fe5SMarcel Hlopko } 989cdce2fe5SMarcel Hlopko 990cdce2fe5SMarcel Hlopko /// Folds SimpleDeclarator node (if present) and in case this is the last 991cdce2fe5SMarcel Hlopko /// declarator in the chain it also folds SimpleDeclaration node. 992cdce2fe5SMarcel Hlopko template <class T> bool processDeclaratorAndDeclaration(T *D) { 993cdce2fe5SMarcel Hlopko SourceRange Initializer = getInitializerRange(D); 994cdce2fe5SMarcel Hlopko auto Range = getDeclaratorRange(Builder.sourceManager(), 995cdce2fe5SMarcel Hlopko D->getTypeSourceInfo()->getTypeLoc(), 996cdce2fe5SMarcel Hlopko getQualifiedNameStart(D), Initializer); 997cdce2fe5SMarcel Hlopko 998cdce2fe5SMarcel Hlopko // There doesn't have to be a declarator (e.g. `void foo(int)` only has 999cdce2fe5SMarcel Hlopko // declaration, but no declarator). 1000cdce2fe5SMarcel Hlopko if (Range.getBegin().isValid()) { 1001cdce2fe5SMarcel Hlopko auto *N = new (allocator()) syntax::SimpleDeclarator; 1002cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getRange(Range), N, nullptr); 1003cdce2fe5SMarcel Hlopko Builder.markChild(N, syntax::NodeRole::SimpleDeclaration_declarator); 1004cdce2fe5SMarcel Hlopko } 1005cdce2fe5SMarcel Hlopko 1006cdce2fe5SMarcel Hlopko if (Builder.isResponsibleForCreatingDeclaration(D)) { 1007cdce2fe5SMarcel Hlopko Builder.foldNode(Builder.getDeclarationRange(D), 1008cdce2fe5SMarcel Hlopko new (allocator()) syntax::SimpleDeclaration, D); 1009cdce2fe5SMarcel Hlopko } 1010cdce2fe5SMarcel Hlopko return true; 1011cdce2fe5SMarcel Hlopko } 1012cdce2fe5SMarcel Hlopko 10137d382dcdSMarcel Hlopko /// Returns the range of the built node. 1014a711a3a4SMarcel Hlopko syntax::TrailingReturnType *BuildTrailingReturn(FunctionProtoTypeLoc L) { 10157d382dcdSMarcel Hlopko assert(L.getTypePtr()->hasTrailingReturn()); 10167d382dcdSMarcel Hlopko 10177d382dcdSMarcel Hlopko auto ReturnedType = L.getReturnLoc(); 10187d382dcdSMarcel Hlopko // Build node for the declarator, if any. 10197d382dcdSMarcel Hlopko auto ReturnDeclaratorRange = 10207d382dcdSMarcel Hlopko getDeclaratorRange(this->Builder.sourceManager(), ReturnedType, 10217d382dcdSMarcel Hlopko /*Name=*/SourceLocation(), 10227d382dcdSMarcel Hlopko /*Initializer=*/SourceLocation()); 1023a711a3a4SMarcel Hlopko syntax::SimpleDeclarator *ReturnDeclarator = nullptr; 10247d382dcdSMarcel Hlopko if (ReturnDeclaratorRange.isValid()) { 1025a711a3a4SMarcel Hlopko ReturnDeclarator = new (allocator()) syntax::SimpleDeclarator; 1026a711a3a4SMarcel Hlopko Builder.foldNode(Builder.getRange(ReturnDeclaratorRange), 1027a711a3a4SMarcel Hlopko ReturnDeclarator, nullptr); 10287d382dcdSMarcel Hlopko } 10297d382dcdSMarcel Hlopko 10307d382dcdSMarcel Hlopko // Build node for trailing return type. 1031a711a3a4SMarcel Hlopko auto Return = Builder.getRange(ReturnedType.getSourceRange()); 10327d382dcdSMarcel Hlopko const auto *Arrow = Return.begin() - 1; 10337d382dcdSMarcel Hlopko assert(Arrow->kind() == tok::arrow); 10347d382dcdSMarcel Hlopko auto Tokens = llvm::makeArrayRef(Arrow, Return.end()); 103542f6fec3SEduardo Caldas Builder.markChildToken(Arrow, syntax::NodeRole::ArrowToken); 1036a711a3a4SMarcel Hlopko if (ReturnDeclarator) 1037a711a3a4SMarcel Hlopko Builder.markChild(ReturnDeclarator, 10387d382dcdSMarcel Hlopko syntax::NodeRole::TrailingReturnType_declarator); 1039a711a3a4SMarcel Hlopko auto *R = new (allocator()) syntax::TrailingReturnType; 1040cdce2fe5SMarcel Hlopko Builder.foldNode(Tokens, R, L); 1041a711a3a4SMarcel Hlopko return R; 10427d382dcdSMarcel Hlopko } 104388bf9b3dSMarcel Hlopko 1044a711a3a4SMarcel Hlopko void foldExplicitTemplateInstantiation( 1045a711a3a4SMarcel Hlopko ArrayRef<syntax::Token> Range, const syntax::Token *ExternKW, 104688bf9b3dSMarcel Hlopko const syntax::Token *TemplateKW, 1047a711a3a4SMarcel Hlopko syntax::SimpleDeclaration *InnerDeclaration, Decl *From) { 104888bf9b3dSMarcel Hlopko assert(!ExternKW || ExternKW->kind() == tok::kw_extern); 104988bf9b3dSMarcel Hlopko assert(TemplateKW && TemplateKW->kind() == tok::kw_template); 105042f6fec3SEduardo Caldas Builder.markChildToken(ExternKW, syntax::NodeRole::ExternKeyword); 105188bf9b3dSMarcel Hlopko Builder.markChildToken(TemplateKW, syntax::NodeRole::IntroducerKeyword); 105288bf9b3dSMarcel Hlopko Builder.markChild( 105388bf9b3dSMarcel Hlopko InnerDeclaration, 105488bf9b3dSMarcel Hlopko syntax::NodeRole::ExplicitTemplateInstantiation_declaration); 1055a711a3a4SMarcel Hlopko Builder.foldNode( 1056a711a3a4SMarcel Hlopko Range, new (allocator()) syntax::ExplicitTemplateInstantiation, From); 105788bf9b3dSMarcel Hlopko } 105888bf9b3dSMarcel Hlopko 1059a711a3a4SMarcel Hlopko syntax::TemplateDeclaration *foldTemplateDeclaration( 1060a711a3a4SMarcel Hlopko ArrayRef<syntax::Token> Range, const syntax::Token *TemplateKW, 1061a711a3a4SMarcel Hlopko ArrayRef<syntax::Token> TemplatedDeclaration, Decl *From) { 106288bf9b3dSMarcel Hlopko assert(TemplateKW && TemplateKW->kind() == tok::kw_template); 106388bf9b3dSMarcel Hlopko Builder.markChildToken(TemplateKW, syntax::NodeRole::IntroducerKeyword); 1064a711a3a4SMarcel Hlopko 1065a711a3a4SMarcel Hlopko auto *N = new (allocator()) syntax::TemplateDeclaration; 1066a711a3a4SMarcel Hlopko Builder.foldNode(Range, N, From); 1067cdce2fe5SMarcel Hlopko Builder.markChild(N, syntax::NodeRole::TemplateDeclaration_declaration); 1068a711a3a4SMarcel Hlopko return N; 106988bf9b3dSMarcel Hlopko } 107088bf9b3dSMarcel Hlopko 10719b3f38f9SIlya Biryukov /// A small helper to save some typing. 10729b3f38f9SIlya Biryukov llvm::BumpPtrAllocator &allocator() { return Builder.allocator(); } 10739b3f38f9SIlya Biryukov 10749b3f38f9SIlya Biryukov syntax::TreeBuilder &Builder; 10759b3f38f9SIlya Biryukov const LangOptions &LangOpts; 10769b3f38f9SIlya Biryukov }; 10779b3f38f9SIlya Biryukov } // namespace 10789b3f38f9SIlya Biryukov 10797d382dcdSMarcel Hlopko void syntax::TreeBuilder::noticeDeclWithoutSemicolon(Decl *D) { 1080e702bdb8SIlya Biryukov DeclsWithoutSemicolons.insert(D); 1081e702bdb8SIlya Biryukov } 1082e702bdb8SIlya Biryukov 1083def65bb4SIlya Biryukov void syntax::TreeBuilder::markChildToken(SourceLocation Loc, NodeRole Role) { 10849b3f38f9SIlya Biryukov if (Loc.isInvalid()) 10859b3f38f9SIlya Biryukov return; 10869b3f38f9SIlya Biryukov Pending.assignRole(*findToken(Loc), Role); 10879b3f38f9SIlya Biryukov } 10889b3f38f9SIlya Biryukov 10897d382dcdSMarcel Hlopko void syntax::TreeBuilder::markChildToken(const syntax::Token *T, NodeRole R) { 10907d382dcdSMarcel Hlopko if (!T) 10917d382dcdSMarcel Hlopko return; 10927d382dcdSMarcel Hlopko Pending.assignRole(*T, R); 10937d382dcdSMarcel Hlopko } 10947d382dcdSMarcel Hlopko 1095a711a3a4SMarcel Hlopko void syntax::TreeBuilder::markChild(syntax::Node *N, NodeRole R) { 1096a711a3a4SMarcel Hlopko assert(N); 1097a711a3a4SMarcel Hlopko setRole(N, R); 1098a711a3a4SMarcel Hlopko } 1099a711a3a4SMarcel Hlopko 1100a711a3a4SMarcel Hlopko void syntax::TreeBuilder::markChild(ASTPtr N, NodeRole R) { 1101a711a3a4SMarcel Hlopko auto *SN = Mapping.find(N); 1102a711a3a4SMarcel Hlopko assert(SN != nullptr); 1103a711a3a4SMarcel Hlopko setRole(SN, R); 11047d382dcdSMarcel Hlopko } 11057d382dcdSMarcel Hlopko 110658fa50f4SIlya Biryukov void syntax::TreeBuilder::markStmtChild(Stmt *Child, NodeRole Role) { 110758fa50f4SIlya Biryukov if (!Child) 110858fa50f4SIlya Biryukov return; 110958fa50f4SIlya Biryukov 1110b34b7691SDmitri Gribenko syntax::Tree *ChildNode; 1111b34b7691SDmitri Gribenko if (Expr *ChildExpr = dyn_cast<Expr>(Child)) { 111258fa50f4SIlya Biryukov // This is an expression in a statement position, consume the trailing 111358fa50f4SIlya Biryukov // semicolon and form an 'ExpressionStatement' node. 1114b34b7691SDmitri Gribenko markExprChild(ChildExpr, NodeRole::ExpressionStatement_expression); 1115a711a3a4SMarcel Hlopko ChildNode = new (allocator()) syntax::ExpressionStatement; 1116a711a3a4SMarcel Hlopko // (!) 'getStmtRange()' ensures this covers a trailing semicolon. 1117a711a3a4SMarcel Hlopko Pending.foldChildren(Arena, getStmtRange(Child), ChildNode); 1118b34b7691SDmitri Gribenko } else { 1119b34b7691SDmitri Gribenko ChildNode = Mapping.find(Child); 112058fa50f4SIlya Biryukov } 1121b34b7691SDmitri Gribenko assert(ChildNode != nullptr); 1122a711a3a4SMarcel Hlopko setRole(ChildNode, Role); 112358fa50f4SIlya Biryukov } 112458fa50f4SIlya Biryukov 112558fa50f4SIlya Biryukov void syntax::TreeBuilder::markExprChild(Expr *Child, NodeRole Role) { 1126be14a22bSIlya Biryukov if (!Child) 1127be14a22bSIlya Biryukov return; 1128a711a3a4SMarcel Hlopko Child = Child->IgnoreImplicit(); 1129be14a22bSIlya Biryukov 1130a711a3a4SMarcel Hlopko syntax::Tree *ChildNode = Mapping.find(Child); 1131a711a3a4SMarcel Hlopko assert(ChildNode != nullptr); 1132a711a3a4SMarcel Hlopko setRole(ChildNode, Role); 113358fa50f4SIlya Biryukov } 113458fa50f4SIlya Biryukov 11359b3f38f9SIlya Biryukov const syntax::Token *syntax::TreeBuilder::findToken(SourceLocation L) const { 113688bf9b3dSMarcel Hlopko if (L.isInvalid()) 113788bf9b3dSMarcel Hlopko return nullptr; 1138c1bbefefSIlya Biryukov auto It = LocationToToken.find(L.getRawEncoding()); 1139c1bbefefSIlya Biryukov assert(It != LocationToToken.end()); 1140c1bbefefSIlya Biryukov return It->second; 11419b3f38f9SIlya Biryukov } 11429b3f38f9SIlya Biryukov 11439b3f38f9SIlya Biryukov syntax::TranslationUnit * 11449b3f38f9SIlya Biryukov syntax::buildSyntaxTree(Arena &A, const TranslationUnitDecl &TU) { 11459b3f38f9SIlya Biryukov TreeBuilder Builder(A); 11469b3f38f9SIlya Biryukov BuildTreeVisitor(TU.getASTContext(), Builder).TraverseAST(TU.getASTContext()); 11479b3f38f9SIlya Biryukov return std::move(Builder).finalize(); 11489b3f38f9SIlya Biryukov } 1149