19b3f38f9SIlya Biryukov //===- BuildTree.cpp ------------------------------------------*- C++ -*-=====//
29b3f38f9SIlya Biryukov //
39b3f38f9SIlya Biryukov // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
49b3f38f9SIlya Biryukov // See https://llvm.org/LICENSE.txt for license information.
59b3f38f9SIlya Biryukov // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
69b3f38f9SIlya Biryukov //
79b3f38f9SIlya Biryukov //===----------------------------------------------------------------------===//
89b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/BuildTree.h"
97d382dcdSMarcel Hlopko #include "clang/AST/ASTFwd.h"
10e702bdb8SIlya Biryukov #include "clang/AST/Decl.h"
11e702bdb8SIlya Biryukov #include "clang/AST/DeclBase.h"
127d382dcdSMarcel Hlopko #include "clang/AST/DeclCXX.h"
137d382dcdSMarcel Hlopko #include "clang/AST/DeclarationName.h"
143785eb83SEduardo Caldas #include "clang/AST/Expr.h"
159b3f38f9SIlya Biryukov #include "clang/AST/RecursiveASTVisitor.h"
169b3f38f9SIlya Biryukov #include "clang/AST/Stmt.h"
177d382dcdSMarcel Hlopko #include "clang/AST/TypeLoc.h"
187d382dcdSMarcel Hlopko #include "clang/AST/TypeLocVisitor.h"
199b3f38f9SIlya Biryukov #include "clang/Basic/LLVM.h"
209b3f38f9SIlya Biryukov #include "clang/Basic/SourceLocation.h"
219b3f38f9SIlya Biryukov #include "clang/Basic/SourceManager.h"
2288bf9b3dSMarcel Hlopko #include "clang/Basic/Specifiers.h"
239b3f38f9SIlya Biryukov #include "clang/Basic/TokenKinds.h"
249b3f38f9SIlya Biryukov #include "clang/Lex/Lexer.h"
259b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/Nodes.h"
269b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/Tokens.h"
279b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/Tree.h"
289b3f38f9SIlya Biryukov #include "llvm/ADT/ArrayRef.h"
29a711a3a4SMarcel Hlopko #include "llvm/ADT/DenseMap.h"
30a711a3a4SMarcel Hlopko #include "llvm/ADT/PointerUnion.h"
319b3f38f9SIlya Biryukov #include "llvm/ADT/STLExtras.h"
327d382dcdSMarcel Hlopko #include "llvm/ADT/ScopeExit.h"
339b3f38f9SIlya Biryukov #include "llvm/ADT/SmallVector.h"
349b3f38f9SIlya Biryukov #include "llvm/Support/Allocator.h"
359b3f38f9SIlya Biryukov #include "llvm/Support/Casting.h"
3696065cf7SIlya Biryukov #include "llvm/Support/Compiler.h"
379b3f38f9SIlya Biryukov #include "llvm/Support/FormatVariadic.h"
381ad15046SIlya Biryukov #include "llvm/Support/MemoryBuffer.h"
399b3f38f9SIlya Biryukov #include "llvm/Support/raw_ostream.h"
40a711a3a4SMarcel Hlopko #include <cstddef>
419b3f38f9SIlya Biryukov #include <map>
429b3f38f9SIlya Biryukov 
439b3f38f9SIlya Biryukov using namespace clang;
449b3f38f9SIlya Biryukov 
4596065cf7SIlya Biryukov LLVM_ATTRIBUTE_UNUSED
4658fa50f4SIlya Biryukov static bool isImplicitExpr(clang::Expr *E) { return E->IgnoreImplicit() != E; }
4758fa50f4SIlya Biryukov 
487d382dcdSMarcel Hlopko namespace {
497d382dcdSMarcel Hlopko /// Get start location of the Declarator from the TypeLoc.
507d382dcdSMarcel Hlopko /// E.g.:
517d382dcdSMarcel Hlopko ///   loc of `(` in `int (a)`
527d382dcdSMarcel Hlopko ///   loc of `*` in `int *(a)`
537d382dcdSMarcel Hlopko ///   loc of the first `(` in `int (*a)(int)`
547d382dcdSMarcel Hlopko ///   loc of the `*` in `int *(a)(int)`
557d382dcdSMarcel Hlopko ///   loc of the first `*` in `const int *const *volatile a;`
567d382dcdSMarcel Hlopko ///
577d382dcdSMarcel Hlopko /// It is non-trivial to get the start location because TypeLocs are stored
587d382dcdSMarcel Hlopko /// inside out. In the example above `*volatile` is the TypeLoc returned
597d382dcdSMarcel Hlopko /// by `Decl.getTypeSourceInfo()`, and `*const` is what `.getPointeeLoc()`
607d382dcdSMarcel Hlopko /// returns.
617d382dcdSMarcel Hlopko struct GetStartLoc : TypeLocVisitor<GetStartLoc, SourceLocation> {
627d382dcdSMarcel Hlopko   SourceLocation VisitParenTypeLoc(ParenTypeLoc T) {
637d382dcdSMarcel Hlopko     auto L = Visit(T.getInnerLoc());
647d382dcdSMarcel Hlopko     if (L.isValid())
657d382dcdSMarcel Hlopko       return L;
667d382dcdSMarcel Hlopko     return T.getLParenLoc();
677d382dcdSMarcel Hlopko   }
687d382dcdSMarcel Hlopko 
697d382dcdSMarcel Hlopko   // Types spelled in the prefix part of the declarator.
707d382dcdSMarcel Hlopko   SourceLocation VisitPointerTypeLoc(PointerTypeLoc T) {
717d382dcdSMarcel Hlopko     return HandlePointer(T);
727d382dcdSMarcel Hlopko   }
737d382dcdSMarcel Hlopko 
747d382dcdSMarcel Hlopko   SourceLocation VisitMemberPointerTypeLoc(MemberPointerTypeLoc T) {
757d382dcdSMarcel Hlopko     return HandlePointer(T);
767d382dcdSMarcel Hlopko   }
777d382dcdSMarcel Hlopko 
787d382dcdSMarcel Hlopko   SourceLocation VisitBlockPointerTypeLoc(BlockPointerTypeLoc T) {
797d382dcdSMarcel Hlopko     return HandlePointer(T);
807d382dcdSMarcel Hlopko   }
817d382dcdSMarcel Hlopko 
827d382dcdSMarcel Hlopko   SourceLocation VisitReferenceTypeLoc(ReferenceTypeLoc T) {
837d382dcdSMarcel Hlopko     return HandlePointer(T);
847d382dcdSMarcel Hlopko   }
857d382dcdSMarcel Hlopko 
867d382dcdSMarcel Hlopko   SourceLocation VisitObjCObjectPointerTypeLoc(ObjCObjectPointerTypeLoc T) {
877d382dcdSMarcel Hlopko     return HandlePointer(T);
887d382dcdSMarcel Hlopko   }
897d382dcdSMarcel Hlopko 
907d382dcdSMarcel Hlopko   // All other cases are not important, as they are either part of declaration
917d382dcdSMarcel Hlopko   // specifiers (e.g. inheritors of TypeSpecTypeLoc) or introduce modifiers on
927d382dcdSMarcel Hlopko   // existing declarators (e.g. QualifiedTypeLoc). They cannot start the
937d382dcdSMarcel Hlopko   // declarator themselves, but their underlying type can.
947d382dcdSMarcel Hlopko   SourceLocation VisitTypeLoc(TypeLoc T) {
957d382dcdSMarcel Hlopko     auto N = T.getNextTypeLoc();
967d382dcdSMarcel Hlopko     if (!N)
977d382dcdSMarcel Hlopko       return SourceLocation();
987d382dcdSMarcel Hlopko     return Visit(N);
997d382dcdSMarcel Hlopko   }
1007d382dcdSMarcel Hlopko 
1017d382dcdSMarcel Hlopko   SourceLocation VisitFunctionProtoTypeLoc(FunctionProtoTypeLoc T) {
1027d382dcdSMarcel Hlopko     if (T.getTypePtr()->hasTrailingReturn())
1037d382dcdSMarcel Hlopko       return SourceLocation(); // avoid recursing into the suffix of declarator.
1047d382dcdSMarcel Hlopko     return VisitTypeLoc(T);
1057d382dcdSMarcel Hlopko   }
1067d382dcdSMarcel Hlopko 
1077d382dcdSMarcel Hlopko private:
1087d382dcdSMarcel Hlopko   template <class PtrLoc> SourceLocation HandlePointer(PtrLoc T) {
1097d382dcdSMarcel Hlopko     auto L = Visit(T.getPointeeLoc());
1107d382dcdSMarcel Hlopko     if (L.isValid())
1117d382dcdSMarcel Hlopko       return L;
1127d382dcdSMarcel Hlopko     return T.getLocalSourceRange().getBegin();
1137d382dcdSMarcel Hlopko   }
1147d382dcdSMarcel Hlopko };
1157d382dcdSMarcel Hlopko } // namespace
1167d382dcdSMarcel Hlopko 
1177d382dcdSMarcel Hlopko /// Gets the range of declarator as defined by the C++ grammar. E.g.
1187d382dcdSMarcel Hlopko ///     `int a;` -> range of `a`,
1197d382dcdSMarcel Hlopko ///     `int *a;` -> range of `*a`,
1207d382dcdSMarcel Hlopko ///     `int a[10];` -> range of `a[10]`,
1217d382dcdSMarcel Hlopko ///     `int a[1][2][3];` -> range of `a[1][2][3]`,
1227d382dcdSMarcel Hlopko ///     `int *a = nullptr` -> range of `*a = nullptr`.
1237d382dcdSMarcel Hlopko /// FIMXE: \p Name must be a source range, e.g. for `operator+`.
1247d382dcdSMarcel Hlopko static SourceRange getDeclaratorRange(const SourceManager &SM, TypeLoc T,
1257d382dcdSMarcel Hlopko                                       SourceLocation Name,
1267d382dcdSMarcel Hlopko                                       SourceRange Initializer) {
1277d382dcdSMarcel Hlopko   SourceLocation Start = GetStartLoc().Visit(T);
1287d382dcdSMarcel Hlopko   SourceLocation End = T.getSourceRange().getEnd();
1297d382dcdSMarcel Hlopko   assert(End.isValid());
1307d382dcdSMarcel Hlopko   if (Name.isValid()) {
1317d382dcdSMarcel Hlopko     if (Start.isInvalid())
1327d382dcdSMarcel Hlopko       Start = Name;
1337d382dcdSMarcel Hlopko     if (SM.isBeforeInTranslationUnit(End, Name))
1347d382dcdSMarcel Hlopko       End = Name;
1357d382dcdSMarcel Hlopko   }
1367d382dcdSMarcel Hlopko   if (Initializer.isValid()) {
137cdce2fe5SMarcel Hlopko     auto InitializerEnd = Initializer.getEnd();
138cdce2fe5SMarcel Hlopko     assert(SM.isBeforeInTranslationUnit(End, InitializerEnd) || End == InitializerEnd);
139cdce2fe5SMarcel Hlopko     End = InitializerEnd;
1407d382dcdSMarcel Hlopko   }
1417d382dcdSMarcel Hlopko   return SourceRange(Start, End);
1427d382dcdSMarcel Hlopko }
1437d382dcdSMarcel Hlopko 
144a711a3a4SMarcel Hlopko namespace {
145a711a3a4SMarcel Hlopko /// All AST hierarchy roots that can be represented as pointers.
146a711a3a4SMarcel Hlopko using ASTPtr = llvm::PointerUnion<Stmt *, Decl *>;
147a711a3a4SMarcel Hlopko /// Maintains a mapping from AST to syntax tree nodes. This class will get more
148a711a3a4SMarcel Hlopko /// complicated as we support more kinds of AST nodes, e.g. TypeLocs.
149a711a3a4SMarcel Hlopko /// FIXME: expose this as public API.
150a711a3a4SMarcel Hlopko class ASTToSyntaxMapping {
151a711a3a4SMarcel Hlopko public:
152a711a3a4SMarcel Hlopko   void add(ASTPtr From, syntax::Tree *To) {
153a711a3a4SMarcel Hlopko     assert(To != nullptr);
154a711a3a4SMarcel Hlopko     assert(!From.isNull());
155a711a3a4SMarcel Hlopko 
156a711a3a4SMarcel Hlopko     bool Added = Nodes.insert({From, To}).second;
157a711a3a4SMarcel Hlopko     (void)Added;
158a711a3a4SMarcel Hlopko     assert(Added && "mapping added twice");
159a711a3a4SMarcel Hlopko   }
160a711a3a4SMarcel Hlopko 
161a711a3a4SMarcel Hlopko   syntax::Tree *find(ASTPtr P) const { return Nodes.lookup(P); }
162a711a3a4SMarcel Hlopko 
163a711a3a4SMarcel Hlopko private:
164a711a3a4SMarcel Hlopko   llvm::DenseMap<ASTPtr, syntax::Tree *> Nodes;
165a711a3a4SMarcel Hlopko };
166a711a3a4SMarcel Hlopko } // namespace
167a711a3a4SMarcel Hlopko 
1689b3f38f9SIlya Biryukov /// A helper class for constructing the syntax tree while traversing a clang
1699b3f38f9SIlya Biryukov /// AST.
1709b3f38f9SIlya Biryukov ///
1719b3f38f9SIlya Biryukov /// At each point of the traversal we maintain a list of pending nodes.
1729b3f38f9SIlya Biryukov /// Initially all tokens are added as pending nodes. When processing a clang AST
1739b3f38f9SIlya Biryukov /// node, the clients need to:
1749b3f38f9SIlya Biryukov ///   - create a corresponding syntax node,
1759b3f38f9SIlya Biryukov ///   - assign roles to all pending child nodes with 'markChild' and
1769b3f38f9SIlya Biryukov ///     'markChildToken',
1779b3f38f9SIlya Biryukov ///   - replace the child nodes with the new syntax node in the pending list
1789b3f38f9SIlya Biryukov ///     with 'foldNode'.
1799b3f38f9SIlya Biryukov ///
1809b3f38f9SIlya Biryukov /// Note that all children are expected to be processed when building a node.
1819b3f38f9SIlya Biryukov ///
1829b3f38f9SIlya Biryukov /// Call finalize() to finish building the tree and consume the root node.
1839b3f38f9SIlya Biryukov class syntax::TreeBuilder {
1849b3f38f9SIlya Biryukov public:
185c1bbefefSIlya Biryukov   TreeBuilder(syntax::Arena &Arena) : Arena(Arena), Pending(Arena) {
186c1bbefefSIlya Biryukov     for (const auto &T : Arena.tokenBuffer().expandedTokens())
187c1bbefefSIlya Biryukov       LocationToToken.insert({T.location().getRawEncoding(), &T});
188c1bbefefSIlya Biryukov   }
1899b3f38f9SIlya Biryukov 
1909b3f38f9SIlya Biryukov   llvm::BumpPtrAllocator &allocator() { return Arena.allocator(); }
1917d382dcdSMarcel Hlopko   const SourceManager &sourceManager() const { return Arena.sourceManager(); }
1929b3f38f9SIlya Biryukov 
1939b3f38f9SIlya Biryukov   /// Populate children for \p New node, assuming it covers tokens from \p
1949b3f38f9SIlya Biryukov   /// Range.
195a711a3a4SMarcel Hlopko   void foldNode(llvm::ArrayRef<syntax::Token> Range, syntax::Tree *New,
196a711a3a4SMarcel Hlopko                 ASTPtr From) {
197a711a3a4SMarcel Hlopko     assert(New);
198a711a3a4SMarcel Hlopko     Pending.foldChildren(Arena, Range, New);
199a711a3a4SMarcel Hlopko     if (From)
200a711a3a4SMarcel Hlopko       Mapping.add(From, New);
201a711a3a4SMarcel Hlopko   }
202a711a3a4SMarcel Hlopko   void foldNode(llvm::ArrayRef<syntax::Token> Range, syntax::Tree *New,
203a711a3a4SMarcel Hlopko                 TypeLoc L) {
204a711a3a4SMarcel Hlopko     // FIXME: add mapping for TypeLocs
205a711a3a4SMarcel Hlopko     foldNode(Range, New, nullptr);
206a711a3a4SMarcel Hlopko   }
2079b3f38f9SIlya Biryukov 
208e702bdb8SIlya Biryukov   /// Notifies that we should not consume trailing semicolon when computing
209e702bdb8SIlya Biryukov   /// token range of \p D.
2107d382dcdSMarcel Hlopko   void noticeDeclWithoutSemicolon(Decl *D);
211e702bdb8SIlya Biryukov 
21258fa50f4SIlya Biryukov   /// Mark the \p Child node with a corresponding \p Role. All marked children
21358fa50f4SIlya Biryukov   /// should be consumed by foldNode.
2147d382dcdSMarcel Hlopko   /// When called on expressions (clang::Expr is derived from clang::Stmt),
21558fa50f4SIlya Biryukov   /// wraps expressions into expression statement.
21658fa50f4SIlya Biryukov   void markStmtChild(Stmt *Child, NodeRole Role);
21758fa50f4SIlya Biryukov   /// Should be called for expressions in non-statement position to avoid
21858fa50f4SIlya Biryukov   /// wrapping into expression statement.
21958fa50f4SIlya Biryukov   void markExprChild(Expr *Child, NodeRole Role);
2209b3f38f9SIlya Biryukov   /// Set role for a token starting at \p Loc.
221def65bb4SIlya Biryukov   void markChildToken(SourceLocation Loc, NodeRole R);
2227d382dcdSMarcel Hlopko   /// Set role for \p T.
2237d382dcdSMarcel Hlopko   void markChildToken(const syntax::Token *T, NodeRole R);
2247d382dcdSMarcel Hlopko 
225a711a3a4SMarcel Hlopko   /// Set role for \p N.
226a711a3a4SMarcel Hlopko   void markChild(syntax::Node *N, NodeRole R);
227a711a3a4SMarcel Hlopko   /// Set role for the syntax node matching \p N.
228a711a3a4SMarcel Hlopko   void markChild(ASTPtr N, NodeRole R);
2299b3f38f9SIlya Biryukov 
2309b3f38f9SIlya Biryukov   /// Finish building the tree and consume the root node.
2319b3f38f9SIlya Biryukov   syntax::TranslationUnit *finalize() && {
2329b3f38f9SIlya Biryukov     auto Tokens = Arena.tokenBuffer().expandedTokens();
233bfbf6b6cSIlya Biryukov     assert(!Tokens.empty());
234bfbf6b6cSIlya Biryukov     assert(Tokens.back().kind() == tok::eof);
235bfbf6b6cSIlya Biryukov 
2369b3f38f9SIlya Biryukov     // Build the root of the tree, consuming all the children.
2371ad15046SIlya Biryukov     Pending.foldChildren(Arena, Tokens.drop_back(),
2389b3f38f9SIlya Biryukov                          new (Arena.allocator()) syntax::TranslationUnit);
2399b3f38f9SIlya Biryukov 
2403b929fe7SIlya Biryukov     auto *TU = cast<syntax::TranslationUnit>(std::move(Pending).finalize());
2413b929fe7SIlya Biryukov     TU->assertInvariantsRecursive();
2423b929fe7SIlya Biryukov     return TU;
2439b3f38f9SIlya Biryukov   }
2449b3f38f9SIlya Biryukov 
24588bf9b3dSMarcel Hlopko   /// Finds a token starting at \p L. The token must exist if \p L is valid.
24688bf9b3dSMarcel Hlopko   const syntax::Token *findToken(SourceLocation L) const;
24788bf9b3dSMarcel Hlopko 
248a711a3a4SMarcel Hlopko   /// Finds the syntax tokens corresponding to the \p SourceRange.
249a711a3a4SMarcel Hlopko   llvm::ArrayRef<syntax::Token> getRange(SourceRange Range) const {
250a711a3a4SMarcel Hlopko     assert(Range.isValid());
251a711a3a4SMarcel Hlopko     return getRange(Range.getBegin(), Range.getEnd());
252a711a3a4SMarcel Hlopko   }
253a711a3a4SMarcel Hlopko 
254a711a3a4SMarcel Hlopko   /// Finds the syntax tokens corresponding to the passed source locations.
2559b3f38f9SIlya Biryukov   /// \p First is the start position of the first token and \p Last is the start
2569b3f38f9SIlya Biryukov   /// position of the last token.
2579b3f38f9SIlya Biryukov   llvm::ArrayRef<syntax::Token> getRange(SourceLocation First,
2589b3f38f9SIlya Biryukov                                          SourceLocation Last) const {
2599b3f38f9SIlya Biryukov     assert(First.isValid());
2609b3f38f9SIlya Biryukov     assert(Last.isValid());
2619b3f38f9SIlya Biryukov     assert(First == Last ||
2629b3f38f9SIlya Biryukov            Arena.sourceManager().isBeforeInTranslationUnit(First, Last));
2639b3f38f9SIlya Biryukov     return llvm::makeArrayRef(findToken(First), std::next(findToken(Last)));
2649b3f38f9SIlya Biryukov   }
26588bf9b3dSMarcel Hlopko 
26688bf9b3dSMarcel Hlopko   llvm::ArrayRef<syntax::Token>
26788bf9b3dSMarcel Hlopko   getTemplateRange(const ClassTemplateSpecializationDecl *D) const {
268a711a3a4SMarcel Hlopko     auto Tokens = getRange(D->getSourceRange());
26988bf9b3dSMarcel Hlopko     return maybeAppendSemicolon(Tokens, D);
27088bf9b3dSMarcel Hlopko   }
27188bf9b3dSMarcel Hlopko 
272cdce2fe5SMarcel Hlopko   /// Returns true if \p D is the last declarator in a chain and is thus
273cdce2fe5SMarcel Hlopko   /// reponsible for creating SimpleDeclaration for the whole chain.
274cdce2fe5SMarcel Hlopko   template <class T>
275cdce2fe5SMarcel Hlopko   bool isResponsibleForCreatingDeclaration(const T *D) const {
276cdce2fe5SMarcel Hlopko     static_assert((std::is_base_of<DeclaratorDecl, T>::value ||
277cdce2fe5SMarcel Hlopko                    std::is_base_of<TypedefNameDecl, T>::value),
278cdce2fe5SMarcel Hlopko                   "only DeclaratorDecl and TypedefNameDecl are supported.");
279cdce2fe5SMarcel Hlopko 
280cdce2fe5SMarcel Hlopko     const Decl *Next = D->getNextDeclInContext();
281cdce2fe5SMarcel Hlopko 
282cdce2fe5SMarcel Hlopko     // There's no next sibling, this one is responsible.
283cdce2fe5SMarcel Hlopko     if (Next == nullptr) {
284cdce2fe5SMarcel Hlopko       return true;
285cdce2fe5SMarcel Hlopko     }
286cdce2fe5SMarcel Hlopko     const auto *NextT = llvm::dyn_cast<T>(Next);
287cdce2fe5SMarcel Hlopko 
288cdce2fe5SMarcel Hlopko     // Next sibling is not the same type, this one is responsible.
289cdce2fe5SMarcel Hlopko     if (NextT == nullptr) {
290cdce2fe5SMarcel Hlopko       return true;
291cdce2fe5SMarcel Hlopko     }
292cdce2fe5SMarcel Hlopko     // Next sibling doesn't begin at the same loc, it must be a different
293cdce2fe5SMarcel Hlopko     // declaration, so this declarator is responsible.
294cdce2fe5SMarcel Hlopko     if (NextT->getBeginLoc() != D->getBeginLoc()) {
295cdce2fe5SMarcel Hlopko       return true;
296cdce2fe5SMarcel Hlopko     }
297cdce2fe5SMarcel Hlopko 
298cdce2fe5SMarcel Hlopko     // NextT is a member of the same declaration, and we need the last member to
299cdce2fe5SMarcel Hlopko     // create declaration. This one is not responsible.
300cdce2fe5SMarcel Hlopko     return false;
301cdce2fe5SMarcel Hlopko   }
302cdce2fe5SMarcel Hlopko 
303cdce2fe5SMarcel Hlopko   llvm::ArrayRef<syntax::Token> getDeclarationRange(Decl *D) {
30488bf9b3dSMarcel Hlopko     llvm::ArrayRef<clang::syntax::Token> Tokens;
30588bf9b3dSMarcel Hlopko     // We want to drop the template parameters for specializations.
30688bf9b3dSMarcel Hlopko     if (const auto *S = llvm::dyn_cast<TagDecl>(D))
30788bf9b3dSMarcel Hlopko       Tokens = getRange(S->TypeDecl::getBeginLoc(), S->getEndLoc());
30888bf9b3dSMarcel Hlopko     else
309a711a3a4SMarcel Hlopko       Tokens = getRange(D->getSourceRange());
31088bf9b3dSMarcel Hlopko     return maybeAppendSemicolon(Tokens, D);
3119b3f38f9SIlya Biryukov   }
312cdce2fe5SMarcel Hlopko 
31358fa50f4SIlya Biryukov   llvm::ArrayRef<syntax::Token> getExprRange(const Expr *E) const {
314a711a3a4SMarcel Hlopko     return getRange(E->getSourceRange());
31558fa50f4SIlya Biryukov   }
316cdce2fe5SMarcel Hlopko 
31758fa50f4SIlya Biryukov   /// Find the adjusted range for the statement, consuming the trailing
31858fa50f4SIlya Biryukov   /// semicolon when needed.
31958fa50f4SIlya Biryukov   llvm::ArrayRef<syntax::Token> getStmtRange(const Stmt *S) const {
320a711a3a4SMarcel Hlopko     auto Tokens = getRange(S->getSourceRange());
32158fa50f4SIlya Biryukov     if (isa<CompoundStmt>(S))
32258fa50f4SIlya Biryukov       return Tokens;
32358fa50f4SIlya Biryukov 
32458fa50f4SIlya Biryukov     // Some statements miss a trailing semicolon, e.g. 'return', 'continue' and
32558fa50f4SIlya Biryukov     // all statements that end with those. Consume this semicolon here.
326e702bdb8SIlya Biryukov     if (Tokens.back().kind() == tok::semi)
327e702bdb8SIlya Biryukov       return Tokens;
328e702bdb8SIlya Biryukov     return withTrailingSemicolon(Tokens);
329e702bdb8SIlya Biryukov   }
330e702bdb8SIlya Biryukov 
331e702bdb8SIlya Biryukov private:
332e702bdb8SIlya Biryukov   llvm::ArrayRef<syntax::Token>
33388bf9b3dSMarcel Hlopko   maybeAppendSemicolon(llvm::ArrayRef<syntax::Token> Tokens,
33488bf9b3dSMarcel Hlopko                        const Decl *D) const {
33588bf9b3dSMarcel Hlopko     if (llvm::isa<NamespaceDecl>(D))
33688bf9b3dSMarcel Hlopko       return Tokens;
33788bf9b3dSMarcel Hlopko     if (DeclsWithoutSemicolons.count(D))
33888bf9b3dSMarcel Hlopko       return Tokens;
33988bf9b3dSMarcel Hlopko     // FIXME: do not consume trailing semicolon on function definitions.
34088bf9b3dSMarcel Hlopko     // Most declarations own a semicolon in syntax trees, but not in clang AST.
34188bf9b3dSMarcel Hlopko     return withTrailingSemicolon(Tokens);
34288bf9b3dSMarcel Hlopko   }
34388bf9b3dSMarcel Hlopko 
34488bf9b3dSMarcel Hlopko   llvm::ArrayRef<syntax::Token>
345e702bdb8SIlya Biryukov   withTrailingSemicolon(llvm::ArrayRef<syntax::Token> Tokens) const {
346e702bdb8SIlya Biryukov     assert(!Tokens.empty());
347e702bdb8SIlya Biryukov     assert(Tokens.back().kind() != tok::eof);
3487d382dcdSMarcel Hlopko     // We never consume 'eof', so looking at the next token is ok.
34958fa50f4SIlya Biryukov     if (Tokens.back().kind() != tok::semi && Tokens.end()->kind() == tok::semi)
35058fa50f4SIlya Biryukov       return llvm::makeArrayRef(Tokens.begin(), Tokens.end() + 1);
35158fa50f4SIlya Biryukov     return Tokens;
3529b3f38f9SIlya Biryukov   }
3539b3f38f9SIlya Biryukov 
354a711a3a4SMarcel Hlopko   void setRole(syntax::Node *N, NodeRole R) {
355a711a3a4SMarcel Hlopko     assert(N->role() == NodeRole::Detached);
356a711a3a4SMarcel Hlopko     N->setRole(R);
357a711a3a4SMarcel Hlopko   }
358a711a3a4SMarcel Hlopko 
3599b3f38f9SIlya Biryukov   /// A collection of trees covering the input tokens.
3609b3f38f9SIlya Biryukov   /// When created, each tree corresponds to a single token in the file.
3619b3f38f9SIlya Biryukov   /// Clients call 'foldChildren' to attach one or more subtrees to a parent
3629b3f38f9SIlya Biryukov   /// node and update the list of trees accordingly.
3639b3f38f9SIlya Biryukov   ///
3649b3f38f9SIlya Biryukov   /// Ensures that added nodes properly nest and cover the whole token stream.
3659b3f38f9SIlya Biryukov   struct Forest {
3669b3f38f9SIlya Biryukov     Forest(syntax::Arena &A) {
367bfbf6b6cSIlya Biryukov       assert(!A.tokenBuffer().expandedTokens().empty());
368bfbf6b6cSIlya Biryukov       assert(A.tokenBuffer().expandedTokens().back().kind() == tok::eof);
3699b3f38f9SIlya Biryukov       // Create all leaf nodes.
370bfbf6b6cSIlya Biryukov       // Note that we do not have 'eof' in the tree.
3711ad15046SIlya Biryukov       for (auto &T : A.tokenBuffer().expandedTokens().drop_back()) {
3721ad15046SIlya Biryukov         auto *L = new (A.allocator()) syntax::Leaf(&T);
3731ad15046SIlya Biryukov         L->Original = true;
3741ad15046SIlya Biryukov         L->CanModify = A.tokenBuffer().spelledForExpanded(T).hasValue();
375a711a3a4SMarcel Hlopko         Trees.insert(Trees.end(), {&T, L});
3761ad15046SIlya Biryukov       }
3779b3f38f9SIlya Biryukov     }
3789b3f38f9SIlya Biryukov 
3799b3f38f9SIlya Biryukov     void assignRole(llvm::ArrayRef<syntax::Token> Range,
3809b3f38f9SIlya Biryukov                     syntax::NodeRole Role) {
3819b3f38f9SIlya Biryukov       assert(!Range.empty());
3829b3f38f9SIlya Biryukov       auto It = Trees.lower_bound(Range.begin());
3839b3f38f9SIlya Biryukov       assert(It != Trees.end() && "no node found");
3849b3f38f9SIlya Biryukov       assert(It->first == Range.begin() && "no child with the specified range");
3859b3f38f9SIlya Biryukov       assert((std::next(It) == Trees.end() ||
3869b3f38f9SIlya Biryukov               std::next(It)->first == Range.end()) &&
3879b3f38f9SIlya Biryukov              "no child with the specified range");
388a711a3a4SMarcel Hlopko       assert(It->second->role() == NodeRole::Detached &&
389a711a3a4SMarcel Hlopko              "re-assigning role for a child");
390a711a3a4SMarcel Hlopko       It->second->setRole(Role);
3919b3f38f9SIlya Biryukov     }
3929b3f38f9SIlya Biryukov 
393e702bdb8SIlya Biryukov     /// Add \p Node to the forest and attach child nodes based on \p Tokens.
3941ad15046SIlya Biryukov     void foldChildren(const syntax::Arena &A,
3951ad15046SIlya Biryukov                       llvm::ArrayRef<syntax::Token> Tokens,
3969b3f38f9SIlya Biryukov                       syntax::Tree *Node) {
397e702bdb8SIlya Biryukov       // Attach children to `Node`.
398cdce2fe5SMarcel Hlopko       assert(Node->firstChild() == nullptr && "node already has children");
399cdce2fe5SMarcel Hlopko 
400cdce2fe5SMarcel Hlopko       auto *FirstToken = Tokens.begin();
401cdce2fe5SMarcel Hlopko       auto BeginChildren = Trees.lower_bound(FirstToken);
402cdce2fe5SMarcel Hlopko 
403cdce2fe5SMarcel Hlopko       assert((BeginChildren == Trees.end() ||
404cdce2fe5SMarcel Hlopko               BeginChildren->first == FirstToken) &&
405cdce2fe5SMarcel Hlopko              "fold crosses boundaries of existing subtrees");
406cdce2fe5SMarcel Hlopko       auto EndChildren = Trees.lower_bound(Tokens.end());
407cdce2fe5SMarcel Hlopko       assert(
408cdce2fe5SMarcel Hlopko           (EndChildren == Trees.end() || EndChildren->first == Tokens.end()) &&
409cdce2fe5SMarcel Hlopko           "fold crosses boundaries of existing subtrees");
410cdce2fe5SMarcel Hlopko 
411cdce2fe5SMarcel Hlopko       // We need to go in reverse order, because we can only prepend.
412cdce2fe5SMarcel Hlopko       for (auto It = EndChildren; It != BeginChildren; --It) {
413cdce2fe5SMarcel Hlopko         auto *C = std::prev(It)->second;
414cdce2fe5SMarcel Hlopko         if (C->role() == NodeRole::Detached)
415cdce2fe5SMarcel Hlopko           C->setRole(NodeRole::Unknown);
416cdce2fe5SMarcel Hlopko         Node->prependChildLowLevel(C);
417e702bdb8SIlya Biryukov       }
4189b3f38f9SIlya Biryukov 
419cdce2fe5SMarcel Hlopko       // Mark that this node came from the AST and is backed by the source code.
420cdce2fe5SMarcel Hlopko       Node->Original = true;
421cdce2fe5SMarcel Hlopko       Node->CanModify = A.tokenBuffer().spelledForExpanded(Tokens).hasValue();
4229b3f38f9SIlya Biryukov 
423cdce2fe5SMarcel Hlopko       Trees.erase(BeginChildren, EndChildren);
424cdce2fe5SMarcel Hlopko       Trees.insert({FirstToken, Node});
4259b3f38f9SIlya Biryukov     }
4269b3f38f9SIlya Biryukov 
4279b3f38f9SIlya Biryukov     // EXPECTS: all tokens were consumed and are owned by a single root node.
4289b3f38f9SIlya Biryukov     syntax::Node *finalize() && {
4299b3f38f9SIlya Biryukov       assert(Trees.size() == 1);
430a711a3a4SMarcel Hlopko       auto *Root = Trees.begin()->second;
4319b3f38f9SIlya Biryukov       Trees = {};
4329b3f38f9SIlya Biryukov       return Root;
4339b3f38f9SIlya Biryukov     }
4349b3f38f9SIlya Biryukov 
4359b3f38f9SIlya Biryukov     std::string str(const syntax::Arena &A) const {
4369b3f38f9SIlya Biryukov       std::string R;
4379b3f38f9SIlya Biryukov       for (auto It = Trees.begin(); It != Trees.end(); ++It) {
4389b3f38f9SIlya Biryukov         unsigned CoveredTokens =
4399b3f38f9SIlya Biryukov             It != Trees.end()
4409b3f38f9SIlya Biryukov                 ? (std::next(It)->first - It->first)
4419b3f38f9SIlya Biryukov                 : A.tokenBuffer().expandedTokens().end() - It->first;
4429b3f38f9SIlya Biryukov 
443adcd0268SBenjamin Kramer         R += std::string(llvm::formatv(
444a711a3a4SMarcel Hlopko             "- '{0}' covers '{1}'+{2} tokens\n", It->second->kind(),
445adcd0268SBenjamin Kramer             It->first->text(A.sourceManager()), CoveredTokens));
446a711a3a4SMarcel Hlopko         R += It->second->dump(A);
4479b3f38f9SIlya Biryukov       }
4489b3f38f9SIlya Biryukov       return R;
4499b3f38f9SIlya Biryukov     }
4509b3f38f9SIlya Biryukov 
4519b3f38f9SIlya Biryukov   private:
4529b3f38f9SIlya Biryukov     /// Maps from the start token to a subtree starting at that token.
453302cb3bcSIlya Biryukov     /// Keys in the map are pointers into the array of expanded tokens, so
454302cb3bcSIlya Biryukov     /// pointer order corresponds to the order of preprocessor tokens.
455a711a3a4SMarcel Hlopko     std::map<const syntax::Token *, syntax::Node *> Trees;
4569b3f38f9SIlya Biryukov   };
4579b3f38f9SIlya Biryukov 
4589b3f38f9SIlya Biryukov   /// For debugging purposes.
4599b3f38f9SIlya Biryukov   std::string str() { return Pending.str(Arena); }
4609b3f38f9SIlya Biryukov 
4619b3f38f9SIlya Biryukov   syntax::Arena &Arena;
462c1bbefefSIlya Biryukov   /// To quickly find tokens by their start location.
463c1bbefefSIlya Biryukov   llvm::DenseMap</*SourceLocation*/ unsigned, const syntax::Token *>
464c1bbefefSIlya Biryukov       LocationToToken;
4659b3f38f9SIlya Biryukov   Forest Pending;
466e702bdb8SIlya Biryukov   llvm::DenseSet<Decl *> DeclsWithoutSemicolons;
467a711a3a4SMarcel Hlopko   ASTToSyntaxMapping Mapping;
4689b3f38f9SIlya Biryukov };
4699b3f38f9SIlya Biryukov 
4709b3f38f9SIlya Biryukov namespace {
4719b3f38f9SIlya Biryukov class BuildTreeVisitor : public RecursiveASTVisitor<BuildTreeVisitor> {
4729b3f38f9SIlya Biryukov public:
4739b3f38f9SIlya Biryukov   explicit BuildTreeVisitor(ASTContext &Ctx, syntax::TreeBuilder &Builder)
4749b3f38f9SIlya Biryukov       : Builder(Builder), LangOpts(Ctx.getLangOpts()) {}
4759b3f38f9SIlya Biryukov 
4769b3f38f9SIlya Biryukov   bool shouldTraversePostOrder() const { return true; }
4779b3f38f9SIlya Biryukov 
4787d382dcdSMarcel Hlopko   bool WalkUpFromDeclaratorDecl(DeclaratorDecl *DD) {
479cdce2fe5SMarcel Hlopko     return processDeclaratorAndDeclaration(DD);
4807d382dcdSMarcel Hlopko   }
4817d382dcdSMarcel Hlopko 
482cdce2fe5SMarcel Hlopko   bool WalkUpFromTypedefNameDecl(TypedefNameDecl *TD) {
483cdce2fe5SMarcel Hlopko     return processDeclaratorAndDeclaration(TD);
4849b3f38f9SIlya Biryukov   }
4859b3f38f9SIlya Biryukov 
4869b3f38f9SIlya Biryukov   bool VisitDecl(Decl *D) {
4879b3f38f9SIlya Biryukov     assert(!D->isImplicit());
488cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(D),
489a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UnknownDeclaration(), D);
490e702bdb8SIlya Biryukov     return true;
491e702bdb8SIlya Biryukov   }
492e702bdb8SIlya Biryukov 
49388bf9b3dSMarcel Hlopko   // RAV does not call WalkUpFrom* on explicit instantiations, so we have to
49488bf9b3dSMarcel Hlopko   // override Traverse.
49588bf9b3dSMarcel Hlopko   // FIXME: make RAV call WalkUpFrom* instead.
49688bf9b3dSMarcel Hlopko   bool
49788bf9b3dSMarcel Hlopko   TraverseClassTemplateSpecializationDecl(ClassTemplateSpecializationDecl *C) {
49888bf9b3dSMarcel Hlopko     if (!RecursiveASTVisitor::TraverseClassTemplateSpecializationDecl(C))
49988bf9b3dSMarcel Hlopko       return false;
50088bf9b3dSMarcel Hlopko     if (C->isExplicitSpecialization())
50188bf9b3dSMarcel Hlopko       return true; // we are only interested in explicit instantiations.
502a711a3a4SMarcel Hlopko     auto *Declaration =
503a711a3a4SMarcel Hlopko         cast<syntax::SimpleDeclaration>(handleFreeStandingTagDecl(C));
50488bf9b3dSMarcel Hlopko     foldExplicitTemplateInstantiation(
50588bf9b3dSMarcel Hlopko         Builder.getTemplateRange(C), Builder.findToken(C->getExternLoc()),
506a711a3a4SMarcel Hlopko         Builder.findToken(C->getTemplateKeywordLoc()), Declaration, C);
50788bf9b3dSMarcel Hlopko     return true;
50888bf9b3dSMarcel Hlopko   }
50988bf9b3dSMarcel Hlopko 
51088bf9b3dSMarcel Hlopko   bool WalkUpFromTemplateDecl(TemplateDecl *S) {
51188bf9b3dSMarcel Hlopko     foldTemplateDeclaration(
512cdce2fe5SMarcel Hlopko         Builder.getDeclarationRange(S),
51388bf9b3dSMarcel Hlopko         Builder.findToken(S->getTemplateParameters()->getTemplateLoc()),
514cdce2fe5SMarcel Hlopko         Builder.getDeclarationRange(S->getTemplatedDecl()), S);
51588bf9b3dSMarcel Hlopko     return true;
51688bf9b3dSMarcel Hlopko   }
51788bf9b3dSMarcel Hlopko 
518e702bdb8SIlya Biryukov   bool WalkUpFromTagDecl(TagDecl *C) {
51904f627f6SIlya Biryukov     // FIXME: build the ClassSpecifier node.
52088bf9b3dSMarcel Hlopko     if (!C->isFreeStanding()) {
52188bf9b3dSMarcel Hlopko       assert(C->getNumTemplateParameterLists() == 0);
52204f627f6SIlya Biryukov       return true;
52304f627f6SIlya Biryukov     }
524a711a3a4SMarcel Hlopko     handleFreeStandingTagDecl(C);
525a711a3a4SMarcel Hlopko     return true;
526a711a3a4SMarcel Hlopko   }
527a711a3a4SMarcel Hlopko 
528a711a3a4SMarcel Hlopko   syntax::Declaration *handleFreeStandingTagDecl(TagDecl *C) {
529a711a3a4SMarcel Hlopko     assert(C->isFreeStanding());
53088bf9b3dSMarcel Hlopko     // Class is a declaration specifier and needs a spanning declaration node.
531cdce2fe5SMarcel Hlopko     auto DeclarationRange = Builder.getDeclarationRange(C);
532a711a3a4SMarcel Hlopko     syntax::Declaration *Result = new (allocator()) syntax::SimpleDeclaration;
533a711a3a4SMarcel Hlopko     Builder.foldNode(DeclarationRange, Result, nullptr);
53488bf9b3dSMarcel Hlopko 
53588bf9b3dSMarcel Hlopko     // Build TemplateDeclaration nodes if we had template parameters.
53688bf9b3dSMarcel Hlopko     auto ConsumeTemplateParameters = [&](const TemplateParameterList &L) {
53788bf9b3dSMarcel Hlopko       const auto *TemplateKW = Builder.findToken(L.getTemplateLoc());
53888bf9b3dSMarcel Hlopko       auto R = llvm::makeArrayRef(TemplateKW, DeclarationRange.end());
539a711a3a4SMarcel Hlopko       Result =
540a711a3a4SMarcel Hlopko           foldTemplateDeclaration(R, TemplateKW, DeclarationRange, nullptr);
54188bf9b3dSMarcel Hlopko       DeclarationRange = R;
54288bf9b3dSMarcel Hlopko     };
54388bf9b3dSMarcel Hlopko     if (auto *S = llvm::dyn_cast<ClassTemplatePartialSpecializationDecl>(C))
54488bf9b3dSMarcel Hlopko       ConsumeTemplateParameters(*S->getTemplateParameters());
54588bf9b3dSMarcel Hlopko     for (unsigned I = C->getNumTemplateParameterLists(); 0 < I; --I)
54688bf9b3dSMarcel Hlopko       ConsumeTemplateParameters(*C->getTemplateParameterList(I - 1));
547a711a3a4SMarcel Hlopko     return Result;
5489b3f38f9SIlya Biryukov   }
5499b3f38f9SIlya Biryukov 
5509b3f38f9SIlya Biryukov   bool WalkUpFromTranslationUnitDecl(TranslationUnitDecl *TU) {
5517d382dcdSMarcel Hlopko     // We do not want to call VisitDecl(), the declaration for translation
5529b3f38f9SIlya Biryukov     // unit is built by finalize().
5539b3f38f9SIlya Biryukov     return true;
5549b3f38f9SIlya Biryukov   }
5559b3f38f9SIlya Biryukov 
5569b3f38f9SIlya Biryukov   bool WalkUpFromCompoundStmt(CompoundStmt *S) {
55751dad419SIlya Biryukov     using NodeRole = syntax::NodeRole;
5589b3f38f9SIlya Biryukov 
559def65bb4SIlya Biryukov     Builder.markChildToken(S->getLBracLoc(), NodeRole::OpenParen);
56058fa50f4SIlya Biryukov     for (auto *Child : S->body())
56158fa50f4SIlya Biryukov       Builder.markStmtChild(Child, NodeRole::CompoundStatement_statement);
562def65bb4SIlya Biryukov     Builder.markChildToken(S->getRBracLoc(), NodeRole::CloseParen);
5639b3f38f9SIlya Biryukov 
56458fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
565a711a3a4SMarcel Hlopko                      new (allocator()) syntax::CompoundStatement, S);
5669b3f38f9SIlya Biryukov     return true;
5679b3f38f9SIlya Biryukov   }
5689b3f38f9SIlya Biryukov 
56958fa50f4SIlya Biryukov   // Some statements are not yet handled by syntax trees.
57058fa50f4SIlya Biryukov   bool WalkUpFromStmt(Stmt *S) {
57158fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
572a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UnknownStatement, S);
57358fa50f4SIlya Biryukov     return true;
57458fa50f4SIlya Biryukov   }
57558fa50f4SIlya Biryukov 
57658fa50f4SIlya Biryukov   bool TraverseCXXForRangeStmt(CXXForRangeStmt *S) {
57758fa50f4SIlya Biryukov     // We override to traverse range initializer as VarDecl.
57858fa50f4SIlya Biryukov     // RAV traverses it as a statement, we produce invalid node kinds in that
57958fa50f4SIlya Biryukov     // case.
58058fa50f4SIlya Biryukov     // FIXME: should do this in RAV instead?
58158fa50f4SIlya Biryukov     if (S->getInit() && !TraverseStmt(S->getInit()))
58258fa50f4SIlya Biryukov       return false;
58358fa50f4SIlya Biryukov     if (S->getLoopVariable() && !TraverseDecl(S->getLoopVariable()))
58458fa50f4SIlya Biryukov       return false;
58558fa50f4SIlya Biryukov     if (S->getRangeInit() && !TraverseStmt(S->getRangeInit()))
58658fa50f4SIlya Biryukov       return false;
58758fa50f4SIlya Biryukov     if (S->getBody() && !TraverseStmt(S->getBody()))
58858fa50f4SIlya Biryukov       return false;
58958fa50f4SIlya Biryukov     return true;
59058fa50f4SIlya Biryukov   }
59158fa50f4SIlya Biryukov 
59258fa50f4SIlya Biryukov   bool TraverseStmt(Stmt *S) {
593e702bdb8SIlya Biryukov     if (auto *DS = llvm::dyn_cast_or_null<DeclStmt>(S)) {
594e702bdb8SIlya Biryukov       // We want to consume the semicolon, make sure SimpleDeclaration does not.
595e702bdb8SIlya Biryukov       for (auto *D : DS->decls())
5967d382dcdSMarcel Hlopko         Builder.noticeDeclWithoutSemicolon(D);
597e702bdb8SIlya Biryukov     } else if (auto *E = llvm::dyn_cast_or_null<Expr>(S)) {
5983785eb83SEduardo Caldas       return RecursiveASTVisitor::TraverseStmt(E->IgnoreImplicit());
59958fa50f4SIlya Biryukov     }
60058fa50f4SIlya Biryukov     return RecursiveASTVisitor::TraverseStmt(S);
60158fa50f4SIlya Biryukov   }
60258fa50f4SIlya Biryukov 
60358fa50f4SIlya Biryukov   // Some expressions are not yet handled by syntax trees.
60458fa50f4SIlya Biryukov   bool WalkUpFromExpr(Expr *E) {
60558fa50f4SIlya Biryukov     assert(!isImplicitExpr(E) && "should be handled by TraverseStmt");
60658fa50f4SIlya Biryukov     Builder.foldNode(Builder.getExprRange(E),
607a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UnknownExpression, E);
60858fa50f4SIlya Biryukov     return true;
60958fa50f4SIlya Biryukov   }
61058fa50f4SIlya Biryukov 
6111b2f6b4aSEduardo Caldas   syntax::NestedNameSpecifier *
6121b2f6b4aSEduardo Caldas   BuildNestedNameSpecifier(NestedNameSpecifierLoc QualifierLoc) {
6131b2f6b4aSEduardo Caldas     if (!QualifierLoc)
6141b2f6b4aSEduardo Caldas       return nullptr;
6151b2f6b4aSEduardo Caldas     for (auto it = QualifierLoc; it; it = it.getPrefix()) {
6161b2f6b4aSEduardo Caldas       auto *NS = new (allocator()) syntax::NameSpecifier;
6171b2f6b4aSEduardo Caldas       Builder.foldNode(Builder.getRange(it.getLocalSourceRange()), NS, nullptr);
6181b2f6b4aSEduardo Caldas       Builder.markChild(NS, syntax::NodeRole::NestedNameSpecifier_specifier);
6191b2f6b4aSEduardo Caldas     }
6201b2f6b4aSEduardo Caldas     auto *NNS = new (allocator()) syntax::NestedNameSpecifier;
6211b2f6b4aSEduardo Caldas     Builder.foldNode(Builder.getRange(QualifierLoc.getSourceRange()), NNS,
6221b2f6b4aSEduardo Caldas                      nullptr);
6231b2f6b4aSEduardo Caldas     return NNS;
6241b2f6b4aSEduardo Caldas   }
6251b2f6b4aSEduardo Caldas 
6261b2f6b4aSEduardo Caldas   bool WalkUpFromDeclRefExpr(DeclRefExpr *S) {
6271b2f6b4aSEduardo Caldas     if (auto *NNS = BuildNestedNameSpecifier(S->getQualifierLoc()))
6281b2f6b4aSEduardo Caldas       Builder.markChild(NNS, syntax::NodeRole::IdExpression_qualifier);
6291b2f6b4aSEduardo Caldas 
6301b2f6b4aSEduardo Caldas     auto *unqualifiedId = new (allocator()) syntax::UnqualifiedId;
6311b2f6b4aSEduardo Caldas     // Get `UnqualifiedId` from `DeclRefExpr`.
6321b2f6b4aSEduardo Caldas     // FIXME: Extract this logic so that it can be used by `MemberExpr`,
6331b2f6b4aSEduardo Caldas     // and other semantic constructs, now it is tied to `DeclRefExpr`.
6341b2f6b4aSEduardo Caldas     if (!S->hasExplicitTemplateArgs()) {
6351b2f6b4aSEduardo Caldas       Builder.foldNode(Builder.getRange(S->getNameInfo().getSourceRange()),
6361b2f6b4aSEduardo Caldas                        unqualifiedId, nullptr);
6371b2f6b4aSEduardo Caldas     } else {
6381b2f6b4aSEduardo Caldas       auto templateIdSourceRange =
6391b2f6b4aSEduardo Caldas           SourceRange(S->getNameInfo().getBeginLoc(), S->getRAngleLoc());
6401b2f6b4aSEduardo Caldas       Builder.foldNode(Builder.getRange(templateIdSourceRange), unqualifiedId,
6411b2f6b4aSEduardo Caldas                        nullptr);
6421b2f6b4aSEduardo Caldas     }
6431b2f6b4aSEduardo Caldas     Builder.markChild(unqualifiedId, syntax::NodeRole::IdExpression_id);
6441b2f6b4aSEduardo Caldas 
6451b2f6b4aSEduardo Caldas     Builder.foldNode(Builder.getExprRange(S),
6461b2f6b4aSEduardo Caldas                      new (allocator()) syntax::IdExpression, S);
6471b2f6b4aSEduardo Caldas     return true;
6481b2f6b4aSEduardo Caldas   }
6491b2f6b4aSEduardo Caldas 
6503b739690SEduardo Caldas   bool WalkUpFromIntegerLiteral(IntegerLiteral *S) {
65142f6fec3SEduardo Caldas     Builder.markChildToken(S->getLocation(), syntax::NodeRole::LiteralToken);
6523b739690SEduardo Caldas     Builder.foldNode(Builder.getExprRange(S),
6533b739690SEduardo Caldas                      new (allocator()) syntax::IntegerLiteralExpression, S);
6543b739690SEduardo Caldas     return true;
6553b739690SEduardo Caldas   }
6563b739690SEduardo Caldas 
657*7f7f8564SEduardo Caldas   bool WalkUpFromCXXBoolLiteralExpr(CXXBoolLiteralExpr *S) {
658*7f7f8564SEduardo Caldas     Builder.markChildToken(S->getLocation(), syntax::NodeRole::LiteralToken);
659*7f7f8564SEduardo Caldas     Builder.foldNode(Builder.getExprRange(S),
660*7f7f8564SEduardo Caldas                      new (allocator()) syntax::BoolLiteralExpression, S);
661*7f7f8564SEduardo Caldas     return true;
662*7f7f8564SEduardo Caldas   }
663*7f7f8564SEduardo Caldas 
664007098d7SEduardo Caldas   bool WalkUpFromCXXNullPtrLiteralExpr(CXXNullPtrLiteralExpr *S) {
66542f6fec3SEduardo Caldas     Builder.markChildToken(S->getLocation(), syntax::NodeRole::LiteralToken);
666007098d7SEduardo Caldas     Builder.foldNode(Builder.getExprRange(S),
667007098d7SEduardo Caldas                      new (allocator()) syntax::CxxNullPtrExpression, S);
668007098d7SEduardo Caldas     return true;
669007098d7SEduardo Caldas   }
670007098d7SEduardo Caldas 
671461af57dSEduardo Caldas   bool WalkUpFromUnaryOperator(UnaryOperator *S) {
67242f6fec3SEduardo Caldas     Builder.markChildToken(S->getOperatorLoc(),
67342f6fec3SEduardo Caldas                            syntax::NodeRole::OperatorExpression_operatorToken);
674461af57dSEduardo Caldas     Builder.markExprChild(S->getSubExpr(),
675461af57dSEduardo Caldas                           syntax::NodeRole::UnaryOperatorExpression_operand);
676461af57dSEduardo Caldas 
677461af57dSEduardo Caldas     if (S->isPostfix())
678461af57dSEduardo Caldas       Builder.foldNode(Builder.getExprRange(S),
679461af57dSEduardo Caldas                        new (allocator()) syntax::PostfixUnaryOperatorExpression,
680461af57dSEduardo Caldas                        S);
681461af57dSEduardo Caldas     else
682461af57dSEduardo Caldas       Builder.foldNode(Builder.getExprRange(S),
683461af57dSEduardo Caldas                        new (allocator()) syntax::PrefixUnaryOperatorExpression,
684461af57dSEduardo Caldas                        S);
685461af57dSEduardo Caldas 
686461af57dSEduardo Caldas     return true;
687461af57dSEduardo Caldas   }
688461af57dSEduardo Caldas 
6893785eb83SEduardo Caldas   bool WalkUpFromBinaryOperator(BinaryOperator *S) {
6903785eb83SEduardo Caldas     Builder.markExprChild(
6913785eb83SEduardo Caldas         S->getLHS(), syntax::NodeRole::BinaryOperatorExpression_leftHandSide);
69242f6fec3SEduardo Caldas     Builder.markChildToken(S->getOperatorLoc(),
69342f6fec3SEduardo Caldas                            syntax::NodeRole::OperatorExpression_operatorToken);
6943785eb83SEduardo Caldas     Builder.markExprChild(
6953785eb83SEduardo Caldas         S->getRHS(), syntax::NodeRole::BinaryOperatorExpression_rightHandSide);
6963785eb83SEduardo Caldas     Builder.foldNode(Builder.getExprRange(S),
6973785eb83SEduardo Caldas                      new (allocator()) syntax::BinaryOperatorExpression, S);
6983785eb83SEduardo Caldas     return true;
6993785eb83SEduardo Caldas   }
7003785eb83SEduardo Caldas 
7013a574a6cSEduardo Caldas   bool WalkUpFromCXXOperatorCallExpr(CXXOperatorCallExpr *S) {
7023a574a6cSEduardo Caldas     if (S->isInfixBinaryOp()) {
7033a574a6cSEduardo Caldas       Builder.markExprChild(
7043a574a6cSEduardo Caldas           S->getArg(0),
7053a574a6cSEduardo Caldas           syntax::NodeRole::BinaryOperatorExpression_leftHandSide);
7063a574a6cSEduardo Caldas       Builder.markChildToken(
7073a574a6cSEduardo Caldas           S->getOperatorLoc(),
70842f6fec3SEduardo Caldas           syntax::NodeRole::OperatorExpression_operatorToken);
7093a574a6cSEduardo Caldas       Builder.markExprChild(
7103a574a6cSEduardo Caldas           S->getArg(1),
7113a574a6cSEduardo Caldas           syntax::NodeRole::BinaryOperatorExpression_rightHandSide);
7123a574a6cSEduardo Caldas       Builder.foldNode(Builder.getExprRange(S),
7133a574a6cSEduardo Caldas                        new (allocator()) syntax::BinaryOperatorExpression, S);
7143a574a6cSEduardo Caldas       return true;
7153a574a6cSEduardo Caldas     }
7163a574a6cSEduardo Caldas     return RecursiveASTVisitor::WalkUpFromCXXOperatorCallExpr(S);
7173a574a6cSEduardo Caldas   }
7183a574a6cSEduardo Caldas 
719be14a22bSIlya Biryukov   bool WalkUpFromNamespaceDecl(NamespaceDecl *S) {
720cdce2fe5SMarcel Hlopko     auto Tokens = Builder.getDeclarationRange(S);
721be14a22bSIlya Biryukov     if (Tokens.front().kind() == tok::coloncolon) {
722be14a22bSIlya Biryukov       // Handle nested namespace definitions. Those start at '::' token, e.g.
723be14a22bSIlya Biryukov       // namespace a^::b {}
724be14a22bSIlya Biryukov       // FIXME: build corresponding nodes for the name of this namespace.
725be14a22bSIlya Biryukov       return true;
726be14a22bSIlya Biryukov     }
727a711a3a4SMarcel Hlopko     Builder.foldNode(Tokens, new (allocator()) syntax::NamespaceDefinition, S);
728be14a22bSIlya Biryukov     return true;
729be14a22bSIlya Biryukov   }
730be14a22bSIlya Biryukov 
7317d382dcdSMarcel Hlopko   bool TraverseParenTypeLoc(ParenTypeLoc L) {
7327d382dcdSMarcel Hlopko     // We reverse order of traversal to get the proper syntax structure.
7337d382dcdSMarcel Hlopko     if (!WalkUpFromParenTypeLoc(L))
7347d382dcdSMarcel Hlopko       return false;
7357d382dcdSMarcel Hlopko     return TraverseTypeLoc(L.getInnerLoc());
7367d382dcdSMarcel Hlopko   }
7377d382dcdSMarcel Hlopko 
7387d382dcdSMarcel Hlopko   bool WalkUpFromParenTypeLoc(ParenTypeLoc L) {
7397d382dcdSMarcel Hlopko     Builder.markChildToken(L.getLParenLoc(), syntax::NodeRole::OpenParen);
7407d382dcdSMarcel Hlopko     Builder.markChildToken(L.getRParenLoc(), syntax::NodeRole::CloseParen);
7417d382dcdSMarcel Hlopko     Builder.foldNode(Builder.getRange(L.getLParenLoc(), L.getRParenLoc()),
742a711a3a4SMarcel Hlopko                      new (allocator()) syntax::ParenDeclarator, L);
7437d382dcdSMarcel Hlopko     return true;
7447d382dcdSMarcel Hlopko   }
7457d382dcdSMarcel Hlopko 
7467d382dcdSMarcel Hlopko   // Declarator chunks, they are produced by type locs and some clang::Decls.
7477d382dcdSMarcel Hlopko   bool WalkUpFromArrayTypeLoc(ArrayTypeLoc L) {
7487d382dcdSMarcel Hlopko     Builder.markChildToken(L.getLBracketLoc(), syntax::NodeRole::OpenParen);
7497d382dcdSMarcel Hlopko     Builder.markExprChild(L.getSizeExpr(),
7507d382dcdSMarcel Hlopko                           syntax::NodeRole::ArraySubscript_sizeExpression);
7517d382dcdSMarcel Hlopko     Builder.markChildToken(L.getRBracketLoc(), syntax::NodeRole::CloseParen);
7527d382dcdSMarcel Hlopko     Builder.foldNode(Builder.getRange(L.getLBracketLoc(), L.getRBracketLoc()),
753a711a3a4SMarcel Hlopko                      new (allocator()) syntax::ArraySubscript, L);
7547d382dcdSMarcel Hlopko     return true;
7557d382dcdSMarcel Hlopko   }
7567d382dcdSMarcel Hlopko 
7577d382dcdSMarcel Hlopko   bool WalkUpFromFunctionTypeLoc(FunctionTypeLoc L) {
7587d382dcdSMarcel Hlopko     Builder.markChildToken(L.getLParenLoc(), syntax::NodeRole::OpenParen);
759cdce2fe5SMarcel Hlopko     for (auto *P : L.getParams()) {
760cdce2fe5SMarcel Hlopko       Builder.markChild(P, syntax::NodeRole::ParametersAndQualifiers_parameter);
761cdce2fe5SMarcel Hlopko     }
7627d382dcdSMarcel Hlopko     Builder.markChildToken(L.getRParenLoc(), syntax::NodeRole::CloseParen);
7637d382dcdSMarcel Hlopko     Builder.foldNode(Builder.getRange(L.getLParenLoc(), L.getEndLoc()),
764a711a3a4SMarcel Hlopko                      new (allocator()) syntax::ParametersAndQualifiers, L);
7657d382dcdSMarcel Hlopko     return true;
7667d382dcdSMarcel Hlopko   }
7677d382dcdSMarcel Hlopko 
7687d382dcdSMarcel Hlopko   bool WalkUpFromFunctionProtoTypeLoc(FunctionProtoTypeLoc L) {
7697d382dcdSMarcel Hlopko     if (!L.getTypePtr()->hasTrailingReturn())
7707d382dcdSMarcel Hlopko       return WalkUpFromFunctionTypeLoc(L);
7717d382dcdSMarcel Hlopko 
772cdce2fe5SMarcel Hlopko     auto *TrailingReturnTokens = BuildTrailingReturn(L);
7737d382dcdSMarcel Hlopko     // Finish building the node for parameters.
7747d382dcdSMarcel Hlopko     Builder.markChild(TrailingReturnTokens,
7757d382dcdSMarcel Hlopko                       syntax::NodeRole::ParametersAndQualifiers_trailingReturn);
7767d382dcdSMarcel Hlopko     return WalkUpFromFunctionTypeLoc(L);
7777d382dcdSMarcel Hlopko   }
7787d382dcdSMarcel Hlopko 
7797d382dcdSMarcel Hlopko   bool WalkUpFromMemberPointerTypeLoc(MemberPointerTypeLoc L) {
7807d382dcdSMarcel Hlopko     auto SR = L.getLocalSourceRange();
781a711a3a4SMarcel Hlopko     Builder.foldNode(Builder.getRange(SR),
782a711a3a4SMarcel Hlopko                      new (allocator()) syntax::MemberPointer, L);
7837d382dcdSMarcel Hlopko     return true;
7847d382dcdSMarcel Hlopko   }
7857d382dcdSMarcel Hlopko 
78658fa50f4SIlya Biryukov   // The code below is very regular, it could even be generated with some
78758fa50f4SIlya Biryukov   // preprocessor magic. We merely assign roles to the corresponding children
78858fa50f4SIlya Biryukov   // and fold resulting nodes.
78958fa50f4SIlya Biryukov   bool WalkUpFromDeclStmt(DeclStmt *S) {
79058fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
791a711a3a4SMarcel Hlopko                      new (allocator()) syntax::DeclarationStatement, S);
79258fa50f4SIlya Biryukov     return true;
79358fa50f4SIlya Biryukov   }
79458fa50f4SIlya Biryukov 
79558fa50f4SIlya Biryukov   bool WalkUpFromNullStmt(NullStmt *S) {
79658fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
797a711a3a4SMarcel Hlopko                      new (allocator()) syntax::EmptyStatement, S);
79858fa50f4SIlya Biryukov     return true;
79958fa50f4SIlya Biryukov   }
80058fa50f4SIlya Biryukov 
80158fa50f4SIlya Biryukov   bool WalkUpFromSwitchStmt(SwitchStmt *S) {
802def65bb4SIlya Biryukov     Builder.markChildToken(S->getSwitchLoc(),
80358fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
80458fa50f4SIlya Biryukov     Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement);
80558fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
806a711a3a4SMarcel Hlopko                      new (allocator()) syntax::SwitchStatement, S);
80758fa50f4SIlya Biryukov     return true;
80858fa50f4SIlya Biryukov   }
80958fa50f4SIlya Biryukov 
81058fa50f4SIlya Biryukov   bool WalkUpFromCaseStmt(CaseStmt *S) {
811def65bb4SIlya Biryukov     Builder.markChildToken(S->getKeywordLoc(),
81258fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
81358fa50f4SIlya Biryukov     Builder.markExprChild(S->getLHS(), syntax::NodeRole::CaseStatement_value);
81458fa50f4SIlya Biryukov     Builder.markStmtChild(S->getSubStmt(), syntax::NodeRole::BodyStatement);
81558fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
816a711a3a4SMarcel Hlopko                      new (allocator()) syntax::CaseStatement, S);
81758fa50f4SIlya Biryukov     return true;
81858fa50f4SIlya Biryukov   }
81958fa50f4SIlya Biryukov 
82058fa50f4SIlya Biryukov   bool WalkUpFromDefaultStmt(DefaultStmt *S) {
821def65bb4SIlya Biryukov     Builder.markChildToken(S->getKeywordLoc(),
82258fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
82358fa50f4SIlya Biryukov     Builder.markStmtChild(S->getSubStmt(), syntax::NodeRole::BodyStatement);
82458fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
825a711a3a4SMarcel Hlopko                      new (allocator()) syntax::DefaultStatement, S);
82658fa50f4SIlya Biryukov     return true;
82758fa50f4SIlya Biryukov   }
82858fa50f4SIlya Biryukov 
82958fa50f4SIlya Biryukov   bool WalkUpFromIfStmt(IfStmt *S) {
830def65bb4SIlya Biryukov     Builder.markChildToken(S->getIfLoc(), syntax::NodeRole::IntroducerKeyword);
83158fa50f4SIlya Biryukov     Builder.markStmtChild(S->getThen(),
83258fa50f4SIlya Biryukov                           syntax::NodeRole::IfStatement_thenStatement);
833def65bb4SIlya Biryukov     Builder.markChildToken(S->getElseLoc(),
83458fa50f4SIlya Biryukov                            syntax::NodeRole::IfStatement_elseKeyword);
83558fa50f4SIlya Biryukov     Builder.markStmtChild(S->getElse(),
83658fa50f4SIlya Biryukov                           syntax::NodeRole::IfStatement_elseStatement);
83758fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
838a711a3a4SMarcel Hlopko                      new (allocator()) syntax::IfStatement, S);
83958fa50f4SIlya Biryukov     return true;
84058fa50f4SIlya Biryukov   }
84158fa50f4SIlya Biryukov 
84258fa50f4SIlya Biryukov   bool WalkUpFromForStmt(ForStmt *S) {
843def65bb4SIlya Biryukov     Builder.markChildToken(S->getForLoc(), syntax::NodeRole::IntroducerKeyword);
84458fa50f4SIlya Biryukov     Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement);
84558fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
846a711a3a4SMarcel Hlopko                      new (allocator()) syntax::ForStatement, S);
84758fa50f4SIlya Biryukov     return true;
84858fa50f4SIlya Biryukov   }
84958fa50f4SIlya Biryukov 
85058fa50f4SIlya Biryukov   bool WalkUpFromWhileStmt(WhileStmt *S) {
851def65bb4SIlya Biryukov     Builder.markChildToken(S->getWhileLoc(),
85258fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
85358fa50f4SIlya Biryukov     Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement);
85458fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
855a711a3a4SMarcel Hlopko                      new (allocator()) syntax::WhileStatement, S);
85658fa50f4SIlya Biryukov     return true;
85758fa50f4SIlya Biryukov   }
85858fa50f4SIlya Biryukov 
85958fa50f4SIlya Biryukov   bool WalkUpFromContinueStmt(ContinueStmt *S) {
860def65bb4SIlya Biryukov     Builder.markChildToken(S->getContinueLoc(),
86158fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
86258fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
863a711a3a4SMarcel Hlopko                      new (allocator()) syntax::ContinueStatement, S);
86458fa50f4SIlya Biryukov     return true;
86558fa50f4SIlya Biryukov   }
86658fa50f4SIlya Biryukov 
86758fa50f4SIlya Biryukov   bool WalkUpFromBreakStmt(BreakStmt *S) {
868def65bb4SIlya Biryukov     Builder.markChildToken(S->getBreakLoc(),
86958fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
87058fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
871a711a3a4SMarcel Hlopko                      new (allocator()) syntax::BreakStatement, S);
87258fa50f4SIlya Biryukov     return true;
87358fa50f4SIlya Biryukov   }
87458fa50f4SIlya Biryukov 
87558fa50f4SIlya Biryukov   bool WalkUpFromReturnStmt(ReturnStmt *S) {
876def65bb4SIlya Biryukov     Builder.markChildToken(S->getReturnLoc(),
87758fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
87858fa50f4SIlya Biryukov     Builder.markExprChild(S->getRetValue(),
87958fa50f4SIlya Biryukov                           syntax::NodeRole::ReturnStatement_value);
88058fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
881a711a3a4SMarcel Hlopko                      new (allocator()) syntax::ReturnStatement, S);
88258fa50f4SIlya Biryukov     return true;
88358fa50f4SIlya Biryukov   }
88458fa50f4SIlya Biryukov 
88558fa50f4SIlya Biryukov   bool WalkUpFromCXXForRangeStmt(CXXForRangeStmt *S) {
886def65bb4SIlya Biryukov     Builder.markChildToken(S->getForLoc(), syntax::NodeRole::IntroducerKeyword);
88758fa50f4SIlya Biryukov     Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement);
88858fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
889a711a3a4SMarcel Hlopko                      new (allocator()) syntax::RangeBasedForStatement, S);
89058fa50f4SIlya Biryukov     return true;
89158fa50f4SIlya Biryukov   }
89258fa50f4SIlya Biryukov 
893be14a22bSIlya Biryukov   bool WalkUpFromEmptyDecl(EmptyDecl *S) {
894cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
895a711a3a4SMarcel Hlopko                      new (allocator()) syntax::EmptyDeclaration, S);
896be14a22bSIlya Biryukov     return true;
897be14a22bSIlya Biryukov   }
898be14a22bSIlya Biryukov 
899be14a22bSIlya Biryukov   bool WalkUpFromStaticAssertDecl(StaticAssertDecl *S) {
900be14a22bSIlya Biryukov     Builder.markExprChild(S->getAssertExpr(),
901be14a22bSIlya Biryukov                           syntax::NodeRole::StaticAssertDeclaration_condition);
902be14a22bSIlya Biryukov     Builder.markExprChild(S->getMessage(),
903be14a22bSIlya Biryukov                           syntax::NodeRole::StaticAssertDeclaration_message);
904cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
905a711a3a4SMarcel Hlopko                      new (allocator()) syntax::StaticAssertDeclaration, S);
906be14a22bSIlya Biryukov     return true;
907be14a22bSIlya Biryukov   }
908be14a22bSIlya Biryukov 
909be14a22bSIlya Biryukov   bool WalkUpFromLinkageSpecDecl(LinkageSpecDecl *S) {
910cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
911a711a3a4SMarcel Hlopko                      new (allocator()) syntax::LinkageSpecificationDeclaration,
912a711a3a4SMarcel Hlopko                      S);
913be14a22bSIlya Biryukov     return true;
914be14a22bSIlya Biryukov   }
915be14a22bSIlya Biryukov 
916be14a22bSIlya Biryukov   bool WalkUpFromNamespaceAliasDecl(NamespaceAliasDecl *S) {
917cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
918a711a3a4SMarcel Hlopko                      new (allocator()) syntax::NamespaceAliasDefinition, S);
919be14a22bSIlya Biryukov     return true;
920be14a22bSIlya Biryukov   }
921be14a22bSIlya Biryukov 
922be14a22bSIlya Biryukov   bool WalkUpFromUsingDirectiveDecl(UsingDirectiveDecl *S) {
923cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
924a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UsingNamespaceDirective, S);
925be14a22bSIlya Biryukov     return true;
926be14a22bSIlya Biryukov   }
927be14a22bSIlya Biryukov 
928be14a22bSIlya Biryukov   bool WalkUpFromUsingDecl(UsingDecl *S) {
929cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
930a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UsingDeclaration, S);
931be14a22bSIlya Biryukov     return true;
932be14a22bSIlya Biryukov   }
933be14a22bSIlya Biryukov 
934be14a22bSIlya Biryukov   bool WalkUpFromUnresolvedUsingValueDecl(UnresolvedUsingValueDecl *S) {
935cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
936a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UsingDeclaration, S);
937be14a22bSIlya Biryukov     return true;
938be14a22bSIlya Biryukov   }
939be14a22bSIlya Biryukov 
940be14a22bSIlya Biryukov   bool WalkUpFromUnresolvedUsingTypenameDecl(UnresolvedUsingTypenameDecl *S) {
941cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
942a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UsingDeclaration, S);
943be14a22bSIlya Biryukov     return true;
944be14a22bSIlya Biryukov   }
945be14a22bSIlya Biryukov 
946be14a22bSIlya Biryukov   bool WalkUpFromTypeAliasDecl(TypeAliasDecl *S) {
947cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
948a711a3a4SMarcel Hlopko                      new (allocator()) syntax::TypeAliasDeclaration, S);
949be14a22bSIlya Biryukov     return true;
950be14a22bSIlya Biryukov   }
951be14a22bSIlya Biryukov 
9529b3f38f9SIlya Biryukov private:
953cdce2fe5SMarcel Hlopko   template <class T> SourceLocation getQualifiedNameStart(T *D) {
954cdce2fe5SMarcel Hlopko     static_assert((std::is_base_of<DeclaratorDecl, T>::value ||
955cdce2fe5SMarcel Hlopko                    std::is_base_of<TypedefNameDecl, T>::value),
956cdce2fe5SMarcel Hlopko                   "only DeclaratorDecl and TypedefNameDecl are supported.");
957cdce2fe5SMarcel Hlopko 
958cdce2fe5SMarcel Hlopko     auto DN = D->getDeclName();
959cdce2fe5SMarcel Hlopko     bool IsAnonymous = DN.isIdentifier() && !DN.getAsIdentifierInfo();
960cdce2fe5SMarcel Hlopko     if (IsAnonymous)
961cdce2fe5SMarcel Hlopko       return SourceLocation();
962cdce2fe5SMarcel Hlopko 
963cdce2fe5SMarcel Hlopko     if (const auto *DD = llvm::dyn_cast<DeclaratorDecl>(D)) {
964cdce2fe5SMarcel Hlopko       if (DD->getQualifierLoc()) {
965cdce2fe5SMarcel Hlopko         return DD->getQualifierLoc().getBeginLoc();
966cdce2fe5SMarcel Hlopko       }
967cdce2fe5SMarcel Hlopko     }
968cdce2fe5SMarcel Hlopko 
969cdce2fe5SMarcel Hlopko     return D->getLocation();
970cdce2fe5SMarcel Hlopko   }
971cdce2fe5SMarcel Hlopko 
972cdce2fe5SMarcel Hlopko   SourceRange getInitializerRange(Decl *D) {
973cdce2fe5SMarcel Hlopko     if (auto *V = llvm::dyn_cast<VarDecl>(D)) {
974cdce2fe5SMarcel Hlopko       auto *I = V->getInit();
975cdce2fe5SMarcel Hlopko       // Initializers in range-based-for are not part of the declarator
976cdce2fe5SMarcel Hlopko       if (I && !V->isCXXForRangeDecl())
977cdce2fe5SMarcel Hlopko         return I->getSourceRange();
978cdce2fe5SMarcel Hlopko     }
979cdce2fe5SMarcel Hlopko 
980cdce2fe5SMarcel Hlopko     return SourceRange();
981cdce2fe5SMarcel Hlopko   }
982cdce2fe5SMarcel Hlopko 
983cdce2fe5SMarcel Hlopko   /// Folds SimpleDeclarator node (if present) and in case this is the last
984cdce2fe5SMarcel Hlopko   /// declarator in the chain it also folds SimpleDeclaration node.
985cdce2fe5SMarcel Hlopko   template <class T> bool processDeclaratorAndDeclaration(T *D) {
986cdce2fe5SMarcel Hlopko     SourceRange Initializer = getInitializerRange(D);
987cdce2fe5SMarcel Hlopko     auto Range = getDeclaratorRange(Builder.sourceManager(),
988cdce2fe5SMarcel Hlopko                                     D->getTypeSourceInfo()->getTypeLoc(),
989cdce2fe5SMarcel Hlopko                                     getQualifiedNameStart(D), Initializer);
990cdce2fe5SMarcel Hlopko 
991cdce2fe5SMarcel Hlopko     // There doesn't have to be a declarator (e.g. `void foo(int)` only has
992cdce2fe5SMarcel Hlopko     // declaration, but no declarator).
993cdce2fe5SMarcel Hlopko     if (Range.getBegin().isValid()) {
994cdce2fe5SMarcel Hlopko       auto *N = new (allocator()) syntax::SimpleDeclarator;
995cdce2fe5SMarcel Hlopko       Builder.foldNode(Builder.getRange(Range), N, nullptr);
996cdce2fe5SMarcel Hlopko       Builder.markChild(N, syntax::NodeRole::SimpleDeclaration_declarator);
997cdce2fe5SMarcel Hlopko     }
998cdce2fe5SMarcel Hlopko 
999cdce2fe5SMarcel Hlopko     if (Builder.isResponsibleForCreatingDeclaration(D)) {
1000cdce2fe5SMarcel Hlopko       Builder.foldNode(Builder.getDeclarationRange(D),
1001cdce2fe5SMarcel Hlopko                        new (allocator()) syntax::SimpleDeclaration, D);
1002cdce2fe5SMarcel Hlopko     }
1003cdce2fe5SMarcel Hlopko     return true;
1004cdce2fe5SMarcel Hlopko   }
1005cdce2fe5SMarcel Hlopko 
10067d382dcdSMarcel Hlopko   /// Returns the range of the built node.
1007a711a3a4SMarcel Hlopko   syntax::TrailingReturnType *BuildTrailingReturn(FunctionProtoTypeLoc L) {
10087d382dcdSMarcel Hlopko     assert(L.getTypePtr()->hasTrailingReturn());
10097d382dcdSMarcel Hlopko 
10107d382dcdSMarcel Hlopko     auto ReturnedType = L.getReturnLoc();
10117d382dcdSMarcel Hlopko     // Build node for the declarator, if any.
10127d382dcdSMarcel Hlopko     auto ReturnDeclaratorRange =
10137d382dcdSMarcel Hlopko         getDeclaratorRange(this->Builder.sourceManager(), ReturnedType,
10147d382dcdSMarcel Hlopko                            /*Name=*/SourceLocation(),
10157d382dcdSMarcel Hlopko                            /*Initializer=*/SourceLocation());
1016a711a3a4SMarcel Hlopko     syntax::SimpleDeclarator *ReturnDeclarator = nullptr;
10177d382dcdSMarcel Hlopko     if (ReturnDeclaratorRange.isValid()) {
1018a711a3a4SMarcel Hlopko       ReturnDeclarator = new (allocator()) syntax::SimpleDeclarator;
1019a711a3a4SMarcel Hlopko       Builder.foldNode(Builder.getRange(ReturnDeclaratorRange),
1020a711a3a4SMarcel Hlopko                        ReturnDeclarator, nullptr);
10217d382dcdSMarcel Hlopko     }
10227d382dcdSMarcel Hlopko 
10237d382dcdSMarcel Hlopko     // Build node for trailing return type.
1024a711a3a4SMarcel Hlopko     auto Return = Builder.getRange(ReturnedType.getSourceRange());
10257d382dcdSMarcel Hlopko     const auto *Arrow = Return.begin() - 1;
10267d382dcdSMarcel Hlopko     assert(Arrow->kind() == tok::arrow);
10277d382dcdSMarcel Hlopko     auto Tokens = llvm::makeArrayRef(Arrow, Return.end());
102842f6fec3SEduardo Caldas     Builder.markChildToken(Arrow, syntax::NodeRole::ArrowToken);
1029a711a3a4SMarcel Hlopko     if (ReturnDeclarator)
1030a711a3a4SMarcel Hlopko       Builder.markChild(ReturnDeclarator,
10317d382dcdSMarcel Hlopko                         syntax::NodeRole::TrailingReturnType_declarator);
1032a711a3a4SMarcel Hlopko     auto *R = new (allocator()) syntax::TrailingReturnType;
1033cdce2fe5SMarcel Hlopko     Builder.foldNode(Tokens, R, L);
1034a711a3a4SMarcel Hlopko     return R;
10357d382dcdSMarcel Hlopko   }
103688bf9b3dSMarcel Hlopko 
1037a711a3a4SMarcel Hlopko   void foldExplicitTemplateInstantiation(
1038a711a3a4SMarcel Hlopko       ArrayRef<syntax::Token> Range, const syntax::Token *ExternKW,
103988bf9b3dSMarcel Hlopko       const syntax::Token *TemplateKW,
1040a711a3a4SMarcel Hlopko       syntax::SimpleDeclaration *InnerDeclaration, Decl *From) {
104188bf9b3dSMarcel Hlopko     assert(!ExternKW || ExternKW->kind() == tok::kw_extern);
104288bf9b3dSMarcel Hlopko     assert(TemplateKW && TemplateKW->kind() == tok::kw_template);
104342f6fec3SEduardo Caldas     Builder.markChildToken(ExternKW, syntax::NodeRole::ExternKeyword);
104488bf9b3dSMarcel Hlopko     Builder.markChildToken(TemplateKW, syntax::NodeRole::IntroducerKeyword);
104588bf9b3dSMarcel Hlopko     Builder.markChild(
104688bf9b3dSMarcel Hlopko         InnerDeclaration,
104788bf9b3dSMarcel Hlopko         syntax::NodeRole::ExplicitTemplateInstantiation_declaration);
1048a711a3a4SMarcel Hlopko     Builder.foldNode(
1049a711a3a4SMarcel Hlopko         Range, new (allocator()) syntax::ExplicitTemplateInstantiation, From);
105088bf9b3dSMarcel Hlopko   }
105188bf9b3dSMarcel Hlopko 
1052a711a3a4SMarcel Hlopko   syntax::TemplateDeclaration *foldTemplateDeclaration(
1053a711a3a4SMarcel Hlopko       ArrayRef<syntax::Token> Range, const syntax::Token *TemplateKW,
1054a711a3a4SMarcel Hlopko       ArrayRef<syntax::Token> TemplatedDeclaration, Decl *From) {
105588bf9b3dSMarcel Hlopko     assert(TemplateKW && TemplateKW->kind() == tok::kw_template);
105688bf9b3dSMarcel Hlopko     Builder.markChildToken(TemplateKW, syntax::NodeRole::IntroducerKeyword);
1057a711a3a4SMarcel Hlopko 
1058a711a3a4SMarcel Hlopko     auto *N = new (allocator()) syntax::TemplateDeclaration;
1059a711a3a4SMarcel Hlopko     Builder.foldNode(Range, N, From);
1060cdce2fe5SMarcel Hlopko     Builder.markChild(N, syntax::NodeRole::TemplateDeclaration_declaration);
1061a711a3a4SMarcel Hlopko     return N;
106288bf9b3dSMarcel Hlopko   }
106388bf9b3dSMarcel Hlopko 
10649b3f38f9SIlya Biryukov   /// A small helper to save some typing.
10659b3f38f9SIlya Biryukov   llvm::BumpPtrAllocator &allocator() { return Builder.allocator(); }
10669b3f38f9SIlya Biryukov 
10679b3f38f9SIlya Biryukov   syntax::TreeBuilder &Builder;
10689b3f38f9SIlya Biryukov   const LangOptions &LangOpts;
10699b3f38f9SIlya Biryukov };
10709b3f38f9SIlya Biryukov } // namespace
10719b3f38f9SIlya Biryukov 
10727d382dcdSMarcel Hlopko void syntax::TreeBuilder::noticeDeclWithoutSemicolon(Decl *D) {
1073e702bdb8SIlya Biryukov   DeclsWithoutSemicolons.insert(D);
1074e702bdb8SIlya Biryukov }
1075e702bdb8SIlya Biryukov 
1076def65bb4SIlya Biryukov void syntax::TreeBuilder::markChildToken(SourceLocation Loc, NodeRole Role) {
10779b3f38f9SIlya Biryukov   if (Loc.isInvalid())
10789b3f38f9SIlya Biryukov     return;
10799b3f38f9SIlya Biryukov   Pending.assignRole(*findToken(Loc), Role);
10809b3f38f9SIlya Biryukov }
10819b3f38f9SIlya Biryukov 
10827d382dcdSMarcel Hlopko void syntax::TreeBuilder::markChildToken(const syntax::Token *T, NodeRole R) {
10837d382dcdSMarcel Hlopko   if (!T)
10847d382dcdSMarcel Hlopko     return;
10857d382dcdSMarcel Hlopko   Pending.assignRole(*T, R);
10867d382dcdSMarcel Hlopko }
10877d382dcdSMarcel Hlopko 
1088a711a3a4SMarcel Hlopko void syntax::TreeBuilder::markChild(syntax::Node *N, NodeRole R) {
1089a711a3a4SMarcel Hlopko   assert(N);
1090a711a3a4SMarcel Hlopko   setRole(N, R);
1091a711a3a4SMarcel Hlopko }
1092a711a3a4SMarcel Hlopko 
1093a711a3a4SMarcel Hlopko void syntax::TreeBuilder::markChild(ASTPtr N, NodeRole R) {
1094a711a3a4SMarcel Hlopko   auto *SN = Mapping.find(N);
1095a711a3a4SMarcel Hlopko   assert(SN != nullptr);
1096a711a3a4SMarcel Hlopko   setRole(SN, R);
10977d382dcdSMarcel Hlopko }
10987d382dcdSMarcel Hlopko 
109958fa50f4SIlya Biryukov void syntax::TreeBuilder::markStmtChild(Stmt *Child, NodeRole Role) {
110058fa50f4SIlya Biryukov   if (!Child)
110158fa50f4SIlya Biryukov     return;
110258fa50f4SIlya Biryukov 
1103b34b7691SDmitri Gribenko   syntax::Tree *ChildNode;
1104b34b7691SDmitri Gribenko   if (Expr *ChildExpr = dyn_cast<Expr>(Child)) {
110558fa50f4SIlya Biryukov     // This is an expression in a statement position, consume the trailing
110658fa50f4SIlya Biryukov     // semicolon and form an 'ExpressionStatement' node.
1107b34b7691SDmitri Gribenko     markExprChild(ChildExpr, NodeRole::ExpressionStatement_expression);
1108a711a3a4SMarcel Hlopko     ChildNode = new (allocator()) syntax::ExpressionStatement;
1109a711a3a4SMarcel Hlopko     // (!) 'getStmtRange()' ensures this covers a trailing semicolon.
1110a711a3a4SMarcel Hlopko     Pending.foldChildren(Arena, getStmtRange(Child), ChildNode);
1111b34b7691SDmitri Gribenko   } else {
1112b34b7691SDmitri Gribenko     ChildNode = Mapping.find(Child);
111358fa50f4SIlya Biryukov   }
1114b34b7691SDmitri Gribenko   assert(ChildNode != nullptr);
1115a711a3a4SMarcel Hlopko   setRole(ChildNode, Role);
111658fa50f4SIlya Biryukov }
111758fa50f4SIlya Biryukov 
111858fa50f4SIlya Biryukov void syntax::TreeBuilder::markExprChild(Expr *Child, NodeRole Role) {
1119be14a22bSIlya Biryukov   if (!Child)
1120be14a22bSIlya Biryukov     return;
1121a711a3a4SMarcel Hlopko   Child = Child->IgnoreImplicit();
1122be14a22bSIlya Biryukov 
1123a711a3a4SMarcel Hlopko   syntax::Tree *ChildNode = Mapping.find(Child);
1124a711a3a4SMarcel Hlopko   assert(ChildNode != nullptr);
1125a711a3a4SMarcel Hlopko   setRole(ChildNode, Role);
112658fa50f4SIlya Biryukov }
112758fa50f4SIlya Biryukov 
11289b3f38f9SIlya Biryukov const syntax::Token *syntax::TreeBuilder::findToken(SourceLocation L) const {
112988bf9b3dSMarcel Hlopko   if (L.isInvalid())
113088bf9b3dSMarcel Hlopko     return nullptr;
1131c1bbefefSIlya Biryukov   auto It = LocationToToken.find(L.getRawEncoding());
1132c1bbefefSIlya Biryukov   assert(It != LocationToToken.end());
1133c1bbefefSIlya Biryukov   return It->second;
11349b3f38f9SIlya Biryukov }
11359b3f38f9SIlya Biryukov 
11369b3f38f9SIlya Biryukov syntax::TranslationUnit *
11379b3f38f9SIlya Biryukov syntax::buildSyntaxTree(Arena &A, const TranslationUnitDecl &TU) {
11389b3f38f9SIlya Biryukov   TreeBuilder Builder(A);
11399b3f38f9SIlya Biryukov   BuildTreeVisitor(TU.getASTContext(), Builder).TraverseAST(TU.getASTContext());
11409b3f38f9SIlya Biryukov   return std::move(Builder).finalize();
11419b3f38f9SIlya Biryukov }
1142