19b3f38f9SIlya Biryukov //===- BuildTree.cpp ------------------------------------------*- C++ -*-=====//
29b3f38f9SIlya Biryukov //
39b3f38f9SIlya Biryukov // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
49b3f38f9SIlya Biryukov // See https://llvm.org/LICENSE.txt for license information.
59b3f38f9SIlya Biryukov // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
69b3f38f9SIlya Biryukov //
79b3f38f9SIlya Biryukov //===----------------------------------------------------------------------===//
89b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/BuildTree.h"
97d382dcdSMarcel Hlopko #include "clang/AST/ASTFwd.h"
10e702bdb8SIlya Biryukov #include "clang/AST/Decl.h"
11e702bdb8SIlya Biryukov #include "clang/AST/DeclBase.h"
127d382dcdSMarcel Hlopko #include "clang/AST/DeclCXX.h"
137d382dcdSMarcel Hlopko #include "clang/AST/DeclarationName.h"
143785eb83SEduardo Caldas #include "clang/AST/Expr.h"
159b3f38f9SIlya Biryukov #include "clang/AST/RecursiveASTVisitor.h"
169b3f38f9SIlya Biryukov #include "clang/AST/Stmt.h"
177d382dcdSMarcel Hlopko #include "clang/AST/TypeLoc.h"
187d382dcdSMarcel Hlopko #include "clang/AST/TypeLocVisitor.h"
199b3f38f9SIlya Biryukov #include "clang/Basic/LLVM.h"
209b3f38f9SIlya Biryukov #include "clang/Basic/SourceLocation.h"
219b3f38f9SIlya Biryukov #include "clang/Basic/SourceManager.h"
2288bf9b3dSMarcel Hlopko #include "clang/Basic/Specifiers.h"
239b3f38f9SIlya Biryukov #include "clang/Basic/TokenKinds.h"
249b3f38f9SIlya Biryukov #include "clang/Lex/Lexer.h"
259b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/Nodes.h"
269b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/Tokens.h"
279b3f38f9SIlya Biryukov #include "clang/Tooling/Syntax/Tree.h"
289b3f38f9SIlya Biryukov #include "llvm/ADT/ArrayRef.h"
29a711a3a4SMarcel Hlopko #include "llvm/ADT/DenseMap.h"
30a711a3a4SMarcel Hlopko #include "llvm/ADT/PointerUnion.h"
319b3f38f9SIlya Biryukov #include "llvm/ADT/STLExtras.h"
327d382dcdSMarcel Hlopko #include "llvm/ADT/ScopeExit.h"
339b3f38f9SIlya Biryukov #include "llvm/ADT/SmallVector.h"
349b3f38f9SIlya Biryukov #include "llvm/Support/Allocator.h"
359b3f38f9SIlya Biryukov #include "llvm/Support/Casting.h"
3696065cf7SIlya Biryukov #include "llvm/Support/Compiler.h"
379b3f38f9SIlya Biryukov #include "llvm/Support/FormatVariadic.h"
381ad15046SIlya Biryukov #include "llvm/Support/MemoryBuffer.h"
399b3f38f9SIlya Biryukov #include "llvm/Support/raw_ostream.h"
40a711a3a4SMarcel Hlopko #include <cstddef>
419b3f38f9SIlya Biryukov #include <map>
429b3f38f9SIlya Biryukov 
439b3f38f9SIlya Biryukov using namespace clang;
449b3f38f9SIlya Biryukov 
4596065cf7SIlya Biryukov LLVM_ATTRIBUTE_UNUSED
4658fa50f4SIlya Biryukov static bool isImplicitExpr(clang::Expr *E) { return E->IgnoreImplicit() != E; }
4758fa50f4SIlya Biryukov 
487d382dcdSMarcel Hlopko namespace {
497d382dcdSMarcel Hlopko /// Get start location of the Declarator from the TypeLoc.
507d382dcdSMarcel Hlopko /// E.g.:
517d382dcdSMarcel Hlopko ///   loc of `(` in `int (a)`
527d382dcdSMarcel Hlopko ///   loc of `*` in `int *(a)`
537d382dcdSMarcel Hlopko ///   loc of the first `(` in `int (*a)(int)`
547d382dcdSMarcel Hlopko ///   loc of the `*` in `int *(a)(int)`
557d382dcdSMarcel Hlopko ///   loc of the first `*` in `const int *const *volatile a;`
567d382dcdSMarcel Hlopko ///
577d382dcdSMarcel Hlopko /// It is non-trivial to get the start location because TypeLocs are stored
587d382dcdSMarcel Hlopko /// inside out. In the example above `*volatile` is the TypeLoc returned
597d382dcdSMarcel Hlopko /// by `Decl.getTypeSourceInfo()`, and `*const` is what `.getPointeeLoc()`
607d382dcdSMarcel Hlopko /// returns.
617d382dcdSMarcel Hlopko struct GetStartLoc : TypeLocVisitor<GetStartLoc, SourceLocation> {
627d382dcdSMarcel Hlopko   SourceLocation VisitParenTypeLoc(ParenTypeLoc T) {
637d382dcdSMarcel Hlopko     auto L = Visit(T.getInnerLoc());
647d382dcdSMarcel Hlopko     if (L.isValid())
657d382dcdSMarcel Hlopko       return L;
667d382dcdSMarcel Hlopko     return T.getLParenLoc();
677d382dcdSMarcel Hlopko   }
687d382dcdSMarcel Hlopko 
697d382dcdSMarcel Hlopko   // Types spelled in the prefix part of the declarator.
707d382dcdSMarcel Hlopko   SourceLocation VisitPointerTypeLoc(PointerTypeLoc T) {
717d382dcdSMarcel Hlopko     return HandlePointer(T);
727d382dcdSMarcel Hlopko   }
737d382dcdSMarcel Hlopko 
747d382dcdSMarcel Hlopko   SourceLocation VisitMemberPointerTypeLoc(MemberPointerTypeLoc T) {
757d382dcdSMarcel Hlopko     return HandlePointer(T);
767d382dcdSMarcel Hlopko   }
777d382dcdSMarcel Hlopko 
787d382dcdSMarcel Hlopko   SourceLocation VisitBlockPointerTypeLoc(BlockPointerTypeLoc T) {
797d382dcdSMarcel Hlopko     return HandlePointer(T);
807d382dcdSMarcel Hlopko   }
817d382dcdSMarcel Hlopko 
827d382dcdSMarcel Hlopko   SourceLocation VisitReferenceTypeLoc(ReferenceTypeLoc T) {
837d382dcdSMarcel Hlopko     return HandlePointer(T);
847d382dcdSMarcel Hlopko   }
857d382dcdSMarcel Hlopko 
867d382dcdSMarcel Hlopko   SourceLocation VisitObjCObjectPointerTypeLoc(ObjCObjectPointerTypeLoc T) {
877d382dcdSMarcel Hlopko     return HandlePointer(T);
887d382dcdSMarcel Hlopko   }
897d382dcdSMarcel Hlopko 
907d382dcdSMarcel Hlopko   // All other cases are not important, as they are either part of declaration
917d382dcdSMarcel Hlopko   // specifiers (e.g. inheritors of TypeSpecTypeLoc) or introduce modifiers on
927d382dcdSMarcel Hlopko   // existing declarators (e.g. QualifiedTypeLoc). They cannot start the
937d382dcdSMarcel Hlopko   // declarator themselves, but their underlying type can.
947d382dcdSMarcel Hlopko   SourceLocation VisitTypeLoc(TypeLoc T) {
957d382dcdSMarcel Hlopko     auto N = T.getNextTypeLoc();
967d382dcdSMarcel Hlopko     if (!N)
977d382dcdSMarcel Hlopko       return SourceLocation();
987d382dcdSMarcel Hlopko     return Visit(N);
997d382dcdSMarcel Hlopko   }
1007d382dcdSMarcel Hlopko 
1017d382dcdSMarcel Hlopko   SourceLocation VisitFunctionProtoTypeLoc(FunctionProtoTypeLoc T) {
1027d382dcdSMarcel Hlopko     if (T.getTypePtr()->hasTrailingReturn())
1037d382dcdSMarcel Hlopko       return SourceLocation(); // avoid recursing into the suffix of declarator.
1047d382dcdSMarcel Hlopko     return VisitTypeLoc(T);
1057d382dcdSMarcel Hlopko   }
1067d382dcdSMarcel Hlopko 
1077d382dcdSMarcel Hlopko private:
1087d382dcdSMarcel Hlopko   template <class PtrLoc> SourceLocation HandlePointer(PtrLoc T) {
1097d382dcdSMarcel Hlopko     auto L = Visit(T.getPointeeLoc());
1107d382dcdSMarcel Hlopko     if (L.isValid())
1117d382dcdSMarcel Hlopko       return L;
1127d382dcdSMarcel Hlopko     return T.getLocalSourceRange().getBegin();
1137d382dcdSMarcel Hlopko   }
1147d382dcdSMarcel Hlopko };
1157d382dcdSMarcel Hlopko } // namespace
1167d382dcdSMarcel Hlopko 
1177d382dcdSMarcel Hlopko /// Gets the range of declarator as defined by the C++ grammar. E.g.
1187d382dcdSMarcel Hlopko ///     `int a;` -> range of `a`,
1197d382dcdSMarcel Hlopko ///     `int *a;` -> range of `*a`,
1207d382dcdSMarcel Hlopko ///     `int a[10];` -> range of `a[10]`,
1217d382dcdSMarcel Hlopko ///     `int a[1][2][3];` -> range of `a[1][2][3]`,
1227d382dcdSMarcel Hlopko ///     `int *a = nullptr` -> range of `*a = nullptr`.
1237d382dcdSMarcel Hlopko /// FIMXE: \p Name must be a source range, e.g. for `operator+`.
1247d382dcdSMarcel Hlopko static SourceRange getDeclaratorRange(const SourceManager &SM, TypeLoc T,
1257d382dcdSMarcel Hlopko                                       SourceLocation Name,
1267d382dcdSMarcel Hlopko                                       SourceRange Initializer) {
1277d382dcdSMarcel Hlopko   SourceLocation Start = GetStartLoc().Visit(T);
1287d382dcdSMarcel Hlopko   SourceLocation End = T.getSourceRange().getEnd();
1297d382dcdSMarcel Hlopko   assert(End.isValid());
1307d382dcdSMarcel Hlopko   if (Name.isValid()) {
1317d382dcdSMarcel Hlopko     if (Start.isInvalid())
1327d382dcdSMarcel Hlopko       Start = Name;
1337d382dcdSMarcel Hlopko     if (SM.isBeforeInTranslationUnit(End, Name))
1347d382dcdSMarcel Hlopko       End = Name;
1357d382dcdSMarcel Hlopko   }
1367d382dcdSMarcel Hlopko   if (Initializer.isValid()) {
137cdce2fe5SMarcel Hlopko     auto InitializerEnd = Initializer.getEnd();
138cdce2fe5SMarcel Hlopko     assert(SM.isBeforeInTranslationUnit(End, InitializerEnd) || End == InitializerEnd);
139cdce2fe5SMarcel Hlopko     End = InitializerEnd;
1407d382dcdSMarcel Hlopko   }
1417d382dcdSMarcel Hlopko   return SourceRange(Start, End);
1427d382dcdSMarcel Hlopko }
1437d382dcdSMarcel Hlopko 
144a711a3a4SMarcel Hlopko namespace {
145a711a3a4SMarcel Hlopko /// All AST hierarchy roots that can be represented as pointers.
146a711a3a4SMarcel Hlopko using ASTPtr = llvm::PointerUnion<Stmt *, Decl *>;
147a711a3a4SMarcel Hlopko /// Maintains a mapping from AST to syntax tree nodes. This class will get more
148a711a3a4SMarcel Hlopko /// complicated as we support more kinds of AST nodes, e.g. TypeLocs.
149a711a3a4SMarcel Hlopko /// FIXME: expose this as public API.
150a711a3a4SMarcel Hlopko class ASTToSyntaxMapping {
151a711a3a4SMarcel Hlopko public:
152a711a3a4SMarcel Hlopko   void add(ASTPtr From, syntax::Tree *To) {
153a711a3a4SMarcel Hlopko     assert(To != nullptr);
154a711a3a4SMarcel Hlopko     assert(!From.isNull());
155a711a3a4SMarcel Hlopko 
156a711a3a4SMarcel Hlopko     bool Added = Nodes.insert({From, To}).second;
157a711a3a4SMarcel Hlopko     (void)Added;
158a711a3a4SMarcel Hlopko     assert(Added && "mapping added twice");
159a711a3a4SMarcel Hlopko   }
160a711a3a4SMarcel Hlopko 
161a711a3a4SMarcel Hlopko   syntax::Tree *find(ASTPtr P) const { return Nodes.lookup(P); }
162a711a3a4SMarcel Hlopko 
163a711a3a4SMarcel Hlopko private:
164a711a3a4SMarcel Hlopko   llvm::DenseMap<ASTPtr, syntax::Tree *> Nodes;
165a711a3a4SMarcel Hlopko };
166a711a3a4SMarcel Hlopko } // namespace
167a711a3a4SMarcel Hlopko 
1689b3f38f9SIlya Biryukov /// A helper class for constructing the syntax tree while traversing a clang
1699b3f38f9SIlya Biryukov /// AST.
1709b3f38f9SIlya Biryukov ///
1719b3f38f9SIlya Biryukov /// At each point of the traversal we maintain a list of pending nodes.
1729b3f38f9SIlya Biryukov /// Initially all tokens are added as pending nodes. When processing a clang AST
1739b3f38f9SIlya Biryukov /// node, the clients need to:
1749b3f38f9SIlya Biryukov ///   - create a corresponding syntax node,
1759b3f38f9SIlya Biryukov ///   - assign roles to all pending child nodes with 'markChild' and
1769b3f38f9SIlya Biryukov ///     'markChildToken',
1779b3f38f9SIlya Biryukov ///   - replace the child nodes with the new syntax node in the pending list
1789b3f38f9SIlya Biryukov ///     with 'foldNode'.
1799b3f38f9SIlya Biryukov ///
1809b3f38f9SIlya Biryukov /// Note that all children are expected to be processed when building a node.
1819b3f38f9SIlya Biryukov ///
1829b3f38f9SIlya Biryukov /// Call finalize() to finish building the tree and consume the root node.
1839b3f38f9SIlya Biryukov class syntax::TreeBuilder {
1849b3f38f9SIlya Biryukov public:
185c1bbefefSIlya Biryukov   TreeBuilder(syntax::Arena &Arena) : Arena(Arena), Pending(Arena) {
186c1bbefefSIlya Biryukov     for (const auto &T : Arena.tokenBuffer().expandedTokens())
187c1bbefefSIlya Biryukov       LocationToToken.insert({T.location().getRawEncoding(), &T});
188c1bbefefSIlya Biryukov   }
1899b3f38f9SIlya Biryukov 
1909b3f38f9SIlya Biryukov   llvm::BumpPtrAllocator &allocator() { return Arena.allocator(); }
1917d382dcdSMarcel Hlopko   const SourceManager &sourceManager() const { return Arena.sourceManager(); }
1929b3f38f9SIlya Biryukov 
1939b3f38f9SIlya Biryukov   /// Populate children for \p New node, assuming it covers tokens from \p
1949b3f38f9SIlya Biryukov   /// Range.
195a711a3a4SMarcel Hlopko   void foldNode(llvm::ArrayRef<syntax::Token> Range, syntax::Tree *New,
196a711a3a4SMarcel Hlopko                 ASTPtr From) {
197a711a3a4SMarcel Hlopko     assert(New);
198a711a3a4SMarcel Hlopko     Pending.foldChildren(Arena, Range, New);
199a711a3a4SMarcel Hlopko     if (From)
200a711a3a4SMarcel Hlopko       Mapping.add(From, New);
201a711a3a4SMarcel Hlopko   }
202a711a3a4SMarcel Hlopko   void foldNode(llvm::ArrayRef<syntax::Token> Range, syntax::Tree *New,
203a711a3a4SMarcel Hlopko                 TypeLoc L) {
204a711a3a4SMarcel Hlopko     // FIXME: add mapping for TypeLocs
205a711a3a4SMarcel Hlopko     foldNode(Range, New, nullptr);
206a711a3a4SMarcel Hlopko   }
2079b3f38f9SIlya Biryukov 
208e702bdb8SIlya Biryukov   /// Notifies that we should not consume trailing semicolon when computing
209e702bdb8SIlya Biryukov   /// token range of \p D.
2107d382dcdSMarcel Hlopko   void noticeDeclWithoutSemicolon(Decl *D);
211e702bdb8SIlya Biryukov 
21258fa50f4SIlya Biryukov   /// Mark the \p Child node with a corresponding \p Role. All marked children
21358fa50f4SIlya Biryukov   /// should be consumed by foldNode.
2147d382dcdSMarcel Hlopko   /// When called on expressions (clang::Expr is derived from clang::Stmt),
21558fa50f4SIlya Biryukov   /// wraps expressions into expression statement.
21658fa50f4SIlya Biryukov   void markStmtChild(Stmt *Child, NodeRole Role);
21758fa50f4SIlya Biryukov   /// Should be called for expressions in non-statement position to avoid
21858fa50f4SIlya Biryukov   /// wrapping into expression statement.
21958fa50f4SIlya Biryukov   void markExprChild(Expr *Child, NodeRole Role);
2209b3f38f9SIlya Biryukov   /// Set role for a token starting at \p Loc.
221def65bb4SIlya Biryukov   void markChildToken(SourceLocation Loc, NodeRole R);
2227d382dcdSMarcel Hlopko   /// Set role for \p T.
2237d382dcdSMarcel Hlopko   void markChildToken(const syntax::Token *T, NodeRole R);
2247d382dcdSMarcel Hlopko 
225a711a3a4SMarcel Hlopko   /// Set role for \p N.
226a711a3a4SMarcel Hlopko   void markChild(syntax::Node *N, NodeRole R);
227a711a3a4SMarcel Hlopko   /// Set role for the syntax node matching \p N.
228a711a3a4SMarcel Hlopko   void markChild(ASTPtr N, NodeRole R);
2299b3f38f9SIlya Biryukov 
2309b3f38f9SIlya Biryukov   /// Finish building the tree and consume the root node.
2319b3f38f9SIlya Biryukov   syntax::TranslationUnit *finalize() && {
2329b3f38f9SIlya Biryukov     auto Tokens = Arena.tokenBuffer().expandedTokens();
233bfbf6b6cSIlya Biryukov     assert(!Tokens.empty());
234bfbf6b6cSIlya Biryukov     assert(Tokens.back().kind() == tok::eof);
235bfbf6b6cSIlya Biryukov 
2369b3f38f9SIlya Biryukov     // Build the root of the tree, consuming all the children.
2371ad15046SIlya Biryukov     Pending.foldChildren(Arena, Tokens.drop_back(),
2389b3f38f9SIlya Biryukov                          new (Arena.allocator()) syntax::TranslationUnit);
2399b3f38f9SIlya Biryukov 
2403b929fe7SIlya Biryukov     auto *TU = cast<syntax::TranslationUnit>(std::move(Pending).finalize());
2413b929fe7SIlya Biryukov     TU->assertInvariantsRecursive();
2423b929fe7SIlya Biryukov     return TU;
2439b3f38f9SIlya Biryukov   }
2449b3f38f9SIlya Biryukov 
24588bf9b3dSMarcel Hlopko   /// Finds a token starting at \p L. The token must exist if \p L is valid.
24688bf9b3dSMarcel Hlopko   const syntax::Token *findToken(SourceLocation L) const;
24788bf9b3dSMarcel Hlopko 
248a711a3a4SMarcel Hlopko   /// Finds the syntax tokens corresponding to the \p SourceRange.
249a711a3a4SMarcel Hlopko   llvm::ArrayRef<syntax::Token> getRange(SourceRange Range) const {
250a711a3a4SMarcel Hlopko     assert(Range.isValid());
251a711a3a4SMarcel Hlopko     return getRange(Range.getBegin(), Range.getEnd());
252a711a3a4SMarcel Hlopko   }
253a711a3a4SMarcel Hlopko 
254a711a3a4SMarcel Hlopko   /// Finds the syntax tokens corresponding to the passed source locations.
2559b3f38f9SIlya Biryukov   /// \p First is the start position of the first token and \p Last is the start
2569b3f38f9SIlya Biryukov   /// position of the last token.
2579b3f38f9SIlya Biryukov   llvm::ArrayRef<syntax::Token> getRange(SourceLocation First,
2589b3f38f9SIlya Biryukov                                          SourceLocation Last) const {
2599b3f38f9SIlya Biryukov     assert(First.isValid());
2609b3f38f9SIlya Biryukov     assert(Last.isValid());
2619b3f38f9SIlya Biryukov     assert(First == Last ||
2629b3f38f9SIlya Biryukov            Arena.sourceManager().isBeforeInTranslationUnit(First, Last));
2639b3f38f9SIlya Biryukov     return llvm::makeArrayRef(findToken(First), std::next(findToken(Last)));
2649b3f38f9SIlya Biryukov   }
26588bf9b3dSMarcel Hlopko 
26688bf9b3dSMarcel Hlopko   llvm::ArrayRef<syntax::Token>
26788bf9b3dSMarcel Hlopko   getTemplateRange(const ClassTemplateSpecializationDecl *D) const {
268a711a3a4SMarcel Hlopko     auto Tokens = getRange(D->getSourceRange());
26988bf9b3dSMarcel Hlopko     return maybeAppendSemicolon(Tokens, D);
27088bf9b3dSMarcel Hlopko   }
27188bf9b3dSMarcel Hlopko 
272cdce2fe5SMarcel Hlopko   /// Returns true if \p D is the last declarator in a chain and is thus
273cdce2fe5SMarcel Hlopko   /// reponsible for creating SimpleDeclaration for the whole chain.
274cdce2fe5SMarcel Hlopko   template <class T>
275cdce2fe5SMarcel Hlopko   bool isResponsibleForCreatingDeclaration(const T *D) const {
276cdce2fe5SMarcel Hlopko     static_assert((std::is_base_of<DeclaratorDecl, T>::value ||
277cdce2fe5SMarcel Hlopko                    std::is_base_of<TypedefNameDecl, T>::value),
278cdce2fe5SMarcel Hlopko                   "only DeclaratorDecl and TypedefNameDecl are supported.");
279cdce2fe5SMarcel Hlopko 
280cdce2fe5SMarcel Hlopko     const Decl *Next = D->getNextDeclInContext();
281cdce2fe5SMarcel Hlopko 
282cdce2fe5SMarcel Hlopko     // There's no next sibling, this one is responsible.
283cdce2fe5SMarcel Hlopko     if (Next == nullptr) {
284cdce2fe5SMarcel Hlopko       return true;
285cdce2fe5SMarcel Hlopko     }
286cdce2fe5SMarcel Hlopko     const auto *NextT = llvm::dyn_cast<T>(Next);
287cdce2fe5SMarcel Hlopko 
288cdce2fe5SMarcel Hlopko     // Next sibling is not the same type, this one is responsible.
289cdce2fe5SMarcel Hlopko     if (NextT == nullptr) {
290cdce2fe5SMarcel Hlopko       return true;
291cdce2fe5SMarcel Hlopko     }
292cdce2fe5SMarcel Hlopko     // Next sibling doesn't begin at the same loc, it must be a different
293cdce2fe5SMarcel Hlopko     // declaration, so this declarator is responsible.
294cdce2fe5SMarcel Hlopko     if (NextT->getBeginLoc() != D->getBeginLoc()) {
295cdce2fe5SMarcel Hlopko       return true;
296cdce2fe5SMarcel Hlopko     }
297cdce2fe5SMarcel Hlopko 
298cdce2fe5SMarcel Hlopko     // NextT is a member of the same declaration, and we need the last member to
299cdce2fe5SMarcel Hlopko     // create declaration. This one is not responsible.
300cdce2fe5SMarcel Hlopko     return false;
301cdce2fe5SMarcel Hlopko   }
302cdce2fe5SMarcel Hlopko 
303cdce2fe5SMarcel Hlopko   llvm::ArrayRef<syntax::Token> getDeclarationRange(Decl *D) {
30488bf9b3dSMarcel Hlopko     llvm::ArrayRef<clang::syntax::Token> Tokens;
30588bf9b3dSMarcel Hlopko     // We want to drop the template parameters for specializations.
30688bf9b3dSMarcel Hlopko     if (const auto *S = llvm::dyn_cast<TagDecl>(D))
30788bf9b3dSMarcel Hlopko       Tokens = getRange(S->TypeDecl::getBeginLoc(), S->getEndLoc());
30888bf9b3dSMarcel Hlopko     else
309a711a3a4SMarcel Hlopko       Tokens = getRange(D->getSourceRange());
31088bf9b3dSMarcel Hlopko     return maybeAppendSemicolon(Tokens, D);
3119b3f38f9SIlya Biryukov   }
312cdce2fe5SMarcel Hlopko 
31358fa50f4SIlya Biryukov   llvm::ArrayRef<syntax::Token> getExprRange(const Expr *E) const {
314a711a3a4SMarcel Hlopko     return getRange(E->getSourceRange());
31558fa50f4SIlya Biryukov   }
316cdce2fe5SMarcel Hlopko 
31758fa50f4SIlya Biryukov   /// Find the adjusted range for the statement, consuming the trailing
31858fa50f4SIlya Biryukov   /// semicolon when needed.
31958fa50f4SIlya Biryukov   llvm::ArrayRef<syntax::Token> getStmtRange(const Stmt *S) const {
320a711a3a4SMarcel Hlopko     auto Tokens = getRange(S->getSourceRange());
32158fa50f4SIlya Biryukov     if (isa<CompoundStmt>(S))
32258fa50f4SIlya Biryukov       return Tokens;
32358fa50f4SIlya Biryukov 
32458fa50f4SIlya Biryukov     // Some statements miss a trailing semicolon, e.g. 'return', 'continue' and
32558fa50f4SIlya Biryukov     // all statements that end with those. Consume this semicolon here.
326e702bdb8SIlya Biryukov     if (Tokens.back().kind() == tok::semi)
327e702bdb8SIlya Biryukov       return Tokens;
328e702bdb8SIlya Biryukov     return withTrailingSemicolon(Tokens);
329e702bdb8SIlya Biryukov   }
330e702bdb8SIlya Biryukov 
331e702bdb8SIlya Biryukov private:
332e702bdb8SIlya Biryukov   llvm::ArrayRef<syntax::Token>
33388bf9b3dSMarcel Hlopko   maybeAppendSemicolon(llvm::ArrayRef<syntax::Token> Tokens,
33488bf9b3dSMarcel Hlopko                        const Decl *D) const {
33588bf9b3dSMarcel Hlopko     if (llvm::isa<NamespaceDecl>(D))
33688bf9b3dSMarcel Hlopko       return Tokens;
33788bf9b3dSMarcel Hlopko     if (DeclsWithoutSemicolons.count(D))
33888bf9b3dSMarcel Hlopko       return Tokens;
33988bf9b3dSMarcel Hlopko     // FIXME: do not consume trailing semicolon on function definitions.
34088bf9b3dSMarcel Hlopko     // Most declarations own a semicolon in syntax trees, but not in clang AST.
34188bf9b3dSMarcel Hlopko     return withTrailingSemicolon(Tokens);
34288bf9b3dSMarcel Hlopko   }
34388bf9b3dSMarcel Hlopko 
34488bf9b3dSMarcel Hlopko   llvm::ArrayRef<syntax::Token>
345e702bdb8SIlya Biryukov   withTrailingSemicolon(llvm::ArrayRef<syntax::Token> Tokens) const {
346e702bdb8SIlya Biryukov     assert(!Tokens.empty());
347e702bdb8SIlya Biryukov     assert(Tokens.back().kind() != tok::eof);
3487d382dcdSMarcel Hlopko     // We never consume 'eof', so looking at the next token is ok.
34958fa50f4SIlya Biryukov     if (Tokens.back().kind() != tok::semi && Tokens.end()->kind() == tok::semi)
35058fa50f4SIlya Biryukov       return llvm::makeArrayRef(Tokens.begin(), Tokens.end() + 1);
35158fa50f4SIlya Biryukov     return Tokens;
3529b3f38f9SIlya Biryukov   }
3539b3f38f9SIlya Biryukov 
354a711a3a4SMarcel Hlopko   void setRole(syntax::Node *N, NodeRole R) {
355a711a3a4SMarcel Hlopko     assert(N->role() == NodeRole::Detached);
356a711a3a4SMarcel Hlopko     N->setRole(R);
357a711a3a4SMarcel Hlopko   }
358a711a3a4SMarcel Hlopko 
3599b3f38f9SIlya Biryukov   /// A collection of trees covering the input tokens.
3609b3f38f9SIlya Biryukov   /// When created, each tree corresponds to a single token in the file.
3619b3f38f9SIlya Biryukov   /// Clients call 'foldChildren' to attach one or more subtrees to a parent
3629b3f38f9SIlya Biryukov   /// node and update the list of trees accordingly.
3639b3f38f9SIlya Biryukov   ///
3649b3f38f9SIlya Biryukov   /// Ensures that added nodes properly nest and cover the whole token stream.
3659b3f38f9SIlya Biryukov   struct Forest {
3669b3f38f9SIlya Biryukov     Forest(syntax::Arena &A) {
367bfbf6b6cSIlya Biryukov       assert(!A.tokenBuffer().expandedTokens().empty());
368bfbf6b6cSIlya Biryukov       assert(A.tokenBuffer().expandedTokens().back().kind() == tok::eof);
3699b3f38f9SIlya Biryukov       // Create all leaf nodes.
370bfbf6b6cSIlya Biryukov       // Note that we do not have 'eof' in the tree.
3711ad15046SIlya Biryukov       for (auto &T : A.tokenBuffer().expandedTokens().drop_back()) {
3721ad15046SIlya Biryukov         auto *L = new (A.allocator()) syntax::Leaf(&T);
3731ad15046SIlya Biryukov         L->Original = true;
3741ad15046SIlya Biryukov         L->CanModify = A.tokenBuffer().spelledForExpanded(T).hasValue();
375a711a3a4SMarcel Hlopko         Trees.insert(Trees.end(), {&T, L});
3761ad15046SIlya Biryukov       }
3779b3f38f9SIlya Biryukov     }
3789b3f38f9SIlya Biryukov 
3799b3f38f9SIlya Biryukov     void assignRole(llvm::ArrayRef<syntax::Token> Range,
3809b3f38f9SIlya Biryukov                     syntax::NodeRole Role) {
3819b3f38f9SIlya Biryukov       assert(!Range.empty());
3829b3f38f9SIlya Biryukov       auto It = Trees.lower_bound(Range.begin());
3839b3f38f9SIlya Biryukov       assert(It != Trees.end() && "no node found");
3849b3f38f9SIlya Biryukov       assert(It->first == Range.begin() && "no child with the specified range");
3859b3f38f9SIlya Biryukov       assert((std::next(It) == Trees.end() ||
3869b3f38f9SIlya Biryukov               std::next(It)->first == Range.end()) &&
3879b3f38f9SIlya Biryukov              "no child with the specified range");
388a711a3a4SMarcel Hlopko       assert(It->second->role() == NodeRole::Detached &&
389a711a3a4SMarcel Hlopko              "re-assigning role for a child");
390a711a3a4SMarcel Hlopko       It->second->setRole(Role);
3919b3f38f9SIlya Biryukov     }
3929b3f38f9SIlya Biryukov 
393e702bdb8SIlya Biryukov     /// Add \p Node to the forest and attach child nodes based on \p Tokens.
3941ad15046SIlya Biryukov     void foldChildren(const syntax::Arena &A,
3951ad15046SIlya Biryukov                       llvm::ArrayRef<syntax::Token> Tokens,
3969b3f38f9SIlya Biryukov                       syntax::Tree *Node) {
397e702bdb8SIlya Biryukov       // Attach children to `Node`.
398cdce2fe5SMarcel Hlopko       assert(Node->firstChild() == nullptr && "node already has children");
399cdce2fe5SMarcel Hlopko 
400cdce2fe5SMarcel Hlopko       auto *FirstToken = Tokens.begin();
401cdce2fe5SMarcel Hlopko       auto BeginChildren = Trees.lower_bound(FirstToken);
402cdce2fe5SMarcel Hlopko 
403cdce2fe5SMarcel Hlopko       assert((BeginChildren == Trees.end() ||
404cdce2fe5SMarcel Hlopko               BeginChildren->first == FirstToken) &&
405cdce2fe5SMarcel Hlopko              "fold crosses boundaries of existing subtrees");
406cdce2fe5SMarcel Hlopko       auto EndChildren = Trees.lower_bound(Tokens.end());
407cdce2fe5SMarcel Hlopko       assert(
408cdce2fe5SMarcel Hlopko           (EndChildren == Trees.end() || EndChildren->first == Tokens.end()) &&
409cdce2fe5SMarcel Hlopko           "fold crosses boundaries of existing subtrees");
410cdce2fe5SMarcel Hlopko 
411cdce2fe5SMarcel Hlopko       // We need to go in reverse order, because we can only prepend.
412cdce2fe5SMarcel Hlopko       for (auto It = EndChildren; It != BeginChildren; --It) {
413cdce2fe5SMarcel Hlopko         auto *C = std::prev(It)->second;
414cdce2fe5SMarcel Hlopko         if (C->role() == NodeRole::Detached)
415cdce2fe5SMarcel Hlopko           C->setRole(NodeRole::Unknown);
416cdce2fe5SMarcel Hlopko         Node->prependChildLowLevel(C);
417e702bdb8SIlya Biryukov       }
4189b3f38f9SIlya Biryukov 
419cdce2fe5SMarcel Hlopko       // Mark that this node came from the AST and is backed by the source code.
420cdce2fe5SMarcel Hlopko       Node->Original = true;
421cdce2fe5SMarcel Hlopko       Node->CanModify = A.tokenBuffer().spelledForExpanded(Tokens).hasValue();
4229b3f38f9SIlya Biryukov 
423cdce2fe5SMarcel Hlopko       Trees.erase(BeginChildren, EndChildren);
424cdce2fe5SMarcel Hlopko       Trees.insert({FirstToken, Node});
4259b3f38f9SIlya Biryukov     }
4269b3f38f9SIlya Biryukov 
4279b3f38f9SIlya Biryukov     // EXPECTS: all tokens were consumed and are owned by a single root node.
4289b3f38f9SIlya Biryukov     syntax::Node *finalize() && {
4299b3f38f9SIlya Biryukov       assert(Trees.size() == 1);
430a711a3a4SMarcel Hlopko       auto *Root = Trees.begin()->second;
4319b3f38f9SIlya Biryukov       Trees = {};
4329b3f38f9SIlya Biryukov       return Root;
4339b3f38f9SIlya Biryukov     }
4349b3f38f9SIlya Biryukov 
4359b3f38f9SIlya Biryukov     std::string str(const syntax::Arena &A) const {
4369b3f38f9SIlya Biryukov       std::string R;
4379b3f38f9SIlya Biryukov       for (auto It = Trees.begin(); It != Trees.end(); ++It) {
4389b3f38f9SIlya Biryukov         unsigned CoveredTokens =
4399b3f38f9SIlya Biryukov             It != Trees.end()
4409b3f38f9SIlya Biryukov                 ? (std::next(It)->first - It->first)
4419b3f38f9SIlya Biryukov                 : A.tokenBuffer().expandedTokens().end() - It->first;
4429b3f38f9SIlya Biryukov 
443adcd0268SBenjamin Kramer         R += std::string(llvm::formatv(
444a711a3a4SMarcel Hlopko             "- '{0}' covers '{1}'+{2} tokens\n", It->second->kind(),
445adcd0268SBenjamin Kramer             It->first->text(A.sourceManager()), CoveredTokens));
446a711a3a4SMarcel Hlopko         R += It->second->dump(A);
4479b3f38f9SIlya Biryukov       }
4489b3f38f9SIlya Biryukov       return R;
4499b3f38f9SIlya Biryukov     }
4509b3f38f9SIlya Biryukov 
4519b3f38f9SIlya Biryukov   private:
4529b3f38f9SIlya Biryukov     /// Maps from the start token to a subtree starting at that token.
453302cb3bcSIlya Biryukov     /// Keys in the map are pointers into the array of expanded tokens, so
454302cb3bcSIlya Biryukov     /// pointer order corresponds to the order of preprocessor tokens.
455a711a3a4SMarcel Hlopko     std::map<const syntax::Token *, syntax::Node *> Trees;
4569b3f38f9SIlya Biryukov   };
4579b3f38f9SIlya Biryukov 
4589b3f38f9SIlya Biryukov   /// For debugging purposes.
4599b3f38f9SIlya Biryukov   std::string str() { return Pending.str(Arena); }
4609b3f38f9SIlya Biryukov 
4619b3f38f9SIlya Biryukov   syntax::Arena &Arena;
462c1bbefefSIlya Biryukov   /// To quickly find tokens by their start location.
463c1bbefefSIlya Biryukov   llvm::DenseMap</*SourceLocation*/ unsigned, const syntax::Token *>
464c1bbefefSIlya Biryukov       LocationToToken;
4659b3f38f9SIlya Biryukov   Forest Pending;
466e702bdb8SIlya Biryukov   llvm::DenseSet<Decl *> DeclsWithoutSemicolons;
467a711a3a4SMarcel Hlopko   ASTToSyntaxMapping Mapping;
4689b3f38f9SIlya Biryukov };
4699b3f38f9SIlya Biryukov 
4709b3f38f9SIlya Biryukov namespace {
4719b3f38f9SIlya Biryukov class BuildTreeVisitor : public RecursiveASTVisitor<BuildTreeVisitor> {
4729b3f38f9SIlya Biryukov public:
4739b3f38f9SIlya Biryukov   explicit BuildTreeVisitor(ASTContext &Ctx, syntax::TreeBuilder &Builder)
4749b3f38f9SIlya Biryukov       : Builder(Builder), LangOpts(Ctx.getLangOpts()) {}
4759b3f38f9SIlya Biryukov 
4769b3f38f9SIlya Biryukov   bool shouldTraversePostOrder() const { return true; }
4779b3f38f9SIlya Biryukov 
4787d382dcdSMarcel Hlopko   bool WalkUpFromDeclaratorDecl(DeclaratorDecl *DD) {
479cdce2fe5SMarcel Hlopko     return processDeclaratorAndDeclaration(DD);
4807d382dcdSMarcel Hlopko   }
4817d382dcdSMarcel Hlopko 
482cdce2fe5SMarcel Hlopko   bool WalkUpFromTypedefNameDecl(TypedefNameDecl *TD) {
483cdce2fe5SMarcel Hlopko     return processDeclaratorAndDeclaration(TD);
4849b3f38f9SIlya Biryukov   }
4859b3f38f9SIlya Biryukov 
4869b3f38f9SIlya Biryukov   bool VisitDecl(Decl *D) {
4879b3f38f9SIlya Biryukov     assert(!D->isImplicit());
488cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(D),
489a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UnknownDeclaration(), D);
490e702bdb8SIlya Biryukov     return true;
491e702bdb8SIlya Biryukov   }
492e702bdb8SIlya Biryukov 
49388bf9b3dSMarcel Hlopko   // RAV does not call WalkUpFrom* on explicit instantiations, so we have to
49488bf9b3dSMarcel Hlopko   // override Traverse.
49588bf9b3dSMarcel Hlopko   // FIXME: make RAV call WalkUpFrom* instead.
49688bf9b3dSMarcel Hlopko   bool
49788bf9b3dSMarcel Hlopko   TraverseClassTemplateSpecializationDecl(ClassTemplateSpecializationDecl *C) {
49888bf9b3dSMarcel Hlopko     if (!RecursiveASTVisitor::TraverseClassTemplateSpecializationDecl(C))
49988bf9b3dSMarcel Hlopko       return false;
50088bf9b3dSMarcel Hlopko     if (C->isExplicitSpecialization())
50188bf9b3dSMarcel Hlopko       return true; // we are only interested in explicit instantiations.
502a711a3a4SMarcel Hlopko     auto *Declaration =
503a711a3a4SMarcel Hlopko         cast<syntax::SimpleDeclaration>(handleFreeStandingTagDecl(C));
50488bf9b3dSMarcel Hlopko     foldExplicitTemplateInstantiation(
50588bf9b3dSMarcel Hlopko         Builder.getTemplateRange(C), Builder.findToken(C->getExternLoc()),
506a711a3a4SMarcel Hlopko         Builder.findToken(C->getTemplateKeywordLoc()), Declaration, C);
50788bf9b3dSMarcel Hlopko     return true;
50888bf9b3dSMarcel Hlopko   }
50988bf9b3dSMarcel Hlopko 
51088bf9b3dSMarcel Hlopko   bool WalkUpFromTemplateDecl(TemplateDecl *S) {
51188bf9b3dSMarcel Hlopko     foldTemplateDeclaration(
512cdce2fe5SMarcel Hlopko         Builder.getDeclarationRange(S),
51388bf9b3dSMarcel Hlopko         Builder.findToken(S->getTemplateParameters()->getTemplateLoc()),
514cdce2fe5SMarcel Hlopko         Builder.getDeclarationRange(S->getTemplatedDecl()), S);
51588bf9b3dSMarcel Hlopko     return true;
51688bf9b3dSMarcel Hlopko   }
51788bf9b3dSMarcel Hlopko 
518e702bdb8SIlya Biryukov   bool WalkUpFromTagDecl(TagDecl *C) {
51904f627f6SIlya Biryukov     // FIXME: build the ClassSpecifier node.
52088bf9b3dSMarcel Hlopko     if (!C->isFreeStanding()) {
52188bf9b3dSMarcel Hlopko       assert(C->getNumTemplateParameterLists() == 0);
52204f627f6SIlya Biryukov       return true;
52304f627f6SIlya Biryukov     }
524a711a3a4SMarcel Hlopko     handleFreeStandingTagDecl(C);
525a711a3a4SMarcel Hlopko     return true;
526a711a3a4SMarcel Hlopko   }
527a711a3a4SMarcel Hlopko 
528a711a3a4SMarcel Hlopko   syntax::Declaration *handleFreeStandingTagDecl(TagDecl *C) {
529a711a3a4SMarcel Hlopko     assert(C->isFreeStanding());
53088bf9b3dSMarcel Hlopko     // Class is a declaration specifier and needs a spanning declaration node.
531cdce2fe5SMarcel Hlopko     auto DeclarationRange = Builder.getDeclarationRange(C);
532a711a3a4SMarcel Hlopko     syntax::Declaration *Result = new (allocator()) syntax::SimpleDeclaration;
533a711a3a4SMarcel Hlopko     Builder.foldNode(DeclarationRange, Result, nullptr);
53488bf9b3dSMarcel Hlopko 
53588bf9b3dSMarcel Hlopko     // Build TemplateDeclaration nodes if we had template parameters.
53688bf9b3dSMarcel Hlopko     auto ConsumeTemplateParameters = [&](const TemplateParameterList &L) {
53788bf9b3dSMarcel Hlopko       const auto *TemplateKW = Builder.findToken(L.getTemplateLoc());
53888bf9b3dSMarcel Hlopko       auto R = llvm::makeArrayRef(TemplateKW, DeclarationRange.end());
539a711a3a4SMarcel Hlopko       Result =
540a711a3a4SMarcel Hlopko           foldTemplateDeclaration(R, TemplateKW, DeclarationRange, nullptr);
54188bf9b3dSMarcel Hlopko       DeclarationRange = R;
54288bf9b3dSMarcel Hlopko     };
54388bf9b3dSMarcel Hlopko     if (auto *S = llvm::dyn_cast<ClassTemplatePartialSpecializationDecl>(C))
54488bf9b3dSMarcel Hlopko       ConsumeTemplateParameters(*S->getTemplateParameters());
54588bf9b3dSMarcel Hlopko     for (unsigned I = C->getNumTemplateParameterLists(); 0 < I; --I)
54688bf9b3dSMarcel Hlopko       ConsumeTemplateParameters(*C->getTemplateParameterList(I - 1));
547a711a3a4SMarcel Hlopko     return Result;
5489b3f38f9SIlya Biryukov   }
5499b3f38f9SIlya Biryukov 
5509b3f38f9SIlya Biryukov   bool WalkUpFromTranslationUnitDecl(TranslationUnitDecl *TU) {
5517d382dcdSMarcel Hlopko     // We do not want to call VisitDecl(), the declaration for translation
5529b3f38f9SIlya Biryukov     // unit is built by finalize().
5539b3f38f9SIlya Biryukov     return true;
5549b3f38f9SIlya Biryukov   }
5559b3f38f9SIlya Biryukov 
5569b3f38f9SIlya Biryukov   bool WalkUpFromCompoundStmt(CompoundStmt *S) {
55751dad419SIlya Biryukov     using NodeRole = syntax::NodeRole;
5589b3f38f9SIlya Biryukov 
559def65bb4SIlya Biryukov     Builder.markChildToken(S->getLBracLoc(), NodeRole::OpenParen);
56058fa50f4SIlya Biryukov     for (auto *Child : S->body())
56158fa50f4SIlya Biryukov       Builder.markStmtChild(Child, NodeRole::CompoundStatement_statement);
562def65bb4SIlya Biryukov     Builder.markChildToken(S->getRBracLoc(), NodeRole::CloseParen);
5639b3f38f9SIlya Biryukov 
56458fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
565a711a3a4SMarcel Hlopko                      new (allocator()) syntax::CompoundStatement, S);
5669b3f38f9SIlya Biryukov     return true;
5679b3f38f9SIlya Biryukov   }
5689b3f38f9SIlya Biryukov 
56958fa50f4SIlya Biryukov   // Some statements are not yet handled by syntax trees.
57058fa50f4SIlya Biryukov   bool WalkUpFromStmt(Stmt *S) {
57158fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
572a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UnknownStatement, S);
57358fa50f4SIlya Biryukov     return true;
57458fa50f4SIlya Biryukov   }
57558fa50f4SIlya Biryukov 
57658fa50f4SIlya Biryukov   bool TraverseCXXForRangeStmt(CXXForRangeStmt *S) {
57758fa50f4SIlya Biryukov     // We override to traverse range initializer as VarDecl.
57858fa50f4SIlya Biryukov     // RAV traverses it as a statement, we produce invalid node kinds in that
57958fa50f4SIlya Biryukov     // case.
58058fa50f4SIlya Biryukov     // FIXME: should do this in RAV instead?
58158fa50f4SIlya Biryukov     if (S->getInit() && !TraverseStmt(S->getInit()))
58258fa50f4SIlya Biryukov       return false;
58358fa50f4SIlya Biryukov     if (S->getLoopVariable() && !TraverseDecl(S->getLoopVariable()))
58458fa50f4SIlya Biryukov       return false;
58558fa50f4SIlya Biryukov     if (S->getRangeInit() && !TraverseStmt(S->getRangeInit()))
58658fa50f4SIlya Biryukov       return false;
58758fa50f4SIlya Biryukov     if (S->getBody() && !TraverseStmt(S->getBody()))
58858fa50f4SIlya Biryukov       return false;
58958fa50f4SIlya Biryukov     return true;
59058fa50f4SIlya Biryukov   }
59158fa50f4SIlya Biryukov 
59258fa50f4SIlya Biryukov   bool TraverseStmt(Stmt *S) {
593e702bdb8SIlya Biryukov     if (auto *DS = llvm::dyn_cast_or_null<DeclStmt>(S)) {
594e702bdb8SIlya Biryukov       // We want to consume the semicolon, make sure SimpleDeclaration does not.
595e702bdb8SIlya Biryukov       for (auto *D : DS->decls())
5967d382dcdSMarcel Hlopko         Builder.noticeDeclWithoutSemicolon(D);
597e702bdb8SIlya Biryukov     } else if (auto *E = llvm::dyn_cast_or_null<Expr>(S)) {
5983785eb83SEduardo Caldas       return RecursiveASTVisitor::TraverseStmt(E->IgnoreImplicit());
59958fa50f4SIlya Biryukov     }
60058fa50f4SIlya Biryukov     return RecursiveASTVisitor::TraverseStmt(S);
60158fa50f4SIlya Biryukov   }
60258fa50f4SIlya Biryukov 
60358fa50f4SIlya Biryukov   // Some expressions are not yet handled by syntax trees.
60458fa50f4SIlya Biryukov   bool WalkUpFromExpr(Expr *E) {
60558fa50f4SIlya Biryukov     assert(!isImplicitExpr(E) && "should be handled by TraverseStmt");
60658fa50f4SIlya Biryukov     Builder.foldNode(Builder.getExprRange(E),
607a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UnknownExpression, E);
60858fa50f4SIlya Biryukov     return true;
60958fa50f4SIlya Biryukov   }
61058fa50f4SIlya Biryukov 
6111b2f6b4aSEduardo Caldas   syntax::NestedNameSpecifier *
6121b2f6b4aSEduardo Caldas   BuildNestedNameSpecifier(NestedNameSpecifierLoc QualifierLoc) {
6131b2f6b4aSEduardo Caldas     if (!QualifierLoc)
6141b2f6b4aSEduardo Caldas       return nullptr;
6151b2f6b4aSEduardo Caldas     for (auto it = QualifierLoc; it; it = it.getPrefix()) {
6161b2f6b4aSEduardo Caldas       auto *NS = new (allocator()) syntax::NameSpecifier;
6171b2f6b4aSEduardo Caldas       Builder.foldNode(Builder.getRange(it.getLocalSourceRange()), NS, nullptr);
6181b2f6b4aSEduardo Caldas       Builder.markChild(NS, syntax::NodeRole::NestedNameSpecifier_specifier);
6191b2f6b4aSEduardo Caldas     }
6201b2f6b4aSEduardo Caldas     auto *NNS = new (allocator()) syntax::NestedNameSpecifier;
6211b2f6b4aSEduardo Caldas     Builder.foldNode(Builder.getRange(QualifierLoc.getSourceRange()), NNS,
6221b2f6b4aSEduardo Caldas                      nullptr);
6231b2f6b4aSEduardo Caldas     return NNS;
6241b2f6b4aSEduardo Caldas   }
6251b2f6b4aSEduardo Caldas 
6261b2f6b4aSEduardo Caldas   bool WalkUpFromDeclRefExpr(DeclRefExpr *S) {
6271b2f6b4aSEduardo Caldas     if (auto *NNS = BuildNestedNameSpecifier(S->getQualifierLoc()))
6281b2f6b4aSEduardo Caldas       Builder.markChild(NNS, syntax::NodeRole::IdExpression_qualifier);
6291b2f6b4aSEduardo Caldas 
6301b2f6b4aSEduardo Caldas     auto *unqualifiedId = new (allocator()) syntax::UnqualifiedId;
6311b2f6b4aSEduardo Caldas     // Get `UnqualifiedId` from `DeclRefExpr`.
6321b2f6b4aSEduardo Caldas     // FIXME: Extract this logic so that it can be used by `MemberExpr`,
6331b2f6b4aSEduardo Caldas     // and other semantic constructs, now it is tied to `DeclRefExpr`.
6341b2f6b4aSEduardo Caldas     if (!S->hasExplicitTemplateArgs()) {
6351b2f6b4aSEduardo Caldas       Builder.foldNode(Builder.getRange(S->getNameInfo().getSourceRange()),
6361b2f6b4aSEduardo Caldas                        unqualifiedId, nullptr);
6371b2f6b4aSEduardo Caldas     } else {
6381b2f6b4aSEduardo Caldas       auto templateIdSourceRange =
6391b2f6b4aSEduardo Caldas           SourceRange(S->getNameInfo().getBeginLoc(), S->getRAngleLoc());
6401b2f6b4aSEduardo Caldas       Builder.foldNode(Builder.getRange(templateIdSourceRange), unqualifiedId,
6411b2f6b4aSEduardo Caldas                        nullptr);
6421b2f6b4aSEduardo Caldas     }
6431b2f6b4aSEduardo Caldas     Builder.markChild(unqualifiedId, syntax::NodeRole::IdExpression_id);
6441b2f6b4aSEduardo Caldas 
6451b2f6b4aSEduardo Caldas     Builder.foldNode(Builder.getExprRange(S),
6461b2f6b4aSEduardo Caldas                      new (allocator()) syntax::IdExpression, S);
6471b2f6b4aSEduardo Caldas     return true;
6481b2f6b4aSEduardo Caldas   }
6491b2f6b4aSEduardo Caldas 
6503b739690SEduardo Caldas   bool WalkUpFromIntegerLiteral(IntegerLiteral *S) {
65142f6fec3SEduardo Caldas     Builder.markChildToken(S->getLocation(), syntax::NodeRole::LiteralToken);
6523b739690SEduardo Caldas     Builder.foldNode(Builder.getExprRange(S),
6533b739690SEduardo Caldas                      new (allocator()) syntax::IntegerLiteralExpression, S);
6543b739690SEduardo Caldas     return true;
6553b739690SEduardo Caldas   }
6563b739690SEduardo Caldas 
6577f7f8564SEduardo Caldas   bool WalkUpFromCXXBoolLiteralExpr(CXXBoolLiteralExpr *S) {
6587f7f8564SEduardo Caldas     Builder.markChildToken(S->getLocation(), syntax::NodeRole::LiteralToken);
6597f7f8564SEduardo Caldas     Builder.foldNode(Builder.getExprRange(S),
6607f7f8564SEduardo Caldas                      new (allocator()) syntax::BoolLiteralExpression, S);
6617f7f8564SEduardo Caldas     return true;
6627f7f8564SEduardo Caldas   }
6637f7f8564SEduardo Caldas 
664*221d7bbeSEduardo Caldas   bool WalkUpFromCharacterLiteral(CharacterLiteral *S) {
665*221d7bbeSEduardo Caldas     Builder.markChildToken(S->getLocation(), syntax::NodeRole::LiteralToken);
666*221d7bbeSEduardo Caldas     Builder.foldNode(Builder.getExprRange(S),
667*221d7bbeSEduardo Caldas                      new (allocator()) syntax::CharacterLiteralExpression, S);
668*221d7bbeSEduardo Caldas     return true;
669*221d7bbeSEduardo Caldas   }
670*221d7bbeSEduardo Caldas 
671007098d7SEduardo Caldas   bool WalkUpFromCXXNullPtrLiteralExpr(CXXNullPtrLiteralExpr *S) {
67242f6fec3SEduardo Caldas     Builder.markChildToken(S->getLocation(), syntax::NodeRole::LiteralToken);
673007098d7SEduardo Caldas     Builder.foldNode(Builder.getExprRange(S),
674007098d7SEduardo Caldas                      new (allocator()) syntax::CxxNullPtrExpression, S);
675007098d7SEduardo Caldas     return true;
676007098d7SEduardo Caldas   }
677007098d7SEduardo Caldas 
678461af57dSEduardo Caldas   bool WalkUpFromUnaryOperator(UnaryOperator *S) {
67942f6fec3SEduardo Caldas     Builder.markChildToken(S->getOperatorLoc(),
68042f6fec3SEduardo Caldas                            syntax::NodeRole::OperatorExpression_operatorToken);
681461af57dSEduardo Caldas     Builder.markExprChild(S->getSubExpr(),
682461af57dSEduardo Caldas                           syntax::NodeRole::UnaryOperatorExpression_operand);
683461af57dSEduardo Caldas 
684461af57dSEduardo Caldas     if (S->isPostfix())
685461af57dSEduardo Caldas       Builder.foldNode(Builder.getExprRange(S),
686461af57dSEduardo Caldas                        new (allocator()) syntax::PostfixUnaryOperatorExpression,
687461af57dSEduardo Caldas                        S);
688461af57dSEduardo Caldas     else
689461af57dSEduardo Caldas       Builder.foldNode(Builder.getExprRange(S),
690461af57dSEduardo Caldas                        new (allocator()) syntax::PrefixUnaryOperatorExpression,
691461af57dSEduardo Caldas                        S);
692461af57dSEduardo Caldas 
693461af57dSEduardo Caldas     return true;
694461af57dSEduardo Caldas   }
695461af57dSEduardo Caldas 
6963785eb83SEduardo Caldas   bool WalkUpFromBinaryOperator(BinaryOperator *S) {
6973785eb83SEduardo Caldas     Builder.markExprChild(
6983785eb83SEduardo Caldas         S->getLHS(), syntax::NodeRole::BinaryOperatorExpression_leftHandSide);
69942f6fec3SEduardo Caldas     Builder.markChildToken(S->getOperatorLoc(),
70042f6fec3SEduardo Caldas                            syntax::NodeRole::OperatorExpression_operatorToken);
7013785eb83SEduardo Caldas     Builder.markExprChild(
7023785eb83SEduardo Caldas         S->getRHS(), syntax::NodeRole::BinaryOperatorExpression_rightHandSide);
7033785eb83SEduardo Caldas     Builder.foldNode(Builder.getExprRange(S),
7043785eb83SEduardo Caldas                      new (allocator()) syntax::BinaryOperatorExpression, S);
7053785eb83SEduardo Caldas     return true;
7063785eb83SEduardo Caldas   }
7073785eb83SEduardo Caldas 
7083a574a6cSEduardo Caldas   bool WalkUpFromCXXOperatorCallExpr(CXXOperatorCallExpr *S) {
7093a574a6cSEduardo Caldas     if (S->isInfixBinaryOp()) {
7103a574a6cSEduardo Caldas       Builder.markExprChild(
7113a574a6cSEduardo Caldas           S->getArg(0),
7123a574a6cSEduardo Caldas           syntax::NodeRole::BinaryOperatorExpression_leftHandSide);
7133a574a6cSEduardo Caldas       Builder.markChildToken(
7143a574a6cSEduardo Caldas           S->getOperatorLoc(),
71542f6fec3SEduardo Caldas           syntax::NodeRole::OperatorExpression_operatorToken);
7163a574a6cSEduardo Caldas       Builder.markExprChild(
7173a574a6cSEduardo Caldas           S->getArg(1),
7183a574a6cSEduardo Caldas           syntax::NodeRole::BinaryOperatorExpression_rightHandSide);
7193a574a6cSEduardo Caldas       Builder.foldNode(Builder.getExprRange(S),
7203a574a6cSEduardo Caldas                        new (allocator()) syntax::BinaryOperatorExpression, S);
7213a574a6cSEduardo Caldas       return true;
7223a574a6cSEduardo Caldas     }
7233a574a6cSEduardo Caldas     return RecursiveASTVisitor::WalkUpFromCXXOperatorCallExpr(S);
7243a574a6cSEduardo Caldas   }
7253a574a6cSEduardo Caldas 
726be14a22bSIlya Biryukov   bool WalkUpFromNamespaceDecl(NamespaceDecl *S) {
727cdce2fe5SMarcel Hlopko     auto Tokens = Builder.getDeclarationRange(S);
728be14a22bSIlya Biryukov     if (Tokens.front().kind() == tok::coloncolon) {
729be14a22bSIlya Biryukov       // Handle nested namespace definitions. Those start at '::' token, e.g.
730be14a22bSIlya Biryukov       // namespace a^::b {}
731be14a22bSIlya Biryukov       // FIXME: build corresponding nodes for the name of this namespace.
732be14a22bSIlya Biryukov       return true;
733be14a22bSIlya Biryukov     }
734a711a3a4SMarcel Hlopko     Builder.foldNode(Tokens, new (allocator()) syntax::NamespaceDefinition, S);
735be14a22bSIlya Biryukov     return true;
736be14a22bSIlya Biryukov   }
737be14a22bSIlya Biryukov 
7387d382dcdSMarcel Hlopko   bool TraverseParenTypeLoc(ParenTypeLoc L) {
7397d382dcdSMarcel Hlopko     // We reverse order of traversal to get the proper syntax structure.
7407d382dcdSMarcel Hlopko     if (!WalkUpFromParenTypeLoc(L))
7417d382dcdSMarcel Hlopko       return false;
7427d382dcdSMarcel Hlopko     return TraverseTypeLoc(L.getInnerLoc());
7437d382dcdSMarcel Hlopko   }
7447d382dcdSMarcel Hlopko 
7457d382dcdSMarcel Hlopko   bool WalkUpFromParenTypeLoc(ParenTypeLoc L) {
7467d382dcdSMarcel Hlopko     Builder.markChildToken(L.getLParenLoc(), syntax::NodeRole::OpenParen);
7477d382dcdSMarcel Hlopko     Builder.markChildToken(L.getRParenLoc(), syntax::NodeRole::CloseParen);
7487d382dcdSMarcel Hlopko     Builder.foldNode(Builder.getRange(L.getLParenLoc(), L.getRParenLoc()),
749a711a3a4SMarcel Hlopko                      new (allocator()) syntax::ParenDeclarator, L);
7507d382dcdSMarcel Hlopko     return true;
7517d382dcdSMarcel Hlopko   }
7527d382dcdSMarcel Hlopko 
7537d382dcdSMarcel Hlopko   // Declarator chunks, they are produced by type locs and some clang::Decls.
7547d382dcdSMarcel Hlopko   bool WalkUpFromArrayTypeLoc(ArrayTypeLoc L) {
7557d382dcdSMarcel Hlopko     Builder.markChildToken(L.getLBracketLoc(), syntax::NodeRole::OpenParen);
7567d382dcdSMarcel Hlopko     Builder.markExprChild(L.getSizeExpr(),
7577d382dcdSMarcel Hlopko                           syntax::NodeRole::ArraySubscript_sizeExpression);
7587d382dcdSMarcel Hlopko     Builder.markChildToken(L.getRBracketLoc(), syntax::NodeRole::CloseParen);
7597d382dcdSMarcel Hlopko     Builder.foldNode(Builder.getRange(L.getLBracketLoc(), L.getRBracketLoc()),
760a711a3a4SMarcel Hlopko                      new (allocator()) syntax::ArraySubscript, L);
7617d382dcdSMarcel Hlopko     return true;
7627d382dcdSMarcel Hlopko   }
7637d382dcdSMarcel Hlopko 
7647d382dcdSMarcel Hlopko   bool WalkUpFromFunctionTypeLoc(FunctionTypeLoc L) {
7657d382dcdSMarcel Hlopko     Builder.markChildToken(L.getLParenLoc(), syntax::NodeRole::OpenParen);
766cdce2fe5SMarcel Hlopko     for (auto *P : L.getParams()) {
767cdce2fe5SMarcel Hlopko       Builder.markChild(P, syntax::NodeRole::ParametersAndQualifiers_parameter);
768cdce2fe5SMarcel Hlopko     }
7697d382dcdSMarcel Hlopko     Builder.markChildToken(L.getRParenLoc(), syntax::NodeRole::CloseParen);
7707d382dcdSMarcel Hlopko     Builder.foldNode(Builder.getRange(L.getLParenLoc(), L.getEndLoc()),
771a711a3a4SMarcel Hlopko                      new (allocator()) syntax::ParametersAndQualifiers, L);
7727d382dcdSMarcel Hlopko     return true;
7737d382dcdSMarcel Hlopko   }
7747d382dcdSMarcel Hlopko 
7757d382dcdSMarcel Hlopko   bool WalkUpFromFunctionProtoTypeLoc(FunctionProtoTypeLoc L) {
7767d382dcdSMarcel Hlopko     if (!L.getTypePtr()->hasTrailingReturn())
7777d382dcdSMarcel Hlopko       return WalkUpFromFunctionTypeLoc(L);
7787d382dcdSMarcel Hlopko 
779cdce2fe5SMarcel Hlopko     auto *TrailingReturnTokens = BuildTrailingReturn(L);
7807d382dcdSMarcel Hlopko     // Finish building the node for parameters.
7817d382dcdSMarcel Hlopko     Builder.markChild(TrailingReturnTokens,
7827d382dcdSMarcel Hlopko                       syntax::NodeRole::ParametersAndQualifiers_trailingReturn);
7837d382dcdSMarcel Hlopko     return WalkUpFromFunctionTypeLoc(L);
7847d382dcdSMarcel Hlopko   }
7857d382dcdSMarcel Hlopko 
7867d382dcdSMarcel Hlopko   bool WalkUpFromMemberPointerTypeLoc(MemberPointerTypeLoc L) {
7877d382dcdSMarcel Hlopko     auto SR = L.getLocalSourceRange();
788a711a3a4SMarcel Hlopko     Builder.foldNode(Builder.getRange(SR),
789a711a3a4SMarcel Hlopko                      new (allocator()) syntax::MemberPointer, L);
7907d382dcdSMarcel Hlopko     return true;
7917d382dcdSMarcel Hlopko   }
7927d382dcdSMarcel Hlopko 
79358fa50f4SIlya Biryukov   // The code below is very regular, it could even be generated with some
79458fa50f4SIlya Biryukov   // preprocessor magic. We merely assign roles to the corresponding children
79558fa50f4SIlya Biryukov   // and fold resulting nodes.
79658fa50f4SIlya Biryukov   bool WalkUpFromDeclStmt(DeclStmt *S) {
79758fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
798a711a3a4SMarcel Hlopko                      new (allocator()) syntax::DeclarationStatement, S);
79958fa50f4SIlya Biryukov     return true;
80058fa50f4SIlya Biryukov   }
80158fa50f4SIlya Biryukov 
80258fa50f4SIlya Biryukov   bool WalkUpFromNullStmt(NullStmt *S) {
80358fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
804a711a3a4SMarcel Hlopko                      new (allocator()) syntax::EmptyStatement, S);
80558fa50f4SIlya Biryukov     return true;
80658fa50f4SIlya Biryukov   }
80758fa50f4SIlya Biryukov 
80858fa50f4SIlya Biryukov   bool WalkUpFromSwitchStmt(SwitchStmt *S) {
809def65bb4SIlya Biryukov     Builder.markChildToken(S->getSwitchLoc(),
81058fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
81158fa50f4SIlya Biryukov     Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement);
81258fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
813a711a3a4SMarcel Hlopko                      new (allocator()) syntax::SwitchStatement, S);
81458fa50f4SIlya Biryukov     return true;
81558fa50f4SIlya Biryukov   }
81658fa50f4SIlya Biryukov 
81758fa50f4SIlya Biryukov   bool WalkUpFromCaseStmt(CaseStmt *S) {
818def65bb4SIlya Biryukov     Builder.markChildToken(S->getKeywordLoc(),
81958fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
82058fa50f4SIlya Biryukov     Builder.markExprChild(S->getLHS(), syntax::NodeRole::CaseStatement_value);
82158fa50f4SIlya Biryukov     Builder.markStmtChild(S->getSubStmt(), syntax::NodeRole::BodyStatement);
82258fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
823a711a3a4SMarcel Hlopko                      new (allocator()) syntax::CaseStatement, S);
82458fa50f4SIlya Biryukov     return true;
82558fa50f4SIlya Biryukov   }
82658fa50f4SIlya Biryukov 
82758fa50f4SIlya Biryukov   bool WalkUpFromDefaultStmt(DefaultStmt *S) {
828def65bb4SIlya Biryukov     Builder.markChildToken(S->getKeywordLoc(),
82958fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
83058fa50f4SIlya Biryukov     Builder.markStmtChild(S->getSubStmt(), syntax::NodeRole::BodyStatement);
83158fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
832a711a3a4SMarcel Hlopko                      new (allocator()) syntax::DefaultStatement, S);
83358fa50f4SIlya Biryukov     return true;
83458fa50f4SIlya Biryukov   }
83558fa50f4SIlya Biryukov 
83658fa50f4SIlya Biryukov   bool WalkUpFromIfStmt(IfStmt *S) {
837def65bb4SIlya Biryukov     Builder.markChildToken(S->getIfLoc(), syntax::NodeRole::IntroducerKeyword);
83858fa50f4SIlya Biryukov     Builder.markStmtChild(S->getThen(),
83958fa50f4SIlya Biryukov                           syntax::NodeRole::IfStatement_thenStatement);
840def65bb4SIlya Biryukov     Builder.markChildToken(S->getElseLoc(),
84158fa50f4SIlya Biryukov                            syntax::NodeRole::IfStatement_elseKeyword);
84258fa50f4SIlya Biryukov     Builder.markStmtChild(S->getElse(),
84358fa50f4SIlya Biryukov                           syntax::NodeRole::IfStatement_elseStatement);
84458fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
845a711a3a4SMarcel Hlopko                      new (allocator()) syntax::IfStatement, S);
84658fa50f4SIlya Biryukov     return true;
84758fa50f4SIlya Biryukov   }
84858fa50f4SIlya Biryukov 
84958fa50f4SIlya Biryukov   bool WalkUpFromForStmt(ForStmt *S) {
850def65bb4SIlya Biryukov     Builder.markChildToken(S->getForLoc(), syntax::NodeRole::IntroducerKeyword);
85158fa50f4SIlya Biryukov     Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement);
85258fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
853a711a3a4SMarcel Hlopko                      new (allocator()) syntax::ForStatement, S);
85458fa50f4SIlya Biryukov     return true;
85558fa50f4SIlya Biryukov   }
85658fa50f4SIlya Biryukov 
85758fa50f4SIlya Biryukov   bool WalkUpFromWhileStmt(WhileStmt *S) {
858def65bb4SIlya Biryukov     Builder.markChildToken(S->getWhileLoc(),
85958fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
86058fa50f4SIlya Biryukov     Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement);
86158fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
862a711a3a4SMarcel Hlopko                      new (allocator()) syntax::WhileStatement, S);
86358fa50f4SIlya Biryukov     return true;
86458fa50f4SIlya Biryukov   }
86558fa50f4SIlya Biryukov 
86658fa50f4SIlya Biryukov   bool WalkUpFromContinueStmt(ContinueStmt *S) {
867def65bb4SIlya Biryukov     Builder.markChildToken(S->getContinueLoc(),
86858fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
86958fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
870a711a3a4SMarcel Hlopko                      new (allocator()) syntax::ContinueStatement, S);
87158fa50f4SIlya Biryukov     return true;
87258fa50f4SIlya Biryukov   }
87358fa50f4SIlya Biryukov 
87458fa50f4SIlya Biryukov   bool WalkUpFromBreakStmt(BreakStmt *S) {
875def65bb4SIlya Biryukov     Builder.markChildToken(S->getBreakLoc(),
87658fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
87758fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
878a711a3a4SMarcel Hlopko                      new (allocator()) syntax::BreakStatement, S);
87958fa50f4SIlya Biryukov     return true;
88058fa50f4SIlya Biryukov   }
88158fa50f4SIlya Biryukov 
88258fa50f4SIlya Biryukov   bool WalkUpFromReturnStmt(ReturnStmt *S) {
883def65bb4SIlya Biryukov     Builder.markChildToken(S->getReturnLoc(),
88458fa50f4SIlya Biryukov                            syntax::NodeRole::IntroducerKeyword);
88558fa50f4SIlya Biryukov     Builder.markExprChild(S->getRetValue(),
88658fa50f4SIlya Biryukov                           syntax::NodeRole::ReturnStatement_value);
88758fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
888a711a3a4SMarcel Hlopko                      new (allocator()) syntax::ReturnStatement, S);
88958fa50f4SIlya Biryukov     return true;
89058fa50f4SIlya Biryukov   }
89158fa50f4SIlya Biryukov 
89258fa50f4SIlya Biryukov   bool WalkUpFromCXXForRangeStmt(CXXForRangeStmt *S) {
893def65bb4SIlya Biryukov     Builder.markChildToken(S->getForLoc(), syntax::NodeRole::IntroducerKeyword);
89458fa50f4SIlya Biryukov     Builder.markStmtChild(S->getBody(), syntax::NodeRole::BodyStatement);
89558fa50f4SIlya Biryukov     Builder.foldNode(Builder.getStmtRange(S),
896a711a3a4SMarcel Hlopko                      new (allocator()) syntax::RangeBasedForStatement, S);
89758fa50f4SIlya Biryukov     return true;
89858fa50f4SIlya Biryukov   }
89958fa50f4SIlya Biryukov 
900be14a22bSIlya Biryukov   bool WalkUpFromEmptyDecl(EmptyDecl *S) {
901cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
902a711a3a4SMarcel Hlopko                      new (allocator()) syntax::EmptyDeclaration, S);
903be14a22bSIlya Biryukov     return true;
904be14a22bSIlya Biryukov   }
905be14a22bSIlya Biryukov 
906be14a22bSIlya Biryukov   bool WalkUpFromStaticAssertDecl(StaticAssertDecl *S) {
907be14a22bSIlya Biryukov     Builder.markExprChild(S->getAssertExpr(),
908be14a22bSIlya Biryukov                           syntax::NodeRole::StaticAssertDeclaration_condition);
909be14a22bSIlya Biryukov     Builder.markExprChild(S->getMessage(),
910be14a22bSIlya Biryukov                           syntax::NodeRole::StaticAssertDeclaration_message);
911cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
912a711a3a4SMarcel Hlopko                      new (allocator()) syntax::StaticAssertDeclaration, S);
913be14a22bSIlya Biryukov     return true;
914be14a22bSIlya Biryukov   }
915be14a22bSIlya Biryukov 
916be14a22bSIlya Biryukov   bool WalkUpFromLinkageSpecDecl(LinkageSpecDecl *S) {
917cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
918a711a3a4SMarcel Hlopko                      new (allocator()) syntax::LinkageSpecificationDeclaration,
919a711a3a4SMarcel Hlopko                      S);
920be14a22bSIlya Biryukov     return true;
921be14a22bSIlya Biryukov   }
922be14a22bSIlya Biryukov 
923be14a22bSIlya Biryukov   bool WalkUpFromNamespaceAliasDecl(NamespaceAliasDecl *S) {
924cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
925a711a3a4SMarcel Hlopko                      new (allocator()) syntax::NamespaceAliasDefinition, S);
926be14a22bSIlya Biryukov     return true;
927be14a22bSIlya Biryukov   }
928be14a22bSIlya Biryukov 
929be14a22bSIlya Biryukov   bool WalkUpFromUsingDirectiveDecl(UsingDirectiveDecl *S) {
930cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
931a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UsingNamespaceDirective, S);
932be14a22bSIlya Biryukov     return true;
933be14a22bSIlya Biryukov   }
934be14a22bSIlya Biryukov 
935be14a22bSIlya Biryukov   bool WalkUpFromUsingDecl(UsingDecl *S) {
936cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
937a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UsingDeclaration, S);
938be14a22bSIlya Biryukov     return true;
939be14a22bSIlya Biryukov   }
940be14a22bSIlya Biryukov 
941be14a22bSIlya Biryukov   bool WalkUpFromUnresolvedUsingValueDecl(UnresolvedUsingValueDecl *S) {
942cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
943a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UsingDeclaration, S);
944be14a22bSIlya Biryukov     return true;
945be14a22bSIlya Biryukov   }
946be14a22bSIlya Biryukov 
947be14a22bSIlya Biryukov   bool WalkUpFromUnresolvedUsingTypenameDecl(UnresolvedUsingTypenameDecl *S) {
948cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
949a711a3a4SMarcel Hlopko                      new (allocator()) syntax::UsingDeclaration, S);
950be14a22bSIlya Biryukov     return true;
951be14a22bSIlya Biryukov   }
952be14a22bSIlya Biryukov 
953be14a22bSIlya Biryukov   bool WalkUpFromTypeAliasDecl(TypeAliasDecl *S) {
954cdce2fe5SMarcel Hlopko     Builder.foldNode(Builder.getDeclarationRange(S),
955a711a3a4SMarcel Hlopko                      new (allocator()) syntax::TypeAliasDeclaration, S);
956be14a22bSIlya Biryukov     return true;
957be14a22bSIlya Biryukov   }
958be14a22bSIlya Biryukov 
9599b3f38f9SIlya Biryukov private:
960cdce2fe5SMarcel Hlopko   template <class T> SourceLocation getQualifiedNameStart(T *D) {
961cdce2fe5SMarcel Hlopko     static_assert((std::is_base_of<DeclaratorDecl, T>::value ||
962cdce2fe5SMarcel Hlopko                    std::is_base_of<TypedefNameDecl, T>::value),
963cdce2fe5SMarcel Hlopko                   "only DeclaratorDecl and TypedefNameDecl are supported.");
964cdce2fe5SMarcel Hlopko 
965cdce2fe5SMarcel Hlopko     auto DN = D->getDeclName();
966cdce2fe5SMarcel Hlopko     bool IsAnonymous = DN.isIdentifier() && !DN.getAsIdentifierInfo();
967cdce2fe5SMarcel Hlopko     if (IsAnonymous)
968cdce2fe5SMarcel Hlopko       return SourceLocation();
969cdce2fe5SMarcel Hlopko 
970cdce2fe5SMarcel Hlopko     if (const auto *DD = llvm::dyn_cast<DeclaratorDecl>(D)) {
971cdce2fe5SMarcel Hlopko       if (DD->getQualifierLoc()) {
972cdce2fe5SMarcel Hlopko         return DD->getQualifierLoc().getBeginLoc();
973cdce2fe5SMarcel Hlopko       }
974cdce2fe5SMarcel Hlopko     }
975cdce2fe5SMarcel Hlopko 
976cdce2fe5SMarcel Hlopko     return D->getLocation();
977cdce2fe5SMarcel Hlopko   }
978cdce2fe5SMarcel Hlopko 
979cdce2fe5SMarcel Hlopko   SourceRange getInitializerRange(Decl *D) {
980cdce2fe5SMarcel Hlopko     if (auto *V = llvm::dyn_cast<VarDecl>(D)) {
981cdce2fe5SMarcel Hlopko       auto *I = V->getInit();
982cdce2fe5SMarcel Hlopko       // Initializers in range-based-for are not part of the declarator
983cdce2fe5SMarcel Hlopko       if (I && !V->isCXXForRangeDecl())
984cdce2fe5SMarcel Hlopko         return I->getSourceRange();
985cdce2fe5SMarcel Hlopko     }
986cdce2fe5SMarcel Hlopko 
987cdce2fe5SMarcel Hlopko     return SourceRange();
988cdce2fe5SMarcel Hlopko   }
989cdce2fe5SMarcel Hlopko 
990cdce2fe5SMarcel Hlopko   /// Folds SimpleDeclarator node (if present) and in case this is the last
991cdce2fe5SMarcel Hlopko   /// declarator in the chain it also folds SimpleDeclaration node.
992cdce2fe5SMarcel Hlopko   template <class T> bool processDeclaratorAndDeclaration(T *D) {
993cdce2fe5SMarcel Hlopko     SourceRange Initializer = getInitializerRange(D);
994cdce2fe5SMarcel Hlopko     auto Range = getDeclaratorRange(Builder.sourceManager(),
995cdce2fe5SMarcel Hlopko                                     D->getTypeSourceInfo()->getTypeLoc(),
996cdce2fe5SMarcel Hlopko                                     getQualifiedNameStart(D), Initializer);
997cdce2fe5SMarcel Hlopko 
998cdce2fe5SMarcel Hlopko     // There doesn't have to be a declarator (e.g. `void foo(int)` only has
999cdce2fe5SMarcel Hlopko     // declaration, but no declarator).
1000cdce2fe5SMarcel Hlopko     if (Range.getBegin().isValid()) {
1001cdce2fe5SMarcel Hlopko       auto *N = new (allocator()) syntax::SimpleDeclarator;
1002cdce2fe5SMarcel Hlopko       Builder.foldNode(Builder.getRange(Range), N, nullptr);
1003cdce2fe5SMarcel Hlopko       Builder.markChild(N, syntax::NodeRole::SimpleDeclaration_declarator);
1004cdce2fe5SMarcel Hlopko     }
1005cdce2fe5SMarcel Hlopko 
1006cdce2fe5SMarcel Hlopko     if (Builder.isResponsibleForCreatingDeclaration(D)) {
1007cdce2fe5SMarcel Hlopko       Builder.foldNode(Builder.getDeclarationRange(D),
1008cdce2fe5SMarcel Hlopko                        new (allocator()) syntax::SimpleDeclaration, D);
1009cdce2fe5SMarcel Hlopko     }
1010cdce2fe5SMarcel Hlopko     return true;
1011cdce2fe5SMarcel Hlopko   }
1012cdce2fe5SMarcel Hlopko 
10137d382dcdSMarcel Hlopko   /// Returns the range of the built node.
1014a711a3a4SMarcel Hlopko   syntax::TrailingReturnType *BuildTrailingReturn(FunctionProtoTypeLoc L) {
10157d382dcdSMarcel Hlopko     assert(L.getTypePtr()->hasTrailingReturn());
10167d382dcdSMarcel Hlopko 
10177d382dcdSMarcel Hlopko     auto ReturnedType = L.getReturnLoc();
10187d382dcdSMarcel Hlopko     // Build node for the declarator, if any.
10197d382dcdSMarcel Hlopko     auto ReturnDeclaratorRange =
10207d382dcdSMarcel Hlopko         getDeclaratorRange(this->Builder.sourceManager(), ReturnedType,
10217d382dcdSMarcel Hlopko                            /*Name=*/SourceLocation(),
10227d382dcdSMarcel Hlopko                            /*Initializer=*/SourceLocation());
1023a711a3a4SMarcel Hlopko     syntax::SimpleDeclarator *ReturnDeclarator = nullptr;
10247d382dcdSMarcel Hlopko     if (ReturnDeclaratorRange.isValid()) {
1025a711a3a4SMarcel Hlopko       ReturnDeclarator = new (allocator()) syntax::SimpleDeclarator;
1026a711a3a4SMarcel Hlopko       Builder.foldNode(Builder.getRange(ReturnDeclaratorRange),
1027a711a3a4SMarcel Hlopko                        ReturnDeclarator, nullptr);
10287d382dcdSMarcel Hlopko     }
10297d382dcdSMarcel Hlopko 
10307d382dcdSMarcel Hlopko     // Build node for trailing return type.
1031a711a3a4SMarcel Hlopko     auto Return = Builder.getRange(ReturnedType.getSourceRange());
10327d382dcdSMarcel Hlopko     const auto *Arrow = Return.begin() - 1;
10337d382dcdSMarcel Hlopko     assert(Arrow->kind() == tok::arrow);
10347d382dcdSMarcel Hlopko     auto Tokens = llvm::makeArrayRef(Arrow, Return.end());
103542f6fec3SEduardo Caldas     Builder.markChildToken(Arrow, syntax::NodeRole::ArrowToken);
1036a711a3a4SMarcel Hlopko     if (ReturnDeclarator)
1037a711a3a4SMarcel Hlopko       Builder.markChild(ReturnDeclarator,
10387d382dcdSMarcel Hlopko                         syntax::NodeRole::TrailingReturnType_declarator);
1039a711a3a4SMarcel Hlopko     auto *R = new (allocator()) syntax::TrailingReturnType;
1040cdce2fe5SMarcel Hlopko     Builder.foldNode(Tokens, R, L);
1041a711a3a4SMarcel Hlopko     return R;
10427d382dcdSMarcel Hlopko   }
104388bf9b3dSMarcel Hlopko 
1044a711a3a4SMarcel Hlopko   void foldExplicitTemplateInstantiation(
1045a711a3a4SMarcel Hlopko       ArrayRef<syntax::Token> Range, const syntax::Token *ExternKW,
104688bf9b3dSMarcel Hlopko       const syntax::Token *TemplateKW,
1047a711a3a4SMarcel Hlopko       syntax::SimpleDeclaration *InnerDeclaration, Decl *From) {
104888bf9b3dSMarcel Hlopko     assert(!ExternKW || ExternKW->kind() == tok::kw_extern);
104988bf9b3dSMarcel Hlopko     assert(TemplateKW && TemplateKW->kind() == tok::kw_template);
105042f6fec3SEduardo Caldas     Builder.markChildToken(ExternKW, syntax::NodeRole::ExternKeyword);
105188bf9b3dSMarcel Hlopko     Builder.markChildToken(TemplateKW, syntax::NodeRole::IntroducerKeyword);
105288bf9b3dSMarcel Hlopko     Builder.markChild(
105388bf9b3dSMarcel Hlopko         InnerDeclaration,
105488bf9b3dSMarcel Hlopko         syntax::NodeRole::ExplicitTemplateInstantiation_declaration);
1055a711a3a4SMarcel Hlopko     Builder.foldNode(
1056a711a3a4SMarcel Hlopko         Range, new (allocator()) syntax::ExplicitTemplateInstantiation, From);
105788bf9b3dSMarcel Hlopko   }
105888bf9b3dSMarcel Hlopko 
1059a711a3a4SMarcel Hlopko   syntax::TemplateDeclaration *foldTemplateDeclaration(
1060a711a3a4SMarcel Hlopko       ArrayRef<syntax::Token> Range, const syntax::Token *TemplateKW,
1061a711a3a4SMarcel Hlopko       ArrayRef<syntax::Token> TemplatedDeclaration, Decl *From) {
106288bf9b3dSMarcel Hlopko     assert(TemplateKW && TemplateKW->kind() == tok::kw_template);
106388bf9b3dSMarcel Hlopko     Builder.markChildToken(TemplateKW, syntax::NodeRole::IntroducerKeyword);
1064a711a3a4SMarcel Hlopko 
1065a711a3a4SMarcel Hlopko     auto *N = new (allocator()) syntax::TemplateDeclaration;
1066a711a3a4SMarcel Hlopko     Builder.foldNode(Range, N, From);
1067cdce2fe5SMarcel Hlopko     Builder.markChild(N, syntax::NodeRole::TemplateDeclaration_declaration);
1068a711a3a4SMarcel Hlopko     return N;
106988bf9b3dSMarcel Hlopko   }
107088bf9b3dSMarcel Hlopko 
10719b3f38f9SIlya Biryukov   /// A small helper to save some typing.
10729b3f38f9SIlya Biryukov   llvm::BumpPtrAllocator &allocator() { return Builder.allocator(); }
10739b3f38f9SIlya Biryukov 
10749b3f38f9SIlya Biryukov   syntax::TreeBuilder &Builder;
10759b3f38f9SIlya Biryukov   const LangOptions &LangOpts;
10769b3f38f9SIlya Biryukov };
10779b3f38f9SIlya Biryukov } // namespace
10789b3f38f9SIlya Biryukov 
10797d382dcdSMarcel Hlopko void syntax::TreeBuilder::noticeDeclWithoutSemicolon(Decl *D) {
1080e702bdb8SIlya Biryukov   DeclsWithoutSemicolons.insert(D);
1081e702bdb8SIlya Biryukov }
1082e702bdb8SIlya Biryukov 
1083def65bb4SIlya Biryukov void syntax::TreeBuilder::markChildToken(SourceLocation Loc, NodeRole Role) {
10849b3f38f9SIlya Biryukov   if (Loc.isInvalid())
10859b3f38f9SIlya Biryukov     return;
10869b3f38f9SIlya Biryukov   Pending.assignRole(*findToken(Loc), Role);
10879b3f38f9SIlya Biryukov }
10889b3f38f9SIlya Biryukov 
10897d382dcdSMarcel Hlopko void syntax::TreeBuilder::markChildToken(const syntax::Token *T, NodeRole R) {
10907d382dcdSMarcel Hlopko   if (!T)
10917d382dcdSMarcel Hlopko     return;
10927d382dcdSMarcel Hlopko   Pending.assignRole(*T, R);
10937d382dcdSMarcel Hlopko }
10947d382dcdSMarcel Hlopko 
1095a711a3a4SMarcel Hlopko void syntax::TreeBuilder::markChild(syntax::Node *N, NodeRole R) {
1096a711a3a4SMarcel Hlopko   assert(N);
1097a711a3a4SMarcel Hlopko   setRole(N, R);
1098a711a3a4SMarcel Hlopko }
1099a711a3a4SMarcel Hlopko 
1100a711a3a4SMarcel Hlopko void syntax::TreeBuilder::markChild(ASTPtr N, NodeRole R) {
1101a711a3a4SMarcel Hlopko   auto *SN = Mapping.find(N);
1102a711a3a4SMarcel Hlopko   assert(SN != nullptr);
1103a711a3a4SMarcel Hlopko   setRole(SN, R);
11047d382dcdSMarcel Hlopko }
11057d382dcdSMarcel Hlopko 
110658fa50f4SIlya Biryukov void syntax::TreeBuilder::markStmtChild(Stmt *Child, NodeRole Role) {
110758fa50f4SIlya Biryukov   if (!Child)
110858fa50f4SIlya Biryukov     return;
110958fa50f4SIlya Biryukov 
1110b34b7691SDmitri Gribenko   syntax::Tree *ChildNode;
1111b34b7691SDmitri Gribenko   if (Expr *ChildExpr = dyn_cast<Expr>(Child)) {
111258fa50f4SIlya Biryukov     // This is an expression in a statement position, consume the trailing
111358fa50f4SIlya Biryukov     // semicolon and form an 'ExpressionStatement' node.
1114b34b7691SDmitri Gribenko     markExprChild(ChildExpr, NodeRole::ExpressionStatement_expression);
1115a711a3a4SMarcel Hlopko     ChildNode = new (allocator()) syntax::ExpressionStatement;
1116a711a3a4SMarcel Hlopko     // (!) 'getStmtRange()' ensures this covers a trailing semicolon.
1117a711a3a4SMarcel Hlopko     Pending.foldChildren(Arena, getStmtRange(Child), ChildNode);
1118b34b7691SDmitri Gribenko   } else {
1119b34b7691SDmitri Gribenko     ChildNode = Mapping.find(Child);
112058fa50f4SIlya Biryukov   }
1121b34b7691SDmitri Gribenko   assert(ChildNode != nullptr);
1122a711a3a4SMarcel Hlopko   setRole(ChildNode, Role);
112358fa50f4SIlya Biryukov }
112458fa50f4SIlya Biryukov 
112558fa50f4SIlya Biryukov void syntax::TreeBuilder::markExprChild(Expr *Child, NodeRole Role) {
1126be14a22bSIlya Biryukov   if (!Child)
1127be14a22bSIlya Biryukov     return;
1128a711a3a4SMarcel Hlopko   Child = Child->IgnoreImplicit();
1129be14a22bSIlya Biryukov 
1130a711a3a4SMarcel Hlopko   syntax::Tree *ChildNode = Mapping.find(Child);
1131a711a3a4SMarcel Hlopko   assert(ChildNode != nullptr);
1132a711a3a4SMarcel Hlopko   setRole(ChildNode, Role);
113358fa50f4SIlya Biryukov }
113458fa50f4SIlya Biryukov 
11359b3f38f9SIlya Biryukov const syntax::Token *syntax::TreeBuilder::findToken(SourceLocation L) const {
113688bf9b3dSMarcel Hlopko   if (L.isInvalid())
113788bf9b3dSMarcel Hlopko     return nullptr;
1138c1bbefefSIlya Biryukov   auto It = LocationToToken.find(L.getRawEncoding());
1139c1bbefefSIlya Biryukov   assert(It != LocationToToken.end());
1140c1bbefefSIlya Biryukov   return It->second;
11419b3f38f9SIlya Biryukov }
11429b3f38f9SIlya Biryukov 
11439b3f38f9SIlya Biryukov syntax::TranslationUnit *
11449b3f38f9SIlya Biryukov syntax::buildSyntaxTree(Arena &A, const TranslationUnitDecl &TU) {
11459b3f38f9SIlya Biryukov   TreeBuilder Builder(A);
11469b3f38f9SIlya Biryukov   BuildTreeVisitor(TU.getASTContext(), Builder).TraverseAST(TU.getASTContext());
11479b3f38f9SIlya Biryukov   return std::move(Builder).finalize();
11489b3f38f9SIlya Biryukov }
1149