llvm/clang-tools-extra/clangd/DumpAST.cpp
Haojian Wu 6ba1b9075d Reland "[AST] Add a new TemplateKind for template decls found via a using decl.""
This is the template version of https://reviews.llvm.org/D114251.

This patch introduces a new template name kind (UsingTemplateName). The
UsingTemplateName stores the found using-shadow decl (and underlying
template can be retrieved from the using-shadow decl). With the new
template name, we can be able to find the using decl that a template
typeloc (e.g. TemplateSpecializationTypeLoc) found its underlying template,
which is useful for tooling use cases (include cleaner etc).

This patch merely focuses on adding the node to the AST.

Next steps:
- support using-decl in qualified template name;
- update the clangd and other tools to use this new node;
- add ast matchers for matching different kinds of template names;

Differential Revision: https://reviews.llvm.org/D123127
2022-04-14 11:04:55 +02:00

432 lines
16 KiB
C++

//===--- DumpAST.cpp - Serialize clang AST to LSP -------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
#include "DumpAST.h"
#include "Protocol.h"
#include "SourceCode.h"
#include "support/Logger.h"
#include "clang/AST/ASTTypeTraits.h"
#include "clang/AST/Expr.h"
#include "clang/AST/ExprCXX.h"
#include "clang/AST/NestedNameSpecifier.h"
#include "clang/AST/PrettyPrinter.h"
#include "clang/AST/RecursiveASTVisitor.h"
#include "clang/AST/TextNodeDumper.h"
#include "clang/AST/Type.h"
#include "clang/AST/TypeLoc.h"
#include "clang/Basic/Specifiers.h"
#include "clang/Tooling/Syntax/Tokens.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/Support/raw_ostream.h"
namespace clang {
namespace clangd {
namespace {
using llvm::raw_ostream;
template <typename Print> std::string toString(const Print &C) {
std::string Result;
llvm::raw_string_ostream OS(Result);
C(OS);
return std::move(OS.str());
}
bool isInjectedClassName(Decl *D) {
if (const auto *CRD = llvm::dyn_cast<CXXRecordDecl>(D))
return CRD->isInjectedClassName();
return false;
}
class DumpVisitor : public RecursiveASTVisitor<DumpVisitor> {
using Base = RecursiveASTVisitor<DumpVisitor>;
const syntax::TokenBuffer &Tokens;
const ASTContext &Ctx;
// Pointers are into 'children' vector.
// They remain valid because while a node is on the stack we only add
// descendants, not siblings.
std::vector<ASTNode *> Stack;
// Generic logic used to handle traversal of all node kinds.
template <typename T>
bool traverseNodePre(llvm::StringRef Role, const T &Node) {
if (Stack.empty()) {
assert(Root.role.empty());
Stack.push_back(&Root);
} else {
Stack.back()->children.emplace_back();
Stack.push_back(&Stack.back()->children.back());
}
auto &N = *Stack.back();
N.role = Role.str();
N.kind = getKind(Node);
N.detail = getDetail(Node);
N.range = getRange(Node);
N.arcana = getArcana(Node);
return true;
}
bool traverseNodePost() {
assert(!Stack.empty());
Stack.pop_back();
return true;
}
template <typename T, typename Callable>
bool traverseNode(llvm::StringRef Role, const T &Node, const Callable &Body) {
traverseNodePre(Role, Node);
Body();
return traverseNodePost();
}
// Range: most nodes have getSourceRange(), with a couple of exceptions.
// We only return it if it's valid at both ends and there are no macros.
template <typename T> llvm::Optional<Range> getRange(const T &Node) {
SourceRange SR = getSourceRange(Node);
auto Spelled = Tokens.spelledForExpanded(Tokens.expandedTokens(SR));
if (!Spelled)
return llvm::None;
return halfOpenToRange(
Tokens.sourceManager(),
CharSourceRange::getCharRange(Spelled->front().location(),
Spelled->back().endLocation()));
}
template <typename T, typename = decltype(std::declval<T>().getSourceRange())>
SourceRange getSourceRange(const T &Node) {
return Node.getSourceRange();
}
template <typename T,
typename = decltype(std::declval<T *>()->getSourceRange())>
SourceRange getSourceRange(const T *Node) {
return Node->getSourceRange();
}
// TemplateName doesn't have a real Loc node type.
SourceRange getSourceRange(const TemplateName &Node) { return SourceRange(); }
// Attr just uses a weird method name. Maybe we should fix it instead?
SourceRange getSourceRange(const Attr *Node) { return Node->getRange(); }
// Kind is usualy the class name, without the suffix ("Type" etc).
// Where there's a set of variants instead, we use the 'Kind' enum values.
std::string getKind(const Decl *D) { return D->getDeclKindName(); }
std::string getKind(const Stmt *S) {
std::string Result = S->getStmtClassName();
if (llvm::StringRef(Result).endswith("Stmt") ||
llvm::StringRef(Result).endswith("Expr"))
Result.resize(Result.size() - 4);
return Result;
}
std::string getKind(const TypeLoc &TL) {
std::string Result;
if (TL.getTypeLocClass() == TypeLoc::Qualified)
return "Qualified";
return TL.getType()->getTypeClassName();
}
std::string getKind(const TemplateArgumentLoc &TAL) {
switch (TAL.getArgument().getKind()) {
#define TEMPLATE_ARGUMENT_KIND(X) \
case TemplateArgument::X: \
return #X
TEMPLATE_ARGUMENT_KIND(Null);
TEMPLATE_ARGUMENT_KIND(NullPtr);
TEMPLATE_ARGUMENT_KIND(Expression);
TEMPLATE_ARGUMENT_KIND(Integral);
TEMPLATE_ARGUMENT_KIND(Pack);
TEMPLATE_ARGUMENT_KIND(Type);
TEMPLATE_ARGUMENT_KIND(Declaration);
TEMPLATE_ARGUMENT_KIND(Template);
TEMPLATE_ARGUMENT_KIND(TemplateExpansion);
#undef TEMPLATE_ARGUMENT_KIND
}
llvm_unreachable("Unhandled ArgKind enum");
}
std::string getKind(const NestedNameSpecifierLoc &NNSL) {
assert(NNSL.getNestedNameSpecifier());
switch (NNSL.getNestedNameSpecifier()->getKind()) {
#define NNS_KIND(X) \
case NestedNameSpecifier::X: \
return #X
NNS_KIND(Identifier);
NNS_KIND(Namespace);
NNS_KIND(TypeSpec);
NNS_KIND(TypeSpecWithTemplate);
NNS_KIND(Global);
NNS_KIND(Super);
NNS_KIND(NamespaceAlias);
#undef NNS_KIND
}
llvm_unreachable("Unhandled SpecifierKind enum");
}
std::string getKind(const CXXCtorInitializer *CCI) {
if (CCI->isBaseInitializer())
return "BaseInitializer";
if (CCI->isDelegatingInitializer())
return "DelegatingInitializer";
if (CCI->isAnyMemberInitializer())
return "MemberInitializer";
llvm_unreachable("Unhandled CXXCtorInitializer type");
}
std::string getKind(const TemplateName &TN) {
switch (TN.getKind()) {
#define TEMPLATE_KIND(X) \
case TemplateName::X: \
return #X;
TEMPLATE_KIND(Template);
TEMPLATE_KIND(OverloadedTemplate);
TEMPLATE_KIND(AssumedTemplate);
TEMPLATE_KIND(QualifiedTemplate);
TEMPLATE_KIND(DependentTemplate);
TEMPLATE_KIND(SubstTemplateTemplateParm);
TEMPLATE_KIND(SubstTemplateTemplateParmPack);
TEMPLATE_KIND(UsingTemplate);
#undef TEMPLATE_KIND
}
llvm_unreachable("Unhandled NameKind enum");
}
std::string getKind(const Attr *A) {
switch (A->getKind()) {
#define ATTR(X) \
case attr::X: \
return #X;
#include "clang/Basic/AttrList.inc"
#undef ATTR
}
llvm_unreachable("Unhandled attr::Kind enum");
}
std::string getKind(const CXXBaseSpecifier &CBS) {
// There aren't really any variants of CXXBaseSpecifier.
// To avoid special cases in the API/UI, use public/private as the kind.
return getAccessSpelling(CBS.getAccessSpecifier()).str();
}
// Detail is the single most important fact about the node.
// Often this is the name, sometimes a "kind" enum like operators or casts.
// We should avoid unbounded text, like dumping parameter lists.
std::string getDetail(const Decl *D) {
const auto *ND = dyn_cast<NamedDecl>(D);
if (!ND || llvm::isa_and_nonnull<CXXConstructorDecl>(ND->getAsFunction()) ||
isa<CXXDestructorDecl>(ND))
return "";
std::string Name = toString([&](raw_ostream &OS) { ND->printName(OS); });
if (Name.empty())
return "(anonymous)";
return Name;
}
std::string getDetail(const Stmt *S) {
if (const auto *DRE = dyn_cast<DeclRefExpr>(S))
return DRE->getNameInfo().getAsString();
if (const auto *DSDRE = dyn_cast<DependentScopeDeclRefExpr>(S))
return DSDRE->getNameInfo().getAsString();
if (const auto *ME = dyn_cast<MemberExpr>(S))
return ME->getMemberNameInfo().getAsString();
if (const auto *CE = dyn_cast<CastExpr>(S))
return CE->getCastKindName();
if (const auto *BO = dyn_cast<BinaryOperator>(S))
return BO->getOpcodeStr().str();
if (const auto *UO = dyn_cast<UnaryOperator>(S))
return UnaryOperator::getOpcodeStr(UO->getOpcode()).str();
if (const auto *CCO = dyn_cast<CXXConstructExpr>(S))
return CCO->getConstructor()->getNameAsString();
if (const auto *CTE = dyn_cast<CXXThisExpr>(S)) {
bool Const = CTE->getType()->getPointeeType().isLocalConstQualified();
if (CTE->isImplicit())
return Const ? "const, implicit" : "implicit";
if (Const)
return "const";
return "";
}
if (isa<IntegerLiteral, FloatingLiteral, FixedPointLiteral,
CharacterLiteral, ImaginaryLiteral, CXXBoolLiteralExpr>(S))
return toString([&](raw_ostream &OS) {
S->printPretty(OS, nullptr, Ctx.getPrintingPolicy());
});
if (const auto *MTE = dyn_cast<MaterializeTemporaryExpr>(S))
return MTE->isBoundToLvalueReference() ? "lvalue" : "rvalue";
return "";
}
std::string getDetail(const TypeLoc &TL) {
if (TL.getType().hasLocalQualifiers())
return TL.getType().getLocalQualifiers().getAsString(
Ctx.getPrintingPolicy());
if (const auto *TT = dyn_cast<TagType>(TL.getTypePtr()))
return getDetail(TT->getDecl());
if (const auto *DT = dyn_cast<DeducedType>(TL.getTypePtr()))
if (DT->isDeduced())
return DT->getDeducedType().getAsString(Ctx.getPrintingPolicy());
if (const auto *BT = dyn_cast<BuiltinType>(TL.getTypePtr()))
return BT->getName(Ctx.getPrintingPolicy()).str();
if (const auto *TTPT = dyn_cast<TemplateTypeParmType>(TL.getTypePtr()))
return getDetail(TTPT->getDecl());
if (const auto *TT = dyn_cast<TypedefType>(TL.getTypePtr()))
return getDetail(TT->getDecl());
return "";
}
std::string getDetail(const NestedNameSpecifierLoc &NNSL) {
const auto &NNS = *NNSL.getNestedNameSpecifier();
switch (NNS.getKind()) {
case NestedNameSpecifier::Identifier:
return NNS.getAsIdentifier()->getName().str() + "::";
case NestedNameSpecifier::Namespace:
return NNS.getAsNamespace()->getNameAsString() + "::";
case NestedNameSpecifier::NamespaceAlias:
return NNS.getAsNamespaceAlias()->getNameAsString() + "::";
default:
return "";
}
}
std::string getDetail(const CXXCtorInitializer *CCI) {
if (FieldDecl *FD = CCI->getAnyMember())
return getDetail(FD);
if (TypeLoc TL = CCI->getBaseClassLoc())
return getDetail(TL);
return "";
}
std::string getDetail(const TemplateArgumentLoc &TAL) {
if (TAL.getArgument().getKind() == TemplateArgument::Integral)
return toString(TAL.getArgument().getAsIntegral(), 10);
return "";
}
std::string getDetail(const TemplateName &TN) {
return toString([&](raw_ostream &OS) {
TN.print(OS, Ctx.getPrintingPolicy(), TemplateName::Qualified::None);
});
}
std::string getDetail(const Attr *A) {
return A->getAttrName() ? A->getNormalizedFullName() : A->getSpelling();
}
std::string getDetail(const CXXBaseSpecifier &CBS) {
return CBS.isVirtual() ? "virtual" : "";
}
/// Arcana is produced by TextNodeDumper, for the types it supports.
template <typename Dump> std::string dump(const Dump &D) {
return toString([&](raw_ostream &OS) {
TextNodeDumper Dumper(OS, Ctx, /*ShowColors=*/false);
D(Dumper);
});
}
template <typename T> std::string getArcana(const T &N) {
return dump([&](TextNodeDumper &D) { D.Visit(N); });
}
std::string getArcana(const NestedNameSpecifierLoc &NNS) { return ""; }
std::string getArcana(const TemplateName &NNS) { return ""; }
std::string getArcana(const CXXBaseSpecifier &CBS) { return ""; }
std::string getArcana(const TemplateArgumentLoc &TAL) {
return dump([&](TextNodeDumper &D) {
D.Visit(TAL.getArgument(), TAL.getSourceRange());
});
}
std::string getArcana(const TypeLoc &TL) {
return dump([&](TextNodeDumper &D) { D.Visit(TL.getType()); });
}
public:
ASTNode Root;
DumpVisitor(const syntax::TokenBuffer &Tokens, const ASTContext &Ctx)
: Tokens(Tokens), Ctx(Ctx) {}
// Override traversal to record the nodes we care about.
// Generally, these are nodes with position information (TypeLoc, not Type).
bool TraverseDecl(Decl *D) {
return !D || isInjectedClassName(D) ||
traverseNode("declaration", D, [&] { Base::TraverseDecl(D); });
}
bool TraverseTypeLoc(TypeLoc TL) {
return !TL || traverseNode("type", TL, [&] { Base::TraverseTypeLoc(TL); });
}
bool TraverseTemplateName(const TemplateName &TN) {
return traverseNode("template name", TN,
[&] { Base::TraverseTemplateName(TN); });
}
bool TraverseTemplateArgumentLoc(const TemplateArgumentLoc &TAL) {
return traverseNode("template argument", TAL,
[&] { Base::TraverseTemplateArgumentLoc(TAL); });
}
bool TraverseNestedNameSpecifierLoc(NestedNameSpecifierLoc NNSL) {
return !NNSL || traverseNode("specifier", NNSL, [&] {
Base::TraverseNestedNameSpecifierLoc(NNSL);
});
}
bool TraverseConstructorInitializer(CXXCtorInitializer *CCI) {
return !CCI || traverseNode("constructor initializer", CCI, [&] {
Base::TraverseConstructorInitializer(CCI);
});
}
bool TraverseAttr(Attr *A) {
return !A || traverseNode("attribute", A, [&] { Base::TraverseAttr(A); });
}
bool TraverseCXXBaseSpecifier(const CXXBaseSpecifier &CBS) {
return traverseNode("base", CBS,
[&] { Base::TraverseCXXBaseSpecifier(CBS); });
}
// Stmt is the same, but this form allows the data recursion optimization.
bool dataTraverseStmtPre(Stmt *S) {
return S && traverseNodePre(isa<Expr>(S) ? "expression" : "statement", S);
}
bool dataTraverseStmtPost(Stmt *X) { return traverseNodePost(); }
// QualifiedTypeLoc is handled strangely in RecursiveASTVisitor: the derived
// TraverseTypeLoc is not called for the inner UnqualTypeLoc.
// This means we'd never see 'int' in 'const int'! Work around that here.
// (The reason for the behavior is to avoid traversing the nested Type twice,
// but we ignore TraverseType anyway).
bool TraverseQualifiedTypeLoc(QualifiedTypeLoc QTL) {
return TraverseTypeLoc(QTL.getUnqualifiedLoc());
}
// Uninteresting parts of the AST that don't have locations within them.
bool TraverseNestedNameSpecifier(NestedNameSpecifier *) { return true; }
bool TraverseType(QualType) { return true; }
// OpaqueValueExpr blocks traversal, we must explicitly traverse it.
bool TraverseOpaqueValueExpr(OpaqueValueExpr *E) {
return TraverseStmt(E->getSourceExpr());
}
// We only want to traverse the *syntactic form* to understand the selection.
bool TraversePseudoObjectExpr(PseudoObjectExpr *E) {
return TraverseStmt(E->getSyntacticForm());
}
};
} // namespace
ASTNode dumpAST(const DynTypedNode &N, const syntax::TokenBuffer &Tokens,
const ASTContext &Ctx) {
DumpVisitor V(Tokens, Ctx);
// DynTypedNode only works with const, RecursiveASTVisitor only non-const :-(
if (const auto *D = N.get<Decl>())
V.TraverseDecl(const_cast<Decl *>(D));
else if (const auto *S = N.get<Stmt>())
V.TraverseStmt(const_cast<Stmt *>(S));
else if (const auto *NNSL = N.get<NestedNameSpecifierLoc>())
V.TraverseNestedNameSpecifierLoc(
*const_cast<NestedNameSpecifierLoc *>(NNSL));
else if (const auto *NNS = N.get<NestedNameSpecifier>())
V.TraverseNestedNameSpecifier(const_cast<NestedNameSpecifier *>(NNS));
else if (const auto *TL = N.get<TypeLoc>())
V.TraverseTypeLoc(*const_cast<TypeLoc *>(TL));
else if (const auto *QT = N.get<QualType>())
V.TraverseType(*const_cast<QualType *>(QT));
else if (const auto *CCI = N.get<CXXCtorInitializer>())
V.TraverseConstructorInitializer(const_cast<CXXCtorInitializer *>(CCI));
else if (const auto *TAL = N.get<TemplateArgumentLoc>())
V.TraverseTemplateArgumentLoc(*const_cast<TemplateArgumentLoc *>(TAL));
else if (const auto *CBS = N.get<CXXBaseSpecifier>())
V.TraverseCXXBaseSpecifier(*const_cast<CXXBaseSpecifier *>(CBS));
else
elog("dumpAST: unhandled DynTypedNode kind {0}",
N.getNodeKind().asStringRef());
return std::move(V.Root);
}
} // namespace clangd
} // namespace clang