378 lines
10 KiB
C++
378 lines
10 KiB
C++
//===- Tree.cpp -----------------------------------------------*- C++ -*-=====//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
#include "clang/Tooling/Syntax/Tree.h"
|
|
#include "clang/Basic/TokenKinds.h"
|
|
#include "clang/Tooling/Syntax/Nodes.h"
|
|
#include "llvm/ADT/ArrayRef.h"
|
|
#include "llvm/ADT/STLExtras.h"
|
|
#include "llvm/Support/Casting.h"
|
|
#include <cassert>
|
|
|
|
using namespace clang;
|
|
|
|
namespace {
|
|
static void traverse(const syntax::Node *N,
|
|
llvm::function_ref<void(const syntax::Node *)> Visit) {
|
|
if (auto *T = dyn_cast<syntax::Tree>(N)) {
|
|
for (auto *C = T->firstChild(); C; C = C->nextSibling())
|
|
traverse(C, Visit);
|
|
}
|
|
Visit(N);
|
|
}
|
|
static void traverse(syntax::Node *N,
|
|
llvm::function_ref<void(syntax::Node *)> Visit) {
|
|
traverse(static_cast<const syntax::Node *>(N), [&](const syntax::Node *N) {
|
|
Visit(const_cast<syntax::Node *>(N));
|
|
});
|
|
}
|
|
} // namespace
|
|
|
|
syntax::Arena::Arena(SourceManager &SourceMgr, const LangOptions &LangOpts,
|
|
const TokenBuffer &Tokens)
|
|
: SourceMgr(SourceMgr), LangOpts(LangOpts), Tokens(Tokens) {}
|
|
|
|
const syntax::TokenBuffer &syntax::Arena::tokenBuffer() const { return Tokens; }
|
|
|
|
std::pair<FileID, ArrayRef<syntax::Token>>
|
|
syntax::Arena::lexBuffer(std::unique_ptr<llvm::MemoryBuffer> Input) {
|
|
auto FID = SourceMgr.createFileID(std::move(Input));
|
|
auto It = ExtraTokens.try_emplace(FID, tokenize(FID, SourceMgr, LangOpts));
|
|
assert(It.second && "duplicate FileID");
|
|
return {FID, It.first->second};
|
|
}
|
|
|
|
syntax::Leaf::Leaf(const syntax::Token *Tok) : Node(NodeKind::Leaf), Tok(Tok) {
|
|
assert(Tok != nullptr);
|
|
}
|
|
|
|
bool syntax::Leaf::classof(const Node *N) {
|
|
return N->kind() == NodeKind::Leaf;
|
|
}
|
|
|
|
syntax::Node::Node(NodeKind Kind)
|
|
: Parent(nullptr), NextSibling(nullptr), Kind(static_cast<unsigned>(Kind)),
|
|
Role(0), Original(false), CanModify(false) {
|
|
this->setRole(NodeRole::Detached);
|
|
}
|
|
|
|
bool syntax::Node::isDetached() const { return role() == NodeRole::Detached; }
|
|
|
|
void syntax::Node::setRole(NodeRole NR) {
|
|
this->Role = static_cast<unsigned>(NR);
|
|
}
|
|
|
|
bool syntax::Tree::classof(const Node *N) { return N->kind() > NodeKind::Leaf; }
|
|
|
|
void syntax::Tree::prependChildLowLevel(Node *Child, NodeRole Role) {
|
|
assert(Child->role() == NodeRole::Detached);
|
|
assert(Role != NodeRole::Detached);
|
|
|
|
Child->setRole(Role);
|
|
prependChildLowLevel(Child);
|
|
}
|
|
|
|
void syntax::Tree::prependChildLowLevel(Node *Child) {
|
|
assert(Child->Parent == nullptr);
|
|
assert(Child->NextSibling == nullptr);
|
|
assert(Child->role() != NodeRole::Detached);
|
|
|
|
Child->Parent = this;
|
|
Child->NextSibling = this->FirstChild;
|
|
this->FirstChild = Child;
|
|
}
|
|
|
|
void syntax::Tree::replaceChildRangeLowLevel(Node *BeforeBegin, Node *End,
|
|
Node *New) {
|
|
assert(!BeforeBegin || BeforeBegin->Parent == this);
|
|
|
|
#ifndef NDEBUG
|
|
for (auto *N = New; N; N = N->nextSibling()) {
|
|
assert(N->Parent == nullptr);
|
|
assert(N->role() != NodeRole::Detached && "Roles must be set");
|
|
// FIXME: sanity-check the role.
|
|
}
|
|
#endif
|
|
|
|
// Detach old nodes.
|
|
for (auto *N = !BeforeBegin ? FirstChild : BeforeBegin->nextSibling();
|
|
N != End;) {
|
|
auto *Next = N->NextSibling;
|
|
|
|
N->setRole(NodeRole::Detached);
|
|
N->Parent = nullptr;
|
|
N->NextSibling = nullptr;
|
|
if (N->Original)
|
|
traverse(N, [&](Node *C) { C->Original = false; });
|
|
|
|
N = Next;
|
|
}
|
|
|
|
// Attach new nodes.
|
|
if (BeforeBegin)
|
|
BeforeBegin->NextSibling = New ? New : End;
|
|
else
|
|
FirstChild = New ? New : End;
|
|
|
|
if (New) {
|
|
auto *Last = New;
|
|
for (auto *N = New; N != nullptr; N = N->nextSibling()) {
|
|
Last = N;
|
|
N->Parent = this;
|
|
}
|
|
Last->NextSibling = End;
|
|
}
|
|
|
|
// Mark the node as modified.
|
|
for (auto *T = this; T && T->Original; T = T->Parent)
|
|
T->Original = false;
|
|
}
|
|
|
|
namespace {
|
|
static void dumpTokens(raw_ostream &OS, ArrayRef<syntax::Token> Tokens,
|
|
const SourceManager &SM) {
|
|
assert(!Tokens.empty());
|
|
bool First = true;
|
|
for (const auto &T : Tokens) {
|
|
if (!First)
|
|
OS << " ";
|
|
else
|
|
First = false;
|
|
// Handle 'eof' separately, calling text() on it produces an empty string.
|
|
if (T.kind() == tok::eof) {
|
|
OS << "<eof>";
|
|
continue;
|
|
}
|
|
OS << T.text(SM);
|
|
}
|
|
}
|
|
|
|
static void dumpTree(raw_ostream &OS, const syntax::Node *N,
|
|
const syntax::Arena &A, std::vector<bool> IndentMask) {
|
|
std::string Marks;
|
|
if (!N->isOriginal())
|
|
Marks += "M";
|
|
if (N->role() == syntax::NodeRole::Detached)
|
|
Marks += "*"; // FIXME: find a nice way to print other roles.
|
|
if (!N->canModify())
|
|
Marks += "I";
|
|
if (!Marks.empty())
|
|
OS << Marks << ": ";
|
|
|
|
if (auto *L = dyn_cast<syntax::Leaf>(N)) {
|
|
dumpTokens(OS, *L->token(), A.sourceManager());
|
|
OS << "\n";
|
|
return;
|
|
}
|
|
|
|
auto *T = cast<syntax::Tree>(N);
|
|
OS << T->kind() << "\n";
|
|
|
|
for (auto It = T->firstChild(); It != nullptr; It = It->nextSibling()) {
|
|
for (bool Filled : IndentMask) {
|
|
if (Filled)
|
|
OS << "| ";
|
|
else
|
|
OS << " ";
|
|
}
|
|
if (!It->nextSibling()) {
|
|
OS << "`-";
|
|
IndentMask.push_back(false);
|
|
} else {
|
|
OS << "|-";
|
|
IndentMask.push_back(true);
|
|
}
|
|
dumpTree(OS, It, A, IndentMask);
|
|
IndentMask.pop_back();
|
|
}
|
|
}
|
|
} // namespace
|
|
|
|
std::string syntax::Node::dump(const Arena &A) const {
|
|
std::string Str;
|
|
llvm::raw_string_ostream OS(Str);
|
|
dumpTree(OS, this, A, /*IndentMask=*/{});
|
|
return std::move(OS.str());
|
|
}
|
|
|
|
std::string syntax::Node::dumpTokens(const Arena &A) const {
|
|
std::string Storage;
|
|
llvm::raw_string_ostream OS(Storage);
|
|
traverse(this, [&](const syntax::Node *N) {
|
|
auto *L = dyn_cast<syntax::Leaf>(N);
|
|
if (!L)
|
|
return;
|
|
::dumpTokens(OS, *L->token(), A.sourceManager());
|
|
OS << " ";
|
|
});
|
|
return OS.str();
|
|
}
|
|
|
|
void syntax::Node::assertInvariants() const {
|
|
#ifndef NDEBUG
|
|
if (isDetached())
|
|
assert(parent() == nullptr);
|
|
else
|
|
assert(parent() != nullptr);
|
|
|
|
auto *T = dyn_cast<Tree>(this);
|
|
if (!T)
|
|
return;
|
|
for (auto *C = T->firstChild(); C; C = C->nextSibling()) {
|
|
if (T->isOriginal())
|
|
assert(C->isOriginal());
|
|
assert(!C->isDetached());
|
|
assert(C->parent() == T);
|
|
}
|
|
#endif
|
|
}
|
|
|
|
void syntax::Node::assertInvariantsRecursive() const {
|
|
#ifndef NDEBUG
|
|
traverse(this, [&](const syntax::Node *N) { N->assertInvariants(); });
|
|
#endif
|
|
}
|
|
|
|
syntax::Leaf *syntax::Tree::firstLeaf() {
|
|
auto *T = this;
|
|
while (auto *C = T->firstChild()) {
|
|
if (auto *L = dyn_cast<syntax::Leaf>(C))
|
|
return L;
|
|
T = cast<syntax::Tree>(C);
|
|
}
|
|
return nullptr;
|
|
}
|
|
|
|
syntax::Leaf *syntax::Tree::lastLeaf() {
|
|
auto *T = this;
|
|
while (auto *C = T->firstChild()) {
|
|
// Find the last child.
|
|
while (auto *Next = C->nextSibling())
|
|
C = Next;
|
|
|
|
if (auto *L = dyn_cast<syntax::Leaf>(C))
|
|
return L;
|
|
T = cast<syntax::Tree>(C);
|
|
}
|
|
return nullptr;
|
|
}
|
|
|
|
syntax::Node *syntax::Tree::findChild(NodeRole R) {
|
|
for (auto *C = FirstChild; C; C = C->nextSibling()) {
|
|
if (C->role() == R)
|
|
return C;
|
|
}
|
|
return nullptr;
|
|
}
|
|
|
|
std::vector<syntax::List::ElementAndDelimiter<syntax::Node>>
|
|
syntax::List::getElementsAsNodesAndDelimiters() {
|
|
if (!firstChild())
|
|
return {};
|
|
|
|
auto children = std::vector<syntax::List::ElementAndDelimiter<Node>>();
|
|
syntax::Node *elementWithoutDelimiter = nullptr;
|
|
for (auto *C = firstChild(); C; C = C->nextSibling()) {
|
|
switch (C->role()) {
|
|
case syntax::NodeRole::List_element: {
|
|
if (elementWithoutDelimiter) {
|
|
children.push_back({elementWithoutDelimiter, nullptr});
|
|
}
|
|
elementWithoutDelimiter = C;
|
|
break;
|
|
}
|
|
case syntax::NodeRole::List_delimiter: {
|
|
children.push_back({elementWithoutDelimiter, cast<syntax::Leaf>(C)});
|
|
elementWithoutDelimiter = nullptr;
|
|
break;
|
|
}
|
|
default:
|
|
llvm_unreachable(
|
|
"A list can have only elements and delimiters as children.");
|
|
}
|
|
}
|
|
|
|
switch (getTerminationKind()) {
|
|
case syntax::List::TerminationKind::Separated: {
|
|
children.push_back({elementWithoutDelimiter, nullptr});
|
|
break;
|
|
}
|
|
case syntax::List::TerminationKind::Terminated:
|
|
case syntax::List::TerminationKind::MaybeTerminated: {
|
|
if (elementWithoutDelimiter) {
|
|
children.push_back({elementWithoutDelimiter, nullptr});
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
|
|
return children;
|
|
}
|
|
|
|
// Almost the same implementation of `getElementsAsNodesAndDelimiters` but
|
|
// ignoring delimiters
|
|
std::vector<syntax::Node *> syntax::List::getElementsAsNodes() {
|
|
if (!firstChild())
|
|
return {};
|
|
|
|
auto children = std::vector<syntax::Node *>();
|
|
syntax::Node *elementWithoutDelimiter = nullptr;
|
|
for (auto *C = firstChild(); C; C = C->nextSibling()) {
|
|
switch (C->role()) {
|
|
case syntax::NodeRole::List_element: {
|
|
if (elementWithoutDelimiter) {
|
|
children.push_back(elementWithoutDelimiter);
|
|
}
|
|
elementWithoutDelimiter = C;
|
|
break;
|
|
}
|
|
case syntax::NodeRole::List_delimiter: {
|
|
children.push_back(elementWithoutDelimiter);
|
|
elementWithoutDelimiter = nullptr;
|
|
break;
|
|
}
|
|
default:
|
|
llvm_unreachable("A list has only elements or delimiters.");
|
|
}
|
|
}
|
|
|
|
switch (getTerminationKind()) {
|
|
case syntax::List::TerminationKind::Separated: {
|
|
children.push_back(elementWithoutDelimiter);
|
|
break;
|
|
}
|
|
case syntax::List::TerminationKind::Terminated:
|
|
case syntax::List::TerminationKind::MaybeTerminated: {
|
|
if (elementWithoutDelimiter) {
|
|
children.push_back(elementWithoutDelimiter);
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
|
|
return children;
|
|
}
|
|
|
|
// The methods below can't be implemented without information about the derived
|
|
// list. These methods will be implemented by switching on the derived list's
|
|
// `NodeKind`
|
|
|
|
clang::tok::TokenKind syntax::List::getDelimiterTokenKind() {
|
|
llvm_unreachable("There are no subclasses of List, thus "
|
|
"getDelimiterTokenKind() cannot be called");
|
|
}
|
|
|
|
syntax::List::TerminationKind syntax::List::getTerminationKind() {
|
|
llvm_unreachable("There are no subclasses of List, thus getTerminationKind() "
|
|
"cannot be called");
|
|
}
|
|
|
|
bool syntax::List::canBeEmpty() {
|
|
llvm_unreachable(
|
|
"There are no subclasses of List, thus canBeEmpty() cannot be called");
|
|
}
|