14#include "clang/AST/DeclBase.h"
15#include "clang/Basic/SourceLocation.h"
16#include "clang/Basic/SourceManager.h"
17#include "clang/Tooling/Syntax/BuildTree.h"
18#include "clang/Tooling/Syntax/Nodes.h"
19#include "clang/Tooling/Syntax/TokenBufferTokenManager.h"
20#include "clang/Tooling/Syntax/Tree.h"
21#include "llvm/ADT/ArrayRef.h"
22#include "llvm/ADT/StringRef.h"
23#include "llvm/Support/Casting.h"
24#include "llvm/Support/Error.h"
38void addIfDistinct(
const Range &R, std::vector<Range> &Result) {
39 if (Result.empty() || Result.back() != R) {
44std::optional<FoldingRange> toFoldingRange(SourceRange SR,
45 const SourceManager &SM) {
46 const auto Begin = SM.getDecomposedLoc(SR.getBegin()),
47 End = SM.getDecomposedLoc(SR.getEnd());
51 if ((Begin.first != SM.getMainFileID()) || (End.first != SM.getMainFileID()))
54 Range.startCharacter = SM.getColumnNumber(Begin.first, Begin.second) - 1;
55 Range.startLine = SM.getLineNumber(Begin.first, Begin.second) - 1;
56 Range.endCharacter = SM.getColumnNumber(End.first, End.second) - 1;
57 Range.endLine = SM.getLineNumber(End.first, End.second) - 1;
61std::optional<FoldingRange>
62extractFoldingRange(
const syntax::Node *Node,
63 const syntax::TokenBufferTokenManager &TM) {
64 if (
const auto *Stmt = dyn_cast<syntax::CompoundStatement>(Node)) {
65 const auto *LBrace = cast_or_null<syntax::Leaf>(
66 Stmt->findChild(syntax::NodeRole::OpenParen));
70 const auto *RBrace = cast_or_null<syntax::Leaf>(
71 Stmt->findChild(syntax::NodeRole::CloseParen));
72 if (!LBrace || !RBrace)
75 const SourceLocation LBraceLocInfo =
76 TM.getToken(LBrace->getTokenKey())->endLocation(),
78 TM.getToken(RBrace->getTokenKey())->location();
79 auto Range = toFoldingRange(SourceRange(LBraceLocInfo, RBraceLocInfo),
90std::vector<FoldingRange>
91collectFoldingRanges(
const syntax::Node *Root,
92 const syntax::TokenBufferTokenManager &TM) {
93 std::queue<const syntax::Node *> Nodes;
95 std::vector<FoldingRange> Result;
96 while (!Nodes.empty()) {
97 const syntax::Node *Node = Nodes.front();
99 const auto Range = extractFoldingRange(Node, TM);
101 Result.push_back(*
Range);
102 if (
const auto *T = dyn_cast<syntax::Tree>(Node))
103 for (
const auto *NextNode =
T->getFirstChild(); NextNode;
104 NextNode = NextNode->getNextSibling())
105 Nodes.push(NextNode);
113 std::vector<Range> Ranges;
114 const auto &SM =
AST.getSourceManager();
115 const auto &LangOpts =
AST.getLangOpts();
117 auto FID = SM.getMainFileID();
120 return Offset.takeError();
125 AST.getASTContext(),
AST.getTokens(), *Offset, *Offset);
128 if (
const Decl *D = Node->ASTNode.get<Decl>()) {
129 if (llvm::isa<TranslationUnitDecl>(D)) {
135 if (!SR || SM.getFileID(SR->getBegin()) != SM.getMainFileID()) {
141 addIfDistinct(R, Ranges);
144 if (Ranges.empty()) {
149 return std::move(
Empty);
154 Head.range = std::move(Ranges.front());
157 llvm::MutableArrayRef(Ranges.data(), Ranges.size()).drop_front()) {
158 Tail->parent = std::make_unique<SelectionRange>();
163 return std::move(
Head);
172 syntax::TokenBufferTokenManager TM(
AST.getTokens(),
AST.getLangOpts(),
173 AST.getSourceManager());
174 const auto *SyntaxTree = syntax::buildSyntaxTree(A, TM,
AST.getASTContext());
175 return collectFoldingRanges(SyntaxTree, TM);
181llvm::Expected<std::vector<FoldingRange>>
185 auto DirectiveStructure = DirectiveTree::parse(OrigStream);
188 std::vector<FoldingRange> Result;
190 llvm::StringLiteral Kind) {
191 if (Start.
line >= End.line)
198 FR.
kind = Kind.str();
199 Result.push_back(FR);
201 auto OriginalToken = [&](
const Token &T) {
202 return OrigStream.tokens()[T.OriginalIndex];
204 auto StartOffset = [&](
const Token &T) {
205 return OriginalToken(T).text().data() - Code.data();
207 auto StartPosition = [&](
const Token &T) {
210 auto EndOffset = [&](
const Token &T) {
211 return StartOffset(T) + OriginalToken(T).Length;
213 auto EndPosition = [&](
const Token &T) {
219 for (
const auto &R : PPRanges) {
220 auto BTok = OrigStream.tokens()[R.Begin];
221 auto ETok = OrigStream.tokens()[R.End];
222 if (ETok.Kind == tok::eof)
224 if (BTok.Line >= ETok.Line)
235 auto Preprocessed = DirectiveStructure.stripDirectives(OrigStream);
240 auto Tokens = ParseableStream.tokens();
243 for (
const auto &Tok : Tokens) {
244 if (
auto *Paired = Tok.pair()) {
247 if (Tok.Line < Paired->Line) {
249 Position End = StartPosition(*Paired);
256 auto IsBlockComment = [&](
const Token &T) {
257 assert(T.Kind == tok::comment);
258 return OriginalToken(T).Length >= 2 &&
259 Code.substr(StartOffset(T), 2) ==
"/*";
263 for (
auto *T = Tokens.begin(); T != Tokens.end();) {
264 if (T->Kind != tok::comment) {
268 Token *FirstComment = T;
271 Token *LastComment = T;
273 while (T != Tokens.end() && T->Kind == tok::comment &&
274 StartPosition(*T).line <= End.
line + 1) {
275 End = EndPosition(*T);
279 if (IsBlockComment(*FirstComment)) {
283 if (IsBlockComment(*LastComment))
Stores and provides access to parsed AST.
static SelectionTree createRight(ASTContext &AST, const syntax::TokenBuffer &Tokens, unsigned Begin, unsigned End)
const Node * commonAncestor() const
FIXME: Skip testing on Windows temporarily due to the different escaping code mode.
std::optional< SourceRange > toHalfOpenFileRange(const SourceManager &SM, const LangOptions &LangOpts, SourceRange R)
Turns a token range into a half-open range and checks its correctness.
Position offsetToPosition(llvm::StringRef Code, size_t Offset)
Turn an offset in Code into a [line, column] pair.
static void lex(llvm::StringRef Code, const LangOptions &LangOpts, llvm::function_ref< void(const syntax::Token &, const SourceManager &SM)> Action)
llvm::Expected< std::vector< FoldingRange > > getFoldingRanges(ParsedAST &AST)
Returns a list of ranges whose contents might be collapsible in an editor.
std::vector< Token::Range > pairDirectiveRanges(const DirectiveTree &Tree, const TokenStream &Code)
Pairs preprocessor conditional directives and computes their token ranges.
Position sourceLocToPosition(const SourceManager &SM, SourceLocation Loc)
Turn a SourceLocation into a [line, column] pair.
llvm::Expected< SelectionRange > getSemanticRanges(ParsedAST &AST, Position Pos)
Returns the list of all interesting ranges around the Position Pos.
clang::LangOptions genericLangOpts(clang::Language Lang, clang::LangStandard::Kind Standard)
Generic language options suitable for lexing/parsing a language.
void chooseConditionalBranches(DirectiveTree &Tree, const TokenStream &Code)
Describes the structure of a source file, as seen by the preprocessor.
llvm::Expected< size_t > positionToOffset(llvm::StringRef Code, Position P, bool AllowColumnsBeyondLineLength)
Turn a [line, column] pair into an offset in Code.
TokenStream cook(const TokenStream &Code, const LangOptions &LangOpts)
void pairBrackets(TokenStream &Stream)
Identifies bracket token in the stream which should be paired.
//===-- Representation.cpp - ClangDoc Representation -----------*- C++ -*-===//
Stores information about a region of code that can be folded.
static const llvm::StringLiteral REGION_KIND
static const llvm::StringLiteral COMMENT_KIND
int line
Line position in a document (zero-based).
int character
Character offset on a line in a document (zero-based).
Position start
The range's start position.
Position end
The range's end position.
A single C++ or preprocessor token.