doxygen/ASTMatchers_2Dynamic_2Parser_8cpp_source.html

//===- Parser.cpp - Matcher expression parser -----------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

///

/// \file

/// Recursive parser implementation for the matcher expression grammar.

///

//===----------------------------------------------------------------------===//


#include "clang/ASTMatchers/Dynamic/Parser.h"

#include "clang/ASTMatchers/ASTMatchersInternal.h"

#include "clang/ASTMatchers/Dynamic/Diagnostics.h"

#include "clang/ASTMatchers/Dynamic/Registry.h"

#include "clang/Basic/CharInfo.h"

#include "llvm/ADT/StringRef.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/ManagedStatic.h"

#include <cassert>

#include <cerrno>

#include <cstddef>

#include <cstdlib>

#include <optional>

#include <string>

#include <utility>

#include <vector>


namespace clang {

namespace ast_matchers {

namespace dynamic {


/// Simple structure to hold information for one token from the parser.


struct Parser::TokenInfo {

  /// Different possible tokens.


  enum TokenKind {

    TK_Eof,

    TK_NewLine,

    TK_OpenParen,

    TK_CloseParen,

    TK_Comma,

    TK_Period,

    TK_Literal,

    TK_Ident,

    TK_InvalidChar,

    TK_Error,

    TK_CodeCompletion

  };


  /// Some known identifiers.

  static const char* const ID_Bind;

  static const char *const ID_With;


  TokenInfo() = default;


  StringRef Text;

  TokenKind Kind = TK_Eof;

  SourceRange Range;

  VariantValue Value;

};


const char* const Parser::TokenInfo::ID_Bind = "bind";

const char *const Parser::TokenInfo::ID_With = "with";


/// Simple tokenizer for the parser.


class Parser::CodeTokenizer {

public:


  explicit CodeTokenizer(StringRef &MatcherCode, Diagnostics *Error)

      : Code(MatcherCode), StartOfLine(MatcherCode), Error(Error) {

    NextToken = getNextToken();

  }


  CodeTokenizer(StringRef &MatcherCode, Diagnostics *Error,

                unsigned CodeCompletionOffset)

      : Code(MatcherCode), StartOfLine(MatcherCode), Error(Error),

        CodeCompletionLocation(MatcherCode.data() + CodeCompletionOffset) {

    NextToken = getNextToken();

  }


  /// Returns but doesn't consume the next token.

  const TokenInfo &peekNextToken() const { return NextToken; }


  /// Consumes and returns the next token.


  TokenInfo consumeNextToken() {

    TokenInfo ThisToken = NextToken;

    NextToken = getNextToken();

    return ThisToken;

  }


  TokenInfo SkipNewlines() {

    while (NextToken.Kind == TokenInfo::TK_NewLine)

      NextToken = getNextToken();

    return NextToken;

  }


  TokenInfo consumeNextTokenIgnoreNewlines() {

    SkipNewlines();

    if (NextToken.Kind == TokenInfo::TK_Eof)

      return NextToken;

    return consumeNextToken();

  }


  TokenInfo::TokenKind nextTokenKind() const { return NextToken.Kind; }


private:

  TokenInfo getNextToken() {

    consumeWhitespace();

    TokenInfo Result;

    Result.Range.Start = currentLocation();


    if (CodeCompletionLocation && CodeCompletionLocation <= Code.data()) {

      Result.Kind = TokenInfo::TK_CodeCompletion;

      Result.Text = StringRef(CodeCompletionLocation, 0);

      CodeCompletionLocation = nullptr;

      return Result;

    }


    if (Code.empty()) {

      Result.Kind = TokenInfo::TK_Eof;

      Result.Text = "";

      return Result;

    }


    switch (Code[0]) {

    case '#':

      Code = Code.drop_until([](char c) { return c == '\n'; });

      return getNextToken();

    case ',':

      Result.Kind = TokenInfo::TK_Comma;

      Result.Text = Code.substr(0, 1);

      Code = Code.drop_front();

      break;

    case '.':

      Result.Kind = TokenInfo::TK_Period;

      Result.Text = Code.substr(0, 1);

      Code = Code.drop_front();

      break;

    case '\n':

      ++Line;

      StartOfLine = Code.drop_front();

      Result.Kind = TokenInfo::TK_NewLine;

      Result.Text = Code.substr(0, 1);

      Code = Code.drop_front();

      break;

    case '(':

      Result.Kind = TokenInfo::TK_OpenParen;

      Result.Text = Code.substr(0, 1);

      Code = Code.drop_front();

      break;

    case ')':

      Result.Kind = TokenInfo::TK_CloseParen;

      Result.Text = Code.substr(0, 1);

      Code = Code.drop_front();

      break;


    case '"':

    case '\'':

      // Parse a string literal.

      consumeStringLiteral(&Result);

      break;


    case '0': case '1': case '2': case '3': case '4':

    case '5': case '6': case '7': case '8': case '9':

      // Parse an unsigned and float literal.

      consumeNumberLiteral(&Result);

      break;


    default:

      if (isAlphanumeric(Code[0])) {

        // Parse an identifier

        size_t TokenLength = 1;

        while (true) {

          // A code completion location in/immediately after an identifier will

          // cause the portion of the identifier before the code completion

          // location to become a code completion token.

          if (CodeCompletionLocation == Code.data() + TokenLength) {

            CodeCompletionLocation = nullptr;

            Result.Kind = TokenInfo::TK_CodeCompletion;

            Result.Text = Code.substr(0, TokenLength);

            Code = Code.drop_front(TokenLength);

            return Result;

          }

          if (TokenLength == Code.size() || !isAlphanumeric(Code[TokenLength]))

            break;

          ++TokenLength;

        }

        if (TokenLength == 4 && Code.starts_with("true")) {

          Result.Kind = TokenInfo::TK_Literal;

          Result.Value = true;

        } else if (TokenLength == 5 && Code.starts_with("false")) {

          Result.Kind = TokenInfo::TK_Literal;

          Result.Value = false;

        } else {

          Result.Kind = TokenInfo::TK_Ident;

          Result.Text = Code.substr(0, TokenLength);

        }

        Code = Code.drop_front(TokenLength);

      } else {

        Result.Kind = TokenInfo::TK_InvalidChar;

        Result.Text = Code.substr(0, 1);

        Code = Code.drop_front(1);

      }

      break;

    }


    Result.Range.End = currentLocation();

    return Result;

  }


  /// Consume an unsigned and float literal.

  void consumeNumberLiteral(TokenInfo *Result) {

    bool isFloatingLiteral = false;

    unsigned Length = 1;

    if (Code.size() > 1) {

      // Consume the 'x' or 'b' radix modifier, if present.

      switch (toLowercase(Code[1])) {

      case 'x': case 'b': Length = 2;

      }

    }

    while (Length < Code.size() && isHexDigit(Code[Length]))

      ++Length;


    // Try to recognize a floating point literal.

    while (Length < Code.size()) {

      char c = Code[Length];

      if (c == '-' || c == '+' || c == '.' || isHexDigit(c)) {

        isFloatingLiteral = true;

        Length++;

      } else {

        break;

      }

    }


    Result->Text = Code.substr(0, Length);

    Code = Code.drop_front(Length);


    if (isFloatingLiteral) {

      char *end;

      errno = 0;

      std::string Text = Result->Text.str();

      double doubleValue = strtod(Text.c_str(), &end);

      if (*end == 0 && errno == 0) {

        Result->Kind = TokenInfo::TK_Literal;

        Result->Value = doubleValue;

        return;

      }

    } else {

      unsigned Value;

      if (!Result->Text.getAsInteger(0, Value)) {

        Result->Kind = TokenInfo::TK_Literal;

        Result->Value = Value;

        return;

      }

    }


    SourceRange Range;

    Range.Start = Result->Range.Start;

    Range.End = currentLocation();

    Error->addError(Range, Error->ET_ParserNumberError) << Result->Text;

    Result->Kind = TokenInfo::TK_Error;

  }


  /// Consume a string literal.

  ///

  /// \c Code must be positioned at the start of the literal (the opening

  /// quote). Consumed until it finds the same closing quote character.

  void consumeStringLiteral(TokenInfo *Result) {

    bool InEscape = false;

    const char Marker = Code[0];

    for (size_t Length = 1, Size = Code.size(); Length != Size; ++Length) {

      if (InEscape) {

        InEscape = false;

        continue;

      }

      if (Code[Length] == '\\') {

        InEscape = true;

        continue;

      }

      if (Code[Length] == Marker) {

        Result->Kind = TokenInfo::TK_Literal;

        Result->Text = Code.substr(0, Length + 1);

        Result->Value = Code.substr(1, Length - 1);

        Code = Code.drop_front(Length + 1);

        return;

      }

    }


    StringRef ErrorText = Code;

    Code = Code.drop_front(Code.size());

    SourceRange Range;

    Range.Start = Result->Range.Start;

    Range.End = currentLocation();

    Error->addError(Range, Error->ET_ParserStringError) << ErrorText;

    Result->Kind = TokenInfo::TK_Error;

  }


  /// Consume all leading whitespace from \c Code.

  void consumeWhitespace() {

    // Don't trim newlines.

    Code = Code.ltrim(" \t\v\f\r");

  }


  SourceLocation currentLocation() {

    SourceLocation Location;

    Location.Line = Line;

    Location.Column = Code.data() - StartOfLine.data() + 1;

    return Location;

  }


  StringRef &Code;

  StringRef StartOfLine;

  unsigned Line = 1;

  Diagnostics *Error;

  TokenInfo NextToken;

  const char *CodeCompletionLocation = nullptr;

};


Parser::Sema::~Sema() = default;


std::vector<ArgKind> Parser::Sema::getAcceptedCompletionTypes(

    llvm::ArrayRef<std::pair<MatcherCtor, unsigned>> Context) {

  return {};

}


std::vector<MatcherCompletion>


Parser::Sema::getMatcherCompletions(llvm::ArrayRef<ArgKind> AcceptedTypes) {

  return {};

}


struct Parser::ScopedContextEntry {

  Parser *P;


  ScopedContextEntry(Parser *P, MatcherCtor C) : P(P) {

    P->ContextStack.push_back(std::make_pair(C, 0u));

  }


  ~ScopedContextEntry() {

    P->ContextStack.pop_back();

  }


  void nextArg() {

    ++P->ContextStack.back().second;

  }


};


/// Parse expressions that start with an identifier.

///

/// This function can parse named values and matchers.

/// In case of failure it will try to determine the user's intent to give

/// an appropriate error message.

bool Parser::parseIdentifierPrefixImpl(VariantValue *Value) {

  const TokenInfo NameToken = Tokenizer->consumeNextToken();


  if (Tokenizer->nextTokenKind() != TokenInfo::TK_OpenParen) {

    // Parse as a named value.

    if (const VariantValue NamedValue =

            NamedValues ? NamedValues->lookup(NameToken.Text)

                        : VariantValue()) {


      if (Tokenizer->nextTokenKind() != TokenInfo::TK_Period) {

        *Value = NamedValue;

        return true;

      }


      std::string BindID;

      Tokenizer->consumeNextToken();

      TokenInfo ChainCallToken = Tokenizer->consumeNextToken();

      if (ChainCallToken.Kind == TokenInfo::TK_CodeCompletion) {

        addCompletion(ChainCallToken, MatcherCompletion("bind(\"", "bind", 1));

        return false;

      }


      if (ChainCallToken.Kind != TokenInfo::TK_Ident ||

          (ChainCallToken.Text != TokenInfo::ID_Bind &&

           ChainCallToken.Text != TokenInfo::ID_With)) {

        Error->addError(ChainCallToken.Range,

                        Error->ET_ParserMalformedChainedExpr);

        return false;

      }

      if (ChainCallToken.Text == TokenInfo::ID_With) {


        Diagnostics::Context Ctx(Diagnostics::Context::ConstructMatcher, Error,

                                 NameToken.Text, NameToken.Range);


        Error->addError(ChainCallToken.Range,

                        Error->ET_RegistryMatcherNoWithSupport);

        return false;

      }

      if (!parseBindID(BindID))

        return false;


      assert(NamedValue.isMatcher());

      std::optional<DynTypedMatcher> Result =

          NamedValue.getMatcher().getSingleMatcher();

      if (Result) {

        std::optional<DynTypedMatcher> Bound = Result->tryBind(BindID);

        if (Bound) {

          *Value = VariantMatcher::SingleMatcher(*Bound);

          return true;

        }

      }

      return false;

    }


    if (Tokenizer->nextTokenKind() == TokenInfo::TK_NewLine) {

      Error->addError(Tokenizer->peekNextToken().Range,

                      Error->ET_ParserNoOpenParen)

          << "NewLine";

      return false;

    }


    // If the syntax is correct and the name is not a matcher either, report

    // unknown named value.

    if ((Tokenizer->nextTokenKind() == TokenInfo::TK_Comma ||

         Tokenizer->nextTokenKind() == TokenInfo::TK_CloseParen ||

         Tokenizer->nextTokenKind() == TokenInfo::TK_NewLine ||

         Tokenizer->nextTokenKind() == TokenInfo::TK_Eof) &&

        !S->lookupMatcherCtor(NameToken.Text)) {

      Error->addError(NameToken.Range, Error->ET_RegistryValueNotFound)

          << NameToken.Text;

      return false;

    }

    // Otherwise, fallback to the matcher parser.

  }


  Tokenizer->SkipNewlines();


  assert(NameToken.Kind == TokenInfo::TK_Ident);

  TokenInfo OpenToken = Tokenizer->consumeNextToken();

  if (OpenToken.Kind != TokenInfo::TK_OpenParen) {

    Error->addError(OpenToken.Range, Error->ET_ParserNoOpenParen)

        << OpenToken.Text;

    return false;

  }


  std::optional<MatcherCtor> Ctor = S->lookupMatcherCtor(NameToken.Text);


  // Parse as a matcher expression.

  return parseMatcherExpressionImpl(NameToken, OpenToken, Ctor, Value);

}


bool Parser::parseBindID(std::string &BindID) {

  // Parse the parenthesized argument to .bind("foo")

  const TokenInfo OpenToken = Tokenizer->consumeNextToken();

  const TokenInfo IDToken = Tokenizer->consumeNextTokenIgnoreNewlines();

  const TokenInfo CloseToken = Tokenizer->consumeNextTokenIgnoreNewlines();


  // TODO: We could use different error codes for each/some to be more

  //       explicit about the syntax error.

  if (OpenToken.Kind != TokenInfo::TK_OpenParen) {

    Error->addError(OpenToken.Range, Error->ET_ParserMalformedBindExpr);

    return false;

  }

  if (IDToken.Kind != TokenInfo::TK_Literal || !IDToken.Value.isString()) {

    Error->addError(IDToken.Range, Error->ET_ParserMalformedBindExpr);

    return false;

  }

  if (CloseToken.Kind != TokenInfo::TK_CloseParen) {

    Error->addError(CloseToken.Range, Error->ET_ParserMalformedBindExpr);

    return false;

  }

  BindID = IDToken.Value.getString();

  return true;

}


bool Parser::parseMatcherBuilder(MatcherCtor Ctor, const TokenInfo &NameToken,

                                 const TokenInfo &OpenToken,

                                 VariantValue *Value) {

  std::vector<ParserValue> Args;

  TokenInfo EndToken;


  Tokenizer->SkipNewlines();


  {

    ScopedContextEntry SCE(this, Ctor);


    while (Tokenizer->nextTokenKind() != TokenInfo::TK_Eof) {

      if (Tokenizer->nextTokenKind() == TokenInfo::TK_CloseParen) {

        // End of args.

        EndToken = Tokenizer->consumeNextToken();

        break;

      }

      if (!Args.empty()) {

        // We must find a , token to continue.

        TokenInfo CommaToken = Tokenizer->consumeNextToken();

        if (CommaToken.Kind != TokenInfo::TK_Comma) {

          Error->addError(CommaToken.Range, Error->ET_ParserNoComma)

              << CommaToken.Text;

          return false;

        }

        // Allow for a trailing , token and possibly a new line.

        Tokenizer->SkipNewlines();

        if (Tokenizer->nextTokenKind() == TokenInfo::TK_CloseParen) {

          continue;

        }

      }


      Diagnostics::Context Ctx(Diagnostics::Context::MatcherArg, Error,

                               NameToken.Text, NameToken.Range,

                               Args.size() + 1);

      ParserValue ArgValue;

      Tokenizer->SkipNewlines();


      if (Tokenizer->peekNextToken().Kind == TokenInfo::TK_CodeCompletion) {

        addExpressionCompletions();

        return false;

      }


      TokenInfo NodeMatcherToken = Tokenizer->consumeNextToken();


      if (NodeMatcherToken.Kind != TokenInfo::TK_Ident) {

        Error->addError(NameToken.Range, Error->ET_ParserFailedToBuildMatcher)

            << NameToken.Text;

        return false;

      }


      ArgValue.Text = NodeMatcherToken.Text;

      ArgValue.Range = NodeMatcherToken.Range;


      std::optional<MatcherCtor> MappedMatcher =

          S->lookupMatcherCtor(ArgValue.Text);


      if (!MappedMatcher) {

        Error->addError(NodeMatcherToken.Range,

                        Error->ET_RegistryMatcherNotFound)

            << NodeMatcherToken.Text;

        return false;

      }


      ASTNodeKind NK = S->nodeMatcherType(*MappedMatcher);


      if (NK.isNone()) {

        Error->addError(NodeMatcherToken.Range,

                        Error->ET_RegistryNonNodeMatcher)

            << NodeMatcherToken.Text;

        return false;

      }


      ArgValue.Value = NK;


      Tokenizer->SkipNewlines();

      Args.push_back(ArgValue);


      SCE.nextArg();

    }

  }


  if (EndToken.Kind == TokenInfo::TK_Eof) {

    Error->addError(OpenToken.Range, Error->ET_ParserNoCloseParen);

    return false;

  }


  internal::MatcherDescriptorPtr BuiltCtor =

      S->buildMatcherCtor(Ctor, NameToken.Range, Args, Error);


  if (!BuiltCtor.get()) {

    Error->addError(NameToken.Range, Error->ET_ParserFailedToBuildMatcher)

        << NameToken.Text;

    return false;

  }


  std::string BindID;

  if (Tokenizer->peekNextToken().Kind == TokenInfo::TK_Period) {

    Tokenizer->consumeNextToken();

    TokenInfo ChainCallToken = Tokenizer->consumeNextToken();

    if (ChainCallToken.Kind == TokenInfo::TK_CodeCompletion) {

      addCompletion(ChainCallToken, MatcherCompletion("bind(\"", "bind", 1));

      addCompletion(ChainCallToken, MatcherCompletion("with(", "with", 1));

      return false;

    }

    if (ChainCallToken.Kind != TokenInfo::TK_Ident ||

        (ChainCallToken.Text != TokenInfo::ID_Bind &&

         ChainCallToken.Text != TokenInfo::ID_With)) {

      Error->addError(ChainCallToken.Range,

                      Error->ET_ParserMalformedChainedExpr);

      return false;

    }

    if (ChainCallToken.Text == TokenInfo::ID_Bind) {

      if (!parseBindID(BindID))

        return false;

      Diagnostics::Context Ctx(Diagnostics::Context::ConstructMatcher, Error,

                               NameToken.Text, NameToken.Range);

      SourceRange MatcherRange = NameToken.Range;

      MatcherRange.End = ChainCallToken.Range.End;

      VariantMatcher Result = S->actOnMatcherExpression(

          BuiltCtor.get(), MatcherRange, BindID, {}, Error);

      if (Result.isNull())

        return false;


      *Value = Result;

      return true;

    } else if (ChainCallToken.Text == TokenInfo::ID_With) {

      Tokenizer->SkipNewlines();


      if (Tokenizer->nextTokenKind() != TokenInfo::TK_OpenParen) {

        StringRef ErrTxt = Tokenizer->nextTokenKind() == TokenInfo::TK_Eof

                               ? StringRef("EOF")

                               : Tokenizer->peekNextToken().Text;

        Error->addError(Tokenizer->peekNextToken().Range,

                        Error->ET_ParserNoOpenParen)

            << ErrTxt;

        return false;

      }


      TokenInfo WithOpenToken = Tokenizer->consumeNextToken();


      return parseMatcherExpressionImpl(NameToken, WithOpenToken,

                                        BuiltCtor.get(), Value);

    }

  }


  Diagnostics::Context Ctx(Diagnostics::Context::ConstructMatcher, Error,

                           NameToken.Text, NameToken.Range);

  SourceRange MatcherRange = NameToken.Range;

  MatcherRange.End = EndToken.Range.End;

  VariantMatcher Result = S->actOnMatcherExpression(

      BuiltCtor.get(), MatcherRange, BindID, {}, Error);

  if (Result.isNull())

    return false;


  *Value = Result;

  return true;

}


/// Parse and validate a matcher expression.

/// \return \c true on success, in which case \c Value has the matcher parsed.

///   If the input is malformed, or some argument has an error, it

///   returns \c false.

bool Parser::parseMatcherExpressionImpl(const TokenInfo &NameToken,

                                        const TokenInfo &OpenToken,

                                        std::optional<MatcherCtor> Ctor,

                                        VariantValue *Value) {

  if (!Ctor) {

    Error->addError(NameToken.Range, Error->ET_RegistryMatcherNotFound)

        << NameToken.Text;

    // Do not return here. We need to continue to give completion suggestions.

  }


  if (Ctor && *Ctor && S->isBuilderMatcher(*Ctor))

    return parseMatcherBuilder(*Ctor, NameToken, OpenToken, Value);


  std::vector<ParserValue> Args;

  TokenInfo EndToken;


  Tokenizer->SkipNewlines();


  {

    ScopedContextEntry SCE(this, Ctor.value_or(nullptr));


    while (Tokenizer->nextTokenKind() != TokenInfo::TK_Eof) {

      if (Tokenizer->nextTokenKind() == TokenInfo::TK_CloseParen) {

        // End of args.

        EndToken = Tokenizer->consumeNextToken();

        break;

      }

      if (!Args.empty()) {

        // We must find a , token to continue.

        const TokenInfo CommaToken = Tokenizer->consumeNextToken();

        if (CommaToken.Kind != TokenInfo::TK_Comma) {

          Error->addError(CommaToken.Range, Error->ET_ParserNoComma)

              << CommaToken.Text;

          return false;

        }

        // Allow for a trailing , token and possibly a new line.

        Tokenizer->SkipNewlines();

        if (Tokenizer->nextTokenKind() == TokenInfo::TK_CloseParen) {

          continue;

        }

      }


      Diagnostics::Context Ctx(Diagnostics::Context::MatcherArg, Error,

                               NameToken.Text, NameToken.Range,

                               Args.size() + 1);

      ParserValue ArgValue;

      Tokenizer->SkipNewlines();

      ArgValue.Text = Tokenizer->peekNextToken().Text;

      ArgValue.Range = Tokenizer->peekNextToken().Range;

      if (!parseExpressionImpl(&ArgValue.Value)) {

        return false;

      }


      Tokenizer->SkipNewlines();

      Args.push_back(ArgValue);

      SCE.nextArg();

    }

  }


  if (EndToken.Kind == TokenInfo::TK_Eof) {

    Error->addError(OpenToken.Range, Error->ET_ParserNoCloseParen);

    return false;

  }


  std::string BindID;

  if (Tokenizer->peekNextToken().Kind == TokenInfo::TK_Period) {

    Tokenizer->consumeNextToken();

    TokenInfo ChainCallToken = Tokenizer->consumeNextToken();

    if (ChainCallToken.Kind == TokenInfo::TK_CodeCompletion) {

      addCompletion(ChainCallToken, MatcherCompletion("bind(\"", "bind", 1));

      return false;

    }


    if (ChainCallToken.Kind != TokenInfo::TK_Ident) {

      Error->addError(ChainCallToken.Range,

                      Error->ET_ParserMalformedChainedExpr);

      return false;

    }

    if (ChainCallToken.Text == TokenInfo::ID_With) {


      Diagnostics::Context Ctx(Diagnostics::Context::ConstructMatcher, Error,

                               NameToken.Text, NameToken.Range);


      Error->addError(ChainCallToken.Range,

                      Error->ET_RegistryMatcherNoWithSupport);

      return false;

    }

    if (ChainCallToken.Text != TokenInfo::ID_Bind) {

      Error->addError(ChainCallToken.Range,

                      Error->ET_ParserMalformedChainedExpr);

      return false;

    }

    if (!parseBindID(BindID))

      return false;

  }


  if (!Ctor)

    return false;


  // Merge the start and end infos.

  Diagnostics::Context Ctx(Diagnostics::Context::ConstructMatcher, Error,

                           NameToken.Text, NameToken.Range);

  SourceRange MatcherRange = NameToken.Range;

  MatcherRange.End = EndToken.Range.End;

  VariantMatcher Result = S->actOnMatcherExpression(

      *Ctor, MatcherRange, BindID, Args, Error);

  if (Result.isNull()) return false;


  *Value = Result;

  return true;

}


// If the prefix of this completion matches the completion token, add it to

// Completions minus the prefix.

void Parser::addCompletion(const TokenInfo &CompToken,

                           const MatcherCompletion& Completion) {

  if (StringRef(Completion.TypedText).starts_with(CompToken.Text) &&

      Completion.Specificity > 0) {

    Completions.emplace_back(Completion.TypedText.substr(CompToken.Text.size()),

                             Completion.MatcherDecl, Completion.Specificity);

  }

}


std::vector<MatcherCompletion> Parser::getNamedValueCompletions(

    ArrayRef<ArgKind> AcceptedTypes) {

  if (!NamedValues) return std::vector<MatcherCompletion>();

  std::vector<MatcherCompletion> Result;

  for (const auto &Entry : *NamedValues) {

    unsigned Specificity;

    if (Entry.getValue().isConvertibleTo(AcceptedTypes, &Specificity)) {

      std::string Decl =

          (Entry.getValue().getTypeAsString() + " " + Entry.getKey()).str();

      Result.emplace_back(Entry.getKey(), Decl, Specificity);

    }

  }

  return Result;

}


void Parser::addExpressionCompletions() {

  const TokenInfo CompToken = Tokenizer->consumeNextTokenIgnoreNewlines();

  assert(CompToken.Kind == TokenInfo::TK_CodeCompletion);


  // We cannot complete code if there is an invalid element on the context

  // stack.

  for (ContextStackTy::iterator I = ContextStack.begin(),

                                E = ContextStack.end();

       I != E; ++I) {

    if (!I->first)

      return;

  }


  auto AcceptedTypes = S->getAcceptedCompletionTypes(ContextStack);

  for (const auto &Completion : S->getMatcherCompletions(AcceptedTypes)) {

    addCompletion(CompToken, Completion);

  }


  for (const auto &Completion : getNamedValueCompletions(AcceptedTypes)) {

    addCompletion(CompToken, Completion);

  }

}


/// Parse an <Expression>

bool Parser::parseExpressionImpl(VariantValue *Value) {

  switch (Tokenizer->nextTokenKind()) {

  case TokenInfo::TK_Literal:

    *Value = Tokenizer->consumeNextToken().Value;

    return true;


  case TokenInfo::TK_Ident:

    return parseIdentifierPrefixImpl(Value);


  case TokenInfo::TK_CodeCompletion:

    addExpressionCompletions();

    return false;


  case TokenInfo::TK_Eof:

    Error->addError(Tokenizer->consumeNextToken().Range,

                    Error->ET_ParserNoCode);

    return false;


  case TokenInfo::TK_Error:

    // This error was already reported by the tokenizer.

    return false;

  case TokenInfo::TK_NewLine:

  case TokenInfo::TK_OpenParen:

  case TokenInfo::TK_CloseParen:

  case TokenInfo::TK_Comma:

  case TokenInfo::TK_Period:

  case TokenInfo::TK_InvalidChar:

    const TokenInfo Token = Tokenizer->consumeNextToken();

    Error->addError(Token.Range, Error->ET_ParserInvalidToken)

        << (Token.Kind == TokenInfo::TK_NewLine ? "NewLine" : Token.Text);

    return false;

  }


  llvm_unreachable("Unknown token kind.");

}


static llvm::ManagedStatic<Parser::RegistrySema> DefaultRegistrySema;


Parser::Parser(CodeTokenizer *Tokenizer, Sema *S,

               const NamedValueMap *NamedValues, Diagnostics *Error)

    : Tokenizer(Tokenizer), S(S ? S : &*DefaultRegistrySema),

      NamedValues(NamedValues), Error(Error) {}


Parser::RegistrySema::~RegistrySema() = default;


std::optional<MatcherCtor>


Parser::RegistrySema::lookupMatcherCtor(StringRef MatcherName) {

  return Registry::lookupMatcherCtor(MatcherName);

}


VariantMatcher Parser::RegistrySema::actOnMatcherExpression(

    MatcherCtor Ctor, SourceRange NameRange, StringRef BindID,

    ArrayRef<ParserValue> Args, Diagnostics *Error) {

  if (BindID.empty()) {

    return Registry::constructMatcher(Ctor, NameRange, Args, Error);

  } else {

    return Registry::constructBoundMatcher(Ctor, NameRange, BindID, Args,

                                           Error);

  }

}


std::vector<ArgKind> Parser::RegistrySema::getAcceptedCompletionTypes(

    ArrayRef<std::pair<MatcherCtor, unsigned>> Context) {

  return Registry::getAcceptedCompletionTypes(Context);

}


std::vector<MatcherCompletion> Parser::RegistrySema::getMatcherCompletions(

    ArrayRef<ArgKind> AcceptedTypes) {

  return Registry::getMatcherCompletions(AcceptedTypes);

}


bool Parser::RegistrySema::isBuilderMatcher(MatcherCtor Ctor) const {

  return Registry::isBuilderMatcher(Ctor);

}


ASTNodeKind Parser::RegistrySema::nodeMatcherType(MatcherCtor Ctor) const {

  return Registry::nodeMatcherType(Ctor);

}


internal::MatcherDescriptorPtr


Parser::RegistrySema::buildMatcherCtor(MatcherCtor Ctor, SourceRange NameRange,

                                       ArrayRef<ParserValue> Args,

                                       Diagnostics *Error) const {

  return Registry::buildMatcherCtor(Ctor, NameRange, Args, Error);

}


bool Parser::parseExpression(StringRef &Code, Sema *S,

                             const NamedValueMap *NamedValues,

                             VariantValue *Value, Diagnostics *Error) {

  CodeTokenizer Tokenizer(Code, Error);

  if (!Parser(&Tokenizer, S, NamedValues, Error).parseExpressionImpl(Value))

    return false;

  auto NT = Tokenizer.peekNextToken();

  if (NT.Kind != TokenInfo::TK_Eof && NT.Kind != TokenInfo::TK_NewLine) {

    Error->addError(Tokenizer.peekNextToken().Range,

                    Error->ET_ParserTrailingCode);

    return false;

  }

  return true;

}


std::vector<MatcherCompletion>


Parser::completeExpression(StringRef &Code, unsigned CompletionOffset, Sema *S,

                           const NamedValueMap *NamedValues) {

  Diagnostics Error;

  CodeTokenizer Tokenizer(Code, &Error, CompletionOffset);

  Parser P(&Tokenizer, S, NamedValues, &Error);

  VariantValue Dummy;

  P.parseExpressionImpl(&Dummy);


  // Sort by specificity, then by name.

  llvm::sort(P.Completions,

             [](const MatcherCompletion &A, const MatcherCompletion &B) {

               if (A.Specificity != B.Specificity)

                 return A.Specificity > B.Specificity;

               return A.TypedText < B.TypedText;

             });


  return P.Completions;

}


std::optional<DynTypedMatcher>


Parser::parseMatcherExpression(StringRef &Code, Sema *S,

                               const NamedValueMap *NamedValues,

                               Diagnostics *Error) {

  VariantValue Value;

  if (!parseExpression(Code, S, NamedValues, &Value, Error))

    return std::nullopt;

  if (!Value.isMatcher()) {

    Error->addError(SourceRange(), Error->ET_ParserNotAMatcher);

    return std::nullopt;

  }

  std::optional<DynTypedMatcher> Result = Value.getMatcher().getSingleMatcher();

  if (!Result) {

    Error->addError(SourceRange(), Error->ET_ParserOverloadedType)

        << Value.getTypeAsString();

  }

  return Result;

}


} // namespace dynamic

} // namespace ast_matchers

} // namespace clang

ASTMatchersInternal.h

Parser.h
Simple matcher expression parser.

CharInfo.h

Diagnostics.h
Diagnostics class to manage error messages.

consumeWhitespace
static StringRef consumeWhitespace(StringRef S)
Definition Parsing.cpp:142

Registry.h
Registry of all known matchers.

Value
Value
Definition UninitializedValues.cpp:118

c
__device__ __2f16 float c
Definition __clang_hip_libdevice_declares.h:296

clang::ASTNodeKind
Kind identifier.
Definition ASTTypeTraits.h:51

clang::Sema
Sema - This implements semantic analysis and AST building for C.
Definition Sema.h:856

clang::Value
Definition Value.h:95

clang::ast_matchers::dynamic::Diagnostics
Helper class to manage error messages.
Definition Diagnostics.h:50

clang::ast_matchers::dynamic::Parser::CodeTokenizer
Simple tokenizer for the parser.
Definition Parser.cpp:68

clang::ast_matchers::dynamic::Parser::CodeTokenizer::consumeNextTokenIgnoreNewlines
TokenInfo consumeNextTokenIgnoreNewlines()
Definition Parser.cpp:98

clang::ast_matchers::dynamic::Parser::CodeTokenizer::SkipNewlines
TokenInfo SkipNewlines()
Definition Parser.cpp:92

clang::ast_matchers::dynamic::Parser::CodeTokenizer::CodeTokenizer
CodeTokenizer(StringRef &MatcherCode, Diagnostics *Error, unsigned CodeCompletionOffset)
Definition Parser.cpp:75

clang::ast_matchers::dynamic::Parser::CodeTokenizer::nextTokenKind
TokenInfo::TokenKind nextTokenKind() const
Definition Parser.cpp:105

clang::ast_matchers::dynamic::Parser::CodeTokenizer::CodeTokenizer
CodeTokenizer(StringRef &MatcherCode, Diagnostics *Error)
Definition Parser.cpp:70

clang::ast_matchers::dynamic::Parser::CodeTokenizer::consumeNextToken
TokenInfo consumeNextToken()
Consumes and returns the next token.
Definition Parser.cpp:86

clang::ast_matchers::dynamic::Parser::CodeTokenizer::peekNextToken
const TokenInfo & peekNextToken() const
Returns but doesn't consume the next token.
Definition Parser.cpp:83

clang::ast_matchers::dynamic::Parser::RegistrySema::nodeMatcherType
ASTNodeKind nodeMatcherType(MatcherCtor) const override
Definition Parser.cpp:868

clang::ast_matchers::dynamic::Parser::RegistrySema::getAcceptedCompletionTypes
std::vector< ArgKind > getAcceptedCompletionTypes(llvm::ArrayRef< std::pair< MatcherCtor, unsigned > > Context) override
Compute the list of completion types for Context.
Definition Parser.cpp:854

clang::ast_matchers::dynamic::Parser::RegistrySema::lookupMatcherCtor
std::optional< MatcherCtor > lookupMatcherCtor(StringRef MatcherName) override
Look up a matcher by name.
Definition Parser.cpp:839

clang::ast_matchers::dynamic::Parser::RegistrySema::getMatcherCompletions
std::vector< MatcherCompletion > getMatcherCompletions(llvm::ArrayRef< ArgKind > AcceptedTypes) override
Compute the list of completions that match any of AcceptedTypes.
Definition Parser.cpp:859

clang::ast_matchers::dynamic::Parser::RegistrySema::buildMatcherCtor
internal::MatcherDescriptorPtr buildMatcherCtor(MatcherCtor, SourceRange NameRange, ArrayRef< ParserValue > Args, Diagnostics *Error) const override
Definition Parser.cpp:873

clang::ast_matchers::dynamic::Parser::RegistrySema::isBuilderMatcher
bool isBuilderMatcher(MatcherCtor Ctor) const override
Definition Parser.cpp:864

clang::ast_matchers::dynamic::Parser::RegistrySema::actOnMatcherExpression
VariantMatcher actOnMatcherExpression(MatcherCtor Ctor, SourceRange NameRange, StringRef BindID, ArrayRef< ParserValue > Args, Diagnostics *Error) override
Process a matcher expression.
Definition Parser.cpp:843

clang::ast_matchers::dynamic::Parser::Sema
Interface to connect the parser with the registry and more.
Definition Parser.h:67

clang::ast_matchers::dynamic::Parser::Sema::getAcceptedCompletionTypes
virtual std::vector< ArgKind > getAcceptedCompletionTypes(llvm::ArrayRef< std::pair< MatcherCtor, unsigned > > Context)
Compute the list of completion types for Context.
Definition Parser.cpp:322

clang::ast_matchers::dynamic::Parser::Sema::~Sema
virtual ~Sema()

clang::ast_matchers::dynamic::Parser::Sema::getMatcherCompletions
virtual std::vector< MatcherCompletion > getMatcherCompletions(llvm::ArrayRef< ArgKind > AcceptedTypes)
Compute the list of completions that match any of AcceptedTypes.
Definition Parser.cpp:328

clang::ast_matchers::dynamic::Parser::parseExpression
static bool parseExpression(StringRef &Code, Sema *S, const NamedValueMap *NamedValues, VariantValue *Value, Diagnostics *Error)
Parse an expression.
Definition Parser.cpp:879

clang::ast_matchers::dynamic::Parser::completeExpression
static std::vector< MatcherCompletion > completeExpression(StringRef &Code, unsigned CompletionOffset, Sema *S, const NamedValueMap *NamedValues)
Complete an expression at the given offset.
Definition Parser.cpp:895

clang::ast_matchers::dynamic::Parser::NamedValueMap
llvm::StringMap< VariantValue > NamedValueMap
Definition Parser.h:166

clang::ast_matchers::dynamic::Parser::parseMatcherExpression
static std::optional< DynTypedMatcher > parseMatcherExpression(StringRef &MatcherCode, Sema *S, const NamedValueMap *NamedValues, Diagnostics *Error)
Parse a matcher expression.
Definition Parser.cpp:915

clang::ast_matchers::dynamic::Registry::getAcceptedCompletionTypes
static std::vector< ArgKind > getAcceptedCompletionTypes(llvm::ArrayRef< std::pair< MatcherCtor, unsigned > > Context)
Compute the list of completion types for Context.
Definition Registry.cpp:668

clang::ast_matchers::dynamic::Registry::isBuilderMatcher
static bool isBuilderMatcher(MatcherCtor Ctor)
Definition Registry.cpp:634

clang::ast_matchers::dynamic::Registry::nodeMatcherType
static ASTNodeKind nodeMatcherType(MatcherCtor)
Definition Registry.cpp:625

clang::ast_matchers::dynamic::Registry::lookupMatcherCtor
static std::optional< MatcherCtor > lookupMatcherCtor(StringRef MatcherName)
Look up a matcher in the registry by name,.
Definition Registry.cpp:646

clang::ast_matchers::dynamic::Registry::buildMatcherCtor
static internal::MatcherDescriptorPtr buildMatcherCtor(MatcherCtor, SourceRange NameRange, ArrayRef< ParserValue > Args, Diagnostics *Error)
Definition Registry.cpp:639

clang::ast_matchers::dynamic::Registry::getMatcherCompletions
static std::vector< MatcherCompletion > getMatcherCompletions(ArrayRef< ArgKind > AcceptedTypes)
Compute the list of completions that match any of AcceptedTypes.
Definition Registry.cpp:702

clang::ast_matchers::dynamic::Registry::constructBoundMatcher
static VariantMatcher constructBoundMatcher(MatcherCtor Ctor, SourceRange NameRange, StringRef BindID, ArrayRef< ParserValue > Args, Diagnostics *Error)
Construct a matcher from the registry and bind it.
Definition Registry.cpp:814

clang::ast_matchers::dynamic::Registry::constructMatcher
static VariantMatcher constructMatcher(MatcherCtor Ctor, SourceRange NameRange, ArrayRef< ParserValue > Args, Diagnostics *Error)
Construct a matcher from the registry.
Definition Registry.cpp:807

clang::ast_matchers::dynamic::VariantMatcher
A variant matcher object.
Definition VariantValue.h:105

clang::ast_matchers::dynamic::VariantMatcher::SingleMatcher
static VariantMatcher SingleMatcher(const DynTypedMatcher &Matcher)
Clones the provided matcher.
Definition VariantValue.cpp:226

clang::ast_matchers::dynamic::VariantValue
Variant value class.
Definition VariantValue.h:254

clang::ast_matchers::dynamic::VariantValue::getString
const std::string & getString() const
Definition VariantValue.cpp:383

clang::ast_matchers::dynamic::internal::MatcherDescriptorPtr
A smart (owning) pointer for MatcherDescriptor.
Definition Registry.h:38

llvm::ArrayRef
Definition LLVM.h:31

clang::ast_matchers::dynamic
Definition Diagnostics.h:28

clang::ast_matchers::dynamic::DefaultRegistrySema
static llvm::ManagedStatic< Parser::RegistrySema > DefaultRegistrySema
Definition Parser.cpp:829

clang::ast_matchers::dynamic::MatcherCtor
const internal::MatcherDescriptor * MatcherCtor
Definition Registry.h:55

clang::ast_matchers
Definition ASTMatchers.h:102

clang::modulemap::Decl
std::variant< struct RequiresDecl, struct HeaderDecl, struct UmbrellaDirDecl, struct ModuleDecl, struct ExcludeDecl, struct ExportDecl, struct ExportAsDecl, struct ExternModuleDecl, struct UseDecl, struct LinkDecl, struct ConfigMacrosDecl, struct ConflictDecl > Decl
All declarations that can appear in a module declaration.
Definition ModuleMapFile.h:32

clang::transformer::EditKind::Range
@ Range
Definition RewriteRule.h:37

clang
The JSON file list parser is used to communicate input to InstallAPI.
Definition CalledOnceCheck.h:17

clang::DiagnosticLevelMask::Error
@ Error
Definition DiagnosticOptions.h:43

clang::LinkageSpecLanguageIDs::C
@ C
Definition DeclCXX.h:3003

clang::toLowercase
LLVM_READONLY char toLowercase(char c)
Converts the given ASCII character to its lowercase equivalent.
Definition CharInfo.h:224

clang::isAlphanumeric
LLVM_READONLY bool isAlphanumeric(unsigned char c)
Return true if this character is an ASCII letter or digit: [a-zA-Z0-9].
Definition CharInfo.h:138

clang::ObjCSubstitutionContext::Result
@ Result
The result type of a method or function.
Definition TypeBase.h:905

clang::PragmaClangSectionKind::Text
@ Text
Definition Sema.h:472

clang::isHexDigit
LLVM_READONLY bool isHexDigit(unsigned char c)
Return true if this character is an ASCII hex digit: [0-9a-fA-F].
Definition CharInfo.h:144

clang::SourceLocIdentKind::Line
@ Line
Definition Expr.h:5009

clang::ast_matchers::dynamic::Diagnostics::Context::MatcherArg
@ MatcherArg
Definition Diagnostics.h:113

clang::ast_matchers::dynamic::Diagnostics::Context::ConstructMatcher
@ ConstructMatcher
Definition Diagnostics.h:109

clang::ast_matchers::dynamic::MatcherCompletion
Definition Registry.h:57

clang::ast_matchers::dynamic::Parser::ScopedContextEntry
Definition Parser.cpp:332

clang::ast_matchers::dynamic::Parser::ScopedContextEntry::~ScopedContextEntry
~ScopedContextEntry()
Definition Parser.cpp:339

clang::ast_matchers::dynamic::Parser::ScopedContextEntry::P
Parser * P
Definition Parser.cpp:333

clang::ast_matchers::dynamic::Parser::ScopedContextEntry::ScopedContextEntry
ScopedContextEntry(Parser *P, MatcherCtor C)
Definition Parser.cpp:335

clang::ast_matchers::dynamic::Parser::ScopedContextEntry::nextArg
void nextArg()
Definition Parser.cpp:343

clang::ast_matchers::dynamic::Parser::TokenInfo
Simple structure to hold information for one token from the parser.
Definition Parser.cpp:36

clang::ast_matchers::dynamic::Parser::TokenInfo::Range
SourceRange Range
Definition Parser.cpp:60

clang::ast_matchers::dynamic::Parser::TokenInfo::TokenKind
TokenKind
Different possible tokens.
Definition Parser.cpp:38

clang::ast_matchers::dynamic::Parser::TokenInfo::TK_Comma
@ TK_Comma
Definition Parser.cpp:43

clang::ast_matchers::dynamic::Parser::TokenInfo::TK_NewLine
@ TK_NewLine
Definition Parser.cpp:40

clang::ast_matchers::dynamic::Parser::TokenInfo::TK_Ident
@ TK_Ident
Definition Parser.cpp:46

clang::ast_matchers::dynamic::Parser::TokenInfo::TK_OpenParen
@ TK_OpenParen
Definition Parser.cpp:41

clang::ast_matchers::dynamic::Parser::TokenInfo::TK_InvalidChar
@ TK_InvalidChar
Definition Parser.cpp:47

clang::ast_matchers::dynamic::Parser::TokenInfo::TK_CloseParen
@ TK_CloseParen
Definition Parser.cpp:42

clang::ast_matchers::dynamic::Parser::TokenInfo::TK_Literal
@ TK_Literal
Definition Parser.cpp:45

clang::ast_matchers::dynamic::Parser::TokenInfo::TK_Eof
@ TK_Eof
Definition Parser.cpp:39

clang::ast_matchers::dynamic::Parser::TokenInfo::TK_Error
@ TK_Error
Definition Parser.cpp:48

clang::ast_matchers::dynamic::Parser::TokenInfo::TK_CodeCompletion
@ TK_CodeCompletion
Definition Parser.cpp:49

clang::ast_matchers::dynamic::Parser::TokenInfo::TK_Period
@ TK_Period
Definition Parser.cpp:44

clang::ast_matchers::dynamic::Parser::TokenInfo::ID_Bind
static const char *const ID_Bind
Some known identifiers.
Definition Parser.cpp:53

clang::ast_matchers::dynamic::Parser::TokenInfo::ID_With
static const char *const ID_With
Definition Parser.cpp:54

clang::ast_matchers::dynamic::Parser::TokenInfo::Text
StringRef Text
Definition Parser.cpp:58

clang::ast_matchers::dynamic::Parser::TokenInfo::Kind
TokenKind Kind
Definition Parser.cpp:59

clang::ast_matchers::dynamic::Parser::TokenInfo::TokenInfo
TokenInfo()=default

clang::ast_matchers::dynamic::Parser::TokenInfo::Value
VariantValue Value
Definition Parser.cpp:61

clang::ast_matchers::dynamic::SourceRange
Definition Diagnostics.h:36