17#include "llvm/ADT/StringSwitch.h"
34 return "float_constant";
38 return "integer_constant";
60 llvm_unreachable(
"Unknown token name");
64 return (
'a' <= c && c <=
'z') || (
'A' <= c && c <=
'Z');
67static bool IsDigit(
char c) {
return '0' <= c && c <=
'9'; }
71static std::optional<llvm::StringRef>
IsWord(llvm::StringRef expr,
72 llvm::StringRef &remainder) {
75 llvm::StringRef candidate = remainder.take_while(
76 [](
char c) {
return IsDigit(c) ||
IsLetter(c) || c ==
'_' || c ==
'$'; });
77 if (candidate.empty() ||
IsDigit(candidate[0]))
79 remainder = remainder.drop_front(candidate.size());
87static std::optional<llvm::StringRef>
IsNumber(llvm::StringRef &remainder,
89 llvm::StringRef tail = remainder;
91 size_t dots = body.count(
'.');
92 if (dots > 1 || dots == body.size())
94 if (
IsDigit(body.front()) || (body[0] ==
'.' &&
IsDigit(body[1]))) {
96 tail = tail.drop_front(body.size());
97 bool isHex = body.contains_insensitive(
'x');
98 bool hasExp = !isHex && body.contains_insensitive(
'e');
99 bool hasHexExp = isHex && body.contains_insensitive(
'p');
100 if (hasExp || hasHexExp) {
102 if (body.ends_with_insensitive(
"e") || body.ends_with_insensitive(
"p"))
103 if (tail.consume_front(
"+") || tail.consume_front(
"-"))
106 size_t number_length = remainder.size() - tail.size();
107 llvm::StringRef number = remainder.take_front(number_length);
108 remainder = remainder.drop_front(number_length);
118 if (!token.
IsOneOf({Token::identifier, Token::period, Token::eof})) {
119 return llvm::make_error<DILDiagnosticError>(
120 expr, llvm::formatv(
"{0} is not allowed in DIL simple mode", token),
125 if (!token.
IsOneOf({Token::identifier, Token::integer_constant,
126 Token::period, Token::arrow, Token::star, Token::amp,
127 Token::l_square, Token::r_square, Token::eof})) {
128 return llvm::make_error<DILDiagnosticError>(
129 expr, llvm::formatv(
"{0} is not allowed in DIL legacy mode", token),
136 return llvm::Error::success();
141 std::vector<Token> tokens;
142 llvm::StringRef remainder = expr;
144 if (llvm::Expected<Token> t =
Lex(expr, remainder)) {
148 tokens.push_back(std::move(token));
150 return t.takeError();
152 }
while (tokens.back().GetKind() !=
Token::eof);
153 return DILLexer(expr, std::move(tokens));
157 llvm::StringRef &remainder) {
159 remainder = remainder.ltrim();
160 llvm::StringRef::iterator cur_pos = remainder.begin();
163 if (remainder.empty())
166 uint32_t position = cur_pos - expr.begin();
167 bool isFloat =
false;
168 std::optional<llvm::StringRef> maybe_number =
IsNumber(remainder, isFloat);
171 return Token(kind, maybe_number->str(), position);
173 std::optional<llvm::StringRef> maybe_word =
IsWord(expr, remainder);
175 llvm::StringRef word = *maybe_word;
176 Token::Kind kind = llvm::StringSwitch<Token::Kind>(word)
180 return Token(kind, word.str(), position);
183 constexpr std::pair<Token::Kind, const char *> operators[] = {
189 for (
auto [kind, str] : operators) {
190 if (remainder.consume_front(str))
191 return Token(kind, str, position);
195 return llvm::make_error<DILDiagnosticError>(expr,
"unrecognized token",
static llvm::raw_ostream & error(Stream &strm)
static llvm::Expected< DILLexer > Create(llvm::StringRef expr, lldb::DILMode mode=lldb::eDILModeFull)
Lexes all the tokens in expr and calls the private constructor with the lexed tokens.
DILLexer(llvm::StringRef dil_expr, std::vector< Token > lexed_tokens)
static llvm::Expected< Token > Lex(llvm::StringRef expr, llvm::StringRef &remainder)
Class defining the tokens generated by the DIL lexer and used by the DIL parser.
static llvm::StringRef GetTokenName(Kind kind)
uint32_t GetLocation() const
bool IsOneOf(llvm::ArrayRef< Kind > kinds) const
static std::optional< llvm::StringRef > IsWord(llvm::StringRef expr, llvm::StringRef &remainder)
static bool IsNumberBodyChar(char ch)
static llvm::Error IsNotAllowedByMode(llvm::StringRef expr, Token token, lldb::DILMode mode)
static bool IsLetter(char c)
static std::optional< llvm::StringRef > IsNumber(llvm::StringRef &remainder, bool &isFloat)
static bool IsDigit(char c)
DILMode
Data Inspection Language (DIL) evaluation modes.
@ eDILModeFull
Allowed: everything supported by DIL.
@ eDILModeLegacy
Allowed: identifiers, integers, operators: '.', '->', '*', '&', '[]'.
@ eDILModeSimple
Allowed: identifiers, operators: '.'.