17#include "llvm/ADT/StringSwitch.h"
34 return "float_constant";
38 return "integer_constant";
64 llvm_unreachable(
"Unknown token name");
68 return (
'a' <= c && c <=
'z') || (
'A' <= c && c <=
'Z');
71static bool IsDigit(
char c) {
return '0' <= c && c <=
'9'; }
75static std::optional<llvm::StringRef>
IsWord(llvm::StringRef expr,
76 llvm::StringRef &remainder) {
79 llvm::StringRef candidate = remainder.take_while(
80 [](
char c) {
return IsDigit(c) ||
IsLetter(c) || c ==
'_' || c ==
'$'; });
81 if (candidate.empty() ||
IsDigit(candidate[0]))
83 remainder = remainder.drop_front(candidate.size());
91static std::optional<llvm::StringRef>
IsNumber(llvm::StringRef &remainder,
93 llvm::StringRef tail = remainder;
95 size_t dots = body.count(
'.');
96 if (dots > 1 || dots == body.size())
98 if (
IsDigit(body.front()) || (body[0] ==
'.' &&
IsDigit(body[1]))) {
100 tail = tail.drop_front(body.size());
101 bool isHex = body.contains_insensitive(
'x');
102 bool hasExp = !isHex && body.contains_insensitive(
'e');
103 bool hasHexExp = isHex && body.contains_insensitive(
'p');
104 if (hasExp || hasHexExp) {
106 if (body.ends_with_insensitive(
"e") || body.ends_with_insensitive(
"p"))
107 if (tail.consume_front(
"+") || tail.consume_front(
"-"))
110 size_t number_length = remainder.size() - tail.size();
111 llvm::StringRef number = remainder.take_front(number_length);
112 remainder = remainder.drop_front(number_length);
122 if (!token.
IsOneOf({Token::identifier, Token::period, Token::eof})) {
123 return llvm::make_error<DILDiagnosticError>(
124 expr, llvm::formatv(
"{0} is not allowed in DIL simple mode", token),
129 if (!token.
IsOneOf({Token::identifier, Token::integer_constant,
130 Token::period, Token::arrow, Token::star, Token::amp,
131 Token::l_square, Token::r_square, Token::eof})) {
132 return llvm::make_error<DILDiagnosticError>(
133 expr, llvm::formatv(
"{0} is not allowed in DIL legacy mode", token),
140 return llvm::Error::success();
145 std::vector<Token> tokens;
146 llvm::StringRef remainder = expr;
148 if (llvm::Expected<Token> t =
Lex(expr, remainder)) {
152 tokens.push_back(std::move(token));
154 return t.takeError();
156 }
while (tokens.back().GetKind() !=
Token::eof);
157 return DILLexer(expr, std::move(tokens));
161 llvm::StringRef &remainder) {
163 remainder = remainder.ltrim();
164 llvm::StringRef::iterator cur_pos = remainder.begin();
167 if (remainder.empty())
170 uint32_t position = cur_pos - expr.begin();
171 bool isFloat =
false;
172 std::optional<llvm::StringRef> maybe_number =
IsNumber(remainder, isFloat);
175 return Token(kind, maybe_number->str(), position);
177 std::optional<llvm::StringRef> maybe_word =
IsWord(expr, remainder);
179 llvm::StringRef word = *maybe_word;
180 Token::Kind kind = llvm::StringSwitch<Token::Kind>(word)
184 return Token(kind, word.str(), position);
187 constexpr std::pair<Token::Kind, const char *> operators[] = {
194 for (
auto [kind, str] : operators) {
195 if (remainder.consume_front(str))
196 return Token(kind, str, position);
200 return llvm::make_error<DILDiagnosticError>(expr,
"unrecognized token",
static llvm::raw_ostream & error(Stream &strm)
static llvm::Expected< DILLexer > Create(llvm::StringRef expr, lldb::DILMode mode=lldb::eDILModeFull)
Lexes all the tokens in expr and calls the private constructor with the lexed tokens.
DILLexer(llvm::StringRef dil_expr, std::vector< Token > lexed_tokens)
static llvm::Expected< Token > Lex(llvm::StringRef expr, llvm::StringRef &remainder)
Class defining the tokens generated by the DIL lexer and used by the DIL parser.
static llvm::StringRef GetTokenName(Kind kind)
uint32_t GetLocation() const
bool IsOneOf(llvm::ArrayRef< Kind > kinds) const
static std::optional< llvm::StringRef > IsWord(llvm::StringRef expr, llvm::StringRef &remainder)
static bool IsNumberBodyChar(char ch)
static llvm::Error IsNotAllowedByMode(llvm::StringRef expr, Token token, lldb::DILMode mode)
static bool IsLetter(char c)
static std::optional< llvm::StringRef > IsNumber(llvm::StringRef &remainder, bool &isFloat)
static bool IsDigit(char c)
DILMode
Data Inspection Language (DIL) evaluation modes.
@ eDILModeFull
Allowed: everything supported by DIL.
@ eDILModeLegacy
Allowed: identifiers, integers, operators: '.', '->', '*', '&', '[]'.
@ eDILModeSimple
Allowed: identifiers, operators: '.'.