11#include "llvm-c/Disassembler.h"
12#include "llvm/ADT/SmallString.h"
13#include "llvm/ADT/StringExtras.h"
14#include "llvm/MC/MCAsmInfo.h"
15#include "llvm/MC/MCContext.h"
16#include "llvm/MC/MCDisassembler/MCDisassembler.h"
17#include "llvm/MC/MCDisassembler/MCExternalSymbolizer.h"
18#include "llvm/MC/MCDisassembler/MCRelocationInfo.h"
19#include "llvm/MC/MCInst.h"
20#include "llvm/MC/MCInstPrinter.h"
21#include "llvm/MC/MCInstrAnalysis.h"
22#include "llvm/MC/MCInstrInfo.h"
23#include "llvm/MC/MCRegisterInfo.h"
24#include "llvm/MC/MCSubtargetInfo.h"
25#include "llvm/MC/MCTargetOptions.h"
26#include "llvm/MC/TargetRegistry.h"
27#include "llvm/Support/ErrorHandling.h"
28#include "llvm/Support/ScopedPrinter.h"
29#include "llvm/Support/TargetSelect.h"
30#include "llvm/TargetParser/AArch64TargetParser.h"
57 static std::unique_ptr<MCDisasmInstance>
58 Create(
const char *triple,
const char *cpu,
const char *features_str,
63 bool GetMCInst(
const uint8_t *opcode_data,
size_t opcode_data_len,
66 std::string &inst_string, std::string &comments_string);
70 bool CanBranch(llvm::MCInst &mc_inst)
const;
72 bool IsCall(llvm::MCInst &mc_inst)
const;
73 bool IsLoad(llvm::MCInst &mc_inst)
const;
74 bool IsBarrier(llvm::MCInst &mc_inst)
const;
79 std::unique_ptr<llvm::MCRegisterInfo> &®_info_up,
80 std::unique_ptr<llvm::MCSubtargetInfo> &&subtarget_info_up,
81 llvm::MCTargetOptions mc_options,
82 std::unique_ptr<llvm::MCAsmInfo> &&asm_info_up,
83 std::unique_ptr<llvm::MCContext> &&context_up,
84 std::unique_ptr<llvm::MCDisassembler> &&disasm_up,
85 std::unique_ptr<llvm::MCInstPrinter> &&instr_printer_up,
86 std::unique_ptr<llvm::MCInstrAnalysis> &&instr_analysis_up);
137 uint8_t opcode_len = opcode_and_modrm.
opcode_len;
138 uint8_t modrm = opcode_and_modrm.
modrm;
143 if (opcode >= 0x70 && opcode <= 0x7F) {
150 if (opcode >= 0x80 && opcode <= 0x8F) {
163 if (opcode_len == 1) {
164 uint8_t modrm_reg = (modrm >> 3) & 7;
167 else if (modrm_reg == 3)
169 else if (modrm_reg == 4)
171 else if (modrm_reg == 5)
227 if (opcode_len == 2) {
267std::optional<InstructionOpcodeAndModrm>
269 bool is_exec_mode_64b) {
271 bool prefix_done =
false;
278 while (!prefix_done) {
279 if (op_idx >= bytes_len)
318 if (is_exec_mode_64b)
326 if (!is_exec_mode_64b && (inst_bytes[op_idx + 1] & 0xc0) != 0xc0) {
333 ret.
modrm = inst_bytes[op_idx + 3];
337 if (!is_exec_mode_64b && (inst_bytes[op_idx + 1] & 0xc0) != 0xc0) {
341 ret.
opcode_len = inst_bytes[op_idx + 1] & 0x1f;
343 ret.
modrm = inst_bytes[op_idx + 4];
348 if (!is_exec_mode_64b && (inst_bytes[op_idx + 1] & 0xc0) != 0xc0) {
352 ret.
opcode_len = inst_bytes[op_idx + 1] & 0x03;
354 ret.
modrm = inst_bytes[op_idx + 5];
364 ret.
modrm = inst_bytes[op_idx + 1];
374 ret.
modrm = inst_bytes[op_idx + 1];
378 ret.
modrm = inst_bytes[op_idx + 1];
382 ret.
modrm = inst_bytes[op_idx + 1];
386 ret.
modrm = inst_bytes[op_idx + 1];
389 ret.
modrm = inst_bytes[op_idx + 1];
398 std::optional<InstructionOpcodeAndModrm> ret;
424 disasm.shared_from_this())) {}
465 const ArchSpec &arch = disasm->GetArchitecture();
470 if (min_op_byte_size == max_op_byte_size) {
475 switch (min_op_byte_size) {
498 bool is_alternate_isa =
false;
502 const llvm::Triple::ArchType machine = arch.
GetMachine();
503 if (machine == llvm::Triple::arm || machine == llvm::Triple::thumb) {
504 if (machine == llvm::Triple::thumb || is_alternate_isa) {
505 uint32_t thumb_opcode = data.
GetU16(&data_offset);
506 if ((thumb_opcode & 0xe000) != 0xe000 ||
507 ((thumb_opcode & 0x1800u) == 0)) {
508 m_opcode.SetOpcode16(thumb_opcode, byte_order);
512 thumb_opcode |= data.
GetU16(&data_offset);
513 m_opcode.SetOpcode16_2(thumb_opcode, byte_order);
523 uint8_t *opcode_data =
524 const_cast<uint8_t *
>(data.
PeekData(data_offset, 1));
525 const size_t opcode_data_len = data.
BytesLeft(data_offset);
529 uint64_t inst_size = 0;
531 pc, inst, inst_size);
533 if (inst_size != 0) {
535 m_opcode.SetOpcode16_32TupleBytes(opcode_data, inst_size,
538 m_opcode.SetOpcodeBytes(opcode_data, inst_size);
560 if (disasm->GetArchitecture().GetMachine() == llvm::Triple::x86)
562 else if (disasm->GetArchitecture().GetMachine() == llvm::Triple::x86_64)
575 std::string out_string;
576 std::string markup_out_string;
577 std::string comment_string;
578 std::string markup_comment_string;
585 mc_disasm_ptr = disasm->m_alternate_disasm_up.get();
587 mc_disasm_ptr = disasm->m_disasm_up.get();
592 bool use_hex_immediates =
true;
612 uint64_t inst_size = 0;
613 bool valid = mc_disasm_ptr->
GetMCInst(opcode_data, opcode_data_len,
pc,
616 if (valid && inst_size > 0) {
617 mc_disasm_ptr->
SetStyle(use_hex_immediates, hex_style);
619 const bool saved_use_color = mc_disasm_ptr->
GetUseColor();
621 mc_disasm_ptr->
PrintMCInst(inst,
pc, out_string, comment_string);
624 markup_comment_string);
627 if (!comment_string.empty()) {
632 if (inst_size == 0) {
640 const uint8_t uval8 = data.
GetU8(&offset);
641 m_opcode.SetOpcode8(uval8, byte_order);
643 mnemonic_strm.
Printf(
"0x%2.2x", uval8);
646 const uint16_t uval16 = data.
GetU16(&offset);
647 m_opcode.SetOpcode16(uval16, byte_order);
649 mnemonic_strm.
Printf(
"0x%4.4x", uval16);
652 const uint32_t uval32 = data.
GetU32(&offset);
653 m_opcode.SetOpcode32(uval32, byte_order);
655 mnemonic_strm.
Printf(
"0x%8.8x", uval32);
658 const uint64_t uval64 = data.
GetU64(&offset);
659 m_opcode.SetOpcode64(uval64, byte_order);
661 mnemonic_strm.
Printf(
"0x%16.16" PRIx64, uval64);
667 const uint8_t *bytes = data.
PeekData(offset, inst_size);
668 if (bytes ==
nullptr)
671 m_opcode.SetOpcodeBytes(bytes, inst_size);
672 mnemonic_strm.
Printf(
"0x%2.2x", bytes[0]);
673 for (uint32_t i = 1; i < inst_size; ++i)
674 mnemonic_strm.
Printf(
" 0x%2.2x", bytes[i]);
683 llvm::StringRef(
"[ \t]*([^ ^\t]+)[ \t]*([^ ^\t].*)?"));
685 llvm::SmallVector<llvm::StringRef, 4> matches;
686 if (s_regex.
Execute(out_string, &matches)) {
691 if (s_regex.
Execute(markup_out_string, &matches)) {
726 static llvm::StringRef::const_iterator
728 llvm::StringRef::const_iterator ose) {
743 static std::pair<bool, llvm::StringRef::const_iterator>
745 llvm::StringRef::const_iterator ose) {
749 if (osi != ose && *osi == c) {
754 return std::make_pair(found, osi);
757 static std::pair<Operand, llvm::StringRef::const_iterator>
759 llvm::StringRef::const_iterator ose) {
761 ret.
m_type = Operand::Type::Register;
767 if (*osi >=
'0' && *osi <=
'9') {
769 return std::make_pair(
Operand(), osi);
773 }
else if (*osi >=
'a' && *osi <=
'z') {
779 return std::make_pair(
Operand(), osi);
782 return std::make_pair(ret, osi);
786 return std::make_pair(
Operand(), osi);
795 return std::make_pair(ret, osi);
798 static std::pair<Operand, llvm::StringRef::const_iterator>
800 llvm::StringRef::const_iterator ose) {
802 ret.
m_type = Operand::Type::Immediate;
809 if (*osi >=
'0' && *osi <=
'9') {
811 }
else if (*osi >=
'a' && *osi <=
'f') {
815 return std::make_pair(
Operand(), osi);
821 return std::make_pair(
Operand(), osi);
823 ret.
m_immediate = strtoull(str.c_str(),
nullptr, 0);
824 return std::make_pair(ret, osi);
831 return std::make_pair(
Operand(), osi);
837 return std::make_pair(
Operand(), osi);
844 return std::make_pair(
Operand(), osi);
851 ret.
m_immediate = strtoull(str.c_str(),
nullptr, 0);
852 return std::make_pair(ret, osi);
856 static std::pair<Operand, llvm::StringRef::const_iterator>
858 llvm::StringRef::const_iterator ose) {
859 std::pair<Operand, llvm::StringRef::const_iterator> offset_and_iterator =
861 if (offset_and_iterator.first.IsValid()) {
862 osi = offset_and_iterator.second;
868 return std::make_pair(
Operand(), osi);
871 std::pair<Operand, llvm::StringRef::const_iterator> base_and_iterator =
873 if (base_and_iterator.first.IsValid()) {
874 osi = base_and_iterator.second;
876 return std::make_pair(
Operand(), osi);
881 return std::make_pair(
Operand(), osi);
884 std::pair<Operand, llvm::StringRef::const_iterator> index_and_iterator =
886 if (index_and_iterator.first.IsValid()) {
887 osi = index_and_iterator.second;
889 return std::make_pair(
Operand(), osi);
894 return std::make_pair(
Operand(), osi);
897 std::pair<Operand, llvm::StringRef::const_iterator>
899 if (index_and_iterator.first.IsValid()) {
900 osi = index_and_iterator.second;
902 return std::make_pair(
Operand(), osi);
907 return std::make_pair(
Operand(), osi);
911 product.
m_type = Operand::Type::Product;
912 product.
m_children.push_back(index_and_iterator.first);
913 product.
m_children.push_back(multiplier_and_iterator.first);
916 index.
m_type = Operand::Type::Sum;
917 index.
m_children.push_back(base_and_iterator.first);
920 if (offset_and_iterator.first.IsValid()) {
922 offset.
m_type = Operand::Type::Sum;
923 offset.
m_children.push_back(offset_and_iterator.first);
927 deref.
m_type = Operand::Type::Dereference;
929 return std::make_pair(deref, osi);
932 deref.
m_type = Operand::Type::Dereference;
934 return std::make_pair(deref, osi);
939 static std::pair<Operand, llvm::StringRef::const_iterator>
941 llvm::StringRef::const_iterator ose) {
942 std::pair<Operand, llvm::StringRef::const_iterator> offset_and_iterator =
944 if (offset_and_iterator.first.IsValid()) {
945 osi = offset_and_iterator.second;
951 return std::make_pair(
Operand(), osi);
954 std::pair<Operand, llvm::StringRef::const_iterator> base_and_iterator =
956 if (base_and_iterator.first.IsValid()) {
957 osi = base_and_iterator.second;
959 return std::make_pair(
Operand(), osi);
964 return std::make_pair(
Operand(), osi);
967 if (offset_and_iterator.first.IsValid()) {
969 offset.
m_type = Operand::Type::Sum;
970 offset.
m_children.push_back(offset_and_iterator.first);
971 offset.
m_children.push_back(base_and_iterator.first);
974 deref.
m_type = Operand::Type::Dereference;
976 return std::make_pair(deref, osi);
979 deref.
m_type = Operand::Type::Dereference;
980 deref.
m_children.push_back(base_and_iterator.first);
981 return std::make_pair(deref, osi);
986 static std::pair<Operand, llvm::StringRef::const_iterator>
988 llvm::StringRef::const_iterator ose) {
992 return std::make_pair(
Operand(), osi);
995 std::pair<Operand, llvm::StringRef::const_iterator> base_and_iterator =
997 if (base_and_iterator.first.IsValid()) {
998 osi = base_and_iterator.second;
1000 return std::make_pair(
Operand(), osi);
1003 std::tie(found, osi) =
ConsumeChar(osi,
',', ose);
1005 return std::make_pair(
Operand(), osi);
1008 std::pair<Operand, llvm::StringRef::const_iterator> offset_and_iterator =
1010 if (offset_and_iterator.first.IsValid()) {
1011 osi = offset_and_iterator.second;
1014 std::tie(found, osi) =
ConsumeChar(osi,
']', ose);
1016 return std::make_pair(
Operand(), osi);
1020 offset.
m_type = Operand::Type::Sum;
1021 offset.
m_children.push_back(offset_and_iterator.first);
1022 offset.
m_children.push_back(base_and_iterator.first);
1025 deref.
m_type = Operand::Type::Dereference;
1027 return std::make_pair(deref, osi);
1031 static std::pair<Operand, llvm::StringRef::const_iterator>
1033 llvm::StringRef::const_iterator ose) {
1035 std::tie(found, osi) =
ConsumeChar(osi,
'[', ose);
1037 return std::make_pair(
Operand(), osi);
1040 std::pair<Operand, llvm::StringRef::const_iterator> base_and_iterator =
1042 if (base_and_iterator.first.IsValid()) {
1043 osi = base_and_iterator.second;
1045 return std::make_pair(
Operand(), osi);
1048 std::tie(found, osi) =
ConsumeChar(osi,
']', ose);
1050 return std::make_pair(
Operand(), osi);
1054 deref.
m_type = Operand::Type::Dereference;
1055 deref.
m_children.push_back(base_and_iterator.first);
1056 return std::make_pair(deref, osi);
1061 case Operand::Type::Dereference:
1065 case Operand::Type::Immediate:
1071 case Operand::Type::Invalid:
1074 case Operand::Type::Product:
1081 case Operand::Type::Register:
1084 case Operand::Type::Sum:
1096 const char *operands_string =
GetOperands(
nullptr);
1098 if (!operands_string) {
1102 llvm::StringRef operands_ref(operands_string);
1104 llvm::StringRef::const_iterator osi = operands_ref.begin();
1105 llvm::StringRef::const_iterator ose = operands_ref.end();
1107 while (osi != ose) {
1109 llvm::StringRef::const_iterator iter;
1124 operands.push_back(operand);
1129 std::pair<bool, llvm::StringRef::const_iterator> found_and_iter =
1131 if (found_and_iter.first) {
1132 osi = found_and_iter.second;
1140 if (disasm_sp && operands.size() > 1) {
1142 switch (disasm_sp->GetArchitecture().GetMachine()) {
1145 case llvm::Triple::x86:
1146 case llvm::Triple::x86_64:
1147 operands[operands.size() - 1].m_clobbered =
true;
1149 case llvm::Triple::arm:
1150 operands[0].m_clobbered =
true;
1158 ss.
Printf(
"[%s] expands to %zu operands:\n", operands_string,
1160 for (
const Operand &operand : operands) {
1209 bool is_alternate_isa;
1214 const size_t opcode_data_len = data.
GetByteSize();
1216 uint64_t inst_size = 0;
1217 const bool valid = mc_disasm_ptr->
GetMCInst(opcode_data, opcode_data_len,
1218 pc, inst, inst_size);
1234 is_alternate_isa =
false;
1236 if (disasm->m_alternate_disasm_up) {
1240 is_alternate_isa =
true;
1241 return disasm->m_alternate_disasm_up.get();
1244 return disasm->m_disasm_up.get();
1250std::unique_ptr<DisassemblerLLVMC::MCDisasmInstance>
1253 const char *features_str,
1256 using Instance = std::unique_ptr<DisassemblerLLVMC::MCDisasmInstance>;
1258 llvm::Triple triple(triple_name);
1261 const llvm::Target *curr_target =
1262 llvm::TargetRegistry::lookupTarget(triple,
Status);
1266 std::unique_ptr<llvm::MCInstrInfo> instr_info_up(
1267 curr_target->createMCInstrInfo());
1271 std::unique_ptr<llvm::MCRegisterInfo> reg_info_up(
1272 curr_target->createMCRegInfo(triple));
1276 std::unique_ptr<llvm::MCSubtargetInfo> subtarget_info_up(
1277 curr_target->createMCSubtargetInfo(triple, cpu, features_str));
1278 if (!subtarget_info_up)
1281 llvm::MCTargetOptions MCOptions;
1282 std::unique_ptr<llvm::MCAsmInfo> asm_info_up(
1283 curr_target->createMCAsmInfo(*reg_info_up, triple, MCOptions));
1287 std::unique_ptr<llvm::MCContext> context_up(
new llvm::MCContext(
1288 llvm::Triple(triple), *asm_info_up, *reg_info_up, *subtarget_info_up));
1292 std::unique_ptr<llvm::MCDisassembler> disasm_up(
1293 curr_target->createMCDisassembler(*subtarget_info_up, *context_up));
1297 std::unique_ptr<llvm::MCRelocationInfo> rel_info_up(
1298 curr_target->createMCRelocationInfo(triple, *context_up));
1302 std::unique_ptr<llvm::MCSymbolizer> symbolizer_up(
1303 curr_target->createMCSymbolizer(
1305 context_up.get(), std::move(rel_info_up)));
1306 disasm_up->setSymbolizer(std::move(symbolizer_up));
1308 unsigned asm_printer_variant =
1309 flavor == ~0U ? asm_info_up->getAssemblerDialect() : flavor;
1311 std::unique_ptr<llvm::MCInstPrinter> instr_printer_up(
1312 curr_target->createMCInstPrinter(llvm::Triple{triple},
1313 asm_printer_variant, *asm_info_up,
1314 *instr_info_up, *reg_info_up));
1315 if (!instr_printer_up)
1318 instr_printer_up->setPrintBranchImmAsAddress(
true);
1321 std::unique_ptr<llvm::MCInstrAnalysis> instr_analysis_up(
1322 curr_target->createMCInstrAnalysis(instr_info_up.get()));
1325 std::move(instr_info_up), std::move(reg_info_up),
1326 std::move(subtarget_info_up), MCOptions, std::move(asm_info_up),
1327 std::move(context_up), std::move(disasm_up), std::move(instr_printer_up),
1328 std::move(instr_analysis_up)));
1332 std::unique_ptr<llvm::MCInstrInfo> &&instr_info_up,
1333 std::unique_ptr<llvm::MCRegisterInfo> &®_info_up,
1334 std::unique_ptr<llvm::MCSubtargetInfo> &&subtarget_info_up,
1335 llvm::MCTargetOptions mc_options,
1336 std::unique_ptr<llvm::MCAsmInfo> &&asm_info_up,
1337 std::unique_ptr<llvm::MCContext> &&context_up,
1338 std::unique_ptr<llvm::MCDisassembler> &&disasm_up,
1339 std::unique_ptr<llvm::MCInstPrinter> &&instr_printer_up,
1340 std::unique_ptr<llvm::MCInstrAnalysis> &&instr_analysis_up)
1353 size_t opcode_data_len,
1355 llvm::MCInst &mc_inst,
1356 uint64_t &size)
const {
1357 llvm::ArrayRef<uint8_t> data(opcode_data, opcode_data_len);
1358 llvm::MCDisassembler::DecodeStatus status;
1360 status =
m_disasm_up->getInstruction(mc_inst, size, data,
pc, llvm::nulls());
1361 if (status == llvm::MCDisassembler::Success)
1368 llvm::MCInst &mc_inst,
lldb::addr_t pc, std::string &inst_string,
1369 std::string &comments_string) {
1370 llvm::raw_string_ostream inst_stream(inst_string);
1371 llvm::raw_string_ostream comments_stream(comments_string);
1379 static std::string g_newlines(
"\r\n");
1381 for (
size_t newline_pos = 0;
1382 (newline_pos = comments_string.find_first_of(g_newlines, newline_pos)) !=
1383 comments_string.npos;
1385 comments_string.replace(comments_string.begin() + newline_pos,
1386 comments_string.begin() + newline_pos + 1, 1,
' ');
1393 switch (hex_style) {
1412 llvm::MCInst &mc_inst)
const {
1420 llvm::MCInst &mc_inst)
const {
1435 llvm::MCInst &mc_inst)
const {
1440 llvm::MCInst &mc_inst)
const {
1446 bool IsBrkC47x =
false;
1447 if (InstrDesc.isTrap() && mc_inst.getNumOperands() == 1) {
1448 const llvm::MCOperand &Op0 = mc_inst.getOperand(0);
1449 if (Op0.isImm() && Op0.getImm() >= 0xc470 && Op0.getImm() <= 0xc474)
1453 return InstrDesc.isAuthenticated() || IsBrkC47x;
1457 llvm::StringRef subtarget_features, std::string &user_feature_overrides) {
1459 llvm::SmallVector<std::string, 0> valid_user_flags;
1460 llvm::StringSet<> user_disabled_features;
1462 for (llvm::StringRef flag : llvm::split(user_feature_overrides,
",")) {
1463 bool is_valid =
true;
1469 std::string warning_reason;
1470 llvm::raw_string_ostream ostream(warning_reason);
1476 if (flag.size() < 2) {
1478 ostream <<
"must have a name";
1479 }
else if (std::isdigit(
static_cast<unsigned char>(flag[1]))) {
1481 ostream <<
"name cannot start with a digit";
1482 }
else if (flag.front() !=
'+' && flag.front() !=
'-') {
1484 ostream <<
"must start with '+' or '-'";
1485 }
else if (!std::all_of(flag.begin() + 1, flag.end(), [](
unsigned char c) {
1486 return std::isalnum(c) || c ==
'_' || c ==
'-';
1489 ostream <<
"contains invalid characters";
1492 std::string message =
1493 (
"feature flag '" + flag +
"': " + warning_reason).str();
1497 valid_user_flags.push_back(flag.str());
1499 if (flag.starts_with(
'-'))
1500 user_disabled_features.insert(flag.substr(1));
1504 llvm::SmallVector<std::string, 0> final_features;
1507 if (!subtarget_features.empty()) {
1508 for (llvm::StringRef flag : llvm::split(subtarget_features,
",")) {
1516 bool add_flag =
true;
1517 if (flag.size() >= 2 && flag.starts_with(
'+')) {
1518 llvm::StringRef feature_name = flag.substr(1);
1519 if (user_disabled_features.count(feature_name))
1523 final_features.push_back(flag.str());
1528 final_features.insert(final_features.end(), valid_user_flags.begin(),
1529 valid_user_flags.end());
1530 user_feature_overrides = llvm::join(final_features,
",");
1534 const char *flavor_string,
1535 const char *cpu_string,
1536 const char *features_string)
1541 m_flavor.assign(
"default");
1544 const bool cpu_or_features_overriden = cpu_string || features_string;
1545 unsigned flavor = ~0U;
1550 if (triple.getArch() == llvm::Triple::x86 ||
1551 triple.getArch() == llvm::Triple::x86_64) {
1552 if (m_flavor ==
"intel") {
1560 if (triple.getArch() == llvm::Triple::arm) {
1561 std::string thumb_arch_name(thumb_arch.GetTriple().getArchName().str());
1563 if (thumb_arch_name.size() > 3) {
1564 thumb_arch_name.erase(0, 3);
1565 thumb_arch_name.insert(0,
"thumb");
1567 thumb_arch_name =
"thumbv9.3a";
1569 thumb_arch.GetTriple().setArchName(llvm::StringRef(thumb_arch_name));
1577 if (triple.getArch() == llvm::Triple::arm &&
1578 triple.getSubArch() == llvm::Triple::NoSubArch)
1579 triple.setArchName(
"armv9.3a");
1581 std::string features_str =
1582 features_string ? std::string(features_string) :
"";
1583 const char *triple_str = triple.getTriple().c_str();
1586 if (arch.IsAlwaysThumbInstructions()) {
1587 triple_str = thumb_arch.GetTriple().getTriple().c_str();
1588 if (!features_string)
1589 features_str +=
"+fp-armv8,";
1592 const char *cpu = cpu_string;
1594 if (!cpu_or_features_overriden) {
1595 switch (arch.GetCore()) {
1642 if (arch.IsMIPS() && !cpu_or_features_overriden) {
1643 uint32_t arch_flags = arch.GetFlags();
1645 features_str +=
"+msa,";
1647 features_str +=
"+dsp,";
1649 features_str +=
"+dspr2,";
1654 if (triple.isAArch64() && !cpu_or_features_overriden) {
1655 features_str +=
"+all,";
1656 if (triple.getVendor() == llvm::Triple::Apple)
1657 cpu =
"apple-latest";
1660 if (triple.isRISCV()) {
1661 auto subtarget_features = arch.GetSubtargetFeatures().getString();
1662 if (!cpu_or_features_overriden) {
1663 if (!subtarget_features.empty()) {
1664 features_str += subtarget_features;
1666 uint32_t arch_flags = arch.GetFlags();
1668 features_str +=
"+c,";
1670 features_str +=
"+e,";
1673 features_str +=
"+f,";
1676 features_str +=
"+f,+d,";
1679 features_str +=
"+f,+d,+q,";
1682 features_str +=
"+a,+m,";
1686 UpdateSubtargetFeatures(subtarget_features, features_str);
1693 m_disasm_up = MCDisasmInstance::Create(triple_str, cpu, features_str.c_str(),
1696 llvm::Triple::ArchType llvm_arch = triple.getArch();
1700 if (llvm_arch == llvm::Triple::arm) {
1701 std::string thumb_triple(thumb_arch.GetTriple().getTriple());
1702 m_alternate_disasm_up = MCDisasmInstance::Create(
1703 thumb_triple.c_str(),
"", features_str.c_str(), flavor, *
this);
1704 if (!m_alternate_disasm_up)
1705 m_disasm_up.reset();
1707 }
else if (arch.IsMIPS()) {
1709 uint32_t arch_flags = arch.GetFlags();
1711 features_str +=
"+mips16,";
1713 features_str +=
"+micromips,";
1715 m_alternate_disasm_up = MCDisasmInstance::Create(
1716 triple_str, cpu, features_str.c_str(), flavor, *
this);
1717 if (!m_alternate_disasm_up)
1718 m_disasm_up.reset();
1727 const char *features) {
1728 if (arch.
GetTriple().getArch() != llvm::Triple::UnknownArch) {
1730 std::make_shared<DisassemblerLLVMC>(arch, flavor, cpu, features);
1731 if (disasm_sp && disasm_sp->IsValid())
1740 size_t num_instructions,
1741 bool append,
bool data_from_file) {
1749 uint32_t data_cursor = data_offset;
1751 uint32_t instructions_parsed = 0;
1754 while (data_cursor < data_byte_size &&
1755 instructions_parsed < num_instructions) {
1768 uint32_t inst_size = inst_sp->Decode(*
this, data, data_cursor);
1774 data_cursor += inst_size;
1775 inst_addr.
Slide(inst_size);
1776 instructions_parsed++;
1779 return data_cursor - data_offset;
1784 "Disassembler that uses LLVM MC to disassemble "
1785 "i386, x86_64, ARM, and ARM64.",
1788 llvm::InitializeAllTargetInfos();
1789 llvm::InitializeAllTargetMCs();
1790 llvm::InitializeAllAsmParsers();
1791 llvm::InitializeAllDisassemblers();
1799 uint64_t offset, uint64_t size,
1800 int tag_type,
void *tag_bug) {
1802 ->
OpInfo(
pc, offset, size, tag_type, tag_bug);
1807 uint64_t *type, uint64_t
pc,
1808 const char **name) {
1816 if (flavor ==
nullptr || strcmp(flavor,
"default") == 0)
1819 if (triple.getArch() == llvm::Triple::x86 ||
1820 triple.getArch() == llvm::Triple::x86_64) {
1821 return strcmp(flavor,
"intel") == 0 || strcmp(flavor,
"att") == 0;
1829 int tag_type,
void *tag_bug) {
1834 memset(tag_bug, 0,
sizeof(::LLVMOpInfo1));
1841 uint64_t
pc,
const char **name) {
1851 if (*type_ptr == LLVMDisassembler_ReferenceType_In_ARM64_ADRP) {
1855 *type_ptr = LLVMDisassembler_ReferenceType_InOut_None;
1862 if (*type_ptr == LLVMDisassembler_ReferenceType_In_ARM64_ADDXri &&
1865 uint32_t addxri_inst;
1866 uint64_t adrp_imm, addxri_imm;
1872 if (adrp_imm & (1ULL << 20))
1873 adrp_imm |= ~((1ULL << 21) - 1);
1875 addxri_inst = value;
1876 addxri_imm = (addxri_inst >> 10) & 0xfff;
1879 if ((addxri_inst >> (12 + 5 + 5)) & 1)
1881 value = (
m_adrp_address & 0xfffffffffffff000LL) + (adrp_imm << 12) +
1888 if (
m_inst->UsingFileAddress()) {
1891 module_sp->ResolveFileAddress(value, value_so_addr);
1892 module_sp->ResolveFileAddress(
pc, pc_so_addr);
1900 const SymbolContextItem resolve_scope =
1901 eSymbolContextFunction | eSymbolContextSymbol;
1903 pc_so_addr.
GetModule()->ResolveSymbolContextForAddress(
1904 pc_so_addr, resolve_scope, sym_ctx);
1910 bool format_omitting_current_func_name =
false;
1913 for (uint32_t idx = 0;
1917 format_omitting_current_func_name =
true;
1927 if (format_omitting_current_func_name) {
1941 std::string str = std::string(ss.
GetString());
1942 size_t first_eol_char = str.find_first_of(
"\r\n");
1943 if (first_eol_char != std::string::npos) {
1944 str.erase(first_eol_char);
1946 m_inst->AppendComment(str);
1958 *type_ptr = LLVMDisassembler_ReferenceType_InOut_None;
#define LLDB_PLUGIN_DEFINE(PluginName)
bool HasDelaySlot(llvm::MCInst &mc_inst) const
llvm::MCTargetOptions m_mc_options
MCDisasmInstance(std::unique_ptr< llvm::MCInstrInfo > &&instr_info_up, std::unique_ptr< llvm::MCRegisterInfo > &®_info_up, std::unique_ptr< llvm::MCSubtargetInfo > &&subtarget_info_up, llvm::MCTargetOptions mc_options, std::unique_ptr< llvm::MCAsmInfo > &&asm_info_up, std::unique_ptr< llvm::MCContext > &&context_up, std::unique_ptr< llvm::MCDisassembler > &&disasm_up, std::unique_ptr< llvm::MCInstPrinter > &&instr_printer_up, std::unique_ptr< llvm::MCInstrAnalysis > &&instr_analysis_up)
~MCDisasmInstance()=default
bool IsAuthenticated(llvm::MCInst &mc_inst) const
std::unique_ptr< llvm::MCInstrInfo > m_instr_info_up
std::unique_ptr< llvm::MCRegisterInfo > m_reg_info_up
bool CanBranch(llvm::MCInst &mc_inst) const
std::unique_ptr< llvm::MCContext > m_context_up
std::unique_ptr< llvm::MCAsmInfo > m_asm_info_up
void PrintMCInst(llvm::MCInst &mc_inst, lldb::addr_t pc, std::string &inst_string, std::string &comments_string)
bool IsBarrier(llvm::MCInst &mc_inst) const
void SetStyle(bool use_hex_immed, HexImmediateStyle hex_style)
static std::unique_ptr< MCDisasmInstance > Create(const char *triple, const char *cpu, const char *features_str, unsigned flavor, DisassemblerLLVMC &owner)
bool GetMCInst(const uint8_t *opcode_data, size_t opcode_data_len, lldb::addr_t pc, llvm::MCInst &mc_inst, uint64_t &size) const
bool IsLoad(llvm::MCInst &mc_inst) const
bool IsCall(llvm::MCInst &mc_inst) const
std::unique_ptr< llvm::MCSubtargetInfo > m_subtarget_info_up
std::unique_ptr< llvm::MCInstrAnalysis > m_instr_analysis_up
std::unique_ptr< llvm::MCDisassembler > m_disasm_up
std::unique_ptr< llvm::MCInstPrinter > m_instr_printer_up
void SetUseColor(bool use_color)
std::optional< uint32_t > m_adrp_insn
DisassemblerLLVMC(const lldb_private::ArchSpec &arch, const char *flavor, const char *cpu, const char *features)
static const char * SymbolLookupCallback(void *DisInfo, uint64_t ReferenceValue, uint64_t *ReferenceType, uint64_t ReferencePC, const char **ReferenceName)
static void UpdateSubtargetFeatures(llvm::StringRef subtarget_features, std::string &user_feature_overrides)
This function merges the user overwrite features (provided via -Y option) with the subtarget features...
int OpInfo(uint64_t PC, uint64_t Offset, uint64_t Size, int TagType, void *TagBug)
const lldb_private::ExecutionContext * m_exe_ctx
const char * SymbolLookup(uint64_t ReferenceValue, uint64_t *ReferenceType, uint64_t ReferencePC, const char **ReferenceName)
std::unique_ptr< MCDisasmInstance > m_disasm_up
static llvm::StringRef GetPluginNameStatic()
friend class InstructionLLVMC
static int OpInfoCallback(void *DisInfo, uint64_t PC, uint64_t Offset, uint64_t Size, int TagType, void *TagBug)
static lldb::DisassemblerSP CreateInstance(const lldb_private::ArchSpec &arch, const char *flavor, const char *cpu, const char *features)
lldb::addr_t m_adrp_address
bool FlavorValidForArchSpec(const lldb_private::ArchSpec &arch, const char *flavor) override
~DisassemblerLLVMC() override
std::unique_ptr< MCDisasmInstance > m_alternate_disasm_up
InstructionLLVMC * m_inst
size_t DecodeInstructions(const lldb_private::Address &base_addr, const lldb_private::DataExtractor &data, lldb::offset_t data_offset, size_t num_instructions, bool append, bool data_from_file) override
Grants exclusive access to the disassembler and initializes it with the given InstructionLLVMC and an...
std::shared_ptr< DisassemblerLLVMC > m_disasm
DisassemblerScope(InstructionLLVMC &i, const lldb_private::ExecutionContext *exe_ctx=nullptr)
std::shared_ptr< DisassemblerLLVMC > operator->()
static std::pair< Operand, llvm::StringRef::const_iterator > ParseIntelIndexedAccess(llvm::StringRef::const_iterator osi, llvm::StringRef::const_iterator ose)
bool DoesBranch() override
DisassemblerLLVMC::MCDisasmInstance * GetDisasmToUse(bool &is_alternate_isa)
static void DumpOperand(const Operand &op, Stream &s)
size_t GetByteSize() const
static llvm::StringRef::const_iterator ConsumeWhitespace(llvm::StringRef::const_iterator osi, llvm::StringRef::const_iterator ose)
std::weak_ptr< DisassemblerLLVMC > m_disasm_wp
void CalculateMnemonicOperandsAndComment(const lldb_private::ExecutionContext *exe_ctx) override
bool m_has_visited_instruction
static std::pair< Operand, llvm::StringRef::const_iterator > ParseARMOffsetAccess(llvm::StringRef::const_iterator osi, llvm::StringRef::const_iterator ose)
DisassemblerLLVMC::MCDisasmInstance * GetDisasmToUse(bool &is_alternate_isa, DisassemblerScope &disasm)
void AppendComment(std::string &description)
bool UsingFileAddress() const
bool IsAuthenticated() override
static std::pair< Operand, llvm::StringRef::const_iterator > ParseIntelDerefAccess(llvm::StringRef::const_iterator osi, llvm::StringRef::const_iterator ose)
static std::pair< bool, llvm::StringRef::const_iterator > ConsumeChar(llvm::StringRef::const_iterator osi, const char c, llvm::StringRef::const_iterator ose)
size_t Decode(const lldb_private::Disassembler &disassembler, const lldb_private::DataExtractor &data, lldb::offset_t data_offset) override
bool ParseOperands(llvm::SmallVectorImpl< Instruction::Operand > &operands) override
bool IsBarrier() override
bool HasDelaySlot() override
static std::pair< Operand, llvm::StringRef::const_iterator > ParseARMDerefAccess(llvm::StringRef::const_iterator osi, llvm::StringRef::const_iterator ose)
static std::pair< Operand, llvm::StringRef::const_iterator > ParseRegisterName(llvm::StringRef::const_iterator osi, llvm::StringRef::const_iterator ose)
~InstructionLLVMC() override=default
lldb::InstructionControlFlowKind GetControlFlowKind(const lldb_private::ExecutionContext *exe_ctx) override
InstructionLLVMC(DisassemblerLLVMC &disasm, const lldb_private::Address &address, AddressClass addr_class)
static std::pair< Operand, llvm::StringRef::const_iterator > ParseImmediate(llvm::StringRef::const_iterator osi, llvm::StringRef::const_iterator ose)
A section + offset based address range class.
bool ContainsLoadAddress(const Address &so_addr, Target *target) const
Check if a section offset so_addr when represented as a load address is contained within this object'...
A section + offset based address class.
lldb::SectionSP GetSection() const
Get const accessor for the section.
@ DumpStyleSectionNameOffset
Display as the section name + offset.
@ DumpStyleNoFunctionName
Elide the function name; display an offset into the current function.
@ DumpStyleResolvedDescriptionNoFunctionArguments
bool Slide(int64_t offset)
bool Dump(Stream *s, ExecutionContextScope *exe_scope, DumpStyle style, DumpStyle fallback_style=DumpStyleInvalid, uint32_t addr_byte_size=UINT32_MAX, bool all_ranges=false, std::optional< Stream::HighlightSettings > settings=std::nullopt) const
Dump a description of this object to a Stream.
lldb::ModuleSP GetModule() const
Get accessor for the module for this address.
bool IsValid() const
Check if the object state is valid.
AddressClass GetAddressClass() const
An architecture specification class.
llvm::Triple & GetTriple()
Architecture triple accessor.
uint32_t GetMinimumOpcodeByteSize() const
llvm::Triple::ArchType GetMachine() const
Returns a machine family for the current architecture.
@ eRISCV_float_abi_double
single precision floating point, +f
@ eRISCV_float_abi_quad
double precision floating point, +d
@ eRISCV_float_abi_single
soft float
uint32_t GetMaximumOpcodeByteSize() const
A uniqued constant string class.
llvm::StringRef GetStringRef() const
Get the string value as a llvm::StringRef.
static void ReportWarning(std::string message, std::optional< lldb::user_id_t > debugger_id=std::nullopt, std::once_flag *once=nullptr)
Report warning events.
InstructionList m_instruction_list
Disassembler(const ArchSpec &arch, const char *flavor)
"lldb/Target/ExecutionContext.h" A class that contains an execution context.
Target * GetTargetPtr() const
Returns a pointer to the target object.
Instruction(const Address &address, AddressClass addr_class=AddressClass::eInvalid)
std::string m_markup_mnemonics
const char * GetOperands(const ExecutionContext *exe_ctx, bool markup=false)
std::string m_opcode_name
std::string m_markup_opcode_name
AddressClass GetAddressClass()
uint32_t GetByteSize() const
const void * GetOpcodeBytes() const
static bool RegisterPlugin(llvm::StringRef name, llvm::StringRef description, ABICreateInstance create_callback)
static bool UnregisterPlugin(ABICreateInstance create_callback)
bool Execute(llvm::StringRef string, llvm::SmallVectorImpl< llvm::StringRef > *matches=nullptr) const
Execute a regular expression match using the compiled regular expression that is already in this obje...
llvm::StringRef GetString() const
A stream class that can stream formatted output to a file.
size_t Printf(const char *format,...) __attribute__((format(printf
Output printf formatted output to the stream.
size_t PutCString(llvm::StringRef cstr)
Output a C string to the stream.
Defines a symbol context baton that can be handed other debug core functions.
Function * function
The Function for a given query.
bool GetAddressRange(uint32_t scope, uint32_t range_idx, bool use_inline_block_range, AddressRange &range) const
Get the address range contained within a symbol context.
Symbol * symbol
The Symbol for a given query.
bool GetUseHexImmediates() const
Disassembler::HexImmediateStyle GetHexImmediateStyle() const
bool ResolveLoadAddress(lldb::addr_t load_addr, Address &so_addr, uint32_t stop_id=SectionLoadHistory::eStopIDNow, bool allow_section_end=false)
const ArchSpec & GetArchitecture() const
#define LLDB_INVALID_ADDRESS
A class that represents a running process on the host machine.
Log * GetLog(Cat mask)
Retrieve the Log object for the channel associated with the given log enum.
std::shared_ptr< lldb_private::Instruction > InstructionSP
std::shared_ptr< lldb_private::Disassembler > DisassemblerSP
ByteOrder
Byte ordering definitions.
InstructionControlFlowKind
Architecture-agnostic categorization of instructions for traversing the control flow of a trace.
@ eInstructionControlFlowKindReturn
The instruction is a near (function) return.
@ eInstructionControlFlowKindFarJump
The instruction is a jump-like far transfer. E.g. FAR JMP.
@ eInstructionControlFlowKindOther
The instruction is something not listed below, i.e.
@ eInstructionControlFlowKindFarCall
The instruction is a call-like far transfer.
@ eInstructionControlFlowKindFarReturn
The instruction is a return-like far transfer.
@ eInstructionControlFlowKindUnknown
The instruction could not be classified.
@ eInstructionControlFlowKindJump
The instruction is a near unconditional jump.
@ eInstructionControlFlowKindCall
The instruction is a near (function) call.
@ eInstructionControlFlowKindCondJump
The instruction is a near conditional jump.
std::shared_ptr< lldb_private::Module > ModuleSP
std::optional< InstructionOpcodeAndModrm > InstructionLengthDecode(const uint8_t *inst_bytes, int bytes_len, bool is_exec_mode_64b)
Decode an instruction into opcode, modrm and opcode_len.
lldb::InstructionControlFlowKind GetControlFlowKind(bool is_exec_mode_64b, Opcode m_opcode)
lldb::InstructionControlFlowKind MapOpcodeIntoControlFlowKind(InstructionOpcodeAndModrm opcode_and_modrm)
Determine the InstructionControlFlowKind based on opcode and modrm bytes.
enum lldb_private::Instruction::Operand::Type m_type
std::vector< Operand > m_children
These are the three values deciding instruction control flow kind.