123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519 |
- //===-- DWARFExpression.cpp -----------------------------------------------===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- #include "llvm/DebugInfo/DWARF/DWARFExpression.h"
- #include "llvm/DebugInfo/DWARF/DWARFUnit.h"
- #include "llvm/MC/MCRegisterInfo.h"
- #include "llvm/Support/Format.h"
- #include <cassert>
- #include <cstdint>
- #include <vector>
- using namespace llvm;
- using namespace dwarf;
- namespace llvm {
- typedef std::vector<DWARFExpression::Operation::Description> DescVector;
- static DescVector getDescriptions() {
- DescVector Descriptions;
- typedef DWARFExpression::Operation Op;
- typedef Op::Description Desc;
- Descriptions.resize(0xff);
- Descriptions[DW_OP_addr] = Desc(Op::Dwarf2, Op::SizeAddr);
- Descriptions[DW_OP_deref] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_const1u] = Desc(Op::Dwarf2, Op::Size1);
- Descriptions[DW_OP_const1s] = Desc(Op::Dwarf2, Op::SignedSize1);
- Descriptions[DW_OP_const2u] = Desc(Op::Dwarf2, Op::Size2);
- Descriptions[DW_OP_const2s] = Desc(Op::Dwarf2, Op::SignedSize2);
- Descriptions[DW_OP_const4u] = Desc(Op::Dwarf2, Op::Size4);
- Descriptions[DW_OP_const4s] = Desc(Op::Dwarf2, Op::SignedSize4);
- Descriptions[DW_OP_const8u] = Desc(Op::Dwarf2, Op::Size8);
- Descriptions[DW_OP_const8s] = Desc(Op::Dwarf2, Op::SignedSize8);
- Descriptions[DW_OP_constu] = Desc(Op::Dwarf2, Op::SizeLEB);
- Descriptions[DW_OP_consts] = Desc(Op::Dwarf2, Op::SignedSizeLEB);
- Descriptions[DW_OP_dup] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_drop] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_over] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_pick] = Desc(Op::Dwarf2, Op::Size1);
- Descriptions[DW_OP_swap] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_rot] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_xderef] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_abs] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_and] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_div] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_minus] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_mod] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_mul] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_neg] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_not] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_or] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_plus] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_plus_uconst] = Desc(Op::Dwarf2, Op::SizeLEB);
- Descriptions[DW_OP_shl] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_shr] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_shra] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_xor] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_skip] = Desc(Op::Dwarf2, Op::SignedSize2);
- Descriptions[DW_OP_bra] = Desc(Op::Dwarf2, Op::SignedSize2);
- Descriptions[DW_OP_eq] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_ge] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_gt] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_le] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_lt] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_ne] = Desc(Op::Dwarf2);
- for (uint16_t LA = DW_OP_lit0; LA <= DW_OP_lit31; ++LA)
- Descriptions[LA] = Desc(Op::Dwarf2);
- for (uint16_t LA = DW_OP_reg0; LA <= DW_OP_reg31; ++LA)
- Descriptions[LA] = Desc(Op::Dwarf2);
- for (uint16_t LA = DW_OP_breg0; LA <= DW_OP_breg31; ++LA)
- Descriptions[LA] = Desc(Op::Dwarf2, Op::SignedSizeLEB);
- Descriptions[DW_OP_regx] = Desc(Op::Dwarf2, Op::SizeLEB);
- Descriptions[DW_OP_fbreg] = Desc(Op::Dwarf2, Op::SignedSizeLEB);
- Descriptions[DW_OP_bregx] = Desc(Op::Dwarf2, Op::SizeLEB, Op::SignedSizeLEB);
- Descriptions[DW_OP_piece] = Desc(Op::Dwarf2, Op::SizeLEB);
- Descriptions[DW_OP_deref_size] = Desc(Op::Dwarf2, Op::Size1);
- Descriptions[DW_OP_xderef_size] = Desc(Op::Dwarf2, Op::Size1);
- Descriptions[DW_OP_nop] = Desc(Op::Dwarf2);
- Descriptions[DW_OP_push_object_address] = Desc(Op::Dwarf3);
- Descriptions[DW_OP_call2] = Desc(Op::Dwarf3, Op::Size2);
- Descriptions[DW_OP_call4] = Desc(Op::Dwarf3, Op::Size4);
- Descriptions[DW_OP_call_ref] = Desc(Op::Dwarf3, Op::SizeRefAddr);
- Descriptions[DW_OP_form_tls_address] = Desc(Op::Dwarf3);
- Descriptions[DW_OP_call_frame_cfa] = Desc(Op::Dwarf3);
- Descriptions[DW_OP_bit_piece] = Desc(Op::Dwarf3, Op::SizeLEB, Op::SizeLEB);
- Descriptions[DW_OP_implicit_value] =
- Desc(Op::Dwarf3, Op::SizeLEB, Op::SizeBlock);
- Descriptions[DW_OP_stack_value] = Desc(Op::Dwarf3);
- Descriptions[DW_OP_WASM_location] =
- Desc(Op::Dwarf4, Op::SizeLEB, Op::WasmLocationArg);
- Descriptions[DW_OP_GNU_push_tls_address] = Desc(Op::Dwarf3);
- Descriptions[DW_OP_addrx] = Desc(Op::Dwarf4, Op::SizeLEB);
- Descriptions[DW_OP_GNU_addr_index] = Desc(Op::Dwarf4, Op::SizeLEB);
- Descriptions[DW_OP_GNU_const_index] = Desc(Op::Dwarf4, Op::SizeLEB);
- Descriptions[DW_OP_GNU_entry_value] = Desc(Op::Dwarf4, Op::SizeLEB);
- Descriptions[DW_OP_convert] = Desc(Op::Dwarf5, Op::BaseTypeRef);
- Descriptions[DW_OP_entry_value] = Desc(Op::Dwarf5, Op::SizeLEB);
- Descriptions[DW_OP_regval_type] =
- Desc(Op::Dwarf5, Op::SizeLEB, Op::BaseTypeRef);
- return Descriptions;
- }
- static DWARFExpression::Operation::Description getOpDesc(unsigned OpCode) {
- // FIXME: Make this constexpr once all compilers are smart enough to do it.
- static DescVector Descriptions = getDescriptions();
- // Handle possible corrupted or unsupported operation.
- if (OpCode >= Descriptions.size())
- return {};
- return Descriptions[OpCode];
- }
- bool DWARFExpression::Operation::extract(DataExtractor Data,
- uint8_t AddressSize, uint64_t Offset,
- Optional<DwarfFormat> Format) {
- EndOffset = Offset;
- Opcode = Data.getU8(&Offset);
- Desc = getOpDesc(Opcode);
- if (Desc.Version == Operation::DwarfNA)
- return false;
- for (unsigned Operand = 0; Operand < 2; ++Operand) {
- unsigned Size = Desc.Op[Operand];
- unsigned Signed = Size & Operation::SignBit;
- if (Size == Operation::SizeNA)
- break;
- switch (Size & ~Operation::SignBit) {
- case Operation::Size1:
- Operands[Operand] = Data.getU8(&Offset);
- if (Signed)
- Operands[Operand] = (int8_t)Operands[Operand];
- break;
- case Operation::Size2:
- Operands[Operand] = Data.getU16(&Offset);
- if (Signed)
- Operands[Operand] = (int16_t)Operands[Operand];
- break;
- case Operation::Size4:
- Operands[Operand] = Data.getU32(&Offset);
- if (Signed)
- Operands[Operand] = (int32_t)Operands[Operand];
- break;
- case Operation::Size8:
- Operands[Operand] = Data.getU64(&Offset);
- break;
- case Operation::SizeAddr:
- Operands[Operand] = Data.getUnsigned(&Offset, AddressSize);
- break;
- case Operation::SizeRefAddr:
- if (!Format)
- return false;
- Operands[Operand] =
- Data.getUnsigned(&Offset, dwarf::getDwarfOffsetByteSize(*Format));
- break;
- case Operation::SizeLEB:
- if (Signed)
- Operands[Operand] = Data.getSLEB128(&Offset);
- else
- Operands[Operand] = Data.getULEB128(&Offset);
- break;
- case Operation::BaseTypeRef:
- Operands[Operand] = Data.getULEB128(&Offset);
- break;
- case Operation::WasmLocationArg:
- assert(Operand == 1);
- switch (Operands[0]) {
- case 0:
- case 1:
- case 2:
- case 4:
- Operands[Operand] = Data.getULEB128(&Offset);
- break;
- case 3: // global as uint32
- Operands[Operand] = Data.getU32(&Offset);
- break;
- default:
- return false; // Unknown Wasm location
- }
- break;
- case Operation::SizeBlock:
- // We need a size, so this cannot be the first operand
- if (Operand == 0)
- return false;
- // Store the offset of the block as the value.
- Operands[Operand] = Offset;
- Offset += Operands[Operand - 1];
- break;
- default:
- llvm_unreachable("Unknown DWARFExpression Op size");
- }
- OperandEndOffsets[Operand] = Offset;
- }
- EndOffset = Offset;
- return true;
- }
- static void prettyPrintBaseTypeRef(DWARFUnit *U, raw_ostream &OS,
- DIDumpOptions DumpOpts,
- const uint64_t Operands[2],
- unsigned Operand) {
- assert(Operand < 2 && "operand out of bounds");
- auto Die = U->getDIEForOffset(U->getOffset() + Operands[Operand]);
- if (Die && Die.getTag() == dwarf::DW_TAG_base_type) {
- OS << " (";
- if (DumpOpts.Verbose)
- OS << format("0x%08" PRIx64 " -> ", Operands[Operand]);
- OS << format("0x%08" PRIx64 ")", U->getOffset() + Operands[Operand]);
- if (auto Name = dwarf::toString(Die.find(dwarf::DW_AT_name)))
- OS << " \"" << *Name << "\"";
- } else {
- OS << format(" <invalid base_type ref: 0x%" PRIx64 ">",
- Operands[Operand]);
- }
- }
- static bool prettyPrintRegisterOp(DWARFUnit *U, raw_ostream &OS,
- DIDumpOptions DumpOpts, uint8_t Opcode,
- const uint64_t Operands[2],
- const MCRegisterInfo *MRI, bool isEH) {
- if (!MRI)
- return false;
- uint64_t DwarfRegNum;
- unsigned OpNum = 0;
- if (Opcode == DW_OP_bregx || Opcode == DW_OP_regx ||
- Opcode == DW_OP_regval_type)
- DwarfRegNum = Operands[OpNum++];
- else if (Opcode >= DW_OP_breg0 && Opcode < DW_OP_bregx)
- DwarfRegNum = Opcode - DW_OP_breg0;
- else
- DwarfRegNum = Opcode - DW_OP_reg0;
- if (Optional<unsigned> LLVMRegNum = MRI->getLLVMRegNum(DwarfRegNum, isEH)) {
- if (const char *RegName = MRI->getName(*LLVMRegNum)) {
- if ((Opcode >= DW_OP_breg0 && Opcode <= DW_OP_breg31) ||
- Opcode == DW_OP_bregx)
- OS << format(" %s%+" PRId64, RegName, Operands[OpNum]);
- else
- OS << ' ' << RegName;
- if (Opcode == DW_OP_regval_type)
- prettyPrintBaseTypeRef(U, OS, DumpOpts, Operands, 1);
- return true;
- }
- }
- return false;
- }
- bool DWARFExpression::Operation::print(raw_ostream &OS, DIDumpOptions DumpOpts,
- const DWARFExpression *Expr,
- const MCRegisterInfo *RegInfo,
- DWARFUnit *U, bool isEH) const {
- if (Error) {
- OS << "<decoding error>";
- return false;
- }
- StringRef Name = OperationEncodingString(Opcode);
- assert(!Name.empty() && "DW_OP has no name!");
- OS << Name;
- if ((Opcode >= DW_OP_breg0 && Opcode <= DW_OP_breg31) ||
- (Opcode >= DW_OP_reg0 && Opcode <= DW_OP_reg31) ||
- Opcode == DW_OP_bregx || Opcode == DW_OP_regx ||
- Opcode == DW_OP_regval_type)
- if (prettyPrintRegisterOp(U, OS, DumpOpts, Opcode, Operands, RegInfo, isEH))
- return true;
- for (unsigned Operand = 0; Operand < 2; ++Operand) {
- unsigned Size = Desc.Op[Operand];
- unsigned Signed = Size & Operation::SignBit;
- if (Size == Operation::SizeNA)
- break;
- if (Size == Operation::BaseTypeRef && U) {
- // For DW_OP_convert the operand may be 0 to indicate that conversion to
- // the generic type should be done. The same holds for DW_OP_reinterpret,
- // which is currently not supported.
- if (Opcode == DW_OP_convert && Operands[Operand] == 0)
- OS << " 0x0";
- else
- prettyPrintBaseTypeRef(U, OS, DumpOpts, Operands, Operand);
- } else if (Size == Operation::WasmLocationArg) {
- assert(Operand == 1);
- switch (Operands[0]) {
- case 0:
- case 1:
- case 2:
- case 3: // global as uint32
- case 4:
- OS << format(" 0x%" PRIx64, Operands[Operand]);
- break;
- default: assert(false);
- }
- } else if (Size == Operation::SizeBlock) {
- uint64_t Offset = Operands[Operand];
- for (unsigned i = 0; i < Operands[Operand - 1]; ++i)
- OS << format(" 0x%02x", Expr->Data.getU8(&Offset));
- } else {
- if (Signed)
- OS << format(" %+" PRId64, (int64_t)Operands[Operand]);
- else if (Opcode != DW_OP_entry_value &&
- Opcode != DW_OP_GNU_entry_value)
- OS << format(" 0x%" PRIx64, Operands[Operand]);
- }
- }
- return true;
- }
- void DWARFExpression::print(raw_ostream &OS, DIDumpOptions DumpOpts,
- const MCRegisterInfo *RegInfo, DWARFUnit *U,
- bool IsEH) const {
- uint32_t EntryValExprSize = 0;
- uint64_t EntryValStartOffset = 0;
- if (Data.getData().empty())
- OS << "<empty>";
- for (auto &Op : *this) {
- if (!Op.print(OS, DumpOpts, this, RegInfo, U, IsEH)) {
- uint64_t FailOffset = Op.getEndOffset();
- while (FailOffset < Data.getData().size())
- OS << format(" %02x", Data.getU8(&FailOffset));
- return;
- }
- if (Op.getCode() == DW_OP_entry_value ||
- Op.getCode() == DW_OP_GNU_entry_value) {
- OS << "(";
- EntryValExprSize = Op.getRawOperand(0);
- EntryValStartOffset = Op.getEndOffset();
- continue;
- }
- if (EntryValExprSize) {
- EntryValExprSize -= Op.getEndOffset() - EntryValStartOffset;
- if (EntryValExprSize == 0)
- OS << ")";
- }
- if (Op.getEndOffset() < Data.getData().size())
- OS << ", ";
- }
- }
- bool DWARFExpression::Operation::verify(const Operation &Op, DWARFUnit *U) {
- for (unsigned Operand = 0; Operand < 2; ++Operand) {
- unsigned Size = Op.Desc.Op[Operand];
- if (Size == Operation::SizeNA)
- break;
- if (Size == Operation::BaseTypeRef) {
- // For DW_OP_convert the operand may be 0 to indicate that conversion to
- // the generic type should be done, so don't look up a base type in that
- // case. The same holds for DW_OP_reinterpret, which is currently not
- // supported.
- if (Op.Opcode == DW_OP_convert && Op.Operands[Operand] == 0)
- continue;
- auto Die = U->getDIEForOffset(U->getOffset() + Op.Operands[Operand]);
- if (!Die || Die.getTag() != dwarf::DW_TAG_base_type)
- return false;
- }
- }
- return true;
- }
- bool DWARFExpression::verify(DWARFUnit *U) {
- for (auto &Op : *this)
- if (!Operation::verify(Op, U))
- return false;
- return true;
- }
- /// A user-facing string representation of a DWARF expression. This might be an
- /// Address expression, in which case it will be implicitly dereferenced, or a
- /// Value expression.
- struct PrintedExpr {
- enum ExprKind {
- Address,
- Value,
- };
- ExprKind Kind;
- SmallString<16> String;
- PrintedExpr(ExprKind K = Address) : Kind(K) {}
- };
- static bool printCompactDWARFExpr(raw_ostream &OS, DWARFExpression::iterator I,
- const DWARFExpression::iterator E,
- const MCRegisterInfo &MRI) {
- SmallVector<PrintedExpr, 4> Stack;
- while (I != E) {
- const DWARFExpression::Operation &Op = *I;
- uint8_t Opcode = Op.getCode();
- switch (Opcode) {
- case dwarf::DW_OP_regx: {
- // DW_OP_regx: A register, with the register num given as an operand.
- // Printed as the plain register name.
- uint64_t DwarfRegNum = Op.getRawOperand(0);
- Optional<unsigned> LLVMRegNum = MRI.getLLVMRegNum(DwarfRegNum, false);
- if (!LLVMRegNum) {
- OS << "<unknown register " << DwarfRegNum << ">";
- return false;
- }
- raw_svector_ostream S(Stack.emplace_back(PrintedExpr::Value).String);
- S << MRI.getName(*LLVMRegNum);
- break;
- }
- case dwarf::DW_OP_bregx: {
- int DwarfRegNum = Op.getRawOperand(0);
- int64_t Offset = Op.getRawOperand(1);
- Optional<unsigned> LLVMRegNum = MRI.getLLVMRegNum(DwarfRegNum, false);
- if (!LLVMRegNum) {
- OS << "<unknown register " << DwarfRegNum << ">";
- return false;
- }
- raw_svector_ostream S(Stack.emplace_back().String);
- S << MRI.getName(*LLVMRegNum);
- if (Offset)
- S << format("%+" PRId64, Offset);
- break;
- }
- case dwarf::DW_OP_entry_value:
- case dwarf::DW_OP_GNU_entry_value: {
- // DW_OP_entry_value contains a sub-expression which must be rendered
- // separately.
- uint64_t SubExprLength = Op.getRawOperand(0);
- DWARFExpression::iterator SubExprEnd = I.skipBytes(SubExprLength);
- ++I;
- raw_svector_ostream S(Stack.emplace_back().String);
- S << "entry(";
- printCompactDWARFExpr(S, I, SubExprEnd, MRI);
- S << ")";
- I = SubExprEnd;
- continue;
- }
- case dwarf::DW_OP_stack_value: {
- // The top stack entry should be treated as the actual value of tne
- // variable, rather than the address of the variable in memory.
- assert(!Stack.empty());
- Stack.back().Kind = PrintedExpr::Value;
- break;
- }
- default:
- if (Opcode >= dwarf::DW_OP_reg0 && Opcode <= dwarf::DW_OP_reg31) {
- // DW_OP_reg<N>: A register, with the register num implied by the
- // opcode. Printed as the plain register name.
- uint64_t DwarfRegNum = Opcode - dwarf::DW_OP_reg0;
- Optional<unsigned> LLVMRegNum = MRI.getLLVMRegNum(DwarfRegNum, false);
- if (!LLVMRegNum) {
- OS << "<unknown register " << DwarfRegNum << ">";
- return false;
- }
- raw_svector_ostream S(Stack.emplace_back(PrintedExpr::Value).String);
- S << MRI.getName(*LLVMRegNum);
- } else if (Opcode >= dwarf::DW_OP_breg0 &&
- Opcode <= dwarf::DW_OP_breg31) {
- int DwarfRegNum = Opcode - dwarf::DW_OP_breg0;
- int64_t Offset = Op.getRawOperand(0);
- Optional<unsigned> LLVMRegNum = MRI.getLLVMRegNum(DwarfRegNum, false);
- if (!LLVMRegNum) {
- OS << "<unknown register " << DwarfRegNum << ">";
- return false;
- }
- raw_svector_ostream S(Stack.emplace_back().String);
- S << MRI.getName(*LLVMRegNum);
- if (Offset)
- S << format("%+" PRId64, Offset);
- } else {
- // If we hit an unknown operand, we don't know its effect on the stack,
- // so bail out on the whole expression.
- OS << "<unknown op " << dwarf::OperationEncodingString(Opcode) << " ("
- << (int)Opcode << ")>";
- return false;
- }
- break;
- }
- ++I;
- }
- assert(Stack.size() == 1 && "expected one value on stack");
- if (Stack.front().Kind == PrintedExpr::Address)
- OS << "[" << Stack.front().String << "]";
- else
- OS << Stack.front().String;
- return true;
- }
- bool DWARFExpression::printCompact(raw_ostream &OS, const MCRegisterInfo &MRI) {
- return printCompactDWARFExpr(OS, begin(), end(), MRI);
- }
- bool DWARFExpression::operator==(const DWARFExpression &RHS) const {
- if (AddressSize != RHS.AddressSize || Format != RHS.Format)
- return false;
- return Data.getData() == RHS.Data.getData();
- }
- } // namespace llvm
|