123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222 |
- #pragma once
- #ifdef __GNUC__
- #pragma GCC diagnostic push
- #pragma GCC diagnostic ignored "-Wunused-parameter"
- #endif
- //===- FunctionInfo.h -------------------------------------------*- C++ -*-===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- #ifndef LLVM_DEBUGINFO_GSYM_FUNCTIONINFO_H
- #define LLVM_DEBUGINFO_GSYM_FUNCTIONINFO_H
- #include "llvm/DebugInfo/GSYM/ExtractRanges.h"
- #include "llvm/DebugInfo/GSYM/InlineInfo.h"
- #include "llvm/DebugInfo/GSYM/LineTable.h"
- #include "llvm/DebugInfo/GSYM/LookupResult.h"
- #include "llvm/DebugInfo/GSYM/StringTable.h"
- #include <cstdint>
- #include <tuple>
- namespace llvm {
- class raw_ostream;
- namespace gsym {
- class GsymReader;
- /// Function information in GSYM files encodes information for one contiguous
- /// address range. If a function has discontiguous address ranges, they will
- /// need to be encoded using multiple FunctionInfo objects.
- ///
- /// ENCODING
- ///
- /// The function information gets the function start address as an argument
- /// to the FunctionInfo::decode(...) function. This information is calculated
- /// from the GSYM header and an address offset from the GSYM address offsets
- /// table. The encoded FunctionInfo information must be aligned to a 4 byte
- /// boundary.
- ///
- /// The encoded data for a FunctionInfo starts with fixed data that all
- /// function info objects have:
- ///
- /// ENCODING NAME DESCRIPTION
- /// ========= =========== ====================================================
- /// uint32_t Size The size in bytes of this function.
- /// uint32_t Name The string table offset of the function name.
- ///
- /// The optional data in a FunctionInfo object follows this fixed information
- /// and consists of a stream of tuples that consist of:
- ///
- /// ENCODING NAME DESCRIPTION
- /// ========= =========== ====================================================
- /// uint32_t InfoType An "InfoType" enumeration that describes the type
- /// of optional data that is encoded.
- /// uint32_t InfoLength The size in bytes of the encoded data that
- /// immediately follows this length if this value is
- /// greater than zero.
- /// uint8_t[] InfoData Encoded bytes that represent the data for the
- /// "InfoType". These bytes are only present if
- /// "InfoLength" is greater than zero.
- ///
- /// The "InfoType" is an enumeration:
- ///
- /// enum InfoType {
- /// EndOfList = 0u,
- /// LineTableInfo = 1u,
- /// InlineInfo = 2u
- /// };
- ///
- /// This stream of tuples is terminated by a "InfoType" whose value is
- /// InfoType::EndOfList and a zero for "InfoLength". This signifies the end of
- /// the optional information list. This format allows us to add new optional
- /// information data to a FunctionInfo object over time and allows older
- /// clients to still parse the format and skip over any data that they don't
- /// understand or want to parse.
- ///
- /// So the function information encoding essientially looks like:
- ///
- /// struct {
- /// uint32_t Size;
- /// uint32_t Name;
- /// struct {
- /// uint32_t InfoType;
- /// uint32_t InfoLength;
- /// uint8_t InfoData[InfoLength];
- /// }[N];
- /// }
- ///
- /// Where "N" is the number of tuples.
- struct FunctionInfo {
- AddressRange Range;
- uint32_t Name; ///< String table offset in the string table.
- std::optional<LineTable> OptLineTable;
- std::optional<InlineInfo> Inline;
- FunctionInfo(uint64_t Addr = 0, uint64_t Size = 0, uint32_t N = 0)
- : Range(Addr, Addr + Size), Name(N) {}
- /// Query if a FunctionInfo has rich debug info.
- ///
- /// \returns A bool that indicates if this object has something else than
- /// range and name. When converting information from a symbol table and from
- /// debug info, we might end up with multiple FunctionInfo objects for the
- /// same range and we need to be able to tell which one is the better object
- /// to use.
- bool hasRichInfo() const { return OptLineTable || Inline; }
- /// Query if a FunctionInfo object is valid.
- ///
- /// Address and size can be zero and there can be no line entries for a
- /// symbol so the only indication this entry is valid is if the name is
- /// not zero. This can happen when extracting information from symbol
- /// tables that do not encode symbol sizes. In that case only the
- /// address and name will be filled in.
- ///
- /// \returns A boolean indicating if this FunctionInfo is valid.
- bool isValid() const {
- return Name != 0;
- }
- /// Decode an object from a binary data stream.
- ///
- /// \param Data The binary stream to read the data from. This object must
- /// have the data for the object starting at offset zero. The data
- /// can contain more data than needed.
- ///
- /// \param BaseAddr The FunctionInfo's start address and will be used as the
- /// base address when decoding any contained information like the line table
- /// and the inline info.
- ///
- /// \returns An FunctionInfo or an error describing the issue that was
- /// encountered during decoding.
- static llvm::Expected<FunctionInfo> decode(DataExtractor &Data,
- uint64_t BaseAddr);
- /// Encode this object into FileWriter stream.
- ///
- /// \param O The binary stream to write the data to at the current file
- /// position.
- ///
- /// \returns An error object that indicates failure or the offset of the
- /// function info that was successfully written into the stream.
- llvm::Expected<uint64_t> encode(FileWriter &O) const;
- /// Lookup an address within a FunctionInfo object's data stream.
- ///
- /// Instead of decoding an entire FunctionInfo object when doing lookups,
- /// we can decode only the information we need from the FunctionInfo's data
- /// for the specific address. The lookup result information is returned as
- /// a LookupResult.
- ///
- /// \param Data The binary stream to read the data from. This object must
- /// have the data for the object starting at offset zero. The data
- /// can contain more data than needed.
- ///
- /// \param GR The GSYM reader that contains the string and file table that
- /// will be used to fill in information in the returned result.
- ///
- /// \param FuncAddr The function start address decoded from the GsymReader.
- ///
- /// \param Addr The address to lookup.
- ///
- /// \returns An LookupResult or an error describing the issue that was
- /// encountered during decoding. An error should only be returned if the
- /// address is not contained in the FunctionInfo or if the data is corrupted.
- static llvm::Expected<LookupResult> lookup(DataExtractor &Data,
- const GsymReader &GR,
- uint64_t FuncAddr,
- uint64_t Addr);
- uint64_t startAddress() const { return Range.start(); }
- uint64_t endAddress() const { return Range.end(); }
- uint64_t size() const { return Range.size(); }
- void clear() {
- Range = {0, 0};
- Name = 0;
- OptLineTable = std::nullopt;
- Inline = std::nullopt;
- }
- };
- inline bool operator==(const FunctionInfo &LHS, const FunctionInfo &RHS) {
- return LHS.Range == RHS.Range && LHS.Name == RHS.Name &&
- LHS.OptLineTable == RHS.OptLineTable && LHS.Inline == RHS.Inline;
- }
- inline bool operator!=(const FunctionInfo &LHS, const FunctionInfo &RHS) {
- return !(LHS == RHS);
- }
- /// This sorting will order things consistently by address range first, but then
- /// followed by inlining being valid and line tables. We might end up with a
- /// FunctionInfo from debug info that will have the same range as one from the
- /// symbol table, but we want to quickly be able to sort and use the best version
- /// when creating the final GSYM file.
- inline bool operator<(const FunctionInfo &LHS, const FunctionInfo &RHS) {
- // First sort by address range
- if (LHS.Range != RHS.Range)
- return LHS.Range < RHS.Range;
- // Then sort by inline
- if (LHS.Inline.has_value() != RHS.Inline.has_value())
- return RHS.Inline.has_value();
- return LHS.OptLineTable < RHS.OptLineTable;
- }
- raw_ostream &operator<<(raw_ostream &OS, const FunctionInfo &R);
- } // namespace gsym
- } // namespace llvm
- #endif // LLVM_DEBUGINFO_GSYM_FUNCTIONINFO_H
- #ifdef __GNUC__
- #pragma GCC diagnostic pop
- #endif
|