123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517 |
- #pragma once
- #ifdef __GNUC__
- #pragma GCC diagnostic push
- #pragma GCC diagnostic ignored "-Wunused-parameter"
- #endif
- //===- MCAssembler.h - Object File Generation -------------------*- C++ -*-===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- #ifndef LLVM_MC_MCASSEMBLER_H
- #define LLVM_MC_MCASSEMBLER_H
- #include "llvm/ADT/ArrayRef.h"
- #include "llvm/ADT/SmallPtrSet.h"
- #include "llvm/ADT/StringRef.h"
- #include "llvm/ADT/iterator.h"
- #include "llvm/ADT/iterator_range.h"
- #include "llvm/BinaryFormat/MachO.h"
- #include "llvm/MC/MCDirectives.h"
- #include "llvm/MC/MCDwarf.h"
- #include "llvm/MC/MCLinkerOptimizationHint.h"
- #include "llvm/MC/MCSymbol.h"
- #include "llvm/Support/SMLoc.h"
- #include "llvm/Support/VersionTuple.h"
- #include <algorithm>
- #include <cassert>
- #include <cstddef>
- #include <cstdint>
- #include <memory>
- #include <string>
- #include <tuple>
- #include <utility>
- #include <vector>
- namespace llvm {
- class MCBoundaryAlignFragment; // Forward declarations (through MCValue): below, these types appear only behind pointers, references, std::unique_ptr, or in function signatures.
- class MCCVDefRangeFragment;
- class MCCVInlineLineTableFragment;
- class MCDwarfCallFrameFragment;
- class MCDwarfLineAddrFragment;
- class MCEncodedFragment;
- class MCFixup;
- class MCLEBFragment;
- class MCPseudoProbeAddrFragment;
- class MCRelaxableFragment;
- class MCSymbolRefExpr;
- class raw_ostream;
- class MCAsmBackend;
- class MCAsmLayout;
- class MCContext;
- class MCCodeEmitter;
- class MCFragment;
- class MCObjectWriter;
- class MCSection;
- class MCValue;
- // One entry of MCAssembler's indirect symbol list: a symbol paired with a section. FIXME: This really doesn't belong here. See the FIXME on MCAssembler::getIndirectSymbols().
- struct IndirectSymbolData {
- MCSymbol *Symbol; ///< The symbol this entry refers to.
- MCSection *Section; ///< The section recorded alongside the symbol.
- };
- // One entry of MCAssembler's data region list: a region kind plus two bounding symbols. FIXME: Like IndirectSymbolData, this does not belong here; it exists purely so the Streamer and the ObjectWriter can talk
- // to one another.
- struct DataRegionData {
- // This enum should be kept in sync w/ the mach-o definition in
- // llvm/Object/MachOFormat.h. Enumerators are numbered consecutively starting from Data = 1.
- enum KindTy { Data = 1, JumpTable8, JumpTable16, JumpTable32 } Kind;
- MCSymbol *Start; ///< Presumably the symbol marking where the region begins -- confirm against the writer.
- MCSymbol *End; ///< Presumably the symbol marking where the region ends -- confirm against the writer.
- };
- class MCAssembler { // Owns the MCAsmBackend, MCCodeEmitter and MCObjectWriter and holds the section, symbol and object-format bookkeeping declared below. Non-copyable.
- friend class MCAsmLayout;
- public:
- using SectionListType = std::vector<MCSection *>;
- using SymbolDataListType = std::vector<const MCSymbol *>;
- using const_iterator = pointee_iterator<SectionListType::const_iterator>;
- using iterator = pointee_iterator<SectionListType::iterator>;
- using const_symbol_iterator =
- pointee_iterator<SymbolDataListType::const_iterator>;
- using symbol_iterator = pointee_iterator<SymbolDataListType::iterator>;
- using symbol_range = iterator_range<symbol_iterator>;
- using const_symbol_range = iterator_range<const_symbol_iterator>;
- using const_indirect_symbol_iterator =
- std::vector<IndirectSymbolData>::const_iterator;
- using indirect_symbol_iterator = std::vector<IndirectSymbolData>::iterator;
- using const_data_region_iterator =
- std::vector<DataRegionData>::const_iterator;
- using data_region_iterator = std::vector<DataRegionData>::iterator;
- /// MachO specific deployment target version info.
- // A Major version of 0 indicates that no version information was supplied
- // and so the corresponding load command should not be emitted.
- using VersionInfoType = struct {
- bool EmitBuildVersion;
- union {
- MCVersionMinType Type; ///< Used when EmitBuildVersion==false.
- MachO::PlatformType Platform; ///< Used when EmitBuildVersion==true.
- } TypeOrPlatform;
- unsigned Major;
- unsigned Minor;
- unsigned Update;
- /// An optional version of the SDK that was used to build the source.
- VersionTuple SDKVersion;
- };
- private:
- MCContext &Context;
- std::unique_ptr<MCAsmBackend> Backend;
- std::unique_ptr<MCCodeEmitter> Emitter;
- std::unique_ptr<MCObjectWriter> Writer;
- SectionListType Sections;
- SymbolDataListType Symbols;
- std::vector<IndirectSymbolData> IndirectSymbols;
- std::vector<DataRegionData> DataRegions;
- /// The list of linker options to propagate into the object file.
- std::vector<std::vector<std::string>> LinkerOptions;
- /// List of declared file names, each paired with the size of the symbol list at the time addFileName() recorded it.
- std::vector<std::pair<std::string, size_t>> FileNames;
- MCDwarfLineTableParams LTParams;
- /// The set of function symbols for which a .thumb_func directive has
- /// been seen.
- //
- // FIXME: We really would like this in target specific code rather than
- // here. Maybe when the relocation stuff moves to target specific,
- // this can go with it? The streamer would need some target specific
- // refactoring too.
- mutable SmallPtrSet<const MCSymbol *, 32> ThumbFuncs;
- /// The bundle alignment size currently set in the assembler.
- ///
- /// By default it's 0, which means bundling is disabled.
- unsigned BundleAlignSize;
- bool RelaxAll : 1; ///< Accessed through getRelaxAll()/setRelaxAll().
- bool SubsectionsViaSymbols : 1; ///< Accessed through getSubsectionsViaSymbols()/setSubsectionsViaSymbols().
- bool IncrementalLinkerCompatible : 1; ///< Accessed through isIncrementalLinkerCompatible()/setIncrementalLinkerCompatible().
- /// ELF specific e_header flags
- // It would be good if there were an MCELFAssembler class to hold this.
- // ELF header flags are used both by the integrated and standalone assemblers.
- // Access to the flags is necessary in cases where assembler directives affect
- // which flags to be set.
- unsigned ELFHeaderEFlags;
- /// Used to communicate Linker Optimization Hint information between
- /// the Streamer and the .o writer
- MCLOHContainer LOHContainer;
- VersionInfoType VersionInfo; ///< Filled in by setVersionMin() or setBuildVersion().
- VersionInfoType DarwinTargetVariantVersionInfo; ///< Filled in by setDarwinTargetVariantBuildVersion().
- /// Evaluate a fixup to a relocatable expression and the value which should be
- /// placed into the fixup.
- ///
- /// \param Layout The layout to use for evaluation.
- /// \param Fixup The fixup to evaluate.
- /// \param DF The fragment the fixup is inside.
- /// \param Target [out] On return, the relocatable expression the fixup
- /// evaluates to.
- /// \param Value [out] On return, the value of the fixup as currently laid
- /// out.
- /// \param WasForced [out] On return, the value in the fixup is set to the
- /// correct value if WasForced is true, even if evaluateFixup returns false.
- /// \return Whether the fixup value was fully resolved. This is true if the
- /// \p Value result is fixed, otherwise the value may change due to
- /// relocation.
- bool evaluateFixup(const MCAsmLayout &Layout, const MCFixup &Fixup,
- const MCFragment *DF, MCValue &Target,
- uint64_t &Value, bool &WasForced) const;
- /// Check whether a fixup can be satisfied, or whether it needs to be relaxed
- /// (increased in size, in order to hold its value correctly).
- bool fixupNeedsRelaxation(const MCFixup &Fixup, const MCRelaxableFragment *DF,
- const MCAsmLayout &Layout) const;
- /// Check whether the given fragment needs relaxation.
- bool fragmentNeedsRelaxation(const MCRelaxableFragment *IF,
- const MCAsmLayout &Layout) const;
- /// Perform one layout iteration and return true if any offsets
- /// were adjusted.
- bool layoutOnce(MCAsmLayout &Layout);
- /// Perform one layout iteration of the given section and return true
- /// if any offsets were adjusted.
- bool layoutSectionOnce(MCAsmLayout &Layout, MCSection &Sec);
- /// Perform relaxation on a single fragment - returns true if the fragment
- /// changes as a result of relaxation.
- bool relaxFragment(MCAsmLayout &Layout, MCFragment &F);
- bool relaxInstruction(MCAsmLayout &Layout, MCRelaxableFragment &IF); // This and the relax* helpers below each take one concrete fragment type; presumably the bool result mirrors relaxFragment() -- confirm in the definitions.
- bool relaxLEB(MCAsmLayout &Layout, MCLEBFragment &IF);
- bool relaxBoundaryAlign(MCAsmLayout &Layout, MCBoundaryAlignFragment &BF);
- bool relaxDwarfLineAddr(MCAsmLayout &Layout, MCDwarfLineAddrFragment &DF);
- bool relaxDwarfCallFrameFragment(MCAsmLayout &Layout,
- MCDwarfCallFrameFragment &DF);
- bool relaxCVInlineLineTable(MCAsmLayout &Layout,
- MCCVInlineLineTableFragment &DF);
- bool relaxCVDefRange(MCAsmLayout &Layout, MCCVDefRangeFragment &DF);
- bool relaxPseudoProbeAddr(MCAsmLayout &Layout, MCPseudoProbeAddrFragment &DF);
- /// finishLayout - Finalize a layout, including fragment lowering.
- void finishLayout(MCAsmLayout &Layout);
- std::tuple<MCValue, uint64_t, bool> // NOTE(review): the meaning of the three tuple elements is not documented in this header; see the definition of handleFixup().
- handleFixup(const MCAsmLayout &Layout, MCFragment &F, const MCFixup &Fixup);
- public:
- struct Symver { // Record for one .symver directive (see the KeepOriginalSym comment below).
- SMLoc Loc;
- const MCSymbol *Sym;
- StringRef Name;
- // True if .symver *, *@@@* or .symver *, *, remove.
- bool KeepOriginalSym;
- };
- std::vector<Symver> Symvers; ///< Publicly accessible list of Symver records.
- /// Construct a new assembler instance.
- //
- // FIXME: How are we going to parameterize this? Two obvious options are stay
- // concrete and require clients to pass in a target like object. The other
- // option is to make this abstract, and have targets provide concrete
- // implementations as we do with AsmParser.
- MCAssembler(MCContext &Context, std::unique_ptr<MCAsmBackend> Backend,
- std::unique_ptr<MCCodeEmitter> Emitter,
- std::unique_ptr<MCObjectWriter> Writer);
- MCAssembler(const MCAssembler &) = delete;
- MCAssembler &operator=(const MCAssembler &) = delete;
- ~MCAssembler();
- /// Compute the effective size of fragment \p F as laid out according to
- /// \p Layout.
- uint64_t computeFragmentSize(const MCAsmLayout &Layout,
- const MCFragment &F) const;
- /// Find the symbol which defines the atom containing the given symbol, or
- /// null if there is no such symbol.
- const MCSymbol *getAtom(const MCSymbol &S) const;
- /// Check whether a particular symbol is visible to the linker and is required
- /// in the symbol table, or whether it can be discarded by the assembler. This
- /// also affects whether the assembler treats the label as potentially
- /// defining a separate atom.
- bool isSymbolLinkerVisible(const MCSymbol &SD) const;
- /// Emit the section contents to \p OS.
- void writeSectionData(raw_ostream &OS, const MCSection *Section,
- const MCAsmLayout &Layout) const;
- /// Check whether a given symbol has been flagged with .thumb_func.
- bool isThumbFunc(const MCSymbol *Func) const;
- /// Flag a function symbol as the target of a .thumb_func directive.
- void setIsThumbFunc(const MCSymbol *Func) { ThumbFuncs.insert(Func); }
- /// ELF e_header flags
- unsigned getELFHeaderEFlags() const { return ELFHeaderEFlags; }
- void setELFHeaderEFlags(unsigned Flags) { ELFHeaderEFlags = Flags; }
- /// MachO deployment target version information.
- const VersionInfoType &getVersionInfo() const { return VersionInfo; }
- void setVersionMin(MCVersionMinType Type, unsigned Major, unsigned Minor,
- unsigned Update,
- VersionTuple SDKVersion = VersionTuple()) {
- VersionInfo.EmitBuildVersion = false; // Version-min form: the Type member of TypeOrPlatform is the active one.
- VersionInfo.TypeOrPlatform.Type = Type;
- VersionInfo.Major = Major;
- VersionInfo.Minor = Minor;
- VersionInfo.Update = Update;
- VersionInfo.SDKVersion = SDKVersion;
- }
- void setBuildVersion(MachO::PlatformType Platform, unsigned Major,
- unsigned Minor, unsigned Update,
- VersionTuple SDKVersion = VersionTuple()) {
- VersionInfo.EmitBuildVersion = true; // Build-version form: the Platform member of TypeOrPlatform is the active one.
- VersionInfo.TypeOrPlatform.Platform = Platform;
- VersionInfo.Major = Major;
- VersionInfo.Minor = Minor;
- VersionInfo.Update = Update;
- VersionInfo.SDKVersion = SDKVersion;
- }
- const VersionInfoType &getDarwinTargetVariantVersionInfo() const {
- return DarwinTargetVariantVersionInfo;
- }
- void setDarwinTargetVariantBuildVersion(MachO::PlatformType Platform,
- unsigned Major, unsigned Minor,
- unsigned Update,
- VersionTuple SDKVersion) {
- DarwinTargetVariantVersionInfo.EmitBuildVersion = true; // The target-variant info is always stored in build-version (Platform) form.
- DarwinTargetVariantVersionInfo.TypeOrPlatform.Platform = Platform;
- DarwinTargetVariantVersionInfo.Major = Major;
- DarwinTargetVariantVersionInfo.Minor = Minor;
- DarwinTargetVariantVersionInfo.Update = Update;
- DarwinTargetVariantVersionInfo.SDKVersion = SDKVersion;
- }
- /// Reuse an assembler instance
- ///
- void reset();
- MCContext &getContext() const { return Context; }
- MCAsmBackend *getBackendPtr() const { return Backend.get(); }
- MCCodeEmitter *getEmitterPtr() const { return Emitter.get(); }
- MCObjectWriter *getWriterPtr() const { return Writer.get(); }
- MCAsmBackend &getBackend() const { return *Backend; }
- MCCodeEmitter &getEmitter() const { return *Emitter; }
- MCObjectWriter &getWriter() const { return *Writer; }
- MCDwarfLineTableParams getDWARFLinetableParams() const { return LTParams; }
- void setDWARFLinetableParams(MCDwarfLineTableParams P) { LTParams = P; }
- /// Finish - Do final processing and write the object to the output stream.
- /// Takes no arguments; presumably output goes through the MCObjectWriter
- /// passed to the constructor (see getWriter()) -- TODO confirm in the definition.
- void Finish();
- // Lay out all sections and prepare them for emission.
- void layout(MCAsmLayout &Layout);
- // FIXME: This does not belong here.
- bool getSubsectionsViaSymbols() const { return SubsectionsViaSymbols; }
- void setSubsectionsViaSymbols(bool Value) { SubsectionsViaSymbols = Value; }
- bool isIncrementalLinkerCompatible() const {
- return IncrementalLinkerCompatible;
- }
- void setIncrementalLinkerCompatible(bool Value) {
- IncrementalLinkerCompatible = Value;
- }
- bool getRelaxAll() const { return RelaxAll; }
- void setRelaxAll(bool Value) { RelaxAll = Value; }
- bool isBundlingEnabled() const { return BundleAlignSize != 0; }
- unsigned getBundleAlignSize() const { return BundleAlignSize; }
- void setBundleAlignSize(unsigned Size) {
- assert((Size == 0 || !(Size & (Size - 1))) &&
- "Expect a power-of-two bundle align size");
- BundleAlignSize = Size;
- }
- /// \name Section List Access
- /// @{
- iterator begin() { return Sections.begin(); }
- const_iterator begin() const { return Sections.begin(); }
- iterator end() { return Sections.end(); }
- const_iterator end() const { return Sections.end(); }
- size_t size() const { return Sections.size(); }
- /// @}
- /// \name Symbol List Access
- /// @{
- symbol_iterator symbol_begin() { return Symbols.begin(); }
- const_symbol_iterator symbol_begin() const { return Symbols.begin(); }
- symbol_iterator symbol_end() { return Symbols.end(); }
- const_symbol_iterator symbol_end() const { return Symbols.end(); }
- symbol_range symbols() { return make_range(symbol_begin(), symbol_end()); }
- const_symbol_range symbols() const {
- return make_range(symbol_begin(), symbol_end());
- }
- size_t symbol_size() const { return Symbols.size(); }
- /// @}
- /// \name Indirect Symbol List Access
- /// @{
- // FIXME: This is a total hack, this should not be here. Once things are
- // factored so that the streamer has direct access to the .o writer, it can
- // disappear.
- std::vector<IndirectSymbolData> &getIndirectSymbols() {
- return IndirectSymbols;
- }
- indirect_symbol_iterator indirect_symbol_begin() {
- return IndirectSymbols.begin();
- }
- const_indirect_symbol_iterator indirect_symbol_begin() const {
- return IndirectSymbols.begin();
- }
- indirect_symbol_iterator indirect_symbol_end() {
- return IndirectSymbols.end();
- }
- const_indirect_symbol_iterator indirect_symbol_end() const {
- return IndirectSymbols.end();
- }
- size_t indirect_symbol_size() const { return IndirectSymbols.size(); }
- /// @}
- /// \name Linker Option List Access
- /// @{
- std::vector<std::vector<std::string>> &getLinkerOptions() {
- return LinkerOptions;
- }
- /// @}
- /// \name Data Region List Access
- /// @{
- // FIXME: This is a total hack, this should not be here. Once things are
- // factored so that the streamer has direct access to the .o writer, it can
- // disappear.
- std::vector<DataRegionData> &getDataRegions() { return DataRegions; }
- data_region_iterator data_region_begin() { return DataRegions.begin(); }
- const_data_region_iterator data_region_begin() const {
- return DataRegions.begin();
- }
- data_region_iterator data_region_end() { return DataRegions.end(); }
- const_data_region_iterator data_region_end() const {
- return DataRegions.end();
- }
- size_t data_region_size() const { return DataRegions.size(); }
- /// @}
- /// \name Linker Optimization Hint and Call Graph Profile Access
- /// @{
- // FIXME: This is a total hack, this should not be here. Once things are
- // factored so that the streamer has direct access to the .o writer, it can
- // disappear.
- MCLOHContainer &getLOHContainer() { return LOHContainer; }
- const MCLOHContainer &getLOHContainer() const {
- return const_cast<MCAssembler *>(this)->getLOHContainer(); // Forwards to the non-const overload, which only returns a reference to LOHContainer.
- }
- struct CGProfileEntry { // One profile record: two symbol reference expressions (From, To) and a Count.
- const MCSymbolRefExpr *From;
- const MCSymbolRefExpr *To;
- uint64_t Count;
- };
- std::vector<CGProfileEntry> CGProfile; ///< Publicly accessible list of CGProfileEntry records.
- /// @}
- /// \name Backend Data Access
- /// @{
- bool registerSection(MCSection &Section);
- void registerSymbol(const MCSymbol &Symbol, bool *Created = nullptr); // \p Created is an optional out-parameter and may be left null.
- MutableArrayRef<std::pair<std::string, size_t>> getFileNames() { // Mutable view over the FileNames vector.
- return FileNames;
- }
- void addFileName(StringRef FileName) {
- FileNames.emplace_back(std::string(FileName), Symbols.size()); // Stores a copy of the name together with the current symbol count.
- }
- /// Write the necessary bundle padding to \p OS.
- /// Expects a fragment \p F containing instructions and its size \p FSize.
- void writeFragmentPadding(raw_ostream &OS, const MCEncodedFragment &F,
- uint64_t FSize) const;
- /// @}
- void dump() const;
- };
- /// Compute the amount of padding required before the fragment \p F to
- /// obey bundling restrictions, where \p FOffset is the fragment's offset in
- /// its section and \p FSize is the fragment's size. Declared here only; presumably \p Assembler supplies the bundle alignment (see MCAssembler::getBundleAlignSize()) -- confirm in the definition. \returns the computed padding amount.
- uint64_t computeBundlePadding(const MCAssembler &Assembler,
- const MCEncodedFragment *F, uint64_t FOffset,
- uint64_t FSize);
- } // end namespace llvm
- #endif // LLVM_MC_MCASSEMBLER_H
- #ifdef __GNUC__
- #pragma GCC diagnostic pop
- #endif
|