123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585 |
- //===-- llvm-mca.cpp - Machine Code Analyzer -------------------*- C++ -* -===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- //
- // This utility is a simple driver that allows static performance analysis on
- // machine code similarly to how IACA (Intel Architecture Code Analyzer) works.
- //
- // llvm-mca [options] <file-name>
- // -march <type>
- // -mcpu <cpu>
- // -o <file>
- //
- // The target defaults to the host target.
- // The cpu defaults to the 'native' host cpu.
- // The output defaults to standard output.
- //
- //===----------------------------------------------------------------------===//
- #include "CodeRegion.h"
- #include "CodeRegionGenerator.h"
- #include "PipelinePrinter.h"
- #include "Views/BottleneckAnalysis.h"
- #include "Views/DispatchStatistics.h"
- #include "Views/InstructionInfoView.h"
- #include "Views/RegisterFileStatistics.h"
- #include "Views/ResourcePressureView.h"
- #include "Views/RetireControlUnitStatistics.h"
- #include "Views/SchedulerStatistics.h"
- #include "Views/SummaryView.h"
- #include "Views/TimelineView.h"
- #include "llvm/MC/MCAsmBackend.h"
- #include "llvm/MC/MCAsmInfo.h"
- #include "llvm/MC/MCCodeEmitter.h"
- #include "llvm/MC/MCContext.h"
- #include "llvm/MC/MCObjectFileInfo.h"
- #include "llvm/MC/MCRegisterInfo.h"
- #include "llvm/MC/MCSubtargetInfo.h"
- #include "llvm/MC/MCTargetOptionsCommandFlags.h"
- #include "llvm/MCA/CodeEmitter.h"
- #include "llvm/MCA/Context.h"
- #include "llvm/MCA/InstrBuilder.h"
- #include "llvm/MCA/Pipeline.h"
- #include "llvm/MCA/Stages/EntryStage.h"
- #include "llvm/MCA/Stages/InstructionTables.h"
- #include "llvm/MCA/Support.h"
- #include "llvm/Support/CommandLine.h"
- #include "llvm/Support/ErrorHandling.h"
- #include "llvm/Support/ErrorOr.h"
- #include "llvm/Support/FileSystem.h"
- #include "llvm/Support/Host.h"
- #include "llvm/Support/InitLLVM.h"
- #include "llvm/Support/MemoryBuffer.h"
- #include "llvm/Support/SourceMgr.h"
- #include "llvm/Support/TargetRegistry.h"
- #include "llvm/Support/TargetSelect.h"
- #include "llvm/Support/ToolOutputFile.h"
- #include "llvm/Support/WithColor.h"
- using namespace llvm;
- static mc::RegisterMCTargetOptionsFlags MOF;
- static cl::OptionCategory ToolOptions("Tool Options");
- static cl::OptionCategory ViewOptions("View Options");
- static cl::opt<std::string> InputFilename(cl::Positional,
- cl::desc("<input file>"),
- cl::cat(ToolOptions), cl::init("-"));
- static cl::opt<std::string> OutputFilename("o", cl::desc("Output filename"),
- cl::init("-"), cl::cat(ToolOptions),
- cl::value_desc("filename"));
- static cl::opt<std::string>
- ArchName("march",
- cl::desc("Target architecture. "
- "See -version for available targets"),
- cl::cat(ToolOptions));
- static cl::opt<std::string>
- TripleName("mtriple",
- cl::desc("Target triple. See -version for available targets"),
- cl::cat(ToolOptions));
- static cl::opt<std::string>
- MCPU("mcpu",
- cl::desc("Target a specific cpu type (-mcpu=help for details)"),
- cl::value_desc("cpu-name"), cl::cat(ToolOptions), cl::init("native"));
- static cl::opt<std::string>
- MATTR("mattr",
- cl::desc("Additional target features."),
- cl::cat(ToolOptions));
- static cl::opt<bool>
- PrintJson("json",
- cl::desc("Print the output in json format"),
- cl::cat(ToolOptions), cl::init(false));
- static cl::opt<int>
- OutputAsmVariant("output-asm-variant",
- cl::desc("Syntax variant to use for output printing"),
- cl::cat(ToolOptions), cl::init(-1));
- static cl::opt<bool>
- PrintImmHex("print-imm-hex", cl::cat(ToolOptions), cl::init(false),
- cl::desc("Prefer hex format when printing immediate values"));
- static cl::opt<unsigned> Iterations("iterations",
- cl::desc("Number of iterations to run"),
- cl::cat(ToolOptions), cl::init(0));
- static cl::opt<unsigned>
- DispatchWidth("dispatch", cl::desc("Override the processor dispatch width"),
- cl::cat(ToolOptions), cl::init(0));
- static cl::opt<unsigned>
- RegisterFileSize("register-file-size",
- cl::desc("Maximum number of physical registers which can "
- "be used for register mappings"),
- cl::cat(ToolOptions), cl::init(0));
- static cl::opt<unsigned>
- MicroOpQueue("micro-op-queue-size", cl::Hidden,
- cl::desc("Number of entries in the micro-op queue"),
- cl::cat(ToolOptions), cl::init(0));
- static cl::opt<unsigned>
- DecoderThroughput("decoder-throughput", cl::Hidden,
- cl::desc("Maximum throughput from the decoders "
- "(instructions per cycle)"),
- cl::cat(ToolOptions), cl::init(0));
- static cl::opt<bool>
- PrintRegisterFileStats("register-file-stats",
- cl::desc("Print register file statistics"),
- cl::cat(ViewOptions), cl::init(false));
- static cl::opt<bool> PrintDispatchStats("dispatch-stats",
- cl::desc("Print dispatch statistics"),
- cl::cat(ViewOptions), cl::init(false));
- static cl::opt<bool>
- PrintSummaryView("summary-view", cl::Hidden,
- cl::desc("Print summary view (enabled by default)"),
- cl::cat(ViewOptions), cl::init(true));
- static cl::opt<bool> PrintSchedulerStats("scheduler-stats",
- cl::desc("Print scheduler statistics"),
- cl::cat(ViewOptions), cl::init(false));
- static cl::opt<bool>
- PrintRetireStats("retire-stats",
- cl::desc("Print retire control unit statistics"),
- cl::cat(ViewOptions), cl::init(false));
- static cl::opt<bool> PrintResourcePressureView(
- "resource-pressure",
- cl::desc("Print the resource pressure view (enabled by default)"),
- cl::cat(ViewOptions), cl::init(true));
- static cl::opt<bool> PrintTimelineView("timeline",
- cl::desc("Print the timeline view"),
- cl::cat(ViewOptions), cl::init(false));
- static cl::opt<unsigned> TimelineMaxIterations(
- "timeline-max-iterations",
- cl::desc("Maximum number of iterations to print in timeline view"),
- cl::cat(ViewOptions), cl::init(0));
- static cl::opt<unsigned> TimelineMaxCycles(
- "timeline-max-cycles",
- cl::desc(
- "Maximum number of cycles in the timeline view. Defaults to 80 cycles"),
- cl::cat(ViewOptions), cl::init(80));
- static cl::opt<bool>
- AssumeNoAlias("noalias",
- cl::desc("If set, assume that loads and stores do not alias"),
- cl::cat(ToolOptions), cl::init(true));
- static cl::opt<unsigned> LoadQueueSize("lqueue",
- cl::desc("Size of the load queue"),
- cl::cat(ToolOptions), cl::init(0));
- static cl::opt<unsigned> StoreQueueSize("squeue",
- cl::desc("Size of the store queue"),
- cl::cat(ToolOptions), cl::init(0));
- static cl::opt<bool>
- PrintInstructionTables("instruction-tables",
- cl::desc("Print instruction tables"),
- cl::cat(ToolOptions), cl::init(false));
- static cl::opt<bool> PrintInstructionInfoView(
- "instruction-info",
- cl::desc("Print the instruction info view (enabled by default)"),
- cl::cat(ViewOptions), cl::init(true));
- static cl::opt<bool> EnableAllStats("all-stats",
- cl::desc("Print all hardware statistics"),
- cl::cat(ViewOptions), cl::init(false));
- static cl::opt<bool>
- EnableAllViews("all-views",
- cl::desc("Print all views including hardware statistics"),
- cl::cat(ViewOptions), cl::init(false));
- static cl::opt<bool> EnableBottleneckAnalysis(
- "bottleneck-analysis",
- cl::desc("Enable bottleneck analysis (disabled by default)"),
- cl::cat(ViewOptions), cl::init(false));
- static cl::opt<bool> ShowEncoding(
- "show-encoding",
- cl::desc("Print encoding information in the instruction info view"),
- cl::cat(ViewOptions), cl::init(false));
- namespace {
- const Target *getTarget(const char *ProgName) {
- if (TripleName.empty())
- TripleName = Triple::normalize(sys::getDefaultTargetTriple());
- Triple TheTriple(TripleName);
- // Get the target specific parser.
- std::string Error;
- const Target *TheTarget =
- TargetRegistry::lookupTarget(ArchName, TheTriple, Error);
- if (!TheTarget) {
- errs() << ProgName << ": " << Error;
- return nullptr;
- }
- // Return the found target.
- return TheTarget;
- }
- ErrorOr<std::unique_ptr<ToolOutputFile>> getOutputStream() {
- if (OutputFilename == "")
- OutputFilename = "-";
- std::error_code EC;
- auto Out =
- std::make_unique<ToolOutputFile>(OutputFilename, EC, sys::fs::OF_Text);
- if (!EC)
- return std::move(Out);
- return EC;
- }
- } // end of anonymous namespace
- static void processOptionImpl(cl::opt<bool> &O, const cl::opt<bool> &Default) {
- if (!O.getNumOccurrences() || O.getPosition() < Default.getPosition())
- O = Default.getValue();
- }
- static void processViewOptions() {
- if (!EnableAllViews.getNumOccurrences() &&
- !EnableAllStats.getNumOccurrences())
- return;
- if (EnableAllViews.getNumOccurrences()) {
- processOptionImpl(PrintSummaryView, EnableAllViews);
- processOptionImpl(EnableBottleneckAnalysis, EnableAllViews);
- processOptionImpl(PrintResourcePressureView, EnableAllViews);
- processOptionImpl(PrintTimelineView, EnableAllViews);
- processOptionImpl(PrintInstructionInfoView, EnableAllViews);
- }
- const cl::opt<bool> &Default =
- EnableAllViews.getPosition() < EnableAllStats.getPosition()
- ? EnableAllStats
- : EnableAllViews;
- processOptionImpl(PrintRegisterFileStats, Default);
- processOptionImpl(PrintDispatchStats, Default);
- processOptionImpl(PrintSchedulerStats, Default);
- processOptionImpl(PrintRetireStats, Default);
- }
- // Returns true on success.
- static bool runPipeline(mca::Pipeline &P) {
- // Handle pipeline errors here.
- Expected<unsigned> Cycles = P.run();
- if (!Cycles) {
- WithColor::error() << toString(Cycles.takeError());
- return false;
- }
- return true;
- }
- int main(int argc, char **argv) {
- InitLLVM X(argc, argv);
- // Initialize targets and assembly parsers.
- InitializeAllTargetInfos();
- InitializeAllTargetMCs();
- InitializeAllAsmParsers();
- // Enable printing of available targets when flag --version is specified.
- cl::AddExtraVersionPrinter(TargetRegistry::printRegisteredTargetsForVersion);
- cl::HideUnrelatedOptions({&ToolOptions, &ViewOptions});
- // Parse flags and initialize target options.
- cl::ParseCommandLineOptions(argc, argv,
- "llvm machine code performance analyzer.\n");
- // Get the target from the triple. If a triple is not specified, then select
- // the default triple for the host. If the triple doesn't correspond to any
- // registered target, then exit with an error message.
- const char *ProgName = argv[0];
- const Target *TheTarget = getTarget(ProgName);
- if (!TheTarget)
- return 1;
- // GetTarget() may replaced TripleName with a default triple.
- // For safety, reconstruct the Triple object.
- Triple TheTriple(TripleName);
- ErrorOr<std::unique_ptr<MemoryBuffer>> BufferPtr =
- MemoryBuffer::getFileOrSTDIN(InputFilename);
- if (std::error_code EC = BufferPtr.getError()) {
- WithColor::error() << InputFilename << ": " << EC.message() << '\n';
- return 1;
- }
- // Apply overrides to llvm-mca specific options.
- processViewOptions();
- if (MCPU == "native")
- MCPU = std::string(llvm::sys::getHostCPUName());
- std::unique_ptr<MCSubtargetInfo> STI(
- TheTarget->createMCSubtargetInfo(TripleName, MCPU, MATTR));
- assert(STI && "Unable to create subtarget info!");
- if (!STI->isCPUStringValid(MCPU))
- return 1;
- if (!PrintInstructionTables && !STI->getSchedModel().isOutOfOrder()) {
- WithColor::error() << "please specify an out-of-order cpu. '" << MCPU
- << "' is an in-order cpu.\n";
- return 1;
- }
- if (!STI->getSchedModel().hasInstrSchedModel()) {
- WithColor::error()
- << "unable to find instruction-level scheduling information for"
- << " target triple '" << TheTriple.normalize() << "' and cpu '" << MCPU
- << "'.\n";
- if (STI->getSchedModel().InstrItineraries)
- WithColor::note()
- << "cpu '" << MCPU << "' provides itineraries. However, "
- << "instruction itineraries are currently unsupported.\n";
- return 1;
- }
- std::unique_ptr<MCRegisterInfo> MRI(TheTarget->createMCRegInfo(TripleName));
- assert(MRI && "Unable to create target register info!");
- MCTargetOptions MCOptions = mc::InitMCTargetOptionsFromFlags();
- std::unique_ptr<MCAsmInfo> MAI(
- TheTarget->createMCAsmInfo(*MRI, TripleName, MCOptions));
- assert(MAI && "Unable to create target asm info!");
- MCObjectFileInfo MOFI;
- SourceMgr SrcMgr;
- // Tell SrcMgr about this buffer, which is what the parser will pick up.
- SrcMgr.AddNewSourceBuffer(std::move(*BufferPtr), SMLoc());
- MCContext Ctx(MAI.get(), MRI.get(), &MOFI, &SrcMgr);
- MOFI.InitMCObjectFileInfo(TheTriple, /* PIC= */ false, Ctx);
- std::unique_ptr<buffer_ostream> BOS;
- std::unique_ptr<MCInstrInfo> MCII(TheTarget->createMCInstrInfo());
- assert(MCII && "Unable to create instruction info!");
- std::unique_ptr<MCInstrAnalysis> MCIA(
- TheTarget->createMCInstrAnalysis(MCII.get()));
- // Parse the input and create CodeRegions that llvm-mca can analyze.
- mca::AsmCodeRegionGenerator CRG(*TheTarget, SrcMgr, Ctx, *MAI, *STI, *MCII);
- Expected<const mca::CodeRegions &> RegionsOrErr = CRG.parseCodeRegions();
- if (!RegionsOrErr) {
- if (auto Err =
- handleErrors(RegionsOrErr.takeError(), [](const StringError &E) {
- WithColor::error() << E.getMessage() << '\n';
- })) {
- // Default case.
- WithColor::error() << toString(std::move(Err)) << '\n';
- }
- return 1;
- }
- const mca::CodeRegions &Regions = *RegionsOrErr;
- // Early exit if errors were found by the code region parsing logic.
- if (!Regions.isValid())
- return 1;
- if (Regions.empty()) {
- WithColor::error() << "no assembly instructions found.\n";
- return 1;
- }
- // Now initialize the output file.
- auto OF = getOutputStream();
- if (std::error_code EC = OF.getError()) {
- WithColor::error() << EC.message() << '\n';
- return 1;
- }
- unsigned AssemblerDialect = CRG.getAssemblerDialect();
- if (OutputAsmVariant >= 0)
- AssemblerDialect = static_cast<unsigned>(OutputAsmVariant);
- std::unique_ptr<MCInstPrinter> IP(TheTarget->createMCInstPrinter(
- Triple(TripleName), AssemblerDialect, *MAI, *MCII, *MRI));
- if (!IP) {
- WithColor::error()
- << "unable to create instruction printer for target triple '"
- << TheTriple.normalize() << "' with assembly variant "
- << AssemblerDialect << ".\n";
- return 1;
- }
- // Set the display preference for hex vs. decimal immediates.
- IP->setPrintImmHex(PrintImmHex);
- std::unique_ptr<ToolOutputFile> TOF = std::move(*OF);
- const MCSchedModel &SM = STI->getSchedModel();
- // Create an instruction builder.
- mca::InstrBuilder IB(*STI, *MCII, *MRI, MCIA.get());
- // Create a context to control ownership of the pipeline hardware.
- mca::Context MCA(*MRI, *STI);
- mca::PipelineOptions PO(MicroOpQueue, DecoderThroughput, DispatchWidth,
- RegisterFileSize, LoadQueueSize, StoreQueueSize,
- AssumeNoAlias, EnableBottleneckAnalysis);
- // Number each region in the sequence.
- unsigned RegionIdx = 0;
- std::unique_ptr<MCCodeEmitter> MCE(
- TheTarget->createMCCodeEmitter(*MCII, *MRI, Ctx));
- assert(MCE && "Unable to create code emitter!");
- std::unique_ptr<MCAsmBackend> MAB(TheTarget->createMCAsmBackend(
- *STI, *MRI, mc::InitMCTargetOptionsFromFlags()));
- assert(MAB && "Unable to create asm backend!");
- for (const std::unique_ptr<mca::CodeRegion> &Region : Regions) {
- // Skip empty code regions.
- if (Region->empty())
- continue;
- // Don't print the header of this region if it is the default region, and
- // it doesn't have an end location.
- if (Region->startLoc().isValid() || Region->endLoc().isValid()) {
- TOF->os() << "\n[" << RegionIdx++ << "] Code Region";
- StringRef Desc = Region->getDescription();
- if (!Desc.empty())
- TOF->os() << " - " << Desc;
- TOF->os() << "\n\n";
- }
- // Lower the MCInst sequence into an mca::Instruction sequence.
- ArrayRef<MCInst> Insts = Region->getInstructions();
- mca::CodeEmitter CE(*STI, *MAB, *MCE, Insts);
- std::vector<std::unique_ptr<mca::Instruction>> LoweredSequence;
- for (const MCInst &MCI : Insts) {
- Expected<std::unique_ptr<mca::Instruction>> Inst =
- IB.createInstruction(MCI);
- if (!Inst) {
- if (auto NewE = handleErrors(
- Inst.takeError(),
- [&IP, &STI](const mca::InstructionError<MCInst> &IE) {
- std::string InstructionStr;
- raw_string_ostream SS(InstructionStr);
- WithColor::error() << IE.Message << '\n';
- IP->printInst(&IE.Inst, 0, "", *STI, SS);
- SS.flush();
- WithColor::note()
- << "instruction: " << InstructionStr << '\n';
- })) {
- // Default case.
- WithColor::error() << toString(std::move(NewE));
- }
- return 1;
- }
- LoweredSequence.emplace_back(std::move(Inst.get()));
- }
- mca::SourceMgr S(LoweredSequence, PrintInstructionTables ? 1 : Iterations);
- if (PrintInstructionTables) {
- // Create a pipeline, stages, and a printer.
- auto P = std::make_unique<mca::Pipeline>();
- P->appendStage(std::make_unique<mca::EntryStage>(S));
- P->appendStage(std::make_unique<mca::InstructionTables>(SM));
- mca::PipelinePrinter Printer(*P, mca::View::OK_READABLE);
- // Create the views for this pipeline, execute, and emit a report.
- if (PrintInstructionInfoView) {
- Printer.addView(std::make_unique<mca::InstructionInfoView>(
- *STI, *MCII, CE, ShowEncoding, Insts, *IP));
- }
- Printer.addView(
- std::make_unique<mca::ResourcePressureView>(*STI, *IP, Insts));
- if (!runPipeline(*P))
- return 1;
- Printer.printReport(TOF->os());
- continue;
- }
- // Create a basic pipeline simulating an out-of-order backend.
- auto P = MCA.createDefaultPipeline(PO, S);
- mca::PipelinePrinter Printer(*P, PrintJson ? mca::View::OK_JSON
- : mca::View::OK_READABLE);
- // When we output JSON, we add a view that contains the instructions
- // and CPU resource information.
- if (PrintJson)
- Printer.addView(
- std::make_unique<mca::InstructionView>(*STI, *IP, Insts, MCPU));
- if (PrintSummaryView)
- Printer.addView(
- std::make_unique<mca::SummaryView>(SM, Insts, DispatchWidth));
- if (EnableBottleneckAnalysis) {
- Printer.addView(std::make_unique<mca::BottleneckAnalysis>(
- *STI, *IP, Insts, S.getNumIterations()));
- }
- if (PrintInstructionInfoView)
- Printer.addView(std::make_unique<mca::InstructionInfoView>(
- *STI, *MCII, CE, ShowEncoding, Insts, *IP));
- if (PrintDispatchStats)
- Printer.addView(std::make_unique<mca::DispatchStatistics>());
- if (PrintSchedulerStats)
- Printer.addView(std::make_unique<mca::SchedulerStatistics>(*STI));
- if (PrintRetireStats)
- Printer.addView(std::make_unique<mca::RetireControlUnitStatistics>(SM));
- if (PrintRegisterFileStats)
- Printer.addView(std::make_unique<mca::RegisterFileStatistics>(*STI));
- if (PrintResourcePressureView)
- Printer.addView(
- std::make_unique<mca::ResourcePressureView>(*STI, *IP, Insts));
- if (PrintTimelineView) {
- unsigned TimelineIterations =
- TimelineMaxIterations ? TimelineMaxIterations : 10;
- Printer.addView(std::make_unique<mca::TimelineView>(
- *STI, *IP, Insts, std::min(TimelineIterations, S.getNumIterations()),
- TimelineMaxCycles));
- }
- if (!runPipeline(*P))
- return 1;
- Printer.printReport(TOF->os());
- // Clear the InstrBuilder internal state in preparation for another round.
- IB.clear();
- }
- TOF->keep();
- return 0;
- }
|