123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310 |
- //=-- SampleProf.cpp - Sample profiling format support --------------------===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- //
- // This file contains common definitions used in the reading and writing of
- // sample profile data.
- //
- //===----------------------------------------------------------------------===//
- #include "llvm/ProfileData/SampleProf.h"
- #include "llvm/Config/llvm-config.h"
- #include "llvm/IR/DebugInfoMetadata.h"
- #include "llvm/IR/PseudoProbe.h"
- #include "llvm/ProfileData/SampleProfReader.h"
- #include "llvm/Support/Compiler.h"
- #include "llvm/Support/Debug.h"
- #include "llvm/Support/Error.h"
- #include "llvm/Support/ErrorHandling.h"
- #include "llvm/Support/LEB128.h"
- #include "llvm/Support/ManagedStatic.h"
- #include "llvm/Support/raw_ostream.h"
- #include <string>
- #include <system_error>
- using namespace llvm;
- using namespace sampleprof;
- namespace llvm {
- namespace sampleprof {
- SampleProfileFormat FunctionSamples::Format;
- bool FunctionSamples::ProfileIsProbeBased = false;
- bool FunctionSamples::ProfileIsCS = false;
- bool FunctionSamples::UseMD5;
- } // namespace sampleprof
- } // namespace llvm
- namespace {
- // FIXME: This class is only here to support the transition to llvm::Error. It
- // will be removed once this transition is complete. Clients should prefer to
- // deal with the Error value directly, rather than converting to error_code.
- class SampleProfErrorCategoryType : public std::error_category {
- const char *name() const noexcept override { return "llvm.sampleprof"; }
- std::string message(int IE) const override {
- sampleprof_error E = static_cast<sampleprof_error>(IE);
- switch (E) {
- case sampleprof_error::success:
- return "Success";
- case sampleprof_error::bad_magic:
- return "Invalid sample profile data (bad magic)";
- case sampleprof_error::unsupported_version:
- return "Unsupported sample profile format version";
- case sampleprof_error::too_large:
- return "Too much profile data";
- case sampleprof_error::truncated:
- return "Truncated profile data";
- case sampleprof_error::malformed:
- return "Malformed sample profile data";
- case sampleprof_error::unrecognized_format:
- return "Unrecognized sample profile encoding format";
- case sampleprof_error::unsupported_writing_format:
- return "Profile encoding format unsupported for writing operations";
- case sampleprof_error::truncated_name_table:
- return "Truncated function name table";
- case sampleprof_error::not_implemented:
- return "Unimplemented feature";
- case sampleprof_error::counter_overflow:
- return "Counter overflow";
- case sampleprof_error::ostream_seek_unsupported:
- return "Ostream does not support seek";
- case sampleprof_error::compress_failed:
- return "Compress failure";
- case sampleprof_error::uncompress_failed:
- return "Uncompress failure";
- case sampleprof_error::zlib_unavailable:
- return "Zlib is unavailable";
- case sampleprof_error::hash_mismatch:
- return "Function hash mismatch";
- }
- llvm_unreachable("A value of sampleprof_error has no message.");
- }
- };
- } // end anonymous namespace
- static ManagedStatic<SampleProfErrorCategoryType> ErrorCategory;
- const std::error_category &llvm::sampleprof_category() {
- return *ErrorCategory;
- }
- void LineLocation::print(raw_ostream &OS) const {
- OS << LineOffset;
- if (Discriminator > 0)
- OS << "." << Discriminator;
- }
- raw_ostream &llvm::sampleprof::operator<<(raw_ostream &OS,
- const LineLocation &Loc) {
- Loc.print(OS);
- return OS;
- }
- #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
- LLVM_DUMP_METHOD void LineLocation::dump() const { print(dbgs()); }
- #endif
- /// Print the sample record to the stream \p OS indented by \p Indent.
- void SampleRecord::print(raw_ostream &OS, unsigned Indent) const {
- OS << NumSamples;
- if (hasCalls()) {
- OS << ", calls:";
- for (const auto &I : getSortedCallTargets())
- OS << " " << I.first << ":" << I.second;
- }
- OS << "\n";
- }
- #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
- LLVM_DUMP_METHOD void SampleRecord::dump() const { print(dbgs(), 0); }
- #endif
- raw_ostream &llvm::sampleprof::operator<<(raw_ostream &OS,
- const SampleRecord &Sample) {
- Sample.print(OS, 0);
- return OS;
- }
- /// Print the samples collected for a function on stream \p OS.
- void FunctionSamples::print(raw_ostream &OS, unsigned Indent) const {
- if (getFunctionHash())
- OS << "CFG checksum " << getFunctionHash() << "\n";
- OS << TotalSamples << ", " << TotalHeadSamples << ", " << BodySamples.size()
- << " sampled lines\n";
- OS.indent(Indent);
- if (!BodySamples.empty()) {
- OS << "Samples collected in the function's body {\n";
- SampleSorter<LineLocation, SampleRecord> SortedBodySamples(BodySamples);
- for (const auto &SI : SortedBodySamples.get()) {
- OS.indent(Indent + 2);
- OS << SI->first << ": " << SI->second;
- }
- OS.indent(Indent);
- OS << "}\n";
- } else {
- OS << "No samples collected in the function's body\n";
- }
- OS.indent(Indent);
- if (!CallsiteSamples.empty()) {
- OS << "Samples collected in inlined callsites {\n";
- SampleSorter<LineLocation, FunctionSamplesMap> SortedCallsiteSamples(
- CallsiteSamples);
- for (const auto &CS : SortedCallsiteSamples.get()) {
- for (const auto &FS : CS->second) {
- OS.indent(Indent + 2);
- OS << CS->first << ": inlined callee: " << FS.second.getName() << ": ";
- FS.second.print(OS, Indent + 4);
- }
- }
- OS.indent(Indent);
- OS << "}\n";
- } else {
- OS << "No inlined callsites in this function\n";
- }
- }
- raw_ostream &llvm::sampleprof::operator<<(raw_ostream &OS,
- const FunctionSamples &FS) {
- FS.print(OS);
- return OS;
- }
- unsigned FunctionSamples::getOffset(const DILocation *DIL) {
- return (DIL->getLine() - DIL->getScope()->getSubprogram()->getLine()) &
- 0xffff;
- }
- LineLocation FunctionSamples::getCallSiteIdentifier(const DILocation *DIL) {
- if (FunctionSamples::ProfileIsProbeBased)
- // In a pseudo-probe based profile, a callsite is simply represented by the
- // ID of the probe associated with the call instruction. The probe ID is
- // encoded in the Discriminator field of the call instruction's debug
- // metadata.
- return LineLocation(PseudoProbeDwarfDiscriminator::extractProbeIndex(
- DIL->getDiscriminator()),
- 0);
- else
- return LineLocation(FunctionSamples::getOffset(DIL),
- DIL->getBaseDiscriminator());
- }
- const FunctionSamples *FunctionSamples::findFunctionSamples(
- const DILocation *DIL, SampleProfileReaderItaniumRemapper *Remapper) const {
- assert(DIL);
- SmallVector<std::pair<LineLocation, StringRef>, 10> S;
- const DILocation *PrevDIL = DIL;
- for (DIL = DIL->getInlinedAt(); DIL; DIL = DIL->getInlinedAt()) {
- S.push_back(std::make_pair(
- LineLocation(getOffset(DIL), DIL->getBaseDiscriminator()),
- PrevDIL->getScope()->getSubprogram()->getLinkageName()));
- PrevDIL = DIL;
- }
- if (S.size() == 0)
- return this;
- const FunctionSamples *FS = this;
- for (int i = S.size() - 1; i >= 0 && FS != nullptr; i--) {
- FS = FS->findFunctionSamplesAt(S[i].first, S[i].second, Remapper);
- }
- return FS;
- }
- void FunctionSamples::findAllNames(DenseSet<StringRef> &NameSet) const {
- NameSet.insert(Name);
- for (const auto &BS : BodySamples)
- for (const auto &TS : BS.second.getCallTargets())
- NameSet.insert(TS.getKey());
- for (const auto &CS : CallsiteSamples) {
- for (const auto &NameFS : CS.second) {
- NameSet.insert(NameFS.first);
- NameFS.second.findAllNames(NameSet);
- }
- }
- }
- const FunctionSamples *FunctionSamples::findFunctionSamplesAt(
- const LineLocation &Loc, StringRef CalleeName,
- SampleProfileReaderItaniumRemapper *Remapper) const {
- std::string CalleeGUID;
- CalleeName = getRepInFormat(CalleeName, UseMD5, CalleeGUID);
- auto iter = CallsiteSamples.find(Loc);
- if (iter == CallsiteSamples.end())
- return nullptr;
- auto FS = iter->second.find(CalleeName);
- if (FS != iter->second.end())
- return &FS->second;
- if (Remapper) {
- if (auto NameInProfile = Remapper->lookUpNameInProfile(CalleeName)) {
- auto FS = iter->second.find(*NameInProfile);
- if (FS != iter->second.end())
- return &FS->second;
- }
- }
- // If we cannot find exact match of the callee name, return the FS with
- // the max total count. Only do this when CalleeName is not provided,
- // i.e., only for indirect calls.
- if (!CalleeName.empty())
- return nullptr;
- uint64_t MaxTotalSamples = 0;
- const FunctionSamples *R = nullptr;
- for (const auto &NameFS : iter->second)
- if (NameFS.second.getTotalSamples() >= MaxTotalSamples) {
- MaxTotalSamples = NameFS.second.getTotalSamples();
- R = &NameFS.second;
- }
- return R;
- }
- #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
- LLVM_DUMP_METHOD void FunctionSamples::dump() const { print(dbgs(), 0); }
- #endif
- std::error_code ProfileSymbolList::read(const uint8_t *Data,
- uint64_t ListSize) {
- const char *ListStart = reinterpret_cast<const char *>(Data);
- uint64_t Size = 0;
- while (Size < ListSize) {
- StringRef Str(ListStart + Size);
- add(Str);
- Size += Str.size() + 1;
- }
- if (Size != ListSize)
- return sampleprof_error::malformed;
- return sampleprof_error::success;
- }
- std::error_code ProfileSymbolList::write(raw_ostream &OS) {
- // Sort the symbols before output. If doing compression.
- // It will make the compression much more effective.
- std::vector<StringRef> SortedList(Syms.begin(), Syms.end());
- llvm::sort(SortedList);
- std::string OutputString;
- for (auto &Sym : SortedList) {
- OutputString.append(Sym.str());
- OutputString.append(1, '\0');
- }
- OS << OutputString;
- return sampleprof_error::success;
- }
- void ProfileSymbolList::dump(raw_ostream &OS) const {
- OS << "======== Dump profile symbol list ========\n";
- std::vector<StringRef> SortedList(Syms.begin(), Syms.end());
- llvm::sort(SortedList);
- for (auto &Sym : SortedList)
- OS << Sym << "\n";
- }
|