1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210 |
- //===-- sancov.cpp --------------------------------------------------------===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- // This file is a command-line tool for reading and analyzing sanitizer
- // coverage.
- //===----------------------------------------------------------------------===//
- #include "llvm/ADT/STLExtras.h"
- #include "llvm/ADT/StringExtras.h"
- #include "llvm/ADT/Twine.h"
- #include "llvm/DebugInfo/Symbolize/SymbolizableModule.h"
- #include "llvm/DebugInfo/Symbolize/Symbolize.h"
- #include "llvm/MC/MCAsmInfo.h"
- #include "llvm/MC/MCContext.h"
- #include "llvm/MC/MCDisassembler/MCDisassembler.h"
- #include "llvm/MC/MCInst.h"
- #include "llvm/MC/MCInstrAnalysis.h"
- #include "llvm/MC/MCInstrInfo.h"
- #include "llvm/MC/MCObjectFileInfo.h"
- #include "llvm/MC/MCRegisterInfo.h"
- #include "llvm/MC/MCSubtargetInfo.h"
- #include "llvm/MC/MCTargetOptions.h"
- #include "llvm/MC/TargetRegistry.h"
- #include "llvm/Object/Archive.h"
- #include "llvm/Object/Binary.h"
- #include "llvm/Object/COFF.h"
- #include "llvm/Object/MachO.h"
- #include "llvm/Object/ObjectFile.h"
- #include "llvm/Support/Casting.h"
- #include "llvm/Support/CommandLine.h"
- #include "llvm/Support/Errc.h"
- #include "llvm/Support/ErrorOr.h"
- #include "llvm/Support/FileSystem.h"
- #include "llvm/Support/InitLLVM.h"
- #include "llvm/Support/JSON.h"
- #include "llvm/Support/MD5.h"
- #include "llvm/Support/MemoryBuffer.h"
- #include "llvm/Support/Path.h"
- #include "llvm/Support/Regex.h"
- #include "llvm/Support/SHA1.h"
- #include "llvm/Support/SourceMgr.h"
- #include "llvm/Support/SpecialCaseList.h"
- #include "llvm/Support/TargetSelect.h"
- #include "llvm/Support/VirtualFileSystem.h"
- #include "llvm/Support/YAMLParser.h"
- #include "llvm/Support/raw_ostream.h"
- #include <set>
- #include <vector>
- using namespace llvm;
- namespace {
- // --------- COMMAND LINE FLAGS ---------
- cl::OptionCategory Cat("sancov Options");
- enum ActionType {
- CoveredFunctionsAction,
- HtmlReportAction,
- MergeAction,
- NotCoveredFunctionsAction,
- PrintAction,
- PrintCovPointsAction,
- StatsAction,
- SymbolizeAction
- };
- cl::opt<ActionType> Action(
- cl::desc("Action (required)"), cl::Required,
- cl::values(
- clEnumValN(PrintAction, "print", "Print coverage addresses"),
- clEnumValN(PrintCovPointsAction, "print-coverage-pcs",
- "Print coverage instrumentation points addresses."),
- clEnumValN(CoveredFunctionsAction, "covered-functions",
- "Print all covered funcions."),
- clEnumValN(NotCoveredFunctionsAction, "not-covered-functions",
- "Print all not covered funcions."),
- clEnumValN(StatsAction, "print-coverage-stats",
- "Print coverage statistics."),
- clEnumValN(HtmlReportAction, "html-report",
- "REMOVED. Use -symbolize & coverage-report-server.py."),
- clEnumValN(SymbolizeAction, "symbolize",
- "Produces a symbolized JSON report from binary report."),
- clEnumValN(MergeAction, "merge", "Merges reports.")),
- cl::cat(Cat));
- static cl::list<std::string>
- ClInputFiles(cl::Positional, cl::OneOrMore,
- cl::desc("<action> <binary files...> <.sancov files...> "
- "<.symcov files...>"),
- cl::cat(Cat));
- static cl::opt<bool> ClDemangle("demangle", cl::init(true),
- cl::desc("Print demangled function name"),
- cl::cat(Cat));
- static cl::opt<bool>
- ClSkipDeadFiles("skip-dead-files", cl::init(true),
- cl::desc("Do not list dead source files in reports"),
- cl::cat(Cat));
- static cl::opt<std::string>
- ClStripPathPrefix("strip_path_prefix", cl::init(""),
- cl::desc("Strip this prefix from file paths in reports"),
- cl::cat(Cat));
- static cl::opt<std::string>
- ClIgnorelist("ignorelist", cl::init(""),
- cl::desc("Ignorelist file (sanitizer ignorelist format)"),
- cl::cat(Cat));
- static cl::opt<bool> ClUseDefaultIgnorelist(
- "use_default_ignorelist", cl::init(true), cl::Hidden,
- cl::desc("Controls if default ignorelist should be used"), cl::cat(Cat));
- static const char *const DefaultIgnorelistStr = "fun:__sanitizer_.*\n"
- "src:/usr/include/.*\n"
- "src:.*/libc\\+\\+/.*\n";
- // --------- FORMAT SPECIFICATION ---------
- struct FileHeader {
- uint32_t Bitness;
- uint32_t Magic;
- };
- static const uint32_t BinCoverageMagic = 0xC0BFFFFF;
- static const uint32_t Bitness32 = 0xFFFFFF32;
- static const uint32_t Bitness64 = 0xFFFFFF64;
- static const Regex SancovFileRegex("(.*)\\.[0-9]+\\.sancov");
- static const Regex SymcovFileRegex(".*\\.symcov");
- // --------- MAIN DATASTRUCTURES ----------
- // Contents of .sancov file: list of coverage point addresses that were
- // executed.
- struct RawCoverage {
- explicit RawCoverage(std::unique_ptr<std::set<uint64_t>> Addrs)
- : Addrs(std::move(Addrs)) {}
- // Read binary .sancov file.
- static ErrorOr<std::unique_ptr<RawCoverage>>
- read(const std::string &FileName);
- std::unique_ptr<std::set<uint64_t>> Addrs;
- };
- // Coverage point has an opaque Id and corresponds to multiple source locations.
- struct CoveragePoint {
- explicit CoveragePoint(const std::string &Id) : Id(Id) {}
- std::string Id;
- SmallVector<DILineInfo, 1> Locs;
- };
- // Symcov file content: set of covered Ids plus information about all available
- // coverage points.
- struct SymbolizedCoverage {
- // Read json .symcov file.
- static std::unique_ptr<SymbolizedCoverage> read(const std::string &InputFile);
- std::set<std::string> CoveredIds;
- std::string BinaryHash;
- std::vector<CoveragePoint> Points;
- };
- struct CoverageStats {
- size_t AllPoints;
- size_t CovPoints;
- size_t AllFns;
- size_t CovFns;
- };
- // --------- ERROR HANDLING ---------
- static void fail(const llvm::Twine &E) {
- errs() << "ERROR: " << E << "\n";
- exit(1);
- }
- static void failIf(bool B, const llvm::Twine &E) {
- if (B)
- fail(E);
- }
- static void failIfError(std::error_code Error) {
- if (!Error)
- return;
- errs() << "ERROR: " << Error.message() << "(" << Error.value() << ")\n";
- exit(1);
- }
- template <typename T> static void failIfError(const ErrorOr<T> &E) {
- failIfError(E.getError());
- }
- static void failIfError(Error Err) {
- if (Err) {
- logAllUnhandledErrors(std::move(Err), errs(), "ERROR: ");
- exit(1);
- }
- }
- template <typename T> static void failIfError(Expected<T> &E) {
- failIfError(E.takeError());
- }
- static void failIfNotEmpty(const llvm::Twine &E) {
- if (E.str().empty())
- return;
- fail(E);
- }
- template <typename T>
- static void failIfEmpty(const std::unique_ptr<T> &Ptr,
- const std::string &Message) {
- if (Ptr.get())
- return;
- fail(Message);
- }
- // ----------- Coverage I/O ----------
- template <typename T>
- static void readInts(const char *Start, const char *End,
- std::set<uint64_t> *Ints) {
- const T *S = reinterpret_cast<const T *>(Start);
- const T *E = reinterpret_cast<const T *>(End);
- std::copy(S, E, std::inserter(*Ints, Ints->end()));
- }
- ErrorOr<std::unique_ptr<RawCoverage>>
- RawCoverage::read(const std::string &FileName) {
- ErrorOr<std::unique_ptr<MemoryBuffer>> BufOrErr =
- MemoryBuffer::getFile(FileName);
- if (!BufOrErr)
- return BufOrErr.getError();
- std::unique_ptr<MemoryBuffer> Buf = std::move(BufOrErr.get());
- if (Buf->getBufferSize() < 8) {
- errs() << "File too small (<8): " << Buf->getBufferSize() << '\n';
- return make_error_code(errc::illegal_byte_sequence);
- }
- const FileHeader *Header =
- reinterpret_cast<const FileHeader *>(Buf->getBufferStart());
- if (Header->Magic != BinCoverageMagic) {
- errs() << "Wrong magic: " << Header->Magic << '\n';
- return make_error_code(errc::illegal_byte_sequence);
- }
- auto Addrs = std::make_unique<std::set<uint64_t>>();
- switch (Header->Bitness) {
- case Bitness64:
- readInts<uint64_t>(Buf->getBufferStart() + 8, Buf->getBufferEnd(),
- Addrs.get());
- break;
- case Bitness32:
- readInts<uint32_t>(Buf->getBufferStart() + 8, Buf->getBufferEnd(),
- Addrs.get());
- break;
- default:
- errs() << "Unsupported bitness: " << Header->Bitness << '\n';
- return make_error_code(errc::illegal_byte_sequence);
- }
- // Ignore slots that are zero, so a runtime implementation is not required
- // to compactify the data.
- Addrs->erase(0);
- return std::unique_ptr<RawCoverage>(new RawCoverage(std::move(Addrs)));
- }
- // Print coverage addresses.
- raw_ostream &operator<<(raw_ostream &OS, const RawCoverage &CoverageData) {
- for (auto Addr : *CoverageData.Addrs) {
- OS << "0x";
- OS.write_hex(Addr);
- OS << "\n";
- }
- return OS;
- }
- static raw_ostream &operator<<(raw_ostream &OS, const CoverageStats &Stats) {
- OS << "all-edges: " << Stats.AllPoints << "\n";
- OS << "cov-edges: " << Stats.CovPoints << "\n";
- OS << "all-functions: " << Stats.AllFns << "\n";
- OS << "cov-functions: " << Stats.CovFns << "\n";
- return OS;
- }
- // Output symbolized information for coverage points in JSON.
- // Format:
- // {
- // '<file_name>' : {
- // '<function_name>' : {
- // '<point_id'> : '<line_number>:'<column_number'.
- // ....
- // }
- // }
- // }
- static void operator<<(json::OStream &W,
- const std::vector<CoveragePoint> &Points) {
- // Group points by file.
- std::map<std::string, std::vector<const CoveragePoint *>> PointsByFile;
- for (const auto &Point : Points) {
- for (const DILineInfo &Loc : Point.Locs) {
- PointsByFile[Loc.FileName].push_back(&Point);
- }
- }
- for (const auto &P : PointsByFile) {
- std::string FileName = P.first;
- std::map<std::string, std::vector<const CoveragePoint *>> PointsByFn;
- for (auto PointPtr : P.second) {
- for (const DILineInfo &Loc : PointPtr->Locs) {
- PointsByFn[Loc.FunctionName].push_back(PointPtr);
- }
- }
- W.attributeObject(P.first, [&] {
- // Group points by function.
- for (const auto &P : PointsByFn) {
- std::string FunctionName = P.first;
- std::set<std::string> WrittenIds;
- W.attributeObject(FunctionName, [&] {
- for (const CoveragePoint *Point : P.second) {
- for (const auto &Loc : Point->Locs) {
- if (Loc.FileName != FileName || Loc.FunctionName != FunctionName)
- continue;
- if (WrittenIds.find(Point->Id) != WrittenIds.end())
- continue;
- // Output <point_id> : "<line>:<col>".
- WrittenIds.insert(Point->Id);
- W.attribute(Point->Id,
- (utostr(Loc.Line) + ":" + utostr(Loc.Column)));
- }
- }
- });
- }
- });
- }
- }
- static void operator<<(json::OStream &W, const SymbolizedCoverage &C) {
- W.object([&] {
- W.attributeArray("covered-points", [&] {
- for (const std::string &P : C.CoveredIds) {
- W.value(P);
- }
- });
- W.attribute("binary-hash", C.BinaryHash);
- W.attributeObject("point-symbol-info", [&] { W << C.Points; });
- });
- }
- static std::string parseScalarString(yaml::Node *N) {
- SmallString<64> StringStorage;
- yaml::ScalarNode *S = dyn_cast<yaml::ScalarNode>(N);
- failIf(!S, "expected string");
- return std::string(S->getValue(StringStorage));
- }
- std::unique_ptr<SymbolizedCoverage>
- SymbolizedCoverage::read(const std::string &InputFile) {
- auto Coverage(std::make_unique<SymbolizedCoverage>());
- std::map<std::string, CoveragePoint> Points;
- ErrorOr<std::unique_ptr<MemoryBuffer>> BufOrErr =
- MemoryBuffer::getFile(InputFile);
- failIfError(BufOrErr);
- SourceMgr SM;
- yaml::Stream S(**BufOrErr, SM);
- yaml::document_iterator DI = S.begin();
- failIf(DI == S.end(), "empty document: " + InputFile);
- yaml::Node *Root = DI->getRoot();
- failIf(!Root, "expecting root node: " + InputFile);
- yaml::MappingNode *Top = dyn_cast<yaml::MappingNode>(Root);
- failIf(!Top, "expecting mapping node: " + InputFile);
- for (auto &KVNode : *Top) {
- auto Key = parseScalarString(KVNode.getKey());
- if (Key == "covered-points") {
- yaml::SequenceNode *Points =
- dyn_cast<yaml::SequenceNode>(KVNode.getValue());
- failIf(!Points, "expected array: " + InputFile);
- for (auto I = Points->begin(), E = Points->end(); I != E; ++I) {
- Coverage->CoveredIds.insert(parseScalarString(&*I));
- }
- } else if (Key == "binary-hash") {
- Coverage->BinaryHash = parseScalarString(KVNode.getValue());
- } else if (Key == "point-symbol-info") {
- yaml::MappingNode *PointSymbolInfo =
- dyn_cast<yaml::MappingNode>(KVNode.getValue());
- failIf(!PointSymbolInfo, "expected mapping node: " + InputFile);
- for (auto &FileKVNode : *PointSymbolInfo) {
- auto Filename = parseScalarString(FileKVNode.getKey());
- yaml::MappingNode *FileInfo =
- dyn_cast<yaml::MappingNode>(FileKVNode.getValue());
- failIf(!FileInfo, "expected mapping node: " + InputFile);
- for (auto &FunctionKVNode : *FileInfo) {
- auto FunctionName = parseScalarString(FunctionKVNode.getKey());
- yaml::MappingNode *FunctionInfo =
- dyn_cast<yaml::MappingNode>(FunctionKVNode.getValue());
- failIf(!FunctionInfo, "expected mapping node: " + InputFile);
- for (auto &PointKVNode : *FunctionInfo) {
- auto PointId = parseScalarString(PointKVNode.getKey());
- auto Loc = parseScalarString(PointKVNode.getValue());
- size_t ColonPos = Loc.find(':');
- failIf(ColonPos == std::string::npos, "expected ':': " + InputFile);
- auto LineStr = Loc.substr(0, ColonPos);
- auto ColStr = Loc.substr(ColonPos + 1, Loc.size());
- if (Points.find(PointId) == Points.end())
- Points.insert(std::make_pair(PointId, CoveragePoint(PointId)));
- DILineInfo LineInfo;
- LineInfo.FileName = Filename;
- LineInfo.FunctionName = FunctionName;
- char *End;
- LineInfo.Line = std::strtoul(LineStr.c_str(), &End, 10);
- LineInfo.Column = std::strtoul(ColStr.c_str(), &End, 10);
- CoveragePoint *CoveragePoint = &Points.find(PointId)->second;
- CoveragePoint->Locs.push_back(LineInfo);
- }
- }
- }
- } else {
- errs() << "Ignoring unknown key: " << Key << "\n";
- }
- }
- for (auto &KV : Points) {
- Coverage->Points.push_back(KV.second);
- }
- return Coverage;
- }
- // ---------- MAIN FUNCTIONALITY ----------
- std::string stripPathPrefix(std::string Path) {
- if (ClStripPathPrefix.empty())
- return Path;
- size_t Pos = Path.find(ClStripPathPrefix);
- if (Pos == std::string::npos)
- return Path;
- return Path.substr(Pos + ClStripPathPrefix.size());
- }
- static std::unique_ptr<symbolize::LLVMSymbolizer> createSymbolizer() {
- symbolize::LLVMSymbolizer::Options SymbolizerOptions;
- SymbolizerOptions.Demangle = ClDemangle;
- SymbolizerOptions.UseSymbolTable = true;
- return std::unique_ptr<symbolize::LLVMSymbolizer>(
- new symbolize::LLVMSymbolizer(SymbolizerOptions));
- }
- static std::string normalizeFilename(const std::string &FileName) {
- SmallString<256> S(FileName);
- sys::path::remove_dots(S, /* remove_dot_dot */ true);
- return stripPathPrefix(sys::path::convert_to_slash(std::string(S)));
- }
- class Ignorelists {
- public:
- Ignorelists()
- : DefaultIgnorelist(createDefaultIgnorelist()),
- UserIgnorelist(createUserIgnorelist()) {}
- bool isIgnorelisted(const DILineInfo &I) {
- if (DefaultIgnorelist &&
- DefaultIgnorelist->inSection("sancov", "fun", I.FunctionName))
- return true;
- if (DefaultIgnorelist &&
- DefaultIgnorelist->inSection("sancov", "src", I.FileName))
- return true;
- if (UserIgnorelist &&
- UserIgnorelist->inSection("sancov", "fun", I.FunctionName))
- return true;
- if (UserIgnorelist &&
- UserIgnorelist->inSection("sancov", "src", I.FileName))
- return true;
- return false;
- }
- private:
- static std::unique_ptr<SpecialCaseList> createDefaultIgnorelist() {
- if (!ClUseDefaultIgnorelist)
- return std::unique_ptr<SpecialCaseList>();
- std::unique_ptr<MemoryBuffer> MB =
- MemoryBuffer::getMemBuffer(DefaultIgnorelistStr);
- std::string Error;
- auto Ignorelist = SpecialCaseList::create(MB.get(), Error);
- failIfNotEmpty(Error);
- return Ignorelist;
- }
- static std::unique_ptr<SpecialCaseList> createUserIgnorelist() {
- if (ClIgnorelist.empty())
- return std::unique_ptr<SpecialCaseList>();
- return SpecialCaseList::createOrDie({{ClIgnorelist}},
- *vfs::getRealFileSystem());
- }
- std::unique_ptr<SpecialCaseList> DefaultIgnorelist;
- std::unique_ptr<SpecialCaseList> UserIgnorelist;
- };
- static std::vector<CoveragePoint>
- getCoveragePoints(const std::string &ObjectFile,
- const std::set<uint64_t> &Addrs,
- const std::set<uint64_t> &CoveredAddrs) {
- std::vector<CoveragePoint> Result;
- auto Symbolizer(createSymbolizer());
- Ignorelists Ig;
- std::set<std::string> CoveredFiles;
- if (ClSkipDeadFiles) {
- for (auto Addr : CoveredAddrs) {
- // TODO: it would be neccessary to set proper section index here.
- // object::SectionedAddress::UndefSection works for only absolute
- // addresses.
- object::SectionedAddress ModuleAddress = {
- Addr, object::SectionedAddress::UndefSection};
- auto LineInfo = Symbolizer->symbolizeCode(ObjectFile, ModuleAddress);
- failIfError(LineInfo);
- CoveredFiles.insert(LineInfo->FileName);
- auto InliningInfo =
- Symbolizer->symbolizeInlinedCode(ObjectFile, ModuleAddress);
- failIfError(InliningInfo);
- for (uint32_t I = 0; I < InliningInfo->getNumberOfFrames(); ++I) {
- auto FrameInfo = InliningInfo->getFrame(I);
- CoveredFiles.insert(FrameInfo.FileName);
- }
- }
- }
- for (auto Addr : Addrs) {
- std::set<DILineInfo> Infos; // deduplicate debug info.
- // TODO: it would be neccessary to set proper section index here.
- // object::SectionedAddress::UndefSection works for only absolute addresses.
- object::SectionedAddress ModuleAddress = {
- Addr, object::SectionedAddress::UndefSection};
- auto LineInfo = Symbolizer->symbolizeCode(ObjectFile, ModuleAddress);
- failIfError(LineInfo);
- if (ClSkipDeadFiles &&
- CoveredFiles.find(LineInfo->FileName) == CoveredFiles.end())
- continue;
- LineInfo->FileName = normalizeFilename(LineInfo->FileName);
- if (Ig.isIgnorelisted(*LineInfo))
- continue;
- auto Id = utohexstr(Addr, true);
- auto Point = CoveragePoint(Id);
- Infos.insert(*LineInfo);
- Point.Locs.push_back(*LineInfo);
- auto InliningInfo =
- Symbolizer->symbolizeInlinedCode(ObjectFile, ModuleAddress);
- failIfError(InliningInfo);
- for (uint32_t I = 0; I < InliningInfo->getNumberOfFrames(); ++I) {
- auto FrameInfo = InliningInfo->getFrame(I);
- if (ClSkipDeadFiles &&
- CoveredFiles.find(FrameInfo.FileName) == CoveredFiles.end())
- continue;
- FrameInfo.FileName = normalizeFilename(FrameInfo.FileName);
- if (Ig.isIgnorelisted(FrameInfo))
- continue;
- if (Infos.find(FrameInfo) == Infos.end()) {
- Infos.insert(FrameInfo);
- Point.Locs.push_back(FrameInfo);
- }
- }
- Result.push_back(Point);
- }
- return Result;
- }
- static bool isCoveragePointSymbol(StringRef Name) {
- return Name == "__sanitizer_cov" || Name == "__sanitizer_cov_with_check" ||
- Name == "__sanitizer_cov_trace_func_enter" ||
- Name == "__sanitizer_cov_trace_pc_guard" ||
- // Mac has '___' prefix
- Name == "___sanitizer_cov" || Name == "___sanitizer_cov_with_check" ||
- Name == "___sanitizer_cov_trace_func_enter" ||
- Name == "___sanitizer_cov_trace_pc_guard";
- }
- // Locate __sanitizer_cov* function addresses inside the stubs table on MachO.
- static void findMachOIndirectCovFunctions(const object::MachOObjectFile &O,
- std::set<uint64_t> *Result) {
- MachO::dysymtab_command Dysymtab = O.getDysymtabLoadCommand();
- MachO::symtab_command Symtab = O.getSymtabLoadCommand();
- for (const auto &Load : O.load_commands()) {
- if (Load.C.cmd == MachO::LC_SEGMENT_64) {
- MachO::segment_command_64 Seg = O.getSegment64LoadCommand(Load);
- for (unsigned J = 0; J < Seg.nsects; ++J) {
- MachO::section_64 Sec = O.getSection64(Load, J);
- uint32_t SectionType = Sec.flags & MachO::SECTION_TYPE;
- if (SectionType == MachO::S_SYMBOL_STUBS) {
- uint32_t Stride = Sec.reserved2;
- uint32_t Cnt = Sec.size / Stride;
- uint32_t N = Sec.reserved1;
- for (uint32_t J = 0; J < Cnt && N + J < Dysymtab.nindirectsyms; J++) {
- uint32_t IndirectSymbol =
- O.getIndirectSymbolTableEntry(Dysymtab, N + J);
- uint64_t Addr = Sec.addr + J * Stride;
- if (IndirectSymbol < Symtab.nsyms) {
- object::SymbolRef Symbol = *(O.getSymbolByIndex(IndirectSymbol));
- Expected<StringRef> Name = Symbol.getName();
- failIfError(Name);
- if (isCoveragePointSymbol(Name.get())) {
- Result->insert(Addr);
- }
- }
- }
- }
- }
- }
- if (Load.C.cmd == MachO::LC_SEGMENT) {
- errs() << "ERROR: 32 bit MachO binaries not supported\n";
- }
- }
- }
- // Locate __sanitizer_cov* function addresses that are used for coverage
- // reporting.
- static std::set<uint64_t>
- findSanitizerCovFunctions(const object::ObjectFile &O) {
- std::set<uint64_t> Result;
- for (const object::SymbolRef &Symbol : O.symbols()) {
- Expected<uint64_t> AddressOrErr = Symbol.getAddress();
- failIfError(AddressOrErr);
- uint64_t Address = AddressOrErr.get();
- Expected<StringRef> NameOrErr = Symbol.getName();
- failIfError(NameOrErr);
- StringRef Name = NameOrErr.get();
- Expected<uint32_t> FlagsOrErr = Symbol.getFlags();
- // TODO: Test this error.
- failIfError(FlagsOrErr);
- uint32_t Flags = FlagsOrErr.get();
- if (!(Flags & object::BasicSymbolRef::SF_Undefined) &&
- isCoveragePointSymbol(Name)) {
- Result.insert(Address);
- }
- }
- if (const auto *CO = dyn_cast<object::COFFObjectFile>(&O)) {
- for (const object::ExportDirectoryEntryRef &Export :
- CO->export_directories()) {
- uint32_t RVA;
- failIfError(Export.getExportRVA(RVA));
- StringRef Name;
- failIfError(Export.getSymbolName(Name));
- if (isCoveragePointSymbol(Name))
- Result.insert(CO->getImageBase() + RVA);
- }
- }
- if (const auto *MO = dyn_cast<object::MachOObjectFile>(&O)) {
- findMachOIndirectCovFunctions(*MO, &Result);
- }
- return Result;
- }
- // Ported from
- // compiler-rt/lib/sanitizer_common/sanitizer_stacktrace.h:GetPreviousInstructionPc
- // GetPreviousInstructionPc.
- static uint64_t getPreviousInstructionPc(uint64_t PC,
- Triple TheTriple) {
- if (TheTriple.isARM())
- return (PC - 3) & (~1);
- if (TheTriple.isMIPS() || TheTriple.isSPARC())
- return PC - 8;
- if (TheTriple.isRISCV())
- return PC - 2;
- if (TheTriple.isX86() || TheTriple.isSystemZ())
- return PC - 1;
- return PC - 4;
- }
- // Locate addresses of all coverage points in a file. Coverage point
- // is defined as the 'address of instruction following __sanitizer_cov
- // call - 1'.
- static void getObjectCoveragePoints(const object::ObjectFile &O,
- std::set<uint64_t> *Addrs) {
- Triple TheTriple("unknown-unknown-unknown");
- TheTriple.setArch(Triple::ArchType(O.getArch()));
- auto TripleName = TheTriple.getTriple();
- std::string Error;
- const Target *TheTarget = TargetRegistry::lookupTarget(TripleName, Error);
- failIfNotEmpty(Error);
- std::unique_ptr<const MCSubtargetInfo> STI(
- TheTarget->createMCSubtargetInfo(TripleName, "", ""));
- failIfEmpty(STI, "no subtarget info for target " + TripleName);
- std::unique_ptr<const MCRegisterInfo> MRI(
- TheTarget->createMCRegInfo(TripleName));
- failIfEmpty(MRI, "no register info for target " + TripleName);
- MCTargetOptions MCOptions;
- std::unique_ptr<const MCAsmInfo> AsmInfo(
- TheTarget->createMCAsmInfo(*MRI, TripleName, MCOptions));
- failIfEmpty(AsmInfo, "no asm info for target " + TripleName);
- MCContext Ctx(TheTriple, AsmInfo.get(), MRI.get(), STI.get());
- std::unique_ptr<MCDisassembler> DisAsm(
- TheTarget->createMCDisassembler(*STI, Ctx));
- failIfEmpty(DisAsm, "no disassembler info for target " + TripleName);
- std::unique_ptr<const MCInstrInfo> MII(TheTarget->createMCInstrInfo());
- failIfEmpty(MII, "no instruction info for target " + TripleName);
- std::unique_ptr<const MCInstrAnalysis> MIA(
- TheTarget->createMCInstrAnalysis(MII.get()));
- failIfEmpty(MIA, "no instruction analysis info for target " + TripleName);
- auto SanCovAddrs = findSanitizerCovFunctions(O);
- if (SanCovAddrs.empty())
- fail("__sanitizer_cov* functions not found");
- for (object::SectionRef Section : O.sections()) {
- if (Section.isVirtual() || !Section.isText()) // llvm-objdump does the same.
- continue;
- uint64_t SectionAddr = Section.getAddress();
- uint64_t SectSize = Section.getSize();
- if (!SectSize)
- continue;
- Expected<StringRef> BytesStr = Section.getContents();
- failIfError(BytesStr);
- ArrayRef<uint8_t> Bytes = arrayRefFromStringRef(*BytesStr);
- for (uint64_t Index = 0, Size = 0; Index < Section.getSize();
- Index += Size) {
- MCInst Inst;
- ArrayRef<uint8_t> ThisBytes = Bytes.slice(Index);
- uint64_t ThisAddr = SectionAddr + Index;
- if (!DisAsm->getInstruction(Inst, Size, ThisBytes, ThisAddr, nulls())) {
- if (Size == 0)
- Size = std::min<uint64_t>(
- ThisBytes.size(),
- DisAsm->suggestBytesToSkip(ThisBytes, ThisAddr));
- continue;
- }
- uint64_t Addr = Index + SectionAddr;
- // Sanitizer coverage uses the address of the next instruction - 1.
- uint64_t CovPoint = getPreviousInstructionPc(Addr + Size, TheTriple);
- uint64_t Target;
- if (MIA->isCall(Inst) &&
- MIA->evaluateBranch(Inst, SectionAddr + Index, Size, Target) &&
- SanCovAddrs.find(Target) != SanCovAddrs.end())
- Addrs->insert(CovPoint);
- }
- }
- }
- static void
- visitObjectFiles(const object::Archive &A,
- function_ref<void(const object::ObjectFile &)> Fn) {
- Error Err = Error::success();
- for (auto &C : A.children(Err)) {
- Expected<std::unique_ptr<object::Binary>> ChildOrErr = C.getAsBinary();
- failIfError(ChildOrErr);
- if (auto *O = dyn_cast<object::ObjectFile>(&*ChildOrErr.get()))
- Fn(*O);
- else
- failIfError(object::object_error::invalid_file_type);
- }
- failIfError(std::move(Err));
- }
- static void
- visitObjectFiles(const std::string &FileName,
- function_ref<void(const object::ObjectFile &)> Fn) {
- Expected<object::OwningBinary<object::Binary>> BinaryOrErr =
- object::createBinary(FileName);
- if (!BinaryOrErr)
- failIfError(BinaryOrErr);
- object::Binary &Binary = *BinaryOrErr.get().getBinary();
- if (object::Archive *A = dyn_cast<object::Archive>(&Binary))
- visitObjectFiles(*A, Fn);
- else if (object::ObjectFile *O = dyn_cast<object::ObjectFile>(&Binary))
- Fn(*O);
- else
- failIfError(object::object_error::invalid_file_type);
- }
- static std::set<uint64_t>
- findSanitizerCovFunctions(const std::string &FileName) {
- std::set<uint64_t> Result;
- visitObjectFiles(FileName, [&](const object::ObjectFile &O) {
- auto Addrs = findSanitizerCovFunctions(O);
- Result.insert(Addrs.begin(), Addrs.end());
- });
- return Result;
- }
- // Locate addresses of all coverage points in a file. Coverage point
- // is defined as the 'address of instruction following __sanitizer_cov
- // call - 1'.
- static std::set<uint64_t> findCoveragePointAddrs(const std::string &FileName) {
- std::set<uint64_t> Result;
- visitObjectFiles(FileName, [&](const object::ObjectFile &O) {
- getObjectCoveragePoints(O, &Result);
- });
- return Result;
- }
- static void printCovPoints(const std::string &ObjFile, raw_ostream &OS) {
- for (uint64_t Addr : findCoveragePointAddrs(ObjFile)) {
- OS << "0x";
- OS.write_hex(Addr);
- OS << "\n";
- }
- }
- static ErrorOr<bool> isCoverageFile(const std::string &FileName) {
- auto ShortFileName = llvm::sys::path::filename(FileName);
- if (!SancovFileRegex.match(ShortFileName))
- return false;
- ErrorOr<std::unique_ptr<MemoryBuffer>> BufOrErr =
- MemoryBuffer::getFile(FileName);
- if (!BufOrErr) {
- errs() << "Warning: " << BufOrErr.getError().message() << "("
- << BufOrErr.getError().value()
- << "), filename: " << llvm::sys::path::filename(FileName) << "\n";
- return BufOrErr.getError();
- }
- std::unique_ptr<MemoryBuffer> Buf = std::move(BufOrErr.get());
- if (Buf->getBufferSize() < 8) {
- return false;
- }
- const FileHeader *Header =
- reinterpret_cast<const FileHeader *>(Buf->getBufferStart());
- return Header->Magic == BinCoverageMagic;
- }
- static bool isSymbolizedCoverageFile(const std::string &FileName) {
- auto ShortFileName = llvm::sys::path::filename(FileName);
- return SymcovFileRegex.match(ShortFileName);
- }
- static std::unique_ptr<SymbolizedCoverage>
- symbolize(const RawCoverage &Data, const std::string ObjectFile) {
- auto Coverage = std::make_unique<SymbolizedCoverage>();
- ErrorOr<std::unique_ptr<MemoryBuffer>> BufOrErr =
- MemoryBuffer::getFile(ObjectFile);
- failIfError(BufOrErr);
- SHA1 Hasher;
- Hasher.update((*BufOrErr)->getBuffer());
- Coverage->BinaryHash = toHex(Hasher.final());
- Ignorelists Ig;
- auto Symbolizer(createSymbolizer());
- for (uint64_t Addr : *Data.Addrs) {
- // TODO: it would be neccessary to set proper section index here.
- // object::SectionedAddress::UndefSection works for only absolute addresses.
- auto LineInfo = Symbolizer->symbolizeCode(
- ObjectFile, {Addr, object::SectionedAddress::UndefSection});
- failIfError(LineInfo);
- if (Ig.isIgnorelisted(*LineInfo))
- continue;
- Coverage->CoveredIds.insert(utohexstr(Addr, true));
- }
- std::set<uint64_t> AllAddrs = findCoveragePointAddrs(ObjectFile);
- if (!std::includes(AllAddrs.begin(), AllAddrs.end(), Data.Addrs->begin(),
- Data.Addrs->end())) {
- fail("Coverage points in binary and .sancov file do not match.");
- }
- Coverage->Points = getCoveragePoints(ObjectFile, AllAddrs, *Data.Addrs);
- return Coverage;
- }
- struct FileFn {
- bool operator<(const FileFn &RHS) const {
- return std::tie(FileName, FunctionName) <
- std::tie(RHS.FileName, RHS.FunctionName);
- }
- std::string FileName;
- std::string FunctionName;
- };
- static std::set<FileFn>
- computeFunctions(const std::vector<CoveragePoint> &Points) {
- std::set<FileFn> Fns;
- for (const auto &Point : Points) {
- for (const auto &Loc : Point.Locs) {
- Fns.insert(FileFn{Loc.FileName, Loc.FunctionName});
- }
- }
- return Fns;
- }
- static std::set<FileFn>
- computeNotCoveredFunctions(const SymbolizedCoverage &Coverage) {
- auto Fns = computeFunctions(Coverage.Points);
- for (const auto &Point : Coverage.Points) {
- if (Coverage.CoveredIds.find(Point.Id) == Coverage.CoveredIds.end())
- continue;
- for (const auto &Loc : Point.Locs) {
- Fns.erase(FileFn{Loc.FileName, Loc.FunctionName});
- }
- }
- return Fns;
- }
- static std::set<FileFn>
- computeCoveredFunctions(const SymbolizedCoverage &Coverage) {
- auto AllFns = computeFunctions(Coverage.Points);
- std::set<FileFn> Result;
- for (const auto &Point : Coverage.Points) {
- if (Coverage.CoveredIds.find(Point.Id) == Coverage.CoveredIds.end())
- continue;
- for (const auto &Loc : Point.Locs) {
- Result.insert(FileFn{Loc.FileName, Loc.FunctionName});
- }
- }
- return Result;
- }
- typedef std::map<FileFn, std::pair<uint32_t, uint32_t>> FunctionLocs;
- // finds first location in a file for each function.
- static FunctionLocs resolveFunctions(const SymbolizedCoverage &Coverage,
- const std::set<FileFn> &Fns) {
- FunctionLocs Result;
- for (const auto &Point : Coverage.Points) {
- for (const auto &Loc : Point.Locs) {
- FileFn Fn = FileFn{Loc.FileName, Loc.FunctionName};
- if (Fns.find(Fn) == Fns.end())
- continue;
- auto P = std::make_pair(Loc.Line, Loc.Column);
- auto I = Result.find(Fn);
- if (I == Result.end() || I->second > P) {
- Result[Fn] = P;
- }
- }
- }
- return Result;
- }
- static void printFunctionLocs(const FunctionLocs &FnLocs, raw_ostream &OS) {
- for (const auto &P : FnLocs) {
- OS << stripPathPrefix(P.first.FileName) << ":" << P.second.first << " "
- << P.first.FunctionName << "\n";
- }
- }
- CoverageStats computeStats(const SymbolizedCoverage &Coverage) {
- CoverageStats Stats = {Coverage.Points.size(), Coverage.CoveredIds.size(),
- computeFunctions(Coverage.Points).size(),
- computeCoveredFunctions(Coverage).size()};
- return Stats;
- }
- // Print list of covered functions.
- // Line format: <file_name>:<line> <function_name>
- static void printCoveredFunctions(const SymbolizedCoverage &CovData,
- raw_ostream &OS) {
- auto CoveredFns = computeCoveredFunctions(CovData);
- printFunctionLocs(resolveFunctions(CovData, CoveredFns), OS);
- }
- // Print list of not covered functions.
- // Line format: <file_name>:<line> <function_name>
- static void printNotCoveredFunctions(const SymbolizedCoverage &CovData,
- raw_ostream &OS) {
- auto NotCoveredFns = computeNotCoveredFunctions(CovData);
- printFunctionLocs(resolveFunctions(CovData, NotCoveredFns), OS);
- }
- // Read list of files and merges their coverage info.
- static void readAndPrintRawCoverage(const std::vector<std::string> &FileNames,
- raw_ostream &OS) {
- std::vector<std::unique_ptr<RawCoverage>> Covs;
- for (const auto &FileName : FileNames) {
- auto Cov = RawCoverage::read(FileName);
- if (!Cov)
- continue;
- OS << *Cov.get();
- }
- }
- static std::unique_ptr<SymbolizedCoverage>
- merge(const std::vector<std::unique_ptr<SymbolizedCoverage>> &Coverages) {
- if (Coverages.empty())
- return nullptr;
- auto Result = std::make_unique<SymbolizedCoverage>();
- for (size_t I = 0; I < Coverages.size(); ++I) {
- const SymbolizedCoverage &Coverage = *Coverages[I];
- std::string Prefix;
- if (Coverages.size() > 1) {
- // prefix is not needed when there's only one file.
- Prefix = utostr(I);
- }
- for (const auto &Id : Coverage.CoveredIds) {
- Result->CoveredIds.insert(Prefix + Id);
- }
- for (const auto &CovPoint : Coverage.Points) {
- CoveragePoint NewPoint(CovPoint);
- NewPoint.Id = Prefix + CovPoint.Id;
- Result->Points.push_back(NewPoint);
- }
- }
- if (Coverages.size() == 1) {
- Result->BinaryHash = Coverages[0]->BinaryHash;
- }
- return Result;
- }
- static std::unique_ptr<SymbolizedCoverage>
- readSymbolizeAndMergeCmdArguments(std::vector<std::string> FileNames) {
- std::vector<std::unique_ptr<SymbolizedCoverage>> Coverages;
- {
- // Short name => file name.
- std::map<std::string, std::string> ObjFiles;
- std::string FirstObjFile;
- std::set<std::string> CovFiles;
- // Partition input values into coverage/object files.
- for (const auto &FileName : FileNames) {
- if (isSymbolizedCoverageFile(FileName)) {
- Coverages.push_back(SymbolizedCoverage::read(FileName));
- }
- auto ErrorOrIsCoverage = isCoverageFile(FileName);
- if (!ErrorOrIsCoverage)
- continue;
- if (ErrorOrIsCoverage.get()) {
- CovFiles.insert(FileName);
- } else {
- auto ShortFileName = llvm::sys::path::filename(FileName);
- if (ObjFiles.find(std::string(ShortFileName)) != ObjFiles.end()) {
- fail("Duplicate binary file with a short name: " + ShortFileName);
- }
- ObjFiles[std::string(ShortFileName)] = FileName;
- if (FirstObjFile.empty())
- FirstObjFile = FileName;
- }
- }
- SmallVector<StringRef, 2> Components;
- // Object file => list of corresponding coverage file names.
- std::map<std::string, std::vector<std::string>> CoverageByObjFile;
- for (const auto &FileName : CovFiles) {
- auto ShortFileName = llvm::sys::path::filename(FileName);
- auto Ok = SancovFileRegex.match(ShortFileName, &Components);
- if (!Ok) {
- fail("Can't match coverage file name against "
- "<module_name>.<pid>.sancov pattern: " +
- FileName);
- }
- auto Iter = ObjFiles.find(std::string(Components[1]));
- if (Iter == ObjFiles.end()) {
- fail("Object file for coverage not found: " + FileName);
- }
- CoverageByObjFile[Iter->second].push_back(FileName);
- };
- for (const auto &Pair : ObjFiles) {
- auto FileName = Pair.second;
- if (CoverageByObjFile.find(FileName) == CoverageByObjFile.end())
- errs() << "WARNING: No coverage file for " << FileName << "\n";
- }
- // Read raw coverage and symbolize it.
- for (const auto &Pair : CoverageByObjFile) {
- if (findSanitizerCovFunctions(Pair.first).empty()) {
- errs()
- << "WARNING: Ignoring " << Pair.first
- << " and its coverage because __sanitizer_cov* functions were not "
- "found.\n";
- continue;
- }
- for (const std::string &CoverageFile : Pair.second) {
- auto DataOrError = RawCoverage::read(CoverageFile);
- failIfError(DataOrError);
- Coverages.push_back(symbolize(*DataOrError.get(), Pair.first));
- }
- }
- }
- return merge(Coverages);
- }
- } // namespace
- int main(int Argc, char **Argv) {
- llvm::InitLLVM X(Argc, Argv);
- cl::HideUnrelatedOptions(Cat);
- llvm::InitializeAllTargetInfos();
- llvm::InitializeAllTargetMCs();
- llvm::InitializeAllDisassemblers();
- cl::ParseCommandLineOptions(Argc, Argv,
- "Sanitizer Coverage Processing Tool (sancov)\n\n"
- " This tool can extract various coverage-related information from: \n"
- " coverage-instrumented binary files, raw .sancov files and their "
- "symbolized .symcov version.\n"
- " Depending on chosen action the tool expects different input files:\n"
- " -print-coverage-pcs - coverage-instrumented binary files\n"
- " -print-coverage - .sancov files\n"
- " <other actions> - .sancov files & corresponding binary "
- "files, .symcov files\n"
- );
- // -print doesn't need object files.
- if (Action == PrintAction) {
- readAndPrintRawCoverage(ClInputFiles, outs());
- return 0;
- } else if (Action == PrintCovPointsAction) {
- // -print-coverage-points doesn't need coverage files.
- for (const std::string &ObjFile : ClInputFiles) {
- printCovPoints(ObjFile, outs());
- }
- return 0;
- }
- auto Coverage = readSymbolizeAndMergeCmdArguments(ClInputFiles);
- failIf(!Coverage, "No valid coverage files given.");
- switch (Action) {
- case CoveredFunctionsAction: {
- printCoveredFunctions(*Coverage, outs());
- return 0;
- }
- case NotCoveredFunctionsAction: {
- printNotCoveredFunctions(*Coverage, outs());
- return 0;
- }
- case StatsAction: {
- outs() << computeStats(*Coverage);
- return 0;
- }
- case MergeAction:
- case SymbolizeAction: { // merge & symbolize are synonims.
- json::OStream W(outs(), 2);
- W << *Coverage;
- return 0;
- }
- case HtmlReportAction:
- errs() << "-html-report option is removed: "
- "use -symbolize & coverage-report-server.py instead\n";
- return 1;
- case PrintAction:
- case PrintCovPointsAction:
- llvm_unreachable("unsupported action");
- }
- }
|