123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293 |
- //===- FuzzerMerge.h - merging corpa ----------------------------*- C++ -* ===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- // Merging Corpora.
- //
- // The task:
- // Take the existing corpus (possibly empty) and merge new inputs into
- // it so that only inputs with new coverage ('features') are added.
- // The process should tolerate the crashes, OOMs, leaks, etc.
- //
- // Algorithm:
- // The outer process collects the set of files and writes their names
- // into a temporary "control" file, then repeatedly launches the inner
- // process until all inputs are processed.
- // The outer process does not actually execute the target code.
- //
- // The inner process reads the control file and sees a) list of all the inputs
- // and b) the last processed input. Then it starts processing the inputs one
- // by one. Before processing every input it writes one line to control file:
- // STARTED INPUT_ID INPUT_SIZE
- // After processing an input it writes the following lines:
- // FT INPUT_ID Feature1 Feature2 Feature3 ...
- // COV INPUT_ID Coverage1 Coverage2 Coverage3 ...
- // If a crash happens while processing an input the last line in the control
- // file will be "STARTED INPUT_ID" and so the next process will know
- // where to resume.
- //
- // Once all inputs are processed by the inner process(es) the outer process
- // reads the control files and does the merge based entirely on the contents
- // of control file.
- // It uses a single pass greedy algorithm choosing first the smallest inputs
- // within the same size the inputs that have more new features.
- //
- //===----------------------------------------------------------------------===//
- #ifndef LLVM_FUZZER_MERGE_H
- #define LLVM_FUZZER_MERGE_H
- #include "FuzzerDefs.h"
- #include "FuzzerIO.h"
- #include <istream>
- #include <ostream>
- #include <set>
- #include <vector>
- namespace fuzzer {
- struct MergeFileInfo {
- std::string Name;
- size_t Size = 0;
- std::vector<uint32_t> Features, Cov;
- };
- struct Merger {
- std::vector<MergeFileInfo> Files;
- size_t NumFilesInFirstCorpus = 0;
- size_t FirstNotProcessedFile = 0;
- std::string LastFailure;
- bool Parse(std::istream &IS, bool ParseCoverage);
- bool Parse(const std::string &Str, bool ParseCoverage);
- void ParseOrExit(std::istream &IS, bool ParseCoverage);
- size_t Merge(const std::set<uint32_t> &InitialFeatures,
- std::set<uint32_t> *NewFeatures,
- const std::set<uint32_t> &InitialCov, std::set<uint32_t> *NewCov,
- std::vector<std::string> *NewFiles);
- size_t SetCoverMerge(const std::set<uint32_t> &InitialFeatures,
- std::set<uint32_t> *NewFeatures,
- const std::set<uint32_t> &InitialCov,
- std::set<uint32_t> *NewCov,
- std::vector<std::string> *NewFiles);
- size_t ApproximateMemoryConsumption() const;
- std::set<uint32_t> AllFeatures() const;
- };
- void CrashResistantMerge(const std::vector<std::string> &Args,
- const std::vector<SizedFile> &OldCorpus,
- const std::vector<SizedFile> &NewCorpus,
- std::vector<std::string> *NewFiles,
- const std::set<uint32_t> &InitialFeatures,
- std::set<uint32_t> *NewFeatures,
- const std::set<uint32_t> &InitialCov,
- std::set<uint32_t> *NewCov, const std::string &CFPath,
- bool Verbose, bool IsSetCoverMerge);
- } // namespace fuzzer
- #endif // LLVM_FUZZER_MERGE_H
|