//===- FuzzerMerge.h - merging corpora --------------------------*- C++ -* ===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
// Merging Corpora.
//
// The task:
//   Take the existing corpus (possibly empty) and merge new inputs into
//   it so that only inputs with new coverage ('features') are added.
//   The process should tolerate crashes, OOMs, leaks, etc.
//
// Algorithm:
//   The outer process collects the set of files and writes their names
//   into a temporary "control" file, then repeatedly launches the inner
//   process until all inputs are processed.
//   The outer process does not actually execute the target code.
//
//   The inner process reads the control file and sees a) the list of all the
//   inputs and b) the last processed input. Then it starts processing the
//   inputs one by one. Before processing every input it writes one line to
//   the control file:
//     STARTED INPUT_ID INPUT_SIZE
//   After processing an input it writes the following lines:
//     FT INPUT_ID Feature1 Feature2 Feature3 ...
//     COV INPUT_ID Coverage1 Coverage2 Coverage3 ...
//   If a crash happens while processing an input, the last line in the
//   control file will be that input's "STARTED INPUT_ID INPUT_SIZE" line, and
//   so the next process will know where to resume.
//
//   Once all inputs are processed by the inner process(es), the outer process
//   reads the control file and does the merge based entirely on its contents.
//   It uses a single-pass greedy algorithm, choosing the smallest inputs first
//   and, among inputs of the same size, those that have more new features.
// //===----------------------------------------------------------------------===// #ifndef LLVM_FUZZER_MERGE_H #define LLVM_FUZZER_MERGE_H #include "FuzzerDefs.h" #include "FuzzerIO.h" #include #include #include #include namespace fuzzer { struct MergeFileInfo { std::string Name; size_t Size = 0; std::vector Features, Cov; }; struct Merger { std::vector Files; size_t NumFilesInFirstCorpus = 0; size_t FirstNotProcessedFile = 0; std::string LastFailure; bool Parse(std::istream &IS, bool ParseCoverage); bool Parse(const std::string &Str, bool ParseCoverage); void ParseOrExit(std::istream &IS, bool ParseCoverage); size_t Merge(const std::set &InitialFeatures, std::set *NewFeatures, const std::set &InitialCov, std::set *NewCov, std::vector *NewFiles); size_t SetCoverMerge(const std::set &InitialFeatures, std::set *NewFeatures, const std::set &InitialCov, std::set *NewCov, std::vector *NewFiles); size_t ApproximateMemoryConsumption() const; std::set AllFeatures() const; }; void CrashResistantMerge(const std::vector &Args, const std::vector &OldCorpus, const std::vector &NewCorpus, std::vector *NewFiles, const std::set &InitialFeatures, std::set *NewFeatures, const std::set &InitialCov, std::set *NewCov, const std::string &CFPath, bool Verbose, bool IsSetCoverMerge); } // namespace fuzzer #endif // LLVM_FUZZER_MERGE_H