LLVM  8.0.1
FuzzerCLI.cpp
Go to the documentation of this file.
1 //===-- FuzzerCLI.cpp -----------------------------------------------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 
11 #include "llvm/ADT/Triple.h"
14 #include "llvm/IR/LLVMContext.h"
16 #include "llvm/Support/Compiler.h"
17 #include "llvm/Support/Error.h"
19 #include "llvm/Support/SourceMgr.h"
21 #include "llvm/IR/Verifier.h"
22 
23 using namespace llvm;
24 
25 void llvm::parseFuzzerCLOpts(int ArgC, char *ArgV[]) {
26  std::vector<const char *> CLArgs;
27  CLArgs.push_back(ArgV[0]);
28 
29  int I = 1;
30  while (I < ArgC)
31  if (StringRef(ArgV[I++]).equals("-ignore_remaining_args=1"))
32  break;
33  while (I < ArgC)
34  CLArgs.push_back(ArgV[I++]);
35 
36  cl::ParseCommandLineOptions(CLArgs.size(), CLArgs.data());
37 }
38 
40  std::vector<std::string> Args{ExecName};
41 
42  auto NameAndArgs = ExecName.split("--");
43  if (NameAndArgs.second.empty())
44  return;
45 
47  NameAndArgs.second.split(Opts, '-');
48  for (StringRef Opt : Opts) {
49  if (Opt.equals("gisel")) {
50  Args.push_back("-global-isel");
51  // For now we default GlobalISel to -O0
52  Args.push_back("-O0");
53  } else if (Opt.startswith("O")) {
54  Args.push_back("-" + Opt.str());
55  } else if (Triple(Opt).getArch()) {
56  Args.push_back("-mtriple=" + Opt.str());
57  } else {
58  errs() << ExecName << ": Unknown option: " << Opt << ".\n";
59  exit(1);
60  }
61  }
62  errs() << NameAndArgs.first << ": Injected args:";
63  for (int I = 1, E = Args.size(); I < E; ++I)
64  errs() << " " << Args[I];
65  errs() << "\n";
66 
67  std::vector<const char *> CLArgs;
68  CLArgs.reserve(Args.size());
69  for (std::string &S : Args)
70  CLArgs.push_back(S.c_str());
71 
72  cl::ParseCommandLineOptions(CLArgs.size(), CLArgs.data());
73 }
74 
76  // TODO: Refactor parts common with the 'handleExecNameEncodedBEOpts'
77  std::vector<std::string> Args{ExecName};
78 
79  auto NameAndArgs = ExecName.split("--");
80  if (NameAndArgs.second.empty())
81  return;
82 
84  NameAndArgs.second.split(Opts, '-');
85  for (StringRef Opt : Opts) {
86  if (Opt == "instcombine") {
87  Args.push_back("-passes=instcombine");
88  } else if (Opt == "earlycse") {
89  Args.push_back("-passes=early-cse");
90  } else if (Opt == "simplifycfg") {
91  Args.push_back("-passes=simplify-cfg");
92  } else if (Opt == "gvn") {
93  Args.push_back("-passes=gvn");
94  } else if (Opt == "sccp") {
95  Args.push_back("-passes=sccp");
96 
97  } else if (Opt == "loop_predication") {
98  Args.push_back("-passes=loop-predication");
99  } else if (Opt == "guard_widening") {
100  Args.push_back("-passes=guard-widening");
101  } else if (Opt == "loop_rotate") {
102  Args.push_back("-passes=loop(rotate)");
103  } else if (Opt == "loop_unswitch") {
104  Args.push_back("-passes=loop(unswitch)");
105  } else if (Opt == "loop_unroll") {
106  Args.push_back("-passes=unroll");
107  } else if (Opt == "loop_vectorize") {
108  Args.push_back("-passes=loop-vectorize");
109  } else if (Opt == "licm") {
110  Args.push_back("-passes=licm");
111  } else if (Opt == "indvars") {
112  Args.push_back("-passes=indvars");
113  } else if (Opt == "strength_reduce") {
114  Args.push_back("-passes=strength-reduce");
115  } else if (Opt == "irce") {
116  Args.push_back("-passes=irce");
117 
118  } else if (Triple(Opt).getArch()) {
119  Args.push_back("-mtriple=" + Opt.str());
120  } else {
121  errs() << ExecName << ": Unknown option: " << Opt << ".\n";
122  exit(1);
123  }
124  }
125 
126  errs() << NameAndArgs.first << ": Injected args:";
127  for (int I = 1, E = Args.size(); I < E; ++I)
128  errs() << " " << Args[I];
129  errs() << "\n";
130 
131  std::vector<const char *> CLArgs;
132  CLArgs.reserve(Args.size());
133  for (std::string &S : Args)
134  CLArgs.push_back(S.c_str());
135 
136  cl::ParseCommandLineOptions(CLArgs.size(), CLArgs.data());
137 }
138 
139 int llvm::runFuzzerOnInputs(int ArgC, char *ArgV[], FuzzerTestFun TestOne,
141  errs() << "*** This tool was not linked to libFuzzer.\n"
142  << "*** No fuzzing will be performed.\n";
143  if (int RC = Init(&ArgC, &ArgV)) {
144  errs() << "Initialization failed\n";
145  return RC;
146  }
147 
148  for (int I = 1; I < ArgC; ++I) {
149  StringRef Arg(ArgV[I]);
150  if (Arg.startswith("-")) {
151  if (Arg.equals("-ignore_remaining_args=1"))
152  break;
153  continue;
154  }
155 
156  auto BufOrErr = MemoryBuffer::getFile(Arg, /*FileSize-*/ -1,
157  /*RequiresNullTerminator=*/false);
158  if (std::error_code EC = BufOrErr.getError()) {
159  errs() << "Error reading file: " << Arg << ": " << EC.message() << "\n";
160  return 1;
161  }
162  std::unique_ptr<MemoryBuffer> Buf = std::move(BufOrErr.get());
163  errs() << "Running: " << Arg << " (" << Buf->getBufferSize() << " bytes)\n";
164  TestOne(reinterpret_cast<const uint8_t *>(Buf->getBufferStart()),
165  Buf->getBufferSize());
166  }
167  return 0;
168 }
169 
170 std::unique_ptr<Module> llvm::parseModule(
171  const uint8_t *Data, size_t Size, LLVMContext &Context) {
172 
173  if (Size <= 1)
174  // We get bogus data given an empty corpus - just create a new module.
175  return llvm::make_unique<Module>("M", Context);
176 
177  auto Buffer = MemoryBuffer::getMemBuffer(
178  StringRef(reinterpret_cast<const char *>(Data), Size), "Fuzzer input",
179  /*RequiresNullTerminator=*/false);
180 
181  SMDiagnostic Err;
182  auto M = parseBitcodeFile(Buffer->getMemBufferRef(), Context);
183  if (Error E = M.takeError()) {
184  errs() << toString(std::move(E)) << "\n";
185  return nullptr;
186  }
187  return std::move(M.get());
188 }
189 
190 size_t llvm::writeModule(const Module &M, uint8_t *Dest, size_t MaxSize) {
191  std::string Buf;
192  {
193  raw_string_ostream OS(Buf);
194  WriteBitcodeToFile(M, OS);
195  }
196  if (Buf.size() > MaxSize)
197  return 0;
198  memcpy(Dest, Buf.data(), Buf.size());
199  return Buf.size();
200 }
201 
202 std::unique_ptr<Module> llvm::parseAndVerify(const uint8_t *Data, size_t Size,
203  LLVMContext &Context) {
204  auto M = parseModule(Data, Size, Context);
205  if (!M || verifyModule(*M, &errs()))
206  return nullptr;
207 
208  return M;
209 }
raw_ostream & errs()
This returns a reference to a raw_ostream for standard error.
LLVMContext & Context
int(*)(int *argc, char ***argv) FuzzerInitFun
Definition: FuzzerCLI.h:45
This class represents lattice values for constants.
Definition: AllocatorList.h:24
A Module instance is used to store all the information related to an LLVM module. ...
Definition: Module.h:65
std::unique_ptr< Module > parseAndVerify(const uint8_t *Data, size_t Size, LLVMContext &Context)
Try to parse module and verify it.
Definition: FuzzerCLI.cpp:202
static std::unique_ptr< MemoryBuffer > getMemBuffer(StringRef InputData, StringRef BufferName="", bool RequiresNullTerminator=true)
Open the specified memory range as a MemoryBuffer.
size_t writeModule(const Module &M, uint8_t *Dest, size_t MaxSize)
Fuzzer friendly interface for the llvm bitcode printer.
Definition: FuzzerCLI.cpp:190
void handleExecNameEncodedBEOpts(StringRef ExecName)
Handle backend options that are encoded in the executable name.
Definition: FuzzerCLI.cpp:39
std::string toString(Error E)
Write all error messages (if any) in E to a string.
Definition: Error.h:967
void parseFuzzerCLOpts(int ArgC, char *ArgV[])
Parse cl::opts from a fuzz target commandline.
Definition: FuzzerCLI.cpp:25
LLVM_NODISCARD LLVM_ATTRIBUTE_ALWAYS_INLINE bool startswith(StringRef Prefix) const
Check if this string starts with the given Prefix.
Definition: StringRef.h:267
ArchType getArch() const
getArch - Get the parsed architecture type of this triple.
Definition: Triple.h:290
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:69
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
int runFuzzerOnInputs(int ArgC, char *ArgV[], FuzzerTestFun TestOne, FuzzerInitFun Init=[](int *, char ***) { return 0;})
Runs a fuzz target on the inputs specified on the command line.
Definition: FuzzerCLI.cpp:139
void WriteBitcodeToFile(const Module &M, raw_ostream &Out, bool ShouldPreserveUseListOrder=false, const ModuleSummaryIndex *Index=nullptr, bool GenerateHash=false, ModuleHash *ModHash=nullptr)
Write the specified module to the specified raw output stream.
bool ParseCommandLineOptions(int argc, const char *const *argv, StringRef Overview="", raw_ostream *Errs=nullptr, const char *EnvVar=nullptr)
int(*)(const uint8_t *Data, size_t Size) FuzzerTestFun
Definition: FuzzerCLI.h:44
std::unique_ptr< Module > parseModule(const uint8_t *Data, size_t Size, LLVMContext &Context)
Fuzzer friendly interface for the llvm bitcode parser.
Definition: FuzzerCLI.cpp:170
Triple - Helper class for working with autoconf configuration names.
Definition: Triple.h:44
This is a &#39;vector&#39; (really, a variable-sized array), optimized for the case when the array is small...
Definition: SmallVector.h:847
LLVM_NODISCARD std::pair< StringRef, StringRef > split(char Separator) const
Split into two substrings around the first occurrence of a separator character.
Definition: StringRef.h:727
LLVM_NODISCARD LLVM_ATTRIBUTE_ALWAYS_INLINE bool equals(StringRef RHS) const
equals - Check for string equality, this is more efficient than compare() when the relative ordering ...
Definition: StringRef.h:169
bool verifyModule(const Module &M, raw_ostream *OS=nullptr, bool *BrokenDebugInfo=nullptr)
Check a module for errors.
Definition: Verifier.cpp:4820
amdgpu Simplify well known AMD library false Value Value * Arg
Expected< std::unique_ptr< Module > > parseBitcodeFile(MemoryBufferRef Buffer, LLVMContext &Context)
Read the specified bitcode file, returning the module.
#define I(x, y, z)
Definition: MD5.cpp:58
uint32_t Size
Definition: Profile.cpp:47
static ErrorOr< std::unique_ptr< MemoryBuffer > > getFile(const Twine &Filename, int64_t FileSize=-1, bool RequiresNullTerminator=true, bool IsVolatile=false)
Open the specified file as a MemoryBuffer, returning a new MemoryBuffer if successful, otherwise returning null.
A raw_ostream that writes to an std::string.
Definition: raw_ostream.h:483
Lightweight error class with error context and mandatory checking.
Definition: Error.h:158
void handleExecNameEncodedOptimizerOpts(StringRef ExecName)
Handle optimizer options which are encoded in the executable name.
Definition: FuzzerCLI.cpp:75
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:49
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Instances of this class encapsulate one diagnostic report, allowing printing to a raw_ostream as a ca...
Definition: SourceMgr.h:260