| 1 | //===- BugDriver.h - Top-Level BugPoint class -------------------*- C++ -*-===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // This class contains all of the shared state and information that is used by |
| 10 | // the BugPoint tool to track down errors in optimizations. This class is the |
| 11 | // main driver class that invokes all sub-functionality. |
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
| 15 | #ifndef LLVM_TOOLS_BUGPOINT_BUGDRIVER_H |
| 16 | #define LLVM_TOOLS_BUGPOINT_BUGDRIVER_H |
| 17 | |
| 18 | #include "llvm/IR/ValueMap.h" |
| 19 | #include "llvm/Support/Error.h" |
| 20 | #include "llvm/Support/FileSystem.h" |
| 21 | #include "llvm/Transforms/Utils/ValueMapper.h" |
| 22 | #include <memory> |
| 23 | #include <string> |
| 24 | #include <vector> |
| 25 | |
| 26 | namespace llvm { |
| 27 | |
// Forward declarations for types this header names without needing their
// full definitions.
class Module;
class GlobalVariable;
class Function;
class BasicBlock;
class AbstractInterpreter;
class Instruction;
class LLVMContext;

class CC;

/// DisableSimplifyCFG - Flag defined in another translation unit.
/// NOTE(review): presumably suppresses the SimplifyCFG cleanup step; confirm
/// against the definition.
extern bool DisableSimplifyCFG;

/// BugpointIsInterrupted - Set to true when the user presses ctrl-c.
///
extern bool BugpointIsInterrupted;
| 43 | |
| 44 | class BugDriver { |
| 45 | LLVMContext &Context; |
| 46 | const char *ToolName; // argv[0] of bugpoint |
| 47 | std::string ReferenceOutputFile; // Name of `good' output file |
| 48 | std::unique_ptr<Module> Program; // The raw program, linked together |
| 49 | std::vector<std::string> PassesToRun; |
| 50 | AbstractInterpreter *Interpreter; // How to run the program |
| 51 | AbstractInterpreter *SafeInterpreter; // To generate reference output, etc. |
| 52 | CC *cc; |
| 53 | bool run_find_bugs; |
| 54 | unsigned Timeout; |
| 55 | unsigned MemoryLimit; |
| 56 | bool UseValgrind; |
| 57 | |
| 58 | // FIXME: sort out public/private distinctions... |
| 59 | friend class ReducePassList; |
| 60 | friend class ReduceMisCodegenFunctions; |
| 61 | |
| 62 | public: |
| 63 | BugDriver(const char *toolname, bool find_bugs, unsigned timeout, |
| 64 | unsigned memlimit, bool use_valgrind, LLVMContext &ctxt); |
| 65 | ~BugDriver(); |
| 66 | |
| 67 | const char *getToolName() const { return ToolName; } |
| 68 | |
| 69 | LLVMContext &getContext() const { return Context; } |
| 70 | |
| 71 | // Set up methods... these methods are used to copy information about the |
| 72 | // command line arguments into instance variables of BugDriver. |
| 73 | // |
| 74 | bool addSources(const std::vector<std::string> &FileNames); |
| 75 | void addPass(std::string p) { PassesToRun.push_back(x: std::move(p)); } |
| 76 | void setPassesToRun(const std::vector<std::string> &PTR) { |
| 77 | PassesToRun = PTR; |
| 78 | } |
| 79 | const std::vector<std::string> &getPassesToRun() const { return PassesToRun; } |
| 80 | |
| 81 | /// run - The top level method that is invoked after all of the instance |
| 82 | /// variables are set up from command line arguments. The \p as_child argument |
| 83 | /// indicates whether the driver is to run in parent mode or child mode. |
| 84 | /// |
| 85 | Error run(); |
| 86 | |
| 87 | /// debugOptimizerCrash - This method is called when some optimizer pass |
| 88 | /// crashes on input. It attempts to prune down the testcase to something |
| 89 | /// reasonable, and figure out exactly which pass is crashing. |
| 90 | /// |
| 91 | Error debugOptimizerCrash(const std::string &ID = "passes" ); |
| 92 | |
| 93 | /// debugCodeGeneratorCrash - This method is called when the code generator |
| 94 | /// crashes on an input. It attempts to reduce the input as much as possible |
| 95 | /// while still causing the code generator to crash. |
| 96 | Error debugCodeGeneratorCrash(); |
| 97 | |
| 98 | /// debugMiscompilation - This method is used when the passes selected are not |
| 99 | /// crashing, but the generated output is semantically different from the |
| 100 | /// input. |
| 101 | Error debugMiscompilation(); |
| 102 | |
| 103 | /// compileSharedObject - This method creates a SharedObject from a given |
| 104 | /// BitcodeFile for debugging a code generator. |
| 105 | /// |
| 106 | Expected<std::string> compileSharedObject(const std::string &BitcodeFile); |
| 107 | |
| 108 | /// debugCodeGenerator - This method narrows down a module to a function or |
| 109 | /// set of functions, using the CBE as a ``safe'' code generator for other |
| 110 | /// functions that are not under consideration. |
| 111 | Error debugCodeGenerator(); |
| 112 | |
| 113 | /// isExecutingJIT - Returns true if bugpoint is currently testing the JIT |
| 114 | /// |
| 115 | bool isExecutingJIT(); |
| 116 | |
| 117 | Module &getProgram() const { return *Program; } |
| 118 | |
| 119 | /// Set the current module to the specified module, returning the old one. |
| 120 | std::unique_ptr<Module> swapProgramIn(std::unique_ptr<Module> M); |
| 121 | |
| 122 | AbstractInterpreter *switchToSafeInterpreter() { |
| 123 | AbstractInterpreter *Old = Interpreter; |
| 124 | Interpreter = (AbstractInterpreter *)SafeInterpreter; |
| 125 | return Old; |
| 126 | } |
| 127 | |
| 128 | void switchToInterpreter(AbstractInterpreter *AI) { Interpreter = AI; } |
| 129 | |
| 130 | /// If we reduce or update the program somehow, call this method to update |
| 131 | /// bugdriver with it. This deletes the old module and sets the specified one |
| 132 | /// as the current program. |
| 133 | void setNewProgram(std::unique_ptr<Module> M); |
| 134 | |
| 135 | /// Try to compile the specified module. This is used for code generation |
| 136 | /// crash testing. |
| 137 | Error compileProgram(Module &M) const; |
| 138 | |
| 139 | /// This method runs "Program", capturing the output of the program to a file. |
| 140 | /// A recommended filename may be optionally specified. |
| 141 | Expected<std::string> executeProgram(const Module &Program, |
| 142 | std::string OutputFilename, |
| 143 | std::string Bitcode, |
| 144 | const std::string &SharedObjects, |
| 145 | AbstractInterpreter *AI) const; |
| 146 | |
| 147 | /// Used to create reference output with the "safe" backend, if reference |
| 148 | /// output is not provided. If there is a problem with the code generator |
| 149 | /// (e.g., llc crashes), this will return false and set Error. |
| 150 | Expected<std::string> |
| 151 | executeProgramSafely(const Module &Program, |
| 152 | const std::string &OutputFile) const; |
| 153 | |
| 154 | /// Calls compileProgram and then records the output into ReferenceOutputFile. |
| 155 | /// Returns true if reference file created, false otherwise. Note: |
| 156 | /// initializeExecutionEnvironment should be called BEFORE this function. |
| 157 | Error createReferenceFile(Module &M, const std::string &Filename = |
| 158 | "bugpoint.reference.out-%%%%%%%" ); |
| 159 | |
| 160 | /// This method executes the specified module and diffs the output against the |
| 161 | /// file specified by ReferenceOutputFile. If the output is different, 1 is |
| 162 | /// returned. If there is a problem with the code generator (e.g., llc |
| 163 | /// crashes), this will return -1 and set Error. |
| 164 | Expected<bool> diffProgram(const Module &Program, |
| 165 | const std::string &BitcodeFile = "" , |
| 166 | const std::string &SharedObj = "" , |
| 167 | bool RemoveBitcode = false) const; |
| 168 | |
| 169 | /// This function is used to output M to a file named "bugpoint-ID.bc". |
| 170 | void EmitProgressBitcode(const Module &M, const std::string &ID, |
| 171 | bool NoFlyer = false) const; |
| 172 | |
| 173 | /// This method clones the current Program and deletes the specified |
| 174 | /// instruction from the cloned module. It then runs a series of cleanup |
| 175 | /// passes (ADCE and SimplifyCFG) to eliminate any code which depends on the |
| 176 | /// value. The modified module is then returned. |
| 177 | /// |
| 178 | std::unique_ptr<Module> deleteInstructionFromProgram(const Instruction *I, |
| 179 | unsigned Simp); |
| 180 | |
| 181 | /// This method clones the current Program and performs a series of cleanups |
| 182 | /// intended to get rid of extra cruft on the module. If the |
| 183 | /// MayModifySemantics argument is true, then the cleanups is allowed to |
| 184 | /// modify how the code behaves. |
| 185 | /// |
| 186 | std::unique_ptr<Module> performFinalCleanups(std::unique_ptr<Module> M, |
| 187 | bool MayModifySemantics = false); |
| 188 | |
| 189 | /// Given a module, extract up to one loop from it into a new function. This |
| 190 | /// returns null if there are no extractable loops in the program or if the |
| 191 | /// loop extractor crashes. |
| 192 | std::unique_ptr<Module> (Module *M); |
| 193 | |
| 194 | /// Extract all but the specified basic blocks into their own functions. The |
| 195 | /// only detail is that M is actually a module cloned from the one the BBs are |
| 196 | /// in, so some mapping needs to be performed. If this operation fails for |
| 197 | /// some reason (ie the implementation is buggy), this function should return |
| 198 | /// null, otherwise it returns a new Module. |
| 199 | std::unique_ptr<Module> |
| 200 | (const std::vector<BasicBlock *> &BBs, |
| 201 | Module *M); |
| 202 | |
| 203 | /// Carefully run the specified set of pass on the specified/ module, |
| 204 | /// returning the transformed module on success, or a null pointer on failure. |
| 205 | std::unique_ptr<Module> runPassesOn(Module *M, |
| 206 | const std::vector<std::string> &Passes, |
| 207 | ArrayRef<std::string> = {}); |
| 208 | |
| 209 | /// runPasses - Run the specified passes on Program, outputting a bitcode |
| 210 | /// file and writting the filename into OutputFile if successful. If the |
| 211 | /// optimizations fail for some reason (optimizer crashes), return true, |
| 212 | /// otherwise return false. If DeleteOutput is set to true, the bitcode is |
| 213 | /// deleted on success, and the filename string is undefined. This prints to |
| 214 | /// outs() a single line message indicating whether compilation was successful |
| 215 | /// or failed, unless Quiet is set. ExtraArgs specifies additional arguments |
| 216 | /// to pass to the child bugpoint instance. |
| 217 | /// |
| 218 | bool runPasses(Module &Program, const std::vector<std::string> &PassesToRun, |
| 219 | std::string &OutputFilename, bool DeleteOutput = false, |
| 220 | bool Quiet = false, |
| 221 | ArrayRef<std::string> = {}) const; |
| 222 | |
| 223 | /// runPasses - Just like the method above, but this just returns true or |
| 224 | /// false indicating whether or not the optimizer crashed on the specified |
| 225 | /// input (true = crashed). Does not produce any output. |
| 226 | /// |
| 227 | bool runPasses(Module &M, const std::vector<std::string> &PassesToRun) const { |
| 228 | std::string Filename; |
| 229 | return runPasses(Program&: M, PassesToRun, OutputFilename&: Filename, DeleteOutput: true); |
| 230 | } |
| 231 | |
| 232 | /// Take the specified pass list and create different combinations of passes |
| 233 | /// to compile the program with. Compile the program with each set and mark |
| 234 | /// test to see if it compiled correctly. If the passes compiled correctly |
| 235 | /// output nothing and rearrange the passes into a new order. If the passes |
| 236 | /// did not compile correctly, output the command required to recreate the |
| 237 | /// failure. |
| 238 | Error runManyPasses(const std::vector<std::string> &AllPasses); |
| 239 | |
| 240 | /// This writes the current "Program" to the named bitcode file. If an error |
| 241 | /// occurs, true is returned. |
| 242 | bool writeProgramToFile(const std::string &Filename, const Module &M) const; |
| 243 | bool writeProgramToFile(const std::string &Filename, int FD, |
| 244 | const Module &M) const; |
| 245 | bool writeProgramToFile(int FD, const Module &M) const; |
| 246 | |
| 247 | private: |
| 248 | /// initializeExecutionEnvironment - This method is used to set up the |
| 249 | /// environment for executing LLVM programs. |
| 250 | /// |
| 251 | Error initializeExecutionEnvironment(); |
| 252 | }; |
| 253 | |
| 254 | struct DiscardTemp { |
| 255 | sys::fs::TempFile &File; |
| 256 | ~DiscardTemp(); |
| 257 | }; |
| 258 | |
| 259 | /// Given a bitcode or assembly input filename, parse and return it, or return |
| 260 | /// null if not possible. |
| 261 | /// |
| 262 | std::unique_ptr<Module> parseInputFile(StringRef InputFilename, |
| 263 | LLVMContext &ctxt); |
| 264 | |
/// getPassesString - Turn a list of passes into a string which indicates the
/// command line options that must be passed to add the passes.
///
std::string getPassesString(const std::vector<std::string> &Passes);
| 269 | |
| 270 | /// PrintFunctionList - prints out list of problematic functions |
| 271 | /// |
| 272 | void PrintFunctionList(const std::vector<Function *> &Funcs); |
| 273 | |
| 274 | /// PrintGlobalVariableList - prints out list of problematic global variables |
| 275 | /// |
| 276 | void PrintGlobalVariableList(const std::vector<GlobalVariable *> &GVs); |
| 277 | |
| 278 | // DeleteGlobalInitializer - "Remove" the global variable by deleting its |
| 279 | // initializer, making it external. |
| 280 | // |
| 281 | void DeleteGlobalInitializer(GlobalVariable *GV); |
| 282 | |
| 283 | // DeleteFunctionBody - "Remove" the function by deleting all of it's basic |
| 284 | // blocks, making it external. |
| 285 | // |
| 286 | void DeleteFunctionBody(Function *F); |
| 287 | |
| 288 | /// Given a module and a list of functions in the module, split the functions |
| 289 | /// OUT of the specified module, and place them in the new module. |
| 290 | std::unique_ptr<Module> |
| 291 | SplitFunctionsOutOfModule(Module *M, const std::vector<Function *> &F, |
| 292 | ValueToValueMapTy &VMap); |
| 293 | |
| 294 | } // End llvm namespace |
| 295 | |
| 296 | #endif |
| 297 | |