//===- llvm-extract.cpp - LLVM function extraction utility ----------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This utility reduces the input module to a selected set of functions and
// global variables, chosen by name or by regular expression.  With -delete,
// the selected set is removed from the module instead.  It is primarily used
// for debugging transformations.
//
//===----------------------------------------------------------------------===//
14 
15 #include "llvm/LLVMContext.h"
16 #include "llvm/Module.h"
17 #include "llvm/PassManager.h"
18 #include "llvm/Assembly/PrintModulePass.h"
19 #include "llvm/Bitcode/ReaderWriter.h"
20 #include "llvm/Transforms/IPO.h"
21 #include "llvm/Target/TargetData.h"
22 #include "llvm/Support/CommandLine.h"
23 #include "llvm/Support/IRReader.h"
24 #include "llvm/Support/ManagedStatic.h"
25 #include "llvm/Support/PrettyStackTrace.h"
26 #include "llvm/Support/ToolOutputFile.h"
27 #include "llvm/Support/SystemUtils.h"
28 #include "llvm/Support/Signals.h"
29 #include "llvm/Support/Regex.h"
30 #include "llvm/ADT/SmallPtrSet.h"
31 #include "llvm/ADT/SetVector.h"
32 #include <memory>
33 using namespace llvm;
34 
35 // InputFilename - The filename to read from.
36 static cl::opt<std::string>
37 InputFilename(cl::Positional, cl::desc("<input bitcode file>"),
38               cl::init("-"), cl::value_desc("filename"));
39 
40 static cl::opt<std::string>
41 OutputFilename("o", cl::desc("Specify output filename"),
42                cl::value_desc("filename"), cl::init("-"));
43 
44 static cl::opt<bool>
45 Force("f", cl::desc("Enable binary output on terminals"));
46 
47 static cl::opt<bool>
48 DeleteFn("delete", cl::desc("Delete specified Globals from Module"));
49 
50 // ExtractFuncs - The functions to extract from the module.
51 static cl::list<std::string>
52 ExtractFuncs("func", cl::desc("Specify function to extract"),
53              cl::ZeroOrMore, cl::value_desc("function"));
54 
55 // ExtractRegExpFuncs - The functions, matched via regular expression, to
56 // extract from the module.
57 static cl::list<std::string>
58 ExtractRegExpFuncs("rfunc", cl::desc("Specify function(s) to extract using a "
59                                      "regular expression"),
60                    cl::ZeroOrMore, cl::value_desc("rfunction"));
61 
62 // ExtractGlobals - The globals to extract from the module.
63 static cl::list<std::string>
64 ExtractGlobals("glob", cl::desc("Specify global to extract"),
65                cl::ZeroOrMore, cl::value_desc("global"));
66 
67 // ExtractRegExpGlobals - The globals, matched via regular expression, to
68 // extract from the module...
69 static cl::list<std::string>
70 ExtractRegExpGlobals("rglob", cl::desc("Specify global(s) to extract using a "
71                                        "regular expression"),
72                      cl::ZeroOrMore, cl::value_desc("rglobal"));
73 
74 static cl::opt<bool>
75 OutputAssembly("S",
76                cl::desc("Write output as LLVM assembly"), cl::Hidden);
77 
main(int argc,char ** argv)78 int main(int argc, char **argv) {
79   // Print a stack trace if we signal out.
80   sys::PrintStackTraceOnErrorSignal();
81   PrettyStackTraceProgram X(argc, argv);
82 
83   LLVMContext &Context = getGlobalContext();
84   llvm_shutdown_obj Y;  // Call llvm_shutdown() on exit.
85   cl::ParseCommandLineOptions(argc, argv, "llvm extractor\n");
86 
87   // Use lazy loading, since we only care about selected global values.
88   SMDiagnostic Err;
89   std::auto_ptr<Module> M;
90   M.reset(getLazyIRFileModule(InputFilename, Err, Context));
91 
92   if (M.get() == 0) {
93     Err.Print(argv[0], errs());
94     return 1;
95   }
96 
97   // Use SetVector to avoid duplicates.
98   SetVector<GlobalValue *> GVs;
99 
100   // Figure out which globals we should extract.
101   for (size_t i = 0, e = ExtractGlobals.size(); i != e; ++i) {
102     GlobalValue *GV = M.get()->getNamedGlobal(ExtractGlobals[i]);
103     if (!GV) {
104       errs() << argv[0] << ": program doesn't contain global named '"
105              << ExtractGlobals[i] << "'!\n";
106       return 1;
107     }
108     GVs.insert(GV);
109   }
110 
111   // Extract globals via regular expression matching.
112   for (size_t i = 0, e = ExtractRegExpGlobals.size(); i != e; ++i) {
113     std::string Error;
114     Regex RegEx(ExtractRegExpGlobals[i]);
115     if (!RegEx.isValid(Error)) {
116       errs() << argv[0] << ": '" << ExtractRegExpGlobals[i] << "' "
117         "invalid regex: " << Error;
118     }
119     bool match = false;
120     for (Module::global_iterator GV = M.get()->global_begin(),
121            E = M.get()->global_end(); GV != E; GV++) {
122       if (RegEx.match(GV->getName())) {
123         GVs.insert(&*GV);
124         match = true;
125       }
126     }
127     if (!match) {
128       errs() << argv[0] << ": program doesn't contain global named '"
129              << ExtractRegExpGlobals[i] << "'!\n";
130       return 1;
131     }
132   }
133 
134   // Figure out which functions we should extract.
135   for (size_t i = 0, e = ExtractFuncs.size(); i != e; ++i) {
136     GlobalValue *GV = M.get()->getFunction(ExtractFuncs[i]);
137     if (!GV) {
138       errs() << argv[0] << ": program doesn't contain function named '"
139              << ExtractFuncs[i] << "'!\n";
140       return 1;
141     }
142     GVs.insert(GV);
143   }
144   // Extract functions via regular expression matching.
145   for (size_t i = 0, e = ExtractRegExpFuncs.size(); i != e; ++i) {
146     std::string Error;
147     StringRef RegExStr = ExtractRegExpFuncs[i];
148     Regex RegEx(RegExStr);
149     if (!RegEx.isValid(Error)) {
150       errs() << argv[0] << ": '" << ExtractRegExpFuncs[i] << "' "
151         "invalid regex: " << Error;
152     }
153     bool match = false;
154     for (Module::iterator F = M.get()->begin(), E = M.get()->end(); F != E;
155          F++) {
156       if (RegEx.match(F->getName())) {
157         GVs.insert(&*F);
158         match = true;
159       }
160     }
161     if (!match) {
162       errs() << argv[0] << ": program doesn't contain global named '"
163              << ExtractRegExpFuncs[i] << "'!\n";
164       return 1;
165     }
166   }
167 
168   // Materialize requisite global values.
169   if (!DeleteFn)
170     for (size_t i = 0, e = GVs.size(); i != e; ++i) {
171       GlobalValue *GV = GVs[i];
172       if (GV->isMaterializable()) {
173         std::string ErrInfo;
174         if (GV->Materialize(&ErrInfo)) {
175           errs() << argv[0] << ": error reading input: " << ErrInfo << "\n";
176           return 1;
177         }
178       }
179     }
180   else {
181     // Deleting. Materialize every GV that's *not* in GVs.
182     SmallPtrSet<GlobalValue *, 8> GVSet(GVs.begin(), GVs.end());
183     for (Module::global_iterator I = M->global_begin(), E = M->global_end();
184          I != E; ++I) {
185       GlobalVariable *G = I;
186       if (!GVSet.count(G) && G->isMaterializable()) {
187         std::string ErrInfo;
188         if (G->Materialize(&ErrInfo)) {
189           errs() << argv[0] << ": error reading input: " << ErrInfo << "\n";
190           return 1;
191         }
192       }
193     }
194     for (Module::iterator I = M->begin(), E = M->end(); I != E; ++I) {
195       Function *F = I;
196       if (!GVSet.count(F) && F->isMaterializable()) {
197         std::string ErrInfo;
198         if (F->Materialize(&ErrInfo)) {
199           errs() << argv[0] << ": error reading input: " << ErrInfo << "\n";
200           return 1;
201         }
202       }
203     }
204   }
205 
206   // In addition to deleting all other functions, we also want to spiff it
207   // up a little bit.  Do this now.
208   PassManager Passes;
209   Passes.add(new TargetData(M.get())); // Use correct TargetData
210 
211   std::vector<GlobalValue*> Gvs(GVs.begin(), GVs.end());
212 
213   Passes.add(createGVExtractionPass(Gvs, DeleteFn));
214   if (!DeleteFn)
215     Passes.add(createGlobalDCEPass());           // Delete unreachable globals
216   Passes.add(createStripDeadDebugInfoPass());    // Remove dead debug info
217   Passes.add(createStripDeadPrototypesPass());   // Remove dead func decls
218 
219   std::string ErrorInfo;
220   tool_output_file Out(OutputFilename.c_str(), ErrorInfo,
221                        raw_fd_ostream::F_Binary);
222   if (!ErrorInfo.empty()) {
223     errs() << ErrorInfo << '\n';
224     return 1;
225   }
226 
227   if (OutputAssembly)
228     Passes.add(createPrintModulePass(&Out.os()));
229   else if (Force || !CheckBitcodeOutputToConsole(Out.os(), true))
230     Passes.add(createBitcodeWriterPass(Out.os()));
231 
232   Passes.run(*M.get());
233 
234   // Declare success.
235   Out.keep();
236 
237   return 0;
238 }
239