1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
|
//===----------------------------------------------------------------------===//
// LLVM extract Utility
//
// This utility strips the input module down to a single named function.  It is
// primarily used for debugging transformations.
//
//===----------------------------------------------------------------------===//
#include "llvm/Module.h"
#include "llvm/PassManager.h"
#include "llvm/Bytecode/Reader.h"
#include "llvm/Bytecode/WriteBytecodePass.h"
#include "llvm/GlobalVariable.h"
#include "llvm/Function.h"
#include "llvm/Transforms/IPO/GlobalDCE.h"
#include "llvm/Transforms/ConstantMerge.h"
#include "llvm/Transforms/CleanupGCCOutput.h"
#include "Support/CommandLine.h"
#include <memory>
// Command-line options, filled in by cl::ParseCommandLineOptions() in main().
//
// InputFilename - Name of the bytecode file handed to ParseBytecodeFile().
// NOTE(review): the empty first argument presumably makes this a positional
// option and the trailing "-" presumably is the default value (conventionally
// meaning standard input) -- confirm against Support/CommandLine.h.
static cl::String InputFilename("", "Specify input bytecode file", 0, "-");
// ExtractFunc - Name of the function that FunctionExtractorPass keeps; it is
// compared against each function's getName().
// NOTE(review): "func" looks like the option name and "main" the default
// value -- confirm against Support/CommandLine.h.
static cl::String ExtractFunc("func", "Specify function to extract", 0, "main");
struct FunctionExtractorPass : public Pass {
const char *getPassName() const { return "Function Extractor"; }
bool run(Module *M) {
// Mark all global variables to be internal
for (Module::giterator I = M->gbegin(), E = M->gend(); I != E; ++I)
(*I)->setInternalLinkage(true);
Function *Named = 0;
// Loop over all of the functions in the module, dropping all references in
// functions that are not the named function.
for (Module::iterator I = M->begin(), E = M->end(); I != E;)
// Check to see if this is the named function!
if (!Named && (*I)->getName() == ExtractFunc) {
// Yes, it is. Keep track of it...
Named = *I;
// Make sure it's globally accessable...
Named->setInternalLinkage(false);
// Remove the named function from the module.
M->getFunctionList().remove(I);
E = M->end();
} else {
// Nope it's not the named function, delete the body of the function
(*I)->dropAllReferences();
++I;
}
// All of the functions that still have uses now must be used by global
// variables or the named function. Loop through them and create a new,
// external function for the used ones... making all uses point to the new
// functions.
std::vector<Function*> NewFunctions;
for (Module::iterator I = M->begin(), E = M->end(); I != E; ++I)
if (!(*I)->use_empty()) {
Function *New = new Function((*I)->getFunctionType(), false,
(*I)->getName());
(*I)->replaceAllUsesWith(New);
NewFunctions.push_back(New);
}
// Now the module only has unused functions with their references dropped.
// Delete them all now!
M->getFunctionList().delete_all();
// Re-insert the named function...
if (Named)
M->getFunctionList().push_back(Named);
else
std::cerr << "Warning: Function '" << ExtractFunc << "' not found!\n";
// Insert all of the function stubs...
M->getFunctionList().insert(M->end(), NewFunctions.begin(),
NewFunctions.end());
return true;
}
};
int main(int argc, char **argv) {
cl::ParseCommandLineOptions(argc, argv, " llvm extractor\n");
std::auto_ptr<Module> M(ParseBytecodeFile(InputFilename));
if (M.get() == 0) {
std::cerr << "bytecode didn't read correctly.\n";
return 1;
}
// In addition to just parsing the input from GCC, we also want to spiff it up
// a little bit. Do this now.
//
PassManager Passes;
Passes.add(new FunctionExtractorPass());
Passes.add(createGlobalDCEPass()); // Delete unreachable globals
Passes.add(createConstantMergePass()); // Merge dup global constants
Passes.add(createCleanupGCCOutputPass()); // Fix gccisms
Passes.add(new WriteBytecodePass(&std::cout)); // Write bytecode to file...
Passes.run(M.get());
return 0;
}
|