aboutsummaryrefslogtreecommitdiffstats
path: root/tools/extract/extract.cpp
blob: a78d1fd9b994dcec878d5959f8087ad7a7a68aab (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
//===----------------------------------------------------------------------===//
// LLVM extract Utility
//
// This utility changes the input module to only contain a single function,
// which is primarily used for debugging transformations.
//
//===----------------------------------------------------------------------===//

#include "llvm/Module.h"
#include "llvm/PassManager.h"
#include "llvm/Bytecode/Reader.h"
#include "llvm/Bytecode/WriteBytecodePass.h"
#include "llvm/GlobalVariable.h"
#include "llvm/Function.h"
#include "llvm/Transforms/IPO/GlobalDCE.h"
#include "llvm/Transforms/ConstantMerge.h"
#include "llvm/Transforms/CleanupGCCOutput.h"
#include "Support/CommandLine.h"
#include <memory>

// Command line options for the tool.
//
// InputFilename is handed to ParseBytecodeFile() in main().  It is registered
// with an empty option name and "-" as its last constructor argument --
// presumably a positional argument that defaults to "-"; confirm against the
// CommandLine library.
static cl::String InputFilename("", "Specify input bytecode file", 0, "-");
// ExtractFunc is the name that FunctionExtractorPass compares each function's
// getName() against.  The trailing "main" is presumably the default used when
// -func is not given -- confirm against the CommandLine library.
static cl::String ExtractFunc("func", "Specify function to extract", 0, "main");

struct FunctionExtractorPass : public Pass {
  const char *getPassName() const { return "Function Extractor"; }

  bool run(Module *M) {
    // Mark all global variables to be internal
    for (Module::giterator I = M->gbegin(), E = M->gend(); I != E; ++I)
      (*I)->setInternalLinkage(true);

    Function *Named = 0;

    // Loop over all of the functions in the module, dropping all references in
    // functions that are not the named function.
    for (Module::iterator I = M->begin(), E = M->end(); I != E;)
      // Check to see if this is the named function!
      if (!Named && (*I)->getName() == ExtractFunc) {
        // Yes, it is.  Keep track of it...
        Named = *I;

        // Make sure it's globally accessable...
        Named->setInternalLinkage(false);

        // Remove the named function from the module.
        M->getFunctionList().remove(I);
        E = M->end();
      } else {
        // Nope it's not the named function, delete the body of the function
        (*I)->dropAllReferences();
        ++I;
      }

    // All of the functions that still have uses now must be used by global
    // variables or the named function.  Loop through them and create a new,
    // external function for the used ones... making all uses point to the new
    // functions.
    std::vector<Function*> NewFunctions;
    
    for (Module::iterator I = M->begin(), E = M->end(); I != E; ++I)
      if (!(*I)->use_empty()) {
        Function *New = new Function((*I)->getFunctionType(), false,
                                     (*I)->getName());
        (*I)->replaceAllUsesWith(New);
        NewFunctions.push_back(New);
      }
    
    // Now the module only has unused functions with their references dropped.
    // Delete them all now!
    M->getFunctionList().delete_all();

    // Re-insert the named function...
    if (Named)
      M->getFunctionList().push_back(Named);
    else
      std::cerr << "Warning: Function '" << ExtractFunc << "' not found!\n";
    
    // Insert all of the function stubs...
    M->getFunctionList().insert(M->end(), NewFunctions.begin(),
                                NewFunctions.end());
    return true;
  }
};


int main(int argc, char **argv) {
  cl::ParseCommandLineOptions(argc, argv, " llvm extractor\n");

  std::auto_ptr<Module> M(ParseBytecodeFile(InputFilename));
  if (M.get() == 0) {
    std::cerr << "bytecode didn't read correctly.\n";
    return 1;
  }

  // In addition to just parsing the input from GCC, we also want to spiff it up
  // a little bit.  Do this now.
  //
  PassManager Passes;
  Passes.add(new FunctionExtractorPass());
  Passes.add(createGlobalDCEPass());              // Delete unreachable globals
  Passes.add(createConstantMergePass());          // Merge dup global constants
  Passes.add(createCleanupGCCOutputPass());       // Fix gccisms
  Passes.add(new WriteBytecodePass(&std::cout));  // Write bytecode to file...

  Passes.run(M.get());
  return 0;
}