Initial checkin of the "extract" utility
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@2716 91177308-0d34-0410-b5e6-96231b3b80d8
diff --git a/tools/extract/Makefile b/tools/extract/Makefile
new file mode 100644
index 0000000..f9209d1
--- /dev/null
+++ b/tools/extract/Makefile
@@ -0,0 +1,6 @@
+LEVEL = ../..
+# Name of this tool and the libraries listed for it.
+TOOLNAME = extract
+USEDLIBS = bcreader bcwriter transforms ipo analysis transformutils ipa vmcore support
+# Pull in Makefile.common from the directory LEVEL points at.
+include $(LEVEL)/Makefile.common
diff --git a/tools/extract/extract.cpp b/tools/extract/extract.cpp
new file mode 100644
index 0000000..7a6a1c1
--- /dev/null
+++ b/tools/extract/extract.cpp
@@ -0,0 +1,104 @@
+//===----------------------------------------------------------------------===//
+// LLVM extract Utility
+//
+// This utility changes the input module to only contain a single function,
+// which is primarily used for debugging transformations.
+//
+//===----------------------------------------------------------------------===//
+
+#include "llvm/Module.h"
+#include "llvm/PassManager.h"
+#include "llvm/Bytecode/Reader.h"
+#include "llvm/Bytecode/WriteBytecodePass.h"
+#include "llvm/GlobalVariable.h"
+#include "llvm/Function.h"
+#include "llvm/Transforms/IPO/GlobalDCE.h"
+#include "llvm/Transforms/ConstantMerge.h"
+#include "llvm/Transforms/CleanupGCCOutput.h"
+#include "Support/CommandLine.h"
+#include <memory>
+// Options: the bytecode file handed to ParseBytecodeFile, and the function name.
+static cl::String InputFilename("", "Specify input bytecode file", 0, "-");
+static cl::String ExtractFunc("func", "Specify function to extract", 0, "main");
+
+struct FunctionExtractorPass : public Pass {
+  // Human-readable name reported for this pass.
+  const char *getPassName() const { return "Function Extractor"; }
+
+  // Reduce the module to the function named by ExtractFunc, plus stubs for
+  // whatever functions are still referenced.  Always returns true.
+  bool run(Module *M) {
+    // Give every global variable internal linkage.
+    for (Module::giterator GI = M->gbegin(), GE = M->gend(); GI != GE; ++GI)
+      (*GI)->setInternalLinkage(true);
+
+    Function *Kept = 0;
+
+    // Walk the function list.  The first function whose name matches is
+    // unlinked from the module and remembered; every other function has its
+    // references dropped.
+    Module::iterator It = M->begin(), Last = M->end();
+    while (It != Last) {
+      if (Kept || !((*It)->getName() == ExtractFunc)) {
+        (*It)->dropAllReferences();
+        ++It;
+        continue;
+      }
+      Kept = *It;
+      // Note: no ++It here; only the end bound is refreshed after the removal.
+      M->getFunctionList().remove(It);
+      Last = M->end();
+    }
+
+    // Any function left in the module that still has users must be used by a
+    // global variable or by the kept function.  Give each one a new external
+    // stub (same type and name) and redirect its uses to that stub.
+    std::vector<Function*> Stubs;
+    for (Module::iterator FI = M->begin(), FE = M->end(); FI != FE; ++FI) {
+      Function *Old = *FI;
+      if (Old->use_empty())
+        continue;
+      Function *Stub =
+        new Function(Old->getFunctionType(), false, Old->getName());
+      Old->replaceAllUsesWith(Stub);
+      Stubs.push_back(Stub);
+    }
+
+    // Everything still in the list is now unused; delete it all.
+    M->getFunctionList().delete_all();
+
+    // Put the extracted function back, or warn if it never turned up.
+    if (!Kept)
+      std::cerr << "Warning: Function '" << ExtractFunc << "' not found!\n";
+    else
+      M->getFunctionList().push_back(Kept);
+
+    // Finally append the replacement stubs.
+    M->getFunctionList().insert(M->end(), Stubs.begin(), Stubs.end());
+    return true;
+  }
+};
+
+
+int main(int argc, char **argv) {
+  cl::ParseCommandLineOptions(argc, argv, " llvm extractor\n");
+
+  // Load the module named by InputFilename; bail out if that fails.
+  std::auto_ptr<Module> Mod(ParseBytecodeFile(InputFilename));
+  if (!Mod.get()) {
+    std::cerr << "bytecode didn't read correctly.\n";
+    return 1;
+  }
+
+  // Pipeline: extract the requested function, run the cleanup passes, then
+  // emit the resulting bytecode on std::cout.
+  PassManager PM;
+  PM.add(new FunctionExtractorPass());
+  PM.add(createGlobalDCEPass());             // Delete unreachable globals
+  PM.add(createConstantMergePass());         // Merge dup global constants
+  PM.add(createCleanupGCCOutputPass());      // Fix gccisms
+  PM.add(new WriteBytecodePass(&std::cout)); // Write bytecode to std::cout
+
+  PM.run(Mod.get());
+  return 0;
+}
diff --git a/tools/llvm-extract/llvm-extract.cpp b/tools/llvm-extract/llvm-extract.cpp
new file mode 100644
index 0000000..7a6a1c1
--- /dev/null
+++ b/tools/llvm-extract/llvm-extract.cpp
@@ -0,0 +1,104 @@
+//===----------------------------------------------------------------------===//
+// LLVM extract Utility
+//
+// This utility changes the input module to only contain a single function,
+// which is primarily used for debugging transformations.
+//
+//===----------------------------------------------------------------------===//
+
+#include "llvm/Module.h"
+#include "llvm/PassManager.h"
+#include "llvm/Bytecode/Reader.h"
+#include "llvm/Bytecode/WriteBytecodePass.h"
+#include "llvm/GlobalVariable.h"
+#include "llvm/Function.h"
+#include "llvm/Transforms/IPO/GlobalDCE.h"
+#include "llvm/Transforms/ConstantMerge.h"
+#include "llvm/Transforms/CleanupGCCOutput.h"
+#include "Support/CommandLine.h"
+#include <memory>
+// Options: the bytecode file handed to ParseBytecodeFile, and the function name.
+static cl::String InputFilename("", "Specify input bytecode file", 0, "-");
+static cl::String ExtractFunc("func", "Specify function to extract", 0, "main");
+
+struct FunctionExtractorPass : public Pass {
+  // Human-readable name reported for this pass.
+  const char *getPassName() const { return "Function Extractor"; }
+
+  // Reduce the module to the function named by ExtractFunc, plus stubs for
+  // whatever functions are still referenced.  Always returns true.
+  bool run(Module *M) {
+    // Give every global variable internal linkage.
+    for (Module::giterator GI = M->gbegin(), GE = M->gend(); GI != GE; ++GI)
+      (*GI)->setInternalLinkage(true);
+
+    Function *Kept = 0;
+
+    // Walk the function list.  The first function whose name matches is
+    // unlinked from the module and remembered; every other function has its
+    // references dropped.
+    Module::iterator It = M->begin(), Last = M->end();
+    while (It != Last) {
+      if (Kept || !((*It)->getName() == ExtractFunc)) {
+        (*It)->dropAllReferences();
+        ++It;
+        continue;
+      }
+      Kept = *It;
+      // Note: no ++It here; only the end bound is refreshed after the removal.
+      M->getFunctionList().remove(It);
+      Last = M->end();
+    }
+
+    // Any function left in the module that still has users must be used by a
+    // global variable or by the kept function.  Give each one a new external
+    // stub (same type and name) and redirect its uses to that stub.
+    std::vector<Function*> Stubs;
+    for (Module::iterator FI = M->begin(), FE = M->end(); FI != FE; ++FI) {
+      Function *Old = *FI;
+      if (Old->use_empty())
+        continue;
+      Function *Stub =
+        new Function(Old->getFunctionType(), false, Old->getName());
+      Old->replaceAllUsesWith(Stub);
+      Stubs.push_back(Stub);
+    }
+
+    // Everything still in the list is now unused; delete it all.
+    M->getFunctionList().delete_all();
+
+    // Put the extracted function back, or warn if it never turned up.
+    if (!Kept)
+      std::cerr << "Warning: Function '" << ExtractFunc << "' not found!\n";
+    else
+      M->getFunctionList().push_back(Kept);
+
+    // Finally append the replacement stubs.
+    M->getFunctionList().insert(M->end(), Stubs.begin(), Stubs.end());
+    return true;
+  }
+};
+
+
+int main(int argc, char **argv) {
+  cl::ParseCommandLineOptions(argc, argv, " llvm extractor\n");
+
+  // Load the module named by InputFilename; bail out if that fails.
+  std::auto_ptr<Module> Mod(ParseBytecodeFile(InputFilename));
+  if (!Mod.get()) {
+    std::cerr << "bytecode didn't read correctly.\n";
+    return 1;
+  }
+
+  // Pipeline: extract the requested function, run the cleanup passes, then
+  // emit the resulting bytecode on std::cout.
+  PassManager PM;
+  PM.add(new FunctionExtractorPass());
+  PM.add(createGlobalDCEPass());             // Delete unreachable globals
+  PM.add(createConstantMergePass());         // Merge dup global constants
+  PM.add(createCleanupGCCOutputPass());      // Fix gccisms
+  PM.add(new WriteBytecodePass(&std::cout)); // Write bytecode to std::cout
+
+  PM.run(Mod.get());
+  return 0;
+}