diff options
Diffstat (limited to 'lib/Bytecode/Reader/ReaderWrappers.cpp')
-rw-r--r-- | lib/Bytecode/Reader/ReaderWrappers.cpp | 420 |
1 files changed, 420 insertions, 0 deletions
diff --git a/lib/Bytecode/Reader/ReaderWrappers.cpp b/lib/Bytecode/Reader/ReaderWrappers.cpp new file mode 100644 index 0000000000..1ee27185ad --- /dev/null +++ b/lib/Bytecode/Reader/ReaderWrappers.cpp @@ -0,0 +1,420 @@ +//===- ReaderWrappers.cpp - Parse bytecode from file or buffer -----------===// +// +// The LLVM Compiler Infrastructure +// +// This file was developed by the LLVM research group and is distributed under +// the University of Illinois Open Source License. See LICENSE.TXT for details. +// +//===----------------------------------------------------------------------===// +// +// This file implements loading and parsing a bytecode file and parsing a +// bytecode module from a given buffer. +// +//===----------------------------------------------------------------------===// + +#include "llvm/Bytecode/Analyzer.h" +#include "llvm/Bytecode/Reader.h" +#include "Reader.h" +#include "llvm/Module.h" +#include "llvm/Instructions.h" +#include "llvm/ADT/StringExtras.h" +#include "llvm/System/MappedFile.h" +#include <cerrno> +#include <iostream> +using namespace llvm; + +//===----------------------------------------------------------------------===// +// BytecodeFileReader - Read from an mmap'able file descriptor. +// + +namespace { + /// BytecodeFileReader - parses a bytecode file from a file + /// + class BytecodeFileReader : public BytecodeReader { + private: + sys::MappedFile mapFile; + + BytecodeFileReader(const BytecodeFileReader&); // Do not implement + void operator=(const BytecodeFileReader &BFR); // Do not implement + + public: + BytecodeFileReader(const std::string &Filename, llvm::BytecodeHandler* H=0); + }; +} + +BytecodeFileReader::BytecodeFileReader(const std::string &Filename, + llvm::BytecodeHandler* H ) + : BytecodeReader(H) + , mapFile( sys::Path(Filename)) +{ + mapFile.map(); + unsigned char* buffer = reinterpret_cast<unsigned char*>(mapFile.base()); + ParseBytecode(buffer, mapFile.size(), Filename); +} + +//===----------------------------------------------------------------------===// +// BytecodeBufferReader - Read from a memory buffer +// + +namespace { + /// BytecodeBufferReader - parses a bytecode file from a buffer + /// + class BytecodeBufferReader : public BytecodeReader { + private: + const unsigned char *Buffer; + bool MustDelete; + + BytecodeBufferReader(const BytecodeBufferReader&); // Do not implement + void operator=(const BytecodeBufferReader &BFR); // Do not implement + + public: + BytecodeBufferReader(const unsigned char *Buf, unsigned Length, + const std::string &ModuleID, + llvm::BytecodeHandler* Handler = 0); + ~BytecodeBufferReader(); + + }; +} + +BytecodeBufferReader::BytecodeBufferReader(const unsigned char *Buf, + unsigned Length, + const std::string &ModuleID, + llvm::BytecodeHandler* H ) + : BytecodeReader(H) +{ + // If not aligned, allocate a new buffer to hold the bytecode... + const unsigned char *ParseBegin = 0; + if (reinterpret_cast<uint64_t>(Buf) & 3) { + Buffer = new unsigned char[Length+4]; + unsigned Offset = 4 - ((intptr_t)Buffer & 3); // Make sure it's aligned + ParseBegin = Buffer + Offset; + memcpy((unsigned char*)ParseBegin, Buf, Length); // Copy it over + MustDelete = true; + } else { + // If we don't need to copy it over, just use the caller's copy + ParseBegin = Buffer = Buf; + MustDelete = false; + } + try { + ParseBytecode(ParseBegin, Length, ModuleID); + } catch (...) { + if (MustDelete) delete [] Buffer; + throw; + } +} + +BytecodeBufferReader::~BytecodeBufferReader() { + if (MustDelete) delete [] Buffer; +} + +//===----------------------------------------------------------------------===// +// BytecodeStdinReader - Read bytecode from Standard Input +// + +namespace { + /// BytecodeStdinReader - parses a bytecode file from stdin + /// + class BytecodeStdinReader : public BytecodeReader { + private: + std::vector<unsigned char> FileData; + unsigned char *FileBuf; + + BytecodeStdinReader(const BytecodeStdinReader&); // Do not implement + void operator=(const BytecodeStdinReader &BFR); // Do not implement + + public: + BytecodeStdinReader( llvm::BytecodeHandler* H = 0 ); + }; +} + +BytecodeStdinReader::BytecodeStdinReader( BytecodeHandler* H ) + : BytecodeReader(H) +{ + char Buffer[4096*4]; + + // Read in all of the data from stdin, we cannot mmap stdin... + while (std::cin.good()) { + std::cin.read(Buffer, 4096*4); + int BlockSize = std::cin.gcount(); + if (0 >= BlockSize) + break; + FileData.insert(FileData.end(), Buffer, Buffer+BlockSize); + } + + if (FileData.empty()) + throw std::string("Standard Input empty!"); + + FileBuf = &FileData[0]; + ParseBytecode(FileBuf, FileData.size(), "<stdin>"); +} + +//===----------------------------------------------------------------------===// +// Varargs transmogrification code... +// + +// CheckVarargs - This is used to automatically translate old-style varargs to +// new style varargs for backwards compatibility. +static ModuleProvider* CheckVarargs(ModuleProvider* MP) { + Module* M = MP->getModule(); + + // check to see if va_start takes arguements... + Function* F = M->getNamedFunction("llvm.va_start"); + if(F == 0) return MP; //No varargs use, just return. + + if (F->getFunctionType()->getNumParams() == 1) + return MP; // Modern varargs processing, just return. + + // If we get to this point, we know that we have an old-style module. + // Materialize the whole thing to perform the rewriting. + MP->materializeModule(); + + if(Function* F = M->getNamedFunction("llvm.va_start")) { + assert(F->arg_size() == 0 && "Obsolete va_start takes 0 argument!"); + + //foo = va_start() + // -> + //bar = alloca typeof(foo) + //va_start(bar) + //foo = load bar + + const Type* RetTy = Type::getPrimitiveType(Type::VoidTyID); + const Type* ArgTy = F->getFunctionType()->getReturnType(); + const Type* ArgTyPtr = PointerType::get(ArgTy); + Function* NF = M->getOrInsertFunction("llvm.va_start", + RetTy, ArgTyPtr, (Type *)0); + + for(Value::use_iterator I = F->use_begin(), E = F->use_end(); I != E;) + if (CallInst* CI = dyn_cast<CallInst>(*I++)) { + AllocaInst* bar = new AllocaInst(ArgTy, 0, "vastart.fix.1", CI); + new CallInst(NF, bar, "", CI); + Value* foo = new LoadInst(bar, "vastart.fix.2", CI); + CI->replaceAllUsesWith(foo); + CI->getParent()->getInstList().erase(CI); + } + F->setName(""); + } + + if(Function* F = M->getNamedFunction("llvm.va_end")) { + assert(F->arg_size() == 1 && "Obsolete va_end takes 1 argument!"); + //vaend foo + // -> + //bar = alloca 1 of typeof(foo) + //vaend bar + const Type* RetTy = Type::getPrimitiveType(Type::VoidTyID); + const Type* ArgTy = F->getFunctionType()->getParamType(0); + const Type* ArgTyPtr = PointerType::get(ArgTy); + Function* NF = M->getOrInsertFunction("llvm.va_end", + RetTy, ArgTyPtr, (Type *)0); + + for(Value::use_iterator I = F->use_begin(), E = F->use_end(); I != E;) + if (CallInst* CI = dyn_cast<CallInst>(*I++)) { + AllocaInst* bar = new AllocaInst(ArgTy, 0, "vaend.fix.1", CI); + new StoreInst(CI->getOperand(1), bar, CI); + new CallInst(NF, bar, "", CI); + CI->getParent()->getInstList().erase(CI); + } + F->setName(""); + } + + if(Function* F = M->getNamedFunction("llvm.va_copy")) { + assert(F->arg_size() == 1 && "Obsolete va_copy takes 1 argument!"); + //foo = vacopy(bar) + // -> + //a = alloca 1 of typeof(foo) + //b = alloca 1 of typeof(foo) + //store bar -> b + //vacopy(a, b) + //foo = load a + + const Type* RetTy = Type::getPrimitiveType(Type::VoidTyID); + const Type* ArgTy = F->getFunctionType()->getReturnType(); + const Type* ArgTyPtr = PointerType::get(ArgTy); + Function* NF = M->getOrInsertFunction("llvm.va_copy", + RetTy, ArgTyPtr, ArgTyPtr, (Type *)0); + + for(Value::use_iterator I = F->use_begin(), E = F->use_end(); I != E;) + if (CallInst* CI = dyn_cast<CallInst>(*I++)) { + AllocaInst* a = new AllocaInst(ArgTy, 0, "vacopy.fix.1", CI); + AllocaInst* b = new AllocaInst(ArgTy, 0, "vacopy.fix.2", CI); + new StoreInst(CI->getOperand(1), b, CI); + new CallInst(NF, a, b, "", CI); + Value* foo = new LoadInst(a, "vacopy.fix.3", CI); + CI->replaceAllUsesWith(foo); + CI->getParent()->getInstList().erase(CI); + } + F->setName(""); + } + return MP; +} + +//===----------------------------------------------------------------------===// +// Wrapper functions +//===----------------------------------------------------------------------===// + +/// getBytecodeBufferModuleProvider - lazy function-at-a-time loading from a +/// buffer +ModuleProvider* +llvm::getBytecodeBufferModuleProvider(const unsigned char *Buffer, + unsigned Length, + const std::string &ModuleID, + BytecodeHandler* H ) { + return CheckVarargs( + new BytecodeBufferReader(Buffer, Length, ModuleID, H)); +} + +/// ParseBytecodeBuffer - Parse a given bytecode buffer +/// +Module *llvm::ParseBytecodeBuffer(const unsigned char *Buffer, unsigned Length, + const std::string &ModuleID, + std::string *ErrorStr){ + try { + std::auto_ptr<ModuleProvider> + AMP(getBytecodeBufferModuleProvider(Buffer, Length, ModuleID)); + return AMP->releaseModule(); + } catch (std::string &err) { + if (ErrorStr) *ErrorStr = err; + return 0; + } +} + +/// getBytecodeModuleProvider - lazy function-at-a-time loading from a file +/// +ModuleProvider *llvm::getBytecodeModuleProvider(const std::string &Filename, + BytecodeHandler* H) { + if (Filename != std::string("-")) // Read from a file... + return CheckVarargs(new BytecodeFileReader(Filename,H)); + else // Read from stdin + return CheckVarargs(new BytecodeStdinReader(H)); +} + +/// ParseBytecodeFile - Parse the given bytecode file +/// +Module *llvm::ParseBytecodeFile(const std::string &Filename, + std::string *ErrorStr) { + try { + std::auto_ptr<ModuleProvider> AMP(getBytecodeModuleProvider(Filename)); + return AMP->releaseModule(); + } catch (std::string &err) { + if (ErrorStr) *ErrorStr = err; + return 0; + } +} + +// AnalyzeBytecodeFile - analyze one file +Module* llvm::AnalyzeBytecodeFile( + const std::string &Filename, ///< File to analyze + BytecodeAnalysis& bca, ///< Statistical output + std::string *ErrorStr, ///< Error output + std::ostream* output ///< Dump output +) +{ + try { + BytecodeHandler* analyzerHandler =createBytecodeAnalyzerHandler(bca,output); + std::auto_ptr<ModuleProvider> AMP( + getBytecodeModuleProvider(Filename,analyzerHandler)); + return AMP->releaseModule(); + } catch (std::string &err) { + if (ErrorStr) *ErrorStr = err; + return 0; + } +} + +// AnalyzeBytecodeBuffer - analyze a buffer +Module* llvm::AnalyzeBytecodeBuffer( + const unsigned char* Buffer, ///< Pointer to start of bytecode buffer + unsigned Length, ///< Size of the bytecode buffer + const std::string& ModuleID, ///< Identifier for the module + BytecodeAnalysis& bca, ///< The results of the analysis + std::string* ErrorStr, ///< Errors, if any. + std::ostream* output ///< Dump output, if any +) +{ + try { + BytecodeHandler* hdlr = createBytecodeAnalyzerHandler(bca, output); + std::auto_ptr<ModuleProvider> + AMP(getBytecodeBufferModuleProvider(Buffer, Length, ModuleID, hdlr)); + return AMP->releaseModule(); + } catch (std::string &err) { + if (ErrorStr) *ErrorStr = err; + return 0; + } +} + +bool llvm::GetBytecodeDependentLibraries(const std::string &fname, + Module::LibraryListType& deplibs) { + try { + std::auto_ptr<ModuleProvider> AMP( getBytecodeModuleProvider(fname)); + Module* M = AMP->releaseModule(); + + deplibs = M->getLibraries(); + delete M; + return true; + } catch (...) { + deplibs.clear(); + return false; + } +} + +static void getSymbols(Module*M, std::vector<std::string>& symbols) { + // Loop over global variables + for (Module::global_iterator GI = M->global_begin(), GE=M->global_end(); GI != GE; ++GI) + if (!GI->isExternal() && !GI->hasInternalLinkage()) + if (!GI->getName().empty()) + symbols.push_back(GI->getName()); + + // Loop over functions. + for (Module::iterator FI = M->begin(), FE = M->end(); FI != FE; ++FI) + if (!FI->isExternal() && !FI->hasInternalLinkage()) + if (!FI->getName().empty()) + symbols.push_back(FI->getName()); +} + +// Get just the externally visible defined symbols from the bytecode +bool llvm::GetBytecodeSymbols(const sys::Path& fName, + std::vector<std::string>& symbols) { + try { + std::auto_ptr<ModuleProvider> AMP( + getBytecodeModuleProvider(fName.toString())); + + // Get the module from the provider + Module* M = AMP->materializeModule(); + + // Get the symbols + getSymbols(M, symbols); + + // Done with the module + return true; + + } catch (...) { + return false; + } +} + +ModuleProvider* +llvm::GetBytecodeSymbols(const unsigned char*Buffer, unsigned Length, + const std::string& ModuleID, + std::vector<std::string>& symbols) { + + ModuleProvider* MP = 0; + try { + // Get the module provider + MP = getBytecodeBufferModuleProvider(Buffer, Length, ModuleID); + + // Get the module from the provider + Module* M = MP->materializeModule(); + + // Get the symbols + getSymbols(M, symbols); + + // Done with the module. Note that ModuleProvider will delete the + // Module when it is deleted. Also note that its the caller's responsibility + // to delete the ModuleProvider. + return MP; + + } catch (...) { + // We delete only the ModuleProvider here because its destructor will + // also delete the Module (we used materializeModule not releaseModule). + delete MP; + } + return 0; +} |