Discard code that supported old bytecode formats. This makes the Bytecode

Reader code much easier to read and maintain. Backwards compatibility from version 5 format has been retained. Older formats will produce an error. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@31723 91177308-0d34-0410-b5e6-96231b3b80d8
author: Reid Spencer <rspencer@reidspencer.com> 2006-11-14 04:47:22 +0000
committer: Reid Spencer <rspencer@reidspencer.com> 2006-11-14 04:47:22 +0000
commit: d798a515e93e1ac323ecff8dc6c0b0567c252e36 (patch)
tree: d5c74b60fe1e0c2615b3cbddc6ce781df6016ab1
parent: df1a10ece6a75f230d98c6fb001349eede90387a (diff)
10 files changed, 170 insertions, 21800 deletions
diff --git a/include/llvm/Bytecode/Analyzer.h b/include/llvm/Bytecode/Analyzer.h
index 825325dcf9..491629d7ed 100644
--- a/include/llvm/Bytecode/Analyzer.h
+++ b/include/llvm/Bytecode/Analyzer.h
@@ -68,7 +68,7 @@ struct BytecodeAnalysis {
   unsigned vbrCompBytes;    ///< Number of vbr bytes (compressed)
   unsigned vbrExpdBytes;    ///< Number of vbr bytes (expanded)
 
-  typedef std::map<BytecodeFormat::CompressedBytecodeBlockIdentifiers,unsigned>
+  typedef std::map<BytecodeFormat::BytecodeBlockIdentifiers,unsigned>
       BlockSizeMap;
   BlockSizeMap BlockSizes;
 
diff --git a/include/llvm/Bytecode/Format.h b/include/llvm/Bytecode/Format.h
index 24d1ed67ee..562d8ff011 100644
--- a/include/llvm/Bytecode/Format.h
+++ b/include/llvm/Bytecode/Format.h
@@ -20,78 +20,37 @@ namespace llvm {
 class BytecodeFormat {   // Throw the constants into a poorman's namespace...
   BytecodeFormat();      // do not implement
 public:
-
-  // ID Numbers that are used in bytecode files...
-  enum FileBlockIDs {
-    // File level identifiers...
-    Module = 0x01,
-
-    // Module subtypes:
-    Function = 0x11,
-    ConstantPool,
-    SymbolTable,
-    ModuleGlobalInfo,
-    GlobalTypePlane,
-    DependentLibs,
-
-    // Function subtypes:
-    // Can also have ConstantPool block
-    // Can also have SymbolTable block
-    BasicBlock = 0x31,// May contain many basic blocks (obsolete since LLVM 1.1)
-
-    // InstructionList - The instructions in the body of a function.  This
-    // superceeds the old BasicBlock node used in LLVM 1.0.
-    InstructionList = 0x32,
-
-    // CompactionTable - blocks with this id are used to define local remapping
-    // tables for a function, allowing the indices used within the function to
-    // be as small as possible.  This often allows the instructions to be
-    // encoded more efficiently.
-    CompactionTable = 0x33
-  };
-
-  /// In LLVM 1.3 format, the identifier and the size of the block are
-  /// encoded into a single vbr_uint32 with 5 bits for the block identifier
-  /// and 27-bits for block length. This limits blocks to a maximum of
+  /// The the identifier and the size of the block are encoded into a single 
+  /// vbr_uint32 with 5 bits for the block identifier and 27-bits for block 
+  /// length. This limits blocks to a maximum of
   /// 128MBytes of data, and block types to 31 which should be sufficient
   /// for the foreseeable usage. Because the values of block identifiers MUST
   /// fit within 5 bits (values 1-31), this enumeration is used to ensure
   /// smaller values are used for 1.3 and subsequent bytecode versions.
   /// @brief The block number identifiers used in LLVM 1.3 bytecode
   /// format.
-  enum CompressedBytecodeBlockIdentifiers {
-
-    // Zero value ist verbotten!
-    Reserved_DoNotUse = 0x00,      ///< Don't use this!
-
-    // This is the uber block that contains the rest of the blocks.
-    ModuleBlockID = 0x01,          ///< 1.3 identifier for modules
-
-    // Module subtypes:
-
-    // This is the identifier for a function
-    FunctionBlockID = 0x02,        ///< 1.3 identifier for Functions
-    ConstantPoolBlockID = 0x03,    ///< 1.3 identifier for constant pool
-    SymbolTableBlockID = 0x04,     ///< 1.3 identifier for symbol table
-    ModuleGlobalInfoBlockID = 0x05,///< 1.3 identifier for module globals
-    GlobalTypePlaneBlockID = 0x06, ///< 1.3 identifier for global types
-
-    // Function subtypes:
-
-    // InstructionList - The instructions in the body of a function.  This
-    // superceeds the old BasicBlock node used in LLVM 1.0.
-    InstructionListBlockID = 0x07, ///< 1.3 identifier for insruction list
-
-    // CompactionTable - blocks with this id are used to define local remapping
-    // tables for a function, allowing the indices used within the function to
-    // be as small as possible.  This often allows the instructions to be
-    // encoded more efficiently.
-    CompactionTableBlockID = 0x08, ///< 1.3 identifier for compaction tables
+  enum BytecodeBlockIdentifiers {
+
+    Reserved_DoNotUse      = 0,  ///< Zero value is forbidden, do not use.
+    ModuleBlockID          = 1,  ///< Module block that contains other blocks.
+    FunctionBlockID        = 2,  ///< Function block identifier
+    ConstantPoolBlockID    = 3,  ///< Constant pool identifier
+    SymbolTableBlockID     = 4,  ///< Symbol table identifier
+    ModuleGlobalInfoBlockID= 5,  ///< Module global info identifier
+    GlobalTypePlaneBlockID = 6,  ///< Global type plan identifier
+    InstructionListBlockID = 7,  ///< All instructions in a function
+
+    /// Blocks with this id are used to define a function local remapping
+    /// table for the function's values. This allows the indices used within 
+    /// the function to be as small as possible.  This often allows the 
+    /// instructions to be encoded more efficiently because VBR takes fewer
+    /// bytes with smaller values.
+    /// @brief Value Compaction Table Block
+    CompactionTableBlockID = 0x08,
 
     // Not a block id, just used to count them
     NumberOfBlockIDs
   };
-
 };
 
 } // End llvm namespace
diff --git a/lib/Bytecode/Reader/Analyzer.cpp b/lib/Bytecode/Reader/Analyzer.cpp
index 23d524c0aa..3d6a001080 100644
--- a/lib/Bytecode/Reader/Analyzer.cpp
+++ b/lib/Bytecode/Reader/Analyzer.cpp
@@ -532,7 +532,7 @@ public:
     assert(BType >= BytecodeFormat::ModuleBlockID);
     assert(BType < BytecodeFormat::NumberOfBlockIDs);
     bca.BlockSizes[
-      llvm::BytecodeFormat::CompressedBytecodeBlockIdentifiers(BType)] += Size;
+      llvm::BytecodeFormat::BytecodeBlockIdentifiers(BType)] += Size;
 
     if (bca.version < 3) // Check for long block headers versions
       bca.BlockSizes[llvm::BytecodeFormat::Reserved_DoNotUse] += 8;
diff --git a/lib/Bytecode/Reader/Reader.cpp b/lib/Bytecode/Reader/Reader.cpp
index 43150365e5..084b4fcade 100644
--- a/lib/Bytecode/Reader/Reader.cpp
+++ b/lib/Bytecode/Reader/Reader.cpp
@@ -73,18 +73,6 @@ inline void BytecodeReader::checkPastBlockEnd(const char * block_name) {
           " block.");
 }
 
-/// Align the buffer position to a 32 bit boundary
-inline void BytecodeReader::align32() {
-  if (hasAlignment) {
-    BufPtr Save = At;
-    At = (const unsigned char *)((intptr_t)(At+3) & (~3UL));
-    if (At > Save)
-      if (Handler) Handler->handleAlignment(At - Save);
-    if (At > BlockEnd)
-      error("Ran out of data while aligning!");
-  }
-}
-
 /// Read a whole unsigned integer
 inline unsigned BytecodeReader::read_uint() {
   if (At+4 > BlockEnd)
@@ -179,43 +167,9 @@ inline void BytecodeReader::read_double(double& DoubleVal) {
 
 /// Read a block header and obtain its type and size
 inline void BytecodeReader::read_block(unsigned &Type, unsigned &Size) {
-  if ( hasLongBlockHeaders ) {
-    Type = read_uint();
-    Size = read_uint();
-    switch (Type) {
-    case BytecodeFormat::Reserved_DoNotUse :
-      error("Reserved_DoNotUse used as Module Type?");
-      Type = BytecodeFormat::ModuleBlockID; break;
-    case BytecodeFormat::Module:
-      Type = BytecodeFormat::ModuleBlockID; break;
-    case BytecodeFormat::Function:
-      Type = BytecodeFormat::FunctionBlockID; break;
-    case BytecodeFormat::ConstantPool:
-      Type = BytecodeFormat::ConstantPoolBlockID; break;
-    case BytecodeFormat::SymbolTable:
-      Type = BytecodeFormat::SymbolTableBlockID; break;
-    case BytecodeFormat::ModuleGlobalInfo:
-      Type = BytecodeFormat::ModuleGlobalInfoBlockID; break;
-    case BytecodeFormat::GlobalTypePlane:
-      Type = BytecodeFormat::GlobalTypePlaneBlockID; break;
-    case BytecodeFormat::InstructionList:
-      Type = BytecodeFormat::InstructionListBlockID; break;
-    case BytecodeFormat::CompactionTable:
-      Type = BytecodeFormat::CompactionTableBlockID; break;
-    case BytecodeFormat::BasicBlock:
-      /// This block type isn't used after version 1.1. However, we have to
-      /// still allow the value in case this is an old bc format file.
-      /// We just let its value creep thru.
-      break;
-    default:
-      error("Invalid block id found: " + utostr(Type));
-      break;
-    }
-  } else {
-    Size = read_uint();
-    Type = Size & 0x1F; // mask low order five bits
-    Size >>= 5; // get rid of five low order bits, leaving high 27
-  }
+  Size = read_uint(); // Read the header
+  Type = Size & 0x1F; // mask low order five bits to get type
+  Size >>= 5;         // high order 27 bits is the size
   BlockStart = At;
   if (At + Size > BlockEnd)
     error("Attempt to size a block past end of memory");
@@ -223,56 +177,13 @@ inline void BytecodeReader::read_block(unsigned &Type, unsigned &Size) {
   if (Handler) Handler->handleBlock(Type, BlockStart, Size);
 }
 
-
-/// In LLVM 1.2 and before, Types were derived from Value and so they were
-/// written as part of the type planes along with any other Value. In LLVM
-/// 1.3 this changed so that Type does not derive from Value. Consequently,
-/// the BytecodeReader's containers for Values can't contain Types because
-/// there's no inheritance relationship. This means that the "Type Type"
-/// plane is defunct along with the Type::TypeTyID TypeID. In LLVM 1.3
-/// whenever a bytecode construct must have both types and values together,
-/// the types are always read/written first and then the Values. Furthermore
-/// since Type::TypeTyID no longer exists, its value (12) now corresponds to
-/// Type::LabelTyID. In order to overcome this we must "sanitize" all the
-/// type TypeIDs we encounter. For LLVM 1.3 bytecode files, there's no change.
-/// For LLVM 1.2 and before, this function will decrement the type id by
-/// one to account for the missing Type::TypeTyID enumerator if the value is
-/// larger than 12 (Type::LabelTyID). If the value is exactly 12, then this
-/// function returns true, otherwise false. This helps detect situations
-/// where the pre 1.3 bytecode is indicating that what follows is a type.
-/// @returns true iff type id corresponds to pre 1.3 "type type"
-inline bool BytecodeReader::sanitizeTypeId(unsigned &TypeId) {
-  if (hasTypeDerivedFromValue) { /// do nothing if 1.3 or later
-    if (TypeId == Type::LabelTyID) {
-      TypeId = Type::VoidTyID; // sanitize it
-      return true; // indicate we got TypeTyID in pre 1.3 bytecode
-    } else if (TypeId > Type::LabelTyID)
-      --TypeId; // shift all planes down because type type plane is missing
-  }
-  return false;
-}
-
-/// Reads a vbr uint to read in a type id and does the necessary
-/// conversion on it by calling sanitizeTypeId.
-/// @returns true iff \p TypeId read corresponds to a pre 1.3 "type type"
-/// @see sanitizeTypeId
-inline bool BytecodeReader::read_typeid(unsigned &TypeId) {
-  TypeId = read_vbr_uint();
-  if ( !has32BitTypes )
-    if ( TypeId == 0x00FFFFFF )
-      TypeId = read_vbr_uint();
-  return sanitizeTypeId(TypeId);
-}
-
 //===----------------------------------------------------------------------===//
 // IR Lookup Methods
 //===----------------------------------------------------------------------===//
 
 /// Determine if a type id has an implicit null value
 inline bool BytecodeReader::hasImplicitNull(unsigned TyID) {
-  if (!hasExplicitPrimitiveZeros)
-    return TyID != Type::LabelTyID && TyID != Type::VoidTyID;
-  return TyID >= Type::FirstDerivedTyID;
+  return TyID != Type::LabelTyID && TyID != Type::VoidTyID;
 }
 
 /// Obtain a type given a typeid and account for things like compaction tables,
@@ -304,23 +215,11 @@ const Type *BytecodeReader::getType(unsigned ID) {
   return Type::VoidTy;
 }
 
-/// Get a sanitized type id. This just makes sure that the \p ID
-/// is both sanitized and not the "type type" of pre-1.3 bytecode.
-/// @see sanitizeTypeId
-inline const Type* BytecodeReader::getSanitizedType(unsigned& ID) {
-  if (sanitizeTypeId(ID))
-    error("Invalid type id encountered");
-  return getType(ID);
-}
-
-/// This method just saves some coding. It uses read_typeid to read
+/// This method just saves some coding. It uses read_vbr_uint to read
 /// in a sanitized type id, errors that its not the type type, and
 /// then calls getType to return the type value.
-inline const Type* BytecodeReader::readSanitizedType() {
-  unsigned ID;
-  if (read_typeid(ID))
-    error("Invalid type id encountered");
-  return getType(ID);
+inline const Type* BytecodeReader::readType() {
+  return getType(read_vbr_uint());
 }
 
 /// Get the slot number associated with a type accounting for primitive
@@ -590,12 +489,6 @@ BytecodeReader::upgradeInstrOpcodes(
   if (!hasSignlessDivRem && !hasSignlessShrCastSetcc)
     return 0; // The opcode is fine the way it is.
 
-  // If this is a bytecode format that did not include the unreachable
-  // instruction, bump up the opcode number to adjust it.
-  if (hasNoUnreachableInst)
-    if (Opcode >= 6 && Opcode < 62)
-      ++Opcode;
-
   // If this is bytecode version 6, that only had signed Rem and Div 
   // instructions, then we must compensate for those two instructions only.
   // So that the switch statement below works, we're trying to turn this into
@@ -779,7 +672,7 @@ BytecodeReader::upgradeInstrOpcodes(
       CallInst* bar = new CallInst(NF, getValue(iType, Oprnds[0]));
       BB->getInstList().push_back(bar);
       BB->getInstList().push_back(new StoreInst(bar, foo));
-      Instruction* tmp = new VAArgInst(foo, getSanitizedType(Oprnds[1]));
+      Instruction* tmp = new VAArgInst(foo, getType(Oprnds[1]));
       BB->getInstList().push_back(tmp);
       Result = new LoadInst(foo);
       break;
@@ -803,7 +696,7 @@ BytecodeReader::upgradeInstrOpcodes(
       CallInst* bar = new CallInst(NF, getValue(iType, Oprnds[0]));
       BB->getInstList().push_back(bar);
       BB->getInstList().push_back(new StoreInst(bar, foo));
-      Result = new VAArgInst(foo, getSanitizedType(Oprnds[1]));
+      Result = new VAArgInst(foo, getType(Oprnds[1]));
       break;
     }
     case 34: // Select
@@ -919,11 +812,10 @@ void BytecodeReader::ParseInstruction(std::vector<unsigned> &Oprnds,
 
     for (unsigned i = 0; i != NumOprnds; ++i)
       Oprnds[i] = read_vbr_uint();
-    align32();
     break;
   }
 
-  const Type *InstTy = getSanitizedType(iType);
+  const Type *InstTy = getType(iType);
 
   // Make the necessary adjustments for dealing with backwards compatibility
   // of opcodes.
@@ -955,7 +847,7 @@ void BytecodeReader::ParseInstruction(std::vector<unsigned> &Oprnds,
       if (Oprnds.size() != 2)
         error("Invalid VAArg instruction!");
       Result = new VAArgInst(getValue(iType, Oprnds[0]),
-                             getSanitizedType(Oprnds[1]));
+                             getType(Oprnds[1]));
       break;
     case Instruction::ExtractElement: {
       if (Oprnds.size() != 2)
@@ -1001,7 +893,7 @@ void BytecodeReader::ParseInstruction(std::vector<unsigned> &Oprnds,
       if (Oprnds.size() != 2)
         error("Invalid Cast instruction!");
       Result = new CastInst(getValue(iType, Oprnds[0]),
-                            getSanitizedType(Oprnds[1]));
+                            getType(Oprnds[1]));
       break;
     case Instruction::Select:
       if (Oprnds.size() != 3)
@@ -1235,34 +1127,22 @@ void BytecodeReader::ParseInstruction(std::vector<unsigned> &Oprnds,
 
         unsigned ValIdx = Oprnds[i];
         unsigned IdxTy = 0;
-        if (!hasRestrictedGEPTypes) {
-          // Struct indices are always uints, sequential type indices can be 
-          // any of the 32 or 64-bit integer types.  The actual choice of 
-          // type is encoded in the low two bits of the slot number.
-          if (isa<StructType>(TopTy))
-            IdxTy = Type::UIntTyID;
-          else {
-            switch (ValIdx & 3) {
-            default:
-            case 0: IdxTy = Type::UIntTyID; break;
-            case 1: IdxTy = Type::IntTyID; break;
-            case 2: IdxTy = Type::ULongTyID; break;
-            case 3: IdxTy = Type::LongTyID; break;
-            }
-            ValIdx >>= 2;
+        // Struct indices are always uints, sequential type indices can be 
+        // any of the 32 or 64-bit integer types.  The actual choice of 
+        // type is encoded in the low two bits of the slot number.
+        if (isa<StructType>(TopTy))
+          IdxTy = Type::UIntTyID;
+        else {
+          switch (ValIdx & 3) {
+          default:
+          case 0: IdxTy = Type::UIntTyID; break;
+          case 1: IdxTy = Type::IntTyID; break;
+          case 2: IdxTy = Type::ULongTyID; break;
+          case 3: IdxTy = Type::LongTyID; break;
           }
-        } else {
-          IdxTy = isa<StructType>(TopTy) ? Type::UByteTyID : Type::LongTyID;
+          ValIdx >>= 2;
         }
-
         Idx.push_back(getValue(IdxTy, ValIdx));
-
-        // Convert ubyte struct indices into uint struct indices.
-        if (isa<StructType>(TopTy) && hasRestrictedGEPTypes)
-          if (ConstantInt *C = dyn_cast<ConstantInt>(Idx.back()))
-            if (C->getType() == Type::UByteTy)
-              Idx[Idx.size()-1] = ConstantExpr::getCast(C, Type::UIntTy);
-
         NextTy = GetElementPtrInst::getIndexedType(InstTy, Idx, true);
       }
 
@@ -1309,16 +1189,16 @@ void BytecodeReader::ParseInstruction(std::vector<unsigned> &Oprnds,
 }
 
 /// Get a particular numbered basic block, which might be a forward reference.
-/// This works together with ParseBasicBlock to handle these forward references
-/// in a clean manner.  This function is used when constructing phi, br, switch,
-/// and other instructions that reference basic blocks. Blocks are numbered
-/// sequentially as they appear in the function.
+/// This works together with ParseInstructionList to handle these forward 
+/// references in a clean manner.  This function is used when constructing 
+/// phi, br, switch, and other instructions that reference basic blocks. 
+/// Blocks are numbered sequentially as they appear in the function.
 BasicBlock *BytecodeReader::getBasicBlock(unsigned ID) {
   // Make sure there is room in the table...
   if (ParsedBasicBlocks.size() <= ID) ParsedBasicBlocks.resize(ID+1);
 
-  // First check to see if this is a backwards reference, i.e., ParseBasicBlock
-  // has already created this block, or if the forward reference has already
+  // First check to see if this is a backwards reference, i.e. this block
+  // has already been created, or if the forward reference has already
   // been created.
   if (ParsedBasicBlocks[ID])
     return ParsedBasicBlocks[ID];
@@ -1328,34 +1208,10 @@ BasicBlock *BytecodeReader::getBasicBlock(unsigned ID) {
   return ParsedBasicBlocks[ID] = new BasicBlock();
 }
 
-/// In LLVM 1.0 bytecode files, we used to output one basicblock at a time.
-/// This method reads in one of the basicblock packets. This method is not used
-/// for bytecode files after LLVM 1.0
-/// @returns The basic block constructed.
-BasicBlock *BytecodeReader::ParseBasicBlock(unsigned BlockNo) {
-  if (Handler) Handler->handleBasicBlockBegin(BlockNo);
-
-  BasicBlock *BB = 0;
-
-  if (ParsedBasicBlocks.size() == BlockNo)
-    ParsedBasicBlocks.push_back(BB = new BasicBlock());
-  else if (ParsedBasicBlocks[BlockNo] == 0)
-    BB = ParsedBasicBlocks[BlockNo] = new BasicBlock();
-  else
-    BB = ParsedBasicBlocks[BlockNo];
-
-  std::vector<unsigned> Operands;
-  while (moreInBlock())
-    ParseInstruction(Operands, BB);
-
-  if (Handler) Handler->handleBasicBlockEnd(BlockNo);
-  return BB;
-}
-
 /// Parse all of the BasicBlock's & Instruction's in the body of a function.
 /// In post 1.0 bytecode files, we no longer emit basic block individually,
 /// in order to avoid per-basic-block overhead.
-/// @returns Rhe number of basic blocks encountered.
+/// @returns the number of basic blocks encountered.
 unsigned BytecodeReader::ParseInstructionList(Function* F) {
   unsigned BlockNo = 0;
   std::vector<unsigned> Args;
@@ -1401,52 +1257,35 @@ void BytecodeReader::ParseSymbolTable(Function *CurrentFunction,
            E = CurrentFunction->end(); I != E; ++I)
       BBMap.push_back(I);
 
-  /// In LLVM 1.3 we write types separately from values so
-  /// The types are always first in the symbol table. This is
-  /// because Type no longer derives from Value.
-  if (!hasTypeDerivedFromValue) {
-    // Symtab block header: [num entries]
-    unsigned NumEntries = read_vbr_uint();
-    for (unsigned i = 0; i < NumEntries; ++i) {
-      // Symtab entry: [def slot #][name]
-      unsigned slot = read_vbr_uint();
-      std::string Name = read_str();
-      const Type* T = getType(slot);
-      ST->insert(Name, T);
-    }
+  // Symtab block header: [num entries]
+  unsigned NumEntries = read_vbr_uint();
+  for (unsigned i = 0; i < NumEntries; ++i) {
+    // Symtab entry: [def slot #][name]
+    unsigned slot = read_vbr_uint();
+    std::string Name = read_str();
+    const Type* T = getType(slot);
+    ST->insert(Name, T);
   }
 
   while (moreInBlock()) {
     // Symtab block header: [num entries][type id number]
     unsigned NumEntries = read_vbr_uint();
-    unsigned Typ = 0;
-    bool isTypeType = read_typeid(Typ);
+    unsigned Typ = read_vbr_uint();
 
     for (unsigned i = 0; i != NumEntries; ++i) {
       // Symtab entry: [def slot #][name]
       unsigned slot = read_vbr_uint();
       std::string Name = read_str();
-
-      // if we're reading a pre 1.3 bytecode file and the type plane
-      // is the "type type", handle it here
-      if (isTypeType) {
-        const Type* T = getType(slot);
-        if (T == 0)
-          error("Failed type look-up for name '" + Name + "'");
-        ST->insert(Name, T);
-        continue; // code below must be short circuited
+      Value *V = 0;
+      if (Typ == Type::LabelTyID) {
+        if (slot < BBMap.size())
+          V = BBMap[slot];
       } else {
-        Value *V = 0;
-        if (Typ == Type::LabelTyID) {
-          if (slot < BBMap.size())
-            V = BBMap[slot];
-        } else {
-          V = getValue(Typ, slot, false); // Find mapping...
-        }
-        if (V == 0)
-          error("Failed value look-up for name '" + Name + "'");
-        V->setName(Name);
+        V = getValue(Typ, slot, false); // Find mapping...
       }
+      if (V == 0)
+        error("Failed value look-up for name '" + Name + "'");
+      V->setName(Name);
     }
   }
   checkPastBlockEnd("Symbol Table");
@@ -1456,9 +1295,7 @@ void BytecodeReader::ParseSymbolTable(Function *CurrentFunction,
 /// Read in the types portion of a compaction table.
 void BytecodeReader::ParseCompactionTypes(unsigned NumEntries) {
   for (unsigned i = 0; i != NumEntries; ++i) {
-    unsigned TypeSlot = 0;
-    if (read_typeid(TypeSlot))
-      error("Invalid type in compaction table: type type");
+    unsigned TypeSlot = read_vbr_uint();
     const Type *Typ = getGlobalTableType(TypeSlot);
     CompactionTypes.push_back(std::make_pair(Typ, TypeSlot));
     if (Handler) Handler->handleCompactionTableType(i, TypeSlot, Typ);
@@ -1471,14 +1308,9 @@ void BytecodeReader::ParseCompactionTable() {
   // Notify handler that we're beginning a compaction table.
   if (Handler) Handler->handleCompactionTableBegin();
 
-  // In LLVM 1.3 Type no longer derives from Value. So,
-  // we always write them first in the compaction table
-  // because they can't occupy a "type plane" where the
-  // Values reside.
-  if (! hasTypeDerivedFromValue) {
-    unsigned NumEntries = read_vbr_uint();
-    ParseCompactionTypes(NumEntries);
-  }
+  // Get the types for the compaction table.
+  unsigned NumEntries = read_vbr_uint();
+  ParseCompactionTypes(NumEntries);
 
   // Compaction tables live in separate blocks so we have to loop
   // until we've read the whole thing.
@@ -1486,7 +1318,6 @@ void BytecodeReader::ParseCompactionTable() {
     // Read the number of Value* entries in the compaction table
     unsigned NumEntries = read_vbr_uint();
     unsigned Ty = 0;
-    unsigned isTypeType = false;
 
     // Decode the type from value read in. Most compaction table
     // planes will have one or two entries in them. If that's the
@@ -1496,42 +1327,35 @@ void BytecodeReader::ParseCompactionTable() {
       // In this case, both low-order bits are set (value 3). This
       // is a signal that the typeid follows.
       NumEntries >>= 2;
-      isTypeType = read_typeid(Ty);
+      Ty = read_vbr_uint();
     } else {
       // In this case, the low-order bits specify the number of entries
       // and the high order bits specify the type.
       Ty = NumEntries >> 2;
-      isTypeType = sanitizeTypeId(Ty);
       NumEntries &= 3;
     }
 
-    // if we're reading a pre 1.3 bytecode file and the type plane
-    // is the "type type", handle it here
-    if (isTypeType) {
-      ParseCompactionTypes(NumEntries);
-    } else {
-      // Make sure we have enough room for the plane.
-      if (Ty >= CompactionValues.size())
-        CompactionValues.resize(Ty+1);
-
-      // Make sure the plane is empty or we have some kind of error.
-      if (!CompactionValues[Ty].empty())
-        error("Compaction table plane contains multiple entries!");
-
-      // Notify handler about the plane.
-      if (Handler) Handler->handleCompactionTablePlane(Ty, NumEntries);
-
-      // Push the implicit zero.
-      CompactionValues[Ty].push_back(Constant::getNullValue(getType(Ty)));
-
-      // Read in each of the entries, put them in the compaction table
-      // and notify the handler that we have a new compaction table value.
-      for (unsigned i = 0; i != NumEntries; ++i) {
-        unsigned ValSlot = read_vbr_uint();
-        Value *V = getGlobalTableValue(Ty, ValSlot);
-        CompactionValues[Ty].push_back(V);
-        if (Handler) Handler->handleCompactionTableValue(i, Ty, ValSlot);
-      }
+    // Make sure we have enough room for the plane.
+    if (Ty >= CompactionValues.size())
+      CompactionValues.resize(Ty+1);
+
+    // Make sure the plane is empty or we have some kind of error.
+    if (!CompactionValues[Ty].empty())
+      error("Compaction table plane contains multiple entries!");
+
+    // Notify handler about the plane.
+    if (Handler) Handler->handleCompactionTablePlane(Ty, NumEntries);
+
+    // Push the implicit zero.
+    CompactionValues[Ty].push_back(Constant::getNullValue(getType(Ty)));
+
+    // Read in each of the entries, put them in the compaction table
+    // and notify the handler that we have a new compaction table value.
+    for (unsigned i = 0; i != NumEntries; ++i) {
+      unsigned ValSlot = read_vbr_uint();
+      Value *V = getGlobalTableValue(Ty, ValSlot);
+      CompactionValues[Ty].push_back(V);
+      if (Handler) Handler->handleCompactionTableValue(i, Ty, ValSlot);
     }
   }
   // Notify handler that the compaction table is done.
@@ -1543,23 +1367,20 @@ void BytecodeReader::ParseCompactionTable() {
 // a derived type, then additional data is read to fill out the type
 // definition.
 const Type *BytecodeReader::ParseType() {
-  unsigned PrimType = 0;
-  if (read_typeid(PrimType))
-    error("Invalid type (type type) in type constants!");
-
+  unsigned PrimType = read_vbr_uint();
   const Type *Result = 0;
   if ((Result = Type::getPrimitiveType((Type::TypeID)PrimType)))
     return Result;
 
   switch (PrimType) {
   case Type::FunctionTyID: {
-    const Type *RetType = readSanitizedType();
+    const Type *RetType = readType();
 
     unsigned NumParams = read_vbr_uint();
 
     std::vector<const Type*> Params;
     while (NumParams--)
-      Params.push_back(readSanitizedType());
+      Params.push_back(readType());
 
     bool isVarArg = Params.size() && Params.back() == Type::VoidTy;
     if (isVarArg) Params.pop_back();
@@ -1568,34 +1389,30 @@ const Type *BytecodeReader::ParseType() {
     break;
   }
   case Type::ArrayTyID: {
-    const Type *ElementType = readSanitizedType();
+    const Type *ElementType = readType();
     unsigned NumElements = read_vbr_uint();
     Result =  ArrayType::get(ElementType, NumElements);
     break;
   }
   case Type::PackedTyID: {
-    const Type *ElementType = readSanitizedType();
+    const Type *ElementType = readType();
     unsigned NumElements = read_vbr_uint();
     Result =  PackedType::get(ElementType, NumElements);
     break;
   }
   case Type::StructTyID: {
     std::vector<const Type*> Elements;
-    unsigned Typ = 0;
-    if (read_typeid(Typ))
-      error("Invalid element type (type type) for structure!");
-
+    unsigned Typ = read_vbr_uint();
     while (Typ) {         // List is terminated by void/0 typeid
       Elements.push_back(getType(Typ));
-      if (read_typeid(Typ))
-        error("Invalid element type (type type) for structure!");
+      Typ = read_vbr_uint();
     }
 
     Result = StructType::get(Elements);
     break;
   }
   case Type::PointerTyID: {
-    Result = PointerType::get(readSanitizedType());
+    Result = PointerType::get(readType());
     break;
   }
 
@@ -1676,14 +1493,6 @@ inline unsigned BytecodeReader::upgradeCEOpcodes(
   if (!hasSignlessDivRem && !hasSignlessShrCastSetcc)
     return Opcode;
 
-#if 0
-  // If this is a bytecode format that did not include the unreachable
-  // instruction, bump up the opcode number to adjust it.
-  if (hasNoUnreachableInst)
-    if (Opcode >= 6 && Opcode < 62)
-      ++Opcode;
-#endif
-
   // If this is bytecode version 6, that only had signed Rem and Div 
   // instructions, then we must compensate for those two instructions only.
   // So that the switch statement below works, we're trying to turn this into
@@ -1805,46 +1614,39 @@ Value *BytecodeReader::ParseConstantPoolValue(unsigned TypeID) {
   unsigned isExprNumArgs = read_vbr_uint();
 
   if (isExprNumArgs) {
-    if (!hasNoUndefValue) {
-      // 'undef' is encoded with 'exprnumargs' == 1.
-      if (isExprNumArgs == 1)
-        return UndefValue::get(getType(TypeID));
-
-      // Inline asm is encoded with exprnumargs == ~0U.
-      if (isExprNumArgs == ~0U) {
-        std::string AsmStr = read_str();
-        std::string ConstraintStr = read_str();
-        unsigned Flags = read_vbr_uint();
-        
-        const PointerType *PTy = dyn_cast<PointerType>(getType(TypeID));
-        const FunctionType *FTy = 
-          PTy ? dyn_cast<FunctionType>(PTy->getElementType()) : 0;
-
-        if (!FTy || !InlineAsm::Verify(FTy, ConstraintStr))
-          error("Invalid constraints for inline asm");
-        if (Flags & ~1U)
-          error("Invalid flags for inline asm");
-        bool HasSideEffects = Flags & 1;
-        return InlineAsm::get(FTy, AsmStr, ConstraintStr, HasSideEffects);
-      }
+    // 'undef' is encoded with 'exprnumargs' == 1.
+    if (isExprNumArgs == 1)
+      return UndefValue::get(getType(TypeID));
+
+    // Inline asm is encoded with exprnumargs == ~0U.
+    if (isExprNumArgs == ~0U) {
+      std::string AsmStr = read_str();
+      std::string ConstraintStr = read_str();
+      unsigned Flags = read_vbr_uint();
       
-      --isExprNumArgs;
+      const PointerType *PTy = dyn_cast<PointerType>(getType(TypeID));
+      const FunctionType *FTy = 
+        PTy ? dyn_cast<FunctionType>(PTy->getElementType()) : 0;
+
+      if (!FTy || !InlineAsm::Verify(FTy, ConstraintStr))
+        error("Invalid constraints for inline asm");
+      if (Flags & ~1U)
+        error("Invalid flags for inline asm");
+      bool HasSideEffects = Flags & 1;
+      return InlineAsm::get(FTy, AsmStr, ConstraintStr, HasSideEffects);
     }
+    
+    --isExprNumArgs;
 
     // FIXME: Encoding of constant exprs could be much more compact!
     std::vector<Constant*> ArgVec;
     ArgVec.reserve(isExprNumArgs);
     unsigned Opcode = read_vbr_uint();
 
-    // Bytecode files before LLVM 1.4 need have a missing terminator inst.
-    if (hasNoUnreachableInst) Opcode++;
-
     // Read the slot number and types of each of the arguments
     for (unsigned i = 0; i != isExprNumArgs; ++i) {
       unsigned ArgValSlot = read_vbr_uint();
-      unsigned ArgTypeSlot = 0;
-      if (read_typeid(ArgTypeSlot))
-        error("Invalid argument type (type type) for constant value");
+      unsigned ArgTypeSlot = read_vbr_uint();
 
       // Get the arg value from its slot if it exists, otherwise a placeholder
       ArgVec.push_back(getConstantValue(ArgTypeSlot, ArgValSlot));
@@ -1863,20 +1665,6 @@ Value *BytecodeReader::ParseConstantPoolValue(unsigned TypeID) {
       return Result;
     } else if (Opcode == Instruction::GetElementPtr) { // GetElementPtr
       std::vector<Constant*> IdxList(ArgVec.begin()+1, ArgVec.end());
-
-      if (hasRestrictedGEPTypes) {
-        const Type *BaseTy = ArgVec[0]->getType();
-        generic_gep_type_iterator<std::vector<Constant*>::iterator>
-          GTI = gep_type_begin(BaseTy, IdxList.begin(), IdxList.end()),
-          E = gep_type_end(BaseTy, IdxList.begin(), IdxList.end());
-        for (unsigned i = 0; GTI != E; ++GTI, ++i)
-          if (isa<StructType>(*GTI)) {
-            if (IdxList[i]->getType() != Type::UByteTy)
-              error("Invalid index for getelementptr!");
-            IdxList[i] = ConstantExpr::getCast(IdxList[i], Type::UIntTy);
-          }
-      }
-
       Constant* Result = ConstantExpr::getGetElementPtr(ArgVec[0], IdxList);
       if (Handler) Handler->handleConstantExpression(Opcode, ArgVec, Result);
       return Result;
@@ -2068,9 +1856,7 @@ void BytecodeReader::ResolveReferencesToConstant(Constant *NewV, unsigned Typ,
 /// Parse the constant strings section.
 void BytecodeReader::ParseStringConstants(unsigned NumEntries, ValueTable &Tab){
   for (; NumEntries; --NumEntries) {
-    unsigned Typ = 0;
-    if (read_typeid(Typ))
-      error("Invalid type (type type) for string constant");
+    unsigned Typ = read_vbr_uint();
     const Type *Ty = getType(Typ);
     if (!isa<ArrayType>(Ty))
       error("String constant data invalid!");
@@ -2106,22 +1892,16 @@ void BytecodeReader::ParseConstantPool(ValueTable &Tab,
   /// In LLVM 1.3 Type does not derive from Value so the types
   /// do not occupy a plane. Consequently, we read the types
   /// first in the constant pool.
-  if (isFunction && !hasTypeDerivedFromValue) {
+  if (isFunction) {
     unsigned NumEntries = read_vbr_uint();
     ParseTypes(TypeTab, NumEntries);
   }
 
   while (moreInBlock()) {
     unsigned NumEntries = read_vbr_uint();
-    unsigned Typ = 0;
-    bool isTypeType = read_typeid(Typ);
-
-    /// In LLVM 1.2 and before, Types were written to the
-    /// bytecode file in the "Type Type" plane (#12).
-    /// In 1.3 plane 12 is now the label plane.  Handle this here.
-    if (isTypeType) {
-      ParseTypes(TypeTab, NumEntries);
-    } else if (Typ == Type::VoidTyID) {
+    unsigned Typ = read_vbr_uint();
+
+    if (Typ == Type::VoidTyID) {
       /// Use of Type::VoidTyID is a misnomer. It actually means
       /// that the following plane is constant strings
       assert(&Tab == &ModuleValues && "Cannot read strings in functions!");
@@ -2213,20 +1993,6 @@ void BytecodeReader::ParseFunctionBody(Function* F) {
       ParseCompactionTable();
       break;
 
-    case BytecodeFormat::BasicBlock: {
-      if (!InsertedArguments) {
-        // Insert arguments into the value table before we parse the first basic
-        // block in the function, but after we potentially read in the
-        // compaction table.
-        insertArguments(F);
-        InsertedArguments = true;
-      }
-
-      BasicBlock *BB = ParseBasicBlock(BlockNum++);
-      F->getBasicBlockList().push_back(BB);
-      break;
-    }
-
     case BytecodeFormat::InstructionListBlockID: {
       // Insert arguments into the value table before we parse the instruction
       // list for the function, but after we potentially read in the compaction
@@ -2253,9 +2019,6 @@ void BytecodeReader::ParseFunctionBody(Function* F) {
author	Reid Spencer <rspencer@reidspencer.com>	2006-11-14 04:47:22 +0000
committer	Reid Spencer <rspencer@reidspencer.com>	2006-11-14 04:47:22 +0000
commit	d798a515e93e1ac323ecff8dc6c0b0567c252e36 (patch)
tree	d5c74b60fe1e0c2615b3cbddc6ce781df6016ab1
parent	df1a10ece6a75f230d98c6fb001349eede90387a (diff)