Enable streaming of bitcode

[oota-llvm.git] / lib / Target / X86 / Disassembler / X86DisassemblerDecoder.c
diff --git a/lib/Target/X86/Disassembler/X86DisassemblerDecoder.c b/lib/Target/X86/Disassembler/X86DisassemblerDecoder.c

index 8a88955561283549015eddf033906e667cc32bea..958f653eb736bc61313cb2c3d4e8320a59011752 100644 (file)
--- a/lib/Target/X86/Disassembler/X86DisassemblerDecoder.c
+++ b/lib/Target/X86/Disassembler/X86DisassemblerDecoder.c
@@ -103,12 +103,9 @@ static InstrUID decode(OpcodeType type,
                         InstructionContext insnContext,
                         uint8_t opcode,
                         uint8_t modRM) {
-  const struct ModRMDecision* dec;
+  const struct ModRMDecision* dec = 0;
    
    switch (type) {
-  default:
-    debug("Unknown opcode type");
-    return 0;
    case ONEBYTE:
      dec = &ONEBYTE_SYM.opcodeDecisions[insnContext].modRMDecisions[opcode];
      break;
@@ -406,12 +403,14 @@ static int readPrefixes(struct InternalInstruction* insn) {
        consumeByte(insn, &insn->vexPrefix[2]);
  
        /* We simulate the REX prefix for simplicity's sake */
-    
-      insn->rexPrefix = 0x40 
-                      | (wFromVEX3of3(insn->vexPrefix[2]) << 3)
-                      | (rFromVEX2of3(insn->vexPrefix[1]) << 2)
-                      | (xFromVEX2of3(insn->vexPrefix[1]) << 1)
-                      | (bFromVEX2of3(insn->vexPrefix[1]) << 0);
+   
+      if (insn->mode == MODE_64BIT) {
+        insn->rexPrefix = 0x40 
+                        | (wFromVEX3of3(insn->vexPrefix[2]) << 3)
+                        | (rFromVEX2of3(insn->vexPrefix[1]) << 2)
+                        | (xFromVEX2of3(insn->vexPrefix[1]) << 1)
+                        | (bFromVEX2of3(insn->vexPrefix[1]) << 0);
+      }
      
        switch (ppFromVEX3of3(insn->vexPrefix[2]))
        {
@@ -444,8 +443,10 @@ static int readPrefixes(struct InternalInstruction* insn) {
        insn->vexPrefix[0] = byte;
        consumeByte(insn, &insn->vexPrefix[1]);
          
-      insn->rexPrefix = 0x40 
-                      | (rFromVEX2of2(insn->vexPrefix[1]) << 2);
+      if (insn->mode == MODE_64BIT) {
+        insn->rexPrefix = 0x40 
+                        | (rFromVEX2of2(insn->vexPrefix[1]) << 2);
+      }
          
        switch (ppFromVEX2of2(insn->vexPrefix[1]))
        {
@@ -699,34 +700,6 @@ static BOOL is16BitEquvalent(const char* orig, const char* equiv) {
    }
  }
  
-/*
- * is64BitEquivalent - Determines whether two instruction names refer to
- * equivalent instructions but one is 64-bit whereas the other is not.
- *
- * @param orig  - The instruction that is not 64-bit
- * @param equiv - The instruction that is 64-bit
- */
-static BOOL is64BitEquivalent(const char* orig, const char* equiv) {
-  off_t i;
-  
-  for (i = 0;; i++) {
-    if (orig[i] == '\0' && equiv[i] == '\0')
-      return TRUE;
-    if (orig[i] == '\0' || equiv[i] == '\0')
-      return FALSE;
-    if (orig[i] != equiv[i]) {
-      if ((orig[i] == 'W' || orig[i] == 'L') && equiv[i] == 'Q')
-        continue;
-      if ((orig[i] == '1' || orig[i] == '3') && equiv[i] == '6')
-        continue;
-      if ((orig[i] == '6' || orig[i] == '2') && equiv[i] == '4')
-        continue;
-      return FALSE;
-    }
-  }
-}
-
-
  /*
   * getID - Determines the ID of an instruction, consuming the ModR/M byte as 
   *   appropriate for extended and escape opcodes.  Determines the attributes and 
@@ -763,8 +736,6 @@ static int getID(struct InternalInstruction* insn) {
          break;
        }
      
-      if (wFromVEX3of3(insn->vexPrefix[2]))
-        attrMask |= ATTR_REXW;
        if (lFromVEX3of3(insn->vexPrefix[2]))
          attrMask |= ATTR_VEXL;
      }
@@ -789,63 +760,58 @@ static int getID(struct InternalInstruction* insn) {
      }
    }
    else {
-    if (insn->rexPrefix & 0x08)
-      attrMask |= ATTR_REXW;
-  
      if (isPrefixAtLocation(insn, 0x66, insn->necessaryPrefixLocation))
        attrMask |= ATTR_OPSIZE;
      else if (isPrefixAtLocation(insn, 0xf3, insn->necessaryPrefixLocation))
        attrMask |= ATTR_XS;
      else if (isPrefixAtLocation(insn, 0xf2, insn->necessaryPrefixLocation))
        attrMask |= ATTR_XD;
-    
    }
  
+  if (insn->rexPrefix & 0x08)
+    attrMask |= ATTR_REXW;
+
    if (getIDWithAttrMask(&instructionID, insn, attrMask))
      return -1;
-  
+
    /* The following clauses compensate for limitations of the tables. */
-  
-  if ((attrMask & ATTR_XD) && (attrMask & ATTR_REXW)) {
+
+  if ((attrMask & ATTR_VEXL) && (attrMask & ATTR_REXW) &&
+      !(attrMask & ATTR_OPSIZE)) {
      /*
-     * Although for SSE instructions it is usually necessary to treat REX.W+F2
-     * as F2 for decode (in the absence of a 64BIT_REXW_XD category) there is
-     * an occasional instruction where F2 is incidental and REX.W is the more
-     * significant.  If the decoded instruction is 32-bit and adding REX.W
-     * instead of F2 changes a 32 to a 64, we adopt the new encoding.
+     * Some VEX instructions ignore the L-bit, but use the W-bit. Normally L-bit
+     * has precedence since there are no L-bit with W-bit entries in the tables.
+     * So if the L-bit isn't significant we should use the W-bit instead.
+     * We only need to do this if the instruction doesn't specify OpSize since
+     * there is a VEX_L_W_OPSIZE table.
       */
-    
+
      const struct InstructionSpecifier *spec;
-    uint16_t instructionIDWithREXw;
-    const struct InstructionSpecifier *specWithREXw;
-    
+    uint16_t instructionIDWithWBit;
+    const struct InstructionSpecifier *specWithWBit;
+
      spec = specifierForUID(instructionID);
-    
-    if (getIDWithAttrMask(&instructionIDWithREXw,
+
+    if (getIDWithAttrMask(&instructionIDWithWBit,
                            insn,
-                          attrMask & (~ATTR_XD))) {
-      /*
-       * Decoding with REX.w would yield nothing; give up and return original
-       * decode.
-       */
-      
+                          (attrMask & (~ATTR_VEXL)) | ATTR_REXW)) {
        insn->instructionID = instructionID;
        insn->spec = spec;
        return 0;
      }
-    
-    specWithREXw = specifierForUID(instructionIDWithREXw);
-    
-    if (is64BitEquivalent(spec->name, specWithREXw->name)) {
-      insn->instructionID = instructionIDWithREXw;
-      insn->spec = specWithREXw;
+
+    specWithWBit = specifierForUID(instructionIDWithWBit);
+
+    if (instructionID != instructionIDWithWBit) {
+      insn->instructionID = instructionIDWithWBit;
+      insn->spec = specWithWBit;
      } else {
        insn->instructionID = instructionID;
        insn->spec = spec;
      }
      return 0;
    }
-  
+
    if (insn->prefixPresent[0x66] && !(attrMask & ATTR_OPSIZE)) {
      /*
       * The instruction tables make no distinction between instructions that
@@ -899,7 +865,7 @@ static int getID(struct InternalInstruction* insn) {
  
      spec = specifierForUID(instructionID);
      
-    // Borrow opcode from one of the other XCHGar opcodes
+    /* Borrow opcode from one of the other XCHGar opcodes */
      insn->opcode = 0x91;
     
      if (getIDWithAttrMask(&instructionIDWithNewOpcode,
@@ -914,7 +880,7 @@ static int getID(struct InternalInstruction* insn) {
  
      specWithNewOpcode = specifierForUID(instructionIDWithNewOpcode);
  
-    // Change back 
+    /* Change back */
      insn->opcode = 0x90;
  
      insn->instructionID = instructionIDWithNewOpcode;
@@ -1487,6 +1453,9 @@ static int readVVVV(struct InternalInstruction* insn) {
    else
      return -1;
  
+  if (insn->mode != MODE_64BIT)
+    insn->vvvv &= 0x7;
+
    return 0;
  }
  
@@ -1500,6 +1469,7 @@ static int readVVVV(struct InternalInstruction* insn) {
  static int readOperands(struct InternalInstruction* insn) {
    int index;
    int hasVVVV, needVVVV;
+  int sawRegImm = 0;
    
    dbgprintf(insn, "readOperands()");
  
@@ -1528,11 +1498,22 @@ static int readOperands(struct InternalInstruction* insn) {
        dbgprintf(insn, "We currently don't hande code-offset encodings");
        return -1;
      case ENCODING_IB:
+      if (sawRegImm) {
+        /* Saw a register immediate so don't read again and instead split the
+           previous immediate.  FIXME: This is a hack. */
+        insn->immediates[insn->numImmediatesConsumed] =
+          insn->immediates[insn->numImmediatesConsumed - 1] & 0xf;
+        ++insn->numImmediatesConsumed;
+        break;
+      }
        if (readImmediate(insn, 1))
          return -1;
        if (insn->spec->operands[index].type == TYPE_IMM3 &&
            insn->immediates[insn->numImmediatesConsumed - 1] > 7)
          return -1;
+      if (insn->spec->operands[index].type == TYPE_XMM128 ||
+          insn->spec->operands[index].type == TYPE_XMM256)
+        sawRegImm = 1;
        break;
      case ENCODING_IW:
        if (readImmediate(insn, 2))