R600/SI: Use S_ADD_U32 and S_SUB_U32 for low half of 64-bit operations

author Tom Stellard <thomas.stellard@amd.com>

Fri, 5 Sep 2014 14:07:59 +0000 (14:07 +0000)

committer Tom Stellard <thomas.stellard@amd.com>

Fri, 5 Sep 2014 14:07:59 +0000 (14:07 +0000)
author Tom Stellard <thomas.stellard@amd.com>
Fri, 5 Sep 2014 14:07:59 +0000 (14:07 +0000)
committer Tom Stellard <thomas.stellard@amd.com>
Fri, 5 Sep 2014 14:07:59 +0000 (14:07 +0000)
diff --git a/lib/Target/R600/AMDGPUISelDAGToDAG.cpp b/lib/Target/R600/AMDGPUISelDAGToDAG.cpp

index b988d33ffbfe167b146eea46d3dfbf48743847cb..ed86a18e5cb2c252dfc159899cb4b431a4871b0c 100644 (file)
--- a/lib/Target/R600/AMDGPUISelDAGToDAG.cpp
+++ b/lib/Target/R600/AMDGPUISelDAGToDAG.cpp
@@ -701,7 +701,7 @@ SDNode *AMDGPUDAGToDAGISel::SelectADD_SUB_I64(SDNode *N) {
    SDValue AddLoArgs[] = { SDValue(Lo0, 0), SDValue(Lo1, 0) };
  
  
-  unsigned Opc = IsAdd ? AMDGPU::S_ADD_I32 : AMDGPU::S_SUB_I32;
+  unsigned Opc = IsAdd ? AMDGPU::S_ADD_U32 : AMDGPU::S_SUB_U32;
    unsigned CarryOpc = IsAdd ? AMDGPU::S_ADDC_U32 : AMDGPU::S_SUBB_U32;
  
    if (!isCFDepth0()) {
diff --git a/lib/Target/R600/SIInstrInfo.cpp b/lib/Target/R600/SIInstrInfo.cpp

index 73320a5235f50a16262fc00d7ca00e461aa1aaf9..11aaf45fe3294f7000327a1e4c3e54b2b894b240 100644 (file)
--- a/lib/Target/R600/SIInstrInfo.cpp
+++ b/lib/Target/R600/SIInstrInfo.cpp
@@ -494,7 +494,7 @@ bool SIInstrInfo::expandPostRAPseudo(MachineBasicBlock::iterator MI) const {
      BuildMI(MBB, MI, DL, get(AMDGPU::S_GETPC_B64), Reg);
  
      // Add 32-bit offset from this instruction to the start of the constant data.
-    BuildMI(MBB, MI, DL, get(AMDGPU::S_ADD_I32), RegLo)
+    BuildMI(MBB, MI, DL, get(AMDGPU::S_ADD_U32), RegLo)
              .addReg(RegLo)
              .addTargetIndex(AMDGPU::TI_CONSTDATA_START)
              .addReg(AMDGPU::SCC, RegState::Define | RegState::Implicit);
@@ -904,9 +904,11 @@ unsigned SIInstrInfo::getVALUOp(const MachineInstr &MI) {
    case AMDGPU::S_MOV_B32:
      return MI.getOperand(1).isReg() ?
             AMDGPU::COPY : AMDGPU::V_MOV_B32_e32;
-  case AMDGPU::S_ADD_I32: return AMDGPU::V_ADD_I32_e32;
+  case AMDGPU::S_ADD_I32:
+  case AMDGPU::S_ADD_U32: return AMDGPU::V_ADD_I32_e32;
    case AMDGPU::S_ADDC_U32: return AMDGPU::V_ADDC_U32_e32;
-  case AMDGPU::S_SUB_I32: return AMDGPU::V_SUB_I32_e32;
+  case AMDGPU::S_SUB_I32:
+  case AMDGPU::S_SUB_U32: return AMDGPU::V_SUB_I32_e32;
    case AMDGPU::S_SUBB_U32: return AMDGPU::V_SUBB_U32_e32;
    case AMDGPU::S_MUL_I32: return AMDGPU::V_MUL_LO_I32;
    case AMDGPU::S_AND_B32: return AMDGPU::V_AND_B32_e32;
diff --git a/lib/Target/R600/SIInstructions.td b/lib/Target/R600/SIInstructions.td

index f091c272379c4c06ec1c55d95b260a117bf9a4b7..56de9db372a1f3df7eca07de2817f51ffc73788b 100644 (file)
--- a/lib/Target/R600/SIInstructions.td
+++ b/lib/Target/R600/SIInstructions.td
@@ -1858,11 +1858,11 @@ def : Pat <
  // SOP2 Patterns
  //===----------------------------------------------------------------------===//
  
-// V_ADD_I32_e32/S_ADD_I32 produces carry in VCC/SCC. For the vector
+// V_ADD_I32_e32/S_ADD_U32 produces carry in VCC/SCC. For the vector
  // case, the sgpr-copies pass will fix this to use the vector version.
  def : Pat <
    (i32 (addc i32:$src0, i32:$src1)),
-  (S_ADD_I32 $src0, $src1)
+  (S_ADD_U32 $src0, $src1)
  >;
  
  } // Predicates = [isSI, isCFDepth0]
diff --git a/test/CodeGen/R600/add.ll b/test/CodeGen/R600/add.ll

index 711a2bc417741b06f2a04f17838c4f8b8307bd99..f62c9d6bd64de68f88998afb2674dc6cfe08c4e3 100644 (file)
--- a/test/CodeGen/R600/add.ll
+++ b/test/CodeGen/R600/add.ll
@@ -117,7 +117,7 @@ entry:
  }
  
  ; FUNC-LABEL: @add64
-; SI-CHECK: S_ADD_I32
+; SI-CHECK: S_ADD_U32
  ; SI-CHECK: S_ADDC_U32
  define void @add64(i64 addrspace(1)* %out, i64 %a, i64 %b) {
  entry:
diff --git a/test/CodeGen/R600/add_i64.ll b/test/CodeGen/R600/add_i64.ll

index dac4f173e3163bd944fa274391365f1473a35f58..5be969ce568c116250bc8bcff3bc2998227bc397 100644 (file)
--- a/test/CodeGen/R600/add_i64.ll
+++ b/test/CodeGen/R600/add_i64.ll
@@ -43,9 +43,9 @@ define void @sgpr_operand_reversed(i64 addrspace(1)* noalias %out, i64 addrspace
  
  
  ; SI-LABEL: @test_v2i64_sreg:
-; SI: S_ADD_I32
+; SI: S_ADD_U32
  ; SI: S_ADDC_U32
-; SI: S_ADD_I32
+; SI: S_ADD_U32
  ; SI: S_ADDC_U32
  define void @test_v2i64_sreg(<2 x i64> addrspace(1)* noalias %out, <2 x i64> %a, <2 x i64> %b) {
    %result = add <2 x i64> %a, %b
diff --git a/test/CodeGen/R600/ssubo.ll b/test/CodeGen/R600/ssubo.ll

index b330276ae9e76cf0d82eddf8d791bcd06b067f6c..066cdf5cd93fcea1521549bc6dd5cebc00978f38 100644 (file)
--- a/test/CodeGen/R600/ssubo.ll
+++ b/test/CodeGen/R600/ssubo.ll
@@ -38,7 +38,7 @@ define void @v_ssubo_i32(i32 addrspace(1)* %out, i1 addrspace(1)* %carryout, i32
  }
  
  ; FUNC-LABEL: @s_ssubo_i64
-; SI: S_SUB_I32
+; SI: S_SUB_U32
  ; SI: S_SUBB_U32
  define void @s_ssubo_i64(i64 addrspace(1)* %out, i1 addrspace(1)* %carryout, i64 %a, i64 %b) nounwind {
    %ssub = call { i64, i1 } @llvm.ssub.with.overflow.i64(i64 %a, i64 %b) nounwind
diff --git a/test/CodeGen/R600/sub.ll b/test/CodeGen/R600/sub.ll

index 8e64148142d22a96e7af102d52a99610658a977f..a8196a0ea4df94740bdb47a2a84da528a1d81798 100644 (file)
--- a/test/CodeGen/R600/sub.ll
+++ b/test/CodeGen/R600/sub.ll
@@ -40,7 +40,7 @@ define void @test4(<4 x i32> addrspace(1)* %out, <4 x i32> addrspace(1)* %in) {
  }
  
  ; FUNC-LABEL: @s_sub_i64:
-; SI: S_SUB_I32
+; SI: S_SUB_U32
  ; SI: S_SUBB_U32
  
  ; EG-DAG: SETGE_UINT
diff --git a/test/CodeGen/R600/trunc.ll b/test/CodeGen/R600/trunc.ll

index 4a278fbcce05dcf65cf3f2a77b4605575a986991..f635ac2e0018eb634994c4cd2d9b4762043b6763 100644 (file)
--- a/test/CodeGen/R600/trunc.ll
+++ b/test/CodeGen/R600/trunc.ll
@@ -31,7 +31,7 @@ define void @trunc_load_shl_i64(i32 addrspace(1)* %out, i64 %a) {
  
  ; SI-LABEL: @trunc_shl_i64:
  ; SI: S_LOAD_DWORDX2 s{{\[}}[[LO_SREG:[0-9]+]]:{{[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0xd
-; SI: S_ADD_I32 s[[LO_SREG2:[0-9]+]], s[[LO_SREG]],
+; SI: S_ADD_U32 s[[LO_SREG2:[0-9]+]], s[[LO_SREG]],
  ; SI: S_ADDC_U32
  ; SI: S_LSHL_B64 s{{\[}}[[LO_SHL:[0-9]+]]:{{[0-9]+\]}}, s{{\[}}[[LO_SREG2]]:{{[0-9]+\]}}, 2
  ; SI: V_MOV_B32_e32 v[[LO_VREG:[0-9]+]], s[[LO_SHL]]
diff --git a/test/CodeGen/R600/uaddo.ll b/test/CodeGen/R600/uaddo.ll

index a80e502eef2a0f6d874da3de3cdee7f59a430815..0b854b543a5a4811ec2b8a14c0c83ed1bf57c20f 100644 (file)
--- a/test/CodeGen/R600/uaddo.ll
+++ b/test/CodeGen/R600/uaddo.ll
@@ -43,7 +43,7 @@ define void @v_uaddo_i32(i32 addrspace(1)* %out, i1 addrspace(1)* %carryout, i32
  }
  
  ; FUNC-LABEL: @s_uaddo_i64
-; SI: S_ADD_I32
+; SI: S_ADD_U32
  ; SI: S_ADDC_U32
  define void @s_uaddo_i64(i64 addrspace(1)* %out, i1 addrspace(1)* %carryout, i64 %a, i64 %b) nounwind {
    %uadd = call { i64, i1 } @llvm.uadd.with.overflow.i64(i64 %a, i64 %b) nounwind
diff --git a/test/CodeGen/R600/usubo.ll b/test/CodeGen/R600/usubo.ll

index d57a2c7f773eca64bc52d39e3c2bfadfa87d27a3..c293ad78e068d72428670645bdee38bb7a3df9b3 100644 (file)
--- a/test/CodeGen/R600/usubo.ll
+++ b/test/CodeGen/R600/usubo.ll
@@ -40,7 +40,7 @@ define void @v_usubo_i32(i32 addrspace(1)* %out, i1 addrspace(1)* %carryout, i32
  }
  
  ; FUNC-LABEL: @s_usubo_i64
-; SI: S_SUB_I32
+; SI: S_SUB_U32
  ; SI: S_SUBB_U32
  define void @s_usubo_i64(i64 addrspace(1)* %out, i1 addrspace(1)* %carryout, i64 %a, i64 %b) nounwind {
    %usub = call { i64, i1 } @llvm.usub.with.overflow.i64(i64 %a, i64 %b) nounwind
author	Tom Stellard <thomas.stellard@amd.com>
	Fri, 5 Sep 2014 14:07:59 +0000 (14:07 +0000)
committer	Tom Stellard <thomas.stellard@amd.com>
	Fri, 5 Sep 2014 14:07:59 +0000 (14:07 +0000)
lib/Target/R600/AMDGPUISelDAGToDAG.cpp		patch | blob | history
lib/Target/R600/SIInstrInfo.cpp		patch | blob | history
lib/Target/R600/SIInstructions.td		patch | blob | history
test/CodeGen/R600/add.ll		patch | blob | history
test/CodeGen/R600/add_i64.ll		patch | blob | history
test/CodeGen/R600/ssubo.ll		patch | blob | history
test/CodeGen/R600/sub.ll		patch | blob | history
test/CodeGen/R600/trunc.ll		patch | blob | history
test/CodeGen/R600/uaddo.ll		patch | blob | history
test/CodeGen/R600/usubo.ll		patch | blob | history