[NVPTX] Add missing .v4 qualifier on vector store instruction
authorJustin Holewinski <jholewinski@nvidia.com>
Thu, 17 Jul 2014 16:58:56 +0000 (16:58 +0000)
committerJustin Holewinski <jholewinski@nvidia.com>
Thu, 17 Jul 2014 16:58:56 +0000 (16:58 +0000)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213276 91177308-0d34-0410-b5e6-96231b3b80d8

lib/Target/NVPTX/NVPTXInstrInfo.td
test/CodeGen/NVPTX/vector-call.ll [new file with mode: 0644]

index d2c0373b9998f8675bc4921536a141ce596aad80..5919fe1c01652a78cc519782dd61374290e83216 100644 (file)
@@ -1917,7 +1917,7 @@ def StoreParamV2I8   : StoreParamV2Inst<Int16Regs, ".b8">;
 def StoreParamV4I32    : NVPTXInst<(outs), (ins Int32Regs:$val, Int32Regs:$val2,
                                                Int32Regs:$val3, Int32Regs:$val4,
                                                 i32imm:$a, i32imm:$b),
-                   "st.param.b32\t[param$a+$b], {{$val, $val2, $val3, $val4}};",
+                "st.param.v4.b32\t[param$a+$b], {{$val, $val2, $val3, $val4}};",
                          []>;
 
 def StoreParamV4I16    : NVPTXInst<(outs), (ins Int16Regs:$val, Int16Regs:$val2,
diff --git a/test/CodeGen/NVPTX/vector-call.ll b/test/CodeGen/NVPTX/vector-call.ll
new file mode 100644 (file)
index 0000000..a03d7fd
--- /dev/null
@@ -0,0 +1,12 @@
+; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s
+
+target triple = "nvptx-unknown-cuda"
+
+declare void @bar(<4 x i32>)
+
+; CHECK-LABEL @foo
+define void @foo(<4 x i32> %a) {
+; CHECK: st.param.v4.b32
+  tail call void @bar(<4 x i32> %a)
+  ret void
+}