Add SSE4A MOVNTSS/MOVNTSD instructions.
author Craig Topper <craig.topper@gmail.com>
Mon, 7 May 2012 05:36:19 +0000 (05:36 +0000)
committer Craig Topper <craig.topper@gmail.com>
Mon, 7 May 2012 05:36:19 +0000 (05:36 +0000)
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@156281 91177308-0d34-0410-b5e6-96231b3b80d8

include/llvm/IntrinsicsX86.td
lib/Target/X86/X86InstrSSE.td
test/CodeGen/X86/sse4a.ll [new file with mode: 0644]

index cb7b3eadc8707436974b7c76352e487cceb7a407..1abeb9e5559904932a30bb877b9140a227224afe 100644 (file)
@@ -1004,6 +1004,16 @@ let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
         [IntrNoMem]>;
 }
 
+//===----------------------------------------------------------------------===//
+// SSE4A: movnt.ss / movnt.sd intrinsics (void; operands: pointer, vector).
+
+let TargetPrefix = "x86" in {  // All intrinsics start with "llvm.x86.".
+  def int_x86_sse4a_movnt_ss : GCCBuiltin<"__builtin_ia32_movntss">,
+    Intrinsic<[], [llvm_ptr_ty, llvm_v4f32_ty], []>;
+  def int_x86_sse4a_movnt_sd : GCCBuiltin<"__builtin_ia32_movntsd">,
+    Intrinsic<[], [llvm_ptr_ty, llvm_v2f64_ty], []>;
+}
+
 //===----------------------------------------------------------------------===//
 // AVX
 
index aa3e08bd4dc537581c0252d8324ffda3551d3130..0a940552453a87dc1034105d23a6ded958f0e3bb 100644 (file)
@@ -7270,6 +7270,20 @@ defm : pclmul_alias<"hqlq", 0x01>;
 defm : pclmul_alias<"lqhq", 0x10>;
 defm : pclmul_alias<"lqlq", 0x00>;
 
+//===----------------------------------------------------------------------===//
+// SSE4A Instructions: MOVNTSS / MOVNTSD, matched from the movnt intrinsics.
+//===----------------------------------------------------------------------===//
+
+let Predicates = [HasSSE4A] in {  // Both defs below are gated on HasSSE4A.
+def MOVNTSS : I<0x2B, MRMDestMem, (outs), (ins f32mem:$dst, VR128:$src),
+                "movntss\t{$src, $dst|$dst, $src}",
+                [(int_x86_sse4a_movnt_ss addr:$dst, VR128:$src)]>, XS;
+
+def MOVNTSD : I<0x2B, MRMDestMem, (outs), (ins f64mem:$dst, VR128:$src),
+                "movntsd\t{$src, $dst|$dst, $src}",
+                [(int_x86_sse4a_movnt_sd addr:$dst, VR128:$src)]>, XD;
+}
+
 //===----------------------------------------------------------------------===//
 // AVX Instructions
 //===----------------------------------------------------------------------===//
diff --git a/test/CodeGen/X86/sse4a.ll b/test/CodeGen/X86/sse4a.ll
new file mode 100644 (file)
index 0000000..0732353
--- /dev/null
@@ -0,0 +1,19 @@
+; RUN: llc < %s -mtriple=i686-apple-darwin9 -mattr=sse4a | FileCheck %s
+; Check that the SSE4A movnt.ss/movnt.sd intrinsics emit movntss/movntsd.
+define void @test1(float* %p, <4 x float> %a) nounwind optsize ssp {
+; CHECK: movntss
+entry:
+  tail call void @llvm.x86.sse4a.movnt.ss(float* %p, <4 x float> %a) nounwind
+  ret void
+}
+
+declare void @llvm.x86.sse4a.movnt.ss(float*, <4 x float>)
+
+define void @test2(double* %p, <2 x double> %a) nounwind optsize ssp {
+; CHECK: movntsd
+entry:
+  tail call void @llvm.x86.sse4a.movnt.sd(double* %p, <2 x double> %a) nounwind
+  ret void
+}
+
+declare void @llvm.x86.sse4a.movnt.sd(double*, <2 x double>)