1 ; RUN: llc -march=r600 -mcpu=cypress < %s | FileCheck -check-prefix=EG -check-prefix=FUNC %s
2 ; RUN: llc -march=r600 -mcpu=SI -verify-machineinstrs< %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
; Test case: read 32 bits through an i8 addrspace(1) pointer and write them
; back out as a <4 x i8> vector.
;   %out - i8 addrspace(1) pointer the vector is stored through
;   %src - i8 addrspace(1) pointer the 32-bit value is loaded through
; Both the load and the store are marked align 1.
; Only the function label check is visible for this case in this view.
4 ; FUNC-LABEL: @anyext_load_i8:
7 define void @anyext_load_i8(i8 addrspace(1)* nocapture noalias %out, i8 addrspace(1)* nocapture noalias %src) nounwind {
; Reinterpret the byte pointer as an i32 pointer so a single load covers four bytes.
8 %cast = bitcast i8 addrspace(1)* %src to i32 addrspace(1)*
9 %load = load i32 addrspace(1)* %cast, align 1
; Same 32 bits, now typed as four i8 lanes.
10 %x = bitcast i32 %load to <4 x i8>
; Reinterpret the destination pointer to match the vector type being stored.
11 %castOut = bitcast i8 addrspace(1)* %out to <4 x i8> addrspace(1)*
12 store <4 x i8> %x, <4 x i8> addrspace(1)* %castOut, align 1
; Test case: read 32 bits through an i16 addrspace(1) pointer and write them
; back out as a <2 x i16> vector.
;   %out - i16 addrspace(1) pointer the vector is stored through
;   %src - i16 addrspace(1) pointer the 32-bit value is loaded through
; Both the load and the store are marked align 1.
; Only the function label check is visible for this case in this view.
16 ; FUNC-LABEL: @anyext_load_i16:
21 define void @anyext_load_i16(i16 addrspace(1)* nocapture noalias %out, i16 addrspace(1)* nocapture noalias %src) nounwind {
; Reinterpret the i16 pointer as an i32 pointer so a single load covers two halfwords.
22 %cast = bitcast i16 addrspace(1)* %src to i32 addrspace(1)*
23 %load = load i32 addrspace(1)* %cast, align 1
; Same 32 bits, now typed as two i16 lanes.
24 %x = bitcast i32 %load to <2 x i16>
; Reinterpret the destination pointer to match the vector type being stored.
25 %castOut = bitcast i16 addrspace(1)* %out to <2 x i16> addrspace(1)*
26 store <2 x i16> %x, <2 x i16> addrspace(1)* %castOut, align 1
; Test case: same shape as the i8 addrspace(1) case, but every pointer is in
; addrspace(3) (the "lds" variant, per the function name).
;   %out - i8 addrspace(3) pointer the <4 x i8> vector is stored through
;   %src - i8 addrspace(3) pointer the 32-bit value is loaded through
; Both the load and the store are marked align 1.
; Only the function label check is visible for this case in this view.
30 ; FUNC-LABEL: @anyext_load_lds_i8:
33 define void @anyext_load_lds_i8(i8 addrspace(3)* nocapture noalias %out, i8 addrspace(3)* nocapture noalias %src) nounwind {
; Reinterpret the byte pointer as an i32 pointer so a single load covers four bytes.
34 %cast = bitcast i8 addrspace(3)* %src to i32 addrspace(3)*
35 %load = load i32 addrspace(3)* %cast, align 1
; Same 32 bits, now typed as four i8 lanes.
36 %x = bitcast i32 %load to <4 x i8>
; Reinterpret the destination pointer to match the vector type being stored.
37 %castOut = bitcast i8 addrspace(3)* %out to <4 x i8> addrspace(3)*
38 store <4 x i8> %x, <4 x i8> addrspace(3)* %castOut, align 1
; Test case: same shape as the i16 addrspace(1) case, but every pointer is in
; addrspace(3) (the "lds" variant, per the function name).
;   %out - i16 addrspace(3) pointer the <2 x i16> vector is stored through
;   %src - i16 addrspace(3) pointer the 32-bit value is loaded through
; Both the load and the store are marked align 1.
; Only the function label check is visible for this case in this view.
42 ; FUNC-LABEL: @anyext_load_lds_i16:
47 define void @anyext_load_lds_i16(i16 addrspace(3)* nocapture noalias %out, i16 addrspace(3)* nocapture noalias %src) nounwind {
; Reinterpret the i16 pointer as an i32 pointer so a single load covers two halfwords.
48 %cast = bitcast i16 addrspace(3)* %src to i32 addrspace(3)*
49 %load = load i32 addrspace(3)* %cast, align 1
; Same 32 bits, now typed as two i16 lanes.
50 %x = bitcast i32 %load to <2 x i16>
; Reinterpret the destination pointer to match the vector type being stored.
51 %castOut = bitcast i16 addrspace(3)* %out to <2 x i16> addrspace(3)*
52 store <2 x i16> %x, <2 x i16> addrspace(3)* %castOut, align 1
; Test case: load an i8 from addrspace(1), sign-extend it to i64, and store
; the i64 to addrspace(1).
;   %out - i64 addrspace(1) destination pointer
;   %in  - i8 addrspace(1) source pointer
; The SI checks below expect, in order: a signed-byte buffer load into a VGPR
; (captured as LOAD), an arithmetic shift right by 31 of that register, and a
; two-dword buffer store.
; The shift by 31 presumably produces the high 32 bits of the result - confirm
; against the backend lowering.
56 ; FUNC-LABEL: @sextload_global_i8_to_i64
57 ; SI: BUFFER_LOAD_SBYTE [[LOAD:v[0-9]+]],
58 ; SI: V_ASHRREV_I32_e32 v{{[0-9]+}}, 31, [[LOAD]]
59 ; SI: BUFFER_STORE_DWORDX2
60 define void @sextload_global_i8_to_i64(i64 addrspace(1)* %out, i8 addrspace(1)* %in) nounwind {
; NOTE(review): the i8 load is annotated align 8, as is the i64 store.
61 %a = load i8 addrspace(1)* %in, align 8
62 %ext = sext i8 %a to i64
63 store i64 %ext, i64 addrspace(1)* %out, align 8
; Test case: load an i16 from addrspace(1), sign-extend it to i64, and store
; the i64 to addrspace(1).
;   %out - i64 addrspace(1) destination pointer
;   %in  - i16 addrspace(1) source pointer
; The SI checks below expect, in order: a signed-short buffer load into a VGPR
; (captured as LOAD), an arithmetic shift right by 31 of that register, and a
; two-dword buffer store.
; The shift by 31 presumably produces the high 32 bits of the result - confirm
; against the backend lowering.
67 ; FUNC-LABEL: @sextload_global_i16_to_i64
68 ; SI: BUFFER_LOAD_SSHORT [[LOAD:v[0-9]+]],
69 ; SI: V_ASHRREV_I32_e32 v{{[0-9]+}}, 31, [[LOAD]]
70 ; SI: BUFFER_STORE_DWORDX2
71 define void @sextload_global_i16_to_i64(i64 addrspace(1)* %out, i16 addrspace(1)* %in) nounwind {
; NOTE(review): the i16 load is annotated align 8, as is the i64 store.
72 %a = load i16 addrspace(1)* %in, align 8
73 %ext = sext i16 %a to i64
74 store i64 %ext, i64 addrspace(1)* %out, align 8
; Test case: load an i32 from addrspace(1), sign-extend it to i64, and store
; the i64 to addrspace(1).
;   %out - i64 addrspace(1) destination pointer
;   %in  - i32 addrspace(1) source pointer
; The SI checks below expect, in order: a dword buffer load into a VGPR
; (captured as LOAD), an arithmetic shift right by 31 of that register, and a
; two-dword buffer store.
; The shift by 31 presumably produces the high 32 bits of the result - confirm
; against the backend lowering.
78 ; FUNC-LABEL: @sextload_global_i32_to_i64
79 ; SI: BUFFER_LOAD_DWORD [[LOAD:v[0-9]+]],
80 ; SI: V_ASHRREV_I32_e32 v{{[0-9]+}}, 31, [[LOAD]]
81 ; SI: BUFFER_STORE_DWORDX2
82 define void @sextload_global_i32_to_i64(i64 addrspace(1)* %out, i32 addrspace(1)* %in) nounwind {
; NOTE(review): the i32 load is annotated align 8, as is the i64 store.
83 %a = load i32 addrspace(1)* %in, align 8
84 %ext = sext i32 %a to i64
85 store i64 %ext, i64 addrspace(1)* %out, align 8
; Test case: load an i8 from addrspace(1), zero-extend it to i64, and store
; the i64 to addrspace(1).
;   %out - i64 addrspace(1) destination pointer
;   %in  - i8 addrspace(1) source pointer
; The SI checks below expect, in order: a scalar move of constant 0 into an
; SGPR (captured as ZERO), an unsigned-byte buffer load into a VGPR, a vector
; move that copies ZERO into a VGPR, and a two-dword buffer store.
; The zero register presumably supplies the high 32 bits of the result -
; confirm against the backend lowering.
89 ; FUNC-LABEL: @zextload_global_i8_to_i64
90 ; SI: S_MOV_B32 [[ZERO:s[0-9]+]], 0
91 ; SI: BUFFER_LOAD_UBYTE [[LOAD:v[0-9]+]],
92 ; SI: V_MOV_B32_e32 {{v[0-9]+}}, [[ZERO]]
93 ; SI: BUFFER_STORE_DWORDX2
94 define void @zextload_global_i8_to_i64(i64 addrspace(1)* %out, i8 addrspace(1)* %in) nounwind {
; NOTE(review): the i8 load is annotated align 8, as is the i64 store.
95 %a = load i8 addrspace(1)* %in, align 8
96 %ext = zext i8 %a to i64
97 store i64 %ext, i64 addrspace(1)* %out, align 8
; Test case: load an i16 from addrspace(1), zero-extend it to i64, and store
; the i64 to addrspace(1).
;   %out - i64 addrspace(1) destination pointer
;   %in  - i16 addrspace(1) source pointer
; The SI checks below expect, in order: a scalar move of constant 0 into an
; SGPR (captured as ZERO), an unsigned-short buffer load into a VGPR, a vector
; move that copies ZERO into a VGPR, and a two-dword buffer store.
; The zero register presumably supplies the high 32 bits of the result -
; confirm against the backend lowering.
101 ; FUNC-LABEL: @zextload_global_i16_to_i64
102 ; SI: S_MOV_B32 [[ZERO:s[0-9]+]], 0
103 ; SI: BUFFER_LOAD_USHORT [[LOAD:v[0-9]+]],
104 ; SI: V_MOV_B32_e32 {{v[0-9]+}}, [[ZERO]]
105 ; SI: BUFFER_STORE_DWORDX2
106 define void @zextload_global_i16_to_i64(i64 addrspace(1)* %out, i16 addrspace(1)* %in) nounwind {
; NOTE(review): the i16 load is annotated align 8, as is the i64 store.
107 %a = load i16 addrspace(1)* %in, align 8
108 %ext = zext i16 %a to i64
109 store i64 %ext, i64 addrspace(1)* %out, align 8
; Test case: load an i32 from addrspace(1), zero-extend it to i64, and store
; the i64 to addrspace(1).
;   %out - i64 addrspace(1) destination pointer
;   %in  - i32 addrspace(1) source pointer
; The SI checks below expect, in order: a scalar move of constant 0 into an
; SGPR (captured as ZERO), a dword buffer load into a VGPR, a vector move that
; copies ZERO into a VGPR, and a two-dword buffer store.
; The zero register presumably supplies the high 32 bits of the result -
; confirm against the backend lowering.
113 ; FUNC-LABEL: @zextload_global_i32_to_i64
114 ; SI: S_MOV_B32 [[ZERO:s[0-9]+]], 0
115 ; SI: BUFFER_LOAD_DWORD [[LOAD:v[0-9]+]],
116 ; SI: V_MOV_B32_e32 {{v[0-9]+}}, [[ZERO]]
117 ; SI: BUFFER_STORE_DWORDX2
118 define void @zextload_global_i32_to_i64(i64 addrspace(1)* %out, i32 addrspace(1)* %in) nounwind {
; NOTE(review): the i32 load is annotated align 8, as is the i64 store.
119 %a = load i32 addrspace(1)* %in, align 8
120 %ext = zext i32 %a to i64
121 store i64 %ext, i64 addrspace(1)* %out, align 8