@@ -130,14 +130,14 @@ define half @ld_global_v8f16(ptr addrspace(1) %ptr) {
130
130
define float @ld_global_v2f32 (ptr addrspace (1 ) %ptr ) {
131
131
; CHECK-LABEL: ld_global_v2f32(
132
132
; CHECK: {
133
- ; CHECK-NEXT: .reg .f32 %f<4>;
133
+ ; CHECK-NEXT: .reg .b32 %f<4>;
134
134
; CHECK-NEXT: .reg .b64 %rd<2>;
135
135
; CHECK-EMPTY:
136
136
; CHECK-NEXT: // %bb.0:
137
- ; CHECK-NEXT: ld.param.u64 %rd1, [ld_global_v2f32_param_0];
138
- ; CHECK-NEXT: ld.global.nc.v2.f32 {%f1, %f2}, [%rd1];
137
+ ; CHECK-NEXT: ld.param.b64 %rd1, [ld_global_v2f32_param_0];
138
+ ; CHECK-NEXT: ld.global.nc.v2.b32 {%f1, %f2}, [%rd1];
139
139
; CHECK-NEXT: add.rn.f32 %f3, %f1, %f2;
140
- ; CHECK-NEXT: st.param.f32 [func_retval0], %f3;
140
+ ; CHECK-NEXT: st.param.b32 [func_retval0], %f3;
141
141
; CHECK-NEXT: ret;
142
142
%a = load <2 x float >, ptr addrspace (1 ) %ptr , !invariant.load !0
143
143
%v1 = extractelement <2 x float > %a , i32 0
@@ -149,16 +149,16 @@ define float @ld_global_v2f32(ptr addrspace(1) %ptr) {
149
149
define float @ld_global_v4f32 (ptr addrspace (1 ) %ptr ) {
150
150
; CHECK-LABEL: ld_global_v4f32(
151
151
; CHECK: {
152
- ; CHECK-NEXT: .reg .f32 %f<8>;
152
+ ; CHECK-NEXT: .reg .b32 %f<8>;
153
153
; CHECK-NEXT: .reg .b64 %rd<2>;
154
154
; CHECK-EMPTY:
155
155
; CHECK-NEXT: // %bb.0:
156
- ; CHECK-NEXT: ld.param.u64 %rd1, [ld_global_v4f32_param_0];
157
- ; CHECK-NEXT: ld.global.nc.v4.f32 {%f1, %f2, %f3, %f4}, [%rd1];
156
+ ; CHECK-NEXT: ld.param.b64 %rd1, [ld_global_v4f32_param_0];
157
+ ; CHECK-NEXT: ld.global.nc.v4.b32 {%f1, %f2, %f3, %f4}, [%rd1];
158
158
; CHECK-NEXT: add.rn.f32 %f5, %f1, %f2;
159
159
; CHECK-NEXT: add.rn.f32 %f6, %f3, %f4;
160
160
; CHECK-NEXT: add.rn.f32 %f7, %f5, %f6;
161
- ; CHECK-NEXT: st.param.f32 [func_retval0], %f7;
161
+ ; CHECK-NEXT: st.param.b32 [func_retval0], %f7;
162
162
; CHECK-NEXT: ret;
163
163
%a = load <4 x float >, ptr addrspace (1 ) %ptr , !invariant.load !0
164
164
%v1 = extractelement <4 x float > %a , i32 0
@@ -174,17 +174,17 @@ define float @ld_global_v4f32(ptr addrspace(1) %ptr) {
174
174
define float @ld_global_v8f32 (ptr addrspace (1 ) %ptr ) {
175
175
; CHECK-LABEL: ld_global_v8f32(
176
176
; CHECK: {
177
- ; CHECK-NEXT: .reg .f32 %f<12>;
177
+ ; CHECK-NEXT: .reg .b32 %f<12>;
178
178
; CHECK-NEXT: .reg .b64 %rd<2>;
179
179
; CHECK-EMPTY:
180
180
; CHECK-NEXT: // %bb.0:
181
- ; CHECK-NEXT: ld.param.u64 %rd1, [ld_global_v8f32_param_0];
182
- ; CHECK-NEXT: ld.global.nc.v4.f32 {%f1, %f2, %f3, %f4}, [%rd1+16];
183
- ; CHECK-NEXT: ld.global.nc.v4.f32 {%f5, %f6, %f7, %f8}, [%rd1];
181
+ ; CHECK-NEXT: ld.param.b64 %rd1, [ld_global_v8f32_param_0];
182
+ ; CHECK-NEXT: ld.global.nc.v4.b32 {%f1, %f2, %f3, %f4}, [%rd1+16];
183
+ ; CHECK-NEXT: ld.global.nc.v4.b32 {%f5, %f6, %f7, %f8}, [%rd1];
184
184
; CHECK-NEXT: add.rn.f32 %f9, %f5, %f7;
185
185
; CHECK-NEXT: add.rn.f32 %f10, %f1, %f3;
186
186
; CHECK-NEXT: add.rn.f32 %f11, %f9, %f10;
187
- ; CHECK-NEXT: st.param.f32 [func_retval0], %f11;
187
+ ; CHECK-NEXT: st.param.b32 [func_retval0], %f11;
188
188
; CHECK-NEXT: ret;
189
189
%a = load <8 x float >, ptr addrspace (1 ) %ptr , !invariant.load !0
190
190
%v1 = extractelement <8 x float > %a , i32 0
0 commit comments