@@ -14,13 +14,14 @@ define void @foo(i64 %img, ptr %red, i32 %idx) {
14
14
; CHECK-LABEL: foo(
15
15
; CHECK: {
16
16
; CHECK-NEXT: .reg .b32 %r<6>;
17
- ; CHECK-NEXT: .reg .b64 %rd<4 >;
17
+ ; CHECK-NEXT: .reg .b64 %rd<3 >;
18
18
; CHECK-EMPTY:
19
19
; CHECK-NEXT: // %bb.0:
20
20
; CHECK-NEXT: ld.param.b64 %rd1, [foo_param_0];
21
21
; CHECK-NEXT: ld.param.b32 %r1, [foo_param_2];
22
22
; CHECK-NEXT: tex.1d.v4.f32.s32 {%r2, %r3, %r4, %r5}, [%rd1, {%r1}];
23
- ; CHECK-NEXT: st.global.b32 [%rd3], %r2;
23
+ ; CHECK-NEXT: ld.param.b64 %rd2, [foo_param_1];
24
+ ; CHECK-NEXT: st.b32 [%rd2], %r2;
24
25
; CHECK-NEXT: ret;
25
26
%val = tail call { float , float , float , float } @llvm.nvvm.tex.unified.1d.v4f32.s32 (i64 %img , i32 %idx )
26
27
%ret = extractvalue { float , float , float , float } %val , 0
@@ -35,13 +36,13 @@ define void @bar(ptr %red, i32 %idx) {
35
36
; CHECK-LABEL: bar(
36
37
; CHECK: {
37
38
; CHECK-NEXT: .reg .b32 %r<6>;
38
- ; CHECK-NEXT: .reg .b64 %rd<4 >;
39
+ ; CHECK-NEXT: .reg .b64 %rd<3 >;
39
40
; CHECK-EMPTY:
40
41
; CHECK-NEXT: // %bb.0:
41
42
; CHECK-NEXT: ld.param.b64 %rd1, [bar_param_0];
42
43
; CHECK-NEXT: ld.param.b32 %r1, [bar_param_1];
43
44
; CHECK-NEXT: tex.1d.v4.f32.s32 {%r2, %r3, %r4, %r5}, [tex0, {%r1}];
44
- ; CHECK-NEXT: st.global. b32 [%rd2 ], %r2;
45
+ ; CHECK-NEXT: st.b32 [%rd1 ], %r2;
45
46
; CHECK-NEXT: ret;
46
47
%texHandle = tail call i64 @llvm.nvvm.texsurf.handle.internal.p1 (ptr addrspace (1 ) @tex0 )
47
48
%val = tail call { float , float , float , float } @llvm.nvvm.tex.unified.1d.v4f32.s32 (i64 %texHandle , i32 %idx )
@@ -56,12 +57,12 @@ define void @baz(ptr %red, i32 %idx) {
56
57
; CHECK-LABEL: baz(
57
58
; CHECK: {
58
59
; CHECK-NEXT: .reg .b32 %r<9>;
59
- ; CHECK-NEXT: .reg .b64 %rd<4 >;
60
+ ; CHECK-NEXT: .reg .b64 %rd<3 >;
60
61
; CHECK-EMPTY:
61
62
; CHECK-NEXT: // %bb.0:
62
63
; CHECK-NEXT: ld.param.b64 %rd1, [baz_param_0];
63
64
; CHECK-NEXT: ld.param.b32 %r1, [baz_param_1];
64
- ; CHECK-NEXT: mov.u64 %rd3 , tex0;
65
+ ; CHECK-NEXT: mov.u64 %rd2 , tex0;
65
66
; CHECK-NEXT: tex.1d.v4.f32.s32 {%r2, %r3, %r4, %r5}, [tex0, {%r1}];
66
67
; CHECK-NEXT: { // callseq 0, 0
67
68
; CHECK-NEXT: .param .b64 param0;
@@ -75,7 +76,7 @@ define void @baz(ptr %red, i32 %idx) {
75
76
; CHECK-NEXT: ld.param.b32 %r6, [retval0];
76
77
; CHECK-NEXT: } // callseq 0
77
78
; CHECK-NEXT: add.rn.f32 %r8, %r2, %r6;
78
- ; CHECK-NEXT: st.global. b32 [%rd2 ], %r8;
79
+ ; CHECK-NEXT: st.b32 [%rd1 ], %r8;
79
80
; CHECK-NEXT: ret;
80
81
%texHandle = tail call i64 @llvm.nvvm.texsurf.handle.internal.p1 (ptr addrspace (1 ) @tex0 )
81
82
%val = tail call { float , float , float , float } @llvm.nvvm.tex.unified.1d.v4f32.s32 (i64 %texHandle , i32 %idx )
0 commit comments