Skip to content

Commit f23cfb5

Browse files
committed
[NFC] Fix conflict resolution in b6bd010
The incoming commit use int reg instead of float reg, we should only update accoridly, don't blindly accept all the upstream code.
1 parent 4899fda commit f23cfb5

File tree

2 files changed

+13
-11
lines changed

2 files changed

+13
-11
lines changed

llvm/test/CodeGen/NVPTX/surf-read-cuda.ll

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -14,14 +14,15 @@ define void @foo(i64 %img, ptr %red, i32 %idx) {
1414
; CHECK-LABEL: foo(
1515
; CHECK: {
1616
; CHECK-NEXT: .reg .b32 %r<4>;
17-
; CHECK-NEXT: .reg .b64 %rd<4>;
17+
; CHECK-NEXT: .reg .b64 %rd<3>;
1818
; CHECK-EMPTY:
1919
; CHECK-NEXT: // %bb.0:
2020
; CHECK-NEXT: ld.param.b64 %rd1, [foo_param_0];
2121
; CHECK-NEXT: ld.param.b32 %r1, [foo_param_2];
2222
; CHECK-NEXT: suld.b.1d.b32.trap {%r2}, [%rd1, {%r1}];
23+
; CHECK-NEXT: ld.param.b64 %rd2, [foo_param_1];
2324
; CHECK-NEXT: cvt.rn.f32.s32 %r3, %r2;
24-
; CHECK-NEXT: st.global.b32 [%rd3], %r3;
25+
; CHECK-NEXT: st.b32 [%rd2], %r3;
2526
; CHECK-NEXT: ret;
2627
%val = tail call i32 @llvm.nvvm.suld.1d.i32.trap(i64 %img, i32 %idx)
2728
%ret = sitofp i32 %val to float
@@ -35,14 +36,14 @@ define void @bar(ptr %red, i32 %idx) {
3536
; CHECK-LABEL: bar(
3637
; CHECK: {
3738
; CHECK-NEXT: .reg .b32 %r<4>;
38-
; CHECK-NEXT: .reg .b64 %rd<4>;
39+
; CHECK-NEXT: .reg .b64 %rd<3>;
3940
; CHECK-EMPTY:
4041
; CHECK-NEXT: // %bb.0:
4142
; CHECK-NEXT: ld.param.b64 %rd1, [bar_param_0];
4243
; CHECK-NEXT: ld.param.b32 %r1, [bar_param_1];
4344
; CHECK-NEXT: suld.b.1d.b32.trap {%r2}, [surf0, {%r1}];
4445
; CHECK-NEXT: cvt.rn.f32.s32 %r3, %r2;
45-
; CHECK-NEXT: st.global.b32 [%rd2], %r3;
46+
; CHECK-NEXT: st.b32 [%rd1], %r3;
4647
; CHECK-NEXT: ret;
4748
%surfHandle = tail call i64 @llvm.nvvm.texsurf.handle.internal.p1(ptr addrspace(1) @surf0)
4849
%val = tail call i32 @llvm.nvvm.suld.1d.i32.trap(i64 %surfHandle, i32 %idx)

llvm/test/CodeGen/NVPTX/tex-read-cuda.ll

Lines changed: 8 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -14,13 +14,14 @@ define void @foo(i64 %img, ptr %red, i32 %idx) {
1414
; CHECK-LABEL: foo(
1515
; CHECK: {
1616
; CHECK-NEXT: .reg .b32 %r<6>;
17-
; CHECK-NEXT: .reg .b64 %rd<4>;
17+
; CHECK-NEXT: .reg .b64 %rd<3>;
1818
; CHECK-EMPTY:
1919
; CHECK-NEXT: // %bb.0:
2020
; CHECK-NEXT: ld.param.b64 %rd1, [foo_param_0];
2121
; CHECK-NEXT: ld.param.b32 %r1, [foo_param_2];
2222
; CHECK-NEXT: tex.1d.v4.f32.s32 {%r2, %r3, %r4, %r5}, [%rd1, {%r1}];
23-
; CHECK-NEXT: st.global.b32 [%rd3], %r2;
23+
; CHECK-NEXT: ld.param.b64 %rd2, [foo_param_1];
24+
; CHECK-NEXT: st.b32 [%rd2], %r2;
2425
; CHECK-NEXT: ret;
2526
%val = tail call { float, float, float, float } @llvm.nvvm.tex.unified.1d.v4f32.s32(i64 %img, i32 %idx)
2627
%ret = extractvalue { float, float, float, float } %val, 0
@@ -35,13 +36,13 @@ define void @bar(ptr %red, i32 %idx) {
3536
; CHECK-LABEL: bar(
3637
; CHECK: {
3738
; CHECK-NEXT: .reg .b32 %r<6>;
38-
; CHECK-NEXT: .reg .b64 %rd<4>;
39+
; CHECK-NEXT: .reg .b64 %rd<3>;
3940
; CHECK-EMPTY:
4041
; CHECK-NEXT: // %bb.0:
4142
; CHECK-NEXT: ld.param.b64 %rd1, [bar_param_0];
4243
; CHECK-NEXT: ld.param.b32 %r1, [bar_param_1];
4344
; CHECK-NEXT: tex.1d.v4.f32.s32 {%r2, %r3, %r4, %r5}, [tex0, {%r1}];
44-
; CHECK-NEXT: st.global.b32 [%rd2], %r2;
45+
; CHECK-NEXT: st.b32 [%rd1], %r2;
4546
; CHECK-NEXT: ret;
4647
%texHandle = tail call i64 @llvm.nvvm.texsurf.handle.internal.p1(ptr addrspace(1) @tex0)
4748
%val = tail call { float, float, float, float } @llvm.nvvm.tex.unified.1d.v4f32.s32(i64 %texHandle, i32 %idx)
@@ -56,12 +57,12 @@ define void @baz(ptr %red, i32 %idx) {
5657
; CHECK-LABEL: baz(
5758
; CHECK: {
5859
; CHECK-NEXT: .reg .b32 %r<9>;
59-
; CHECK-NEXT: .reg .b64 %rd<4>;
60+
; CHECK-NEXT: .reg .b64 %rd<3>;
6061
; CHECK-EMPTY:
6162
; CHECK-NEXT: // %bb.0:
6263
; CHECK-NEXT: ld.param.b64 %rd1, [baz_param_0];
6364
; CHECK-NEXT: ld.param.b32 %r1, [baz_param_1];
64-
; CHECK-NEXT: mov.u64 %rd3, tex0;
65+
; CHECK-NEXT: mov.u64 %rd2, tex0;
6566
; CHECK-NEXT: tex.1d.v4.f32.s32 {%r2, %r3, %r4, %r5}, [tex0, {%r1}];
6667
; CHECK-NEXT: { // callseq 0, 0
6768
; CHECK-NEXT: .param .b64 param0;
@@ -75,7 +76,7 @@ define void @baz(ptr %red, i32 %idx) {
7576
; CHECK-NEXT: ld.param.b32 %r6, [retval0];
7677
; CHECK-NEXT: } // callseq 0
7778
; CHECK-NEXT: add.rn.f32 %r8, %r2, %r6;
78-
; CHECK-NEXT: st.global.b32 [%rd2], %r8;
79+
; CHECK-NEXT: st.b32 [%rd1], %r8;
7980
; CHECK-NEXT: ret;
8081
%texHandle = tail call i64 @llvm.nvvm.texsurf.handle.internal.p1(ptr addrspace(1) @tex0)
8182
%val = tail call { float, float, float, float } @llvm.nvvm.tex.unified.1d.v4f32.s32(i64 %texHandle, i32 %idx)

0 commit comments

Comments
 (0)