Skip to content

Commit badf218

Browse files
asbDisasm
authored andcommitted
[RISCV] Add tests to demonstrate bitcasted fneg/fabs dagcombines
This target-independent code won't trigger for cases such as RV32FD where custom SelectionDAG nodes are generated. These new tests demonstrate such cases. Additionally, float-arith.ll was updated so that fneg.s, fsgnjn.s, and fabs.s selection patterns are actually exercised. llvm-svn: 352199
1 parent 83a98f4 commit badf218

File tree

3 files changed

+162
-25
lines changed

3 files changed

+162
-25
lines changed
Lines changed: 80 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,80 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2+
; RUN: llc -mtriple=riscv32 -verify-machineinstrs < %s \
3+
; RUN: | FileCheck -check-prefix=RV32I %s
4+
; RUN: llc -mtriple=riscv32 -mattr=+d -verify-machineinstrs < %s \
5+
; RUN: | FileCheck -check-prefix=RV32IFD %s
6+
; RUN: llc -mtriple=riscv64 -verify-machineinstrs < %s \
7+
; RUN: | FileCheck -check-prefix=RV64I %s
8+
;
9+
; This file tests cases where simple floating point operations can be
10+
; profitably handled though bit manipulation if a soft-float ABI is being used
11+
; (e.g. fneg implemented by XORing the sign bit). This is typically handled in
12+
; DAGCombiner::visitBITCAST, but this target-independent code may not trigger
13+
; in cases where we perform custom legalisation (e.g. RV32IFD).
14+
15+
; TODO: Add an appropriate target-specific DAG combine that can handle
16+
; RISCVISD::SplitF64/BuildPairF64 used for RV32IFD.
17+
18+
define double @fneg(double %a) nounwind {
19+
; RV32I-LABEL: fneg:
20+
; RV32I: # %bb.0:
21+
; RV32I-NEXT: lui a2, 524288
22+
; RV32I-NEXT: xor a1, a1, a2
23+
; RV32I-NEXT: ret
24+
;
25+
; RV32IFD-LABEL: fneg:
26+
; RV32IFD: # %bb.0:
27+
; RV32IFD-NEXT: addi sp, sp, -16
28+
; RV32IFD-NEXT: sw a0, 8(sp)
29+
; RV32IFD-NEXT: sw a1, 12(sp)
30+
; RV32IFD-NEXT: fld ft0, 8(sp)
31+
; RV32IFD-NEXT: fneg.d ft0, ft0
32+
; RV32IFD-NEXT: fsd ft0, 8(sp)
33+
; RV32IFD-NEXT: lw a0, 8(sp)
34+
; RV32IFD-NEXT: lw a1, 12(sp)
35+
; RV32IFD-NEXT: addi sp, sp, 16
36+
; RV32IFD-NEXT: ret
37+
;
38+
; RV64I-LABEL: fneg:
39+
; RV64I: # %bb.0:
40+
; RV64I-NEXT: addi a1, zero, -1
41+
; RV64I-NEXT: slli a1, a1, 63
42+
; RV64I-NEXT: xor a0, a0, a1
43+
; RV64I-NEXT: ret
44+
%1 = fneg double %a
45+
ret double %1
46+
}
47+
48+
declare double @llvm.fabs.f64(double)
49+
50+
define double @fabs(double %a) nounwind {
51+
; RV32I-LABEL: fabs:
52+
; RV32I: # %bb.0:
53+
; RV32I-NEXT: lui a2, 524288
54+
; RV32I-NEXT: addi a2, a2, -1
55+
; RV32I-NEXT: and a1, a1, a2
56+
; RV32I-NEXT: ret
57+
;
58+
; RV32IFD-LABEL: fabs:
59+
; RV32IFD: # %bb.0:
60+
; RV32IFD-NEXT: addi sp, sp, -16
61+
; RV32IFD-NEXT: sw a0, 8(sp)
62+
; RV32IFD-NEXT: sw a1, 12(sp)
63+
; RV32IFD-NEXT: fld ft0, 8(sp)
64+
; RV32IFD-NEXT: fabs.d ft0, ft0
65+
; RV32IFD-NEXT: fsd ft0, 8(sp)
66+
; RV32IFD-NEXT: lw a0, 8(sp)
67+
; RV32IFD-NEXT: lw a1, 12(sp)
68+
; RV32IFD-NEXT: addi sp, sp, 16
69+
; RV32IFD-NEXT: ret
70+
;
71+
; RV64I-LABEL: fabs:
72+
; RV64I: # %bb.0:
73+
; RV64I-NEXT: addi a1, zero, -1
74+
; RV64I-NEXT: slli a1, a1, 63
75+
; RV64I-NEXT: addi a1, a1, -1
76+
; RV64I-NEXT: and a0, a0, a1
77+
; RV64I-NEXT: ret
78+
%1 = call double @llvm.fabs.f64(double %a)
79+
ret double %1
80+
}

llvm/test/CodeGen/RISCV/float-arith.ll

Lines changed: 33 additions & 25 deletions
Original file line numberDiff line numberDiff line change
@@ -81,50 +81,58 @@ define float @fsgnj_s(float %a, float %b) nounwind {
8181
ret float %1
8282
}
8383

84-
define float @fneg_s(float %a) nounwind {
85-
; TODO: doesn't test the fneg selection pattern because
86-
; DAGCombiner::visitBITCAST will generate a xor on the incoming integer
87-
; argument
84+
; This function performs extra work to ensure that
85+
; DAGCombiner::visitBITCAST doesn't replace the fneg with an xor.
86+
define i32 @fneg_s(float %a, float %b) nounwind {
8887
; RV32IF-LABEL: fneg_s:
8988
; RV32IF: # %bb.0:
90-
; RV32IF-NEXT: lui a1, 524288
91-
; RV32IF-NEXT: xor a0, a0, a1
89+
; RV32IF-NEXT: fmv.w.x ft0, a0
90+
; RV32IF-NEXT: fadd.s ft0, ft0, ft0
91+
; RV32IF-NEXT: fneg.s ft1, ft0
92+
; RV32IF-NEXT: feq.s a0, ft0, ft1
9293
; RV32IF-NEXT: ret
93-
%1 = fsub float -0.0, %a
94-
ret float %1
94+
%1 = fadd float %a, %a
95+
%2 = fneg float %1
96+
%3 = fcmp oeq float %1, %2
97+
%4 = zext i1 %3 to i32
98+
ret i32 %4
9599
}
96100

101+
; This function performs extra work to ensure that
102+
; DAGCombiner::visitBITCAST doesn't replace the fneg with an xor.
97103
define float @fsgnjn_s(float %a, float %b) nounwind {
98-
; TODO: fsgnjn.s isn't selected because DAGCombiner::visitBITCAST will convert
99-
; (bitconvert (fneg x)) to a xor
100104
; RV32IF-LABEL: fsgnjn_s:
101105
; RV32IF: # %bb.0:
102-
; RV32IF-NEXT: lui a2, 524288
103-
; RV32IF-NEXT: xor a1, a1, a2
104106
; RV32IF-NEXT: fmv.w.x ft0, a1
105107
; RV32IF-NEXT: fmv.w.x ft1, a0
106-
; RV32IF-NEXT: fsgnj.s ft0, ft1, ft0
108+
; RV32IF-NEXT: fadd.s ft0, ft1, ft0
109+
; RV32IF-NEXT: fsgnjn.s ft0, ft1, ft0
107110
; RV32IF-NEXT: fmv.x.w a0, ft0
108111
; RV32IF-NEXT: ret
109-
%1 = fsub float -0.0, %b
110-
%2 = call float @llvm.copysign.f32(float %a, float %1)
111-
ret float %2
112+
%1 = fadd float %a, %b
113+
%2 = fneg float %1
114+
%3 = call float @llvm.copysign.f32(float %a, float %2)
115+
ret float %3
112116
}
113117

114118
declare float @llvm.fabs.f32(float)
115119

116-
define float @fabs_s(float %a) nounwind {
117-
; TODO: doesn't test the fabs selection pattern because
118-
; DAGCombiner::visitBITCAST will generate an and on the incoming integer
119-
; argument
120+
; This function performs extra work to ensure that
121+
; DAGCombiner::visitBITCAST doesn't replace the fabs with an and.
122+
define float @fabs_s(float %a, float %b) nounwind {
120123
; RV32IF-LABEL: fabs_s:
121124
; RV32IF: # %bb.0:
122-
; RV32IF-NEXT: lui a1, 524288
123-
; RV32IF-NEXT: addi a1, a1, -1
124-
; RV32IF-NEXT: and a0, a0, a1
125+
; RV32IF-NEXT: fmv.w.x ft0, a1
126+
; RV32IF-NEXT: fmv.w.x ft1, a0
127+
; RV32IF-NEXT: fadd.s ft0, ft1, ft0
128+
; RV32IF-NEXT: fabs.s ft1, ft0
129+
; RV32IF-NEXT: fadd.s ft0, ft1, ft0
130+
; RV32IF-NEXT: fmv.x.w a0, ft0
125131
; RV32IF-NEXT: ret
126-
%1 = call float @llvm.fabs.f32(float %a)
127-
ret float %1
132+
%1 = fadd float %a, %b
133+
%2 = call float @llvm.fabs.f32(float %1)
134+
%3 = fadd float %2, %1
135+
ret float %3
128136
}
129137

130138
declare float @llvm.minnum.f32(float, float)
Lines changed: 49 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,49 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2+
; RUN: llc -mtriple=riscv32 -verify-machineinstrs < %s \
3+
; RUN: | FileCheck -check-prefix=RV32I %s
4+
; RUN: llc -mtriple=riscv32 -mattr=+f -verify-machineinstrs < %s \
5+
; RUN: | FileCheck -check-prefix=RV32I %s
6+
; RUN: llc -mtriple=riscv64 -verify-machineinstrs < %s \
7+
; RUN: | FileCheck -check-prefix=RV64I %s
8+
9+
; This file tests cases where simple floating point operations can be
10+
; profitably handled though bit manipulation if a soft-float ABI is being used
11+
; (e.g. fneg implemented by XORing the sign bit). This is typically handled in
12+
; DAGCombiner::visitBITCAST, but this target-independent code may not trigger
13+
; in cases where we perform custom legalisation (e.g. RV64F).
14+
15+
define float @fneg(float %a) nounwind {
16+
; RV32I-LABEL: fneg:
17+
; RV32I: # %bb.0:
18+
; RV32I-NEXT: lui a1, 524288
19+
; RV32I-NEXT: xor a0, a0, a1
20+
; RV32I-NEXT: ret
21+
;
22+
; RV64I-LABEL: fneg:
23+
; RV64I: # %bb.0:
24+
; RV64I-NEXT: lui a1, 524288
25+
; RV64I-NEXT: xor a0, a0, a1
26+
; RV64I-NEXT: ret
27+
%1 = fneg float %a
28+
ret float %1
29+
}
30+
31+
declare float @llvm.fabs.f32(float)
32+
33+
define float @fabs(float %a) nounwind {
34+
; RV32I-LABEL: fabs:
35+
; RV32I: # %bb.0:
36+
; RV32I-NEXT: lui a1, 524288
37+
; RV32I-NEXT: addi a1, a1, -1
38+
; RV32I-NEXT: and a0, a0, a1
39+
; RV32I-NEXT: ret
40+
;
41+
; RV64I-LABEL: fabs:
42+
; RV64I: # %bb.0:
43+
; RV64I-NEXT: lui a1, 524288
44+
; RV64I-NEXT: addiw a1, a1, -1
45+
; RV64I-NEXT: and a0, a0, a1
46+
; RV64I-NEXT: ret
47+
%1 = call float @llvm.fabs.f32(float %a)
48+
ret float %1
49+
}

0 commit comments

Comments
 (0)