Skip to content

Commit 62e537a

Browse files
[NFC][LLVM][SVE] Add bfloat predicated binop and FMA tests.
This is a bfloat clone of sve-fp-combine.ll that only tests sve-b16b16 because without this feature all binops are expanded to float.
1 parent 64686c5 commit 62e537a

File tree

1 file changed

+308
-0
lines changed

1 file changed

+308
-0
lines changed
Lines changed: 308 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,308 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2+
; RUN: llc -mattr=+sve,+bf16,+sve-b16b16 < %s | FileCheck %s
3+
4+
target triple = "aarch64-unknown-linux-gnu"
5+
6+
define <vscale x 8 x bfloat> @fmla_nxv8bf16(<vscale x 8 x bfloat> %acc, <vscale x 8 x bfloat> %m1, <vscale x 8 x bfloat> %m2) {
7+
; CHECK-LABEL: fmla_nxv8bf16:
8+
; CHECK: // %bb.0:
9+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
10+
; CHECK-NEXT: bfadd z0.h, z0.h, z1.h
11+
; CHECK-NEXT: ret
12+
%mul = fmul contract <vscale x 8 x bfloat> %m1, %m2
13+
%res = fadd contract <vscale x 8 x bfloat> %acc, %mul
14+
ret <vscale x 8 x bfloat> %res
15+
}
16+
17+
define <vscale x 4 x bfloat> @fmla_nxv4bf16(<vscale x 4 x bfloat> %acc, <vscale x 4 x bfloat> %m1, <vscale x 4 x bfloat> %m2) {
18+
; CHECK-LABEL: fmla_nxv4bf16:
19+
; CHECK: // %bb.0:
20+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
21+
; CHECK-NEXT: bfadd z0.h, z0.h, z1.h
22+
; CHECK-NEXT: ret
23+
%mul = fmul contract <vscale x 4 x bfloat> %m1, %m2
24+
%res = fadd contract <vscale x 4 x bfloat> %acc, %mul
25+
ret <vscale x 4 x bfloat> %res
26+
}
27+
28+
define <vscale x 2 x bfloat> @fmla_nxv2bf16(<vscale x 2 x bfloat> %acc, <vscale x 2 x bfloat> %m1, <vscale x 2 x bfloat> %m2) {
29+
; CHECK-LABEL: fmla_nxv2bf16:
30+
; CHECK: // %bb.0:
31+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
32+
; CHECK-NEXT: bfadd z0.h, z0.h, z1.h
33+
; CHECK-NEXT: ret
34+
%mul = fmul contract <vscale x 2 x bfloat> %m1, %m2
35+
%res = fadd contract <vscale x 2 x bfloat> %acc, %mul
36+
ret <vscale x 2 x bfloat> %res
37+
}
38+
39+
define <vscale x 8 x bfloat> @fmls_nxv8bf16(<vscale x 8 x bfloat> %acc, <vscale x 8 x bfloat> %m1, <vscale x 8 x bfloat> %m2) {
40+
; CHECK-LABEL: fmls_nxv8bf16:
41+
; CHECK: // %bb.0:
42+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
43+
; CHECK-NEXT: bfsub z0.h, z0.h, z1.h
44+
; CHECK-NEXT: ret
45+
%mul = fmul contract <vscale x 8 x bfloat> %m1, %m2
46+
%res = fsub contract <vscale x 8 x bfloat> %acc, %mul
47+
ret <vscale x 8 x bfloat> %res
48+
}
49+
50+
define <vscale x 4 x bfloat> @fmls_nxv4bf16(<vscale x 4 x bfloat> %acc, <vscale x 4 x bfloat> %m1, <vscale x 4 x bfloat> %m2) {
51+
; CHECK-LABEL: fmls_nxv4bf16:
52+
; CHECK: // %bb.0:
53+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
54+
; CHECK-NEXT: bfsub z0.h, z0.h, z1.h
55+
; CHECK-NEXT: ret
56+
%mul = fmul contract <vscale x 4 x bfloat> %m1, %m2
57+
%res = fsub contract <vscale x 4 x bfloat> %acc, %mul
58+
ret <vscale x 4 x bfloat> %res
59+
}
60+
61+
define <vscale x 2 x bfloat> @fmls_nxv2bf16(<vscale x 2 x bfloat> %acc, <vscale x 2 x bfloat> %m1, <vscale x 2 x bfloat> %m2) {
62+
; CHECK-LABEL: fmls_nxv2bf16:
63+
; CHECK: // %bb.0:
64+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
65+
; CHECK-NEXT: bfsub z0.h, z0.h, z1.h
66+
; CHECK-NEXT: ret
67+
%mul = fmul contract <vscale x 2 x bfloat> %m1, %m2
68+
%res = fsub contract <vscale x 2 x bfloat> %acc, %mul
69+
ret <vscale x 2 x bfloat> %res
70+
}
71+
72+
define <vscale x 8 x bfloat> @fmla_sel_nxv8bf16(<vscale x 8 x i1> %pred, <vscale x 8 x bfloat> %acc, <vscale x 8 x bfloat> %m1, <vscale x 8 x bfloat> %m2) {
73+
; CHECK-LABEL: fmla_sel_nxv8bf16:
74+
; CHECK: // %bb.0:
75+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
76+
; CHECK-NEXT: bfadd z1.h, z0.h, z1.h
77+
; CHECK-NEXT: mov z0.h, p0/m, z1.h
78+
; CHECK-NEXT: ret
79+
%mul = fmul contract <vscale x 8 x bfloat> %m1, %m2
80+
%add = fadd contract <vscale x 8 x bfloat> %acc, %mul
81+
%res = select <vscale x 8 x i1> %pred, <vscale x 8 x bfloat> %add, <vscale x 8 x bfloat> %acc
82+
ret <vscale x 8 x bfloat> %res
83+
}
84+
85+
define <vscale x 4 x bfloat> @fmla_sel_nxv4bf16(<vscale x 4 x i1> %pred, <vscale x 4 x bfloat> %acc, <vscale x 4 x bfloat> %m1, <vscale x 4 x bfloat> %m2) {
86+
; CHECK-LABEL: fmla_sel_nxv4bf16:
87+
; CHECK: // %bb.0:
88+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
89+
; CHECK-NEXT: bfadd z1.h, z0.h, z1.h
90+
; CHECK-NEXT: mov z0.s, p0/m, z1.s
91+
; CHECK-NEXT: ret
92+
%mul = fmul contract <vscale x 4 x bfloat> %m1, %m2
93+
%add = fadd contract <vscale x 4 x bfloat> %acc, %mul
94+
%res = select <vscale x 4 x i1> %pred, <vscale x 4 x bfloat> %add, <vscale x 4 x bfloat> %acc
95+
ret <vscale x 4 x bfloat> %res
96+
}
97+
98+
define <vscale x 2 x bfloat> @fmla_sel_nxv2bf16(<vscale x 2 x i1> %pred, <vscale x 2 x bfloat> %acc, <vscale x 2 x bfloat> %m1, <vscale x 2 x bfloat> %m2) {
99+
; CHECK-LABEL: fmla_sel_nxv2bf16:
100+
; CHECK: // %bb.0:
101+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
102+
; CHECK-NEXT: bfadd z1.h, z0.h, z1.h
103+
; CHECK-NEXT: mov z0.d, p0/m, z1.d
104+
; CHECK-NEXT: ret
105+
%mul = fmul contract <vscale x 2 x bfloat> %m1, %m2
106+
%add = fadd contract <vscale x 2 x bfloat> %acc, %mul
107+
%res = select <vscale x 2 x i1> %pred, <vscale x 2 x bfloat> %add, <vscale x 2 x bfloat> %acc
108+
ret <vscale x 2 x bfloat> %res
109+
}
110+
111+
define <vscale x 8 x bfloat> @fmls_sel_nxv8bf16(<vscale x 8 x i1> %pred, <vscale x 8 x bfloat> %acc, <vscale x 8 x bfloat> %m1, <vscale x 8 x bfloat> %m2) {
112+
; CHECK-LABEL: fmls_sel_nxv8bf16:
113+
; CHECK: // %bb.0:
114+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
115+
; CHECK-NEXT: bfsub z1.h, z0.h, z1.h
116+
; CHECK-NEXT: mov z0.h, p0/m, z1.h
117+
; CHECK-NEXT: ret
118+
%mul = fmul contract <vscale x 8 x bfloat> %m1, %m2
119+
%sub = fsub contract <vscale x 8 x bfloat> %acc, %mul
120+
%res = select <vscale x 8 x i1> %pred, <vscale x 8 x bfloat> %sub, <vscale x 8 x bfloat> %acc
121+
ret <vscale x 8 x bfloat> %res
122+
}
123+
124+
define <vscale x 4 x bfloat> @fmls_sel_nxv4bf16(<vscale x 4 x i1> %pred, <vscale x 4 x bfloat> %acc, <vscale x 4 x bfloat> %m1, <vscale x 4 x bfloat> %m2) {
125+
; CHECK-LABEL: fmls_sel_nxv4bf16:
126+
; CHECK: // %bb.0:
127+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
128+
; CHECK-NEXT: bfsub z1.h, z0.h, z1.h
129+
; CHECK-NEXT: mov z0.s, p0/m, z1.s
130+
; CHECK-NEXT: ret
131+
%mul = fmul contract <vscale x 4 x bfloat> %m1, %m2
132+
%sub = fsub contract <vscale x 4 x bfloat> %acc, %mul
133+
%res = select <vscale x 4 x i1> %pred, <vscale x 4 x bfloat> %sub, <vscale x 4 x bfloat> %acc
134+
ret <vscale x 4 x bfloat> %res
135+
}
136+
137+
define <vscale x 2 x bfloat> @fmls_sel_nxv2bf16(<vscale x 2 x i1> %pred, <vscale x 2 x bfloat> %acc, <vscale x 2 x bfloat> %m1, <vscale x 2 x bfloat> %m2) {
138+
; CHECK-LABEL: fmls_sel_nxv2bf16:
139+
; CHECK: // %bb.0:
140+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
141+
; CHECK-NEXT: bfsub z1.h, z0.h, z1.h
142+
; CHECK-NEXT: mov z0.d, p0/m, z1.d
143+
; CHECK-NEXT: ret
144+
%mul = fmul contract <vscale x 2 x bfloat> %m1, %m2
145+
%sub = fsub contract <vscale x 2 x bfloat> %acc, %mul
146+
%res = select <vscale x 2 x i1> %pred, <vscale x 2 x bfloat> %sub, <vscale x 2 x bfloat> %acc
147+
ret <vscale x 2 x bfloat> %res
148+
}
149+
150+
define <vscale x 8 x bfloat> @fadd_sel_nxv8bf16(<vscale x 8 x bfloat> %a, <vscale x 8 x bfloat> %b, <vscale x 8 x i1> %mask) {
151+
; CHECK-LABEL: fadd_sel_nxv8bf16:
152+
; CHECK: // %bb.0:
153+
; CHECK-NEXT: bfadd z1.h, z0.h, z1.h
154+
; CHECK-NEXT: mov z0.h, p0/m, z1.h
155+
; CHECK-NEXT: ret
156+
%sel = select <vscale x 8 x i1> %mask, <vscale x 8 x bfloat> %b, <vscale x 8 x bfloat> zeroinitializer
157+
%fadd = fadd nsz <vscale x 8 x bfloat> %a, %sel
158+
ret <vscale x 8 x bfloat> %fadd
159+
}
160+
161+
define <vscale x 8 x bfloat> @fsub_sel_nxv8bf16(<vscale x 8 x bfloat> %a, <vscale x 8 x bfloat> %b, <vscale x 8 x i1> %mask) {
162+
; CHECK-LABEL: fsub_sel_nxv8bf16:
163+
; CHECK: // %bb.0:
164+
; CHECK-NEXT: bfsub z1.h, z0.h, z1.h
165+
; CHECK-NEXT: mov z0.h, p0/m, z1.h
166+
; CHECK-NEXT: ret
167+
%sel = select <vscale x 8 x i1> %mask, <vscale x 8 x bfloat> %b, <vscale x 8 x bfloat> zeroinitializer
168+
%fsub = fsub <vscale x 8 x bfloat> %a, %sel
169+
ret <vscale x 8 x bfloat> %fsub
170+
}
171+
172+
define <vscale x 8 x bfloat> @fadd_sel_negzero_nxv8bf16(<vscale x 8 x bfloat> %a, <vscale x 8 x bfloat> %b, <vscale x 8 x i1> %mask) {
173+
; CHECK-LABEL: fadd_sel_negzero_nxv8bf16:
174+
; CHECK: // %bb.0:
175+
; CHECK-NEXT: bfadd z1.h, z0.h, z1.h
176+
; CHECK-NEXT: mov z0.h, p0/m, z1.h
177+
; CHECK-NEXT: ret
178+
%nz = fneg <vscale x 8 x bfloat> zeroinitializer
179+
%sel = select <vscale x 8 x i1> %mask, <vscale x 8 x bfloat> %b, <vscale x 8 x bfloat> %nz
180+
%fadd = fadd <vscale x 8 x bfloat> %a, %sel
181+
ret <vscale x 8 x bfloat> %fadd
182+
}
183+
184+
define <vscale x 8 x bfloat> @fsub_sel_negzero_nxv8bf16(<vscale x 8 x bfloat> %a, <vscale x 8 x bfloat> %b, <vscale x 8 x i1> %mask) {
185+
; CHECK-LABEL: fsub_sel_negzero_nxv8bf16:
186+
; CHECK: // %bb.0:
187+
; CHECK-NEXT: bfsub z1.h, z0.h, z1.h
188+
; CHECK-NEXT: mov z0.h, p0/m, z1.h
189+
; CHECK-NEXT: ret
190+
%nz = fneg <vscale x 8 x bfloat> zeroinitializer
191+
%sel = select <vscale x 8 x i1> %mask, <vscale x 8 x bfloat> %b, <vscale x 8 x bfloat> %nz
192+
%fsub = fsub nsz <vscale x 8 x bfloat> %a, %sel
193+
ret <vscale x 8 x bfloat> %fsub
194+
}
195+
196+
define <vscale x 8 x bfloat> @fadd_sel_fmul_nxv8bf16(<vscale x 8 x bfloat> %a, <vscale x 8 x bfloat> %b, <vscale x 8 x bfloat> %c, <vscale x 8 x i1> %mask) {
197+
; CHECK-LABEL: fadd_sel_fmul_nxv8bf16:
198+
; CHECK: // %bb.0:
199+
; CHECK-NEXT: movi v3.2d, #0000000000000000
200+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
201+
; CHECK-NEXT: sel z1.h, p0, z1.h, z3.h
202+
; CHECK-NEXT: bfadd z0.h, z0.h, z1.h
203+
; CHECK-NEXT: ret
204+
%fmul = fmul <vscale x 8 x bfloat> %b, %c
205+
%sel = select <vscale x 8 x i1> %mask, <vscale x 8 x bfloat> %fmul, <vscale x 8 x bfloat> zeroinitializer
206+
%fadd = fadd contract <vscale x 8 x bfloat> %a, %sel
207+
ret <vscale x 8 x bfloat> %fadd
208+
}
209+
210+
define <vscale x 8 x bfloat> @fsub_sel_fmul_nxv8bf16(<vscale x 8 x bfloat> %a, <vscale x 8 x bfloat> %b, <vscale x 8 x bfloat> %c, <vscale x 8 x i1> %mask) {
211+
; CHECK-LABEL: fsub_sel_fmul_nxv8bf16:
212+
; CHECK: // %bb.0:
213+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
214+
; CHECK-NEXT: bfsub z1.h, z0.h, z1.h
215+
; CHECK-NEXT: mov z0.h, p0/m, z1.h
216+
; CHECK-NEXT: ret
217+
%fmul = fmul <vscale x 8 x bfloat> %b, %c
218+
%sel = select <vscale x 8 x i1> %mask, <vscale x 8 x bfloat> %fmul, <vscale x 8 x bfloat> zeroinitializer
219+
%fsub = fsub contract <vscale x 8 x bfloat> %a, %sel
220+
ret <vscale x 8 x bfloat> %fsub
221+
}
222+
223+
define <vscale x 8 x bfloat> @fadd_sel_fmul_nsz_nxv8bf16(<vscale x 8 x bfloat> %a, <vscale x 8 x bfloat> %b, <vscale x 8 x bfloat> %c, <vscale x 8 x i1> %mask) {
224+
; CHECK-LABEL: fadd_sel_fmul_nsz_nxv8bf16:
225+
; CHECK: // %bb.0:
226+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
227+
; CHECK-NEXT: bfadd z1.h, z0.h, z1.h
228+
; CHECK-NEXT: mov z0.h, p0/m, z1.h
229+
; CHECK-NEXT: ret
230+
%fmul = fmul <vscale x 8 x bfloat> %b, %c
231+
%sel = select <vscale x 8 x i1> %mask, <vscale x 8 x bfloat> %fmul, <vscale x 8 x bfloat> zeroinitializer
232+
%fadd = fadd nsz contract <vscale x 8 x bfloat> %a, %sel
233+
ret <vscale x 8 x bfloat> %fadd
234+
}
235+
236+
define <vscale x 8 x bfloat> @fsub_sel_fmul_nsz_nxv8bf16(<vscale x 8 x bfloat> %a, <vscale x 8 x bfloat> %b, <vscale x 8 x bfloat> %c, <vscale x 8 x i1> %mask) {
237+
; CHECK-LABEL: fsub_sel_fmul_nsz_nxv8bf16:
238+
; CHECK: // %bb.0:
239+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
240+
; CHECK-NEXT: bfsub z1.h, z0.h, z1.h
241+
; CHECK-NEXT: mov z0.h, p0/m, z1.h
242+
; CHECK-NEXT: ret
243+
%fmul = fmul <vscale x 8 x bfloat> %b, %c
244+
%sel = select <vscale x 8 x i1> %mask, <vscale x 8 x bfloat> %fmul, <vscale x 8 x bfloat> zeroinitializer
245+
%fsub = fsub nsz contract <vscale x 8 x bfloat> %a, %sel
246+
ret <vscale x 8 x bfloat> %fsub
247+
}
248+
249+
define <vscale x 8 x bfloat> @fadd_sel_fmul_negzero_nxv8bf16(<vscale x 8 x bfloat> %a, <vscale x 8 x bfloat> %b, <vscale x 8 x bfloat> %c, <vscale x 8 x i1> %mask) {
250+
; CHECK-LABEL: fadd_sel_fmul_negzero_nxv8bf16:
251+
; CHECK: // %bb.0:
252+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
253+
; CHECK-NEXT: bfadd z1.h, z0.h, z1.h
254+
; CHECK-NEXT: mov z0.h, p0/m, z1.h
255+
; CHECK-NEXT: ret
256+
%fmul = fmul <vscale x 8 x bfloat> %b, %c
257+
%nz = fneg <vscale x 8 x bfloat> zeroinitializer
258+
%sel = select <vscale x 8 x i1> %mask, <vscale x 8 x bfloat> %fmul, <vscale x 8 x bfloat> %nz
259+
%fadd = fadd contract <vscale x 8 x bfloat> %a, %sel
260+
ret <vscale x 8 x bfloat> %fadd
261+
}
262+
263+
define <vscale x 8 x bfloat> @fsub_sel_fmul_negzero_nxv8bf16(<vscale x 8 x bfloat> %a, <vscale x 8 x bfloat> %b, <vscale x 8 x bfloat> %c, <vscale x 8 x i1> %mask) {
264+
; CHECK-LABEL: fsub_sel_fmul_negzero_nxv8bf16:
265+
; CHECK: // %bb.0:
266+
; CHECK-NEXT: mov w8, #32768 // =0x8000
267+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
268+
; CHECK-NEXT: fmov h3, w8
269+
; CHECK-NEXT: mov z3.h, h3
270+
; CHECK-NEXT: sel z1.h, p0, z1.h, z3.h
271+
; CHECK-NEXT: bfsub z0.h, z0.h, z1.h
272+
; CHECK-NEXT: ret
273+
%fmul = fmul <vscale x 8 x bfloat> %b, %c
274+
%nz = fneg <vscale x 8 x bfloat> zeroinitializer
275+
%sel = select <vscale x 8 x i1> %mask, <vscale x 8 x bfloat> %fmul, <vscale x 8 x bfloat> %nz
276+
%fsub = fsub contract <vscale x 8 x bfloat> %a, %sel
277+
ret <vscale x 8 x bfloat> %fsub
278+
}
279+
280+
define <vscale x 8 x bfloat> @fadd_sel_fmul_negzero_nsz_nxv8bf16(<vscale x 8 x bfloat> %a, <vscale x 8 x bfloat> %b, <vscale x 8 x bfloat> %c, <vscale x 8 x i1> %mask) {
281+
; CHECK-LABEL: fadd_sel_fmul_negzero_nsz_nxv8bf16:
282+
; CHECK: // %bb.0:
283+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
284+
; CHECK-NEXT: bfadd z1.h, z0.h, z1.h
285+
; CHECK-NEXT: mov z0.h, p0/m, z1.h
286+
; CHECK-NEXT: ret
287+
%fmul = fmul <vscale x 8 x bfloat> %b, %c
288+
%nz = fneg <vscale x 8 x bfloat> zeroinitializer
289+
%sel = select <vscale x 8 x i1> %mask, <vscale x 8 x bfloat> %fmul, <vscale x 8 x bfloat> %nz
290+
%fadd = fadd nsz contract <vscale x 8 x bfloat> %a, %sel
291+
ret <vscale x 8 x bfloat> %fadd
292+
}
293+
294+
define <vscale x 8 x bfloat> @fsub_sel_fmul_negzero_nsz_nxv8bf16(<vscale x 8 x bfloat> %a, <vscale x 8 x bfloat> %b, <vscale x 8 x bfloat> %c, <vscale x 8 x i1> %mask) {
295+
; CHECK-LABEL: fsub_sel_fmul_negzero_nsz_nxv8bf16:
296+
; CHECK: // %bb.0:
297+
; CHECK-NEXT: bfmul z1.h, z1.h, z2.h
298+
; CHECK-NEXT: bfsub z1.h, z0.h, z1.h
299+
; CHECK-NEXT: mov z0.h, p0/m, z1.h
300+
; CHECK-NEXT: ret
301+
%fmul = fmul <vscale x 8 x bfloat> %b, %c
302+
%nz = fneg <vscale x 8 x bfloat> zeroinitializer
303+
%sel = select <vscale x 8 x i1> %mask, <vscale x 8 x bfloat> %fmul, <vscale x 8 x bfloat> %nz
304+
%fsub = fsub nsz contract <vscale x 8 x bfloat> %a, %sel
305+
ret <vscale x 8 x bfloat> %fsub
306+
}
307+
308+
declare <vscale x 8 x bfloat> @llvm.fma.nxv8bf16(<vscale x 8 x bfloat>, <vscale x 8 x bfloat>, <vscale x 8 x bfloat>)

0 commit comments

Comments
 (0)