Skip to content

Commit 90231bf

Browse files
authored
Merge pull request #4258 from martin-frbg/issue4257
Fix build on Fujitsu A64FX
2 parents bf3183d + e7d0540 commit 90231bf

File tree

1 file changed

+40
-50
lines changed

1 file changed

+40
-50
lines changed

kernel/arm64/KERNEL.A64FX

Lines changed: 40 additions & 50 deletions
Original file line number | Diff line number | Diff line change
@@ -57,7 +57,7 @@ CAMAXKERNEL = zamax.S
57 57
ZAMAXKERNEL = zamax.S
58 58

59 59
SAXPYKERNEL = axpy.S
60-
DAXPYKERNEL = axpy.S
60+
DAXPYKERNEL = daxpy_thunderx2t99.S
61 61
CAXPYKERNEL = zaxpy.S
62 62
ZAXPYKERNEL = zaxpy.S
63 63

@@ -81,45 +81,35 @@ DGEMVTKERNEL = gemv_t.S
81 81
CGEMVTKERNEL = zgemv_t.S
82 82
ZGEMVTKERNEL = zgemv_t.S
83 83

84-
85-
SASUMKERNEL = asum.S
86-
DASUMKERNEL = asum.S
87-
CASUMKERNEL = casum.S
88-
ZASUMKERNEL = zasum.S
89-
90-
SCOPYKERNEL = copy.S
91-
DCOPYKERNEL = copy.S
92-
CCOPYKERNEL = copy.S
93-
ZCOPYKERNEL = copy.S
94-
95-
SSWAPKERNEL = swap.S
96-
DSWAPKERNEL = swap.S
97-
CSWAPKERNEL = swap.S
98-
ZSWAPKERNEL = swap.S
99-
100-
ISAMAXKERNEL = iamax.S
101-
IDAMAXKERNEL = iamax.S
102-
ICAMAXKERNEL = izamax.S
103-
IZAMAXKERNEL = izamax.S
104-
105-
SNRM2KERNEL = nrm2.S
106-
DNRM2KERNEL = nrm2.S
107-
CNRM2KERNEL = znrm2.S
108-
ZNRM2KERNEL = znrm2.S
109-
110-
DDOTKERNEL = dot.S
111-
ifneq ($(C_COMPILER), PGI)
112-
SDOTKERNEL = ../generic/dot.c
113-
else
114-
SDOTKERNEL = dot.S
115-
endif
116-
ifneq ($(C_COMPILER), PGI)
117-
CDOTKERNEL = zdot.S
118-
ZDOTKERNEL = zdot.S
119-
else
120-
CDOTKERNEL = ../arm/zdot.c
121-
ZDOTKERNEL = ../arm/zdot.c
122-
endif
84+
SASUMKERNEL = sasum_thunderx2t99.c
85+
DASUMKERNEL = dasum_thunderx2t99.c
86+
CASUMKERNEL = casum_thunderx2t99.c
87+
ZASUMKERNEL = zasum_thunderx2t99.c
88+
89+
SCOPYKERNEL = copy_thunderx2t99.c
90+
DCOPYKERNEL = copy_thunderx2t99.c
91+
CCOPYKERNEL = copy_thunderx2t99.c
92+
ZCOPYKERNEL = copy_thunderx2t99.c
93+
94+
SSWAPKERNEL = swap_thunderx2t99.S
95+
DSWAPKERNEL = swap_thunderx2t99.S
96+
CSWAPKERNEL = swap_thunderx2t99.S
97+
ZSWAPKERNEL = swap_thunderx2t99.S
98+
99+
ISAMAXKERNEL = iamax_thunderx2t99.c
100+
IDAMAXKERNEL = iamax_thunderx2t99.c
101+
ICAMAXKERNEL = izamax_thunderx2t99.c
102+
IZAMAXKERNEL = izamax_thunderx2t99.c
103+
104+
SNRM2KERNEL = scnrm2_thunderx2t99.c
105+
DNRM2KERNEL = dznrm2_thunderx2t99.c
106+
CNRM2KERNEL = scnrm2_thunderx2t99.c
107+
ZNRM2KERNEL = dznrm2_thunderx2t99.c
108+
109+
DDOTKERNEL = dot.c
110+
SDOTKERNEL = dot.c
111+
CDOTKERNEL = zdot_thunderx2t99.c
112+
ZDOTKERNEL = zdot_thunderx2t99.c
123 113
DSDOTKERNEL = dot.S
124 114

125 115
DGEMM_BETA = dgemm_beta.S
@@ -128,10 +118,10 @@ SGEMM_BETA = sgemm_beta.S
128 118
SGEMMKERNEL = sgemm_kernel_sve_v2x$(SGEMM_UNROLL_N).S
129 119
STRMMKERNEL = strmm_kernel_sve_v1x$(SGEMM_UNROLL_N).S
130 120

131-
SGEMMINCOPY = sgemm_ncopy_sve_v1.c
132-
SGEMMITCOPY = sgemm_tcopy_sve_v1.c
133-
SGEMMONCOPY = sgemm_ncopy_$(DGEMM_UNROLL_N).S
134-
SGEMMOTCOPY = sgemm_tcopy_$(DGEMM_UNROLL_N).S
121+
SGEMMINCOPY = gemm_ncopy_sve_v1x$(SGEMM_UNROLL_N).c
122+
SGEMMITCOPY = gemm_tcopy_sve_v1x$(SGEMM_UNROLL_N).c
123+
SGEMMONCOPY = sgemm_ncopy_$(SGEMM_UNROLL_N).S
124+
SGEMMOTCOPY = sgemm_tcopy_$(SGEMM_UNROLL_N).S
135 125

136 126
SGEMMINCOPYOBJ = sgemm_incopy$(TSUFFIX).$(SUFFIX)
137 127
SGEMMITCOPYOBJ = sgemm_itcopy$(TSUFFIX).$(SUFFIX)
@@ -149,8 +139,8 @@ SSYMMLCOPY_M = symm_lcopy_sve.c
149 139
DGEMMKERNEL = dgemm_kernel_sve_v2x$(DGEMM_UNROLL_N).S
150 140
DTRMMKERNEL = dtrmm_kernel_sve_v1x$(DGEMM_UNROLL_N).S
151 141

152-
DGEMMINCOPY = dgemm_ncopy_sve_v1.c
153-
DGEMMITCOPY = dgemm_tcopy_sve_v1.c
142+
DGEMMINCOPY = gemm_ncopy_sve_v1x$(DGEMM_UNROLL_N).c
143+
DGEMMITCOPY = gemm_tcopy_sve_v1x$(DGEMM_UNROLL_N).c
154 144
DGEMMONCOPY = dgemm_ncopy_$(DGEMM_UNROLL_N).S
155 145
DGEMMOTCOPY = dgemm_tcopy_$(DGEMM_UNROLL_N).S
156 146

@@ -170,8 +160,8 @@ DSYMMLCOPY_M = symm_lcopy_sve.c
170 160
CGEMMKERNEL = cgemm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
171 161
CTRMMKERNEL = ctrmm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
172 162

173-
CGEMMINCOPY = cgemm_ncopy_sve_v1.c
174-
CGEMMITCOPY = cgemm_tcopy_sve_v1.c
163+
CGEMMINCOPY = gemm_ncopy_complex_sve_v1x$(ZGEMM_UNROLL_N).c
164+
CGEMMITCOPY = gemm_tcopy_complex_sve_v1x$(ZGEMM_UNROLL_N).c
175 165
CGEMMONCOPY = ../generic/zgemm_ncopy_$(ZGEMM_UNROLL_N).c
176 166
CGEMMOTCOPY = ../generic/zgemm_tcopy_$(ZGEMM_UNROLL_N).c
177 167

@@ -194,8 +184,8 @@ CSYMMLCOPY_M = zsymm_lcopy_sve.c
194 184
ZGEMMKERNEL = zgemm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
195 185
ZTRMMKERNEL = ztrmm_kernel_sve_v1x$(ZGEMM_UNROLL_N).S
196 186

197-
ZGEMMINCOPY = zgemm_ncopy_sve_v1.c
198-
ZGEMMITCOPY = zgemm_tcopy_sve_v1.c
187+
ZGEMMINCOPY = gemm_ncopy_complex_sve_v1x$(ZGEMM_UNROLL_N).c
188+
ZGEMMITCOPY = gemm_tcopy_complex_sve_v1x$(ZGEMM_UNROLL_N).c
199 189
ZGEMMONCOPY = ../generic/zgemm_ncopy_$(ZGEMM_UNROLL_N).c
200 190
ZGEMMOTCOPY = ../generic/zgemm_tcopy_$(ZGEMM_UNROLL_N).c
201 191

0 commit comments

Comments
 (0)