Skip to content

Commit 4e466d7

Browse files
authored
Merge pull request #15 from xianyi/develop
rebase
2 parents: ccc28c6 + 4c6a457; commit: 4e466d7

File tree

10 files changed

+962
-134
lines changed

10 files changed

+962
-134
lines changed

common_power.h

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -241,7 +241,7 @@ static inline int blas_quickdivide(blasint x, blasint y){
241241
#define HAVE_PREFETCH
242242
#endif
243243

244-
#if defined(POWER3) || defined(POWER6) || defined(PPCG4) || defined(CELL) || defined(POWER8) || defined(POWER9) || ( defined(PPC970) && ( defined(OS_DARWIN) || defined(OS_FREEBSD) ) )
244+
#if defined(POWER3) || defined(POWER6) || defined(PPCG4) || defined(CELL) || defined(POWER8) || defined(POWER9) || defined(PPC970)
245245
#define DCBT_ARG 0
246246
#else
247247
#define DCBT_ARG 8

kernel/arm64/KERNEL.ARMV8

Lines changed: 0 additions & 36 deletions
Original file line number | Diff line number | Diff line change
@@ -91,51 +91,17 @@ IDAMAXKERNEL = iamax.S
9191
ICAMAXKERNEL = izamax.S
9292
IZAMAXKERNEL = izamax.S
9393

94-
ifneq ($(OS_DARWIN)$(CROSS),11)
9594
SNRM2KERNEL = nrm2.S
9695
DNRM2KERNEL = nrm2.S
9796
CNRM2KERNEL = znrm2.S
9897
ZNRM2KERNEL = znrm2.S
99-
endif
10098

10199
DDOTKERNEL = dot.S
102100
SDOTKERNEL = dot.S
103101
CDOTKERNEL = zdot.S
104102
ZDOTKERNEL = zdot.S
105103
DSDOTKERNEL = dot.S
106104

107-
ifeq ($(OS_DARWIN)$(CROSS),11)
108-
109-
STRMMKERNEL = ../generic/trmmkernel_2x2.c
110-
DTRMMKERNEL = ../generic/trmmkernel_2x2.c
111-
CTRMMKERNEL = ../generic/ztrmmkernel_2x2.c
112-
ZTRMMKERNEL = ../generic/ztrmmkernel_2x2.c
113-
114-
SGEMMKERNEL = ../generic/gemmkernel_2x2.c
115-
SGEMMONCOPY = ../generic/gemm_ncopy_2.c
116-
SGEMMOTCOPY = ../generic/gemm_tcopy_2.c
117-
SGEMMONCOPYOBJ = sgemm_oncopy$(TSUFFIX).$(SUFFIX)
118-
SGEMMOTCOPYOBJ = sgemm_otcopy$(TSUFFIX).$(SUFFIX)
119-
120-
DGEMMKERNEL = ../generic/gemmkernel_2x2.c
121-
DGEMMONCOPY = ../generic/gemm_ncopy_2.c
122-
DGEMMOTCOPY = ../generic/gemm_tcopy_2.c
123-
DGEMMONCOPYOBJ = dgemm_oncopy$(TSUFFIX).$(SUFFIX)
124-
DGEMMOTCOPYOBJ = dgemm_otcopy$(TSUFFIX).$(SUFFIX)
125-
126-
CGEMMKERNEL = ../generic/zgemmkernel_2x2.c
127-
CGEMMONCOPY = ../generic/zgemm_ncopy_2.c
128-
CGEMMOTCOPY = ../generic/zgemm_tcopy_2.c
129-
CGEMMONCOPYOBJ = cgemm_oncopy$(TSUFFIX).$(SUFFIX)
130-
CGEMMOTCOPYOBJ = cgemm_otcopy$(TSUFFIX).$(SUFFIX)
131-
132-
ZGEMMKERNEL = ../generic/zgemmkernel_2x2.c
133-
ZGEMMONCOPY = ../generic/zgemm_ncopy_2.c
134-
ZGEMMOTCOPY = ../generic/zgemm_tcopy_2.c
135-
ZGEMMONCOPYOBJ = zgemm_oncopy$(TSUFFIX).$(SUFFIX)
136-
ZGEMMOTCOPYOBJ = zgemm_otcopy$(TSUFFIX).$(SUFFIX)
137-
138-
else
139105
SGEMMKERNEL = sgemm_kernel_$(SGEMM_UNROLL_M)x$(SGEMM_UNROLL_N).S
140106
STRMMKERNEL = strmm_kernel_$(SGEMM_UNROLL_M)x$(SGEMM_UNROLL_N).S
141107
ifneq ($(SGEMM_UNROLL_M), $(SGEMM_UNROLL_N))
@@ -202,5 +168,3 @@ ZGEMMONCOPY = ../generic/zgemm_ncopy_$(ZGEMM_UNROLL_N).c
202168
ZGEMMOTCOPY = ../generic/zgemm_tcopy_$(ZGEMM_UNROLL_N).c
203169
ZGEMMONCOPYOBJ = zgemm_oncopy$(TSUFFIX).$(SUFFIX)
204170
ZGEMMOTCOPYOBJ = zgemm_otcopy$(TSUFFIX).$(SUFFIX)
205-
206-
endif

kernel/power/idamax.c

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -324,14 +324,15 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x) {
324324

325325
if (inc_x == 1) {
326326

327+
#if defined(_CALL_ELF) && (_CALL_ELF == 2)
327328
BLASLONG n1 = n & -32;
328329
if (n1 > 0) {
329330

330331
max = diamax_kernel_32(n1, x, &maxf);
331332

332333
i = n1;
333334
}
334-
335+
#endif
335336
while (i < n) {
336337
if (ABS(x[i]) > maxf) {
337338
max = i;

kernel/power/idamin.c

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -326,13 +326,15 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x) {
326326
minf = ABS(x[0]); //index's not incremented
327327
if (inc_x == 1) {
328328

329+
#if defined(_CALL_ELF) && (_CALL_ELF == 2)
329330
BLASLONG n1 = n & -32;
330331
if (n1 > 0) {
331332

332333
min = diamin_kernel_32(n1, x, &minf);
333334
i = n1;
334335
}
335-
336+
#endif
337+
336338
while (i < n) {
337339
if (ABS(x[i]) < minf) {
338340
min = i;

kernel/power/izamax.c

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -316,13 +316,15 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x)
316316

317317
if (inc_x == 1) {
318318

319+
#if defined(_CALL_ELF) && (_CALL_ELF == 2)
319320
BLASLONG n1 = n & -16;
320321
if (n1 > 0) {
321322

322323
max = ziamax_kernel_16(n1, x, &maxf);
323324
i = n1;
324325
ix = n1 << 1;
325326
}
327+
#endif
326328

327329
while(i < n)
328330
{

kernel/power/izamin.c

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -314,14 +314,16 @@ BLASLONG CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x)
314314

315315
if (inc_x == 1) {
316316
minf = CABS1(x,0); //index will not be incremented
317+
318+
#if defined(_CALL_ELF) && (_CALL_ELF == 2)
317319
BLASLONG n1 = n & -16;
318320
if (n1 > 0) {
319321

320322
min = ziamin_kernel_16_TUNED(n1, x, &minf);
321323
i = n1;
322324
ix = n1 << 1;
323325
}
324-
326+
#endif
325327

326328
while(i < n)
327329
{

kernel/x86_64/KERNEL.SKYLAKEX

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
include $(KERNELDIR)/KERNEL.HASWELL
22

3-
SGEMMKERNEL = sgemm_kernel_16x4_skylakex.c
3+
SGEMMKERNEL = sgemm_kernel_16x4_skylakex_2.c
44

55
SGEMMINCOPY = ../generic/gemm_ncopy_16.c
66
SGEMMITCOPY = sgemm_tcopy_16_skylakex.c

0 commit comments

Comments
 (0)