Skip to content

Commit bd4c032

Browse files
authored
Update sgemm_kernel_8x4_haswell.c
1 parent 9dc9b7b commit bd4c032

File tree

1 file changed

+8
-8
lines changed

1 file changed

+8
-8
lines changed

kernel/x86_64/sgemm_kernel_8x4_haswell.c

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -9,7 +9,7 @@
99
#define mult_alpha(acc,alpha,...) "vfmadd213ps ("#__VA_ARGS__"),"#alpha","#acc";"
1010
#endif
1111

12-
#if defined TRMMKERNEL && !defined LEFT
12+
#if defined(TRMMKERNEL) && !defined(LEFT)
1313
#ifdef TRANSA
1414
#define HEAD_SET_OFFSET(ndim) {}
1515
#define TAIL_SET_OFFSET(ndim) {off+=ndim;}
@@ -22,7 +22,7 @@
2222
#define TAIL_SET_OFFSET(ndim) {}
2323
#endif
2424

25-
#if defined TRMMKERNEL && defined LEFT
25+
#if defined(TRMMKERNEL) && defined(LEFT)
2626
#ifdef TRANSA
2727
#define init_update_kskip(val) "subq $"#val",%%r13;"
2828
#define save_update_kskip(val) ""
@@ -37,7 +37,7 @@
3737

3838
#ifdef TRMMKERNEL
3939
#define init_set_k "movq %%r12,%4; subq %%r13,%4;"
40-
#if (defined LEFT && !defined TRANSA) || (!defined LEFT && defined TRANSA)
40+
#if (defined(LEFT) && !defined(TRANSA)) || (!defined(LEFT) && defined(TRANSA))
4141
#define INIT_SET_KSKIP "movq %9,%%r13; salq $2,%%r13;"
4242
#define init_set_pointers(a_copy,b_copy) "leaq (%0,%%r13,"#a_copy"),%0; leaq (%1,%%r13,"#b_copy"),%1;"
4343
#define save_set_pointers(a_copy,b_copy) ""
@@ -63,7 +63,7 @@
6363
#define save_set_pa_pb_n2(mdim) save_set_pointers(mdim,2)
6464
#define save_set_pa_pb_n1(mdim) save_set_pointers(mdim,1)
6565

66-
#if defined TRMMKERNEL && !defined LEFT && defined TRANSA
66+
#if defined(TRMMKERNEL) && !defined(LEFT) && defined(TRANSA)
6767
#define kernel_kstart_n8(mdim) \
6868
KERNEL_k1m##mdim##n4 KERNEL_k1m##mdim##n4 KERNEL_k1m##mdim##n4 KERNEL_k1m##mdim##n4 "subq $16,%4;"
6969
#define kernel_kstart_n12(mdim) \
@@ -109,7 +109,7 @@
109109
unit_kernel_k1m8n4(%%ymm4,%%ymm5,%%ymm6,%%ymm7,16,24,%1)\
110110
unit_kernel_k1m8n4(%%ymm8,%%ymm9,%%ymm10,%%ymm11,16,24,%1,%%r12,4)\
111111
unit_kernel_k1m8n4(%%ymm12,%%ymm13,%%ymm14,%%ymm15,16,24,%1,%%r12,8) "addq $32,%1;"
112-
#if defined TRMMKERNEL && !defined LEFT && !defined TRANSA
112+
#if defined(TRMMKERNEL) && !defined(LEFT) && !defined(TRANSA)
113113
#define unit_kernel_endn4_k1m8n8(offa1,offb1,offb2) \
114114
"vmovsldup "#offa1"(%0),%%ymm1; vmovshdup "#offa1"(%0),%%ymm2;"\
115115
unit_kernel_k1m8n4(%%ymm8,%%ymm9,%%ymm10,%%ymm11,offb1,offb2,%1,%%r12,4)
@@ -192,7 +192,7 @@
192192
#define KERNEL_k1m4n8 KERNEL_h_k1m4n8 "addq $16,%1;"
193193
#define KERNEL_h_k1m4n12 KERNEL_h_k1m4n8 unit_kernel_k1m4n4(%%xmm12,%%xmm13,%%xmm14,%%xmm15,0,8,%1,%%r12,8)
194194
#define KERNEL_k1m4n12 KERNEL_h_k1m4n12 "addq $16,%1;"
195-
#if defined TRMMKERNEL && !defined LEFT && !defined TRANSA
195+
#if defined(TRMMKERNEL) && !defined(LEFT) && !defined(TRANSA)
196196
#define unit_kernel_endn4_k1m4n8(offa1,offb1,offb2) \
197197
"vmovsldup "#offa1"(%0),%%xmm1; vmovshdup "#offa1"(%0),%%xmm2;"\
198198
unit_kernel_k1m4n4(%%xmm8,%%xmm9,%%xmm10,%%xmm11,offb1,offb2,%1,%%r12,4)
@@ -285,7 +285,7 @@
285285
"vbroadcastss (%0),%%xmm10; vfmadd231ps %%xmm3,%%xmm10,%%xmm4; vfmadd231ps %%xmm2,%%xmm10,%%xmm6; vfmadd231ps %%xmm1,%%xmm10,%%xmm8;"\
286286
"vbroadcastss 4(%0),%%xmm10; vfmadd231ps %%xmm3,%%xmm10,%%xmm5; vfmadd231ps %%xmm2,%%xmm10,%%xmm7; vfmadd231ps %%xmm1,%%xmm10,%%xmm9;"\
287287
"addq $8,%0;"
288-
#if defined TRMMKERNEL && !defined LEFT && !defined TRANSA
288+
#if defined(TRMMKERNEL) && !defined(LEFT) && !defined(TRANSA)
289289
#define unit_kernel_endn4_k1m2n8(aoff1,aoff2,boff) \
290290
"vmovups "#boff"(%1,%%r12,4),%%xmm3;"\
291291
"vbroadcastss "#aoff1"(%0),%%xmm1; vfmadd231ps %%xmm3,%%xmm1,%%xmm6;"\
@@ -379,7 +379,7 @@
379379
"vmovups (%1),%%xmm3; vmovups (%1,%%r12,4),%%xmm2; vmovups (%1,%%r12,8),%%xmm1; addq $16,%1;"\
380380
"vbroadcastss (%0),%%xmm10; vfmadd231ps %%xmm3,%%xmm10,%%xmm4; vfmadd231ps %%xmm2,%%xmm10,%%xmm5; vfmadd231ps %%xmm1,%%xmm10,%%xmm6;"\
381381
"addq $4,%0;"
382-
#if defined TRMMKERNEL && !defined LEFT && !defined TRANSA
382+
#if defined(TRMMKERNEL) && !defined(LEFT) && !defined(TRANSA)
383383
#define unit_kernel_endn4_k1m1n8(aoff,boff) \
384384
"vmovups "#boff"(%1,%%r12,4),%%xmm3;"\
385385
"vbroadcastss "#aoff"(%0),%%xmm1; vfmadd231ps %%xmm3,%%xmm1,%%xmm5;"

0 commit comments

Comments (0)