Skip to content

Commit 9b19e9e

Browse files
authored
Update dgemm_kernel_8x8_skylakex.c
1 parent 6bd67dd commit 9b19e9e

File tree

1 file changed

+6
-4
lines changed

1 file changed

+6
-4
lines changed

kernel/x86_64/dgemm_kernel_8x8_skylakex.c

Lines changed: 6 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -429,7 +429,8 @@ static void KERNEL_MAIN(double *packed_a, double *packed_b, BLASLONG m, BLASLONG
429 429
double *c_pointer = c;
430 430
__mmask16 k01 = 0x00f0,k02 = 0x000f,k03 = 0x0033;
431 431
BLASLONG ndiv8_count;
432-
double *b_scratch = (double *)aligned_alloc(64,192*k);
432+
double *b_scratch;
433+
posix_memalign(&b_scratch,64,192*k);
433 434
double *packed_b_pointer = packed_b;
434 435
a_block_pointer = packed_a;
435 436
for(ndiv8_count=ndiv8;ndiv8_count>2;ndiv8_count-=3){
@@ -637,9 +638,10 @@ static void KERNEL_MAIN(double *packed_a, double *packed_b, BLASLONG m, BLASLONG
637 638
c_pointer ++;\
638 639
}
639 640
#define SAVE_m1n4 {\
640-
*c_pointer += _mm256_cvtsd_f64(yc1);\
641-
ya1 = _mm256_unpackhi_pd(yc1,yc1);\
642-
c_pointer[LDC] += _mm256_cvtsd_f64(ya1);\
641+
xb1 = _mm256_extractf128_pd(yc1,0);\
642+
*c_pointer += _mm_cvtsd_f64(xb1);\
643+
xb2 = _mm_unpackhi_pd(xb1,xb1);\
644+
c_pointer[LDC] += _mm_cvtsd_f64(xb2);\
643 645
xb1 = _mm256_extractf128_pd(yc1,1);\
644 646
c_pointer[LDC*2] += _mm_cvtsd_f64(xb1);\
645 647
xb2 = _mm_unpackhi_pd(xb1,xb1);\

0 commit comments

Comments
 (0)