File tree 5 files changed +505
-14
lines changed 5 files changed +505
-14
lines changed Original file line number Diff line number Diff line change @@ -179,3 +179,4 @@ In chronological order:
179
179
* [ 2019-11-12] AVX512 CGEMM & ZGEMM kernels
180
180
* [ 2019-12-23] optimize AVX2 CGEMM and ZGEMM
181
181
* [ 2019-12-30] AVX2 CGEMM3M & ZGEMM3M kernels
182
+ * [ 2020-01-07] optimize AVX2 SGEMM and STRMM
Original file line number Diff line number Diff line change @@ -31,11 +31,11 @@ DAXPYKERNEL = daxpy.c
31
31
CAXPYKERNEL = caxpy.c
32
32
ZAXPYKERNEL = zaxpy.c
33
33
34
- STRMMKERNEL = sgemm_kernel_16x4_haswell.S
35
- SGEMMKERNEL = sgemm_kernel_16x4_haswell.S
34
+ STRMMKERNEL = sgemm_kernel_8x4_haswell.c
35
+ SGEMMKERNEL = sgemm_kernel_8x4_haswell.c
36
36
SGEMM_BETA = sgemm_beta_skylakex.c
37
- SGEMMINCOPY = ../generic/gemm_ncopy_16.c
38
- SGEMMITCOPY = ../generic/gemm_tcopy_16.c
37
+ SGEMMINCOPY = ../generic/gemm_ncopy_8.c
38
+ SGEMMITCOPY = ../generic/gemm_tcopy_8.c
39
39
SGEMMONCOPY = sgemm_ncopy_4_skylakex.c
40
40
SGEMMOTCOPY = ../generic/gemm_tcopy_4.c
41
41
SGEMMINCOPYOBJ = sgemm_incopy$(TSUFFIX).$(SUFFIX)
Original file line number Diff line number Diff line change @@ -30,10 +30,10 @@ DAXPYKERNEL = daxpy.c
30
30
CAXPYKERNEL = caxpy.c
31
31
ZAXPYKERNEL = zaxpy.c
32
32
33
- STRMMKERNEL = sgemm_kernel_16x4_haswell.S
34
- SGEMMKERNEL = sgemm_kernel_16x4_haswell.S
35
- SGEMMINCOPY = ../generic/gemm_ncopy_16.c
36
- SGEMMITCOPY = ../generic/gemm_tcopy_16.c
33
+ STRMMKERNEL = sgemm_kernel_8x4_haswell.c
34
+ SGEMMKERNEL = sgemm_kernel_8x4_haswell.c
35
+ SGEMMINCOPY = ../generic/gemm_ncopy_8.c
36
+ SGEMMITCOPY = ../generic/gemm_tcopy_8.c
37
37
SGEMMONCOPY = ../generic/gemm_ncopy_4.c
38
38
SGEMMOTCOPY = ../generic/gemm_tcopy_4.c
39
39
SGEMMINCOPYOBJ = sgemm_incopy$(TSUFFIX).$(SUFFIX)
You can’t perform that action at this time.
0 commit comments