File tree Expand file tree Collapse file tree 5 files changed +505
-14
lines changed Expand file tree Collapse file tree 5 files changed +505
-14
lines changed Original file line number Diff line number Diff line change @@ -179,3 +179,4 @@ In chronological order:
179179 * [ 2019-11-12] AVX512 CGEMM & ZGEMM kernels
180180 * [ 2019-12-23] optimize AVX2 CGEMM and ZGEMM
181181 * [ 2019-12-30] AVX2 CGEMM3M & ZGEMM3M kernels
182+ * [ 2020-01-07] optimize AVX2 SGEMM and STRMM
Original file line number Diff line number Diff line change @@ -31,11 +31,11 @@ DAXPYKERNEL = daxpy.c
3131CAXPYKERNEL = caxpy.c
3232ZAXPYKERNEL = zaxpy.c
3333
34- STRMMKERNEL = sgemm_kernel_16x4_haswell.S
35- SGEMMKERNEL = sgemm_kernel_16x4_haswell.S
34+ STRMMKERNEL = sgemm_kernel_8x4_haswell.c
35+ SGEMMKERNEL = sgemm_kernel_8x4_haswell.c
3636SGEMM_BETA = sgemm_beta_skylakex.c
37- SGEMMINCOPY = ../generic/gemm_ncopy_16.c
38- SGEMMITCOPY = ../generic/gemm_tcopy_16.c
37+ SGEMMINCOPY = ../generic/gemm_ncopy_8.c
38+ SGEMMITCOPY = ../generic/gemm_tcopy_8.c
3939SGEMMONCOPY = sgemm_ncopy_4_skylakex.c
4040SGEMMOTCOPY = ../generic/gemm_tcopy_4.c
4141SGEMMINCOPYOBJ = sgemm_incopy$(TSUFFIX).$(SUFFIX)
Original file line number Diff line number Diff line change @@ -30,10 +30,10 @@ DAXPYKERNEL = daxpy.c
3030CAXPYKERNEL = caxpy.c
3131ZAXPYKERNEL = zaxpy.c
3232
33- STRMMKERNEL = sgemm_kernel_16x4_haswell.S
34- SGEMMKERNEL = sgemm_kernel_16x4_haswell.S
35- SGEMMINCOPY = ../generic/gemm_ncopy_16.c
36- SGEMMITCOPY = ../generic/gemm_tcopy_16.c
33+ STRMMKERNEL = sgemm_kernel_8x4_haswell.c
34+ SGEMMKERNEL = sgemm_kernel_8x4_haswell.c
35+ SGEMMINCOPY = ../generic/gemm_ncopy_8.c
36+ SGEMMITCOPY = ../generic/gemm_tcopy_8.c
3737SGEMMONCOPY = ../generic/gemm_ncopy_4.c
3838SGEMMOTCOPY = ../generic/gemm_tcopy_4.c
3939SGEMMINCOPYOBJ = sgemm_incopy$(TSUFFIX).$(SUFFIX)
You can’t perform that action at this time.
0 commit comments