Browse Source

Optimized trmm kernels for CORTEXA57

tags/v0.2.16.rc1
Ashwin Sekhar T K 10 years ago
parent
commit
c99c43d51e
5 changed files with 6321 additions and 4 deletions
  1. +4
    -4
      kernel/arm64/KERNEL.CORTEXA57
  2. +1621
    -0
      kernel/arm64/ctrmm_kernel_4x4.S
  3. +1398
    -0
      kernel/arm64/dtrmm_kernel_4x4.S
  4. +1405
    -0
      kernel/arm64/strmm_kernel_4x4.S
  5. +1893
    -0
      kernel/arm64/ztrmm_kernel_4x4.S

+ 4
- 4
kernel/arm64/KERNEL.CORTEXA57 View File

@@ -60,10 +60,10 @@ DGEMVTKERNEL = gemv_t.S
CGEMVTKERNEL = zgemv_t.S
ZGEMVTKERNEL = zgemv_t.S

-STRMMKERNEL = ../generic/trmmkernel_4x4.c
-DTRMMKERNEL = ../generic/trmmkernel_4x4.c
-CTRMMKERNEL = ../generic/ztrmmkernel_4x4.c
-ZTRMMKERNEL = ../generic/ztrmmkernel_4x4.c
+STRMMKERNEL = strmm_kernel_4x4.S
+DTRMMKERNEL = dtrmm_kernel_4x4.S
+CTRMMKERNEL = ctrmm_kernel_4x4.S
+ZTRMMKERNEL = ztrmm_kernel_4x4.S

SGEMMKERNEL = sgemm_kernel_4x4.S
SGEMMONCOPY = ../generic/gemm_ncopy_4.c


+ 1621
- 0
kernel/arm64/ctrmm_kernel_4x4.S
File diff suppressed because it is too large
View File


+ 1398
- 0
kernel/arm64/dtrmm_kernel_4x4.S
File diff suppressed because it is too large
View File


+ 1405
- 0
kernel/arm64/strmm_kernel_4x4.S
File diff suppressed because it is too large
View File


+ 1893
- 0
kernel/arm64/ztrmm_kernel_4x4.S
File diff suppressed because it is too large
View File


Loading…
Cancel
Save