Browse Source

Merge pull request #898 from wernsaar/develop

Added experimental support for optimized LAPACK Fortran functions
tags/v0.2.19^2
Werner Saar 9 years ago
parent
commit
f04af36ad0
3 changed files with 1458 additions and 342 deletions
  1. +1083
    -0
      interface/lapack/fortran/dlaqr5.f
  2. +5
    -8
      kernel/power/dtrsm_logic_LT_16x4_power8.S
  3. +370
    -334
      kernel/power/dtrsm_macros_LT_16x4_power8.S

+ 1083
- 0
interface/lapack/fortran/dlaqr5.f
File diff suppressed because it is too large
View File


+ 5
- 8
kernel/power/dtrsm_logic_LT_16x4_power8.S View File

@@ -54,29 +54,26 @@ DSTRM_LT_L4x16_LOOP_START:

/*
 * Inner loop for the 16x4 case: invokes the KERNEL_16x4 macro once per
 * count held in KK, with the loop body unrolled four times.
 *
 * NOTE(review): this text looks like a rendered diff whose +/- markers
 * were lost, so two generations of loop control appear side by side:
 *   - "addic. L, L, -1" followed by ble-/bgt+ (counting in L via CR0)
 *   - "mtctr L" followed by bdz-/bdnz+        (counting in CTR)
 * The hunk statistics (+5 / -8) match the CTR lines being the additions
 * and the addic./ble/bgt lines being the removals -- TODO confirm
 * against the repository before assembling or editing this listing.
 * As written, both counters start from the same value and step together,
 * so every exit test below agrees with its neighbour.
 *
 * AO, BO, PRE, L and KK are presumably register aliases and KERNEL_16x4
 * a macro, all defined outside this excerpt -- verify their definitions.
 */

/* L = KK + 0; the record form (trailing dot) sets CR0 from the result. */
addic. L, KK, 0
/* Nothing to do when KK <= 0; the "-" suffix hints "branch not taken". */
ble- DSTRM_LT_L4x16_SAVE
/* Load the count register with the trip count for the bdz/bdnz tests. */
mtctr L

DSTRM_LT_L4x16_LOOP:

/* Cache-touch hints for the addresses AO+PRE and BO+PRE. */
/* BO is touched only here, i.e. once per four kernel invocations. */
dcbt AO, PRE
dcbt BO, PRE
KERNEL_16x4
/* Exit test after step 1 of 4: leave once the remaining count hits zero. */
addic. L, L, -1
ble- DSTRM_LT_L4x16_SAVE
/* bdz: decrement CTR, branch if it became zero. */
bdz- DSTRM_LT_L4x16_SAVE

/* Step 2 of 4: same pattern, AO touch only. */
dcbt AO, PRE
KERNEL_16x4
addic. L, L, -1
ble- DSTRM_LT_L4x16_SAVE
bdz- DSTRM_LT_L4x16_SAVE

/* Step 3 of 4. */
dcbt AO, PRE
KERNEL_16x4
addic. L, L, -1
ble- DSTRM_LT_L4x16_SAVE
bdz- DSTRM_LT_L4x16_SAVE

/* Step 4 of 4: loop back while work remains, else fall through. */
dcbt AO, PRE
KERNEL_16x4
addic. L, L, -1
/* "+" hints "branch taken": continuing the loop is the expected case. */
bgt+ DSTRM_LT_L4x16_LOOP
/* bdnz: decrement CTR, branch if it is still non-zero. */
bdnz+ DSTRM_LT_L4x16_LOOP


DSTRM_LT_L4x16_SAVE:


+ 370
- 334
kernel/power/dtrsm_macros_LT_16x4_power8.S
File diff suppressed because it is too large
View File


Loading…
Cancel
Save