Browse Source

Adapt ARM architecture

tags/v0.3.11^2
Qiyu8 5 years ago
parent
commit
60e6c68e38
4 changed files with 6 additions and 6 deletions
  1. +1
    -1
      kernel/arm64/KERNEL.ARMV8
  2. +1
    -1
      kernel/arm64/KERNEL.CORTEXA53
  3. +1
    -1
      kernel/arm64/KERNEL.CORTEXA57
  4. +3
    -3
      kernel/generic/dot.c

+ 1
- 1
kernel/arm64/KERNEL.ARMV8 View File

@@ -97,7 +97,7 @@ CNRM2KERNEL = znrm2.S
ZNRM2KERNEL = znrm2.S

DDOTKERNEL = dot.S
-SDOTKERNEL = dot.S
+SDOTKERNEL = ../generic/dot.c
CDOTKERNEL = zdot.S
ZDOTKERNEL = zdot.S
DSDOTKERNEL = dot.S


+ 1
- 1
kernel/arm64/KERNEL.CORTEXA53 View File

@@ -97,7 +97,7 @@ CNRM2KERNEL = znrm2.S
ZNRM2KERNEL = znrm2.S

DDOTKERNEL = dot.S
-SDOTKERNEL = dot.S
+SDOTKERNEL = ../generic/dot.c
CDOTKERNEL = zdot.S
ZDOTKERNEL = zdot.S
DSDOTKERNEL = dot.S


+ 1
- 1
kernel/arm64/KERNEL.CORTEXA57 View File

@@ -70,7 +70,7 @@ DCOPYKERNEL = copy.S
CCOPYKERNEL = copy.S
ZCOPYKERNEL = copy.S

-SDOTKERNEL = dot.S
+SDOTKERNEL = ../generic/dot.c
DDOTKERNEL = dot.S
CDOTKERNEL = zdot.S
ZDOTKERNEL = zdot.S


+ 3
- 3
kernel/generic/dot.c View File

@@ -27,7 +27,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.


#include "common.h"
#include "../simd/intrin.h"
#if defined(DSDOT)
double CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x, FLOAT *y, BLASLONG inc_y)
#else
@@ -47,9 +47,9 @@ FLOAT CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x, FLOAT *y, BLASLONG inc_y)

if ( (inc_x == 1) && (inc_y == 1) )
{
-int n1 = n & -4;
+int n1 = n & -4;
#if V_SIMD && !defined(DSDOT)
-const int vstep = v_nlanes_f32;
+const int vstep = v_nlanes_f32;
const int unrollx4 = n & (-vstep * 4);
const int unrollx = n & -vstep;
v_f32 vsum0 = v_zero_f32();


Loading…
Cancel
Save