Browse Source

Add workaround for NVIDIA HPC mishandling of the asm DOT kernels

tags/v0.3.14^2
Martin Kroeker GitHub 4 years ago
parent
commit
0f27a03607
No known key found for this signature in database GPG Key ID: 4AEE18F83AFDEB23
1 changed file with 9 additions and 0 deletions
  1. +9
    -0
      kernel/arm64/KERNEL.CORTEXA57

+ 9
- 0
kernel/arm64/KERNEL.CORTEXA57 View File

@@ -70,10 +70,19 @@ DCOPYKERNEL = copy.S
CCOPYKERNEL = copy.S
ZCOPYKERNEL = copy.S

# DOT kernel selection.
# DDOT and DSDOT always use dot.S.  The SDOT, CDOT and ZDOT sources depend on
# whether C_COMPILER is PGI.
# NOTE(review): for PGI, SDOT switches *to* dot.S while CDOT/ZDOT switch *away*
# from zdot.S to the C sources in ../arm -- confirm the SDOT direction is intended.
DDOTKERNEL = dot.S
DSDOTKERNEL = dot.S
ifeq ($(C_COMPILER), PGI)
SDOTKERNEL = dot.S
CDOTKERNEL = ../arm/zdot.c
ZDOTKERNEL = ../arm/zdot.c
else
SDOTKERNEL = ../generic/dot.c
CDOTKERNEL = zdot.S
ZDOTKERNEL = zdot.S
endif

SNRM2KERNEL = nrm2.S


Loading…
Cancel
Save