Browse Source

For the sake of Windows compatibility, use "unsigned long long" to ensure a 64-bit length ("unsigned long" is only 32 bits wide on Windows)

Signed-off-by: Wang, Long <long1.wang@intel.com>
tags/v0.3.8^2
Wang, Long 6 years ago
parent
commit
1191db1a49
2 changed files with 3 additions and 3 deletions
  1. +2
    -2
      kernel/x86_64/sgemm_kernel_16x4_skylakex.c
  2. +1
    -1
      kernel/x86_64/sgemm_kernel_16x4_skylakex_2.c

+ 2
- 2
kernel/x86_64/sgemm_kernel_16x4_skylakex.c View File

@@ -762,7 +762,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
int __attribute__ ((noinline)) int __attribute__ ((noinline))
CNAME(BLASLONG m, BLASLONG n, BLASLONG k, float alpha, float * __restrict A, float * __restrict B, float * __restrict C, BLASLONG ldc) CNAME(BLASLONG m, BLASLONG n, BLASLONG k, float alpha, float * __restrict A, float * __restrict B, float * __restrict C, BLASLONG ldc)
{ {
unsigned long M = m, N = n, K = k;
unsigned long long M = m, N = n, K = k;
if (M == 0) if (M == 0)
return 0; return 0;
if (N == 0) if (N == 0)
@@ -1639,4 +1639,4 @@ void sgemm_kernel_direct (BLASLONG M, BLASLONG N, BLASLONG K, float * __restrict
STORE_SCALAR(0, 0); STORE_SCALAR(0, 0);
} }
} }
}
}

+ 1
- 1
kernel/x86_64/sgemm_kernel_16x4_skylakex_2.c View File

@@ -452,7 +452,7 @@ CNAME(BLASLONG m, BLASLONG n, BLASLONG k, float alpha, float * __restrict__ A, f


int sgemm_kernel_direct_performant(BLASLONG M, BLASLONG N, BLASLONG K) int sgemm_kernel_direct_performant(BLASLONG M, BLASLONG N, BLASLONG K)
{ {
unsigned long mnk = M * N * K;
unsigned long long mnk = M * N * K;
/* large matrixes -> not performant */ /* large matrixes -> not performant */
if (mnk >= 28 * 512 * 512) if (mnk >= 28 * 512 * 512)
return 0; return 0;


Loading…
Cancel
Save