Browse Source

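Rename HALF -> BFLOAT16 in the remaining places: the level3 GEMM drivers (level3.c, level3_thread.c), lapack/CMakeLists.txt, and lapack/potrf/potrf_parallel.c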

pull/5362/head
Chris Sidebottom 2 months ago
parent
commit
7a97c4ca97
4 changed files with 7 additions and 5 deletions
  1. +2
    -1
      driver/level3/level3.c
  2. +2
    -2
      driver/level3/level3_thread.c
  3. +1
    -1
      lapack/CMakeLists.txt
  4. +2
    -1
      lapack/potrf/potrf_parallel.c

+ 2
- 1
driver/level3/level3.c View File

@@ -1,5 +1,6 @@
/*********************************************************************/ /*********************************************************************/
/* Copyright 2009, 2010 The University of Texas at Austin. */ /* Copyright 2009, 2010 The University of Texas at Austin. */
/* Copyright 2025 The OpenBLAS Project. */
/* All rights reserved. */ /* All rights reserved. */
/* */ /* */
/* Redistribution and use in source and binary forms, with or */ /* Redistribution and use in source and binary forms, with or */
@@ -305,7 +306,7 @@ int CNAME(blas_arg_t *args, BLASLONG *range_m, BLASLONG *range_n,
} }


BLASLONG pad_min_l = min_l; BLASLONG pad_min_l = min_l;
#if defined(HALF)
#if defined(BFLOAT16)
#if defined(DYNAMIC_ARCH) #if defined(DYNAMIC_ARCH)
pad_min_l = (min_l + gotoblas->sbgemm_align_k - 1) & ~(gotoblas->sbgemm_align_k-1); pad_min_l = (min_l + gotoblas->sbgemm_align_k - 1) & ~(gotoblas->sbgemm_align_k-1);
#else #else


+ 2
- 2
driver/level3/level3_thread.c View File

@@ -1,6 +1,6 @@
/*********************************************************************/ /*********************************************************************/
/* Copyright 2009, 2010 The University of Texas at Austin. */ /* Copyright 2009, 2010 The University of Texas at Austin. */
/* Copyright 2023 The OpenBLAS Project. */
/* Copyright 2023, 2025 The OpenBLAS Project. */
/* All rights reserved. */ /* All rights reserved. */
/* */ /* */
/* Redistribution and use in source and binary forms, with or */ /* Redistribution and use in source and binary forms, with or */
@@ -324,7 +324,7 @@ static int inner_thread(blas_arg_t *args, BLASLONG *range_m, BLASLONG *range_n,
BLASLONG pad_min_l = min_l; BLASLONG pad_min_l = min_l;


#if defined(HALF)
#if defined(BFLOAT16)
#if defined(DYNAMIC_ARCH) #if defined(DYNAMIC_ARCH)
pad_min_l = (min_l + gotoblas->sbgemm_align_k - 1) & ~(gotoblas->sbgemm_align_k-1); pad_min_l = (min_l + gotoblas->sbgemm_align_k - 1) & ~(gotoblas->sbgemm_align_k-1);
#else #else


+ 1
- 1
lapack/CMakeLists.txt View File

@@ -52,7 +52,7 @@ GenerateNamedObjects("laswp/generic/laswp_k_4.c" "" "laswp_plus" false "" "" fa
GenerateNamedObjects("laswp/generic/laswp_k_4.c" "MINUS" "laswp_minus" false "" "" false 3) GenerateNamedObjects("laswp/generic/laswp_k_4.c" "MINUS" "laswp_minus" false "" "" false 3)


foreach (float_type ${FLOAT_TYPES}) foreach (float_type ${FLOAT_TYPES})
if (${float_type} STREQUAL "HALF")
if (${float_type} STREQUAL "BFLOAT16")
continue() continue()
endif() endif()
GenerateNamedObjects("getrf/getrf_single.c" "UNIT" "getrf_single" false "" "" false ${float_type}) GenerateNamedObjects("getrf/getrf_single.c" "UNIT" "getrf_single" false "" "" false ${float_type})


+ 2
- 1
lapack/potrf/potrf_parallel.c View File

@@ -1,5 +1,6 @@
/*********************************************************************/ /*********************************************************************/
/* Copyright 2009, 2010 The University of Texas at Austin. */ /* Copyright 2009, 2010 The University of Texas at Austin. */
/* Copyright 2025 The OpenBLAS Project. */
/* All rights reserved. */ /* All rights reserved. */
/* */ /* */
/* Redistribution and use in source and binary forms, with or */ /* Redistribution and use in source and binary forms, with or */
@@ -405,7 +406,7 @@ static int thread_driver(blas_arg_t *args, FLOAT *sa, FLOAT *sb){
#elif defined(DOUBLE) #elif defined(DOUBLE)
mode = BLAS_DOUBLE | BLAS_REAL; mode = BLAS_DOUBLE | BLAS_REAL;
mask = MAX(DGEMM_UNROLL_M, DGEMM_UNROLL_N) - 1; mask = MAX(DGEMM_UNROLL_M, DGEMM_UNROLL_N) - 1;
#elif defined(HALF)
#elif defined(BFLOAT16)
mode = BLAS_HALF | BLAS_REAL; mode = BLAS_HALF | BLAS_REAL;
mask = MAX(SBGEMM_UNROLL_M, SBGEMM_UNROLL_N) - 1; mask = MAX(SBGEMM_UNROLL_M, SBGEMM_UNROLL_N) - 1;
#else #else


Loading…
Cancel
Save