You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

sbgemm_beta_neoversen2.c 3.4 kB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283
  /***************************************************************************
   * Copyright (c) 2022, The OpenBLAS Project
   * All rights reserved.
   * Redistribution and use in source and binary forms, with or without
   * modification, are permitted provided that the following conditions are
   * met:
   * 1. Redistributions of source code must retain the above copyright
   * notice, this list of conditions and the following disclaimer.
   * 2. Redistributions in binary form must reproduce the above copyright
   * notice, this list of conditions and the following disclaimer in
   * the documentation and/or other materials provided with the
   * distribution.
   * 3. Neither the name of the OpenBLAS project nor the names of
   * its contributors may be used to endorse or promote products
   * derived from this software without specific prior written permission.
   * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
   * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
   * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
   * ARE DISCLAIMED. IN NO EVENT SHALL THE OPENBLAS PROJECT OR CONTRIBUTORS BE
   * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
   * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
   * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
   * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
   * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
   * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
   * POSSIBILITY OF SUCH DAMAGE.
   * *****************************************************************************/
  28. #include "common.h"
  29. int CNAME(BLASLONG m, BLASLONG n, BLASLONG dummy1, FLOAT beta, IFLOAT *dummy2,
  30. BLASLONG dummy3, IFLOAT *dummy4, BLASLONG dummy5, FLOAT *c,
  31. BLASLONG ldc) {
  32. BLASLONG i, j;
  33. BLASLONG chunk, remain;
  34. FLOAT *c_offset1, *c_offset;
  35. c_offset = c;
  36. chunk = m >> 3;
  37. remain = m & 7;
  38. if (beta == ZERO) {
  39. for (j = n; j > 0; j--) {
  40. c_offset1 = c_offset;
  41. c_offset += ldc;
  42. for (i = chunk; i > 0; i--) {
  43. *(c_offset1 + 0) = ZERO;
  44. *(c_offset1 + 1) = ZERO;
  45. *(c_offset1 + 2) = ZERO;
  46. *(c_offset1 + 3) = ZERO;
  47. *(c_offset1 + 4) = ZERO;
  48. *(c_offset1 + 5) = ZERO;
  49. *(c_offset1 + 6) = ZERO;
  50. *(c_offset1 + 7) = ZERO;
  51. c_offset1 += 8;
  52. }
  53. for (i = remain; i > 0; i--) {
  54. *c_offset1 = ZERO;
  55. c_offset1++;
  56. }
  57. }
  58. } else {
  59. for (j = n; j > 0; j--) {
  60. c_offset1 = c_offset;
  61. c_offset += ldc;
  62. for (i = chunk; i > 0; i--) {
  63. *(c_offset1 + 0) *= beta;
  64. *(c_offset1 + 1) *= beta;
  65. *(c_offset1 + 2) *= beta;
  66. *(c_offset1 + 3) *= beta;
  67. *(c_offset1 + 4) *= beta;
  68. *(c_offset1 + 5) *= beta;
  69. *(c_offset1 + 6) *= beta;
  70. *(c_offset1 + 7) *= beta;
  71. c_offset1 += 8;
  72. }
  73. for (i = remain; i > 0; i--) {
  74. *c_offset1 *= beta;
  75. c_offset1++;
  76. }
  77. }
  78. }
  79. return 0;
  80. };