You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

zherk_k.c 5.0 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158
/*********************************************************************/
/* Copyright 2009, 2010 The University of Texas at Austin. */
/* All rights reserved. */
/* */
/* Redistribution and use in source and binary forms, with or */
/* without modification, are permitted provided that the following */
/* conditions are met: */
/* */
/* 1. Redistributions of source code must retain the above */
/* copyright notice, this list of conditions and the following */
/* disclaimer. */
/* */
/* 2. Redistributions in binary form must reproduce the above */
/* copyright notice, this list of conditions and the following */
/* disclaimer in the documentation and/or other materials */
/* provided with the distribution. */
/* */
/* THIS SOFTWARE IS PROVIDED BY THE UNIVERSITY OF TEXAS AT */
/* AUSTIN ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, */
/* INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF */
/* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE */
/* DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY OF TEXAS AT */
/* AUSTIN OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, */
/* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES */
/* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE */
/* GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR */
/* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF */
/* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT */
/* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT */
/* OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE */
/* POSSIBILITY OF SUCH DAMAGE. */
/* */
/* The views and conclusions contained in the software and */
/* documentation are those of the authors and should not be */
/* interpreted as representing official policies, either expressed */
/* or implied, of The University of Texas at Austin. */
/*********************************************************************/
  38. #include <stdio.h>
  39. #include "common.h"
  40. #ifndef LOWER
  41. #ifndef CONJ
  42. #ifdef XDOUBLE
  43. #define KERNEL_FUNC xherk_kernel_UN
  44. #elif defined(DOUBLE)
  45. #define KERNEL_FUNC zherk_kernel_UN
  46. #else
  47. #define KERNEL_FUNC cherk_kernel_UN
  48. #endif
  49. #else
  50. #ifdef XDOUBLE
  51. #define KERNEL_FUNC xherk_kernel_UC
  52. #elif defined(DOUBLE)
  53. #define KERNEL_FUNC zherk_kernel_UC
  54. #else
  55. #define KERNEL_FUNC cherk_kernel_UC
  56. #endif
  57. #endif
  58. #else
  59. #ifndef CONJ
  60. #ifdef XDOUBLE
  61. #define KERNEL_FUNC xherk_kernel_LN
  62. #elif defined(DOUBLE)
  63. #define KERNEL_FUNC zherk_kernel_LN
  64. #else
  65. #define KERNEL_FUNC cherk_kernel_LN
  66. #endif
  67. #else
  68. #ifdef XDOUBLE
  69. #define KERNEL_FUNC xherk_kernel_LC
  70. #elif defined(DOUBLE)
  71. #define KERNEL_FUNC zherk_kernel_LC
  72. #else
  73. #define KERNEL_FUNC cherk_kernel_LC
  74. #endif
  75. #endif
  76. #endif
  77. #define KERNEL_OPERATION(M, N, K, ALPHA, SA, SB, C, LDC, X, Y) \
  78. KERNEL_FUNC(M, N, K, ALPHA[0], SA, SB, (FLOAT *)(C) + ((X) + (Y) * LDC) * COMPSIZE, LDC, (X) - (Y))
  79. #if !defined(LOWER) && !defined(TRANS)
  80. #define SYRK_LOCAL HERK_UN
  81. #elif !defined(LOWER) && defined(TRANS)
  82. #define SYRK_LOCAL HERK_UC
  83. #elif defined(LOWER) && !defined(TRANS)
  84. #define SYRK_LOCAL HERK_LN
  85. #else
  86. #define SYRK_LOCAL HERK_LC
  87. #endif
  88. #undef SCAL_K
  89. #ifdef XDOUBLE
  90. #define SCAL_K QSCAL_K
  91. #elif defined(DOUBLE)
  92. #define SCAL_K DSCAL_K
  93. #else
  94. #define SCAL_K SSCAL_K
  95. #endif
  96. static inline int syrk_beta(BLASLONG m_from, BLASLONG m_to, BLASLONG n_from, BLASLONG n_to, FLOAT *alpha, FLOAT *c, BLASLONG ldc) {
  97. BLASLONG i;
  98. #ifndef LOWER
  99. if (m_from > n_from) n_from = m_from;
  100. if (m_to > n_to ) m_to = n_to;
  101. #else
  102. if (m_from < n_from) m_from = n_from;
  103. if (m_to < n_to ) n_to = m_to;
  104. #endif
  105. c += (m_from + n_from * ldc) * COMPSIZE;
  106. m_to -= m_from;
  107. n_to -= n_from;
  108. for (i = 0; i < n_to; i++){
  109. #ifndef LOWER
  110. SCAL_K(MIN(i + n_from - m_from + 1, m_to) * COMPSIZE, 0, 0, alpha[0], c, 1, NULL, 0, NULL, 0);
  111. if (i + n_from - m_from + 1 <= m_to)
  112. *(c + (i + n_from - m_from) * COMPSIZE + 1) = ZERO;
  113. c += ldc * COMPSIZE;
  114. #else
  115. SCAL_K(MIN(m_to - i + m_from - n_from, m_to) * COMPSIZE, 0, 0, alpha[0], c, 1, NULL, 0, NULL, 0);
  116. if (i < m_from - n_from) {
  117. c += ldc * COMPSIZE;
  118. } else {
  119. *(c + 1) = ZERO;
  120. c += (1 + ldc) * COMPSIZE;
  121. }
  122. #endif
  123. }
  124. return 0;
  125. }
  126. #ifdef THREADED_LEVEL3
  127. #include "level3_syrk_threaded.c"
  128. #else
  129. #include "level3_syrk.c"
  130. #endif