You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

KERNEL.POWER10 6.4 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225
  1. ifeq ($(__BYTE_ORDER__),__ORDER_BIG_ENDIAN__)
  2. include $(KERNELDIR)/KERNEL.POWER8
  3. else
  4. #SGEMM_BETA = ../generic/gemm_beta.c
  5. #DGEMM_BETA = ../generic/gemm_beta.c
  6. #CGEMM_BETA = ../generic/zgemm_beta.c
  7. #ZGEMM_BETA = ../generic/zgemm_beta.c
  8. SHGEMM_BETA = ../generic/gemm_beta.c
  9. SHGEMMKERNEL = shgemm_kernel_power10.c
  10. SHGEMMINCOPY = ../generic/gemm_ncopy_16.c
  11. SHGEMMITCOPY = ../generic/gemm_tcopy_16.c
  12. SHGEMMONCOPY = ../generic/gemm_ncopy_8.c
  13. SHGEMMOTCOPY = ../generic/gemm_tcopy_8.c
  14. SHGEMMINCOPYOBJ = shgemm_incopy$(TSUFFIX).$(SUFFIX)
  15. SHGEMMITCOPYOBJ = shgemm_itcopy$(TSUFFIX).$(SUFFIX)
  16. SHGEMMONCOPYOBJ = shgemm_oncopy$(TSUFFIX).$(SUFFIX)
  17. SHGEMMOTCOPYOBJ = shgemm_otcopy$(TSUFFIX).$(SUFFIX)
  18. STRMMKERNEL = sgemm_kernel_power10.c
  19. DTRMMKERNEL = dgemm_kernel_power10.c
  20. CTRMMKERNEL = cgemm_kernel_power10.S
  21. ZTRMMKERNEL = zgemm_kernel_power10.S
  22. SGEMMKERNEL = sgemm_kernel_power10.c
  23. SGEMMINCOPY = ../generic/gemm_ncopy_16.c
  24. SGEMMITCOPY = sgemm_tcopy_16_power8.S
  25. SGEMMONCOPY = ../generic/gemm_ncopy_8.c
  26. SGEMMOTCOPY = sgemm_tcopy_8_power8.S
  27. SGEMMINCOPYOBJ = sgemm_incopy$(TSUFFIX).$(SUFFIX)
  28. SGEMMITCOPYOBJ = sgemm_itcopy$(TSUFFIX).$(SUFFIX)
  29. SGEMMONCOPYOBJ = sgemm_oncopy$(TSUFFIX).$(SUFFIX)
  30. SGEMMOTCOPYOBJ = sgemm_otcopy$(TSUFFIX).$(SUFFIX)
  31. DGEMMKERNEL = dgemm_kernel_power10.c
  32. DGEMMINCOPY = ../generic/gemm_ncopy_16.c
  33. DGEMMITCOPY = dgemm_tcopy_16_power8.S
  34. DGEMMONCOPY = dgemm_ncopy_4_power8.S
  35. DGEMMOTCOPY = ../generic/gemm_tcopy_4.c
  36. DGEMMINCOPYOBJ = dgemm_incopy$(TSUFFIX).$(SUFFIX)
  37. DGEMMITCOPYOBJ = dgemm_itcopy$(TSUFFIX).$(SUFFIX)
  38. DGEMMONCOPYOBJ = dgemm_oncopy$(TSUFFIX).$(SUFFIX)
  39. DGEMMOTCOPYOBJ = dgemm_otcopy$(TSUFFIX).$(SUFFIX)
  40. CGEMMKERNEL = cgemm_kernel_power10.S
  41. CGEMMINCOPY = ../generic/zgemm_ncopy_8.c
  42. CGEMMITCOPY = ../generic/zgemm_tcopy_8.c
  43. CGEMMONCOPY = ../generic/zgemm_ncopy_4.c
  44. CGEMMOTCOPY = ../generic/zgemm_tcopy_4.c
  45. CGEMMONCOPYOBJ = cgemm_oncopy$(TSUFFIX).$(SUFFIX)
  46. CGEMMOTCOPYOBJ = cgemm_otcopy$(TSUFFIX).$(SUFFIX)
  47. CGEMMINCOPYOBJ = cgemm_incopy$(TSUFFIX).$(SUFFIX)
  48. CGEMMITCOPYOBJ = cgemm_itcopy$(TSUFFIX).$(SUFFIX)
  49. ZGEMMKERNEL = zgemm_kernel_power10.S
  50. ZGEMMONCOPY = ../generic/zgemm_ncopy_2.c
  51. ZGEMMOTCOPY = ../generic/zgemm_tcopy_2.c
  52. ZGEMMINCOPY = ../generic/zgemm_ncopy_8.c
  53. ZGEMMITCOPY = zgemm_tcopy_8_power8.S
  54. ZGEMMONCOPYOBJ = zgemm_oncopy$(TSUFFIX).$(SUFFIX)
  55. ZGEMMOTCOPYOBJ = zgemm_otcopy$(TSUFFIX).$(SUFFIX)
  56. ZGEMMINCOPYOBJ = zgemm_incopy$(TSUFFIX).$(SUFFIX)
  57. ZGEMMITCOPYOBJ = zgemm_itcopy$(TSUFFIX).$(SUFFIX)
  58. STRSMKERNEL_LN = ../generic/trsm_kernel_LN.c
  59. STRSMKERNEL_LT = ../generic/trsm_kernel_LT.c
  60. STRSMKERNEL_RN = ../generic/trsm_kernel_RN.c
  61. STRSMKERNEL_RT = ../generic/trsm_kernel_RT.c
  62. DTRSMKERNEL_LN = ../generic/trsm_kernel_LN.c
  63. DTRSMKERNEL_LT = dtrsm_kernel_LT_16x4_power8.S
  64. DTRSMKERNEL_RN = ../generic/trsm_kernel_RN.c
  65. DTRSMKERNEL_RT = ../generic/trsm_kernel_RT.c
  66. CTRSMKERNEL_LN = ../generic/trsm_kernel_LN.c
  67. CTRSMKERNEL_LT = ../generic/trsm_kernel_LT.c
  68. CTRSMKERNEL_RN = ../generic/trsm_kernel_RN.c
  69. CTRSMKERNEL_RT = ../generic/trsm_kernel_RT.c
  70. ZTRSMKERNEL_LN = ../generic/trsm_kernel_LN.c
  71. ZTRSMKERNEL_LT = ../generic/trsm_kernel_LT.c
  72. ZTRSMKERNEL_RN = ../generic/trsm_kernel_RN.c
  73. ZTRSMKERNEL_RT = ../generic/trsm_kernel_RT.c
  74. #Todo: CGEMM3MKERNEL should be 4x4 blocksizes.
  75. #CGEMM3MKERNEL = zgemm3m_kernel_8x4_sse3.S
  76. #ZGEMM3MKERNEL = zgemm3m_kernel_4x4_sse3.S
  77. #Pure C for other kernels
  78. #SAMAXKERNEL = ../arm/amax.c
  79. #DAMAXKERNEL = ../arm/amax.c
  80. #CAMAXKERNEL = ../arm/zamax.c
  81. #ZAMAXKERNEL = ../arm/zamax.c
  82. #
  83. #SAMINKERNEL = ../arm/amin.c
  84. #DAMINKERNEL = ../arm/amin.c
  85. #CAMINKERNEL = ../arm/zamin.c
  86. #ZAMINKERNEL = ../arm/zamin.c
  87. #
  88. #SMAXKERNEL = ../arm/max.c
  89. #DMAXKERNEL = ../arm/max.c
  90. #
  91. #SMINKERNEL = ../arm/min.c
  92. #DMINKERNEL = ../arm/min.c
  93. #
  94. ifneq ($(GCCVERSIONGTEQ9),1)
  95. ISAMAXKERNEL = isamax_power9.S
  96. else
  97. ISAMAXKERNEL = isamax.c
  98. endif
  99. IDAMAXKERNEL = idamax.c
  100. ifneq ($(GCCVERSIONGTEQ9),1)
  101. ICAMAXKERNEL = icamax_power9.S
  102. else
  103. ICAMAXKERNEL = icamax.c
  104. endif
  105. IZAMAXKERNEL = izamax.c
  106. #
  107. ifneq ($(GCCVERSIONGTEQ9),1)
  108. ISAMINKERNEL = isamin_power9.S
  109. else
  110. ISAMINKERNEL = isamin.c
  111. endif
  112. IDAMINKERNEL = idamin.c
  113. ifneq ($(GCCVERSIONGTEQ9),1)
  114. ICAMINKERNEL = icamin_power9.S
  115. else
  116. ICAMINKERNEL = icamin.c
  117. endif
  118. IZAMINKERNEL = izamin.c
  119. #
  120. #ISMAXKERNEL = ../arm/imax.c
  121. #IDMAXKERNEL = ../arm/imax.c
  122. #
  123. #ISMINKERNEL = ../arm/imin.c
  124. #IDMINKERNEL = ../arm/imin.c
  125. #
  126. SASUMKERNEL = sasum.c
  127. DASUMKERNEL = dasum.c
  128. CASUMKERNEL = casum.c
  129. ZASUMKERNEL = zasum.c
  130. #
  131. SAXPYKERNEL = saxpy.c
  132. DAXPYKERNEL = daxpy_power10.c
  133. ifneq ($(GCCVERSIONGTEQ9),1)
  134. CAXPYKERNEL = caxpy_power9.S
  135. else
  136. CAXPYKERNEL = caxpy.c
  137. endif
  138. ZAXPYKERNEL = zaxpy_power10.c
  139. #
  140. SCOPYKERNEL = scopy.c
  141. DCOPYKERNEL = dcopy.c
  142. CCOPYKERNEL = ccopy.c
  143. ZCOPYKERNEL = zcopy.c
  144. #
  145. SDOTKERNEL = sdot.c
  146. DDOTKERNEL = ddot.c
  147. DSDOTKERNEL = sdot.c
  148. ifneq ($(GCCVERSIONGTEQ9),1)
  149. CDOTKERNEL = cdot_power9.S
  150. else
  151. CDOTKERNEL = cdot.c
  152. endif
  153. ZDOTKERNEL = zdot.c
  154. #
  155. SNRM2KERNEL = ../arm/nrm2.c
  156. DNRM2KERNEL = ../arm/nrm2.c
  157. CNRM2KERNEL = ../arm/znrm2.c
  158. ZNRM2KERNEL = ../arm/znrm2.c
  159. #
  160. SROTKERNEL = srot.c
  161. DROTKERNEL = drot.c
  162. CROTKERNEL = crot.c
  163. ZROTKERNEL = zrot.c
  164. #
  165. SSCALKERNEL = sscal.c
  166. DSCALKERNEL = dscal.c
  167. CSCALKERNEL = zscal.c
  168. ZSCALKERNEL = zscal.c
  169. #
  170. SSWAPKERNEL = sswap.c
  171. DSWAPKERNEL = dswap.c
  172. CSWAPKERNEL = cswap.c
  173. ZSWAPKERNEL = zswap.c
  174. #
  175. SGEMVNKERNEL = sgemv_n.c
  176. DGEMVNKERNEL = dgemv_n_power10.c
  177. CGEMVNKERNEL = cgemv_n.c
  178. ZGEMVNKERNEL = zgemv_n_4.c
  179. #
  180. SGEMVTKERNEL = sgemv_t.c
  181. DGEMVTKERNEL = dgemv_t_power10.c
  182. CGEMVTKERNEL = cgemv_t.c
  183. ZGEMVTKERNEL = zgemv_t_4.c
  184. #SSYMV_U_KERNEL = ../generic/symv_k.c
  185. #SSYMV_L_KERNEL = ../generic/symv_k.c
  186. #DSYMV_U_KERNEL = ../generic/symv_k.c
  187. #DSYMV_L_KERNEL = ../generic/symv_k.c
  188. #QSYMV_U_KERNEL = ../generic/symv_k.c
  189. #QSYMV_L_KERNEL = ../generic/symv_k.c
  190. #CSYMV_U_KERNEL = ../generic/zsymv_k.c
  191. #CSYMV_L_KERNEL = ../generic/zsymv_k.c
  192. #ZSYMV_U_KERNEL = ../generic/zsymv_k.c
  193. #ZSYMV_L_KERNEL = ../generic/zsymv_k.c
  194. #XSYMV_U_KERNEL = ../generic/zsymv_k.c
  195. #XSYMV_L_KERNEL = ../generic/zsymv_k.c
  196. #ZHEMV_U_KERNEL = ../generic/zhemv_k.c
  197. #ZHEMV_L_KERNEL = ../generic/zhemv_k.c
  198. LSAME_KERNEL = ../generic/lsame.c
  199. SCABS_KERNEL = ../generic/cabs.c
  200. DCABS_KERNEL = ../generic/cabs.c
  201. QCABS_KERNEL = ../generic/cabs.c
  202. #Dump kernel
  203. CGEMM3MKERNEL = ../generic/zgemm3mkernel_dump.c
  204. ZGEMM3MKERNEL = ../generic/zgemm3mkernel_dump.c
  205. endif