You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

KERNEL 5.9 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414
  # GEMVDEP names the header ../l2param.h; presumably it is used as a build
  # dependency of the GEMV kernels by the including makefile -- confirm.
  1. GEMVDEP = ../l2param.h
  # Defaults for the S*/C* (and IS*/IC*) kernel variables. The whole section is
  # skipped unless HAVE_SSE has a non-empty value. Every default is wrapped in
  # `ifndef VAR`, so a value assigned before this point is kept.
  2. ifdef HAVE_SSE
  3. ifndef SAMAXKERNEL
  4. SAMAXKERNEL = amax_sse.S
  5. endif
  6. ifndef CAMAXKERNEL
  7. CAMAXKERNEL = zamax_sse.S
  8. endif
  # The AMIN variants default to the same source files as the AMAX variants.
  9. ifndef SAMINKERNEL
  10. SAMINKERNEL = amax_sse.S
  11. endif
  12. ifndef CAMINKERNEL
  13. CAMINKERNEL = zamax_sse.S
  14. endif
  15. ifndef ISAMAXKERNEL
  16. ISAMAXKERNEL = iamax_sse.S
  17. endif
  18. ifndef ICAMAXKERNEL
  19. ICAMAXKERNEL = izamax_sse.S
  20. endif
  21. ifndef ISAMINKERNEL
  22. ISAMINKERNEL = iamax_sse.S
  23. endif
  24. ifndef ICAMINKERNEL
  25. ICAMINKERNEL = izamax_sse.S
  26. endif
  27. ifndef ISMAXKERNEL
  28. ISMAXKERNEL = iamax_sse.S
  29. endif
  30. ifndef ISMINKERNEL
  31. ISMINKERNEL = iamax_sse.S
  32. endif
  33. ifndef SMAXKERNEL
  34. SMAXKERNEL = amax_sse.S
  35. endif
  36. ifndef SMINKERNEL
  37. SMINKERNEL = amax_sse.S
  38. endif
  39. ifndef SASUMKERNEL
  40. SASUMKERNEL = asum_sse.S
  41. endif
  42. ifndef CASUMKERNEL
  43. CASUMKERNEL = zasum_sse.S
  44. endif
  # NOTE(review): SDOTKERNEL defaults to a C file under ../arm rather than an
  # *_sse.S file like its neighbours -- confirm this is intentional.
  45. ifndef SDOTKERNEL
  46. SDOTKERNEL = ../arm/dot.c
  47. endif
  48. ifndef CDOTKERNEL
  49. CDOTKERNEL = zdot_sse.S
  50. endif
  51. ifndef SCOPYKERNEL
  52. SCOPYKERNEL = copy_sse.S
  53. endif
  54. ifndef CCOPYKERNEL
  55. CCOPYKERNEL = zcopy_sse.S
  56. endif
  # Each guard must name the variable it protects; a guard on any other name
  # would let the default below overwrite a value assigned earlier.
  57. ifndef SSCALKERNEL
  58. SSCALKERNEL = scal_sse.S
  59. endif
  60. ifndef CSCALKERNEL
  61. CSCALKERNEL = zscal_sse.S
  62. endif
  63. ifndef SAXPYKERNEL
  64. SAXPYKERNEL = axpy_sse.S
  65. endif
  66. ifndef CAXPYKERNEL
  67. CAXPYKERNEL = zaxpy_sse.S
  68. endif
  69. ifndef SROTKERNEL
  70. SROTKERNEL = rot_sse.S
  71. endif
  72. ifndef CROTKERNEL
  73. CROTKERNEL = zrot_sse.S
  74. endif
  75. ifndef SSWAPKERNEL
  76. SSWAPKERNEL = swap_sse.S
  77. endif
  78. ifndef CSWAPKERNEL
  79. CSWAPKERNEL = zswap_sse.S
  80. endif
  # NOTE(review): SGEMVN/SGEMVT also default to C files under ../arm, while the
  # CGEMV defaults are *_sse.S files -- confirm this is intentional.
  81. ifndef SGEMVNKERNEL
  82. SGEMVNKERNEL = ../arm/gemv_n.c
  83. endif
  84. ifndef SGEMVTKERNEL
  85. SGEMVTKERNEL = ../arm/gemv_t.c
  86. endif
  87. ifndef CGEMVNKERNEL
  88. CGEMVNKERNEL = zgemv_n_sse.S
  89. endif
  90. ifndef CGEMVTKERNEL
  91. CGEMVTKERNEL = zgemv_t_sse.S
  92. endif
  # End of the HAVE_SSE defaults.
  93. endif
  # Defaults for the D*/Z* (and ID*/IZ*) kernel variables, plus SNRM2/CNRM2.
  # The whole section is skipped unless HAVE_SSE2 has a non-empty value. Every
  # default is wrapped in `ifndef VAR`, so a value assigned earlier is kept.
  94. ifdef HAVE_SSE2
  95. ifndef DAMAXKERNEL
  96. DAMAXKERNEL = amax_sse2.S
  97. endif
  98. ifndef ZAMAXKERNEL
  99. ZAMAXKERNEL = zamax_sse2.S
  100. endif
  # The AMIN variants default to the same source files as the AMAX variants.
  101. ifndef DAMINKERNEL
  102. DAMINKERNEL = amax_sse2.S
  103. endif
  104. ifndef ZAMINKERNEL
  105. ZAMINKERNEL = zamax_sse2.S
  106. endif
  107. ifndef IDAMAXKERNEL
  108. IDAMAXKERNEL = iamax_sse2.S
  109. endif
  110. ifndef IZAMAXKERNEL
  111. IZAMAXKERNEL = izamax_sse2.S
  112. endif
  113. ifndef IDAMINKERNEL
  114. IDAMINKERNEL = iamax_sse2.S
  115. endif
  116. ifndef IZAMINKERNEL
  117. IZAMINKERNEL = izamax_sse2.S
  118. endif
  119. ifndef IDMAXKERNEL
  120. IDMAXKERNEL = iamax_sse2.S
  121. endif
  122. ifndef IDMINKERNEL
  123. IDMINKERNEL = iamax_sse2.S
  124. endif
  125. ifndef DMAXKERNEL
  126. DMAXKERNEL = amax_sse2.S
  127. endif
  128. ifndef DMINKERNEL
  129. DMINKERNEL = amax_sse2.S
  130. endif
  131. ifndef DDOTKERNEL
  132. DDOTKERNEL = dot_sse2.S
  133. endif
  134. ifndef ZDOTKERNEL
  135. ZDOTKERNEL = zdot_sse2.S
  136. endif
  # The DCOPYKERNEL default is commented out, so this guard assigns nothing.
  137. ifndef DCOPYKERNEL
  138. # DCOPYKERNEL = copy_sse2.S
  139. endif
  140. ifndef ZCOPYKERNEL
  141. ZCOPYKERNEL = zcopy_sse2.S
  142. endif
  # Each guard must name the variable it protects; a guard on any other name
  # would let the default below overwrite a value assigned earlier.
  143. ifndef DSCALKERNEL
  144. DSCALKERNEL = scal_sse2.S
  145. endif
  146. ifndef ZSCALKERNEL
  147. ZSCALKERNEL = zscal_sse2.S
  148. endif
  149. ifndef DASUMKERNEL
  150. DASUMKERNEL = asum_sse2.S
  151. endif
  152. ifndef ZASUMKERNEL
  153. ZASUMKERNEL = zasum_sse2.S
  154. endif
  155. ifndef DAXPYKERNEL
  156. DAXPYKERNEL = axpy_sse2.S
  157. endif
  158. ifndef ZAXPYKERNEL
  159. ZAXPYKERNEL = zaxpy_sse2.S
  160. endif
  # NOTE(review): SNRM2/CNRM2 are S*/C* variables pointing at *_sse.S files, yet
  # they are only defaulted when HAVE_SSE2 is set -- confirm the placement is
  # intentional.
  161. ifndef SNRM2KERNEL
  162. SNRM2KERNEL = nrm2_sse.S
  163. endif
  164. ifndef CNRM2KERNEL
  165. CNRM2KERNEL = znrm2_sse.S
  166. endif
  167. ifndef DROTKERNEL
  168. DROTKERNEL = rot_sse2.S
  169. endif
  170. ifndef ZROTKERNEL
  171. ZROTKERNEL = zrot_sse2.S
  172. endif
  173. ifndef DSWAPKERNEL
  174. DSWAPKERNEL = swap_sse2.S
  175. endif
  176. ifndef ZSWAPKERNEL
  177. ZSWAPKERNEL = zswap_sse2.S
  178. endif
  179. ifndef DGEMVNKERNEL
  180. DGEMVNKERNEL = gemv_n_sse2.S
  181. endif
  182. ifndef DGEMVTKERNEL
  183. DGEMVTKERNEL = gemv_t_sse2.S
  184. endif
  185. ifndef ZGEMVNKERNEL
  186. ZGEMVNKERNEL = zgemv_n_sse2.S
  187. endif
  188. ifndef ZGEMVTKERNEL
  189. ZGEMVTKERNEL = zgemv_t_sse2.S
  190. endif
  # End of the HAVE_SSE2 defaults.
  191. endif
  # Fallback defaults, applied regardless of HAVE_SSE / HAVE_SSE2. Each `ifndef`
  # assigns only when the variable is still undefined or empty at this point,
  # so values set earlier (for example by the HAVE_SSE / HAVE_SSE2 sections
  # above) are kept.
  #
  # AMIN fallbacks: real variants (S/D/Q) name amax.S, complex variants (C/Z/X)
  # name zamax.S.
  192. ifndef SAMINKERNEL
  193. SAMINKERNEL = amax.S
  194. endif
  195. ifndef DAMINKERNEL
  196. DAMINKERNEL = amax.S
  197. endif
  198. ifndef QAMINKERNEL
  199. QAMINKERNEL = amax.S
  200. endif
  201. ifndef CAMINKERNEL
  202. CAMINKERNEL = zamax.S
  203. endif
  204. ifndef ZAMINKERNEL
  205. ZAMINKERNEL = zamax.S
  206. endif
  207. ifndef XAMINKERNEL
  208. XAMINKERNEL = zamax.S
  209. endif
  # MAX / MIN fallbacks for S/D/Q all name amax.S as well.
  210. ifndef SMAXKERNEL
  211. SMAXKERNEL = amax.S
  212. endif
  213. ifndef DMAXKERNEL
  214. DMAXKERNEL = amax.S
  215. endif
  216. ifndef QMAXKERNEL
  217. QMAXKERNEL = amax.S
  218. endif
  219. ifndef SMINKERNEL
  220. SMINKERNEL = amax.S
  221. endif
  222. ifndef DMINKERNEL
  223. DMINKERNEL = amax.S
  224. endif
  225. ifndef QMINKERNEL
  226. QMINKERNEL = amax.S
  227. endif
  # Index (I*) AMIN / MIN fallbacks: iamax.S for S/D/Q, izamax.S for C/Z/X.
  228. ifndef ISAMINKERNEL
  229. ISAMINKERNEL = iamax.S
  230. endif
  231. ifndef IDAMINKERNEL
  232. IDAMINKERNEL = iamax.S
  233. endif
  234. ifndef IQAMINKERNEL
  235. IQAMINKERNEL = iamax.S
  236. endif
  237. ifndef ICAMINKERNEL
  238. ICAMINKERNEL = izamax.S
  239. endif
  240. ifndef IZAMINKERNEL
  241. IZAMINKERNEL = izamax.S
  242. endif
  243. ifndef IXAMINKERNEL
  244. IXAMINKERNEL = izamax.S
  245. endif
  246. ifndef ISMINKERNEL
  247. ISMINKERNEL = iamax.S
  248. endif
  249. ifndef IDMINKERNEL
  250. IDMINKERNEL = iamax.S
  251. endif
  252. ifndef IQMINKERNEL
  253. IQMINKERNEL = iamax.S
  254. endif
  # Q*/X* DOT, AXPY and GEMV fallbacks each name a dedicated q*/x* source file.
  255. ifndef QDOTKERNEL
  256. QDOTKERNEL = qdot.S
  257. endif
  258. ifndef XDOTKERNEL
  259. XDOTKERNEL = xdot.S
  260. endif
  261. ifndef QAXPYKERNEL
  262. QAXPYKERNEL = qaxpy.S
  263. endif
  264. ifndef XAXPYKERNEL
  265. XAXPYKERNEL = xaxpy.S
  266. endif
  267. ifndef QGEMVNKERNEL
  268. QGEMVNKERNEL = qgemv_n.S
  269. endif
  270. ifndef QGEMVTKERNEL
  271. QGEMVTKERNEL = qgemv_t.S
  272. endif
  273. ifndef XGEMVNKERNEL
  274. XGEMVNKERNEL = xgemv_n.S
  275. endif
  276. ifndef XGEMVTKERNEL
  277. XGEMVTKERNEL = xgemv_t.S
  278. endif
  # Unconditional settings: none of the assignments below is guarded by
  # `ifndef`, so each one replaces any value the variable had before.
  #
  # QGEMM kernel and copy sources. The IN/IT copy sources and objects are set
  # to empty; only the ON/OT copies name files.
  279. QGEMMKERNEL = qgemm_kernel_2x2.S
  280. QGEMMINCOPY =
  281. QGEMMITCOPY =
  282. QGEMMONCOPY = ../generic/gemm_ncopy_2.c
  283. QGEMMOTCOPY = ../generic/gemm_tcopy_2.c
  284. QGEMMINCOPYOBJ =
  285. QGEMMITCOPYOBJ =
  # $(TSUFFIX) and $(SUFFIX) are not defined in this section; they must be
  # provided elsewhere before these variables are expanded.
  286. QGEMMONCOPYOBJ = qgemm_oncopy$(TSUFFIX).$(SUFFIX)
  287. QGEMMOTCOPYOBJ = qgemm_otcopy$(TSUFFIX).$(SUFFIX)
  # XGEMM kernel and copy sources, laid out the same way as the QGEMM group.
  288. XGEMMKERNEL = xgemm_kernel_1x1.S
  289. XGEMMINCOPY =
  290. XGEMMITCOPY =
  291. XGEMMONCOPY = ../generic/zgemm_ncopy_1.c
  292. XGEMMOTCOPY = ../generic/zgemm_tcopy_1.c
  293. XGEMMINCOPYOBJ =
  294. XGEMMITCOPYOBJ =
  295. XGEMMONCOPYOBJ = xgemm_oncopy$(TSUFFIX).$(SUFFIX)
  296. XGEMMOTCOPYOBJ = xgemm_otcopy$(TSUFFIX).$(SUFFIX)
  # GEMM_BETA sources: S/D share gemm_beta.S, C/Z share zgemm_beta.S, and Q/X
  # use the C files under ../generic.
  297. SGEMM_BETA = gemm_beta.S
  298. DGEMM_BETA = gemm_beta.S
  299. QGEMM_BETA = ../generic/gemm_beta.c
  300. CGEMM_BETA = zgemm_beta.S
  301. ZGEMM_BETA = zgemm_beta.S
  302. XGEMM_BETA = ../generic/zgemm_beta.c
  # NOTE(review): QTRSMKERNEL_RN names the LT source file, whereas LN, LT and RT
  # each name a file matching their own suffix -- confirm this is intended.
  303. QTRSMKERNEL_LN = qtrsm_kernel_LN_2x2.S
  304. QTRSMKERNEL_LT = qtrsm_kernel_LT_2x2.S
  305. QTRSMKERNEL_RN = qtrsm_kernel_LT_2x2.S
  306. QTRSMKERNEL_RT = qtrsm_kernel_RT_2x2.S
  # NOTE(review): all four XTRSMKERNEL_* variables name the same LT source
  # file -- confirm this is intended.
  307. XTRSMKERNEL_LN = xtrsm_kernel_LT_1x1.S
  308. XTRSMKERNEL_LT = xtrsm_kernel_LT_1x1.S
  309. XTRSMKERNEL_RN = xtrsm_kernel_LT_1x1.S
  310. XTRSMKERNEL_RT = xtrsm_kernel_LT_1x1.S
  311. XGEMM3MKERNEL = xgemm3m_kernel_2x2.S