translate_atlas.hpp 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507
  1. // Copyright 2008-2016 Conrad Sanderson (http://conradsanderson.id.au)
  2. // Copyright 2008-2016 National ICT Australia (NICTA)
  3. //
  4. // Licensed under the Apache License, Version 2.0 (the "License");
  5. // you may not use this file except in compliance with the License.
  6. // You may obtain a copy of the License at
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. // ------------------------------------------------------------------------
  15. #ifdef ARMA_USE_ATLAS
  16. //! \namespace atlas namespace for ATLAS functions (imported from the global namespace)
  17. namespace atlas
  18. {
  //! Generic overload: returns a reference to the argument itself, unchanged.
  template<typename eT>
  inline
  static
  const eT&
  tmp_real(const eT& X)
    {
    return X;
    }

  //! std::complex overload: returns (by value) the result of X.real().
  template<typename T>
  inline
  static
  const T
  tmp_real(const std::complex<T>& X)
    {
    const T real_part = X.real();

    return real_part;
    }
  23. template<typename eT>
  24. arma_inline
  25. eT
  26. cblas_asum(const int N, const eT* X)
  27. {
  28. arma_type_check((is_supported_blas_type<eT>::value == false));
  29. if(is_float<eT>::value)
  30. {
  31. typedef float T;
  32. return eT( arma_wrapper(cblas_sasum)(N, (const T*)X, 1) );
  33. }
  34. else
  35. if(is_double<eT>::value)
  36. {
  37. typedef double T;
  38. return eT( arma_wrapper(cblas_dasum)(N, (const T*)X, 1) );
  39. }
  40. return eT(0);
  41. }
  42. template<typename eT>
  43. arma_inline
  44. eT
  45. cblas_nrm2(const int N, const eT* X)
  46. {
  47. arma_type_check((is_supported_blas_type<eT>::value == false));
  48. if(is_float<eT>::value)
  49. {
  50. typedef float T;
  51. return eT( arma_wrapper(cblas_snrm2)(N, (const T*)X, 1) );
  52. }
  53. else
  54. if(is_double<eT>::value)
  55. {
  56. typedef double T;
  57. return eT( arma_wrapper(cblas_dnrm2)(N, (const T*)X, 1) );
  58. }
  59. return eT(0);
  60. }
  61. template<typename eT>
  62. arma_inline
  63. eT
  64. cblas_dot(const int N, const eT* X, const eT* Y)
  65. {
  66. arma_type_check((is_supported_blas_type<eT>::value == false));
  67. if(is_float<eT>::value)
  68. {
  69. typedef float T;
  70. return eT( arma_wrapper(cblas_sdot)(N, (const T*)X, 1, (const T*)Y, 1) );
  71. }
  72. else
  73. if(is_double<eT>::value)
  74. {
  75. typedef double T;
  76. return eT( arma_wrapper(cblas_ddot)(N, (const T*)X, 1, (const T*)Y, 1) );
  77. }
  78. return eT(0);
  79. }
  80. template<typename eT>
  81. arma_inline
  82. eT
  83. cblas_cx_dot(const int N, const eT* X, const eT* Y)
  84. {
  85. arma_type_check((is_supported_blas_type<eT>::value == false));
  86. if(is_cx_float<eT>::value)
  87. {
  88. typedef typename std::complex<float> T;
  89. T out;
  90. arma_wrapper(cblas_cdotu_sub)(N, (const T*)X, 1, (const T*)Y, 1, &out);
  91. return eT(out);
  92. }
  93. else
  94. if(is_cx_double<eT>::value)
  95. {
  96. typedef typename std::complex<double> T;
  97. T out;
  98. arma_wrapper(cblas_zdotu_sub)(N, (const T*)X, 1, (const T*)Y, 1, &out);
  99. return eT(out);
  100. }
  101. return eT(0);
  102. }
  103. template<typename eT>
  104. inline
  105. void
  106. cblas_gemv
  107. (
  108. const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA,
  109. const int M, const int N,
  110. const eT alpha,
  111. const eT *A, const int lda,
  112. const eT *X, const int incX,
  113. const eT beta,
  114. eT *Y, const int incY
  115. )
  116. {
  117. arma_type_check((is_supported_blas_type<eT>::value == false));
  118. if(is_float<eT>::value)
  119. {
  120. typedef float T;
  121. arma_wrapper(cblas_sgemv)(Order, TransA, M, N, (const T)tmp_real(alpha), (const T*)A, lda, (const T*)X, incX, (const T)tmp_real(beta), (T*)Y, incY);
  122. }
  123. else
  124. if(is_double<eT>::value)
  125. {
  126. typedef double T;
  127. arma_wrapper(cblas_dgemv)(Order, TransA, M, N, (const T)tmp_real(alpha), (const T*)A, lda, (const T*)X, incX, (const T)tmp_real(beta), (T*)Y, incY);
  128. }
  129. else
  130. if(is_cx_float<eT>::value)
  131. {
  132. typedef std::complex<float> T;
  133. arma_wrapper(cblas_cgemv)(Order, TransA, M, N, (const T*)&alpha, (const T*)A, lda, (const T*)X, incX, (const T*)&beta, (T*)Y, incY);
  134. }
  135. else
  136. if(is_cx_double<eT>::value)
  137. {
  138. typedef std::complex<double> T;
  139. arma_wrapper(cblas_zgemv)(Order, TransA, M, N, (const T*)&alpha, (const T*)A, lda, (const T*)X, incX, (const T*)&beta, (T*)Y, incY);
  140. }
  141. }
  142. template<typename eT>
  143. inline
  144. void
  145. cblas_gemm
  146. (
  147. const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA,
  148. const enum CBLAS_TRANSPOSE TransB, const int M, const int N,
  149. const int K, const eT alpha, const eT *A,
  150. const int lda, const eT *B, const int ldb,
  151. const eT beta, eT *C, const int ldc
  152. )
  153. {
  154. arma_type_check((is_supported_blas_type<eT>::value == false));
  155. if(is_float<eT>::value)
  156. {
  157. typedef float T;
  158. arma_wrapper(cblas_sgemm)(Order, TransA, TransB, M, N, K, (const T)tmp_real(alpha), (const T*)A, lda, (const T*)B, ldb, (const T)tmp_real(beta), (T*)C, ldc);
  159. }
  160. else
  161. if(is_double<eT>::value)
  162. {
  163. typedef double T;
  164. arma_wrapper(cblas_dgemm)(Order, TransA, TransB, M, N, K, (const T)tmp_real(alpha), (const T*)A, lda, (const T*)B, ldb, (const T)tmp_real(beta), (T*)C, ldc);
  165. }
  166. else
  167. if(is_cx_float<eT>::value)
  168. {
  169. typedef std::complex<float> T;
  170. arma_wrapper(cblas_cgemm)(Order, TransA, TransB, M, N, K, (const T*)&alpha, (const T*)A, lda, (const T*)B, ldb, (const T*)&beta, (T*)C, ldc);
  171. }
  172. else
  173. if(is_cx_double<eT>::value)
  174. {
  175. typedef std::complex<double> T;
  176. arma_wrapper(cblas_zgemm)(Order, TransA, TransB, M, N, K, (const T*)&alpha, (const T*)A, lda, (const T*)B, ldb, (const T*)&beta, (T*)C, ldc);
  177. }
  178. }
  179. template<typename eT>
  180. inline
  181. void
  182. cblas_syrk
  183. (
  184. const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE Trans,
  185. const int N, const int K, const eT alpha,
  186. const eT* A, const int lda, const eT beta, eT* C, const int ldc
  187. )
  188. {
  189. arma_type_check((is_supported_blas_type<eT>::value == false));
  190. if(is_float<eT>::value)
  191. {
  192. typedef float T;
  193. arma_wrapper(cblas_ssyrk)(Order, Uplo, Trans, N, K, (const T)alpha, (const T*)A, lda, (const T)beta, (T*)C, ldc);
  194. }
  195. else
  196. if(is_double<eT>::value)
  197. {
  198. typedef double T;
  199. arma_wrapper(cblas_dsyrk)(Order, Uplo, Trans, N, K, (const T)alpha, (const T*)A, lda, (const T)beta, (T*)C, ldc);
  200. }
  201. }
  202. template<typename T>
  203. inline
  204. void
  205. cblas_herk
  206. (
  207. const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const enum CBLAS_TRANSPOSE Trans,
  208. const int N, const int K, const T alpha,
  209. const std::complex<T>* A, const int lda, const T beta, std::complex<T>* C, const int ldc
  210. )
  211. {
  212. arma_type_check((is_supported_blas_type<T>::value == false));
  213. if(is_float<T>::value)
  214. {
  215. typedef float TT;
  216. typedef std::complex<float> cx_TT;
  217. arma_wrapper(cblas_cherk)(Order, Uplo, Trans, N, K, (const TT)alpha, (const cx_TT*)A, lda, (const TT)beta, (cx_TT*)C, ldc);
  218. }
  219. else
  220. if(is_double<T>::value)
  221. {
  222. typedef double TT;
  223. typedef std::complex<double> cx_TT;
  224. arma_wrapper(cblas_zherk)(Order, Uplo, Trans, N, K, (const TT)alpha, (const cx_TT*)A, lda, (const TT)beta, (cx_TT*)C, ldc);
  225. }
  226. }
  227. template<typename eT>
  228. inline
  229. int
  230. clapack_getrf
  231. (
  232. const enum CBLAS_ORDER Order, const int M, const int N,
  233. eT *A, const int lda, int *ipiv
  234. )
  235. {
  236. arma_type_check((is_supported_blas_type<eT>::value == false));
  237. if(is_float<eT>::value)
  238. {
  239. typedef float T;
  240. return arma_wrapper(clapack_sgetrf)(Order, M, N, (T*)A, lda, ipiv);
  241. }
  242. else
  243. if(is_double<eT>::value)
  244. {
  245. typedef double T;
  246. return arma_wrapper(clapack_dgetrf)(Order, M, N, (T*)A, lda, ipiv);
  247. }
  248. else
  249. if(is_cx_float<eT>::value)
  250. {
  251. typedef std::complex<float> T;
  252. return arma_wrapper(clapack_cgetrf)(Order, M, N, (T*)A, lda, ipiv);
  253. }
  254. else
  255. if(is_cx_double<eT>::value)
  256. {
  257. typedef std::complex<double> T;
  258. return arma_wrapper(clapack_zgetrf)(Order, M, N, (T*)A, lda, ipiv);
  259. }
  260. return -1;
  261. }
  262. template<typename eT>
  263. inline
  264. int
  265. clapack_getri
  266. (
  267. const enum CBLAS_ORDER Order, const int N, eT *A,
  268. const int lda, const int *ipiv
  269. )
  270. {
  271. arma_type_check((is_supported_blas_type<eT>::value == false));
  272. if(is_float<eT>::value)
  273. {
  274. typedef float T;
  275. return arma_wrapper(clapack_sgetri)(Order, N, (T*)A, lda, ipiv);
  276. }
  277. else
  278. if(is_double<eT>::value)
  279. {
  280. typedef double T;
  281. return arma_wrapper(clapack_dgetri)(Order, N, (T*)A, lda, ipiv);
  282. }
  283. else
  284. if(is_cx_float<eT>::value)
  285. {
  286. typedef std::complex<float> T;
  287. return arma_wrapper(clapack_cgetri)(Order, N, (T*)A, lda, ipiv);
  288. }
  289. else
  290. if(is_cx_double<eT>::value)
  291. {
  292. typedef std::complex<double> T;
  293. return arma_wrapper(clapack_zgetri)(Order, N, (T*)A, lda, ipiv);
  294. }
  295. return -1;
  296. }
  297. template<typename eT>
  298. inline
  299. int
  300. clapack_gesv
  301. (
  302. const enum CBLAS_ORDER Order,
  303. const int N, const int NRHS,
  304. eT* A, const int lda, int* ipiv,
  305. eT* B, const int ldb
  306. )
  307. {
  308. arma_type_check((is_supported_blas_type<eT>::value == false));
  309. if(is_float<eT>::value)
  310. {
  311. typedef float T;
  312. return arma_wrapper(clapack_sgesv)(Order, N, NRHS, (T*)A, lda, ipiv, (T*)B, ldb);
  313. }
  314. else
  315. if(is_double<eT>::value)
  316. {
  317. typedef double T;
  318. return arma_wrapper(clapack_dgesv)(Order, N, NRHS, (T*)A, lda, ipiv, (T*)B, ldb);
  319. }
  320. else
  321. if(is_cx_float<eT>::value)
  322. {
  323. typedef std::complex<float> T;
  324. return arma_wrapper(clapack_cgesv)(Order, N, NRHS, (T*)A, lda, ipiv, (T*)B, ldb);
  325. }
  326. else
  327. if(is_cx_double<eT>::value)
  328. {
  329. typedef std::complex<double> T;
  330. return arma_wrapper(clapack_zgesv)(Order, N, NRHS, (T*)A, lda, ipiv, (T*)B, ldb);
  331. }
  332. return -1;
  333. }
  334. template<typename eT>
  335. inline
  336. int
  337. clapack_potrf(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const int N, eT *A, const int lda)
  338. {
  339. arma_type_check((is_supported_blas_type<eT>::value == false));
  340. if(is_float<eT>::value)
  341. {
  342. typedef float T;
  343. return arma_wrapper(clapack_spotrf)(Order, Uplo, N, (T*)A, lda);
  344. }
  345. else
  346. if(is_double<eT>::value)
  347. {
  348. typedef double T;
  349. return arma_wrapper(clapack_dpotrf)(Order, Uplo, N, (T*)A, lda);
  350. }
  351. else
  352. if(is_cx_float<eT>::value)
  353. {
  354. typedef std::complex<float> T;
  355. return arma_wrapper(clapack_cpotrf)(Order, Uplo, N, (T*)A, lda);
  356. }
  357. else
  358. if(is_cx_double<eT>::value)
  359. {
  360. typedef std::complex<double> T;
  361. return arma_wrapper(clapack_zpotrf)(Order, Uplo, N, (T*)A, lda);
  362. }
  363. return -1;
  364. }
  365. template<typename eT>
  366. inline
  367. int
  368. clapack_potri(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const int N, eT *A, const int lda)
  369. {
  370. arma_type_check((is_supported_blas_type<eT>::value == false));
  371. if(is_float<eT>::value)
  372. {
  373. typedef float T;
  374. return arma_wrapper(clapack_spotri)(Order, Uplo, N, (T*)A, lda);
  375. }
  376. else
  377. if(is_double<eT>::value)
  378. {
  379. typedef double T;
  380. return arma_wrapper(clapack_dpotri)(Order, Uplo, N, (T*)A, lda);
  381. }
  382. else
  383. if(is_cx_float<eT>::value)
  384. {
  385. typedef std::complex<float> T;
  386. return arma_wrapper(clapack_cpotri)(Order, Uplo, N, (T*)A, lda);
  387. }
  388. else
  389. if(is_cx_double<eT>::value)
  390. {
  391. typedef std::complex<double> T;
  392. return arma_wrapper(clapack_zpotri)(Order, Uplo, N, (T*)A, lda);
  393. }
  394. return -1;
  395. }
  396. template<typename eT>
  397. inline
  398. int
  399. clapack_posv(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo, const int N, const int NRHS, eT *A, const int lda, eT *B, const int ldb)
  400. {
  401. arma_type_check((is_supported_blas_type<eT>::value == false));
  402. if(is_float<eT>::value)
  403. {
  404. typedef float T;
  405. return arma_wrapper(clapack_sposv)(Order, Uplo, N, NRHS, (T*)A, lda, (T*)B, ldb);
  406. }
  407. else
  408. if(is_double<eT>::value)
  409. {
  410. typedef double T;
  411. return arma_wrapper(clapack_dposv)(Order, Uplo, N, NRHS, (T*)A, lda, (T*)B, ldb);
  412. }
  413. else
  414. if(is_cx_float<eT>::value)
  415. {
  416. typedef std::complex<float> T;
  417. return arma_wrapper(clapack_cposv)(Order, Uplo, N, NRHS, (T*)A, lda, (T*)B, ldb);
  418. }
  419. else
  420. if(is_cx_double<eT>::value)
  421. {
  422. typedef std::complex<double> T;
  423. return arma_wrapper(clapack_zposv)(Order, Uplo, N, NRHS, (T*)A, lda, (T*)B, ldb);
  424. }
  425. return -1;
  426. }
  427. }
  428. #endif