You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

utest_main2.c 18 kB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706
  1. /*****************************************************************************
  2. Copyright (c) 2011-2016, The OpenBLAS Project
  3. All rights reserved.
  4. Redistribution and use in source and binary forms, with or without
  5. modification, are permitted provided that the following conditions are
  6. met:
  7. 1. Redistributions of source code must retain the above copyright
  8. notice, this list of conditions and the following disclaimer.
  9. 2. Redistributions in binary form must reproduce the above copyright
  10. notice, this list of conditions and the following disclaimer in
  11. the documentation and/or other materials provided with the
  12. distribution.
  13. 3. Neither the name of the OpenBLAS project nor the names of
  14. its contributors may be used to endorse or promote products
  15. derived from this software without specific prior written
  16. permission.
  17. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  18. AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  19. IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  20. ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  21. LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  22. DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
  23. SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  24. CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
  25. OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE
  26. USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  27. **********************************************************************************/
  28. #include <stdio.h>
  29. #include <complex.h>
  30. #define CTEST_MAIN
  31. #define CTEST_SEGFAULT
  32. #define CTEST_ADD_TESTS_MANUALLY
  33. #include "cblas.h"
  34. #include "openblas_utest.h"
  35. CTEST(amax, samax){
  36. blasint N=3, inc=1;
  37. float te_max=0.0, tr_max=0.0;
  38. float x[]={-1.1, 2.2, -3.3};
  39. te_max=BLASFUNC(samax)(&N, x, &inc);
  40. tr_max=3.3;
  41. ASSERT_DBL_NEAR_TOL((double)(tr_max), (double)(te_max), SINGLE_EPS);
  42. }
  43. CTEST(amax, damax){
  44. blasint N=3, inc=1;
  45. double te_max=0.0, tr_max=0.0;
  46. double x[]={-1.1, 2.2, -3.3};
  47. te_max=BLASFUNC(damax)(&N, x, &inc);
  48. tr_max=3.3;
  49. ASSERT_DBL_NEAR_TOL((double)(tr_max), (double)(te_max), DOUBLE_EPS);
  50. }
  51. CTEST (drotmg,rotmg)
  52. {
  53. double te_d1, tr_d1;
  54. double te_d2, tr_d2;
  55. double te_x1, tr_x1;
  56. double te_y1, tr_y1;
  57. double te_param[5];
  58. double tr_param[5];
  59. int i=0;
  60. // original test case for libGoto bug fixed by feb2014 rewrite
  61. te_d1= 0.21149573940783739;
  62. te_d2= 0.046892057172954082;
  63. te_x1= -0.42272687517106533;
  64. te_y1= 0.42211309121921659;
  65. for(i=0; i<5; i++){
  66. te_param[i]=tr_param[i]=0.0;
  67. }
  68. //reference values as calculated by netlib blas
  69. tr_d1= 0.1732048;
  70. tr_d2= 0.03840234;
  71. tr_x1= -0.516180;
  72. tr_y1= 0.422113;
  73. tr_d1= 0.17320483687975;
  74. tr_d2= 0.03840233915037;
  75. tr_x1= -0.51618034832329;
  76. tr_y1= 0.42211309121922;
  77. tr_param[0]= 0.0;
  78. tr_param[1]= 0.0;
  79. tr_param[2]= 0.99854803659786;
  80. tr_param[3]= -0.22139439665872;
  81. tr_param[4]= 0.0;
  82. BLASFUNC(drotmg)(&te_d1, &te_d2, &te_x1, &te_y1, te_param);
  83. ASSERT_DBL_NEAR_TOL(tr_d1, te_d1, DOUBLE_EPS);
  84. ASSERT_DBL_NEAR_TOL(tr_d2, te_d2, DOUBLE_EPS);
  85. ASSERT_DBL_NEAR_TOL(tr_x1, te_x1, DOUBLE_EPS);
  86. ASSERT_DBL_NEAR_TOL(tr_y1, te_y1, DOUBLE_EPS);
  87. for(i=0; i<5; i++){
  88. ASSERT_DBL_NEAR_TOL(tr_param[i], te_param[i], DOUBLE_EPS);
  89. }
  90. }
  91. CTEST (drotmg,rotmg_issue1452)
  92. {
  93. double te_d1, tr_d1;
  94. double te_d2, tr_d2;
  95. double te_x1, tr_x1;
  96. double te_y1, tr_y1;
  97. double te_param[5];
  98. double tr_param[5];
  99. int i=0;
  100. // from issue #1452
  101. te_d1 = 5.9e-8;
  102. te_d2 = 5.960464e-8;
  103. te_x1 = 1.0;
  104. te_y1 = 150.0;
  105. for(i=0; i<5; i++){
  106. te_param[i]=tr_param[i]=0.0;
  107. }
  108. te_param[3]=1./4096.;
  109. //reference values as calculated by gonum blas with rotmg rewritten to Hopkins' algorithm
  110. tr_d1= 0.99995592822897;
  111. tr_d2= 0.98981219860583;
  112. tr_x1= 0.03662270484346;
  113. tr_y1= 150.000000000000;
  114. tr_param[0]= -1.0;
  115. tr_param[1]= 0.00000161109346;
  116. tr_param[2]= -0.00024414062500;
  117. tr_param[3]= 0.00024414062500;
  118. tr_param[4]= 0.00000162760417;
  119. //OpenBLAS
  120. BLASFUNC(drotmg)(&te_d1, &te_d2, &te_x1, &te_y1, te_param);
  121. ASSERT_DBL_NEAR_TOL(tr_d1, te_d1, DOUBLE_EPS);
  122. ASSERT_DBL_NEAR_TOL(tr_d2, te_d2, DOUBLE_EPS);
  123. ASSERT_DBL_NEAR_TOL(tr_x1, te_x1, DOUBLE_EPS);
  124. ASSERT_DBL_NEAR_TOL(tr_y1, te_y1, DOUBLE_EPS);
  125. for(i=0; i<5; i++){
  126. ASSERT_DBL_NEAR_TOL(tr_param[i], te_param[i], DOUBLE_EPS);
  127. }
  128. }
  129. CTEST(drotmg, rotmg_D1eqD2_X1eqX2)
  130. {
  131. double te_d1, tr_d1;
  132. double te_d2, tr_d2;
  133. double te_x1, tr_x1;
  134. double te_y1, tr_y1;
  135. double te_param[5];
  136. double tr_param[5];
  137. int i=0;
  138. te_d1= tr_d1=2.;
  139. te_d2= tr_d2=2.;
  140. te_x1= tr_x1=8.;
  141. te_y1= tr_y1=8.;
  142. for(i=0; i<5; i++){
  143. te_param[i]=tr_param[i]=0.0;
  144. }
  145. //reference values as calculated by netlib blas
  146. tr_d1= 1.0;
  147. tr_d2= 1.0;
  148. tr_x1= 16.0;
  149. tr_y1= 8.0;
  150. tr_param[0]=1.0;
  151. tr_param[1]=1.0;
  152. tr_param[2]=0.0;
  153. tr_param[3]=0.0;
  154. tr_param[4]=1.0;
  155. //OpenBLAS
  156. BLASFUNC(drotmg)(&te_d1, &te_d2, &te_x1, &te_y1, te_param);
  157. ASSERT_DBL_NEAR_TOL(tr_d1, te_d1, DOUBLE_EPS);
  158. ASSERT_DBL_NEAR_TOL(tr_d2, te_d2, DOUBLE_EPS);
  159. ASSERT_DBL_NEAR_TOL(tr_x1, te_x1, DOUBLE_EPS);
  160. ASSERT_DBL_NEAR_TOL(tr_y1, te_y1, DOUBLE_EPS);
  161. for(i=0; i<5; i++){
  162. ASSERT_DBL_NEAR_TOL(tr_param[i], te_param[i], DOUBLE_EPS);
  163. }
  164. }
  165. CTEST(drotmg, drotmg_D1_big_D2_big_flag_zero)
  166. {
  167. double te_d1, tr_d1;
  168. double te_d2, tr_d2;
  169. double te_x1, tr_x1;
  170. double te_y1, tr_y1;
  171. double te_param[5]={1.,4096.,-4096.,1.,4096.};
  172. double tr_param[5]={-1.,4096.,-3584.,1792.,4096.};
  173. int i=0;
  174. te_d1= tr_d1=1600000000.;
  175. te_d2= tr_d2=800000000.;
  176. te_x1= tr_x1=8.;
  177. te_y1= tr_y1=7.;
  178. //reference values as calculated by gonum
  179. tr_d1= 68.96627824858757;
  180. tr_d2= 34.483139124293785;
  181. tr_x1= 45312.;
  182. tr_y1= 7.0;
  183. //OpenBLAS
  184. BLASFUNC(drotmg)(&te_d1, &te_d2, &te_x1, &te_y1, te_param);
  185. ASSERT_DBL_NEAR_TOL(tr_d1, te_d1, DOUBLE_EPS);
  186. ASSERT_DBL_NEAR_TOL(tr_d2, te_d2, DOUBLE_EPS);
  187. ASSERT_DBL_NEAR_TOL(tr_x1, te_x1, DOUBLE_EPS);
  188. ASSERT_DBL_NEAR_TOL(tr_y1, te_y1, DOUBLE_EPS);
  189. for(i=0; i<5; i++){
  190. ASSERT_DBL_NEAR_TOL(tr_param[i], te_param[i], DOUBLE_EPS);
  191. }
  192. }
  193. CTEST(axpy,daxpy_inc_0)
  194. {
  195. blasint i;
  196. blasint N=8,incX=0,incY=0;
  197. double a=0.25;
  198. double x1[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  199. double y1[]={2.0,4.0,6.0,8.0,2.0,4.0,6.0,8.0};
  200. double x2[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  201. double y2[]={4.0,4.0,6.0,8.0,2.0,4.0,6.0,8.0};
  202. //OpenBLAS
  203. BLASFUNC(daxpy)(&N,&a,x1,&incX,y1,&incY);
  204. for(i=0; i<N; i++){
  205. ASSERT_DBL_NEAR_TOL(x2[i], x1[i], DOUBLE_EPS);
  206. ASSERT_DBL_NEAR_TOL(y2[i], y1[i], DOUBLE_EPS);
  207. }
  208. }
  209. CTEST(axpy,zaxpy_inc_0)
  210. {
  211. blasint i;
  212. blasint N=4,incX=0,incY=0;
  213. double a[2]={0.25,0.5};
  214. double x1[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  215. double y1[]={2.0,4.0,6.0,8.0,2.0,4.0,6.0,8.0};
  216. double x2[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  217. double y2[]={-3.0,9.0,6.0,8.0,2.0,4.0,6.0,8.0};
  218. //OpenBLAS
  219. BLASFUNC(zaxpy)(&N,a,x1,&incX,y1,&incY);
  220. for(i=0; i<2*N; i++){
  221. ASSERT_DBL_NEAR_TOL(x2[i], x1[i], DOUBLE_EPS);
  222. ASSERT_DBL_NEAR_TOL(y2[i], y1[i], DOUBLE_EPS);
  223. }
  224. }
  225. CTEST(axpy,saxpy_inc_0)
  226. {
  227. blasint i;
  228. blasint N=8,incX=0,incY=0;
  229. float a=0.25;
  230. float x1[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  231. float y1[]={2.0,4.0,6.0,8.0,2.0,4.0,6.0,8.0};
  232. float x2[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  233. float y2[]={4.0,4.0,6.0,8.0,2.0,4.0,6.0,8.0};
  234. //OpenBLAS
  235. BLASFUNC(saxpy)(&N,&a,x1,&incX,y1,&incY);
  236. for(i=0; i<N; i++){
  237. ASSERT_DBL_NEAR_TOL(x2[i], x1[i], DOUBLE_EPS);
  238. ASSERT_DBL_NEAR_TOL(y2[i], y1[i], DOUBLE_EPS);
  239. }
  240. }
  241. CTEST(axpy,caxpy_inc_0)
  242. {
  243. blasint i;
  244. blasint N=4,incX=0,incY=0;
  245. float a[2]={0.25,0.5};
  246. float x1[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  247. float y1[]={2.0,4.0,6.0,8.0,2.0,4.0,6.0,8.0};
  248. float x2[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  249. float y2[]={-3.0,9.0,6.0,8.0,2.0,4.0,6.0,8.0};
  250. //OpenBLAS
  251. BLASFUNC(caxpy)(&N,a,x1,&incX,y1,&incY);
  252. for(i=0; i<2*N; i++){
  253. ASSERT_DBL_NEAR_TOL(x2[i], x1[i], DOUBLE_EPS);
  254. ASSERT_DBL_NEAR_TOL(y2[i], y1[i], DOUBLE_EPS);
  255. }
  256. }
  257. CTEST( zdotu,zdotu_n_1)
  258. {
  259. blasint N=1,incX=1,incY=1;
  260. double x1[]={1.0,1.0};
  261. double y1[]={1.0,2.0};
  262. openblas_complex_double result1=openblas_make_complex_double(0.0,0.0);
  263. openblas_complex_double result2=openblas_make_complex_double(-1.0,3.0);
  264. #ifdef RETURN_BY_STACK
  265. BLASFUNC(zdotu)(&result1,&N,x1,&incX,y1,&incY);
  266. #else
  267. result1=BLASFUNC(zdotu)(&N,x1,&incX,y1,&incY);
  268. #endif
  269. #ifdef OPENBLAS_COMPLEX_STRUCT
  270. ASSERT_DBL_NEAR_TOL(result2.real, result1.real, DOUBLE_EPS);
  271. ASSERT_DBL_NEAR_TOL(result2.imag, result1.imag, DOUBLE_EPS);
  272. #else
  273. ASSERT_DBL_NEAR_TOL(creal(result2), creal(result1), DOUBLE_EPS);
  274. ASSERT_DBL_NEAR_TOL(cimag(result2), cimag(result1), DOUBLE_EPS);
  275. #endif
  276. }
  277. CTEST(zdotu, zdotu_offset_1)
  278. {
  279. blasint N=1,incX=1,incY=1;
  280. double x1[]={1.0,2.0,3.0,4.0};
  281. double y1[]={5.0,6.0,7.0,8.0};
  282. openblas_complex_double result1=openblas_make_complex_double(0.0,0.0);
  283. openblas_complex_double result2=openblas_make_complex_double(-9.0,32.0);
  284. #ifdef RETURN_BY_STACK
  285. BLASFUNC(zdotu)(&result1,&N,x1+1,&incX,y1+1,&incY);
  286. #else
  287. result1=BLASFUNC(zdotu)(&N,x1+1,&incX,y1+1,&incY);
  288. #endif
  289. #ifdef OPENBLAS_COMPLEX_STRUCT
  290. ASSERT_DBL_NEAR_TOL(result2.real, result1.real, DOUBLE_EPS);
  291. ASSERT_DBL_NEAR_TOL(result2.imag, result1.imag, DOUBLE_EPS);
  292. #else
  293. ASSERT_DBL_NEAR_TOL(creal(result2), creal(result1), DOUBLE_EPS);
  294. ASSERT_DBL_NEAR_TOL(cimag(result2), cimag(result1), DOUBLE_EPS);
  295. #endif
  296. }
  297. CTEST(dsdot,dsdot_n_1)
  298. {
  299. float x= 0.172555164F;
  300. float y= -0.0138700781F;
  301. blasint incx=1;
  302. blasint incy=1;
  303. blasint n=1;
  304. double res1=0.0f, res2=-0.00239335360107;
  305. res1=BLASFUNC(dsdot)(&n, &x, &incx, &y, &incy);
  306. ASSERT_DBL_NEAR_TOL(res2, res1, DOUBLE_EPS);
  307. }
  308. #if defined(BUILD_DOUBLE)
  309. CTEST(dnrm2,dnrm2_inf)
  310. {
  311. #ifndef INFINITY
  312. #define INFINITY HUGE_VAL
  313. #endif
  314. int i;
  315. double x[29];
  316. blasint incx=1;
  317. blasint n=28;
  318. double res1=0.0f, res2=INFINITY;
  319. for (i=0;i<n;i++)x[i]=0.0f;
  320. x[10]=-INFINITY;
  321. res1=BLASFUNC(dnrm2)(&n, x, &incx);
  322. ASSERT_DBL_NEAR_TOL(res2, res1, DOUBLE_EPS);
  323. }
  324. CTEST(dnrm2,dnrm2_tiny)
  325. {
  326. int i;
  327. double x[29];
  328. blasint incx=1;
  329. blasint n=28;
  330. double res1=0.0f, res2=0.0f;
  331. for (i=0;i<n;i++)x[i]=7.457008414e-310;
  332. res1=BLASFUNC(dnrm2)(&n, x, &incx);
  333. ASSERT_DBL_NEAR_TOL(res2, res1, DOUBLE_EPS);
  334. }
  335. #endif
  336. CTEST(rot,drot_inc_0)
  337. {
  338. blasint i=0;
  339. blasint N=4,incX=0,incY=0;
  340. double c=0.25,s=0.5;
  341. double x1[]={1.0,3.0,5.0,7.0};
  342. double y1[]={2.0,4.0,6.0,8.0};
  343. double x2[]={-0.21484375000000,3.0,5.0,7.0};
  344. double y2[]={ 0.03906250000000,4.0,6.0,8.0};
  345. //OpenBLAS
  346. BLASFUNC(drot)(&N,x1,&incX,y1,&incY,&c,&s);
  347. for(i=0; i<N; i++){
  348. ASSERT_DBL_NEAR_TOL(x2[i], x1[i], DOUBLE_EPS);
  349. ASSERT_DBL_NEAR_TOL(y2[i], y1[i], DOUBLE_EPS);
  350. }
  351. }
  352. CTEST(rot,zdrot_inc_0)
  353. {
  354. blasint i=0;
  355. blasint N=4,incX=0,incY=0;
  356. double c=0.25,s=0.5;
  357. double x1[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  358. double y1[]={2.0,4.0,6.0,8.0,2.0,4.0,6.0,8.0};
  359. double x2[]={-0.21484375000000,-0.45703125000000 ,5.0,7.0,1.0,3.0,5.0,7.0};
  360. double y2[]={ 0.03906250000000, 0.17187500000000 ,6.0,8.0,2.0,4.0,6.0,8.0};
  361. //OpenBLAS
  362. BLASFUNC(zdrot)(&N,x1,&incX,y1,&incY,&c,&s);
  363. for(i=0; i<2*N; i++){
  364. ASSERT_DBL_NEAR_TOL(x2[i], x1[i], DOUBLE_EPS);
  365. ASSERT_DBL_NEAR_TOL(y2[i], y1[i], DOUBLE_EPS);
  366. }
  367. }
  368. CTEST(rot,srot_inc_0)
  369. {
  370. blasint i=0;
  371. blasint N=4,incX=0,incY=0;
  372. float c=0.25,s=0.5;
  373. float x1[]={1.0,3.0,5.0,7.0};
  374. float y1[]={2.0,4.0,6.0,8.0};
  375. float x2[]={-0.21484375000000,3.0,5.0,7.0};
  376. float y2[]={ 0.03906250000000,4.0,6.0,8.0};
  377. //OpenBLAS
  378. BLASFUNC(srot)(&N,x1,&incX,y1,&incY,&c,&s);
  379. for(i=0; i<N; i++){
  380. ASSERT_DBL_NEAR_TOL(x2[i], x1[i], SINGLE_EPS);
  381. ASSERT_DBL_NEAR_TOL(y2[i], y1[i], SINGLE_EPS);
  382. }
  383. }
  384. CTEST(rot, csrot_inc_0)
  385. {
  386. blasint i=0;
  387. blasint N=4,incX=0,incY=0;
  388. float c=0.25,s=0.5;
  389. float x1[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  390. float y1[]={2.0,4.0,6.0,8.0,2.0,4.0,6.0,8.0};
  391. float x2[]={-0.21484375000000,-0.45703125000000 ,5.0,7.0,1.0,3.0,5.0,7.0};
  392. float y2[]={ 0.03906250000000, 0.17187500000000 ,6.0,8.0,2.0,4.0,6.0,8.0};
  393. //OpenBLAS
  394. BLASFUNC(csrot)(&N,x1,&incX,y1,&incY,&c,&s);
  395. for(i=0; i<2*N; i++){
  396. ASSERT_DBL_NEAR_TOL(x2[i], x1[i], SINGLE_EPS);
  397. ASSERT_DBL_NEAR_TOL(y2[i], y1[i], SINGLE_EPS);
  398. }
  399. }
  400. CTEST(swap,dswap_inc_0)
  401. {
  402. blasint i=0;
  403. blasint N=4,incX=0,incY=0;
  404. double x1[]={1.0,3.0,5.0,7.0};
  405. double y1[]={2.0,4.0,6.0,8.0};
  406. double x2[]={1.0,3.0,5.0,7.0};
  407. double y2[]={2.0,4.0,6.0,8.0};
  408. //OpenBLAS
  409. BLASFUNC(dswap)(&N,x1,&incX,y1,&incY);
  410. for(i=0; i<N; i++){
  411. ASSERT_DBL_NEAR_TOL(x2[i], x1[i], DOUBLE_EPS);
  412. ASSERT_DBL_NEAR_TOL(y2[i], y1[i], DOUBLE_EPS);
  413. }
  414. }
  415. CTEST(swap,zswap_inc_0)
  416. {
  417. blasint i=0;
  418. blasint N=4,incX=0,incY=0;
  419. double x1[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  420. double y1[]={2.0,4.0,6.0,8.0,2.0,4.0,6.0,8.0};
  421. double x2[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  422. double y2[]={2.0,4.0,6.0,8.0,2.0,4.0,6.0,8.0};
  423. //OpenBLAS
  424. BLASFUNC(zswap)(&N,x1,&incX,y1,&incY);
  425. for(i=0; i<2*N; i++){
  426. ASSERT_DBL_NEAR_TOL(x2[i], x1[i], DOUBLE_EPS);
  427. ASSERT_DBL_NEAR_TOL(y2[i], y1[i], DOUBLE_EPS);
  428. }
  429. }
  430. CTEST(swap,sswap_inc_0)
  431. {
  432. blasint i=0;
  433. blasint N=4,incX=0,incY=0;
  434. float x1[]={1.0,3.0,5.0,7.0};
  435. float y1[]={2.0,4.0,6.0,8.0};
  436. float x2[]={1.0,3.0,5.0,7.0};
  437. float y2[]={2.0,4.0,6.0,8.0};
  438. //OpenBLAS
  439. BLASFUNC(sswap)(&N,x1,&incX,y1,&incY);
  440. for(i=0; i<N; i++){
  441. ASSERT_DBL_NEAR_TOL(x2[i], x1[i], SINGLE_EPS);
  442. ASSERT_DBL_NEAR_TOL(y2[i], y1[i], SINGLE_EPS);
  443. }
  444. }
  445. CTEST(swap,cswap_inc_0)
  446. {
  447. blasint i=0;
  448. blasint N=4,incX=0,incY=0;
  449. float x1[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  450. float y1[]={2.0,4.0,6.0,8.0,2.0,4.0,6.0,8.0};
  451. float x2[]={1.0,3.0,5.0,7.0,1.0,3.0,5.0,7.0};
  452. float y2[]={2.0,4.0,6.0,8.0,2.0,4.0,6.0,8.0};
  453. //OpenBLAS
  454. BLASFUNC(cswap)(&N,x1,&incX,y1,&incY);
  455. for(i=0; i<2*N; i++){
  456. ASSERT_DBL_NEAR_TOL(x2[i], x1[i], SINGLE_EPS);
  457. ASSERT_DBL_NEAR_TOL(y2[i], y1[i], SINGLE_EPS);
  458. }
  459. }
  460. CTEST(min, smin_negative){
  461. blasint N=3, inc=1;
  462. float te_min=0.0, tr_min=0.0;
  463. float x[]={-1.1, -2.2, -3.3};
  464. te_min=BLASFUNC(smin)(&N, x, &inc);
  465. tr_min=-3.3;
  466. ASSERT_DBL_NEAR_TOL((double)(tr_min), (double)(te_min), SINGLE_EPS);
  467. }
  468. CTEST(min, dmin_positive){
  469. blasint N=3, inc=1;
  470. double te_min=0.0, tr_min=0.0;
  471. double x[]={1.1, 0.0, 3.3};
  472. te_min=BLASFUNC(dmin)(&N, x, &inc);
  473. tr_min=0.0;
  474. ASSERT_DBL_NEAR_TOL((double)(tr_min), (double)(te_min), DOUBLE_EPS);
  475. }
  476. CTEST(min, smin_zero){
  477. blasint N=3, inc=1;
  478. float te_min=0.0, tr_min=0.0;
  479. float x[]={1.1, 2.2, 0.0};
  480. te_min=BLASFUNC(smin)(&N, x, &inc);
  481. tr_min=0.0;
  482. ASSERT_DBL_NEAR_TOL((double)(tr_min), (double)(te_min), SINGLE_EPS);
  483. }
  484. CTEST(max, smax_negative){
  485. blasint N=3, inc=1;
  486. float te_max=0.0, tr_max=0.0;
  487. float x[]={-1.1, -2.2, -3.3};
  488. te_max=BLASFUNC(smax)(&N, x, &inc);
  489. tr_max=-1.1;
  490. ASSERT_DBL_NEAR_TOL((double)(tr_max), (double)(te_max), SINGLE_EPS);
  491. }
  492. CTEST(max, dmax_positive){
  493. blasint N=3, inc=1;
  494. double te_max=0.0, tr_max=0.0;
  495. double x[]={1.1, 0.0, 3.3};
  496. te_max=BLASFUNC(dmax)(&N, x, &inc);
  497. tr_max=3.3;
  498. ASSERT_DBL_NEAR_TOL((double)(tr_max), (double)(te_max), DOUBLE_EPS);
  499. }
  500. CTEST(max, smax_zero){
  501. blasint N=3, inc=1;
  502. float te_max=0.0, tr_max=0.0;
  503. float x[]={-1.1, -2.2, 0.0};
  504. te_max=BLASFUNC(smax)(&N, x, &inc);
  505. tr_max=0.0;
  506. ASSERT_DBL_NEAR_TOL((double)(tr_max), (double)(te_max), SINGLE_EPS);
  507. }
  508. CTEST(zscal, i_nan)
  509. {
  510. double i[] = {0,1, 0,1, 0,1, 0,1, 0,1, 0,1, 0,1, 0,1, 0,1 };
  511. double nan[] = {NAN,0, NAN,0, NAN,0, NAN,0, NAN,0, NAN,0, NAN,0, NAN,0, NAN,0, NAN,0};
  512. cblas_zscal(9, i, &nan, 1);
  513. ASSERT_TRUE(isnan(nan[0]));
  514. ASSERT_TRUE(isnan(nan[1]));
  515. ASSERT_TRUE(isnan(nan[16]));
  516. ASSERT_TRUE(isnan(nan[17]));
  517. }
  518. CTEST(zscal, nan_i)
  519. {
  520. double i[] = {0,1, 0,1, 0,1, 0,1, 0,1, 0,1, 0,1, 0,1, 0,1 };
  521. double nan[] = {NAN,0, NAN,0, NAN,0, NAN,0, NAN,0, NAN,0, NAN,0, NAN,0, NAN,0, NAN,0};
  522. cblas_zscal(9, &nan, &i, 1);
  523. ASSERT_TRUE(isnan(i[0]));
  524. ASSERT_TRUE(isnan(i[1]));
  525. ASSERT_TRUE(isnan(i[16]));
  526. ASSERT_TRUE(isnan(i[17]));
  527. }
  528. CTEST(zscal, i_inf)
  529. {
  530. double i[] = {0,1, 0,1, 0,1, 0,1, 0,1, 0,1, 0,1, 0,1, 0,1 };
  531. double inf[] = {INFINITY, 0, INFINITY,0, INFINITY,0, INFINITY,0, INFINITY,0, INFINITY,0, INFINITY,0, INFINITY,0, INFINITY,0};
  532. cblas_zscal(9, i, &inf, 1);
  533. ASSERT_TRUE(isnan(inf[0]));
  534. ASSERT_TRUE(isinf(inf[1]));
  535. ASSERT_TRUE(isnan(inf[16]));
  536. ASSERT_TRUE(isinf(inf[17]));
  537. }
  538. CTEST(zscal, inf_i)
  539. {
  540. double i[] = {0,1, 0,1, 0,1, 0,1, 0,1, 0,1, 0,1, 0,1, 0,1 };
  541. double inf[] = {INFINITY, 0, INFINITY,0, INFINITY,0, INFINITY,0, INFINITY,0, INFINITY,0, INFINITY,0, INFINITY,0, INFINITY,0};
  542. cblas_zscal(9, &inf, &i, 1);
  543. ASSERT_TRUE(isnan(i[0]));
  544. ASSERT_TRUE(isinf(i[1]));
  545. ASSERT_TRUE(isnan(i[16]));
  546. ASSERT_TRUE(isinf(i[17]));
  547. }
  548. int main(int argc, const char ** argv){
  549. CTEST_ADD (amax, samax);
  550. CTEST_ADD (amax, damax);
  551. CTEST_ADD (min, smin_negative);
  552. CTEST_ADD (min, dmin_positive);
  553. CTEST_ADD (min, smin_zero);
  554. CTEST_ADD (max, smax_negative);
  555. CTEST_ADD (max, dmax_positive);
  556. CTEST_ADD (max, smax_zero);
  557. CTEST_ADD (drotmg,rotmg);
  558. CTEST_ADD (drotmg,rotmg_issue1452);
  559. CTEST_ADD (drotmg,rotmg_D1eqD2_X1eqX2);
  560. CTEST_ADD (drotmg,drotmg_D1_big_D2_big_flag_zero);
  561. CTEST_ADD (axpy,daxpy_inc_0);
  562. CTEST_ADD (axpy,zaxpy_inc_0);
  563. CTEST_ADD (axpy,saxpy_inc_0);
  564. CTEST_ADD (axpy,caxpy_inc_0);
  565. CTEST_ADD (zdotu,zdotu_n_1);
  566. CTEST_ADD (zdotu,zdotu_offset_1);
  567. CTEST_ADD (dsdot,dsdot_n_1);
  568. CTEST_ADD (dnrm2,dnrm2_inf);
  569. CTEST_ADD (dnrm2,dnrm2_tiny);
  570. CTEST_ADD (rot,drot_inc_0);
  571. CTEST_ADD (rot,zdrot_inc_0);
  572. CTEST_ADD (rot,srot_inc_0);
  573. CTEST_ADD (rot,csrot_inc_0);
  574. CTEST_ADD (swap,dswap_inc_0);
  575. CTEST_ADD (swap,zswap_inc_0);
  576. CTEST_ADD (swap,sswap_inc_0);
  577. CTEST_ADD (swap,cswap_inc_0);
  578. CTEST_ADD (zscal, i_nan);
  579. CTEST_ADD (zscal, nan_i);
  580. CTEST_ADD (zscal, i_inf);
  581. CTEST_ADD (zscal, inf_i);
  582. int num_fail=0;
  583. num_fail=ctest_main(argc, argv);
  584. return num_fail;
  585. }