Keep the flag handling separate from the scaling loops in rotmg (tags/v0.3.0)
| @@ -136,7 +136,7 @@ void CNAME(FLOAT *dd1, FLOAT *dd2, FLOAT *dx1, FLOAT dy1, FLOAT *dparam){ | |||
| if(*dd1 != ZERO) | |||
| { | |||
| while( (*dd1 <= RGAMSQ) || (*dd1 >= GAMSQ) ) | |||
| if( (*dd1 <= RGAMSQ) || (*dd1 >= GAMSQ) ) | |||
| { | |||
| if(dflag == ZERO) | |||
| { | |||
| @@ -146,33 +146,34 @@ void CNAME(FLOAT *dd1, FLOAT *dd2, FLOAT *dx1, FLOAT dy1, FLOAT *dparam){ | |||
| } | |||
| else | |||
| { | |||
| if(dflag == ONE) | |||
| { | |||
| dh21 = -ONE; | |||
| dh12 = ONE; | |||
| dflag = -ONE; | |||
| } | |||
| } | |||
| if( *dd1 <= RGAMSQ ) | |||
| { | |||
| *dd1 = *dd1 * (GAM * GAM); | |||
| *dx1 = *dx1 / GAM; | |||
| dh11 = dh11 / GAM; | |||
| dh12 = dh12 / GAM; | |||
| while (ABS(*dd1) <= RGAMSQ) { | |||
| *dd1 = *dd1 * (GAM * GAM); | |||
| *dx1 = *dx1 / GAM; | |||
| dh11 = dh11 / GAM; | |||
| dh12 = dh12 / GAM; | |||
| } | |||
| } | |||
| else | |||
| { | |||
| *dd1 = *dd1 / (GAM * GAM); | |||
| *dx1 = *dx1 * GAM; | |||
| dh11 = dh11 * GAM; | |||
| dh12 = dh12 * GAM; | |||
| while (ABS(*dd1) >= GAMSQ) { | |||
| *dd1 = *dd1 / (GAM * GAM); | |||
| *dx1 = *dx1 * GAM; | |||
| dh11 = dh11 * GAM; | |||
| dh12 = dh12 * GAM; | |||
| } | |||
| } | |||
| } | |||
| } | |||
| if(*dd2 != ZERO) | |||
| { | |||
| while( (ABS(*dd2) <= RGAMSQ) || (ABS(*dd2) >= GAMSQ) ) | |||
| if( (ABS(*dd2) <= RGAMSQ) || (ABS(*dd2) >= GAMSQ) ) | |||
| { | |||
| if(dflag == ZERO) | |||
| { | |||
| @@ -182,24 +183,25 @@ void CNAME(FLOAT *dd1, FLOAT *dd2, FLOAT *dx1, FLOAT dy1, FLOAT *dparam){ | |||
| } | |||
| else | |||
| { | |||
| if(dflag == ONE) | |||
| { | |||
| dh21 = -ONE; | |||
| dh12 = ONE; | |||
| dflag = -ONE; | |||
| } | |||
| } | |||
| if( ABS(*dd2) <= RGAMSQ ) | |||
| { | |||
| *dd2 = *dd2 * (GAM * GAM); | |||
| dh21 = dh21 / GAM; | |||
| dh22 = dh22 / GAM; | |||
| while (ABS(*dd2) <= RGAMSQ) { | |||
| *dd2 = *dd2 * (GAM * GAM); | |||
| dh21 = dh21 / GAM; | |||
| dh22 = dh22 / GAM; | |||
| } | |||
| } | |||
| else | |||
| { | |||
| *dd2 = *dd2 / (GAM * GAM); | |||
| dh21 = dh21 * GAM; | |||
| dh22 = dh22 * GAM; | |||
| while (ABS(*dd2) >= GAMSQ) { | |||
| *dd2 = *dd2 / (GAM * GAM); | |||
| dh21 = dh21 * GAM; | |||
| dh22 = dh22 * GAM; | |||
| } | |||
| } | |||
| } | |||
| } | |||
| @@ -7,6 +7,7 @@ else () | |||
| set(OpenBLAS_utest_src | |||
| utest_main.c | |||
| test_amax.c | |||
| test_rotmg.c | |||
| ) | |||
| endif () | |||
| @@ -8,8 +8,8 @@ UTESTBIN=openblas_utest | |||
| include $(TOPDIR)/Makefile.system | |||
| OBJS=utest_main.o test_amax.o | |||
| #test_rot.o test_swap.o test_axpy.o test_dotu.o test_rotmg.o test_dsdot.o test_fork.o | |||
| OBJS=utest_main.o test_amax.o test_rotmg.o | |||
| #test_rot.o test_swap.o test_axpy.o test_dotu.o test_dsdot.o test_fork.o | |||
| ifneq ($(NO_LAPACK), 1) | |||
| #OBJS += test_potrs.o | |||
| @@ -31,9 +31,9 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||
| **********************************************************************************/ | |||
| #include "common_utest.h" | |||
| #include "openblas_utest.h" | |||
| void test_drotmg() | |||
| CTEST (drotmg,rotmg) | |||
| { | |||
| double te_d1, tr_d1; | |||
| double te_d2, tr_d2; | |||
| @@ -42,31 +42,92 @@ void test_drotmg() | |||
| double te_param[5]; | |||
| double tr_param[5]; | |||
| int i=0; | |||
| te_d1= tr_d1=0.21149573940783739; | |||
| te_d2= tr_d2=0.046892057172954082; | |||
| te_x1= tr_x1=-0.42272687517106533; | |||
| te_y1= tr_y1=0.42211309121921659; | |||
| // original test case for libGoto bug fixed by feb2014 rewrite | |||
| te_d1= 0.21149573940783739; | |||
| te_d2= 0.046892057172954082; | |||
| te_x1= -0.42272687517106533; | |||
| te_y1= 0.42211309121921659; | |||
| for(i=0; i<5; i++){ | |||
| te_param[i]=tr_param[i]=0.0; | |||
| } | |||
| //reference values as calculated by netlib blas | |||
| tr_d1= 0.1732048; | |||
| tr_d2= 0.03840234; | |||
| tr_x1= -0.516180; | |||
| tr_y1= 0.422113; | |||
| tr_d1= 0.17320483687975; | |||
| tr_d2= 0.03840233915037; | |||
| tr_x1= -0.51618034832329; | |||
| tr_y1= 0.42211309121922; | |||
| tr_param[0]= 0.0; | |||
| tr_param[1]= 0.0; | |||
| tr_param[2]= 0.99854803659786; | |||
| tr_param[3]= -0.22139439665872; | |||
| tr_param[4]= 0.0; | |||
| BLASFUNC(drotmg)(&te_d1, &te_d2, &te_x1, &te_y1, te_param); | |||
| ASSERT_DBL_NEAR_TOL(te_d1, tr_d1, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_d2, tr_d2, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_x1, tr_x1, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_y1, tr_y1, DOUBLE_EPS); | |||
| for(i=0; i<5; i++){ | |||
| ASSERT_DBL_NEAR_TOL(te_param[i], tr_param[i], DOUBLE_EPS); | |||
| } | |||
| } | |||
| CTEST (drotmg,rotmg_issue1452) | |||
| { | |||
| double te_d1, tr_d1; | |||
| double te_d2, tr_d2; | |||
| double te_x1, tr_x1; | |||
| double te_y1, tr_y1; | |||
| double te_param[5]; | |||
| double tr_param[5]; | |||
| int i=0; | |||
| // from issue #1452, buggy version returned 0.000244 for param[3] | |||
| te_d1 = 5.9e-8; | |||
| te_d2 = 5.960464e-8; | |||
| te_x1 = 1.0; | |||
| te_y1 = 150.0; | |||
| for(i=0; i<5; i++){ | |||
| te_param[i]=tr_param[i]=0.0; | |||
| } | |||
| //reference values as calculated by netlib blas | |||
| tr_d1= 0.99995592822897; | |||
| tr_d2= 0.98981219860583; | |||
| tr_x1= 0.03662270484346; | |||
| tr_y1= 150.000000000000; | |||
| tr_param[0]= -1.0; | |||
| tr_param[1]= 0.00000161109346; | |||
| tr_param[2]= -0.00024414062500; | |||
| tr_param[3]= 1.0; | |||
| tr_param[4]= 0.00000162760417; | |||
| //OpenBLAS | |||
| BLASFUNC(drotmg)(&te_d1, &te_d2, &te_x1, &te_y1, te_param); | |||
| //reference | |||
| BLASFUNC_REF(drotmg)(&tr_d1, &tr_d2, &tr_x1, &tr_y1, tr_param); | |||
| CU_ASSERT_DOUBLE_EQUAL(te_d1, tr_d1, CHECK_EPS); | |||
| CU_ASSERT_DOUBLE_EQUAL(te_d2, tr_d2, CHECK_EPS); | |||
| CU_ASSERT_DOUBLE_EQUAL(te_x1, tr_x1, CHECK_EPS); | |||
| CU_ASSERT_DOUBLE_EQUAL(te_y1, tr_y1, CHECK_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_d1, tr_d1, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_d2, tr_d2, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_x1, tr_x1, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_y1, tr_y1, DOUBLE_EPS); | |||
| for(i=0; i<5; i++){ | |||
| CU_ASSERT_DOUBLE_EQUAL(te_param[i], tr_param[i], CHECK_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_param[i], tr_param[i], DOUBLE_EPS); | |||
| } | |||
| } | |||
| void test_drotmg_D1eqD2_X1eqX2() | |||
| CTEST(drotmg, rotmg_D1eqD2_X1eqX2) | |||
| { | |||
| double te_d1, tr_d1; | |||
| double te_d2, tr_d2; | |||
| @@ -83,18 +144,28 @@ void test_drotmg_D1eqD2_X1eqX2() | |||
| for(i=0; i<5; i++){ | |||
| te_param[i]=tr_param[i]=0.0; | |||
| } | |||
| //reference values as calculated by netlib blas | |||
| tr_d1= 1.0; | |||
| tr_d2= 1.0; | |||
| tr_x1= 16.0; | |||
| tr_y1= 8.0; | |||
| tr_param[0]=1.0; | |||
| tr_param[1]=1.0; | |||
| tr_param[2]=0.0; | |||
| tr_param[3]=0.0; | |||
| tr_param[4]=1.0; | |||
| //OpenBLAS | |||
| BLASFUNC(drotmg)(&te_d1, &te_d2, &te_x1, &te_y1, te_param); | |||
| //reference | |||
| BLASFUNC_REF(drotmg)(&tr_d1, &tr_d2, &tr_x1, &tr_y1, tr_param); | |||
| CU_ASSERT_DOUBLE_EQUAL(te_d1, tr_d1, CHECK_EPS); | |||
| CU_ASSERT_DOUBLE_EQUAL(te_d2, tr_d2, CHECK_EPS); | |||
| CU_ASSERT_DOUBLE_EQUAL(te_x1, tr_x1, CHECK_EPS); | |||
| CU_ASSERT_DOUBLE_EQUAL(te_y1, tr_y1, CHECK_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_d1, tr_d1, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_d2, tr_d2, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_x1, tr_x1, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_y1, tr_y1, DOUBLE_EPS); | |||
| for(i=0; i<5; i++){ | |||
| CU_ASSERT_DOUBLE_EQUAL(te_param[i], tr_param[i], CHECK_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_param[i], tr_param[i], DOUBLE_EPS); | |||
| } | |||
| } | |||
| @@ -49,6 +49,140 @@ CTEST(amax, samax){ | |||
| ASSERT_DBL_NEAR_TOL((double)(tr_max), (double)(te_max), SINGLE_EPS); | |||
| } | |||
| CTEST (drotmg,rotmg){ /* Runs drotmg on fixed inputs and compares d1, d2, x1, y1 and the five param entries with hard-coded reference values. */ | |||
| double te_d1, tr_d1; /* te_* are passed to drotmg; tr_* hold the values they are compared against */ | |||
| double te_d2, tr_d2; | |||
| double te_x1, tr_x1; | |||
| double te_y1, tr_y1; | |||
| double te_param[5]; | |||
| double tr_param[5]; | |||
| int i=0; | |||
| // original test case for libGoto bug fixed by feb2014 rewrite | |||
| te_d1= 0.21149573940783739; | |||
| te_d2= 0.046892057172954082; | |||
| te_x1= -0.42272687517106533; | |||
| te_y1= 0.42211309121921659; | |||
| for(i=0; i<5; i++){ /* zero both arrays; every tr_param entry is assigned again below */ | |||
| te_param[i]=tr_param[i]=0.0; | |||
| } | |||
| //reference values as calculated by netlib blas | |||
| tr_d1= 0.1732048; /* this and the next three low-precision values are overwritten by the four assignments that follow */ | |||
| tr_d2= 0.03840234; | |||
| tr_x1= -0.516180; | |||
| tr_y1= 0.422113; | |||
| tr_d1= 0.17320483687975; /* values actually used in the comparisons */ | |||
| tr_d2= 0.03840233915037; | |||
| tr_x1= -0.51618034832329; | |||
| tr_y1= 0.42211309121922; | |||
| tr_param[0]= 0.0; | |||
| tr_param[1]= 0.0; | |||
| tr_param[2]= 0.99854803659786; | |||
| tr_param[3]= -0.22139439665872; | |||
| tr_param[4]= 0.0; | |||
| BLASFUNC(drotmg)(&te_d1, &te_d2, &te_x1, &te_y1, te_param); /* routine under test; receives pointers to the te_* variables */ | |||
| ASSERT_DBL_NEAR_TOL(te_d1, tr_d1, DOUBLE_EPS); /* each te_* value is checked against its tr_* counterpart with tolerance DOUBLE_EPS */ | |||
| ASSERT_DBL_NEAR_TOL(te_d2, tr_d2, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_x1, tr_x1, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_y1, tr_y1, DOUBLE_EPS); | |||
| for(i=0; i<5; i++){ /* compare all five param entries */ | |||
| ASSERT_DBL_NEAR_TOL(te_param[i], tr_param[i], DOUBLE_EPS); | |||
| } | |||
| } | |||
| CTEST (drotmg,rotmg_issue1452){ /* Runs drotmg on the inputs from issue #1452 and compares every output with hard-coded reference values. */ | |||
| double te_d1, tr_d1; /* te_* are passed to drotmg; tr_* hold the values they are compared against */ | |||
| double te_d2, tr_d2; | |||
| double te_x1, tr_x1; | |||
| double te_y1, tr_y1; | |||
| double te_param[5]; | |||
| double tr_param[5]; | |||
| int i=0; | |||
| // from issue #1452, buggy version returned 0.000244 for param[3] | |||
| te_d1 = 5.9e-8; | |||
| te_d2 = 5.960464e-8; | |||
| te_x1 = 1.0; | |||
| te_y1 = 150.0; | |||
| for(i=0; i<5; i++){ /* zero both arrays; every tr_param entry is assigned again below */ | |||
| te_param[i]=tr_param[i]=0.0; | |||
| } | |||
| //reference values as calculated by netlib blas | |||
| tr_d1= 0.99995592822897; | |||
| tr_d2= 0.98981219860583; | |||
| tr_x1= 0.03662270484346; | |||
| tr_y1= 150.000000000000; | |||
| tr_param[0]= -1.0; | |||
| tr_param[1]= 0.00000161109346; | |||
| tr_param[2]= -0.00024414062500; | |||
| tr_param[3]= 1.0; /* the entry the issue comment above says was returned incorrectly */ | |||
| tr_param[4]= 0.00000162760417; | |||
| //OpenBLAS | |||
| BLASFUNC(drotmg)(&te_d1, &te_d2, &te_x1, &te_y1, te_param); | |||
| ASSERT_DBL_NEAR_TOL(te_d1, tr_d1, DOUBLE_EPS); /* each te_* value is checked against its tr_* counterpart with tolerance DOUBLE_EPS */ | |||
| ASSERT_DBL_NEAR_TOL(te_d2, tr_d2, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_x1, tr_x1, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_y1, tr_y1, DOUBLE_EPS); | |||
| for(i=0; i<5; i++){ /* compare all five param entries */ | |||
| ASSERT_DBL_NEAR_TOL(te_param[i], tr_param[i], DOUBLE_EPS); | |||
| } | |||
| } | |||
| CTEST(drotmg, rotmg_D1eqD2_X1eqX2){ /* Runs drotmg with d1 == d2 (2.0) and x1 == y1 (8.0) and compares every output with hard-coded reference values. */ | |||
| double te_d1, tr_d1; /* te_* are passed to drotmg; tr_* hold the values they are compared against */ | |||
| double te_d2, tr_d2; | |||
| double te_x1, tr_x1; | |||
| double te_y1, tr_y1; | |||
| double te_param[5]; | |||
| double tr_param[5]; | |||
| int i=0; | |||
| te_d1= tr_d1=2.; /* the tr_* halves of these four chained assignments are overwritten by the reference values below */ | |||
| te_d2= tr_d2=2.; | |||
| te_x1= tr_x1=8.; | |||
| te_y1= tr_y1=8.; | |||
| for(i=0; i<5; i++){ /* zero both arrays; every tr_param entry is assigned again below */ | |||
| te_param[i]=tr_param[i]=0.0; | |||
| } | |||
| //reference values as calculated by netlib blas | |||
| tr_d1= 1.0; | |||
| tr_d2= 1.0; | |||
| tr_x1= 16.0; | |||
| tr_y1= 8.0; | |||
| tr_param[0]=1.0; | |||
| tr_param[1]=1.0; | |||
| tr_param[2]=0.0; | |||
| tr_param[3]=0.0; | |||
| tr_param[4]=1.0; | |||
| //OpenBLAS | |||
| BLASFUNC(drotmg)(&te_d1, &te_d2, &te_x1, &te_y1, te_param); | |||
| ASSERT_DBL_NEAR_TOL(te_d1, tr_d1, DOUBLE_EPS); /* each te_* value is checked against its tr_* counterpart with tolerance DOUBLE_EPS */ | |||
| ASSERT_DBL_NEAR_TOL(te_d2, tr_d2, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_x1, tr_x1, DOUBLE_EPS); | |||
| ASSERT_DBL_NEAR_TOL(te_y1, tr_y1, DOUBLE_EPS); | |||
| for(i=0; i<5; i++){ /* compare all five param entries */ | |||
| ASSERT_DBL_NEAR_TOL(te_param[i], tr_param[i], DOUBLE_EPS); | |||
| } | |||
| } | |||
| int main(int argc, const char ** argv){ | |||
| CTEST_ADD(amax, samax); | |||