Use Test::PDL's is_pdl in the Basic and GLM tests, replacing the local tapprox helper

mohawk2 · mohawk2 · commit 46336b54e18e · 2024-11-22T03:25:28.000Z
diff --git a/Makefile.PL b/Makefile.PL
@@ -32,6 +32,7 @@ WriteMakefile(
     },
     TEST_REQUIRES => {
         'Test::More' => '0.88', # done_testing
+        'Test::PDL' => '0.21',
     },
     $got_PDL ? () : (DIR => []), # just write MYMETA if no PDL
     dist                => { PREOP => 'gsl-config --version && $(PERL) -MPDL::Core::Dev -e pdlpp_mkgen $(DISTVNAME)' },
diff --git a/t/stats_basic.t b/t/stats_basic.t
@@ -5,120 +5,113 @@ use Test::More;
 use PDL::LiteF;
 use PDL::NiceSlice;
 use PDL::Stats::Basic;
-
-sub tapprox {
-  my($a,$b, $eps) = @_;
-  $eps ||= 1e-6;
-  my $diff = abs($a-$b);
-    # use max to make it perl scalar
-  ref $diff eq 'PDL' and $diff = $diff->max;
-  return $diff < $eps;
-}
+use Test::PDL;
 
 my $a = sequence 5;
-
-is( tapprox( $a->stdv, 1.4142135623731 ), 1, "standard deviation of $a");
-is( tapprox( $a->stdv_unbiased, 1.58113883008419 ), 1, "unbiased standard deviation of $a");
-is( tapprox( $a->var, 2 ), 1, "variance of $a");
-is( tapprox( $a->var_unbiased, 2.5 ), 1, "unbiased variance of $a");
-is( tapprox( $a->se, 0.707106781186548 ), 1, "standard error of $a");
-is( tapprox( $a->ss, 10 ), 1, "sum of squared deviations from the mean of $a");
-is( tapprox( $a->skew, 0 ), 1, "sample skewness of $a");
-is( tapprox( $a->skew_unbiased, 0 ), 1, "unbiased sample skewness of $a");
-is( tapprox( $a->kurt, -1.3 ), 1, "sample kurtosis of $a");
-is( tapprox( $a->kurt_unbiased, -1.2 ), 1, "unbiased sample kurtosis of $a");
-
-{
-  ok(tapprox($_->ss, (($_ - $_->avg)**2)->sum), "ss for $_") for
-    pdl('[1 1 1 1 2 3 4 4 4 4 4 4]'),
-    pdl('[1 2 2 2 3 3 3 3 4 4 5 5]'),
-    pdl('[1 1 1 2 2 3 3 4 4 5 5 5]');
-}
+is_pdl $a->stdv, pdl( 1.4142135623731 ), "standard deviation of $a";
+is_pdl $a->stdv_unbiased, pdl( 1.58113883008419 ), "unbiased standard deviation of $a";
+is_pdl $a->var, pdl( 2 ), "variance of $a";
+is_pdl $a->var_unbiased, pdl( 2.5 ), "unbiased variance of $a";
+is_pdl $a->se, pdl( 0.707106781186548 ), "standard error of $a";
+is_pdl $a->ss, pdl( 10 ), "sum of squared deviations from the mean of $a";
+is_pdl $a->skew, pdl( 0 ), "sample skewness of $a";
+is_pdl $a->skew_unbiased, pdl( 0 ), "unbiased sample skewness of $a";
+is_pdl $a->kurt, pdl( -1.3 ), "sample kurtosis of $a";
+is_pdl $a->kurt_unbiased, pdl( -1.2 ), "unbiased sample kurtosis of $a";
+
+is_pdl $_->ss, (($_ - $_->avg)**2)->sumover, "ss for $_" for
+  pdl('[1 1 1 1 2 3 4 4 4 4 4 4]'),
+  pdl('[1 2 2 2 3 3 3 3 4 4 5 5]'),
+  pdl('[1 1 1 2 2 3 3 4 4 5 5 5]');
 
 my $a_bad = sequence 6;
 $a_bad->setbadat(-1);
-
-is( tapprox( $a_bad->stdv, 1.4142135623731 ), 1, "standard deviation of $a_bad");
-is( tapprox( $a_bad->stdv_unbiased, 1.58113883008419 ), 1, "unbiased standard deviation of $a_bad");
-is( tapprox( $a_bad->var, 2 ), 1, "variance of $a_bad");
-is( tapprox( $a_bad->var_unbiased, 2.5 ), 1, "unbiased variance of $a_bad");
-is( tapprox( $a_bad->se, 0.707106781186548 ), 1, "standard error of $a_bad");
-is( tapprox( $a_bad->ss, 10 ), 1, "sum of squared deviations from the mean of $a_bad");
-is( tapprox( $a_bad->skew, 0 ), 1, "sample skewness of $a_bad");
-is( tapprox( $a_bad->skew_unbiased, 0 ), 1, "unbiased sample skewness of $a_bad");
-is( tapprox( $a_bad->kurt, -1.3 ), 1, "sample kurtosis of $a_bad");
-is( tapprox( $a_bad->kurt_unbiased, -1.2 ), 1, "unbiased sample kurtosis of $a_bad");
-
-my $b = sequence 5;
-$b %= 2;
-$b = qsort $b;
-
-is( tapprox( $a->cov($b), 0.6 ), 1, "sample covariance of $a and $b" );
-is( tapprox( $a->corr($b), 0.866025403784439 ), 1, "Pearson correlation coefficient of $a and $b");
-is( tapprox( $a->n_pair($b), 5 ), 1, "Number of good pairs between $a and $b");
-is( tapprox( $a->corr($b)->t_corr( 5 ), 3 ), 1, "t significance test of Pearson correlation coefficient of $a and $b");
-is( tapprox( $a->corr_dev($b), 0.903696114115064 ), 1, "correlation calculated from dev_m values of $a and $b");
-
-my $b_bad = sequence 6;
-$b_bad = qsort( $b_bad % 2 );
-$b_bad->setbadat(0);
-
-is( tapprox( $a_bad->cov($b_bad), 0.5 ), 1, "sample covariance with bad data of $a_bad and $b_bad");
-is( tapprox( $a_bad->corr($b_bad), 0.894427190999916 ), 1, "Pearson correlation coefficient with bad data of $a_bad and $b_bad");
-is( tapprox( $a_bad->n_pair($b_bad), 4 ), 1, "Number of good pairs between $a_bad and $b_bad with bad values taken into account");
-is( tapprox( $a_bad->corr($b_bad)->t_corr( 4 ), 2.82842712474619 ), 1, "t signifiance test of Pearson correlation coefficient with bad data of $a_bad and $b_bad");
-is( tapprox( $a_bad->corr_dev($b_bad), 0.903696114115064 ), 1, "correlation calculated from dev_m values with bad data of $a_bad and $b_bad");
+is_pdl $a_bad->stdv, pdl( 1.4142135623731 ), "standard deviation of $a_bad";
+is_pdl $a_bad->stdv_unbiased, pdl( 1.58113883008419 ), "unbiased standard deviation of $a_bad";
+is_pdl $a_bad->var, pdl( 2 ), "variance of $a_bad";
+is_pdl $a_bad->var_unbiased, pdl( 2.5 ), "unbiased variance of $a_bad";
+is_pdl $a_bad->se, pdl( 0.707106781186548 ), "standard error of $a_bad";
+is_pdl $a_bad->ss, pdl( 10 ), "sum of squared deviations from the mean of $a_bad";
+is_pdl $a_bad->skew, pdl( 0 ), "sample skewness of $a_bad";
+is_pdl $a_bad->skew_unbiased, pdl( 0 ), "unbiased sample skewness of $a_bad";
+is_pdl $a_bad->kurt, pdl( -1.3 ), "sample kurtosis of $a_bad";
+is_pdl $a_bad->kurt_unbiased, pdl( -1.2 ), "unbiased sample kurtosis of $a_bad";
+
+my $b = pdl '0 0 0 1 1';
+is_pdl $a->cov($b), pdl( 0.6 ), "sample covariance of $a and $b";
+is_pdl $a->corr($b), pdl( 0.866025403784439 ), "Pearson correlation coefficient of $a and $b";
+is_pdl $a->n_pair($b), indx( 5 ), "Number of good pairs between $a and $b";
+is_pdl $a->corr($b)->t_corr( 5 ), pdl( 3 ), "t significance test of Pearson correlation coefficient of $a and $b";
+is_pdl $a->corr_dev($b), pdl( 0.903696114115064 ), "correlation calculated from dev_m values of $a and $b";
+
+my $b_bad = pdl 'BAD 0 0 1 1 1';
+is_pdl $a_bad->cov($b_bad), pdl( 0.5 ), "sample covariance with bad data of $a_bad and $b_bad";
+is_pdl $a_bad->corr($b_bad), pdl( 0.894427190999916 ), "Pearson correlation coefficient with bad data of $a_bad and $b_bad";
+is_pdl $a_bad->n_pair($b_bad), indx( 4 ), "Number of good pairs between $a_bad and $b_bad with bad values taken into account";
+is_pdl $a_bad->corr($b_bad)->t_corr( 4 ), pdl( 2.82842712474619 ), "t significance test of Pearson correlation coefficient with bad data of $a_bad and $b_bad";
+is_pdl $a_bad->corr_dev($b_bad), pdl( 0.903696114115064 ), "correlation calculated from dev_m values with bad data of $a_bad and $b_bad";
 
 my ($t, $df) = $a->t_test($b);
-is( tapprox( $t, 2.1380899352994 ), 1, "t-test between $a and $b - 't' output");
-is( tapprox( $df, 8 ), 1, "t-test between $a and $b - 'df' output");
+is_pdl $t, pdl( 2.1380899352994 ), "t-test between $a and $b - 't' output";
+is_pdl $df, pdl( 8 ), "t-test between $a and $b - 'df' output";
 
 ($t, $df) = $a->t_test_nev($b);
-is( tapprox( $t, 2.1380899352994 ), 1, "t-test with non-equal variance between $a and $b - 't' output");
-is( tapprox( $df, 4.94637223974763 ), 1, "t-test with non-equal variance between $a and $b - 'df' output");
+is_pdl $t, pdl( 2.1380899352994 ), "t-test with non-equal variance between $a and $b - 't' output";
+is_pdl $df, pdl( 4.94637223974763 ), "t-test with non-equal variance between $a and $b - 'df' output";
 
 ($t, $df) = $a->t_test_paired($b);
-is( tapprox( $t, 3.13785816221094 ), 1, "paired sample t-test between $a and $b - 't' output");
-is( tapprox( $df, 4 ), 1, "paired sample t-test between $a and $b - 'df' output");
+is_pdl $t, pdl( 3.13785816221094 ), "paired sample t-test between $a and $b - 't' output";
+is_pdl $df, pdl( 4 ), "paired sample t-test between $a and $b - 'df' output";
 
 ($t, $df) = $a_bad->t_test($b_bad);
-is( tapprox( $t, 1.87082869338697 ), 1, "t-test with bad values between $a_bad and $b_bad - 't' output");
-is( tapprox( $df, 8 ), 1, "t-test with bad values between $a_bad and $b_bad - 'd' output");
+is_pdl $t, pdl( 1.87082869338697 ), "t-test with bad values between $a_bad and $b_bad - 't' output";
+is_pdl $df, pdl( 8 ), "t-test with bad values between $a_bad and $b_bad - 'df' output";
 
 ($t, $df) = $a_bad->t_test_nev($b_bad);
-is( tapprox( $t, 1.87082869338697 ), 1, "t-test with non-equal variance with bad values between $a_bad and $b_bad - 't' output");
-is( tapprox( $df, 4.94637223974763 ), 1, "t-test with non-equal variance with bad values between $a_bad and $b_bad - 'df' output");
+is_pdl $t, pdl( 1.87082869338697 ), "t-test with non-equal variance with bad values between $a_bad and $b_bad - 't' output";
+is_pdl $df, pdl( 4.94637223974763 ), "t-test with non-equal variance with bad values between $a_bad and $b_bad - 'df' output";
 
 ($t, $df) = $a_bad->t_test_paired($b_bad);
-is( tapprox( $t, 4.89897948556636 ), 1, "paired sample t-test with bad values between $a_bad and $b_bad - 't' output");
-is( tapprox( $df, 3 ), 1, "paired sample t-test with bad values between $a_bad and $b_bad - 'df' output");
+is_pdl $t, pdl( 4.89897948556636 ), "paired sample t-test with bad values between $a_bad and $b_bad - 't' output";
+is_pdl $df, pdl( 3 ), "paired sample t-test with bad values between $a_bad and $b_bad - 'df' output";
 
 {
   my ($data, $idv, $ido) = rtable(\*DATA, {V=>0});
-  is( tapprox( sum(pdl($data->dims) - pdl(14, 5)), 0 ), 1, 'rtable data dim' );
-  is( tapprox( $data->sum / $data->nbad, 1.70731707317073 ), 1, 'rtable bad elem' );
+  is_pdl $data, pdl '
+   [  5 BAD BAD   2 BAD   5 BAD   9   4 BAD BAD BAD   5 BAD]
+   [  7 BAD   3   7   0 BAD   0   8 BAD   0   3   0 BAD   0]
+   [BAD BAD BAD BAD BAD   1 BAD   1 BAD BAD BAD BAD   1 BAD]
+   [BAD BAD BAD BAD BAD   0 BAD   5 BAD BAD BAD BAD   0 BAD]
+   [BAD BAD   0 BAD   2 BAD   0 BAD BAD   0   0   2 BAD   0]
+  ';
 }
 
 {
-  my $a = random 10, 3;
-  is( tapprox( sum($a->cov_table - $a->cov($a->dummy(1))), 0 ), 1, 'cov_table' );
-
+  my $a = pdl '
+  0.045 0.682 0.290 0.024 0.598 0.321 0.772 0.375 0.237 0.811;
+  0.356 0.094 0.925 0.139 0.701 0.849 0.689 0.109 0.240 0.847;
+  0.822 0.492 0.351 0.860 0.400 0.243 0.313 0.011 0.437 0.480
+';
+  is_pdl $a->cov_table, $a->cov($a->dummy(1)), 'cov_table';
   $a->setbadat(4,0);
-  is( tapprox( sum($a->cov_table - $a->cov($a->dummy(1))), 0 ), 1, 'cov_table bad val' );
+  is_pdl $a->cov_table, $a->cov($a->dummy(1)), 'cov_table bad val';
 }
 
 {
-  my $a = random 10, 3;
-  is( tapprox( sum(abs($a->corr_table - $a->corr($a->dummy(1)))), 0 ), 1, "Square Pearson correlation table");
-
+  my $a = pdl '
+  0.045 0.682 0.290 0.024 0.598 0.321 0.772 0.375 0.237 0.811;
+  0.356 0.094 0.925 0.139 0.701 0.849 0.689 0.109 0.240 0.847;
+  0.822 0.492 0.351 0.860 0.400 0.243 0.313 0.011 0.437 0.480
+';
+  is_pdl $a->corr_table, $a->corr($a->dummy(1)), "Square Pearson correlation table";
   $a->setbadat(4,0);
-  is( tapprox( sum(abs($a->corr_table - $a->corr($a->dummy(1)))), 0 ), 1, "Square Pearson correlation table with bad data");
+  is_pdl $a->corr_table, $a->corr($a->dummy(1)), "Square Pearson correlation table with bad data";
 }
 
 {
   my $a = pdl([0,1,2,3,4], [0,0,0,0,0]);
   $a = $a->setvaltobad(0);
-  is( $a->stdv->nbad, 1, "Bad value input to stdv makes the stdv itself bad");
+  ok $a->stdv->nbad, "Bad value input to stdv makes the stdv itself bad";
 }
 
 SKIP: {
@@ -127,67 +120,45 @@ SKIP: {
   my $x = pdl(1, 2);
   my $n = pdl(2, 10);
   my $p = .5;
-
-  my $a = pdl qw[ 0.75  0.9892578125 ];
-
-  is (tapprox( sum(abs(binomial_test( $x,$n,$p ) - $a)) ,0), 1, 'binomial_test');
+  is_pdl binomial_test( $x,$n,$p ), pdl(0.75, 0.9892578125), 'binomial_test';
 }
 
 {
     my $a = sequence 10, 2;
     my $factor = sequence(10) > 4;
     my $ans = pdl( [[0..4], [10..14]], [[5..9], [15..19]] );
-
     my ($a_, $l) = $a->group_by($factor);
-    is( tapprox( sum(abs($a_ - $ans)), 0 ), 1, 'group_by single factor equal n' );
-    is_deeply( $l, [0, 1], 'group_by single factor label');
+    is_pdl $a_, $ans, 'group_by single factor equal n';
+    is_deeply $l, [0, 1], 'group_by single factor label';
 
     $a = sequence 10,2;
     $factor = qsort sequence(10) % 3;
     $ans = pdl( [1.5, 11.5], [5, 15], [8, 18] );
-
-    is( tapprox( sum(abs($a->group_by($factor)->average - $ans)), 0 ), 1, 'group_by single factor unequal n' );
+    is_pdl $a->group_by($factor)->average, $ans, 'group_by single factor unequal n';
 
     $a = sequence 10;
     my @factors = ( [qw( a a a a b b b b b b )], [qw(0 1 0 1 0 1 0 1 0 1)] );
-    $ans = pdl(
-[
- [0,2,-1],
- [1,3,-1],
-],
-[
- [4,6,8],
- [5,7,9],
-]
-    );
-    $ans->badflag(1);
-    $ans = $ans->setvaltobad(-1);
-
+    $ans = pdl '[ 0 2 BAD; 1 3 BAD ], [ 4 6 8; 5 7 9 ]';
     ($a_, $l) = $a->group_by( @factors );
-    is(tapprox(sum(abs($a_ - $ans)), 0), 1, 'group_by multiple factors') or diag($a_, $ans);
-    is_deeply($l, [[qw(a_0 a_1)], [qw( b_0 b_1 )]], 'group_by multiple factors label');
+    is_pdl $a_, $ans, 'group_by multiple factors';
+    is_deeply $l, [[qw(a_0 a_1)], [qw( b_0 b_1 )]], 'group_by multiple factors label';
 }
 
 
 {
     my @a = qw(a a b b c c);
     my $a = PDL::Stats::Basic::_array_to_pdl( \@a );
     my $ans = pdl( 0,0,1,1,2,2 );
-    is( tapprox( sum(abs($a - $ans)), 0 ), 1, '_array_to_pdl' );
+    is_pdl $a, $ans, '_array_to_pdl';
 
     $a[-1] = undef;
     my $a_bad = PDL::Stats::Basic::_array_to_pdl( \@a );
-    my $ans_bad = pdl( 0,0,1,1,2,2 );
-    $ans_bad = $ans_bad->setbadat(-1);
-
-    like( $a_bad(-1)->isbad(), qr/1/, '_array_to_pdl with missing value undef' );
-    is( tapprox( sum(abs($a_bad - $ans_bad)), 0 ), 1, '_array_to_pdl with missing value undef correctly coded' );
+    my $ans_bad = pdl '0 0 1 1 2 BAD';
+    is_pdl $a_bad, $ans_bad, '_array_to_pdl with missing value undef correctly coded';
 
     $a[-1] = 'BAD';
     $a_bad = PDL::Stats::Basic::_array_to_pdl( \@a );
-
-    like( $a_bad(-1)->isbad(), qr/1/, '_array_to_pdl with missing value BAD' );
-    is( tapprox( sum(abs($a_bad - $ans_bad)), 0 ), 1, '_array_to_pdl with missing value BAD correctly coded' );
+    is_pdl $a_bad, $ans_bad, '_array_to_pdl with missing value BAD correctly coded';
 }
 
 done_testing();
diff --git a/t/stats_glm.t b/t/stats_glm.t

-Original file line number
+Diff line change
 use PDL::Stats::GLM;
 use PDL::LiteF;
 use PDL::NiceSlice;
 +use Test::PDL;
 -sub tapprox {
 -  my($a,$b, $eps) = @_;
 -  $eps ||= 1e-6;
 -  my $diff = abs($a-$b);
 -    # use max to make it perl scalar
 -  ref $diff eq 'PDL' and $diff = $diff->max;
 -  return $diff < $eps;
 -}
+-
 -my $a = sequence 5;
 -my $b = pdl(0, 0, 0, 1, 1);
+-
 -is( t_fill_m(), 1, "fill_m replaces bad values with sample mean");
 -sub t_fill_m {
 -  my $aa = sequence 5;
 -  $aa = $aa->setvaltobad(0);
 -  tapprox( $aa->fill_m->sum, 12.5 );
 -}
 +is_pdl pdl('BAD 1 2 3 4')->fill_m, pdl('2.5 1 2 3 4'), "fill_m replaces bad values with sample mean";
 -is( t_fill_rand(), 1, "fill_rand replaces bad values with random sample of good values from same variable");
 -sub t_fill_rand {
 -  my $aa = sequence 5;
 -  $aa = $aa->setvaltobad(0);
 -  my $stdv = $aa->fill_rand->stdv;
 -  tapprox( $stdv, 1.01980390271856 ) || tapprox( $stdv, 1.16619037896906 );
 +{
 +my $stdv = pdl('BAD 1 2 3 4')->fill_rand->stdv;
 +ok PDL::Core::approx( $stdv, 1.01980390271856 ) || PDL::Core::approx( $stdv, 1.16619037896906 ), "fill_rand replaces bad values with random sample of good values from same variable";
+}
 -ok tapprox( $a->dev_m->avg, 0 ), "dev_m replaces values with deviations from the mean on $a";
 -ok tapprox( $a->stddz->avg, 0 ), "stddz standardizes data on $a";
 +my $a = sequence 5;
 +is_pdl $a->dev_m, pdl('-2 -1 0 1 2'), "dev_m replaces values with deviations from the mean on $a";
 +is_pdl $a->stddz, pdl('-1.41421356237309 -0.707106781186547 0 0.707106781186547 1.41421356237309'), "stddz standardizes data on $a";
 -ok tapprox( $a->sse($b), 18), "sse gives sum of squared errors between actual and predicted values between $a and $b";
 -ok tapprox( $a->mse($b), 3.6), "mse gives mean of squared errors between actual and predicted values between $a and $b";
 -ok tapprox( $a->rmse($b), 1.89736659610103 ), "rmse gives root mean squared error, ie. stdv around predicted value between $a and $b";
 +my $b = pdl(0, 0, 0, 1, 1);
 +is_pdl $a->sse($b), pdl(18), "sse gives sum of squared errors between actual and predicted values between $a and $b";
 +is_pdl $a->mse($b), pdl(3.6), "mse gives mean of squared errors between actual and predicted values between $a and $b";
 +is_pdl $a->rmse($b), pdl(1.89736659610103), "rmse gives root mean squared error, ie. stdv around predicted value between $a and $b";
 -ok tapprox( $b->glue(1,ones(5))->pred_logistic(pdl(1,2))->sum, 4.54753948757851 ), "pred_logistic calculates predicted probability value for logistic regression";
 +is_pdl $b->glue(1,ones(5))->pred_logistic(pdl(1,2)), pdl('0.880797077977882 0.880797077977882 0.880797077977882 0.952574126822433 0.952574126822433'), "pred_logistic calculates predicted probability value for logistic regression";
 my $y = pdl(0, 1, 0, 1, 0);
 -ok tapprox( $y->d0(), 6.73011667009256 ), 'd0';
 -ok tapprox( $y->dm( ones(5) * .5 ), 6.93147180559945 ), 'dm';
 -ok tapprox( sum($y->dvrs(ones(5) * .5) ** 2), 6.93147180559945 ), 'dvrs';
 +is_pdl $y->d0(), pdl( 6.73011667009256 ), 'd0';
 +is_pdl $y->dm( ones(5) * .5 ), pdl( 6.93147180559945 ), 'dm';
 +is_pdl $y->dvrs(ones(5) * .5) ** 2, pdl('1.38629436111989 1.38629436111989 1.38629436111989 1.38629436111989 1.38629436111989'), 'dvrs';
+{
   my $a = pdl(ushort, [0,0,1,0,1], [0,0,0,1,1] );
     [qw(  0.0071428571    0.035714286   -0.057142857)],
    ],
   );
 -  ok tapprox( sum( abs($m{R2} - $rsq) ), 0 ), 'ols_t R2';
 -  ok tapprox( sum( abs($m{b} - $coeff) ), 0 ), 'ols_t b';
 +  is_pdl $m{R2}, $rsq, 'ols_t R2';
 +  is_pdl $m{b}, $coeff, 'ols_t b';
   my %m0 = $a->ols_t(sequence(5), {CONST=>0});
   my $b0 = pdl ([ 0.2 ], [ 0.23333333 ]);
+-
 -  ok tapprox( sum( abs($m0{b} - $b0) ), 0 ), 'ols_t, const=>0';
 +  is_pdl $m0{b}, $b0, 'ols_t, const=>0';
+}
 -ok tapprox( t_ols(), 0 ), 'ols';
 -sub t_ols {
 +{
   my $a = sequence 5;
   my $b = pdl(0,0,0,1,1);
   my %m = $a->ols($b, {plot=>0});
   test_stats_cmp(\%m, \%a);
+}
 -ok tapprox( t_ols_bad(), 0 ), 'ols with bad value';
 -sub t_ols_bad {
 -  my $a = sequence 6;
 +{
 +  my $a = pdl '0 1 2 3 4 BAD';
   my $b = pdl(0,0,0,1,1,1);
 -  $a->setbadat(5);
   my %m = $a->ols($b, {plot=>0});
 -  is( $b->sumover, 3, "ols with bad value didn't change caller value" );
 +  is_pdl $b, pdl(0,0,0,1,1,1), "ols with bad value didn't change caller value";
   ok $a->check_badflag, "ols with bad value didn't remove caller bad flag";
   my %a = (
     F    => 9,
   test_stats_cmp(\%m, \%a);
+}
 -ok tapprox( t_r2_change(), 0 ), 'r2_change';
 -sub t_r2_change {
 +{
   my $a = sequence 5, 2;
   my $b = pdl(0,0,0,1,1);
   my $c = pdl(0,0,2,2,2);
   my %p = $a->pca({CORR=>1, PLOT=>0});
   my %a = (
 -eigenvalue  => pdl( qw( 2.786684 0.18473727 0.028578689) ),
 +eigenvalue  => float( qw( 2.786684 0.18473727 0.028578689) ),
   # loadings in R
 -eigenvector => [pdl(
 +eigenvector => [float(
     # v1       v2        v3
  [qw(  0.58518141   0.58668657   0.55978709)],  # comp1
  [qw( -0.41537629  -0.37601061   0.82829859)],  # comp2
  [qw( -0.69643754   0.71722722 -0.023661276)],  # comp3
 ), \&PDL::abs],
 -loadings	=> [pdl(
 +loadings	=> [float(
  [qw(   0.97686463    0.97937725    0.93447296)],
  [qw(  -0.17853319    -0.1616134    0.35601163)],
  [qw(  -0.11773439    0.12124893 -0.0039999937)],
   %p = $a->pca({CORR=>0, PLOT=>0});
   %a = (
 -eigenvalue => [pdl(qw[ 22.0561695 1.581758022 0.202065959 ]), \&PDL::abs],
 -eigenvector => [pdl(
 +eigenvalue => [float(qw[ 22.0561695 1.581758022 0.202065959 ]), \&PDL::abs],
 +eigenvector => [float(
  [qw(-0.511688 -0.595281 -0.619528)],
  [qw( 0.413568  0.461388  -0.78491)],
  [qw( 0.753085 -0.657846 0.0101023)],
   test_stats_cmp(\%p, \%a, 1e-4);
+}
 -ok tapprox( t_pca_sorti(), 0 ), "pca_sorti - principal component analysis output sorted to find which vars a component is best represented";
 -sub t_pca_sorti {
 -  my $a = sequence 10, 5;
 -  $a = lvalue_assign_detour( $a, which($a % 7 == 0), 0 );
+-
 +{
 +  # pca_sorti - principal component analysis output sorted to find which vars a component is best represented
 +  my $a = pdl '
 +    0 1 2 3 4 5 6 0 8 9; 10 11 12 13  0 15 16 17 18 19;
 +    20  0 22 23 24 25 26 27  0 29; 30 31 32 33 34  0 36 37 38 39;
 +    40 41  0 43 44 45 46 47 48  0
 +  ';
   my %m = $a->pca({PLOT=>0});
+-
   my ($iv, $ic) = $m{loadings}->pca_sorti;
+-
 -  return sum($iv - pdl(qw(4 1 0 2 3))) + sum($ic - pdl(qw( 0 1 2 )));
 +  is_pdl $iv, indx(qw(4 1 0 2 3));
 +  is_pdl $ic, pdl(qw( 0 1 2 ));
+}
 SKIP: {
   eval { require PDL::Fit::LM; };
   skip 'no PDL::Fit::LM', 1 if $@;
+-
 -  ok tapprox( t_logistic(), 0 ), 'logistic';
+-
 -  my $y = pdl( 0, 0, 0, 1, 1 );
 -  my $x = pdl(2, 3, 5, 5, 5);
 -  my %m = $y->logistic( $x, {COV=>1} );
 -  isnt $m{cov}, undef, 'get cov from logistic if ask';
 -};
 -sub t_logistic {
   my $y = pdl( 0, 0, 0, 1, 1 );
   my $x = pdl(2, 3, 5, 5, 5);
   my %m = $y->logistic( $x );
   my $y_pred = $x->glue(1, ones(5))->pred_logistic( $m{b} );
   my $y_pred_ans
     = pdl qw(7.2364053e-07 0.00010154254 0.66666667 0.66666667 0.66666667);
 -  return sum( $y_pred - $y_pred_ans, $m{Dm_chisq} - 2.91082711764867 );
 -}
+-
 -my $a_bad = sequence 6;
 -$a_bad->setbadat(-1);
 -my $b_bad = pdl(0, 0, 0, 0, 1, 1);
 -$b_bad->setbadat(0);
+-
 -ok tapprox( $a_bad->dev_m->avg, 0 ), "dev_m with bad values $a_bad";
 -ok tapprox( $a_bad->stddz->avg, 0 ), "stdz with bad values $a_bad";
+-
 -ok tapprox( $a_bad->sse($b_bad), 23), "sse with bad values between $a_bad and $b_bad";
 -ok tapprox( $a_bad->mse($b_bad), 5.75), "mse with badvalues between $a_bad and $b_bad";
 -ok tapprox( $a_bad->rmse($b_bad), 2.39791576165636 ), "rmse with bad values between $a_bad and $b_bad";
+-
 -ok tapprox( $b_bad->glue(1,ones(6))->pred_logistic(pdl(1,2))->sum, 4.54753948757851 ), "pred_logistic with bad values";
 +  is_pdl $y_pred, $y_pred_ans;
 +  is_pdl $m{Dm_chisq}, pdl 2.91082711764867;
 +  %m = $y->logistic( $x, {COV=>1} );
 +  isnt $m{cov}, undef, 'get cov from logistic if ask';
 +};
 -ok tapprox( $b_bad->d0(), 6.73011667009256 ), "null deviance with bad values on $b_bad";
 -ok tapprox( $b_bad->dm( ones(6) * .5 ), 6.93147180559945 ), "model deviance with bad values on $b_bad";
 -ok tapprox( sum($b_bad->dvrs(ones(6) * .5) ** 2), 6.93147180559945 ), "deviance residual with bad values on $b_bad";
 +my $a_bad = pdl '0 1 2 3 4 BAD';
 +my $b_bad = pdl 'BAD 0 0 0 1 1';
 +is_pdl $a_bad->dev_m, pdl( '-2 -1 0 1 2 BAD' ), "dev_m with bad values $a_bad";
 +is_pdl $a_bad->stddz, pdl( '-1.41421356237309 -0.707106781186547 0 0.707106781186547 1.41421356237309 BAD' ), "stdz with bad values $a_bad";
 +is_pdl $a_bad->sse($b_bad), pdl(23), "sse with bad values between $a_bad and $b_bad";
 +is_pdl $a_bad->mse($b_bad), pdl(5.75), "mse with badvalues between $a_bad and $b_bad";
 +is_pdl $a_bad->rmse($b_bad), pdl( 2.39791576165636 ), "rmse with bad values between $a_bad and $b_bad";
 +is_pdl $b_bad->glue(1,ones(6))->pred_logistic(pdl(1,2)), pdl( 'BAD 0.880797077977882 0.880797077977882 0.880797077977882 0.952574126822433 0.952574126822433' ), "pred_logistic with bad values";
 +is_pdl $b_bad->d0(), pdl( 6.73011667009256 ), "null deviance with bad values on $b_bad";
 +is_pdl $b_bad->dm( ones(6) * .5 ), pdl( 6.93147180559945 ), "model deviance with bad values on $b_bad";
 +is_pdl $b_bad->dvrs(ones(6) * .5), pdl( 'BAD -1.17741002251547 -1.17741002251547 -1.17741002251547 1.17741002251547 1.17741002251547' ), "deviance residual with bad values on $b_bad";
+{
   eval { effect_code(['a']) };
   isnt $@, '', 'effect_code with only one value dies';
 -  my @a = qw( a a a b b b b c c BAD );
 -  my $a = effect_code(\@a);
 -  my $ans = pdl [
 -   [qw( 1   1   1   0   0   0   0  -1  -1 -99 )],
 -   [qw( 0   0   0   1   1   1   1  -1  -1 -99 )]
 -  ];
 -  $ans = $ans->setvaltobad(-99);
 -  is( sum(abs(which($a->isbad) - pdl(9,19))), 0, 'effect_code got bad value' );
 -  ok tapprox( sum(abs($a - $ans)), 0 ), 'effect_code coded with bad value';
 +  my $a = scalar effect_code([qw(a a a b b b b c c BAD)]);
 +  is_pdl $a, pdl('1 1 1 0 0 0 0 -1 -1 BAD; 0 0 0 1 1 1 1 -1 -1 BAD'), 'effect_code coded with bad value';
+}
 -ok tapprox( t_effect_code_w(), 0 ), 'effect_code_w';
 -sub t_effect_code_w {
 +{
   eval { effect_code_w(['a']) };
   isnt $@, '', 'effect_code_w with only one value dies';
 -  my @a = qw( a a a b b b b c c c );
 -  my $a = effect_code_w(\@a);
 -  return sum($a->sumover - pdl byte, (0, 0));
 +  is_pdl scalar effect_code_w([qw(a a a b b b b c c c)]), pdl '
 +    1 1 1 0 0 0 0 -1 -1 -1; 0 0 0 1 1 1 1 -1.3333333 -1.3333333 -1.3333333
 +  ';
+}
 -ok tapprox( t_anova(), 0 ), 'anova_3w';
 -sub t_anova {
 +{ # anova 3 way
   my $d = sequence 60;
   my @a = map {$a = $_; map { $a } 0..14 } qw(a b c d);
   my $b = $d % 3;
   my $c = $d % 2;
 -  $d = lvalue_assign_detour( $d, 20, 10 );
 +  $d->set( 20, 10 );
   my %m = $d->anova(\@a, $b, $c, {IVNM=>[qw(A B C)], plot=>0});
   $m{'# A ~ B ~ C # m'} = $m{'# A ~ B ~ C # m'}->(,2,)->squeeze;
   test_stats_cmp(\%m, {
   });
+}
 -ok tapprox( t_anova_1way(), 0 ), 'anova_1w';
 -sub t_anova_1way {
 +{ # anova 1 way
   my $d = pdl qw( 3 2 1 5 2 1 5 3 1 4 1 2 3 5 5 );
   my $a = qsort sequence(15) % 3;
   my %m = $d->anova($a, {plot=>0});
   });
+}
 -ok tapprox( t_anova_bad_dv(), 0 ), 'anova_3w bad dv';
 -sub t_anova_bad_dv {
 +{ # anova_3w bad dv
   my $d = sequence 60;
 -  $d = lvalue_assign_detour( $d, 20, 10 );
 +  $d->set( 20, 10 );
   $d->setbadat(1);
   $d->setbadat(10);
   my @a = map {$a = $_; map { $a } 0..14 } qw(a b c d);
   });
+}
 -ok tapprox( t_anova_bad_dv_iv(), 0 ), 'anova_3w bad dv iv';
 -sub t_anova_bad_dv_iv {
 +{ # anova_3w bad dv iv
   my $d = sequence 63;
   my @a = map {$a = $_; map { $a } 0..14 } qw(a b c d);
   push @a, undef, qw( b c );
   my $b = $d % 3;
   my $c = $d % 2;
 -  $d = lvalue_assign_detour( $d, 20, 10 );
 +  $d->set( 20, 10 );
   $d->setbadat(62);
   $b->setbadat(61);
   my %m = $d->anova(\@a, $b, $c, {IVNM=>[qw(A B C)], plot=>0});
   });
+}
 -{
 -  my $a = pdl([0,1,2,3,4], [0,0,0,0,0]);
 -  $a = $a->setvaltobad(0);
 -  is( $a->fill_m->setvaltobad(0)->nbad, 5, 'fill_m nan to bad');
 -}
 +is_pdl pdl('BAD 1 2 3 4; BAD BAD BAD BAD BAD')->fill_m, pdl('2.5 1 2 3 4; 0 0 0 0 0'), 'fill_m nan to bad';
 +is_pdl pdl([1,1,1], [2,2,2])->stddz, zeroes(3,2), 'stddz nan vs bad';
+{
 -  my $a = pdl([1,1,1], [2,2,2]);
 -  is( which($a->stddz == 0)->nelem, 6, 'stddz nan vs bad');
 -}
+-
 -ok tapprox( t_anova_rptd_basic(), 0 ), 'anova_rptd_basic';
 -sub t_anova_rptd_basic {
   # data from https://www.youtube.com/watch?v=Fh73dAOMm9M
   # Person,Before,After 2 weeks,After 4 weeks
   # P1,102,97,95
   });
+}
 -ok tapprox( t_anova_rptd_1way(), 0 ), 'anova_rptd_1w';
 -sub t_anova_rptd_1way {
 +{ # anova_rptd_1w
   my $d = pdl qw( 3 2 1 5 2 1 5 3 1 4 1 2 3 5 5 );
   my $s = sequence(5)->dummy(1,3)->flat;
   my $a = qsort sequence(15) % 3;
   });
+}
 -ok tapprox( t_anova_rptd_2way_bad_dv(), 0 ), 'anova_rptd_2w bad dv';
 my %anova_bad_a = (
   '| a | F' => 0.351351351351351,
   '| a | ms' => 0.722222222222222,
   '| a ~ b | F' => 5.25,
   '# a ~ b # m' => pdl(qw( 3  1.3333333  3.3333333 3.3333333  3.6666667  2.6666667  ))->reshape(3,2),
 );
 -sub t_anova_rptd_2way_bad_dv {
 +{ # anova_rptd_2w bad dv
   my $d = pdl qw( 3 2 1 5 2 1 5 3 1 4 1 2 3 5 5 3 4 2 1 5 4 3 2 2);
   $d = $d->setbadat(5);
   my $s = sequence(4)->dummy(1,6)->flat;
   test_stats_cmp(\%m, \%anova_bad_a);
+}
 -ok tapprox( t_anova_rptd_2way_bad_iv(), 0 ), 'anova_rptd_2w bad iv';
 -sub t_anova_rptd_2way_bad_iv {
 +{ # anova_rptd_2w bad iv
   my $d = pdl qw( 3 2 1 5 2 1 5 3 1 4 1 2 3 5 5 3 4 2 1 5 4 3 2 2);
   my $s = sequence(4)->dummy(1,6)->flat;
 # [0 1 2 3 0 1 2 3 0 1 2 3 0 1 2 3 0 1 2 3 0 1 2 3]
   test_stats_cmp(\%m, \%anova_bad_a);
+}
 -ok tapprox( t_anova_rptd_3way(), 0 ), 'anova_rptd_3w';
 -sub t_anova_rptd_3way {
 +{ # anova_rptd_3w
   my $d = pdl( qw( 3 2 1 5 2 1 5 3 1 4 1 2 3 5 5 3 4 2 1 5 4 3 2 2 ),
                qw( 5 5 1 1 4 4 1 4 4 2 3 3 5 1 1 2 4 4 4 5 5 1 1 2 )
   );
   });
+}
 -ok tapprox( t_anova_rptd_mixed(), 0 ), 'anova_rptd mixed';
 -sub t_anova_rptd_mixed {
 +{ # anova_rptd mixed
   my $d = pdl qw( 3 2 1 5 2 1 5 3 1 4 1 2 3 5 5 3 4 2 1 5 4 3 2 2);
   my $s = sequence(4)->dummy(1,6)->flat;
 # [0 1 2 3 0 1 2 3 0 1 2 3 0 1 2 3 0 1 2 3 0 1 2 3]
 # Tests for mixed anova thanks to Erich Greene
 -ok tapprox( t_anova_rptd_mixed_l2ord2(), 0,      ), 'anova_rptd mixed with 2 btwn-subj var levels, data grouped by subject';
 -SKIP: {
 -    skip "yet to be fixed", 3;
 -    ok tapprox( t_anova_rptd_mixed_l2ord1(), 0,      ), 'anova_rptd mixed with 2 btwn-subj var levels, data grouped by within var';
 -    ok tapprox( t_anova_rptd_mixed_l3ord1(), 0, .001 ), 'anova_rptd mixed with 3 btwn-subj var levels, data grouped by within var';
 -    ok tapprox( t_anova_rptd_mixed_l3ord2(), 0, .001 ), 'anova_rptd mixed with 3 btwn-subj var levels, data grouped by subject';
 -}
 sub test_stats_cmp {
   local $Test::Builder::Level = $Test::Builder::Level + 1;
   my ($m, $ans, $eps) = @_;
   $eps ||= 1e-6;
 -  my $error = pdl 0;
   foreach (sort keys %$ans) {
     my $got = PDL->topdl($m->{$_});
     my $exp = $ans->{$_};
     if (ref $exp eq 'ARRAY') {
       ($exp, my $func) = @$exp;
       ($got, $exp) = map &$func($_), $got, $exp;
+    }
 -    $exp = PDL->topdl($exp);
 -    $error = $error + (my $this_diff = $got - $exp);
 -    fail($_), diag "got $m->{$_}\nexpected $exp" if any($this_diff->abs > $eps);
 +    is_pdl $got, PDL->topdl($exp), {atol=>$eps, test_name=>$_};
+  }
 -  return $error;
 -}
 -sub t_anova_rptd_mixed_backend {
 -    my ($d,$s,$w,$b,$ans) = @_;
 -    my %m = $d->anova_rptd($s,$w,$b,{ivnm=>['within','between'],btwn=>[1],plot=>0, v=>0});
 -    test_stats_cmp(\%m, $ans);
 -}
 -sub t_anova_rptd_mixed_l2_common {
 -    my ($d,$s,$w,$b) = @_;
 -    my %ans = (
 -	       '| within | df'           => 2,
 -	       '| within || err df'      => 12,
 -	       '| within | ss'           =>   .25,
 -	       '| within | ms'           =>   .125,
 -	       '| within || err ss'      => 23.666667,
 -	       '| within || err ms'      =>  1.9722222,
 -	       '| within | F'            =>  0.063380282,
 -	       '| between | df'          =>  1,
 -	       '| between || err df'     =>  6,
 -	       '| between | ss'          =>  2.0416667,
 -	       '| between | ms'          =>  2.0416667,
 -	       '| between || err ss'     => 16.583333,
 -	       '| between || err ms'     =>  2.7638889,
 -	       '| between | F'           =>  0.73869347,
 -	       '| within ~ between | df' =>  2,
 -	       '| within ~ between | ss' =>  6.0833333,
 -	       '| within ~ between | ms' =>  3.0416667,
 -	       '| within ~ between | F'  =>  1.5422535,
 -	      );
 -    $ans{"| within ~ between || err $_"} = $ans{"| within || err $_"} foreach qw/df ss ms/;
 -    return t_anova_rptd_mixed_backend($d,$s,$w,$b,\%ans);
 -}
 -sub t_anova_rptd_mixed_l3_common {
 -    my ($d,$s,$w,$b) = @_;
 -    my %ans = (
 -	       '| within | df'           =>  2,
 -	       '| within || err df'      => 12,
 -	       '| within | ss'           =>   .963,
 -	       '| within | ms'           =>   .481,
 -	       '| within || err ss'      => 20.889,
 -	       '| within || err ms'      =>  1.741,
 -	       '| within | F'            =>   .277,
 -	       '| between | df'          =>  2,
 -	       '| between || err df'     =>  6,
 -	       '| between | ss'          =>  1.185,
 -	       '| between | ms'          =>   .593,
 -	       '| between || err ss'     => 13.111,
 -	       '| between || err ms'     =>  2.185,
 -	       '| between | F'           =>   .271,
 -	       '| within ~ between | df' =>  4,
 -	       '| within ~ between | ss' =>  4.148,
 -	       '| within ~ between | ms' =>  1.037,
 -	       '| within ~ between | F'  =>   .596,
 -	      );
 -    $ans{"| within ~ between || err $_"} = $ans{"| within || err $_"} foreach qw/df ss ms/;
 -    return t_anova_rptd_mixed_backend($d,$s,$w,$b,\%ans);
 -}
 -sub t_anova_rptd_mixed_l2ord1 {
 -    my $d = pdl qw( 3 2 1 5 2 1 5 3 1 4 1 2 3 5 5 3 4 2 1 5 4 3 2 2);
 -    my $s = sequence(8)->dummy(1,3)->flat;
 -    # [0 1 2 3 4 5 6 7 0 1 2 3 4 5 6 7 0 1 2 3 4 5 6 7]
 -    my $w = qsort sequence(24) % 3;
 -    # [0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2]
 -    my $b = (sequence(8) % 2)->qsort->dummy(1,3)->flat;
 -    # [0 0 0 0 1 1 1 1 0 0 0 0 1 1 1 1 0 0 0 0 1 1 1 1]
 -    return t_anova_rptd_mixed_l2_common($d,$s,$w,$b);
+}
 -sub t_anova_rptd_mixed_l2ord2 {
 -    my $d = pdl qw( 3 1 4 2 4 2 1 1 1 5 2 5 2 3 4 1 5 3 5 5 2 3 3 2);
 -    my $s = qsort sequence(24) % 8;
 -    # [0 0 0 1 1 1 2 2 2 3 3 3 4 4 4 5 5 5 6 6 6 7 7 7]
 -    my $w = sequence(3)->dummy(1,8)->flat;
 -    # [0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2]
 -    my $b = qsort sequence(24) % 2;
 -    # [0 0 0 0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1 1 1 1 1]
 -    return t_anova_rptd_mixed_l2_common($d,$s,$w,$b);
 -}
 -sub t_anova_rptd_mixed_l3ord1 {
 -    my $d = pdl qw( 5 2 2 5 4 1 5 3 5 4 4 3 4 3 4 3 5 1 4 3 3 4 5 4 5 5 2 );
 -    my $s = sequence(9)->dummy(1,3)->flat;
 -    # [0 1 2 3 4 5 6 7 8 0 1 2 3 4 5 6 7 8 0 1 2 3 4 5 6 7 8]
 -    my $w = qsort sequence(27) % 3;
 -    # [0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2 2]
 -    my $b = (sequence(9) % 3)->qsort->dummy(1,3)->flat;
 -    # [0 0 0 1 1 1 2 2 2 0 0 0 1 1 1 2 2 2 0 0 0 1 1 1 2 2 2]
 -    return t_anova_rptd_mixed_l3_common($d,$s,$w,$b);
 -}
 -sub t_anova_rptd_mixed_l3ord2 {
 -    my $d = pdl qw( 5 4 4 2 4 3 2 3 3 5 4 4 4 3 5 1 4 4 5 3 5 3 5 5 5 1 2 );
 -    my $s = qsort sequence(27) % 9;
 -    # [0 0 0 1 1 1 2 2 2 3 3 3 4 4 4 5 5 5 6 6 6 7 7 7 8 8 8]
 -    my $w = sequence(3)->dummy(1,9)->flat;
 -    # [0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2]
 -    my $b = qsort sequence(27) % 3;
 -    # [0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2 2]
 -    return t_anova_rptd_mixed_l3_common($d,$s,$w,$b);
 +my %anova_ans_l2_common = (
 +  '| within | df'           => 2,
 +  '| within || err df'      => 12,
 +  '| within | ss'           =>   .25,
 +  '| within | ms'           =>   .125,
 +  '| within || err ss'      => 23.666667,
 +  '| within || err ms'      =>  1.9722222,
 +  '| within | F'            =>  0.063380282,
 +  '| between | df'          =>  1,
 +  '| between || err df'     =>  6,
 +  '| between | ss'          =>  2.0416667,
 +  '| between | ms'          =>  2.0416667,
 +  '| between || err ss'     => 16.583333,
 +  '| between || err ms'     =>  2.7638889,
 +  '| between | F'           =>  0.73869347,
 +  '| within ~ between | df' =>  2,
 +  '| within ~ between | ss' =>  6.0833333,
 +  '| within ~ between | ms' =>  3.0416667,
 +  '| within ~ between | F'  =>  1.5422535,
 +);
 +$anova_ans_l2_common{"| within ~ between || err $_"} = $anova_ans_l2_common{"| within || err $_"} foreach qw/df ss ms/;
 +my %anova_ans_l3_common = (
 +  '| within | df'           =>  2,
 +  '| within || err df'      => 12,
 +  '| within | ss'           =>   .963,
 +  '| within | ms'           =>   .481,
 +  '| within || err ss'      => 20.889,
 +  '| within || err ms'      =>  1.741,
 +  '| within | F'            =>   .277,
 +  '| between | df'          =>  2,
 +  '| between || err df'     =>  6,
 +  '| between | ss'          =>  1.185,
 +  '| between | ms'          =>   .593,
 +  '| between || err ss'     => 13.111,
 +  '| between || err ms'     =>  2.185,
 +  '| between | F'           =>   .271,
 +  '| within ~ between | df' =>  4,
 +  '| within ~ between | ss' =>  4.148,
 +  '| within ~ between | ms' =>  1.037,
 +  '| within ~ between | F'  =>   .596,
 +);
 +$anova_ans_l3_common{"| within ~ between || err $_"} = $anova_ans_l3_common{"| within || err $_"} foreach qw/df ss ms/;
 +if (0) { # FIXME
 +  # anova_rptd mixed with 2 btwn-subj var levels, data grouped by within var
 +  my $d = pdl qw( 3 2 1 5 2 1 5 3 1 4 1 2 3 5 5 3 4 2 1 5 4 3 2 2);
 +  my $s = sequence(8)->dummy(1,3)->flat;
 +  # [0 1 2 3 4 5 6 7 0 1 2 3 4 5 6 7 0 1 2 3 4 5 6 7]
 +  my $w = qsort sequence(24) % 3;
 +  # [0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2]
 +  my $b = (sequence(8) % 2)->qsort->dummy(1,3)->flat;
 +  # [0 0 0 0 1 1 1 1 0 0 0 0 1 1 1 1 0 0 0 0 1 1 1 1]
 +  my %m = $d->anova_rptd($s,$w,$b,{ivnm=>['within','between'],btwn=>[1],plot=>0, v=>0});
 +  test_stats_cmp(\%m, \%anova_ans_l2_common);
+}
+-
+-
 -ok tapprox( t_anova_rptd_mixed_bad(), 0 ), 'anova_rptd mixed bad';
 -sub t_anova_rptd_mixed_bad {
 +{
 +  # anova_rptd mixed with 2 btwn-subj var levels, data grouped by subject
 +  my $d = pdl qw( 3 1 4 2 4 2 1 1 1 5 2 5 2 3 4 1 5 3 5 5 2 3 3 2);
 +  my $s = qsort sequence(24) % 8;
 +  # [0 0 0 1 1 1 2 2 2 3 3 3 4 4 4 5 5 5 6 6 6 7 7 7]
 +  my $w = sequence(3)->dummy(1,8)->flat;
 +  # [0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2]
 +  my $b = qsort sequence(24) % 2;
 +  # [0 0 0 0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1 1 1 1 1]
 +  my %m = $d->anova_rptd($s,$w,$b,{ivnm=>['within','between'],btwn=>[1],plot=>0, v=>0});
 +  test_stats_cmp(\%m, \%anova_ans_l2_common);
 +}
 +if (0) { # FIXME
 +  # eps=.001 anova_rptd mixed with 3 btwn-subj var levels, data grouped by within var
 +  my $d = pdl qw( 5 2 2 5 4 1 5 3 5 4 4 3 4 3 4 3 5 1 4 3 3 4 5 4 5 5 2 );
 +  my $s = sequence(9)->dummy(1,3)->flat;
 +  # [0 1 2 3 4 5 6 7 8 0 1 2 3 4 5 6 7 8 0 1 2 3 4 5 6 7 8]
 +  my $w = qsort sequence(27) % 3;
 +  # [0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2 2]
 +  my $b = (sequence(9) % 3)->qsort->dummy(1,3)->flat;
 +  # [0 0 0 1 1 1 2 2 2 0 0 0 1 1 1 2 2 2 0 0 0 1 1 1 2 2 2]
 +  my %m = $d->anova_rptd($s,$w,$b,{ivnm=>['within','between'],btwn=>[1],plot=>0, v=>0});
 +  test_stats_cmp(\%m, \%anova_ans_l3_common);
 +}
 +if (0) { # FIXME
 +  # eps=.001 anova_rptd mixed with 3 btwn-subj var levels, data grouped by subject
 +  my $d = pdl qw( 5 4 4 2 4 3 2 3 3 5 4 4 4 3 5 1 4 4 5 3 5 3 5 5 5 1 2 );
 +  my $s = qsort sequence(27) % 9;
 +  # [0 0 0 1 1 1 2 2 2 3 3 3 4 4 4 5 5 5 6 6 6 7 7 7 8 8 8]
 +  my $w = sequence(3)->dummy(1,9)->flat;
 +  # [0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2 0 1 2]
 +  my $b = qsort sequence(27) % 3;
 +  # [0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 2 2]
 +  my %m = $d->anova_rptd($s,$w,$b,{ivnm=>['within','between'],btwn=>[1],plot=>0, v=>0});
 +  test_stats_cmp(\%m, \%anova_ans_l3_common);
 +}
++
 +{ # anova_rptd mixed bad
   my $d = pdl qw( 3 2 1 5 2 1 5 3 1 4 1 2 3 5 5 3 4 2 1 5 4 3 2 2 1 1 1 1 );
   my $s = sequence(4)->dummy(1,6)->flat;
 # [0 1 2 3 0 1 2 3 0 1 2 3 0 1 2 3 0 1 2 3 0 1 2 3]
   });
+}
 -ok tapprox( t_anova_rptd_mixed_4w(), 0 ), 'anova_rptd_mixed_4w';
 -sub t_anova_rptd_mixed_4w {
 +{ # anova_rptd_mixed_4w
   my ($data, $idv, $subj) = rtable \*DATA, {v=>0};
   my ($age, $aa, $beer, $wings, $dv) = $data->dog;
   my %m = $dv->anova_rptd( $subj, $age, $aa, $beer, $wings, { ivnm=>[qw(age aa beer wings)], btwn=>[0,1], v=>0, plot=>0 } );
   my $a = effect_code( sequence(12) > 5 );
   my $b = effect_code([ map {(0, 1)} (1..6) ]);
   my $c = effect_code([ map {(0,0,1,1,2,2)} (1..2) ]);
+-
 -  my $ans = pdl [
 -   [qw( 1 -1  0 -0 -1  1 -1  1 -0  0  1 -1 )],
 -   [qw( 0 -0  1 -1 -1  1 -0  0 -1  1  1 -1 )]
 -  ];
 +  my $ans = pdl '1 -1  0 -0 -1  1 -1  1 -0  0  1 -1; 0 -0  1 -1 -1  1 -0  0 -1  1  1 -1';
   my $inter = interaction_code( $a, $b, $c);
+-
 -  is(sum(abs($inter - $ans)), 0, 'interaction_code');
 +  is_pdl $inter, $ans, 'interaction_code';
+}
 done_testing();
 -sub lvalue_assign_detour {
 -    my ($pdl, $index, $new_value) = @_;
+-
 -    my @arr = list $pdl;
 -    my @ind = ref($index)? list($index) : $index;
 -    $arr[$_] = $new_value
 -        for (@ind);
+-
 -    return pdl(\@arr)->reshape($pdl->dims)->sever;
 -}
+-
 __DATA__
 subj	age	Apple-android	beer	wings	recall
 	0	0	0	0	5