Skip to contents

Returns a named list with four variations of a dataset (listed under Details).

Usage

partition(x, n_ind = min(table(x[[1]])))

Arguments

x

data.frame

n_ind

passed to balance() (by default, the size of the smallest group in the first column of x)

Value

a named list with elements original, random, balanced and balanced_random (see Details)

Details

* original: the dataset passed, untouched
* random: original, but shuffled on the first (i.e. grouping) column
* balanced: original, but balanced on the first column
* balanced_random: balanced, but randomized on the first column

Examples

pig %>% partition()
#> $original
#> # A tibble: 171 × 51
#>    sp         PC1      PC2      PC3      PC4      PC5      PC6      PC7      PC8
#>    <fct>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>
#>  1 WB    -0.0247   7.22e-3 -1.79e-4  0.0119  -9.82e-4  8.82e-3 -0.0104   0.00659
#>  2 WB    -0.00864  2.40e-2 -2.65e-4  0.00924 -1.43e-2 -1.99e-2 -0.00201  0.00375
#>  3 WB     0.0254  -1.68e-4  1.01e-2  0.00135 -6.58e-3 -1.40e-2 -0.0162  -0.00879
#>  4 WB    -0.0438  -2.98e-3 -9.55e-4  0.00969  1.86e-2  3.02e-3 -0.00255 -0.00433
#>  5 WB     0.0137   4.87e-3  1.76e-2 -0.00392 -1.16e-2 -5.32e-3 -0.00227 -0.00114
#>  6 WB     0.0493  -1.68e-2  2.86e-2 -0.00285  7.15e-3  4.62e-3 -0.0142  -0.00286
#>  7 WB    -0.0172  -2.36e-2  1.14e-2 -0.0116  -3.83e-3 -1.07e-2 -0.00379  0.00158
#>  8 WB     0.00194 -1.01e-2  2.05e-2  0.00390  1.53e-2 -8.58e-4 -0.0147  -0.00140
#>  9 WB    -0.00865  4.70e-3  8.53e-3  0.0149   1.97e-5 -6.02e-3  0.00608  0.00210
#> 10 WB     0.00141  4.27e-3  1.20e-2  0.00546 -1.34e-2 -6.73e-4  0.00912  0.00124
#> # ℹ 161 more rows
#> # ℹ 42 more variables: PC9 <dbl>, PC10 <dbl>, PC11 <dbl>, PC12 <dbl>,
#> #   PC13 <dbl>, PC14 <dbl>, PC15 <dbl>, PC16 <dbl>, PC17 <dbl>, PC18 <dbl>,
#> #   PC19 <dbl>, PC20 <dbl>, PC21 <dbl>, PC22 <dbl>, PC23 <dbl>, PC24 <dbl>,
#> #   PC25 <dbl>, PC26 <dbl>, PC27 <dbl>, PC28 <dbl>, PC29 <dbl>, PC30 <dbl>,
#> #   PC31 <dbl>, PC32 <dbl>, PC33 <dbl>, PC34 <dbl>, PC35 <dbl>, PC36 <dbl>,
#> #   PC37 <dbl>, PC38 <dbl>, PC39 <dbl>, PC40 <dbl>, PC41 <dbl>, PC42 <dbl>, …
#> 
#> $random
#> # A tibble: 171 × 51
#>    sp         PC1      PC2      PC3      PC4      PC5      PC6      PC7      PC8
#>    <fct>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>
#>  1 WB    -0.0247   7.22e-3 -1.79e-4  0.0119  -9.82e-4  8.82e-3 -0.0104   0.00659
#>  2 DP    -0.00864  2.40e-2 -2.65e-4  0.00924 -1.43e-2 -1.99e-2 -0.00201  0.00375
#>  3 WB     0.0254  -1.68e-4  1.01e-2  0.00135 -6.58e-3 -1.40e-2 -0.0162  -0.00879
#>  4 WB    -0.0438  -2.98e-3 -9.55e-4  0.00969  1.86e-2  3.02e-3 -0.00255 -0.00433
#>  5 WB     0.0137   4.87e-3  1.76e-2 -0.00392 -1.16e-2 -5.32e-3 -0.00227 -0.00114
#>  6 DP     0.0493  -1.68e-2  2.86e-2 -0.00285  7.15e-3  4.62e-3 -0.0142  -0.00286
#>  7 WB    -0.0172  -2.36e-2  1.14e-2 -0.0116  -3.83e-3 -1.07e-2 -0.00379  0.00158
#>  8 WB     0.00194 -1.01e-2  2.05e-2  0.00390  1.53e-2 -8.58e-4 -0.0147  -0.00140
#>  9 WB    -0.00865  4.70e-3  8.53e-3  0.0149   1.97e-5 -6.02e-3  0.00608  0.00210
#> 10 WB     0.00141  4.27e-3  1.20e-2  0.00546 -1.34e-2 -6.73e-4  0.00912  0.00124
#> # ℹ 161 more rows
#> # ℹ 42 more variables: PC9 <dbl>, PC10 <dbl>, PC11 <dbl>, PC12 <dbl>,
#> #   PC13 <dbl>, PC14 <dbl>, PC15 <dbl>, PC16 <dbl>, PC17 <dbl>, PC18 <dbl>,
#> #   PC19 <dbl>, PC20 <dbl>, PC21 <dbl>, PC22 <dbl>, PC23 <dbl>, PC24 <dbl>,
#> #   PC25 <dbl>, PC26 <dbl>, PC27 <dbl>, PC28 <dbl>, PC29 <dbl>, PC30 <dbl>,
#> #   PC31 <dbl>, PC32 <dbl>, PC33 <dbl>, PC34 <dbl>, PC35 <dbl>, PC36 <dbl>,
#> #   PC37 <dbl>, PC38 <dbl>, PC39 <dbl>, PC40 <dbl>, PC41 <dbl>, PC42 <dbl>, …
#> 
#> $balanced
#> # A tibble: 84 × 51
#>    sp         PC1      PC2      PC3      PC4      PC5      PC6      PC7      PC8
#>    <fct>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>
#>  1 DP    -0.0795   1.05e-2 -0.00151  0.00337 -8.65e-3 -2.58e-3  0.0113  -0.0134 
#>  2 DP    -0.0504  -3.02e-4  0.00555 -0.00218 -1.21e-2  8.24e-3 -0.00513  0.00286
#>  3 DP     0.0238  -1.47e-2  0.0118  -0.0264  -1.52e-2 -1.13e-2  0.0161  -0.00482
#>  4 DP    -0.0971  -8.33e-3 -0.0433   0.00436  2.28e-3  6.56e-3 -0.0148  -0.00986
#>  5 DP    -0.0791  -7.97e-3  0.00727  0.00714 -8.65e-3  1.02e-2  0.0110  -0.0179 
#>  6 DP     0.0190  -3.28e-3 -0.00412 -0.00478  1.64e-2 -1.57e-2  0.00642 -0.00433
#>  7 DP     0.0238  -1.47e-2  0.0118  -0.0264  -1.52e-2 -1.13e-2  0.0161  -0.00482
#>  8 DP    -0.00928 -3.65e-2  0.0107  -0.0235  -9.88e-4  7.92e-4 -0.00297  0.00382
#>  9 DP    -0.111   -5.70e-2  0.00831  0.00552 -3.54e-2 -3.33e-2 -0.00945 -0.00685
#> 10 DP    -0.0751   2.45e-2 -0.00527 -0.00418  1.11e-3 -1.63e-2 -0.0164  -0.00319
#> # ℹ 74 more rows
#> # ℹ 42 more variables: PC9 <dbl>, PC10 <dbl>, PC11 <dbl>, PC12 <dbl>,
#> #   PC13 <dbl>, PC14 <dbl>, PC15 <dbl>, PC16 <dbl>, PC17 <dbl>, PC18 <dbl>,
#> #   PC19 <dbl>, PC20 <dbl>, PC21 <dbl>, PC22 <dbl>, PC23 <dbl>, PC24 <dbl>,
#> #   PC25 <dbl>, PC26 <dbl>, PC27 <dbl>, PC28 <dbl>, PC29 <dbl>, PC30 <dbl>,
#> #   PC31 <dbl>, PC32 <dbl>, PC33 <dbl>, PC34 <dbl>, PC35 <dbl>, PC36 <dbl>,
#> #   PC37 <dbl>, PC38 <dbl>, PC39 <dbl>, PC40 <dbl>, PC41 <dbl>, PC42 <dbl>, …
#> 
#> $balanced_random
#> # A tibble: 84 × 51
#>    sp         PC1      PC2      PC3      PC4      PC5      PC6      PC7      PC8
#>    <fct>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>    <dbl>
#>  1 DP     0.00508 -8.73e-3 -0.00596 -0.00452  7.88e-4 -0.00345 -9.08e-5  0.00338
#>  2 WB     0.0374  -2.32e-2  0.0116  -0.0153   3.94e-3 -0.0103   1.52e-2 -0.0135 
#>  3 DP    -0.111   -5.70e-2  0.00831  0.00552 -3.54e-2 -0.0333  -9.45e-3 -0.00685
#>  4 WB    -0.0269  -1.20e-2 -0.00834 -0.0112   5.47e-3 -0.00261  9.14e-3 -0.00153
#>  5 WB    -0.00876 -2.24e-2 -0.0256  -0.0103   1.09e-3 -0.00316  8.02e-4 -0.00915
#>  6 DP     0.0138   1.31e-2 -0.00803  0.00174  1.91e-2 -0.00591  1.46e-2 -0.00762
#>  7 DP    -0.0400   9.77e-4  0.00657 -0.00292  4.25e-3  0.00793 -5.02e-5 -0.00935
#>  8 WB    -0.0751   2.45e-2 -0.00527 -0.00418  1.11e-3 -0.0163  -1.64e-2 -0.00319
#>  9 WB    -0.0170   7.31e-4 -0.0118  -0.00323  1.04e-2 -0.0133  -7.02e-4 -0.00648
#> 10 WB    -0.0795   1.05e-2 -0.00151  0.00337 -8.65e-3 -0.00258  1.13e-2 -0.0134 
#> # ℹ 74 more rows
#> # ℹ 42 more variables: PC9 <dbl>, PC10 <dbl>, PC11 <dbl>, PC12 <dbl>,
#> #   PC13 <dbl>, PC14 <dbl>, PC15 <dbl>, PC16 <dbl>, PC17 <dbl>, PC18 <dbl>,
#> #   PC19 <dbl>, PC20 <dbl>, PC21 <dbl>, PC22 <dbl>, PC23 <dbl>, PC24 <dbl>,
#> #   PC25 <dbl>, PC26 <dbl>, PC27 <dbl>, PC28 <dbl>, PC29 <dbl>, PC30 <dbl>,
#> #   PC31 <dbl>, PC32 <dbl>, PC33 <dbl>, PC34 <dbl>, PC35 <dbl>, PC36 <dbl>,
#> #   PC37 <dbl>, PC38 <dbl>, PC39 <dbl>, PC40 <dbl>, PC41 <dbl>, PC42 <dbl>, …
#>