pull

JohnMount · JohnMount · commit b7efde57fada · 2019-09-11T08:32:46.000-07:00
diff --git a/README.Rmd b/README.Rmd
@@ -32,7 +32,7 @@ values).  Other input columns are possible explanatory variables
 have missing values) that the user later wants to use to predict "y".
 In practice such an input `data.frame` may not be immediately suitable
 for machine learning procedures that often expect only numeric
-explanatory variables, and may not tolerate missing value.
+explanatory variables, and may not tolerate missing values.
 
 To solve this, `vtreat` builds a transformed `data.frame` where all
 explanatory variable columns have been transformed into a number of
diff --git a/README.md b/README.md
@@ -16,7 +16,7 @@ explanatory variables (typically numeric or categorical/string-valued,
 these columns may have missing values) that the user later wants to use
 to predict “y”. In practice such an input `data.frame` may not be
 immediately suitable for machine learning procedures that often expect
-only numeric explanatory variables, and may not tolerate missing value.
+only numeric explanatory variables, and may not tolerate missing values.
 
 To solve this, `vtreat` builds a transformed `data.frame` where all
 explanatory variable columns have been transformed into a number of
@@ -305,8 +305,8 @@ treatmentsC <- designTreatmentsC(dTrainC, colnames(dTrainC), 'y', TRUE,
                                  verbose=FALSE)
 print(treatmentsC$scoreFrame[, c('origName', 'varName', 'code', 'rsq', 'sig', 'extraModelDegrees')])
  #    origName   varName  code          rsq        sig extraModelDegrees
- #  1        x    x_catP  catP 1.559780e-01 0.22202097                 2
- #  2        x    x_catB  catB 1.142159e-05 0.99166241                 2
+ #  1        x    x_catP  catP 1.030137e-01 0.32099590                 2
+ #  2        x    x_catB  catB 1.125399e-05 0.99172381                 2
  #  3        z         z clean 2.376018e-01 0.13176020                 0
  #  4        z   z_isBAD isBAD 2.960654e-01 0.09248399                 0
  #  5        x  x_lev_NA   lev 2.960654e-01 0.09248399                 0
@@ -349,9 +349,9 @@ treatmentsN = designTreatmentsN(dTrainN, colnames(dTrainN), 'y',
                                 verbose=FALSE)
 print(treatmentsN$scoreFrame[, c('origName', 'varName', 'code', 'rsq', 'sig', 'extraModelDegrees')])
  #    origName   varName  code          rsq       sig extraModelDegrees
- #  1        x    x_catP  catP 3.558824e-01 0.1184999                 2
- #  2        x    x_catN  catN 2.663337e-02 0.6993947                 2
- #  3        x    x_catD  catD 4.226472e-02 0.6252538                 2
+ #  1        x    x_catP  catP 2.105263e-01 0.2528101                 2
+ #  2        x    x_catN  catN 3.205128e-03 0.8940756                 2
+ #  3        x    x_catD  catD 6.666667e-02 0.5369633                 2
  #  4        z         z clean 2.880952e-01 0.1701892                 0
  #  5        z   z_isBAD isBAD 3.333333e-01 0.1339746                 0
  #  6        x  x_lev_NA   lev 3.333333e-01 0.1339746                 0