(Banaue rice terraces. Photo: Jon Rawlinson)

In a previous
+article, we showed the use of partial pooling, or
+hierarchical/multilevel models, for level coding high-cardinality
+categorical variables in vtreat. In
+this article, we will discuss a little more about the how and why of
+partial pooling in R.
+
We will use the lme4 package to fit the hierarchical
+models. The acronym “lme” stands for “linear mixed-effects” models:
+models that combine so-called “fixed effects” and “random effects” in a
+single (generalized) linear model. The lme4 documentation
+uses the random/fixed effects terminology, but we are going to follow
+Gelman and Hill, and avoid the use of the terms “fixed” and “random”
+effects.
+
+The varying coefficients [corresponding to the levels of a
+categorical variable] in a multilevel model are sometimes called
+random effects, a term that refers to the randomness in the
+probability model for the group-level coefficients….
+
+
+The term fixed effects is used in contrast to random effects
+– but not in a consistent way! … Because of the conflicting definitions
+and advice, we will avoid the terms “fixed” and “random” entirely, and
+focus on the description of the model itself…
+
+
– Gelman and Hill 2007, Chapter 11.4
+
We will also restrict ourselves to the case that vtreat
+considers: partially pooled estimates of conditional group expectations,
+with no other predictors considered.
+
+
The Data
+
Let’s assume that the data is generated from a mixture of \(M\) populations; each population is
normally distributed with its own (unknown) mean \(\mu_{gp}\), and all populations share the same
(unknown) standard deviation \(\sigma_w\):
+
\[
y_{gp} \sim N(\mu_{gp}, {\sigma_{w}}^2)
\]
+
The population means themselves are normally distributed, with
+unknown mean \(\mu_0\) and unknown
+standard deviation \(\sigma_b\):
+
\[
\mu_{gp} \sim N(\mu_0, {\sigma_{b}}^2)
\]
+
(The subscripts w and b stand for “within-group”
+and “between-group” standard deviations, respectively.)
+
We can generate a synthetic data set according to these assumptions,
+with distributions similar to the distributions observed in the radon
+data set that we used in our earlier post: 85 groups, sampled unevenly.
+We’ll use \(\mu_0 = 0, \sigma_w = 0.7,
\sigma_b = 0.5\).
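
For reference, here is a sketch of one way such a data set could be generated. The article’s actual generation code is not shown, so the random seed, the group-size scheme, and the helper names (mu_gp, sizes, true_means) below are assumptions, not the original recipe.

``` r
set.seed(2362)                        # arbitrary seed, for reproducibility of the sketch only

ngroup       <- 85
mu0          <- 0
sigma_b_true <- 0.5                   # between-group standard deviation
sigma_w_true <- 0.7                   # within-group standard deviation

# true (unobserved) group means
mu_gp <- rnorm(ngroup, mean = mu0, sd = sigma_b_true)

# skewed group sizes: a few heavily sampled groups, many small ones
sizes <- pmax(1, rpois(ngroup, lambda = exp(rnorm(ngroup, mean = 2, sd = 1))))

# observations: each y is drawn around its group's true mean
df <- data.frame(
  gp = rep(paste0("gp", seq_len(ngroup)), times = sizes),
  y  = rnorm(sum(sizes), mean = rep(mu_gp, times = sizes), sd = sigma_w_true),
  stringsAsFactors = FALSE
)

# lookup table of true group means, used for comparisons later
true_means <- data.frame(gp = paste0("gp", seq_len(ngroup)),
                         mu = mu_gp,
                         stringsAsFactors = FALSE)
```

Here, we take a peek at our data, df.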
+
head(df)
+
##     gp          y
## 1 gp75  1.1622536
## 2 gp26 -1.0026492
## 3 gp26 -0.4317629
## 4 gp43  0.3547021
## 5 gp19 -0.5028478
## 6 gp41  0.1239806
+
(Figure: number of observations per group, showing the uneven sampling.)
+
As the graph shows, some groups were heavily sampled, but most groups
have only a handful of samples in the data set. Since this is synthetic
data, we know the true population means (shown in red in the graph
below), and we can compare them to the observed means \(\bar{y}_i\) of each group \(i\)
(shown in black, with standard errors; the gray points are the
individual observations). We’ve sorted the groups by the number of
observations.
+
(Figure: observed group means with standard errors (black) and true population means (red), with individual observations in gray; groups are sorted by number of observations.)
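
Below is a sketch of how such a plot could be drawn with ggplot2, assuming the true_means lookup (and the generated df) from the sketch above; the column names are illustrative.

``` r
library(dplyr)
library(ggplot2)

# per-group summaries: count, observed mean, and standard error
gp_summary <- df %>%
  group_by(gp) %>%
  summarize(nobs = n(),
            ybar = mean(y),
            se   = sd(y) / sqrt(n())) %>%
  mutate(se = ifelse(is.na(se), 0, se)) %>%     # groups with a single observation
  left_join(true_means, by = "gp") %>%
  arrange(nobs) %>%
  mutate(gp = factor(gp, levels = gp))          # order the x-axis by sample size

ggplot(gp_summary, aes(x = gp)) +
  geom_point(aes(y = mu), color = "red") +                              # true group means
  geom_pointrange(aes(y = ybar, ymin = ybar - se, ymax = ybar + se)) +  # observed means +/- standard error
  theme(axis.text.x = element_blank(), axis.ticks.x = element_blank())
```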
+
For groups with many observations, the observed group mean is near
+the true mean. For groups with few observations, the estimates are
+uncertain, and the observed group mean can be far from the true
+population mean.
+
Can we get better estimates of the conditional mean for groups with
+only a few observations?
+
+
+
Partial Pooling
+
If the data is generated by the process described above, and if we
+knew \(\sigma_w\) and \(\sigma_b\), then a good estimate \(\hat{y}_i\) for the mean of group \(i\) is the weighted average of the grand
+mean over all the data, \(\bar{y}\),
+and the observed mean of all the observations in group \(i\), \(\bar{y}_i\).
+
\[
+\large
+\hat{y_i} \approx \frac{\frac{n_i} {\sigma_w^2} \cdot \bar{y}_i +
+\frac{1}{\sigma_b^2} \cdot \bar{y}}
+{\frac{n_i} {\sigma_w^2} + \frac{1}{\sigma_b^2}}
+\]
+
where \(n_i\) is the number of
+observations for group \(i\). In other
+words, for groups where you have a lot of observations, use an estimate
+close to the observed group mean. For groups where you have only a few
+observations, fall back to an estimate close to the grand mean.
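
For example, with the values used to generate our data (\(\sigma_w = 0.7\), \(\sigma_b = 0.5\)), a group with \(n_i = 2\) observations puts weight \((2/0.49)/(2/0.49 + 1/0.25) \approx 0.51\) on its own observed mean, while a group with \(n_i = 50\) observations puts a weight of about \(0.96\) on its own mean.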
+
Gelman and Hill call the grand mean the complete-pooling
+estimate, because the data from all the groups is pooled to create the
+estimate (which is the same for all \(i\)). The “raw” observed means are the
+no-pooling estimate, because no pooling occurs; only
+observations from group \(i\)
+contribute to \(\hat{y_i}\). The
+weighted sum of the complete-pooling and the no-pooling estimate is
+hence the partial-pooling estimate.
+
Of course, in practice we don’t know \(\sigma_w\) and \(\sigma_b\). The lmer function
+essentially solves for the restricted maximum likelihood (REML)
+estimates of the appropriate parameters in order to estimate \(\hat{y_i}\). You can express multilevel
models in lme4 using the term (1 | gp) in formulas, which designates
gp as the grouping variable for which you want conditional
estimates. The model that we are interested in
+is the simplest: outcome as a function of the grouping variable, with no
+other predictors.
+
library(lme4)

poolmod = lmer(y ~ (1 | gp), data=df)
+
See section 2.2 of this
+lmer vignette for more discussion on writing formulas
+for models with additional predictors. Printing poolmod
displays the REML estimates of the grand mean (the intercept), \(\sigma_b\) (the standard deviation of the gp effect), and \(\sigma_w\) (the residual standard deviation).
+
poolmod
+
## Linear mixed model fit by REML ['lmerMod']
## Formula: y ~ (1 | gp)
##    Data: df
## REML criterion at convergence: 2282.939
## Random effects:
##  Groups   Name        Std.Dev.
##  gp       (Intercept) 0.5348
##  Residual             0.7063
## Number of obs: 1002, groups:  gp, 85
## Fixed Effects:
## (Intercept)
##    -0.02761
+
To pull these values out explicitly:
+
# the estimated grand mean
+(grandmean_est= fixef(poolmod))
+
## (Intercept)
+## -0.02760728
+
library(dplyr)   # for %>%, filter(), and pull(), if not already loaded

# get the estimated between-group standard deviation
(sigma_b = as.data.frame(VarCorr(poolmod)) %>%
+ filter(grp=="gp") %>%
+ pull(sdcor))
+
## [1] 0.5348401
+
# get the estimated within-group standard deviation
+(sigma_w = as.data.frame(VarCorr(poolmod)) %>%
+ filter(grp=="Residual") %>%
+ pull(sdcor))
+
## [1] 0.7063342
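
With these estimates in hand, we can apply the weighted-average formula from the previous section by hand and check it against the per-group estimates that lmer reports. This is just a sketch; the helper names below (grand, by_hand, lmer_est) are ours, not from the original analysis.

``` r
# the REML estimate of the grand mean, as a plain number
grand <- as.numeric(grandmean_est)

# apply the partial-pooling formula directly, using the estimated standard deviations
by_hand <- df %>%
  group_by(gp) %>%
  summarize(nobs = n(), ybar = mean(y)) %>%
  mutate(w_gp    = nobs / sigma_w^2,    # precision of the observed group mean
         w_grand = 1 / sigma_b^2,       # precision assigned to the grand mean
         pooled  = (w_gp * ybar + w_grand * grand) / (w_gp + w_grand))

# lmer's per-group estimates: intercept plus conditional modes, matched by group name
lmer_est <- coef(poolmod)$gp[as.character(by_hand$gp), "(Intercept)"]

head(data.frame(gp = by_hand$gp, formula = by_hand$pooled, lmer = lmer_est))
```

For a Gaussian model like this one, the two sets of estimates should agree very closely.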
+
predict(poolmod) will return the partial pooling
+estimates of the group means. Below, we compare the partial pooling
+estimates to the raw group mean expectations. The gray lines represent
+the true group means, the dark blue horizontal line is the observed
+grand mean, and the black dots are the estimates. We have again sorted
+the groups by number of observations, and laid them out (with a slight
+jitter) on a log10 scale.
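
Below is a sketch of how the per-group quantities used in these comparisons could be assembled (the pred_frame name and its columns are illustrative, not from the original):

``` r
# per-group raw means, partial-pooling predictions, and the resulting shrinkage
pred_frame <- df %>%
  group_by(gp) %>%
  summarize(nobs = n(), raw = mean(y)) %>%
  mutate(pooled    = predict(poolmod, newdata = data.frame(gp = gp)),
         shrinkage = raw - pooled)
```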
+
(Figure: partial pooling estimates (black) compared to the observed grand mean (dark blue line) and the true group means (gray), groups sorted by number of observations.)
+
For groups with only a few observations, the partial pooling
+“shrinks” the estimates towards the grand mean, which often results
+in a better estimate of the true conditional population means. We can
+see the relationship between shrinkage (the raw estimate minus the
+partial pooling estimate) and the groups, ordered by sample size.
+
(Figure: shrinkage (raw estimate minus partial pooling estimate) by group, ordered by sample size.)
+
For this data set, the partial pooling estimates are on average
+closer to the true means than the raw estimates; we can see this by
+comparing the root mean squared errors of the two estimates.
+
| estimate_type   |      rmse |
|:----------------|----------:|
| raw             | 0.3261321 |
| partial pooling | 0.2484646 |

+
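Here is a sketch of how these numbers could be computed, reusing the pred_frame and true_means objects assumed in the sketches above:

``` r
rmse <- function(err) sqrt(mean(err^2))

est_frame <- pred_frame %>% left_join(true_means, by = "gp")

rmse(est_frame$raw    - est_frame$mu)   # raw (no-pooling) estimates
rmse(est_frame$pooled - est_frame$mu)   # partial-pooling estimates
```
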
The Discrete Case
+
For discrete (binary) outcomes or classification, use the function
+glmer() to fit multilevel logistic regression models.
+Suppose we want to predict \(\mbox{P}(y > 0
+\,|\, gp)\), the conditional probability that the outcome \(y\) is positive, as a function of \(gp\).
+
# define a binary outcome: is y positive?
df$ispos = df$y > 0
+
+# fit a logistic regression model
+mod_glm = glm(ispos ~ gp, data=df, family=binomial)
+
Again, the conditional probability estimates will be highly uncertain
+for groups with only a few observations. We can fit a multilevel model
+with glmer and compare the distributions of the resulting
+predictions in link space.
+
mod_glmer = glmer(ispos ~ (1|gp), data=df, family=binomial)
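
For the comparison, link-scale (log-odds) predictions can be pulled from both models; a small sketch:

``` r
link_glm   <- predict(mod_glm)     # predict.glm defaults to type = "link"
link_glmer <- predict(mod_glmer)   # predict.merMod also defaults to the link scale

summary(link_glm)
summary(link_glmer)
```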
+
(Figure: distributions of the logistic regression (glm) and multilevel (glmer) predictions, in link space.)
+
Note that the distribution of predictions for the standard logistic
+regression model is trimodal, and that for some groups, the logistic
+regression model predicts probabilities very close to 0 or to 1. In most
+cases, these predictions will correspond to groups with few
+observations, and are unlikely to be good estimates of the true
+conditional probability. The partial pooling model avoids making
+unjustified predictions near 0 or 1, instead “shrinking” the
+estimates to the estimated global probability that \(y > 0\), which in this case is about
+0.49.
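
That global estimate can be read off the intercept of the multilevel model; a small sketch:

``` r
# inverse logit of the fitted intercept: the estimated global probability that y > 0
plogis(as.numeric(fixef(mod_glmer)))   # roughly 0.49 for this data
```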
+
We can see how the number of observations corresponds to the
+shrinkage (the difference between the logistic regression and the
+partial pooling estimates) in the graph below (this time in probability
+space). Points in orange correspond to groups where the logistic
+regression estimated probabilities of 0 or 1 (the two outer lobes of the
+response distribution). Multimodal densities are often symptoms of model
+flaws such as omitted variables or un-modeled mixtures, so it is
+exciting to see the partially pooled estimator avoid the “wings” seen in
+the simpler logistic regression estimator.
+
(Figure: shrinkage (logistic regression estimate minus partial pooling estimate) versus number of observations, in probability space; orange points mark groups where the logistic regression predicted probabilities of essentially 0 or 1.)
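
Here is a sketch of how the quantities in this graph could be computed (the prob_frame name and the threshold for flagging extreme predictions are illustrative):

``` r
# per-group predictions in probability space, and the resulting shrinkage
prob_frame <- df %>%
  group_by(gp) %>%
  summarize(nobs = n()) %>%
  mutate(p_glm     = predict(mod_glm,   newdata = data.frame(gp = gp), type = "response"),
         p_glmer   = predict(mod_glmer, newdata = data.frame(gp = gp), type = "response"),
         shrinkage = p_glm - p_glmer,
         extreme   = p_glm < 1e-6 | p_glm > 1 - 1e-6)   # groups predicted at (essentially) 0 or 1
```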
+
+
+
+
Partial Pooling Degrades Gracefully
+
When there is enough data for each population to get a good estimate
+of the population means – for example, when the distribution of groups
+is fairly uniform, or at least not too skewed – the partial pooling
estimates will converge to the raw (no-pooling) estimates. When the
+variation between population means is very low, the partial pooling
+estimates will converge to the complete pooling estimate (the grand
+mean).
+
When there are only a few levels (Gelman and Hill suggest fewer than
about five), there will generally not be enough information to make a
+good estimate of \(\sigma_b\), so the
partially pooled estimates likely won’t be much better than the raw
+estimates.
+
So partial pooling is potentially most valuable when the number of
groups is large and there are many rare levels. With respect
+to vtreat, this is exactly the situation when level coding
+is most useful!
+
Multilevel modeling assumes the data was generated from the mixture
+process above: each population is normally distributed, with the same
+standard deviation, and the population means are also normally
+distributed. Obviously, this may not be the case, but as Gelman and Hill
+argue, the additional inductive bias can be useful for those populations
+where you have little information.
+
Thanks to Geoffrey
+Simmons, Principal Data Scientist at Echo Global Logistics, for
+suggesting partial pooling based level coding for vtreat,
+introducing us to the references, and reviewing our articles.
+
+
+
References
+
Gelman, Andrew and Jennifer Hill. Data Analysis Using Regression
+and Multilevel/Hierarchical Models. Cambridge University Press,
+2007.
+
+
diff --git a/PartialPooling_R/PartialPooling_R.md b/PartialPooling_R/PartialPooling_R.md
new file mode 100644
index 0000000..63601d1
--- /dev/null
+++ b/PartialPooling_R/PartialPooling_R.md
@@ -0,0 +1,231 @@
+---
+title: 'Partial Pooling for Lower Variance Variable Encoding'
+author: "Nina Zumel"
+output:
+  html_document:
+    keep_md: true
+---
+
+