4 Spending our data
+General data splitting
+Re-emphasize the roles of different data sets and good/bad ways of doing things.
+Validation sets.
+What we do differently with a lot of data.
+Allude to resampling.
+ +diff --git a/TMwR.bib b/TMwR.bib index a725d7ce..c980228c 100644 --- a/TMwR.bib +++ b/TMwR.bib @@ -147,4 +147,23 @@ @book{bolstad2004 author={Bolstad, B}, year={2004}, publisher={University of California, Berkeley} +} + + +@article{Durrleman1989, + author = {Durrleman, S and Simon, R}, + title = {Flexible regression models with cubic splines}, + journal = {Statistics in Medicine}, + volume = {8}, + number = {5}, + pages = {551-561}, + year = {1989} +} + + +@book{kuhn20202, + title={Feature engineering and selection: A practical approach for predictive models}, + author={Kuhn, M and Johnson, K}, + year={2020}, + publisher={CRC Press} } \ No newline at end of file diff --git a/_book/a-model-workflow.html b/_book/a-model-workflow.html index 4c465884..fb4536e1 100644 --- a/_book/a-model-workflow.html +++ b/_book/a-model-workflow.html @@ -24,7 +24,7 @@ - + diff --git a/_book/a-tale-of-two-models.html b/_book/a-tale-of-two-models.html index 31d45696..3985d1de 100644 --- a/_book/a-tale-of-two-models.html +++ b/_book/a-tale-of-two-models.html @@ -24,7 +24,7 @@ - + diff --git a/_book/a-tale-of-two-models.md b/_book/a-tale-of-two-models.md index 92725ffe..b2df7124 100644 --- a/_book/a-tale-of-two-models.md +++ b/_book/a-tale-of-two-models.md @@ -1,7 +1,7 @@ -# A tale of two models +# A tale of two models {#two-models} (tentative title) diff --git a/_book/a-tidyverse-primer.html b/_book/a-tidyverse-primer.html index 0273e201..9df0a755 100644 --- a/_book/a-tidyverse-primer.html +++ b/_book/a-tidyverse-primer.html @@ -24,7 +24,7 @@ - + diff --git a/_book/data-spending.html b/_book/data-spending.html new file mode 100644 index 00000000..734b5075 --- /dev/null +++ b/_book/data-spending.html @@ -0,0 +1,177 @@ + + +
+ + + +