diff --git a/ccn2019.rev3.Rmd b/ccn2019.rev3.Rmd
index 7a879be..01ebefb 100644
--- a/ccn2019.rev3.Rmd
+++ b/ccn2019.rev3.Rmd
@@ -71,6 +71,18 @@
 #DEBUG inspect_cor(seqs, show_plot = T)
 ```
 
+```{r remove_highly_correlated_predictors}
+# WIP: This is an extra step for non-pls methods to remove highly correlated predictors.
+# Correlations are computed over every column of seqs except the first
+# (presumably the outcome/id column -- TODO confirm).
+cor_matrix <- cor(seqs[, -1])
+# Indices (into cor_matrix) of the predictors flagged at the 0.8 threshold.
+cor_high <- findCorrelation(cor_matrix, cutoff = 0.8)
+high_cor_remove <- colnames(cor_matrix)[cor_high]
+# all_of() drops columns by the names stored in high_cor_remove, so a column
+# of seqs that happened to be called "high_cor_remove" cannot shadow it.
+seqs.uncorr <- seqs %>% select(-all_of(high_cor_remove))
+```
+
 ```{r models}
 #! ===============================================
 #! prepare data for modeling (remove na, etc)