Merge pull request h2oai#271 from h2oai/fv-h2o3-tutorials-code

Added a folder with the R and Python codes for the H2O-3 Tutorials
akshaydeshneni · Nov 20, 2020 · 7bf2bef · 7bf2bef
2 parents 7eed162 + 3f0c00d
commit 7bf2bef
Show file tree

Hide file tree

Showing 72 changed files with 14,760 additions and 2,762 deletions.
diff --git a/...earning-with-h2o-3-part-1/introduction-to-machine-learning-with-h2o-3-part-1.md b/...earning-with-h2o-3-part-1/introduction-to-machine-learning-with-h2o-3-part-1.md
diff --git a/...earning-with-h2o-3-part-2/introduction-to-machine-learning-with-h2o-3-part-2.md b/...earning-with-h2o-3-part-2/introduction-to-machine-learning-with-h2o-3-part-2.md
diff --git a/...roduction-to-machine-learning-with-h2o-3-part-3/assets/aml-cl-leaderboard-1.jpg b/...roduction-to-machine-learning-with-h2o-3-part-3/assets/aml-cl-leaderboard-1.jpg
diff --git a/...roduction-to-machine-learning-with-h2o-3-part-3/assets/aml-cl-leaderboard-2.jpg b/...roduction-to-machine-learning-with-h2o-3-part-3/assets/aml-cl-leaderboard-2.jpg
diff --git a/...ntroduction-to-machine-learning-with-h2o-3-part-3/assets/aml-cl-leaderboard.jpg b/...ntroduction-to-machine-learning-with-h2o-3-part-3/assets/aml-cl-leaderboard.jpg
diff --git a/...ersion/introduction-to-machine-learning-with-h2o-3-part-3/assets/auto-ml-11.jpg b/...ersion/introduction-to-machine-learning-with-h2o-3-part-3/assets/auto-ml-11.jpg
diff --git a/...ersion/introduction-to-machine-learning-with-h2o-3-part-3/assets/auto-ml-66.jpg b/...ersion/introduction-to-machine-learning-with-h2o-3-part-3/assets/auto-ml-66.jpg
diff --git a/...ion/introduction-to-machine-learning-with-h2o-3-part-3/assets/auto-ml-cl-75.jpg b/...ion/introduction-to-machine-learning-with-h2o-3-part-3/assets/auto-ml-cl-75.jpg
diff --git a/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-cl-output.jpg b/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-cl-output.jpg
diff --git a/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-cl-perf-1.jpg b/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-cl-perf-1.jpg
diff --git a/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-cl-perf-2.jpg b/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-cl-perf-2.jpg
diff --git a/...on/introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-cl-pred.jpg b/...on/introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-cl-pred.jpg
diff --git a/...n/introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-cl-preds.jpg b/...n/introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-cl-preds.jpg
diff --git a/...ion/introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-cl-roc.jpg b/...ion/introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-cl-roc.jpg
diff --git a/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-preds-reg.jpg b/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/automl-preds-reg.jpg
diff --git a/...duction-to-machine-learning-with-h2o-3-part-3/assets/automl-reg-leaderboard.jpg b/...duction-to-machine-learning-with-h2o-3-part-3/assets/automl-reg-leaderboard.jpg
diff --git a/...ction-to-machine-learning-with-h2o-3-part-3/assets/automl-reg-leaderboard_1.jpg b/...ction-to-machine-learning-with-h2o-3-part-3/assets/automl-reg-leaderboard_1.jpg
diff --git a/...ction-to-machine-learning-with-h2o-3-part-3/assets/automl-reg-leaderboard_2.jpg b/...ction-to-machine-learning-with-h2o-3-part-3/assets/automl-reg-leaderboard_2.jpg
diff --git a/...roduction-to-machine-learning-with-h2o-3-part-3/assets/automl-reg-summary-1.jpg b/...roduction-to-machine-learning-with-h2o-3-part-3/assets/automl-reg-summary-1.jpg
diff --git a/...roduction-to-machine-learning-with-h2o-3-part-3/assets/automl-reg-summary-2.jpg b/...roduction-to-machine-learning-with-h2o-3-part-3/assets/automl-reg-summary-2.jpg
diff --git a/...roduction-to-machine-learning-with-h2o-3-part-3/assets/automl-reg-summary-3.jpg b/...roduction-to-machine-learning-with-h2o-3-part-3/assets/automl-reg-summary-3.jpg
diff --git a/...ersion/introduction-to-machine-learning-with-h2o-3-part-3/assets/cl-predict.jpg b/...ersion/introduction-to-machine-learning-with-h2o-3-part-3/assets/cl-predict.jpg
diff --git a/...duction-to-machine-learning-with-h2o-3-part-3/assets/cl-predictions-outputs.jpg b/...duction-to-machine-learning-with-h2o-3-part-3/assets/cl-predictions-outputs.jpg
diff --git a/...n/introduction-to-machine-learning-with-h2o-3-part-3/assets/cl-training-auc.jpg b/...n/introduction-to-machine-learning-with-h2o-3-part-3/assets/cl-training-auc.jpg
diff --git a/...sion/introduction-to-machine-learning-with-h2o-3-part-3/assets/cluster-info.jpg b/...sion/introduction-to-machine-learning-with-h2o-3-part-3/assets/cluster-info.jpg
diff --git a/...n/introduction-to-machine-learning-with-h2o-3-part-3/assets/delinquent-dist.jpg b/...n/introduction-to-machine-learning-with-h2o-3-part-3/assets/delinquent-dist.jpg
diff --git a/...roduction-to-machine-learning-with-h2o-3-part-3/assets/flow-automl-build-cl.jpg b/...roduction-to-machine-learning-with-h2o-3-part-3/assets/flow-automl-build-cl.jpg
diff --git a/...introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-automl-build.jpg b/...introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-automl-build.jpg
diff --git a/...introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-automl-reg-1.jpg b/...introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-automl-reg-1.jpg
diff --git a/...introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-automl-reg-2.jpg b/...introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-automl-reg-2.jpg
diff --git a/...introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-automl-reg-3.jpg b/...introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-automl-reg-3.jpg
diff --git a/...n/introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-automl-reg.jpg b/...n/introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-automl-reg.jpg
diff --git a/...achine-learning-with-h2o-3-part-3/assets/flow-automl-regression-leaderboard.jpg b/...achine-learning-with-h2o-3-part-3/assets/flow-automl-regression-leaderboard.jpg
diff --git a/...introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-choose-frame.jpg b/...introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-choose-frame.jpg
diff --git a/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-cl-automl-1.jpg b/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-cl-automl-1.jpg
diff --git a/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-cl-automl-2.jpg b/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-cl-automl-2.jpg
diff --git a/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-cl-automl-3.jpg b/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-cl-automl-3.jpg
diff --git a/...troduction-to-machine-learning-with-h2o-3-part-3/assets/flow-cl-leaderboard.jpg b/...troduction-to-machine-learning-with-h2o-3-part-3/assets/flow-cl-leaderboard.jpg
diff --git a/...rsion/introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-frames.jpg b/...rsion/introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-frames.jpg
diff --git a/...roduction-to-machine-learning-with-h2o-3-part-3/assets/flow-gbm-predictions.jpg b/...roduction-to-machine-learning-with-h2o-3-part-3/assets/flow-gbm-predictions.jpg
diff --git a/...ion/introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-instance.jpg b/...ion/introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-instance.jpg
diff --git a/...tion-to-machine-learning-with-h2o-3-part-3/assets/flow-reg-view-leaderboard.jpg b/...tion-to-machine-learning-with-h2o-3-part-3/assets/flow-reg-view-leaderboard.jpg
diff --git a/...n/introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-run-automl.jpg b/...n/introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-run-automl.jpg
diff --git a/...troduction-to-machine-learning-with-h2o-3-part-3/assets/flow-view-cl-automl.jpg b/...troduction-to-machine-learning-with-h2o-3-part-3/assets/flow-view-cl-automl.jpg
diff --git a/...ntroduction-to-machine-learning-with-h2o-3-part-3/assets/flow-xgb-predict-2.jpg b/...ntroduction-to-machine-learning-with-h2o-3-part-3/assets/flow-xgb-predict-2.jpg
diff --git a/...on/introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-xgb-preds.jpg b/...on/introduction-to-machine-learning-with-h2o-3-part-3/assets/flow-xgb-preds.jpg
diff --git a/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/gbm-actual-preds.jpg b/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/gbm-actual-preds.jpg
diff --git a/...rsion/introduction-to-machine-learning-with-h2o-3-part-3/assets/gbm-predict.jpg b/...rsion/introduction-to-machine-learning-with-h2o-3-part-3/assets/gbm-predict.jpg
diff --git a/...sion/introduction-to-machine-learning-with-h2o-3-part-3/assets/gbm-test-per.jpg b/...sion/introduction-to-machine-learning-with-h2o-3-part-3/assets/gbm-test-per.jpg
diff --git a/...on/introduction-to-machine-learning-with-h2o-3-part-3/assets/gbm-view-preds.jpg b/...on/introduction-to-machine-learning-with-h2o-3-part-3/assets/gbm-view-preds.jpg
diff --git a/...ersion/introduction-to-machine-learning-with-h2o-3-part-3/assets/get-frames.jpg b/...ersion/introduction-to-machine-learning-with-h2o-3-part-3/assets/get-frames.jpg
diff --git a/...introduction-to-machine-learning-with-h2o-3-part-3/assets/leader-automl-reg.jpg b/...introduction-to-machine-learning-with-h2o-3-part-3/assets/leader-automl-reg.jpg
diff --git a/...version/introduction-to-machine-learning-with-h2o-3-part-3/assets/rate-dist.jpg b/...version/introduction-to-machine-learning-with-h2o-3-part-3/assets/rate-dist.jpg
diff --git a/...rsion/introduction-to-machine-learning-with-h2o-3-part-3/assets/split-frame.gif b/...rsion/introduction-to-machine-learning-with-h2o-3-part-3/assets/split-frame.gif
diff --git a/...ion/introduction-to-machine-learning-with-h2o-3-part-3/assets/std_coef_plot.jpg b/...ion/introduction-to-machine-learning-with-h2o-3-part-3/assets/std_coef_plot.jpg
diff --git a/...sion/introduction-to-machine-learning-with-h2o-3-part-3/assets/training-auc.jpg b/...sion/introduction-to-machine-learning-with-h2o-3-part-3/assets/training-auc.jpg
diff --git a/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/xgb-actual-preds.jpg b/.../introduction-to-machine-learning-with-h2o-3-part-3/assets/xgb-actual-preds.jpg
diff --git a/...rsion/introduction-to-machine-learning-with-h2o-3-part-3/assets/xgb-predict.jpg b/...rsion/introduction-to-machine-learning-with-h2o-3-part-3/assets/xgb-predict.jpg
diff --git a/...on/introduction-to-machine-learning-with-h2o-3-part-3/assets/xgb-view-preds.jpg b/...on/introduction-to-machine-learning-with-h2o-3-part-3/assets/xgb-view-preds.jpg
diff --git a/...earning-with-h2o-3-part-3/introduction-to-machine-learning-with-h2o-3-part-3.md b/...earning-with-h2o-3-part-3/introduction-to-machine-learning-with-h2o-3-part-3.md
diff --git a/...on/.ipynb_checkpoints/introduction-to-machine-learning-with-h2o-3-automl-checkpoint.ipynb b/...on/.ipynb_checkpoints/introduction-to-machine-learning-with-h2o-3-automl-checkpoint.ipynb
diff --git a/...b_checkpoints/introduction-to-machine-learning-with-h2o-3-classification-checkpoint.ipynb b/...b_checkpoints/introduction-to-machine-learning-with-h2o-3-classification-checkpoint.ipynb
diff --git a/...ipynb_checkpoints/introduction-to-machine-learning-with-h2o-3-regression-checkpoint.ipynb b/...ipynb_checkpoints/introduction-to-machine-learning-with-h2o-3-regression-checkpoint.ipynb
diff --git a/H2O-3/h2o-3-tutorials-code /Python/introduction-to-machine-learning-with-h2o-3-automl.ipynb b/H2O-3/h2o-3-tutorials-code /Python/introduction-to-machine-learning-with-h2o-3-automl.ipynb
diff --git a/...3-tutorials-code /Python/introduction-to-machine-learning-with-h2o-3-classification.ipynb b/...3-tutorials-code /Python/introduction-to-machine-learning-with-h2o-3-classification.ipynb
diff --git a/...h2o-3-tutorials-code /Python/introduction-to-machine-learning-with-h2o-3-regression.ipynb b/...h2o-3-tutorials-code /Python/introduction-to-machine-learning-with-h2o-3-regression.ipynb
diff --git a/H2O-3/h2o-3-tutorials-code /R/RMD-files/AutoML Tutorial with H2O-3 with R.Rmd b/H2O-3/h2o-3-tutorials-code /R/RMD-files/AutoML Tutorial with H2O-3 with R.Rmd
@@ -0,0 +1,193 @@
+---
+title: "AutoML Tutorial with H2O-3 Using R"
+output: html_notebook
+---
+
+This is an [R Markdown](http://rmarkdown.rstudio.com) Notebook. When you execute code within the notebook, the results appear beneath the code. To execute a code chunk, click the *Run* (play) button within the chunk, or place your cursor inside it and press *Cmd+Shift+Enter*.
+
+## Task 1: Initial Setup
+
+```{r}
+library(h2o)
+library(tidyverse)
+library(DT)
+
+# Start (or connect to) the H2O cluster used by every chunk below.
+# NOTE(review): bind_to_localhost = FALSE and context_path = "h2o" presumably
+# match the hosted lab environment — confirm before running on a local machine.
+h2o.init(bind_to_localhost = FALSE, context_path = "h2o")
+```
+
+```{r}
+# Turn off H2O progress output so the chunk results stay readable.
+h2o.no_progress()
+```
+
+```{r}
+# Load the 50k-row loan-level sample straight from S3 into an H2O frame.
+loan_level <- h2o.importFile(
+  path = "https://s3.amazonaws.com/data.h2o.ai/H2O-3-Tutorials/loan_level_50k.csv"
+)
+```
+
+## Task 2: Machine Learning Concepts - See Tutorial
+
+## Task 3: Start Experiment
+
+```{r}
+# Preview the first rows, then the per-column description, both as tibbles.
+as_tibble(h2o.head(loan_level))
+as_tibble(h2o.describe(loan_level))
+```
+
+```{r}
+# Frequency table of the classification target.
+h2o.table(loan_level[, "DELINQUENT"])
+```
+
+```{r}
+# Histogram of the regression target.
+h2o.hist(loan_level[, "ORIGINAL_INTEREST_RATE"])
+```
+
+```{r}
+# Split with a ratio of 0.8 for the first frame (the remainder becomes the
+# second frame); the fixed seed keeps the partition reproducible.
+splits <- h2o.splitFrame(data = loan_level, ratios = 0.8, seed = 42)
+
+train <- splits[[1]]
+test <- splits[[2]]
+
+# Report the dimensions of each partition.
+dim(train)
+dim(test)
+```
+
+## Task 4: H2O AutoML Classification
+
+```{r}
+# Columns left out of the predictor set; the response itself is listed too.
+ignore <- c(
+  "DELINQUENT",
+  "PREPAID",
+  "PREPAYMENT_PENALTY_MORTGAGE_FLAG",
+  "PRODUCT_TYPE"
+)
+# Response column for the classification task.
+y <- "DELINQUENT"
+
+# Predictors are every training column that is not in `ignore`.
+x <- setdiff(colnames(train), ignore)
+
+x
+```
+
+```{r}
+# Classification AutoML run: at most 25 models, 30 seconds per model, with
+# class balancing enabled through the explicit sampling factors.
+aml_cl <- h2o.automl(
+  x = x,
+  y = y,
+  training_frame = train,
+  project_name = "classification",
+  max_models = 25,
+  max_runtime_secs_per_model = 30,
+  balance_classes = TRUE,
+  class_sampling_factors = c(0.5, 1.25),
+  seed = 42
+)
+```
+
+```{r}
+# Fetch the classification leaderboard and show its first 25 rows.
+lb <- h2o.get_leaderboard(aml_cl)
+h2o.head(lb, n = 25)
+```
+
+```{r}
+# Same leaderboard, this time requesting all extra columns; show the first
+# 25 rows.
+lb2 <- h2o.get_leaderboard(aml_cl, extra_columns = "ALL")
+h2o.head(lb2, n = 25)
+```
+
+```{r}
+# Pull the leaderboard's model ids into a plain R vector
+model_ids <- as.data.frame(aml_cl@leaderboard$model_id)[, 1]
+# Fetch the first model whose id contains "StackedEnsemble_AllModels"
+se <- h2o.getModel(
+  grep("StackedEnsemble_AllModels", model_ids, value = TRUE)[1]
+)
+# Fetch the metalearner model that the stacked ensemble refers to by name
+metalearner <- h2o.getModel(
+  se@model$metalearner$name
+)
+```
+
+```{r}
+# Inspect the metalearner: its coefficients, its normalized coefficients, and
+# a standardized-coefficient plot.
+h2o.coef(metalearner)
+h2o.coef_norm(metalearner)
+h2o.std_coef_plot(metalearner)
+```
+
+```{r}
+# Print the leader model of the classification AutoML run.
+aml_cl@leader
+```
+
+```{r}
+# Keep a handle on the leader model and score it on the held-out test frame.
+aml_leader <- aml_cl@leader
+
+aml_leader_test_perf <- h2o.performance(model = aml_leader, newdata = test)
+```
+
+```{r}
+# AUC of the leader on the test frame, followed by a plot of the same
+# performance object.
+h2o.auc(aml_leader_test_perf)
+plot(aml_leader_test_perf)
+```
+
+```{r}
+# Predict on the test frame with the leader and show the first 10 predictions.
+aml_leader_pred <- h2o.predict(object = aml_leader, newdata = test)
+h2o.head(aml_leader_pred, n = 10)
+```
+
+## Task 5: H2O AutoML Regression
+
+```{r}
+# Columns left out of the regression predictor set; the response is listed too.
+ignore_reg <- c(
+  "ORIGINAL_INTEREST_RATE",
+  "FIRST_PAYMENT_DATE",
+  "MATURITY_DATE",
+  "MORTGAGE_INSURANCE_PERCENTAGE",
+  "PREPAYMENT_PENALTY_MORTGAGE_FLAG",
+  "LOAN_SEQUENCE_NUMBER",
+  "PREPAID",
+  "DELINQUENT",
+  "PRODUCT_TYPE"
+)
+
+# Response column for the regression task.
+y_reg <- "ORIGINAL_INTEREST_RATE"
+
+# Predictors are every training column that is not in `ignore_reg`.
+x_reg <- setdiff(colnames(train), ignore_reg)
+x_reg
+```
+
+```{r}
+# Regression AutoML run: 900-second overall budget, 30 seconds per model,
+# with RMSE used both for early stopping and for ranking the leaderboard.
+aml_reg <- h2o.automl(
+  x = x_reg,
+  y = y_reg,
+  training_frame = train,
+  project_name = "regression",
+  max_runtime_secs = 900,
+  max_runtime_secs_per_model = 30,
+  stopping_metric = 'RMSE',
+  sort_metric = 'RMSE',
+  seed = 42
+)
+```
+
+```{r}
+# Show the complete regression leaderboard. A negative `n` makes h2o.head()
+# return all but the last |n| rows, so `n = -1` silently hid the lowest-ranked
+# model; request every row explicitly instead.
+lb <- h2o.get_leaderboard(aml_reg)
+h2o.head(lb, n = nrow(lb))
+```
+
+To get a specific model, you have two options. The first is to look up its id in the leaderboard:
+
+```{r}
+# Get model ids for all models in the AutoML Leaderboard
+model_ids <- as.data.frame(aml_reg@leaderboard$model_id)[, 1]
+# Pick the first leaderboard model whose id contains "GBM_2"
+gbm_id <- grep("GBM_2", model_ids, value = TRUE)[1]
+# The AutoML run is time-limited, so this model is not guaranteed to exist;
+# fail with a clear message instead of passing NA to h2o.getModel().
+if (is.na(gbm_id)) {
+  stop(
+    'No model id containing "GBM_2" was found in the AutoML leaderboard.',
+    call. = FALSE
+  )
+}
+gbm <- h2o.getModel(gbm_id)
+gbm
+```
+
+Alternatively, you can copy the model id from the leaderboard and place it inside the parentheses:
+```{r}
+# Replace "model_id" with an id copied from the leaderboard, then uncomment:
+#gbm <- h2o.getModel("model_id")
+```
+
+```{r}
+# Look up a few entries, by name, in the model's full parameter list.
+gbm@allparameters[["ntrees"]]
+gbm@allparameters[["max_depth"]]
+gbm@allparameters[["learn_rate"]]
+gbm@allparameters[["sample_rate"]]
+```
+
+```{r}
+# Print the selected GBM model object.
+gbm
+```
+
+```{r}
+# Score the GBM on the held-out test frame and report RMSE and MAE.
+gbm_test_perf <- h2o.performance(model = gbm, newdata = test)
+
+h2o.rmse(gbm_test_perf)
+h2o.mae(gbm_test_perf)
+```
+
+```{r}
+# Predict on the test frame with the GBM.
+gbm_pred <- h2o.predict(object = gbm, newdata = test)
+
+# Put the actual interest rate next to the prediction for comparison.
+preds <- h2o.cbind(test[, "ORIGINAL_INTEREST_RATE"], gbm_pred)
+
+h2o.head(preds, n = 10)
+```
+
+## For Tasks 6-8, please refer to the tutorial's Markdown file
+```{r}
+# Shut down the H2O cluster without waiting for a console confirmation, so the
+# chunk also takes effect when the notebook is rendered non-interactively.
+h2o.shutdown(prompt = FALSE)
+```