From 1e347ae2ff42f5854a25df13e1106127d0bd50d0 Mon Sep 17 00:00:00 2001
From: Jinhwan Kim <hwanistic@gmail.com>
Date: Wed, 15 Nov 2023 15:24:25 +0900
Subject: [PATCH] fix: markdown r codeblock

"```{r}" to

"``` r"
---
 README.md        |   6 +--
 docs/index.html  | 119 ++++++++++++++++++++++++++++++-----------------
 docs/pkgdown.yml |   2 +-
 docs/search.json |   2 +-
 4 files changed, 81 insertions(+), 48 deletions(-)
diff --git a/README.md b/README.md
index 751209f..a07b0a7 100644
--- a/README.md
+++ b/README.md
@@ -19,7 +19,7 @@ devtools::install_github("statgarten/stove")
 
 ### 1. Sample Data Import
 
-```{r}
+``` r
 # remotes::install_github("statgarten/datatoys")
 library(stove)
 library(datatoys)
@@ -39,7 +39,7 @@ cleaned_data <- cleaned_data %>%
 
 ### 2. Data split and Define preprocessing
 
-```{r}
+``` r
 target_var <- "TG"
 train_set_ratio <- 0.7
 seed <- 1234
@@ -69,7 +69,7 @@ rec <- stove::prepForCV(data = data_train,
 
 ### 3. Modeling
 
-```{r}
+``` r
 # User input
 
 mode <- "classification"
diff --git a/docs/index.html b/docs/index.html
index 008f0d0..f44a3e4 100644
--- a/docs/index.html
+++ b/docs/index.html
@@ -88,54 +88,88 @@ <h2 id="example-code">Example Code<a class="anchor" aria-label="anchor" href="#e
 <div class="section level3">
 <h3 id="id_1-sample-data-import">1. Sample Data Import<a class="anchor" aria-label="anchor" href="#id_1-sample-data-import"></a>
 </h3>
-<p>```{r} # remotes::install_github(“statgarten/datatoys”) library(stove) library(datatoys) library(dplyr)</p>
-<p>set.seed(1234)</p>
-<p>cleaned_data &lt;- datatoys::bloodTest</p>
-<p>cleaned_data &lt;- cleaned_data %&gt;% mutate_at(vars(SEX, ANE, IHD, STK), factor) %&gt;% mutate(TG = ifelse(TG &lt; 150, 0, 1)) %&gt;% mutate_at(vars(TG), factor) %&gt;% group_by(TG) %&gt;% sample_n(500) # TG(0):TG(1) = 500:500</p>
-<pre><code>
-### 2. Data split and Define preprocessing
-
-```{r}
-target_var &lt;- "TG"
-train_set_ratio &lt;- 0.7
-seed &lt;- 1234
-formula &lt;- paste0(target_var, " ~ .")
-
-# Split data
-
-split_tmp &lt;- stove::trainTestSplit(data = cleaned_data,
-                                   target = target_var,
-                                   prop = train_set_ratio,
-                                   seed = seed
-                                   )
-
-data_train &lt;- split_tmp[[1]] # train data
-data_test &lt;- split_tmp[[2]] # test data
-data_split &lt;- split_tmp[[3]] # whole data with split information
-
-# Define preprocessing recipe for cross validation
-
-rec &lt;- stove::prepForCV(data = data_train,
-                        formula = formula,
-                        imputation = T,
-                        normalization = T,
-                        seed = seed
-                        )</code></pre>
+<div class="sourceCode" id="cb2"><pre class="downlit sourceCode r">
+<code class="sourceCode R"><span><span class="co"># remotes::install_github("statgarten/datatoys")</span></span>
+<span><span class="kw"><a href="https://rdrr.io/r/base/library.html" class="external-link">library</a></span><span class="op">(</span><span class="va"><a href="https://github.com/statgarten/stove" class="external-link">stove</a></span><span class="op">)</span></span>
+<span><span class="kw"><a href="https://rdrr.io/r/base/library.html" class="external-link">library</a></span><span class="op">(</span><span class="va"><a href="https://statgarten.github.io/datatoys/" class="external-link">datatoys</a></span><span class="op">)</span></span>
+<span><span class="kw"><a href="https://rdrr.io/r/base/library.html" class="external-link">library</a></span><span class="op">(</span><span class="va"><a href="https://dplyr.tidyverse.org" class="external-link">dplyr</a></span><span class="op">)</span></span>
+<span></span>
+<span><span class="fu"><a href="https://rdrr.io/r/base/Random.html" class="external-link">set.seed</a></span><span class="op">(</span><span class="fl">1234</span><span class="op">)</span></span>
+<span></span>
+<span><span class="va">cleaned_data</span> <span class="op">&lt;-</span> <span class="fu">datatoys</span><span class="fu">::</span><span class="va"><a href="https://statgarten.github.io/datatoys/reference/bloodTest.html" class="external-link">bloodTest</a></span></span>
+<span></span>
+<span><span class="va">cleaned_data</span> <span class="op">&lt;-</span> <span class="va">cleaned_data</span> <span class="op"><a href="reference/pipe.html">%&gt;%</a></span></span>
+<span>  <span class="fu"><a href="https://dplyr.tidyverse.org/reference/mutate_all.html" class="external-link">mutate_at</a></span><span class="op">(</span><span class="fu"><a href="https://dplyr.tidyverse.org/reference/vars.html" class="external-link">vars</a></span><span class="op">(</span><span class="va">SEX</span>, <span class="va">ANE</span>, <span class="va">IHD</span>, <span class="va">STK</span><span class="op">)</span>, <span class="va">factor</span><span class="op">)</span> <span class="op"><a href="reference/pipe.html">%&gt;%</a></span></span>
+<span>  <span class="fu"><a href="https://dplyr.tidyverse.org/reference/mutate.html" class="external-link">mutate</a></span><span class="op">(</span>TG <span class="op">=</span> <span class="fu"><a href="https://rdrr.io/r/base/ifelse.html" class="external-link">ifelse</a></span><span class="op">(</span><span class="va">TG</span> <span class="op">&lt;</span> <span class="fl">150</span>, <span class="fl">0</span>, <span class="fl">1</span><span class="op">)</span><span class="op">)</span> <span class="op"><a href="reference/pipe.html">%&gt;%</a></span></span>
+<span>  <span class="fu"><a href="https://dplyr.tidyverse.org/reference/mutate_all.html" class="external-link">mutate_at</a></span><span class="op">(</span><span class="fu"><a href="https://dplyr.tidyverse.org/reference/vars.html" class="external-link">vars</a></span><span class="op">(</span><span class="va">TG</span><span class="op">)</span>, <span class="va">factor</span><span class="op">)</span> <span class="op"><a href="reference/pipe.html">%&gt;%</a></span></span>
+<span>  <span class="fu"><a href="https://dplyr.tidyverse.org/reference/group_by.html" class="external-link">group_by</a></span><span class="op">(</span><span class="va">TG</span><span class="op">)</span> <span class="op"><a href="reference/pipe.html">%&gt;%</a></span></span>
+<span>  <span class="fu"><a href="https://dplyr.tidyverse.org/reference/sample_n.html" class="external-link">sample_n</a></span><span class="op">(</span><span class="fl">500</span><span class="op">)</span> <span class="co"># TG(0):TG(1) = 500:500</span></span></code></pre></div>
 </div>
 <div class="section level3">
-<h3 id="id_3-modeling">3. Modeling<a class="anchor" aria-label="anchor" href="#id_3-modeling"></a>
+<h3 id="id_2-data-split-and-define-preprocessing">2. Data split and Define preprocessing<a class="anchor" aria-label="anchor" href="#id_2-data-split-and-define-preprocessing"></a>
 </h3>
-<p>```{r} # User input</p>
-<p>mode &lt;- “classification” algo &lt;- “logisticRegression” # Custom name engine &lt;- “glmnet” # glmnet (default) v &lt;- 2 metric &lt;- “roc_auc” # roc_auc (default), accuracy gridNum &lt;- 5 iter &lt;- 10 seed &lt;- 1234</p>
-</div>
+<div class="sourceCode" id="cb3"><pre class="downlit sourceCode r">
+<code class="sourceCode R"><span><span class="va">target_var</span> <span class="op">&lt;-</span> <span class="st">"TG"</span></span>
+<span><span class="va">train_set_ratio</span> <span class="op">&lt;-</span> <span class="fl">0.7</span></span>
+<span><span class="va">seed</span> <span class="op">&lt;-</span> <span class="fl">1234</span></span>
+<span><span class="va">formula</span> <span class="op">&lt;-</span> <span class="fu"><a href="https://rdrr.io/r/base/paste.html" class="external-link">paste0</a></span><span class="op">(</span><span class="va">target_var</span>, <span class="st">" ~ ."</span><span class="op">)</span></span>
+<span></span>
+<span><span class="co"># Split data</span></span>
+<span></span>
+<span><span class="va">split_tmp</span> <span class="op">&lt;-</span> <span class="fu">stove</span><span class="fu">::</span><span class="fu"><a href="reference/trainTestSplit.html">trainTestSplit</a></span><span class="op">(</span>data <span class="op">=</span> <span class="va">cleaned_data</span>,</span>
+<span>                                   target <span class="op">=</span> <span class="va">target_var</span>,</span>
+<span>                                   prop <span class="op">=</span> <span class="va">train_set_ratio</span>,</span>
+<span>                                   seed <span class="op">=</span> <span class="va">seed</span></span>
+<span>                                   <span class="op">)</span></span>
+<span></span>
+<span><span class="va">data_train</span> <span class="op">&lt;-</span> <span class="va">split_tmp</span><span class="op">[[</span><span class="fl">1</span><span class="op">]</span><span class="op">]</span> <span class="co"># train data</span></span>
+<span><span class="va">data_test</span> <span class="op">&lt;-</span> <span class="va">split_tmp</span><span class="op">[[</span><span class="fl">2</span><span class="op">]</span><span class="op">]</span> <span class="co"># test data</span></span>
+<span><span class="va">data_split</span> <span class="op">&lt;-</span> <span class="va">split_tmp</span><span class="op">[[</span><span class="fl">3</span><span class="op">]</span><span class="op">]</span> <span class="co"># whole data with split information</span></span>
+<span></span>
+<span><span class="co"># Define preprocessing recipe for cross validation</span></span>
+<span></span>
+<span><span class="va">rec</span> <span class="op">&lt;-</span> <span class="fu">stove</span><span class="fu">::</span><span class="fu"><a href="reference/prepForCV.html">prepForCV</a></span><span class="op">(</span>data <span class="op">=</span> <span class="va">data_train</span>,</span>
+<span>                        formula <span class="op">=</span> <span class="va">formula</span>,</span>
+<span>                        imputation <span class="op">=</span> <span class="cn">T</span>,</span>
+<span>                        normalization <span class="op">=</span> <span class="cn">T</span>,</span>
+<span>                        seed <span class="op">=</span> <span class="va">seed</span></span>
+<span>                        <span class="op">)</span></span></code></pre></div>
 </div>
-</div>
-<div class="section level1">
-<h1 id="modeling-using-logistic-regression-algorithm">Modeling using logistic regression algorithm<a class="anchor" aria-label="anchor" href="#modeling-using-logistic-regression-algorithm"></a>
-</h1>
-<p>finalized &lt;- stove::logisticRegression( algo = algo, engine = engine, mode = mode, trainingData = data_train, splitedData = data_split, formula = formula, rec = rec, v = v, gridNum = gridNum, iter = iter, metric = metric, seed = seed ) ```</p>
+<div class="section level3">
+<h3 id="id_3-modeling">3. Modeling<a class="anchor" aria-label="anchor" href="#id_3-modeling"></a>
+</h3>
+<div class="sourceCode" id="cb4"><pre class="downlit sourceCode r">
+<code class="sourceCode R"><span><span class="co"># User input</span></span>
+<span></span>
+<span><span class="va">mode</span> <span class="op">&lt;-</span> <span class="st">"classification"</span></span>
+<span><span class="va">algo</span> <span class="op">&lt;-</span> <span class="st">"logisticRegression"</span> <span class="co"># Custom name</span></span>
+<span><span class="va">engine</span> <span class="op">&lt;-</span> <span class="st">"glmnet"</span> <span class="co"># glmnet (default)</span></span>
+<span><span class="va">v</span> <span class="op">&lt;-</span> <span class="fl">2</span></span>
+<span><span class="va">metric</span> <span class="op">&lt;-</span> <span class="st">"roc_auc"</span> <span class="co"># roc_auc (default), accuracy</span></span>
+<span><span class="va">gridNum</span> <span class="op">&lt;-</span> <span class="fl">5</span></span>
+<span><span class="va">iter</span> <span class="op">&lt;-</span> <span class="fl">10</span></span>
+<span><span class="va">seed</span> <span class="op">&lt;-</span> <span class="fl">1234</span></span>
+<span></span>
+<span><span class="co"># Modeling using logistic regression algorithm</span></span>
+<span></span>
+<span><span class="va">finalized</span> <span class="op">&lt;-</span> <span class="fu">stove</span><span class="fu">::</span><span class="fu"><a href="reference/logisticRegression.html">logisticRegression</a></span><span class="op">(</span></span>
+<span>  algo <span class="op">=</span> <span class="va">algo</span>,</span>
+<span>  engine <span class="op">=</span> <span class="va">engine</span>,</span>
+<span>  mode <span class="op">=</span> <span class="va">mode</span>,</span>
+<span>  trainingData <span class="op">=</span> <span class="va">data_train</span>,</span>
+<span>  splitedData <span class="op">=</span> <span class="va">data_split</span>,</span>
+<span>  formula <span class="op">=</span> <span class="va">formula</span>,</span>
+<span>  rec <span class="op">=</span> <span class="va">rec</span>,</span>
+<span>  v <span class="op">=</span> <span class="va">v</span>,</span>
+<span>  gridNum <span class="op">=</span> <span class="va">gridNum</span>,</span>
+<span>  iter <span class="op">=</span> <span class="va">iter</span>,</span>
+<span>  metric <span class="op">=</span> <span class="va">metric</span>,</span>
+<span>  seed <span class="op">=</span> <span class="va">seed</span></span>
+<span><span class="op">)</span></span></code></pre></div>
 <p>You can compare several models’ performance and visualize them.<br>
 These <a href="https://github.com/statgarten/stove/tree/main/quarto-doc" class="external-link">documents</a> contain the example codes for modeling workflow using stove.</p>
+</div>
+</div>
 <div class="section level2">
 <h2 id="white_check_mark-recommendation">
 <span class="emoji" data-emoji="white_check_mark">✅</span> Recommendation<a class="anchor" aria-label="anchor" href="#white_check_mark-recommendation"></a>
@@ -308,7 +342,6 @@ <h2 id="clipboard-dependency">
 </details>
 </div>
 </div>
-
   </main><aside class="col-md-3"><div class="links">
 <h2 data-toc-skip>Links</h2>
 <ul class="list-unstyled">
diff --git a/docs/pkgdown.yml b/docs/pkgdown.yml
index eb8b77a..4d480a8 100644
--- a/docs/pkgdown.yml
+++ b/docs/pkgdown.yml
@@ -2,5 +2,5 @@ pandoc: 3.1.6.1
 pkgdown: 2.0.7
 pkgdown_sha: ~
 articles: {}
-last_built: 2023-11-15T06:22Z
+last_built: 2023-11-15T06:23Z
 
diff --git a/docs/search.json b/docs/search.json
index e8e2fde..c34e909 100644
--- a/docs/search.json
+++ b/docs/search.json
@@ -1 +1 @@
-[{"path":"/LICENSE.html","id":null,"dir":"","previous_headings":"","what":"MIT License","title":"MIT License","text":"Copyright (c) 2023 stove authors Permission hereby granted, free charge, person obtaining copy software associated documentation files (“Software”), deal Software without restriction, including without limitation rights use, copy, modify, merge, publish, distribute, sublicense, /sell copies Software, permit persons Software furnished , subject following conditions: copyright notice permission notice shall included copies substantial portions Software. SOFTWARE PROVIDED “”, WITHOUT WARRANTY KIND, EXPRESS IMPLIED, INCLUDING LIMITED WARRANTIES MERCHANTABILITY, FITNESS PARTICULAR PURPOSE NONINFRINGEMENT. EVENT SHALL AUTHORS COPYRIGHT HOLDERS LIABLE CLAIM, DAMAGES LIABILITY, WHETHER ACTION CONTRACT, TORT OTHERWISE, ARISING , CONNECTION SOFTWARE USE DEALINGS SOFTWARE.","code":""},{"path":"/authors.html","id":null,"dir":"","previous_headings":"","what":"Authors","title":"Authors and Citation","text":"Yeonchan Seong. Author, maintainer.","code":""},{"path":"/authors.html","id":"citation","dir":"","previous_headings":"","what":"Citation","title":"Authors and Citation","text":"Seong Y (2023). stove: Stove. R package version 1.1, https://github.com/statgarten/stove.","code":"@Manual{,   title = {stove: Stove},   author = {Yeonchan Seong},   year = {2023},   note = {R package version 1.1},   url = {https://github.com/statgarten/stove}, }"},{"path":"/index.html","id":"yellow_heart-stove-","dir":"","previous_headings":"","what":"Stove","title":"Stove","text":"stove package provides functions ML modeling. Packages Tidymodels used, configured easy ML beginners use. 
Although belongs statgarten whose packages incorporated shiny app, stove package also can used console.","code":""},{"path":"/index.html","id":"wrench-install","dir":"","previous_headings":"","what":"🔧 Install","title":"Stove","text":"","code":"# install.packages(\"devtools\") devtools::install_github(\"statgarten/stove\")"},{"path":[]},{"path":"/index.html","id":"id_1-sample-data-import","dir":"","previous_headings":"Example Code","what":"1. Sample Data Import","title":"Stove","text":"```{r} # remotes::install_github(“statgarten/datatoys”) library(stove) library(datatoys) library(dplyr) set.seed(1234) cleaned_data <- datatoys::bloodTest cleaned_data <- cleaned_data %>% mutate_at(vars(SEX, ANE, IHD, STK), factor) %>% mutate(TG = ifelse(TG < 150, 0, 1)) %>% mutate_at(vars(TG), factor) %>% group_by(TG) %>% sample_n(500) # TG(0):TG(1) = 500:500","code":"### 2. Data split and Define preprocessing  ```{r} target_var <- \"TG\" train_set_ratio <- 0.7 seed <- 1234 formula <- paste0(target_var, \" ~ .\")  # Split data  split_tmp <- stove::trainTestSplit(data = cleaned_data,                                    target = target_var,                                    prop = train_set_ratio,                                    seed = seed                                    )  data_train <- split_tmp[[1]] # train data data_test <- split_tmp[[2]] # test data data_split <- split_tmp[[3]] # whole data with split information  # Define preprocessing recipe for cross validation  rec <- stove::prepForCV(data = data_train,                         formula = formula,                         imputation = T,                         normalization = T,                         seed = seed                         )"},{"path":"/index.html","id":"id_3-modeling","dir":"","previous_headings":"Example Code","what":"3. 
Modeling","title":"Stove","text":"```{r} # User input mode <- “classification” algo <- “logisticRegression” # Custom name engine <- “glmnet” # glmnet (default) v <- 2 metric <- “roc_auc” # roc_auc (default), accuracy gridNum <- 5 iter <- 10 seed <- 1234","code":""},{"path":"/index.html","id":"modeling-using-logistic-regression-algorithm","dir":"","previous_headings":"","what":"Modeling using logistic regression algorithm","title":"Stove","text":"finalized <- stove::logisticRegression( algo = algo, engine = engine, mode = mode, trainingData = data_train, splitedData = data_split, formula = formula, rec = rec, v = v, gridNum = gridNum, iter = iter, metric = metric, seed = seed ) ``` can compare several models’ performance visualize . documents contain example codes modeling workflow using stove.","code":""},{"path":"/index.html","id":"white_check_mark-recommendation","dir":"","previous_headings":"","what":"✅ Recommendation","title":"Stove","text":"training ML model, amount data required depends complexity task want solve complexity learning algorithm. ‘stove’ support training process without cross-validation. 
recommend training model data least 1,000 rows.","code":""},{"path":"/index.html","id":"blush-authors","dir":"","previous_headings":"","what":"😊 Authors","title":"Stove","text":"Yeonchan Seong @ycseong07","code":""},{"path":"/index.html","id":"memo-license","dir":"","previous_headings":"","what":"📝 License","title":"Stove","text":"Copyright ©️ 2022 Yeonchan Seong project MIT licensed","code":""},{"path":"/index.html","id":"clipboard-dependency","dir":"","previous_headings":"","what":"📋 Dependency","title":"Stove","text":"assertthat - 0.2.1 base64enc - 0.1-3 bayesplot - 1.10.0 boot - 1.3-28.1 C50 - 0.1.7 callr - 3.7.3 class - 7.3-20 cli - 3.6.0 cluster - 2.1.4 codetools - 0.2-18 colorspace - 2.0-3 colourpicker - 1.2.0 combinat - 0.0-8 cowplot - 1.1.1 crayon - 1.5.2 crosstalk - 1.2.0 Cubist - 0.4.1 data.table - 1.14.6 DBI - 1.1.3 dials - 1.1.0 DiceDesign - 1.9 digest - 0.6.31 discrim - 1.0.0 dplyr - 1.0.10 DT - 0.26 dygraphs - 1.1.1.6 ellipsis - 0.3.2 factoextra - 1.0.7 fansi - 1.0.3 fastmap - 1.1.0 forcats - 0.5.2 foreach - 1.5.2 Formula - 1.2-4 furrr - 0.3.1 future - 1.30.0 future.apply - 1.10.0 generics - 0.1.3 ggplot2 - 3.4.0 ggrepel - 0.9.2 glmnet - 4.1-6 globals - 0.16.2 glue - 1.6.2 gower - 1.0.1 GPfit - 1.0-8 gridExtra - 2.3 gtable - 0.3.1 gtools - 3.9.4 hardhat - 1.2.0 haven - 2.5.1 highr - 0.1 hms - 1.1.2 htmltools - 0.5.4 htmlwidgets - 1.6.1 httpuv - 1.6.7 igraph - 1.3.5 inline - 0.3.19 inum - 1.0-4 ipred - 0.9-13 iterators - 1.0.14 kknn - 1.3.1 klaR - 1.7-1 labelled - 2.10.0 later - 1.3.0 lattice - 0.20-45 lava - 1.7.1 lhs - 1.1.6 libcoin - 1.0-9 lifecycle - 1.0.3 listenv - 0.9.0 lme4 - 1.1-31 loo - 2.5.1 lubridate - 1.9.0 magrittr - 2.0.3 markdown - 1.4 MASS - 7.3-58.1 Matrix - 1.5-3 matrixStats - 0.63.0 mime - 0.12 miniUI - 0.1.1.1 minqa - 1.2.5 munsell - 0.5.0 mvtnorm - 1.1-3 naivebayes - 0.9.7 nlme - 3.1-161 nloptr - 2.0.3 nnet - 7.3-18 parallelly - 1.33.0 parsnip - 1.0.3 partykit - 1.2-16 pillar - 1.8.1 pkgbuild - 1.4.0 pkgconfig - 2.0.3 plyr - 1.8.8 
prettyunits - 1.1.1 processx - 3.8.0 prodlim - 2019.11.13 promises - 1.2.0.1 ps - 1.7.0 purrr - 0.3.4 questionr - 0.7.7 R6 - 2.5.1 randomForest - 4.7-1.1 ranger - 0.14.1 RColorBrewer - 1.1-3 Rcpp - 1.0.9 RcppParallel - 5.1.6 recipes - 1.0.3 reshape2 - 1.4.4 rlang - rpart - 4.1.19 rsample - 1.1.1 rstan - 2.21.7 rstanarm - 2.21.3 rstantools - 2.2.0 rstudioapi - 0.14 scales - 1.2.1 sessioninfo - 1.2.2 shape - 1.4.6 shiny - 1.7.4 shinyjs - 2.1.0 shinystan - 2.6.0 shinythemes - 1.2.0 StanHeaders - 2.21.0-7 stringi - 1.7.8 stringr - 1.5.0 survival - 3.5-0 threejs - 0.3.3 tibble - 3.1.8 tidyr - 1.2.1 tidyselect - 1.2.0 timechange - 0.1.1 timeDate - 4022.108 treesnip - 0.1.0.9001 tune - 1.0.1 utf8 - 1.2.2 vctrs - 0.5.1 withr - 2.5.0 workflows - 1.1.2 xtable - 1.8-4 xts - 0.12.2 yardstick - 1.1.0 zoo - 1.8-11","code":""},{"path":"/reference/KNN.html","id":null,"dir":"Reference","previous_headings":"","what":"K-Nearest Neighbors — KNN","title":"K-Nearest Neighbors — KNN","text":"K-Nearest Neighbors","code":""},{"path":"/reference/KNN.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"K-Nearest Neighbors — KNN","text":"","code":"KNN(   algo = \"KNN\",   engine = \"kknn\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = NULL,   seed = 1234 )"},{"path":"/reference/KNN.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"K-Nearest Neighbors — KNN","text":"algo name algorithm can customized user (default: \"KNN\"). engine name software used fit model (\"kknn\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. 
v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/KNN.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"K-Nearest Neighbors — KNN","text":"function training user-defined K-Nearest Neighbors model. Hyperparameters tuning: neighbors","code":""},{"path":"/reference/MLP.html","id":null,"dir":"Reference","previous_headings":"","what":"neural network — MLP","title":"neural network — MLP","text":"neural network","code":""},{"path":"/reference/MLP.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"neural network — MLP","text":"","code":"MLP(   algo = \"MLP\",   engine = \"nnet\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = NULL,   seed = 1234 )"},{"path":"/reference/MLP.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"neural network — MLP","text":"algo name algorithm can customized user (default: \"MLP\"). engine name software used fit model (\"nnet\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). 
seed Seed reproducible results.","code":""},{"path":"/reference/MLP.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"neural network — MLP","text":"function training user-defined MLP model. Hyperparameters tuning: hidden_units, penalty, epochs","code":""},{"path":"/reference/SVMLinear.html","id":null,"dir":"Reference","previous_headings":"","what":"SVMLinear — SVMLinear","title":"SVMLinear — SVMLinear","text":"SVMLinear","code":""},{"path":"/reference/SVMLinear.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"SVMLinear — SVMLinear","text":"","code":"SVMLinear(   algo = \"SVMLinear\",   engine = \"kernlab\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 15,   metric = NULL,   seed = 1234 )"},{"path":"/reference/SVMLinear.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"SVMLinear — SVMLinear","text":"algo name algorithm can customized user (default: \"SVMLinear\"). engine name software used fit model (\"kernlab\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). 
seed Seed reproducible results.","code":""},{"path":"/reference/SVMLinear.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"SVMLinear — SVMLinear","text":"function training user-defined SVM Linear model.","code":""},{"path":"/reference/SVMPoly.html","id":null,"dir":"Reference","previous_headings":"","what":"SVMPoly — SVMPoly","title":"SVMPoly — SVMPoly","text":"SVMPoly","code":""},{"path":"/reference/SVMPoly.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"SVMPoly — SVMPoly","text":"","code":"SVMPoly(   algo = \"SVMPoly\",   engine = \"kernlab\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 15,   metric = NULL,   seed = 1234 )"},{"path":"/reference/SVMPoly.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"SVMPoly — SVMPoly","text":"algo name algorithm can customized user (default: \"SVMPoly\"). engine name software used fit model (\"kernlab\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). 
seed Seed reproducible results.","code":""},{"path":"/reference/SVMPoly.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"SVMPoly — SVMPoly","text":"function training user-defined SVM Poly model.","code":""},{"path":"/reference/SVMRbf.html","id":null,"dir":"Reference","previous_headings":"","what":"SVMRbf — SVMRbf","title":"SVMRbf — SVMRbf","text":"SVMRbf","code":""},{"path":"/reference/SVMRbf.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"SVMRbf — SVMRbf","text":"","code":"SVMRbf(   algo = \"SVMRbf\",   engine = \"kernlab\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 15,   metric = NULL,   seed = 1234 )"},{"path":"/reference/SVMRbf.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"SVMRbf — SVMRbf","text":"algo name algorithm can customized user (default: \"SVMRbf\"). engine name software used fit model (\"kernlab\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). 
seed Seed reproducible results.","code":""},{"path":"/reference/SVMRbf.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"SVMRbf — SVMRbf","text":"function training user-defined SVM Rbf model.","code":""},{"path":"/reference/bayesOptCV.html","id":null,"dir":"Reference","previous_headings":"","what":"Bayesian optimization with cross validation — bayesOptCV","title":"Bayesian optimization with cross validation — bayesOptCV","text":"Bayesian optimization cross validation","code":""},{"path":"/reference/bayesOptCV.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Bayesian optimization with cross validation — bayesOptCV","text":"","code":"bayesOptCV(   rec = NULL,   model = NULL,   v = NULL,   trainingData = NULL,   gridNum = NULL,   iter = NULL,   seed = NULL )"},{"path":"/reference/bayesOptCV.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Bayesian optimization with cross validation — bayesOptCV","text":"rec recipe object including local preprocessing. model model object including list hyperparameters, engine mode. v Perform cross-validation dividing training data v folds. trainingData training data. gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. 
seed Seed reproducible results.","code":""},{"path":"/reference/bayesOptCV.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Bayesian optimization with cross validation — bayesOptCV","text":"Optimize hyperparameters model Cross Validation Bayesian optimization.","code":""},{"path":"/reference/clusteringVis.html","id":null,"dir":"Reference","previous_headings":"","what":"clusteringVis — clusteringVis","title":"clusteringVis — clusteringVis","text":"clusteringVis","code":""},{"path":"/reference/clusteringVis.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"clusteringVis — clusteringVis","text":"","code":"clusteringVis(   data = NULL,   model = NULL,   maxK = \"15\",   nBoot = \"100\",   selectOptimal = \"silhouette\",   seedNum = \"6471\" )"},{"path":"/reference/clusteringVis.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"clusteringVis — clusteringVis","text":"data data model model maxK maxK nStart nStart","code":""},{"path":"/reference/clusteringVis.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"clusteringVis — clusteringVis","text":"Deprecated","code":""},{"path":"/reference/decisionTree.html","id":null,"dir":"Reference","previous_headings":"","what":"Decision Tree — decisionTree","title":"Decision Tree — decisionTree","text":"Decision Tree","code":""},{"path":"/reference/decisionTree.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Decision Tree — decisionTree","text":"","code":"decisionTree(   algo = \"Decision Tree\",   engine = \"rpart\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = NULL,   seed = 1234 )"},{"path":"/reference/decisionTree.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Decision Tree — 
decisionTree","text":"algo name algorithm can customized user (default: \"Decision Tree\"). engine name software used fit model (\"rpart\" (default), \"C50\", \"partykit\"). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/decisionTree.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Decision Tree — decisionTree","text":"function training user-defined Decision Tree model. 
Hyperparameters tuning: tree_depth, min_n, cost_complexity","code":""},{"path":"/reference/evalMetricsR.html","id":null,"dir":"Reference","previous_headings":"","what":"Evaluation metrics for Regression — evalMetricsR","title":"Evaluation metrics for Regression — evalMetricsR","text":"Evaluation metrics Regression","code":""},{"path":"/reference/evalMetricsR.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Evaluation metrics for Regression — evalMetricsR","text":"","code":"evalMetricsR(modelsList, targetVar)"},{"path":"/reference/evalMetricsR.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Evaluation metrics for Regression — evalMetricsR","text":"modelsList ML 모델 리스트 targetVar 타겟 변수","code":""},{"path":"/reference/evalMetricsR.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Evaluation metrics for Regression — evalMetricsR","text":"ML 모델 리스트로부터 Regression 모델들에 대한 Evaluation metrics를 생성합니다.","code":""},{"path":"/reference/fitBestModel.html","id":null,"dir":"Reference","previous_headings":"","what":"fitting in best model — fitBestModel","title":"fitting in best model — fitBestModel","text":"fitting best model","code":""},{"path":"/reference/fitBestModel.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"fitting in best model — fitBestModel","text":"","code":"fitBestModel(   optResult,   metric,   model,   formula,   trainingData,   splitedData,   modelName )"},{"path":"/reference/fitBestModel.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"fitting in best model — fitBestModel","text":"optResult result object bayesOptCV metric Baseline metric evaluating model performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\") model model object including list hyperparameters, engine mode. 
formula formula modeling trainingData training data. splitedData whole dataset including information fold modelName name model defined algorithm engine selected user","code":""},{"path":"/reference/fitBestModel.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"fitting in best model — fitBestModel","text":"Get bayesOptCV function's return value fit model.","code":""},{"path":"/reference/gridSearchCV.html","id":null,"dir":"Reference","previous_headings":"","what":"Grid search with cross validation — gridSearchCV","title":"Grid search with cross validation — gridSearchCV","text":"Grid search cross validation","code":""},{"path":"/reference/gridSearchCV.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Grid search with cross validation — gridSearchCV","text":"","code":"gridSearchCV(   rec = NULL,   model = NULL,   v = NULL,   trainingData = NULL,   parameterGrid = NULL,   seed = NULL )"},{"path":"/reference/gridSearchCV.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Grid search with cross validation — gridSearchCV","text":"rec 데이터, 전처리 정보를 포함한 recipe object model hyperparameters, ngine, mode 정보가 포함된 model object v v-fold cross validation을 진행 (default: 5, 각 fold 별로 30개 이상의 observations가 있어야 유효한 모델링 결과를 얻을 수 있습니다.) 
trainingData 훈련데이터 셋 seed seed값 설정 parameter_grid grid search를 수행할 때 각 hyperparameter의 값을 담은 object","code":""},{"path":"/reference/gridSearchCV.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Grid search with cross validation — gridSearchCV","text":"하이퍼파라미터를 탐색하는 Grid Search와 데이터 셋을 나누어 평가하는 cross validation을 함께 수행합니다.","code":""},{"path":"/reference/kMeansClustering.html","id":null,"dir":"Reference","previous_headings":"","what":"K means clustering — kMeansClustering","title":"K means clustering — kMeansClustering","text":"K means clustering","code":""},{"path":"/reference/kMeansClustering.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"K means clustering — kMeansClustering","text":"","code":"kMeansClustering(   data,   maxK = 15,   nStart = 25,   iterMax = 10,   nBoot = 100,   algorithm = \"Hartigan-Wong\",   selectOptimal = \"silhouette\",   seedNum = 6471 )"},{"path":"/reference/kMeansClustering.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"K means clustering — kMeansClustering","text":"data 전처리가 완료된 데이터 maxK 클러스터링 수행 시 군집을 2, 3, ..., maxK개로 분할 (default: 15) iterMax 반복계산을 수행할 최대 횟수 (default: 10) nBoot gap statictic을 사용해 클러스터링을 수행할 때 Monte Carlo (bootstrap) 샘플의 개수 (selectOptimal == \"gap_stat\" 일 경우에만 지정, default: 100) algorithm K means를 수행할 알고리즘 선택 (\"Hartigan-Wong\" (default), \"Lloyd\", \"Forgy\", \"MacQueen\") selectOptimal 최적의 K값을 선정할 때 사용할 method 선택 (\"silhouette\" (default), \"gap_stat\") seedNum seed값 설정 nstart 랜덤 샘플에 대해 초기 클러스터링을 nstart번 시행 (default: 25)","code":""},{"path":"/reference/kMeansClustering.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"K means clustering — kMeansClustering","text":"function K means clustering. 
parameters tuning: maxK, nstart","code":""},{"path":"/reference/lightGbm.html","id":null,"dir":"Reference","previous_headings":"","what":"Light GBM — lightGbm","title":"Light GBM — lightGbm","text":"Light GBM","code":""},{"path":"/reference/lightGbm.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Light GBM — lightGbm","text":"","code":"lightGbm(   algo = \"lightGBM\",   engine = \"lightgbm\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 15,   metric = NULL,   seed = 1234 )"},{"path":"/reference/lightGbm.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Light GBM — lightGbm","text":"algo name algorithm can customized user. (default: \"lightGBM\"). engine name software used fit model(\"lightgbm\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/lightGbm.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Light GBM — lightGbm","text":"function training user-defined Light GBM model. 
Hyperparameters tuning: tree_depth, trees, learn_rate, mtry, min_n, loss_reduction","code":""},{"path":"/reference/linearRegression.html","id":null,"dir":"Reference","previous_headings":"","what":"Linear Regression — linearRegression","title":"Linear Regression — linearRegression","text":"Linear Regression","code":""},{"path":"/reference/linearRegression.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Linear Regression — linearRegression","text":"","code":"linearRegression(   algo = \"Linear Regression\",   engine = \"glmnet\",   mode = \"regression\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = \"rmse\",   seed = 1234 )"},{"path":"/reference/linearRegression.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Linear Regression — linearRegression","text":"algo name algorithm can customized user (default: \"Linear Regression\"). engine name software used fit model (\"glmnet\" (default), \"lm\", \"glm\", \"stan\"). mode model type. \"classification\" \"regression\" (\"regression\" (default)). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/linearRegression.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Linear Regression — linearRegression","text":"function training user-defined Linear Regression model. 
Hyperparameters tuning: penalty, mixture","code":""},{"path":"/reference/logisticRegression.html","id":null,"dir":"Reference","previous_headings":"","what":"Logistic Regression — logisticRegression","title":"Logistic Regression — logisticRegression","text":"function training user-defined Logistic regression model. function supports: binary classification","code":""},{"path":"/reference/logisticRegression.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Logistic Regression — logisticRegression","text":"","code":"logisticRegression(   algo = \"Logistic Regression\",   engine = \"glmnet\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = \"roc_auc\",   seed = 1234 )"},{"path":"/reference/logisticRegression.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Logistic Regression — logisticRegression","text":"algo name algorithm can customized user (default: \"Logistic Regression\"). engine name software used fit model (Option: \"glmnet\" (default)). mode model type. \"classification\" \"regression\" (Option: \"classification\" (default)). trainingData training data. splitedData whole dataset including information fold formula formula modeling rec Recipe object containing preprocessing information cross-validation v Applying v-fold cross validation modeling process (default: 5) gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). 
seed Seed reproducible results.","code":""},{"path":"/reference/logisticRegression.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Logistic Regression — logisticRegression","text":"Hyperparameters tuning: penalty, mixture","code":""},{"path":"/reference/multinomialRegression.html","id":null,"dir":"Reference","previous_headings":"","what":"Multinomial Regression — multinomialRegression","title":"Multinomial Regression — multinomialRegression","text":"function training user-defined Multinomial regression model. function supports: multinomial classification","code":""},{"path":"/reference/multinomialRegression.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Multinomial Regression — multinomialRegression","text":"","code":"multinomialRegression(   algo = \"Multinomial Regression\",   engine = \"glmnet\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = \"roc_auc\",   seed = 1234 )"},{"path":"/reference/multinomialRegression.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Multinomial Regression — multinomialRegression","text":"algo name algorithm can customized user (default: \"Multinomial Regression\"). engine name software used fit model (Option: \"glmnet\" (default)). mode model type. \"classification\" \"regression\" (Option: \"classification\" (default)). trainingData data frame training. splitedData data frame including metadata split. formula formula modeling. rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). 
seed Seed reproducible results.","code":""},{"path":"/reference/multinomialRegression.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Multinomial Regression — multinomialRegression","text":"Hyperparameters tuning: penalty, mixture","code":""},{"path":"/reference/naiveBayes.html","id":null,"dir":"Reference","previous_headings":"","what":"Naive Bayes — naiveBayes","title":"Naive Bayes — naiveBayes","text":"Naive Bayes","code":""},{"path":"/reference/naiveBayes.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Naive Bayes — naiveBayes","text":"","code":"naiveBayes(   algo = \"Naive Bayes\",   engine = \"klaR\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = NULL,   seed = 1234 )"},{"path":"/reference/naiveBayes.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Naive Bayes — naiveBayes","text":"algo name algorithm can customized user (default: \"Naive Bayes\"). engine name software used fit model (\"klaR\" (default), naivebayes). mode model type. \"classification\" \"regression\" (\"classification\" (default)). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/naiveBayes.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Naive Bayes — naiveBayes","text":"function training user-defined Naive Bayes model. 
Hyperparameters tuning: smoothness, Laplace","code":""},{"path":"/reference/pipe.html","id":null,"dir":"Reference","previous_headings":"","what":"AUC-ROC Curve — %>%","title":"AUC-ROC Curve — %>%","text":"AUC-ROC Curve Confusion matrix Regression plot Evaluation metrics Classification","code":""},{"path":"/reference/pipe.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"AUC-ROC Curve — %>%","text":"","code":"rocCurve(modelsList, targetVar)  confusionMatrix(modelName, modelsList, targetVar)  regressionPlot(modelName, modelsList, targetVar)  evalMetricsC(modelsList, targetVar)"},{"path":"/reference/pipe.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"AUC-ROC Curve — %>%","text":"modelsList ML 모델 리스트 targetVar 타겟 변수 modelName 모델명","code":""},{"path":"/reference/pipe.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"AUC-ROC Curve — %>%","text":"ML 모델 리스트로부터 AUC-ROC Curve를 생성합니다. ML 모델 리스트 내 특정 모델에 대해 Confusion matrix를 생성합니다. ML 모델 리스트 내 특정 모델에 대해 Regression plot를 생성합니다. 
ML 모델 리스트로부터 Classification 모델들에 대한 Evaluation metrics를 생성합니다.","code":""},{"path":"/reference/plotRmseComparison.html","id":null,"dir":"Reference","previous_headings":"","what":"rmsePlot — plotRmseComparison","title":"rmsePlot — plotRmseComparison","text":"rmsePlot","code":""},{"path":"/reference/plotRmseComparison.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"rmsePlot — plotRmseComparison","text":"","code":"plotRmseComparison(tunedResultsList, v = v, iter = iter)"},{"path":"/reference/plotRmseComparison.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"rmsePlot — plotRmseComparison","text":"rmsePlot","code":""},{"path":"/reference/prepForCV.html","id":null,"dir":"Reference","previous_headings":"","what":"Preprocessing for cross validation — prepForCV","title":"Preprocessing for cross validation — prepForCV","text":"Preprocessing cross validation","code":""},{"path":"/reference/prepForCV.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Preprocessing for cross validation — prepForCV","text":"","code":"prepForCV(   data = NULL,   formula = NULL,   imputation = FALSE,   normalization = FALSE,   nominalImputationType = \"mode\",   numericImputationType = \"mean\",   normalizationType = \"range\",   seed = \"4814\" )"},{"path":"/reference/prepForCV.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Preprocessing for cross validation — prepForCV","text":"data Training dataset apply local preprocessing recipe. formula formula modeling imputation \"imputation = TRUE\", model trained using cross-validation imputation. 
normalization \"normalization = TRUE\", model trained using cross-validation normalization nominalImputationType Imputation method nominal variable (Option: mode(default), bag, knn) numericImputationType Imputation method numeric variable (Option: mean(default), bag, knn, linear, lower, median, roll) normalizationType Normalization method (Option: range(default), center, normalization, scale) seed seed","code":""},{"path":"/reference/prepForCV.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Preprocessing for cross validation — prepForCV","text":"Define local preprocessing method applied training data fold training data divided several folds.","code":""},{"path":"/reference/randomForest.html","id":null,"dir":"Reference","previous_headings":"","what":"Random Forest — randomForest","title":"Random Forest — randomForest","text":"Random Forest","code":""},{"path":"/reference/randomForest.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Random Forest — randomForest","text":"","code":"randomForest(   algo = \"Random Forest\",   engine = \"ranger\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = NULL,   seed = 1234 )"},{"path":"/reference/randomForest.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Random Forest — randomForest","text":"algo name algorithm can customized user (default: \"Random Forest\"). engine name software used fit model (\"rpart\" (default), \"randomForest\", \"partykit\"). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). 
gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/randomForest.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Random Forest — randomForest","text":"function training user-defined Random Forest model. Hyperparameters tuning: trees, min_n, mtry","code":""},{"path":"/reference/trainTestSplit.html","id":null,"dir":"Reference","previous_headings":"","what":"Train-Test Split — trainTestSplit","title":"Train-Test Split — trainTestSplit","text":"Train-Test Split","code":""},{"path":"/reference/trainTestSplit.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Train-Test Split — trainTestSplit","text":"","code":"trainTestSplit(data = NULL, target = NULL, prop, seed = \"4814\")"},{"path":"/reference/trainTestSplit.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Train-Test Split — trainTestSplit","text":"data Full data set global preprocess completed. target target variable. prop Proportion total data used training data. seed Seed reproducible results.","code":""},{"path":"/reference/trainTestSplit.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Train-Test Split — trainTestSplit","text":"Separate entire data training set test set.","code":""},{"path":"/reference/xgBoost.html","id":null,"dir":"Reference","previous_headings":"","what":"XGBoost — xgBoost","title":"XGBoost — xgBoost","text":"function training user-defined XGBoost model. 
Hyperparameters tuning: tree_depth, trees,learn_rate, mtry, min_n, loss_reduction, sample_size","code":""},{"path":"/reference/xgBoost.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"XGBoost — xgBoost","text":"","code":"xgBoost(   algo = \"XGBoost\",   engine = \"xgboost\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = NULL,   seed = 1234 )"},{"path":"/reference/xgBoost.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"XGBoost — xgBoost","text":"algo name algorithm can customized user (default: \"XGBoost\"). engine name software used fit model (\"xgboost\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/xgBoost.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"XGBoost — xgBoost","text":"XGBoost","code":""}]
+[{"path":"/LICENSE.html","id":null,"dir":"","previous_headings":"","what":"MIT License","title":"MIT License","text":"Copyright (c) 2023 stove authors Permission hereby granted, free charge, person obtaining copy software associated documentation files (“Software”), deal Software without restriction, including without limitation rights use, copy, modify, merge, publish, distribute, sublicense, /sell copies Software, permit persons Software furnished , subject following conditions: copyright notice permission notice shall included copies substantial portions Software. SOFTWARE PROVIDED “”, WITHOUT WARRANTY KIND, EXPRESS IMPLIED, INCLUDING LIMITED WARRANTIES MERCHANTABILITY, FITNESS PARTICULAR PURPOSE NONINFRINGEMENT. EVENT SHALL AUTHORS COPYRIGHT HOLDERS LIABLE CLAIM, DAMAGES LIABILITY, WHETHER ACTION CONTRACT, TORT OTHERWISE, ARISING , CONNECTION SOFTWARE USE DEALINGS SOFTWARE.","code":""},{"path":"/authors.html","id":null,"dir":"","previous_headings":"","what":"Authors","title":"Authors and Citation","text":"Yeonchan Seong. Author, maintainer.","code":""},{"path":"/authors.html","id":"citation","dir":"","previous_headings":"","what":"Citation","title":"Authors and Citation","text":"Seong Y (2023). stove: Stove. R package version 1.1, https://github.com/statgarten/stove.","code":"@Manual{,   title = {stove: Stove},   author = {Yeonchan Seong},   year = {2023},   note = {R package version 1.1},   url = {https://github.com/statgarten/stove}, }"},{"path":"/index.html","id":"yellow_heart-stove-","dir":"","previous_headings":"","what":"Stove","title":"Stove","text":"stove package provides functions ML modeling. Packages Tidymodels used, configured easy ML beginners use. 
Although belongs statgarten whose packages incorporated shiny app, stove package also can used console.","code":""},{"path":"/index.html","id":"wrench-install","dir":"","previous_headings":"","what":"🔧 Install","title":"Stove","text":"","code":"# install.packages(\"devtools\") devtools::install_github(\"statgarten/stove\")"},{"path":[]},{"path":"/index.html","id":"id_1-sample-data-import","dir":"","previous_headings":"Example Code","what":"1. Sample Data Import","title":"Stove","text":"","code":"# remotes::install_github(\"statgarten/datatoys\") library(stove) library(datatoys) library(dplyr)  set.seed(1234)  cleaned_data <- datatoys::bloodTest  cleaned_data <- cleaned_data %>%   mutate_at(vars(SEX, ANE, IHD, STK), factor) %>%   mutate(TG = ifelse(TG < 150, 0, 1)) %>%   mutate_at(vars(TG), factor) %>%   group_by(TG) %>%   sample_n(500) # TG(0):TG(1) = 500:500"},{"path":"/index.html","id":"id_2-data-split-and-define-preprocessing","dir":"","previous_headings":"Example Code","what":"2. Data split and Define preprocessing","title":"Stove","text":"","code":"target_var <- \"TG\" train_set_ratio <- 0.7 seed <- 1234 formula <- paste0(target_var, \" ~ .\")  # Split data  split_tmp <- stove::trainTestSplit(data = cleaned_data,                                    target = target_var,                                    prop = train_set_ratio,                                    seed = seed                                    )  data_train <- split_tmp[[1]] # train data data_test <- split_tmp[[2]] # test data data_split <- split_tmp[[3]] # whole data with split information  # Define preprocessing recipe for cross validation  rec <- stove::prepForCV(data = data_train,                         formula = formula,                         imputation = T,                         normalization = T,                         seed = seed                         )"},{"path":"/index.html","id":"id_3-modeling","dir":"","previous_headings":"Example Code","what":"3. 
Modeling","title":"Stove","text":"can compare several models’ performance visualize . documents contain example codes modeling workflow using stove.","code":"# User input  mode <- \"classification\" algo <- \"logisticRegression\" # Custom name engine <- \"glmnet\" # glmnet (default) v <- 2 metric <- \"roc_auc\" # roc_auc (default), accuracy gridNum <- 5 iter <- 10 seed <- 1234  # Modeling using logistic regression algorithm  finalized <- stove::logisticRegression(   algo = algo,   engine = engine,   mode = mode,   trainingData = data_train,   splitedData = data_split,   formula = formula,   rec = rec,   v = v,   gridNum = gridNum,   iter = iter,   metric = metric,   seed = seed )"},{"path":"/index.html","id":"white_check_mark-recommendation","dir":"","previous_headings":"","what":"✅ Recommendation","title":"Stove","text":"training ML model, amount data required depends complexity task want solve complexity learning algorithm. ‘stove’ support training process without cross-validation. recommend training model data least 1,000 rows.","code":""},{"path":"/index.html","id":"blush-authors","dir":"","previous_headings":"","what":"😊 Authors","title":"Stove","text":"Yeonchan Seong @ycseong07","code":""},{"path":"/index.html","id":"memo-license","dir":"","previous_headings":"","what":"📝 License","title":"Stove","text":"Copyright ©️ 2022 Yeonchan Seong project MIT licensed","code":""},{"path":"/index.html","id":"clipboard-dependency","dir":"","previous_headings":"","what":"📋 Dependency","title":"Stove","text":"assertthat - 0.2.1 base64enc - 0.1-3 bayesplot - 1.10.0 boot - 1.3-28.1 C50 - 0.1.7 callr - 3.7.3 class - 7.3-20 cli - 3.6.0 cluster - 2.1.4 codetools - 0.2-18 colorspace - 2.0-3 colourpicker - 1.2.0 combinat - 0.0-8 cowplot - 1.1.1 crayon - 1.5.2 crosstalk - 1.2.0 Cubist - 0.4.1 data.table - 1.14.6 DBI - 1.1.3 dials - 1.1.0 DiceDesign - 1.9 digest - 0.6.31 discrim - 1.0.0 dplyr - 1.0.10 DT - 0.26 dygraphs - 1.1.1.6 ellipsis - 0.3.2 factoextra - 1.0.7 fansi - 1.0.3 
fastmap - 1.1.0 forcats - 0.5.2 foreach - 1.5.2 Formula - 1.2-4 furrr - 0.3.1 future - 1.30.0 future.apply - 1.10.0 generics - 0.1.3 ggplot2 - 3.4.0 ggrepel - 0.9.2 glmnet - 4.1-6 globals - 0.16.2 glue - 1.6.2 gower - 1.0.1 GPfit - 1.0-8 gridExtra - 2.3 gtable - 0.3.1 gtools - 3.9.4 hardhat - 1.2.0 haven - 2.5.1 highr - 0.1 hms - 1.1.2 htmltools - 0.5.4 htmlwidgets - 1.6.1 httpuv - 1.6.7 igraph - 1.3.5 inline - 0.3.19 inum - 1.0-4 ipred - 0.9-13 iterators - 1.0.14 kknn - 1.3.1 klaR - 1.7-1 labelled - 2.10.0 later - 1.3.0 lattice - 0.20-45 lava - 1.7.1 lhs - 1.1.6 libcoin - 1.0-9 lifecycle - 1.0.3 listenv - 0.9.0 lme4 - 1.1-31 loo - 2.5.1 lubridate - 1.9.0 magrittr - 2.0.3 markdown - 1.4 MASS - 7.3-58.1 Matrix - 1.5-3 matrixStats - 0.63.0 mime - 0.12 miniUI - 0.1.1.1 minqa - 1.2.5 munsell - 0.5.0 mvtnorm - 1.1-3 naivebayes - 0.9.7 nlme - 3.1-161 nloptr - 2.0.3 nnet - 7.3-18 parallelly - 1.33.0 parsnip - 1.0.3 partykit - 1.2-16 pillar - 1.8.1 pkgbuild - 1.4.0 pkgconfig - 2.0.3 plyr - 1.8.8 prettyunits - 1.1.1 processx - 3.8.0 prodlim - 2019.11.13 promises - 1.2.0.1 ps - 1.7.0 purrr - 0.3.4 questionr - 0.7.7 R6 - 2.5.1 randomForest - 4.7-1.1 ranger - 0.14.1 RColorBrewer - 1.1-3 Rcpp - 1.0.9 RcppParallel - 5.1.6 recipes - 1.0.3 reshape2 - 1.4.4 rlang - rpart - 4.1.19 rsample - 1.1.1 rstan - 2.21.7 rstanarm - 2.21.3 rstantools - 2.2.0 rstudioapi - 0.14 scales - 1.2.1 sessioninfo - 1.2.2 shape - 1.4.6 shiny - 1.7.4 shinyjs - 2.1.0 shinystan - 2.6.0 shinythemes - 1.2.0 StanHeaders - 2.21.0-7 stringi - 1.7.8 stringr - 1.5.0 survival - 3.5-0 threejs - 0.3.3 tibble - 3.1.8 tidyr - 1.2.1 tidyselect - 1.2.0 timechange - 0.1.1 timeDate - 4022.108 treesnip - 0.1.0.9001 tune - 1.0.1 utf8 - 1.2.2 vctrs - 0.5.1 withr - 2.5.0 workflows - 1.1.2 xtable - 1.8-4 xts - 0.12.2 yardstick - 1.1.0 zoo - 1.8-11","code":""},{"path":"/reference/KNN.html","id":null,"dir":"Reference","previous_headings":"","what":"K-Nearest Neighbors — KNN","title":"K-Nearest Neighbors — KNN","text":"K-Nearest 
Neighbors","code":""},{"path":"/reference/KNN.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"K-Nearest Neighbors — KNN","text":"","code":"KNN(   algo = \"KNN\",   engine = \"kknn\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = NULL,   seed = 1234 )"},{"path":"/reference/KNN.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"K-Nearest Neighbors — KNN","text":"algo name algorithm can customized user (default: \"KNN\"). engine name software used fit model (\"kknn\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/KNN.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"K-Nearest Neighbors — KNN","text":"function training user-defined K-Nearest Neighbors model. 
Hyperparameters tuning: neighbors","code":""},{"path":"/reference/MLP.html","id":null,"dir":"Reference","previous_headings":"","what":"neural network — MLP","title":"neural network — MLP","text":"neural network","code":""},{"path":"/reference/MLP.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"neural network — MLP","text":"","code":"MLP(   algo = \"MLP\",   engine = \"nnet\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = NULL,   seed = 1234 )"},{"path":"/reference/MLP.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"neural network — MLP","text":"algo name algorithm can customized user (default: \"MLP\"). engine name software used fit model (\"nnet\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/MLP.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"neural network — MLP","text":"function training user-defined MLP model. 
Hyperparameters tuning: hidden_units, penalty, epochs","code":""},{"path":"/reference/SVMLinear.html","id":null,"dir":"Reference","previous_headings":"","what":"SVMLinear — SVMLinear","title":"SVMLinear — SVMLinear","text":"SVMLinear","code":""},{"path":"/reference/SVMLinear.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"SVMLinear — SVMLinear","text":"","code":"SVMLinear(   algo = \"SVMLinear\",   engine = \"kernlab\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 15,   metric = NULL,   seed = 1234 )"},{"path":"/reference/SVMLinear.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"SVMLinear — SVMLinear","text":"algo name algorithm can customized user (default: \"SVMLinear\"). engine name software used fit model (\"kernlab\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). 
seed Seed reproducible results.","code":""},{"path":"/reference/SVMLinear.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"SVMLinear — SVMLinear","text":"function training user-defined SVM Linear model.","code":""},{"path":"/reference/SVMPoly.html","id":null,"dir":"Reference","previous_headings":"","what":"SVMPoly — SVMPoly","title":"SVMPoly — SVMPoly","text":"SVMPoly","code":""},{"path":"/reference/SVMPoly.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"SVMPoly — SVMPoly","text":"","code":"SVMPoly(   algo = \"SVMPoly\",   engine = \"kernlab\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 15,   metric = NULL,   seed = 1234 )"},{"path":"/reference/SVMPoly.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"SVMPoly — SVMPoly","text":"algo name algorithm can customized user (default: \"SVMPoly\"). engine name software used fit model (\"kernlab\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). 
seed Seed reproducible results.","code":""},{"path":"/reference/SVMPoly.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"SVMPoly — SVMPoly","text":"function training user-defined SVM Poly model.","code":""},{"path":"/reference/SVMRbf.html","id":null,"dir":"Reference","previous_headings":"","what":"SVMRbf — SVMRbf","title":"SVMRbf — SVMRbf","text":"SVMRbf","code":""},{"path":"/reference/SVMRbf.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"SVMRbf — SVMRbf","text":"","code":"SVMRbf(   algo = \"SVMRbf\",   engine = \"kernlab\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 15,   metric = NULL,   seed = 1234 )"},{"path":"/reference/SVMRbf.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"SVMRbf — SVMRbf","text":"algo name algorithm can customized user (default: \"SVMRbf\"). engine name software used fit model (\"kernlab\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). 
seed Seed reproducible results.","code":""},{"path":"/reference/SVMRbf.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"SVMRbf — SVMRbf","text":"function training user-defined SVM Rbf model.","code":""},{"path":"/reference/bayesOptCV.html","id":null,"dir":"Reference","previous_headings":"","what":"Bayesian optimization with cross validation — bayesOptCV","title":"Bayesian optimization with cross validation — bayesOptCV","text":"Bayesian optimization cross validation","code":""},{"path":"/reference/bayesOptCV.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Bayesian optimization with cross validation — bayesOptCV","text":"","code":"bayesOptCV(   rec = NULL,   model = NULL,   v = NULL,   trainingData = NULL,   gridNum = NULL,   iter = NULL,   seed = NULL )"},{"path":"/reference/bayesOptCV.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Bayesian optimization with cross validation — bayesOptCV","text":"rec recipe object including local preprocessing. model model object including list hyperparameters, engine mode. v Perform cross-validation dividing training data v folds. trainingData training data. gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. 
seed Seed reproducible results.","code":""},{"path":"/reference/bayesOptCV.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Bayesian optimization with cross validation — bayesOptCV","text":"Optimize hyperparameters model Cross Validation Bayesian optimization.","code":""},{"path":"/reference/clusteringVis.html","id":null,"dir":"Reference","previous_headings":"","what":"clusteringVis — clusteringVis","title":"clusteringVis — clusteringVis","text":"clusteringVis","code":""},{"path":"/reference/clusteringVis.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"clusteringVis — clusteringVis","text":"","code":"clusteringVis(   data = NULL,   model = NULL,   maxK = \"15\",   nBoot = \"100\",   selectOptimal = \"silhouette\",   seedNum = \"6471\" )"},{"path":"/reference/clusteringVis.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"clusteringVis — clusteringVis","text":"data data model model maxK maxK nStart nStart","code":""},{"path":"/reference/clusteringVis.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"clusteringVis — clusteringVis","text":"Deprecated","code":""},{"path":"/reference/decisionTree.html","id":null,"dir":"Reference","previous_headings":"","what":"Decision Tree — decisionTree","title":"Decision Tree — decisionTree","text":"Decision Tree","code":""},{"path":"/reference/decisionTree.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Decision Tree — decisionTree","text":"","code":"decisionTree(   algo = \"Decision Tree\",   engine = \"rpart\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = NULL,   seed = 1234 )"},{"path":"/reference/decisionTree.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Decision Tree — 
decisionTree","text":"algo name algorithm can customized user (default: \"Decision Tree\"). engine name software used fit model (\"rpart\" (default), \"C50\", \"partykit\"). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/decisionTree.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Decision Tree — decisionTree","text":"function training user-defined Decision Tree model. 
Hyperparameters tuning: tree_depth, min_n, cost_complexity","code":""},{"path":"/reference/evalMetricsR.html","id":null,"dir":"Reference","previous_headings":"","what":"Evaluation metrics for Regression — evalMetricsR","title":"Evaluation metrics for Regression — evalMetricsR","text":"Evaluation metrics Regression","code":""},{"path":"/reference/evalMetricsR.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Evaluation metrics for Regression — evalMetricsR","text":"","code":"evalMetricsR(modelsList, targetVar)"},{"path":"/reference/evalMetricsR.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Evaluation metrics for Regression — evalMetricsR","text":"modelsList ML 모델 리스트 targetVar 타겟 변수","code":""},{"path":"/reference/evalMetricsR.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Evaluation metrics for Regression — evalMetricsR","text":"ML 모델 리스트로부터 Regression 모델들에 대한 Evaluation metrics를 생성합니다.","code":""},{"path":"/reference/fitBestModel.html","id":null,"dir":"Reference","previous_headings":"","what":"fitting in best model — fitBestModel","title":"fitting in best model — fitBestModel","text":"fitting best model","code":""},{"path":"/reference/fitBestModel.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"fitting in best model — fitBestModel","text":"","code":"fitBestModel(   optResult,   metric,   model,   formula,   trainingData,   splitedData,   modelName )"},{"path":"/reference/fitBestModel.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"fitting in best model — fitBestModel","text":"optResult result object bayesOptCV metric Baseline metric evaluating model performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\") model model object including list hyperparameters, engine mode. 
formula formula modeling trainingData training data. splitedData whole dataset including information fold modelName name model defined algorithm engine selected user","code":""},{"path":"/reference/fitBestModel.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"fitting in best model — fitBestModel","text":"Get bayesOptCV function's return value fit model.","code":""},{"path":"/reference/gridSearchCV.html","id":null,"dir":"Reference","previous_headings":"","what":"Grid search with cross validation — gridSearchCV","title":"Grid search with cross validation — gridSearchCV","text":"Grid search cross validation","code":""},{"path":"/reference/gridSearchCV.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Grid search with cross validation — gridSearchCV","text":"","code":"gridSearchCV(   rec = NULL,   model = NULL,   v = NULL,   trainingData = NULL,   parameterGrid = NULL,   seed = NULL )"},{"path":"/reference/gridSearchCV.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Grid search with cross validation — gridSearchCV","text":"rec 데이터, 전처리 정보를 포함한 recipe object model hyperparameters, ngine, mode 정보가 포함된 model object v v-fold cross validation을 진행 (default: 5, 각 fold 별로 30개 이상의 observations가 있어야 유효한 모델링 결과를 얻을 수 있습니다.) 
trainingData 훈련데이터 셋 seed seed값 설정 parameter_grid grid search를 수행할 때 각 hyperparameter의 값을 담은 object","code":""},{"path":"/reference/gridSearchCV.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Grid search with cross validation — gridSearchCV","text":"하이퍼파라미터를 탐색하는 Grid Search와 데이터 셋을 나누어 평가하는 cross validation을 함께 수행합니다.","code":""},{"path":"/reference/kMeansClustering.html","id":null,"dir":"Reference","previous_headings":"","what":"K means clustering — kMeansClustering","title":"K means clustering — kMeansClustering","text":"K means clustering","code":""},{"path":"/reference/kMeansClustering.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"K means clustering — kMeansClustering","text":"","code":"kMeansClustering(   data,   maxK = 15,   nStart = 25,   iterMax = 10,   nBoot = 100,   algorithm = \"Hartigan-Wong\",   selectOptimal = \"silhouette\",   seedNum = 6471 )"},{"path":"/reference/kMeansClustering.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"K means clustering — kMeansClustering","text":"data 전처리가 완료된 데이터 maxK 클러스터링 수행 시 군집을 2, 3, ..., maxK개로 분할 (default: 15) iterMax 반복계산을 수행할 최대 횟수 (default: 10) nBoot gap statictic을 사용해 클러스터링을 수행할 때 Monte Carlo (bootstrap) 샘플의 개수 (selectOptimal == \"gap_stat\" 일 경우에만 지정, default: 100) algorithm K means를 수행할 알고리즘 선택 (\"Hartigan-Wong\" (default), \"Lloyd\", \"Forgy\", \"MacQueen\") selectOptimal 최적의 K값을 선정할 때 사용할 method 선택 (\"silhouette\" (default), \"gap_stat\") seedNum seed값 설정 nstart 랜덤 샘플에 대해 초기 클러스터링을 nstart번 시행 (default: 25)","code":""},{"path":"/reference/kMeansClustering.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"K means clustering — kMeansClustering","text":"function K means clustering. 
parameters tuning: maxK, nstart","code":""},{"path":"/reference/lightGbm.html","id":null,"dir":"Reference","previous_headings":"","what":"Light GBM — lightGbm","title":"Light GBM — lightGbm","text":"Light GBM","code":""},{"path":"/reference/lightGbm.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Light GBM — lightGbm","text":"","code":"lightGbm(   algo = \"lightGBM\",   engine = \"lightgbm\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 15,   metric = NULL,   seed = 1234 )"},{"path":"/reference/lightGbm.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Light GBM — lightGbm","text":"algo name algorithm can customized user. (default: \"lightGBM\"). engine name software used fit model(\"lightgbm\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/lightGbm.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Light GBM — lightGbm","text":"function training user-defined Light GBM model. 
Hyperparameters tuning: tree_depth, trees, learn_rate, mtry, min_n, loss_reduction","code":""},{"path":"/reference/linearRegression.html","id":null,"dir":"Reference","previous_headings":"","what":"Linear Regression — linearRegression","title":"Linear Regression — linearRegression","text":"Linear Regression","code":""},{"path":"/reference/linearRegression.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Linear Regression — linearRegression","text":"","code":"linearRegression(   algo = \"Linear Regression\",   engine = \"glmnet\",   mode = \"regression\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = \"rmse\",   seed = 1234 )"},{"path":"/reference/linearRegression.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Linear Regression — linearRegression","text":"algo name algorithm can customized user (default: \"Linear Regression\"). engine name software used fit model (\"glmnet\" (default), \"lm\", \"glm\", \"stan\"). mode model type. \"classification\" \"regression\" (\"regression\" (default)). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/linearRegression.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Linear Regression — linearRegression","text":"function training user-defined Linear Regression model. 
Hyperparameters tuning: penalty, mixture","code":""},{"path":"/reference/logisticRegression.html","id":null,"dir":"Reference","previous_headings":"","what":"Logistic Regression — logisticRegression","title":"Logistic Regression — logisticRegression","text":"function training user-defined Logistic regression model. function supports: binary classification","code":""},{"path":"/reference/logisticRegression.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Logistic Regression — logisticRegression","text":"","code":"logisticRegression(   algo = \"Logistic Regression\",   engine = \"glmnet\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = \"roc_auc\",   seed = 1234 )"},{"path":"/reference/logisticRegression.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Logistic Regression — logisticRegression","text":"algo name algorithm can customized user (default: \"Logistic Regression\"). engine name software used fit model (Option: \"glmnet\" (default)). mode model type. \"classification\" \"regression\" (Option: \"classification\" (default)). trainingData training data. splitedData whole dataset including information fold formula formula modeling rec Recipe object containing preprocessing information cross-validation v Applying v-fold cross validation modeling process (default: 5) gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). 
seed Seed reproducible results.","code":""},{"path":"/reference/logisticRegression.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Logistic Regression — logisticRegression","text":"Hyperparameters tuning: penalty, mixture","code":""},{"path":"/reference/multinomialRegression.html","id":null,"dir":"Reference","previous_headings":"","what":"Multinomial Regression — multinomialRegression","title":"Multinomial Regression — multinomialRegression","text":"function training user-defined Multinomial regression model. function supports: multinomial classification","code":""},{"path":"/reference/multinomialRegression.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Multinomial Regression — multinomialRegression","text":"","code":"multinomialRegression(   algo = \"Multinomial Regression\",   engine = \"glmnet\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = \"roc_auc\",   seed = 1234 )"},{"path":"/reference/multinomialRegression.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Multinomial Regression — multinomialRegression","text":"algo name algorithm can customized user (default: \"Multinomial Regression\"). engine name software used fit model (Option: \"glmnet\" (default)). mode model type. \"classification\" \"regression\" (Option: \"classification\" (default)). trainingData data frame training. splitedData data frame including metadata split. formula formula modeling. rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). 
seed Seed reproducible results.","code":""},{"path":"/reference/multinomialRegression.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Multinomial Regression — multinomialRegression","text":"Hyperparameters tuning: penalty, mixture","code":""},{"path":"/reference/naiveBayes.html","id":null,"dir":"Reference","previous_headings":"","what":"Naive Bayes — naiveBayes","title":"Naive Bayes — naiveBayes","text":"Naive Bayes","code":""},{"path":"/reference/naiveBayes.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Naive Bayes — naiveBayes","text":"","code":"naiveBayes(   algo = \"Naive Bayes\",   engine = \"klaR\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = NULL,   seed = 1234 )"},{"path":"/reference/naiveBayes.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Naive Bayes — naiveBayes","text":"algo name algorithm can customized user (default: \"Naive Bayes\"). engine name software used fit model (\"klaR\" (default), naivebayes). mode model type. \"classification\" \"regression\" (\"classification\" (default)). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/naiveBayes.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Naive Bayes — naiveBayes","text":"function training user-defined Naive Bayes model. 
Hyperparameters tuning: smoothness, Laplace","code":""},{"path":"/reference/pipe.html","id":null,"dir":"Reference","previous_headings":"","what":"AUC-ROC Curve — %>%","title":"AUC-ROC Curve — %>%","text":"AUC-ROC Curve Confusion matrix Regression plot Evaluation metrics Classification","code":""},{"path":"/reference/pipe.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"AUC-ROC Curve — %>%","text":"","code":"rocCurve(modelsList, targetVar)  confusionMatrix(modelName, modelsList, targetVar)  regressionPlot(modelName, modelsList, targetVar)  evalMetricsC(modelsList, targetVar)"},{"path":"/reference/pipe.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"AUC-ROC Curve — %>%","text":"modelsList ML 모델 리스트 targetVar 타겟 변수 modelName 모델명","code":""},{"path":"/reference/pipe.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"AUC-ROC Curve — %>%","text":"ML 모델 리스트로부터 AUC-ROC Curve를 생성합니다. ML 모델 리스트 내 특정 모델에 대해 Confusion matrix를 생성합니다. ML 모델 리스트 내 특정 모델에 대해 Regression plot를 생성합니다. 
ML 모델 리스트로부터 Classification 모델들에 대한 Evaluation metrics를 생성합니다.","code":""},{"path":"/reference/plotRmseComparison.html","id":null,"dir":"Reference","previous_headings":"","what":"rmsePlot — plotRmseComparison","title":"rmsePlot — plotRmseComparison","text":"rmsePlot","code":""},{"path":"/reference/plotRmseComparison.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"rmsePlot — plotRmseComparison","text":"","code":"plotRmseComparison(tunedResultsList, v = v, iter = iter)"},{"path":"/reference/plotRmseComparison.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"rmsePlot — plotRmseComparison","text":"rmsePlot","code":""},{"path":"/reference/prepForCV.html","id":null,"dir":"Reference","previous_headings":"","what":"Preprocessing for cross validation — prepForCV","title":"Preprocessing for cross validation — prepForCV","text":"Preprocessing cross validation","code":""},{"path":"/reference/prepForCV.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Preprocessing for cross validation — prepForCV","text":"","code":"prepForCV(   data = NULL,   formula = NULL,   imputation = FALSE,   normalization = FALSE,   nominalImputationType = \"mode\",   numericImputationType = \"mean\",   normalizationType = \"range\",   seed = \"4814\" )"},{"path":"/reference/prepForCV.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Preprocessing for cross validation — prepForCV","text":"data Training dataset apply local preprocessing recipe. formula formula modeling imputation \"imputation = TRUE\", model trained using cross-validation imputation. 
normalization \"normalization = TRUE\", model trained using cross-validation normalization nominalImputationType Imputation method nominal variable (Option: mode(default), bag, knn) numericImputationType Imputation method numeric variable (Option: mean(default), bag, knn, linear, lower, median, roll) normalizationType Normalization method (Option: range(default), center, normalization, scale) seed seed","code":""},{"path":"/reference/prepForCV.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Preprocessing for cross validation — prepForCV","text":"Define local preprocessing method applied training data fold training data divided several folds.","code":""},{"path":"/reference/randomForest.html","id":null,"dir":"Reference","previous_headings":"","what":"Random Forest — randomForest","title":"Random Forest — randomForest","text":"Random Forest","code":""},{"path":"/reference/randomForest.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Random Forest — randomForest","text":"","code":"randomForest(   algo = \"Random Forest\",   engine = \"ranger\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = NULL,   seed = 1234 )"},{"path":"/reference/randomForest.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Random Forest — randomForest","text":"algo name algorithm can customized user (default: \"Random Forest\"). engine name software used fit model (\"rpart\" (default), \"randomForest\", \"partykit\"). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). 
gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/randomForest.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Random Forest — randomForest","text":"function training user-defined Random Forest model. Hyperparameters tuning: trees, min_n, mtry","code":""},{"path":"/reference/trainTestSplit.html","id":null,"dir":"Reference","previous_headings":"","what":"Train-Test Split — trainTestSplit","title":"Train-Test Split — trainTestSplit","text":"Train-Test Split","code":""},{"path":"/reference/trainTestSplit.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Train-Test Split — trainTestSplit","text":"","code":"trainTestSplit(data = NULL, target = NULL, prop, seed = \"4814\")"},{"path":"/reference/trainTestSplit.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Train-Test Split — trainTestSplit","text":"data Full data set global preprocess completed. target target variable. prop Proportion total data used training data. seed Seed reproducible results.","code":""},{"path":"/reference/trainTestSplit.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Train-Test Split — trainTestSplit","text":"Separate entire data training set test set.","code":""},{"path":"/reference/xgBoost.html","id":null,"dir":"Reference","previous_headings":"","what":"XGBoost — xgBoost","title":"XGBoost — xgBoost","text":"function training user-defined XGBoost model. 
Hyperparameters tuning: tree_depth, trees,learn_rate, mtry, min_n, loss_reduction, sample_size","code":""},{"path":"/reference/xgBoost.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"XGBoost — xgBoost","text":"","code":"xgBoost(   algo = \"XGBoost\",   engine = \"xgboost\",   mode = \"classification\",   trainingData = NULL,   splitedData = NULL,   formula = NULL,   rec = NULL,   v = 5,   gridNum = 5,   iter = 10,   metric = NULL,   seed = 1234 )"},{"path":"/reference/xgBoost.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"XGBoost — xgBoost","text":"algo name algorithm can customized user (default: \"XGBoost\"). engine name software used fit model (\"xgboost\" (default)). mode model type. \"classification\" \"regression\" (\"classification\" (default), \"regression\"). trainingData training data. splitedData data frame including metadata split. formula formula modeling rec Recipe object containing preprocessing information cross-validation. v Applying v-fold cross validation modeling process (default: 5). gridNum Initial number iterations run starting optimization algorithm. iter maximum number search iterations. metric Metric evaluate performance (classification: \"roc_auc\" (default), \"accuracy\" / regression: \"rmse\" (default), \"rsq\"). seed Seed reproducible results.","code":""},{"path":"/reference/xgBoost.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"XGBoost — xgBoost","text":"XGBoost","code":""}]