public class DRFParametersV3 extends SharedTreeParametersV3
| Modifier and Type | Field and Description |
|---|---|
boolean |
balance_classes
Balance training data class counts via over/under-sampling (for imbalanced data).
|
boolean |
binomial_double_trees
For binary classification: Build 2x as many trees (one per class) - can lead to higher accuracy.
|
boolean |
build_tree_one_node
Run on one node only; no network overhead but fewer cpus used.
|
java.lang.String |
checkpoint
Model checkpoint to resume training with
|
float[] |
class_sampling_factors
Desired over/under-sampling ratios per class (in lexicographic order).
|
float |
col_sample_rate_per_tree
Column sample rate per tree (from 0.0 to 1.0)
|
FoldAssignmentScheme |
fold_assignment
Cross-validation fold assignment scheme, if fold_column is not specified
|
ColSpecifierV3 |
fold_column
Column with cross-validation fold index assignment per observation
|
boolean |
ignore_const_cols
Ignore constant columns
|
java.lang.String[] |
ignored_columns
Ignored columns
|
boolean |
keep_cross_validation_predictions
Keep cross-validation model predictions
|
float |
max_after_balance_size
Maximum relative size of the training data after balancing class counts (can be less than 1.0).
|
int |
max_confusion_matrix_size
Maximum size (# classes) for confusion matrices to be printed in the Logs
|
int |
max_depth
Maximum tree depth.
|
int |
max_hit_ratio_k
Max.
|
double |
max_runtime_secs
Maximum allowed runtime in seconds for model training.
|
double |
min_rows
Fewest allowed (weighted) observations in a leaf (in R called 'nodesize').
|
java.lang.String |
model_id
Destination id for this model; auto-generated if not specified
|
int |
mtries
Number of variables randomly sampled as candidates at each split.
|
int |
nbins
For numerical columns (real/int), build a histogram of (at least) this many bins, then split at the best point
|
int |
nbins_cats
For categorical columns (factors), build a histogram of this many bins, then split at the best point.
|
int |
nbins_top_level
For numerical columns (real/int), build a histogram of (at most) this many bins at the root level, then decrease by factor of two per level
|
int |
nfolds
Number of folds for N-fold cross-validation
|
int |
ntrees
Number of trees.
|
ColSpecifierV3 |
offset_column
Offset column
|
boolean |
parallelize_cross_validation
Allow parallel training of cross-validation models
|
double |
r2_stopping
Stop making trees when the R^2 metric equals or exceeds this
|
ColSpecifierV3 |
response_column
Response column
|
float |
sample_rate
Row sample rate (from 0.0 to 1.0)
|
boolean |
score_each_iteration
Whether to score during each iteration of model training
|
int |
score_tree_interval
Score the model after every so many trees.
|
long |
seed
Seed for pseudo random number generator (if applicable)
|
StoppingMetric |
stopping_metric
Metric to use for early stopping (AUTO: logloss for classification, deviance for regression)
|
int |
stopping_rounds
Early stopping based on convergence of stopping_metric.
|
double |
stopping_tolerance
Relative tolerance for metric-based stopping criterion Relative tolerance for metric-based stopping criterion (stop if relative improvement is not at least this much)
|
java.lang.String |
training_frame
Training frame
|
java.lang.String |
validation_frame
Validation frame
|
ColSpecifierV3 |
weights_column
Column with observation weights
|
| Constructor and Description |
|---|
DRFParametersV3() |
public int mtries
public boolean binomial_double_trees
public boolean balance_classes
public float[] class_sampling_factors
public float max_after_balance_size
public int max_confusion_matrix_size
public int max_hit_ratio_k
public int ntrees
public int max_depth
public double min_rows
public int nbins
public int nbins_top_level
public int nbins_cats
public double r2_stopping
public long seed
public boolean build_tree_one_node
public float sample_rate
public float col_sample_rate_per_tree
public int score_tree_interval
public java.lang.String model_id
public java.lang.String training_frame
public java.lang.String validation_frame
public int nfolds
public boolean keep_cross_validation_predictions
public boolean parallelize_cross_validation
public ColSpecifierV3 response_column
public ColSpecifierV3 weights_column
public ColSpecifierV3 offset_column
public ColSpecifierV3 fold_column
public FoldAssignmentScheme fold_assignment
public java.lang.String[] ignored_columns
public boolean ignore_const_cols
public boolean score_each_iteration
public java.lang.String checkpoint
public int stopping_rounds
public double max_runtime_secs
public StoppingMetric stopping_metric
public double stopping_tolerance