public class ModelSelectionParametersV3 extends ModelParametersSchemaV3
| Modifier and Type | Field and Description |
|---|---|
double[] |
alpha
Distribution of regularization between the L1 (Lasso) and L2 (Ridge) penalties.
|
boolean |
balanceClasses
Balance training data class counts via over/under-sampling (for imbalanced data).
|
FrameKeyV3 |
betaConstraints
Beta constraints
|
double |
betaEpsilon
Converge if beta changes less (using L-infinity norm) than beta epsilon, ONLY applies to IRLSM solver
|
boolean |
buildGlmModel
For maxrsweep mode only.
|
boolean |
calcLike
If true, will return likelihood function value for GLM.
|
float[] |
classSamplingFactors
Desired over/under-sampling ratios per class (in lexicographic order).
|
boolean |
coldStart
Only applicable to multiple alpha/lambda values.
|
boolean |
computePValues
Request p-values computation, p-values work only with IRLSM solver and no regularization
|
boolean |
earlyStopping
Stop early when there is no more relative improvement on train or validation (if provided)
|
GLMFamily |
family
Family.
|
double |
gradientEpsilon
Converge if objective changes less (using L-infinity norm) than this, ONLY applies to L-BFGS solver.
|
GLMInfluence |
influence
If set to dfbetas will calculate the difference in beta when a datarow is included and excluded in the dataset.
|
boolean |
intercept
Include constant term in the model
|
double[] |
lambda
Regularization strength
|
double |
lambdaMinRatio
Minimum lambda used in lambda search, specified as a ratio of lambda_max (the smallest lambda that drives all
coefficients to zero).
|
boolean |
lambdaSearch
Use lambda search starting at lambda max, given lambda is then interpreted as lambda min
|
GLMLink |
link
Link function.
|
int |
maxActivePredictors
Maximum number of active predictors during computation.
|
float |
maxAfterBalanceSize
Maximum relative size of the training data after balancing class counts (can be less than 1.0).
|
int |
maxConfusionMatrixSize
[Deprecated] Maximum size (# classes) for confusion matrices to be printed in the Logs
|
int |
maxIterations
Maximum number of iterations
|
int |
maxPredictorNumber
Maximum number of predictors to be considered when building GLM models.
|
int |
minPredictorNumber
For mode = 'backward' only.
|
GLMMissingValuesHandling |
missingValuesHandling
Handling of missing values.
|
ModelSelectionMode |
mode
Mode: Used to choose model selection algorithms to use.
|
boolean |
multinodeMode
For maxrsweep only.
|
int |
nlambdas
Number of lambdas to be used in a search.
|
boolean |
nonNegative
Restrict coefficients (not intercept) to be non-negative
|
int |
nparallelism
Number of models to build in parallel.
|
double |
objectiveEpsilon
Converge if objective value changes less than this.
|
double |
objReg
Likelihood divider in objective value computation, default (of -1.0) will set it to 1/nobs
|
FrameKeyV3 |
plugValues
Plug Values (a single row frame containing values that will be used to impute missing values of the
training/validation frame, use in conjunction with missing_values_handling = PlugValues)
|
double |
prior
Prior probability for y==1.
|
double |
pValuesThreshold
For mode='backward' only.
|
boolean |
removeCollinearColumns
In case of linearly dependent columns, remove some of the dependent columns
|
int |
scoreIterationInterval
Perform scoring for every score_iteration_interval iterations
|
long |
seed
Seed for pseudo random number generator (if applicable)
|
GLMSolver |
solver
AUTO will set the solver based on given data and the other parameters.
|
boolean |
standardize
Standardize numeric columns to have zero mean and unit variance
|
double[] |
startval
Double array to initialize coefficients for GLM.
|
double |
theta
Theta
|
double |
tweedieLinkPower
Tweedie link power
|
double |
tweedieVariancePower
Tweedie variance power
|
aucType, categoricalEncoding, checkpoint, customDistributionFunc, customMetricFunc, distribution, exportCheckpointsDir, foldAssignment, foldColumn, gainsliftBins, huberAlpha, ignoreConstCols, ignoredColumns, keepCrossValidationFoldAssignment, keepCrossValidationModels, keepCrossValidationPredictions, maxCategoricalLevels, maxRuntimeSecs, modelId, nfolds, offsetColumn, parallelizeCrossValidation, quantileAlpha, responseColumn, scoreEachIteration, stoppingMetric, stoppingRounds, stoppingTolerance, trainingFrame, tweediePower, validationFrame, weightsColumn
| Constructor and Description |
|---|
ModelSelectionParametersV3()
Public constructor
|
| Modifier and Type | Method and Description |
|---|---|
java.lang.String |
toString()
Return the contents of this object as a JSON String.
|
public long seed
public GLMFamily family
@SerializedName(value="tweedie_variance_power") public double tweedieVariancePower
@SerializedName(value="tweedie_link_power") public double tweedieLinkPower
public double theta
public GLMSolver solver
public double[] alpha
public double[] lambda
@SerializedName(value="lambda_search") public boolean lambdaSearch
@SerializedName(value="multinode_mode") public boolean multinodeMode
@SerializedName(value="build_glm_model") public boolean buildGlmModel
@SerializedName(value="early_stopping") public boolean earlyStopping
public int nlambdas
@SerializedName(value="score_iteration_interval") public int scoreIterationInterval
public boolean standardize
@SerializedName(value="cold_start") public boolean coldStart
@SerializedName(value="missing_values_handling") public GLMMissingValuesHandling missingValuesHandling
@SerializedName(value="plug_values") public FrameKeyV3 plugValues
@SerializedName(value="non_negative") public boolean nonNegative
@SerializedName(value="max_iterations") public int maxIterations
@SerializedName(value="beta_epsilon") public double betaEpsilon
@SerializedName(value="objective_epsilon") public double objectiveEpsilon
@SerializedName(value="gradient_epsilon") public double gradientEpsilon
@SerializedName(value="obj_reg") public double objReg
public GLMLink link
public double[] startval
@SerializedName(value="calc_like") public boolean calcLike
public ModelSelectionMode mode
public boolean intercept
public double prior
@SerializedName(value="lambda_min_ratio") public double lambdaMinRatio
@SerializedName(value="beta_constraints") public FrameKeyV3 betaConstraints
@SerializedName(value="max_active_predictors") public int maxActivePredictors
@SerializedName(value="balance_classes") public boolean balanceClasses
@SerializedName(value="class_sampling_factors") public float[] classSamplingFactors
@SerializedName(value="max_after_balance_size") public float maxAfterBalanceSize
@SerializedName(value="max_confusion_matrix_size") public int maxConfusionMatrixSize
@SerializedName(value="compute_p_values") public boolean computePValues
@SerializedName(value="remove_collinear_columns") public boolean removeCollinearColumns
@SerializedName(value="max_predictor_number") public int maxPredictorNumber
@SerializedName(value="min_predictor_number") public int minPredictorNumber
public int nparallelism
@SerializedName(value="p_values_threshold") public double pValuesThreshold
public GLMInfluence influence
public ModelSelectionParametersV3()
public java.lang.String toString()
toString in class ModelParametersSchemaV3