public class DataInfo extends water.Keyed<DataInfo>
| Modifier and Type | Class and Description |
|---|---|
class |
DataInfo.Row |
class |
DataInfo.Rows |
static class |
DataInfo.TransformType |
| Modifier and Type | Field and Description |
|---|---|
int[] |
_activeCols |
water.fvec.Frame |
_adaptedFrame |
int[][] |
_catLvls |
boolean[] |
_catMissing |
int[] |
_catModes |
int[] |
_catOffsets |
int |
_cats |
java.lang.String[] |
_coefNames |
boolean |
_fold |
boolean |
_imputeMissing |
boolean |
_intercept |
double[] |
_normMul |
double[] |
_normRespMul |
double[] |
_normRespSub |
double[] |
_normSub |
double[] |
_numMeans |
int |
_nums |
boolean |
_offset |
int |
_outpus |
int[] |
_permutation |
DataInfo.TransformType |
_predictor_transform |
DataInfo.TransformType |
_response_transform |
int |
_responses |
boolean |
_skipMissing |
boolean |
_useAllFactorLevels |
boolean |
_valid |
boolean |
_weights |
| Constructor and Description |
|---|
DataInfo(water.fvec.Frame train,
water.fvec.Frame valid,
boolean useAllFactorLevels,
DataInfo.TransformType predictor_transform,
boolean skipMissing,
boolean imputeMissing,
boolean missingBucket) |
DataInfo(water.fvec.Frame train,
water.fvec.Frame valid,
int nResponses,
boolean useAllFactorLevels,
DataInfo.TransformType predictor_transform,
DataInfo.TransformType response_transform,
boolean skipMissing,
boolean imputeMissing,
boolean missingBucket,
boolean weight,
boolean offset,
boolean fold) |
DataInfo(water.fvec.Frame train,
water.fvec.Frame valid,
int nResponses,
boolean useAllFactorLevels,
DataInfo.TransformType predictor_transform,
DataInfo.TransformType response_transform,
boolean skipMissing,
boolean imputeMissing,
boolean missingBucket,
boolean weight,
boolean offset,
boolean fold,
boolean intercept) |
| Modifier and Type | Method and Description |
|---|---|
int[] |
activeCols() |
void |
addOutput(java.lang.String name,
water.fvec.Vec v) |
void |
addResponse(java.lang.String[] names,
water.fvec.Vec[] vecs) |
protected long |
checksum_impl() |
java.lang.String[] |
coefNames() |
DataInfo |
deep_clone() |
double[] |
denormalizeBeta(double[] beta) |
void |
dropWeights() |
DataInfo.Row |
extractDenseRow(water.fvec.Chunk[] chunks,
int rid,
DataInfo.Row row) |
DataInfo.Row |
extractDenseRow(double[] vals,
DataInfo.Row row) |
DataInfo.Row[] |
extractSparseRows(water.fvec.Chunk[] chunks)
Extract (sparse) rows from given chunks.
|
DataInfo |
filterExpandedColumns(int[] cols) |
int |
foldChunkId() |
int |
fullN() |
int |
getCategoricalId(int cid,
int val) |
water.fvec.Vec |
getOffsetVec() |
water.fvec.Vec |
getOutputVec(int i) |
water.fvec.Vec |
getWeightsVec() |
static int |
imputeCat(water.fvec.Vec v) |
int |
largestCat() |
int[] |
mapNames(java.lang.String[] names) |
DataInfo.Row |
newDenseRow() |
DataInfo.Row |
newDenseRow(double[] numVals,
long start) |
int |
numStart() |
int |
offsetChunkId() |
int |
outputChunkId() |
int |
outputChunkId(int n) |
int |
responseChunkId(int n) |
DataInfo.Rows |
rows(water.fvec.Chunk[] chks) |
DataInfo.Rows |
rows(water.fvec.Chunk[] chks,
boolean sparse) |
DataInfo |
scoringInfo() |
void |
setPredictorTransform(DataInfo.TransformType t) |
void |
setResponse(java.lang.String name,
water.fvec.Vec v) |
void |
setResponse(java.lang.String name,
water.fvec.Vec v,
int n) |
void |
setResponseTransform(DataInfo.TransformType t) |
water.fvec.Vec |
setWeights(java.lang.String name,
water.fvec.Vec vec) |
void |
unScaleNumericals(double[] in,
double[] out)
Undo the standardization/normalization of numerical columns
|
void |
updateWeightedSigmaAndMean(double[] sigmas,
double[] mean) |
void |
updateWeightedSigmaAndMeanForResponse(double[] sigmas,
double[] mean) |
DataInfo |
validDinfo(water.fvec.Frame valid) |
int |
weightChunkId() |
checksum, makeSchema, readAll_impl, readAll, remove_impl, remove, remove, remove, remove, writeAll_impl, writeAllpublic int[] _activeCols
public water.fvec.Frame _adaptedFrame
public int _responses
public int _outpus
public DataInfo.TransformType _predictor_transform
public DataInfo.TransformType _response_transform
public boolean _useAllFactorLevels
public int _nums
public int _cats
public int[] _catOffsets
public boolean[] _catMissing
public int[] _catModes
public int[] _permutation
public double[] _normMul
public double[] _normSub
public double[] _normRespMul
public double[] _normRespSub
public double[] _numMeans
public boolean _intercept
public boolean _offset
public boolean _weights
public boolean _fold
public final boolean _skipMissing
public final boolean _imputeMissing
public boolean _valid
public final int[][] _catLvls
public java.lang.String[] _coefNames
public DataInfo(water.fvec.Frame train,
water.fvec.Frame valid,
boolean useAllFactorLevels,
DataInfo.TransformType predictor_transform,
boolean skipMissing,
boolean imputeMissing,
boolean missingBucket)
public DataInfo(water.fvec.Frame train,
water.fvec.Frame valid,
int nResponses,
boolean useAllFactorLevels,
DataInfo.TransformType predictor_transform,
DataInfo.TransformType response_transform,
boolean skipMissing,
boolean imputeMissing,
boolean missingBucket,
boolean weight,
boolean offset,
boolean fold)
public DataInfo(water.fvec.Frame train,
water.fvec.Frame valid,
int nResponses,
boolean useAllFactorLevels,
DataInfo.TransformType predictor_transform,
DataInfo.TransformType response_transform,
boolean skipMissing,
boolean imputeMissing,
boolean missingBucket,
boolean weight,
boolean offset,
boolean fold,
boolean intercept)
public water.fvec.Vec setWeights(java.lang.String name,
water.fvec.Vec vec)
public void dropWeights()
public int[] activeCols()
public void addResponse(java.lang.String[] names,
water.fvec.Vec[] vecs)
public int responseChunkId(int n)
public int foldChunkId()
public int offsetChunkId()
public int weightChunkId()
public int outputChunkId()
public int outputChunkId(int n)
public void addOutput(java.lang.String name,
water.fvec.Vec v)
public water.fvec.Vec getOutputVec(int i)
public void setResponse(java.lang.String name,
water.fvec.Vec v)
public void setResponse(java.lang.String name,
water.fvec.Vec v,
int n)
protected long checksum_impl()
checksum_impl in class water.Keyed<DataInfo>public DataInfo deep_clone()
public DataInfo validDinfo(water.fvec.Frame valid)
public DataInfo scoringInfo()
public double[] denormalizeBeta(double[] beta)
public static int imputeCat(water.fvec.Vec v)
public DataInfo filterExpandedColumns(int[] cols)
public void updateWeightedSigmaAndMean(double[] sigmas,
double[] mean)
public void updateWeightedSigmaAndMeanForResponse(double[] sigmas,
double[] mean)
public void setPredictorTransform(DataInfo.TransformType t)
public void setResponseTransform(DataInfo.TransformType t)
public final int fullN()
public final int largestCat()
public final int numStart()
public final java.lang.String[] coefNames()
public int[] mapNames(java.lang.String[] names)
public final void unScaleNumericals(double[] in,
double[] out)
in - input valuesout - output values (can be the same as input)public final int getCategoricalId(int cid,
int val)
public final DataInfo.Row extractDenseRow(double[] vals, DataInfo.Row row)
public final DataInfo.Row extractDenseRow(water.fvec.Chunk[] chunks, int rid, DataInfo.Row row)
public water.fvec.Vec getWeightsVec()
public water.fvec.Vec getOffsetVec()
public DataInfo.Row newDenseRow()
public DataInfo.Row newDenseRow(double[] numVals, long start)
public DataInfo.Rows rows(water.fvec.Chunk[] chks)
public DataInfo.Rows rows(water.fvec.Chunk[] chks, boolean sparse)
public final DataInfo.Row[] extractSparseRows(water.fvec.Chunk[] chunks)
chunks - - chunk of dataset