public abstract class SharedTreeModelBuilder<TM extends DTree.TreeModel> extends Job.ValidatedJob
| Modifier and Type | Class and Description |
|---|---|
class |
SharedTreeModelBuilder.Score |
class |
SharedTreeModelBuilder.ScoreBuildHistogram |
Job.ValidatedJob.Response2CMAdaptorJob.ChunkProgress, Job.ChunkProgressJob, Job.ColumnsJob, Job.Fail, Job.FrameJob, Job.HexJob, Job.JobCancelledException, Job.JobState, Job.ModelJob, Job.Progress, Job.ProgressMonitor, Job.ValidatedJobRequest2.ColumnSelect, Request2.Dependent, Request2.DoClassBoolean, Request2.DRFCopyDataBoolean, Request2.MultiVecSelect, Request2.MultiVecSelectType, Request2.TypeaheadKey, Request2.VecClassSelect, Request2.VecSelectRequest.API, Request.Default, Request.Filter, Request.Validator<V>RequestBuilders.ArrayBuilder, RequestBuilders.ArrayHeaderRowBuilder, RequestBuilders.ArrayRowBuilder, RequestBuilders.ArrayRowElementBuilder, RequestBuilders.ArrayRowSingleColBuilder, RequestBuilders.BooleanStringBuilder, RequestBuilders.Builder, RequestBuilders.ElementBuilder, RequestBuilders.HideBuilder, RequestBuilders.KeyCellBuilder, RequestBuilders.KeyElementBuilder, RequestBuilders.KeyLinkElementBuilder, RequestBuilders.KeyMinAvgMaxBuilder, RequestBuilders.NoCaptionObjectBuilder, RequestBuilders.ObjectBuilder, RequestBuilders.PaginatedTable, RequestBuilders.PreFormattedBuilder, RequestBuilders.Response, RequestBuilders.ResponseInfo, RequestBuilders.WarningCellBuilderRequestArguments.Argument<T>, RequestArguments.Bool, RequestArguments.CaseModeSelect, RequestArguments.CaseSelect, RequestArguments.ClassifyBool, RequestArguments.DRFCopyDataBool, RequestArguments.EnumArgument<T extends java.lang.Enum<T>>, RequestArguments.ExistingFile, RequestArguments.FrameClassVec, RequestArguments.FrameKeyMultiVec, RequestArguments.FrameKeyVec, RequestArguments.GeneralFile, RequestArguments.H2OCategoryStrata, RequestArguments.H2OCategoryWeights, RequestArguments.H2OExistingKey, RequestArguments.H2OGLMModelKey, RequestArguments.H2OHexKey, RequestArguments.H2OHexKeyCol, RequestArguments.H2OIllegalArgumentException, RequestArguments.H2OKey, RequestArguments.H2OKey2, RequestArguments.H2OKMeansModelKey, RequestArguments.H2OModelKey<TM extends OldModel,TK extends 
TypeaheadKeysRequest>, RequestArguments.HexAllColumnSelect, RequestArguments.HexColumnSelect, RequestArguments.HexKeyClassCol, RequestArguments.HexNonClassColumnSelect, RequestArguments.HexNonConstantColumnSelect, RequestArguments.HexPCAColumnSelect, RequestArguments.InputCheckBox, RequestArguments.InputSelect<T>, RequestArguments.InputText<T>, RequestArguments.Int, RequestArguments.LongInt, RequestArguments.MultipleSelect<T>, RequestArguments.MultipleText<T>, RequestArguments.NTree, RequestArguments.NumberSequence, RequestArguments.NumberSequenceFloat, RequestArguments.Real, RequestArguments.Record<T>, RequestArguments.RFModelKey, RequestArguments.RSeq, RequestArguments.RSeqFloat, RequestArguments.Str, RequestArguments.StringList, RequestArguments.TypeaheadInputText<T>RequestStatics.RequestTypeConstants.Extensions, Constants.Schemes, Constants.Suffixes| Modifier and Type | Field and Description |
|---|---|
protected long[] |
_distribution |
protected int |
_nclass |
protected int |
_ncols |
protected long |
_nrows |
static int |
DECIDED_ROW
Marker for already decided row.
|
static DocGen.FieldDoc[] |
DOC_FIELDS |
protected boolean |
importance |
int |
max_depth |
static int |
MAX_SUPPORTED_LEVELS
Maximum number of supported levels in the response.
|
int |
min_rows |
int |
nbins |
int |
ntrees |
static int |
OUT_OF_BAG
Marker for sampled-out (out-of-bag) rows.
|
boolean |
score_each_iteration |
_cmDomain, _names, _responseName, _sourceResponseDomain, _train, _valid, _validResponse, _validResponseDomain, validationclassification, responsecols, ignored_cols, ignored_cols_by_namesource_fjtask, CANCELLED_END_TIME, description, destination_key, end_time, exception, job_key, start_time, state_parms, response_info_requestHelp, SUPPORTS_ONLY_V1, SUPPORTS_ONLY_V2, SUPPORTS_V1_V2ARRAY_BUILDER, ARRAY_HEADER_ROW_BUILDER, ARRAY_ROW_BUILDER, ARRAY_ROW_ELEMENT_BUILDER, ARRAY_ROW_SINGLECOL_BUILDER, ELEMENT_BUILDER, GSON_BUILDER, OBJECT_BUILDER, ROOT_OBJECT_queryHtml_argumentsALPHA, ARGUMENTS, AUC, BASE, BEST_THRESHOLD, BETA_EPS, BIN_LIMIT, BROWSE, BUCKET, BUILT_IN_KEY_JOBS, CANCELLED, CARDINALITY, CASE, CASE_MODE, CHUNK, CLASS, CLOUD_HEALTH, CLOUD_NAME, CLOUD_SIZE, CLOUD_UPTIME_MILLIS, CLUSTERS, COEFFICIENTS, COL_INDEX, COLS, COLUMN_NAME, COLUMNS_DISPLAY, CONSENSUS, CONTENTS, COUNT, DATA_KEY, DEPTH, DESCRIPTION, DEST_KEY, DTHRESHOLDS, ELAPSED, END_TIME, ENUM_DOMAIN_SIZE, ERROR, ESCAPE_NAN, EXCLUSIVE_SPLIT_LIMIT, EXPRESSION, FAILED, FAMILY, FEATURES, FILE, FILES, FILTER, FIRST_CHUNK, FJ_QUEUE_HI, FJ_QUEUE_LO, FJ_THREADS_HI, FJ_THREADS_LO, FREE_DISK, FREE_MEM, HEADER, HEIGHT, HELP, IGNORE, ITEMS, ITERATIVE_CM, JOB, JOB_KEY, JOBS, JSON_H2O, KEY, KEYS, LAMBDA, LAST_CONTACT, LIMIT, LINK, LOCKED, MAX, MAX_DISK, MAX_ITER, MAX_MEM, MAX_ROWS, MEAN, MIN, MODEL_KEY, MODELS, MORE, MTRY, MTRY_NODES, NAME, NEG_X, NO_CM, NODE, NODE_HEALTH, NODE_NAME, NODES, NORMALIZE, NUM_COLS, NUM_CPUS, NUM_FAILED, NUM_KEYS, NUM_MISSING_VALUES, NUM_ROWS, NUM_SUCCEEDED, NUM_TREES, OBJECT, OFFSET, OOBEE, PARALLEL, PARSER_TYPE, PATH, PREVIEW, PREVIOUS_MODEL_KEY, PROGRESS, PROGRESS_KEY, PROGRESS_TOTAL, REDIRECT, REDIRECT_ARGS, REPLICATION_FACTOR, REQUEST_TIME, RESPONSE, RHO, ROW, ROW_SIZE, ROWS, RPCS, SAMPLE, SAMPLING_STRATEGY, SCALE, SEED, SENT_ROWS, SEPARATOR, SIZE, SOURCE_KEY, STACK_TRACES, START_TIME, STAT_TYPE, STATUS, STEP, STRATA_SAMPLES, SUCCEEDED, SYSTEM_LOAD, TASK_KEY, TCPS_ACTIVE, TCPS_DUTY, 
TIME, TO_ENUM, TOT_MEM, TREE_COUNT, TREE_DEPTH, TREE_LEAVES, TREE_NUM, TREES, TWEEDIE_POWER, TYPE, URL, USE_NON_LOCAL_DATA, VALUE, VALUE_SIZE, VALUE_TYPE, VARIANCE, VERSION, VIEW, WARNINGS, WEIGHT, WEIGHTS, WIDTH, X, XVAL, Y| Constructor and Description |
|---|
SharedTreeModelBuilder() |
| Modifier and Type | Method and Description |
|---|---|
protected DHistogram[][][] |
buildLayer(Frame fr,
DTree[] ktrees,
int[] leafs,
DHistogram[][][] hcs,
boolean subset,
boolean build_tree_per_node) |
void |
buildModel() |
protected abstract TM |
buildModel(TM initialModel,
Frame trainFr,
java.lang.String[] names,
java.lang.String[][] domains,
Timer t_build)
Builds the model.
|
protected Chunk |
chk_nids(Chunk[] chks,
int t) |
protected Chunk |
chk_resp(Chunk[] chks) |
protected Chunk |
chk_tree(Chunk[] chks,
int c) |
protected Chunk |
chk_work(Chunk[] chks,
int c) |
protected void |
cleanUp(Frame fr,
Timer t_build) |
static java.util.Random |
createRNG(long seed) |
protected double[] |
data_row(Chunk[] chks,
int row,
double[] data) |
protected TM |
doScoring(TM model,
Frame fTrain,
DTree[] ktrees,
int tid,
DTree.TreeModel.TreeStats tstats,
boolean finalScoring,
boolean oob,
boolean build_tree_per_node) |
protected abstract float[][] |
doVarImpCalc(TM model,
DTree[] ktrees,
int tid,
Frame validationFrame) |
protected boolean |
inBagRow(Chunk[] chks,
int row) |
protected void |
init()
Invoked before job runs.
|
protected boolean |
isClassification() |
static boolean |
isDecidedRow(int nid) |
static boolean |
isOOBRow(int nid) |
protected abstract Log.Tag.Sys |
logTag()
Returns a log tag for a particular model builder (e.g., DRF, GBM)
|
protected AUC |
makeAUC(ConfusionMatrix[] cms,
float[] threshold) |
protected abstract DTree.DecidedNode |
makeDecided(DTree.UndecidedNode udn,
DHistogram[] hs) |
protected abstract TM |
makeModel(Key outputKey,
Key dataKey,
Key testKey,
java.lang.String[] names,
java.lang.String[][] domains,
java.lang.String[] cmDomain) |
protected abstract TM |
makeModel(TM model,
double err,
ConfusionMatrix cm,
float[] varimp,
float[] varimpSD,
AUC validAUC) |
protected abstract TM |
makeModel(TM model,
DTree[] ktrees,
DTree.TreeModel.TreeStats tstats) |
static int |
nid2Oob(int nid) |
static int |
oob2Nid(int oobNid) |
protected static void |
printGenerateTrees(DTree[] trees) |
float |
progress() |
protected abstract float |
score1(Chunk[] chks,
float[] fs,
int row) |
java.lang.String |
speedDescription()
Description of a speed criterion: msecs/frob
|
long |
speedValue()
Value of the described speed criterion: msecs/frob
|
protected Vec |
vec_nids(Frame fr,
int t) |
protected Vec |
vec_resp(Frame fr,
int t) |
getCMDomain, getOrigValidation, getValidAdaptor, getValidation, getVectorDomain, hasValidation, prepareValidationWithModel, toJSONregisteredselectFrame, selectVecsall, cancel, cancel, cancel, checkIdx, cleanup, defaultDestKey, defaultJobKey, dest, emptyLTrash, execImpl, findJob, findJobByDest, fork, get, gridParallelism, gtrash, gtrash, invoke, isCancelled, isCrashed, isDone, isEnded, isRunning, ltrash, ltrash, onCancelled, redirect, remove, runTimeMs, self, serve, start, waitUntilJobEnded, waitUntilJobEndedcreate, fillResponseInfo, input, logStart, makeJsonBox, serveGrid, set, split, superServeGrid, supportedVersions, toStringaddToNavbar, addToNavbar, addToNavbar, DocExampleFail, DocExampleSucc, href, href, hrefType, HTMLHelp, htmlTemplate, initializeNavBar, log, mapTypeahead, ReSTHelp, serve, serveJava, toDocGET, toHTML, toJava, wrap, wrap, wrap, writeJSONFieldsbuild, buildJSONResponseBox, buildResponseHeader, namebuildQuery, checkArguments, queryArgumentValueSetarguments, argumentsToJson, frameColumnNameToIndex, vaCategoryNames, vaCategoryNames, vaColumnNameToIndexcheckJsonName, encodeRedirectArgs, JSON2HTML, jsonError, requestName, Str2JSONclone, frozenType, init, newInstance, read, toDocField, write, writeJSONpublic static DocGen.FieldDoc[] DOC_FIELDS
public int ntrees
public int max_depth
public int min_rows
public int nbins
public boolean score_each_iteration
protected boolean importance
protected int _ncols
protected long _nrows
protected int _nclass
protected long[] _distribution
public static final int MAX_SUPPORTED_LEVELS
public static final int DECIDED_ROW
public static final int OUT_OF_BAG
protected void init()
Job
init in class Job.ValidatedJob
public void buildModel()
protected TM doScoring(TM model, Frame fTrain, DTree[] ktrees, int tid, DTree.TreeModel.TreeStats tstats, boolean finalScoring, boolean oob, boolean build_tree_per_node)
protected abstract float[][] doVarImpCalc(TM model, DTree[] ktrees, int tid, Frame validationFrame)
protected double[] data_row(Chunk[] chks, int row, double[] data)
protected DHistogram[][][] buildLayer(Frame fr, DTree[] ktrees, int[] leafs, DHistogram[][][] hcs, boolean subset, boolean build_tree_per_node)
protected abstract DTree.DecidedNode makeDecided(DTree.UndecidedNode udn, DHistogram[] hs)
protected abstract float score1(Chunk[] chks, float[] fs, int row)
public java.lang.String speedDescription()
Job
speedDescription in class Job
public long speedValue()
Job
speedValue in class Job
protected abstract Log.Tag.Sys logTag()
protected abstract TM buildModel(TM initialModel, Frame trainFr, java.lang.String[] names, java.lang.String[][] domains, Timer t_build)
initialModel - initial model created by the makeModel(Key, Key, Key, String[], String[][], String[]) method.
trainFr - training dataset which can contain additional temporary vectors prepared by the buildModel() method.
names - names of columns in trainFr used for model training
domains - domains of columns in trainFr used for model training
t_build - timer to measure the model building process
buildModel()
protected abstract TM makeModel(Key outputKey, Key dataKey, Key testKey, java.lang.String[] names, java.lang.String[][] domains, java.lang.String[] cmDomain)
protected abstract TM makeModel(TM model, double err, ConfusionMatrix cm, float[] varimp, float[] varimpSD, AUC validAUC)
protected abstract TM makeModel(TM model, DTree[] ktrees, DTree.TreeModel.TreeStats tstats)
protected AUC makeAUC(ConfusionMatrix[] cms, float[] threshold)
protected boolean inBagRow(Chunk[] chks, int row)
protected final boolean isClassification()
public static final boolean isOOBRow(int nid)
public static final boolean isDecidedRow(int nid)
public static final int oob2Nid(int oobNid)
public static final int nid2Oob(int nid)
public static java.util.Random createRNG(long seed)
protected static void printGenerateTrees(DTree[] trees)