public class GBM extends SharedTreeModelBuilder<GBM.GBMModel>
Modifier and Type | Class and Description |
---|---|
static class |
GBM.Family
Distribution functions
|
static class |
GBM.GBMModel |
SharedTreeModelBuilder.Score, SharedTreeModelBuilder.ScoreBuildHistogram
Job.ValidatedJob.Response2CMAdaptor
Job.ChunkProgress, Job.ChunkProgressJob, Job.ColumnsJob, Job.ColumnsResJob, Job.Fail, Job.FrameJob, Job.JobCancelledException, Job.JobHandle, Job.JobState, Job.List, Job.ModelJob, Job.ModelJobWithoutClassificationField, Job.Progress, Job.ProgressMonitor, Job.ValidatedJob
Request2.ColumnSelect, Request2.Dependent, Request2.DoClassBoolean, Request2.DRFCopyDataBoolean, Request2.MultiVecSelect, Request2.MultiVecSelectType, Request2.SpecialVecSelect, Request2.TypeaheadKey, Request2.VecClassSelect, Request2.VecSelect
Request.API, Request.Default, Request.Filter, Request.Validator<V>
RequestBuilders.ArrayBuilder, RequestBuilders.ArrayHeaderRowBuilder, RequestBuilders.ArrayRowBuilder, RequestBuilders.ArrayRowElementBuilder, RequestBuilders.ArrayRowSingleColBuilder, RequestBuilders.BooleanStringBuilder, RequestBuilders.Builder, RequestBuilders.ElementBuilder, RequestBuilders.HideBuilder, RequestBuilders.KeyCellBuilder, RequestBuilders.KeyElementBuilder, RequestBuilders.KeyLinkElementBuilder, RequestBuilders.KeyMinAvgMaxBuilder, RequestBuilders.NoCaptionObjectBuilder, RequestBuilders.ObjectBuilder, RequestBuilders.PaginatedTable, RequestBuilders.PreFormattedBuilder, RequestBuilders.Response, RequestBuilders.ResponseInfo, RequestBuilders.WarningCellBuilder
RequestArguments.Argument<T>, RequestArguments.Bool, RequestArguments.ClassifyBool, RequestArguments.DRFCopyDataBool, RequestArguments.EnumArgument<T extends java.lang.Enum<T>>, RequestArguments.ExistingFile, RequestArguments.FrameClassVec, RequestArguments.FrameKeyMultiVec, RequestArguments.FrameKeyVec, RequestArguments.GeneralFile, RequestArguments.H2OExistingKey, RequestArguments.H2OIllegalArgumentException, RequestArguments.H2OKey, RequestArguments.H2OKey2, RequestArguments.InputCheckBox, RequestArguments.InputSelect<T>, RequestArguments.InputText<T>, RequestArguments.Int, RequestArguments.LongInt, RequestArguments.MultipleSelect<T>, RequestArguments.MultipleText<T>, RequestArguments.NumberSequence, RequestArguments.NumberSequenceFloat, RequestArguments.Real, RequestArguments.Record<T>, RequestArguments.RSeq, RequestArguments.RSeqFloat, RequestArguments.Str, RequestArguments.StringList, RequestArguments.TypeaheadInputText<T>
RequestStatics.RequestType
Constants.Extensions, Constants.Schemes, Constants.Suffixes
Modifier and Type | Field and Description |
---|---|
static DocGen.FieldDoc[] |
DOC_FIELDS |
GBM.Family |
family |
int |
grid_parallelism |
boolean |
group_split |
double |
learn_rate |
_distribution, _modelClassDist, _nclass, _ncols, _nrows, _ntreesFromCheckpoint, _priorClassDist, balance_classes, checkpoint, class_sampling_factors, DECIDED_ROW, importance, max_after_balance_size, max_depth, MAX_SUPPORTED_LEVELS, min_rows, nbins, ntrees, OUT_OF_BAG, overwrite_checkpoint, score_each_iteration
_cmDomain, _cv_count, _names, _responseName, _sourceResponseDomain, _train, _valid, _validResponse, _validResponseDomain, holdout_fraction, keep_cross_validation_splits, n_folds, validation, xval_models
classification
response
cols, ignored_cols, ignored_cols_by_name
source
_cv, _fjtask, description, destination_key, end_time, exception, job_key, LIST, start_time, state
_parms, response_info
_requestHelp, SUPPORTS_ONLY_V1, SUPPORTS_ONLY_V2, SUPPORTS_V1_V2
ARRAY_BUILDER, ARRAY_HEADER_ROW_BUILDER, ARRAY_ROW_BUILDER, ARRAY_ROW_ELEMENT_BUILDER, ARRAY_ROW_SINGLECOL_BUILDER, ELEMENT_BUILDER, GSON_BUILDER, OBJECT_BUILDER, ROOT_OBJECT
_queryHtml
_arguments
ALPHA, ARGUMENTS, AUC, BASE, BEST_THRESHOLD, BETA_EPS, BIN_LIMIT, BROWSE, BUCKET, BUILT_IN_KEY_JOBS, CANCELLED, CARDINALITY, CASE, CASE_MODE, CHUNK, CLASS, CLOUD_HEALTH, CLOUD_NAME, CLOUD_SIZE, CLOUD_UPTIME_MILLIS, CLUSTERS, COEFFICIENTS, COL_INDEX, COLS, COLUMN_NAME, COLUMNS_DISPLAY, CONSENSUS, CONTENTS, COUNT, DATA_KEY, DEPTH, DESCRIPTION, DEST_KEY, DTHRESHOLDS, ELAPSED, END_TIME, ENUM_DOMAIN_SIZE, ERROR, ESCAPE_NAN, EXCLUSIVE_SPLIT_LIMIT, EXPRESSION, FAILED, FAMILY, FEATURES, FILE, FILES, FILTER, FIRST_CHUNK, FJ_QUEUE_HI, FJ_QUEUE_LO, FJ_THREADS_HI, FJ_THREADS_LO, FREE_DISK, FREE_MEM, GFLOPS, HEADER, HEIGHT, HELP, IGNORE, ITEMS, ITERATIVE_CM, JOB, JOB_KEY, JOBS, JSON_H2O, KEY, KEYS, LAMBDA, LAST_CONTACT, LIMIT, LINK, LOCKED, MAX, MAX_DISK, MAX_ITER, MAX_MEM, MAX_ROWS, MEAN, MEM_BW, MIN, MODEL_KEY, MODELS, MORE, MTRY, MTRY_NODES, NAME, NEG_X, NO_CM, NODE, NODE_HEALTH, NODE_NAME, NODES, NORMALIZE, NUM_COLS, NUM_CPUS, NUM_FAILED, NUM_KEYS, NUM_MISSING_VALUES, NUM_ROWS, NUM_SUCCEEDED, NUM_TREES, OBJECT, OFFSET, OOBEE, PARALLEL, PARSER_TYPE, PATH, PREVIEW, PREVIOUS_MODEL_KEY, PRIOR, PROGRESS, PROGRESS_KEY, PROGRESS_TOTAL, REDIRECT, REDIRECT_ARGS, REPLICATION_FACTOR, REQUEST_TIME, RESPONSE, RHO, ROW, ROW_SIZE, ROWS, RPCS, SAMPLE, SAMPLING_STRATEGY, SCALE, SEED, SENT_ROWS, SEPARATOR, SIZE, SOURCE_KEY, STACK_TRACES, START_TIME, STAT_TYPE, STATUS, STEP, STRATA_SAMPLES, SUCCEEDED, SYSTEM_LOAD, TASK_KEY, TCPS_ACTIVE, TCPS_DUTY, TIME, TO_ENUM, TOT_MEM, TREE_COUNT, TREE_DEPTH, TREE_LEAVES, TREE_NUM, TREES, TWEEDIE_POWER, TYPE, URL, USE_NON_LOCAL_DATA, VALUE, VALUE_SIZE, VALUE_TYPE, VARIANCE, VERSION, VIEW, WARNINGS, WEIGHT, WEIGHTS, WIDTH, X, XVAL, Y
Constructor and Description |
---|
GBM() |
Modifier and Type | Method and Description |
---|---|
protected GBM.GBMModel |
buildModel(GBM.GBMModel model,
Frame fr,
java.lang.String[] names,
java.lang.String[][] domains,
Timer t_build)
Builds model
|
void |
crossValidate(Frame[] splits,
Frame[] cv_preds,
long[] offsets,
int i)
Cross-Validate a GBM model by building new models on N train/test holdout splits
|
protected VarImp |
doVarImpCalc(GBM.GBMModel model,
DTree[] ktrees,
int tid,
Frame validationFrame,
boolean scale)
Compute relative variable importance for GBM model.
|
protected void |
execImpl()
The real implementation which should be provided by ancestors.
|
int |
gridParallelism() |
protected void |
initAlgo(GBM.GBMModel initialModel)
Initialize algorithm - e.g., allocate algorithm-specific data structures.
|
protected void |
initWorkFrame(GBM.GBMModel initialModel,
Frame fr)
Initialize working frame.
|
static java.lang.String |
link(Key k,
java.lang.String content)
Return the query link to this page
|
protected Log.Tag.Sys |
logTag()
Returns a log tag for a particular model builder (e.g., DRF, GBM)
|
protected DTree.DecidedNode |
makeDecided(DTree.UndecidedNode udn,
DHistogram[] hs) |
protected GBM.GBMModel |
makeModel(GBM.GBMModel model,
double err,
ConfusionMatrix cm,
VarImp varimp,
AUCData validAUC) |
protected GBM.GBMModel |
makeModel(GBM.GBMModel model,
DTree[] ktrees,
DTree.TreeModel.TreeStats tstats) |
protected GBM.GBMModel |
makeModel(Key outputKey,
Key dataKey,
Key testKey,
int ntrees,
java.lang.String[] names,
java.lang.String[][] domains,
java.lang.String[] cmDomain,
float[] priorClassDist,
float[] classDist) |
protected RequestBuilders.Response |
redirect() |
Frame |
score(Frame fr) |
protected float |
score1(Chunk[] chks,
float[] fs,
int row) |
protected GBM.GBMModel |
updateModel(GBM.GBMModel additionModel,
GBM.GBMModel checkpoint,
boolean overwriteCheckpoint) |
buildLayer, buildModel, chk_nids, chk_oobt, chk_resp, chk_tree, chk_work, cleanUp, createRNG, data_row, debugPrintTreeColumns, defaultDestKey, doScoring, inBagRow, init, isClassification, isDecidedRow, isOOBRow, makeAUC, nid2Oob, oob2Nid, printGenerateTrees, progress, speedDescription, speedValue, supportsBagging, vec_nids, vec_resp, vec_tree
cv_progress, genericCrossValidation, getCMDomain, getOrigValidation, getValidAdaptor, getValidation, getVectorDomain, hasValidation, prepareValidationWithModel, queryArgumentValueSet, registered, toJSON
selectFrame, selectVecs
all, cancel, cancel, cancel, checkIdx, defaultJobKey, dest, findJob, findJobByDest, fork, get, getState, hygiene, hygiene, invoke, isCancelledOrCrashed, isCrashed, isDone, isEnded, isRunning, isRunning, onCancelled, remove, runTimeMs, self, serve, start, waitUntilJobEnded, waitUntilJobEnded
create, fillResponseInfo, filterNaCols, find, input, logStart, makeJsonBox, serveGrid, servePublic, set, split, superServeGrid, supportedVersions, toJSON, toString
addToNavbar, addToNavbar, addToNavbar, DocExampleFail, DocExampleSucc, href, href, hrefType, HTMLHelp, htmlTemplate, initializeNavBar, log, mapTypeahead, ReSTHelp, serve, serveJava, serveResponse, toDocGET, toHTML, toJava, wrap, wrap, wrap, writeJSONFields
build, buildJSONResponseBox, buildResponseHeader, name
buildQuery, checkArguments
arguments, argumentsToJson, frameColumnNameToIndex
checkJsonName, encodeRedirectArgs, JSON2HTML, jsonError, requestName, Str2JSON
clone, frozenType, init, newInstance, read, toDocField, write, writeJSON
public static DocGen.FieldDoc[] DOC_FIELDS
@Request.API(help="Distribution for computing loss function. AUTO selects gaussian for continuous and multinomial for categorical response", filter=Request.Default.class, json=true, importance=CRITICAL) public GBM.Family family
@Request.API(help="Learning rate, from 0. to 1.0", filter=Request.Default.class, dmin=0.0, dmax=1.0, json=true, importance=SECONDARY) public double learn_rate
@Request.API(help="Grid search parallelism", filter=Request.Default.class, lmax=4L, gridable=false, importance=SECONDARY) public int grid_parallelism
@Request.API(help="Perform Group Splitting Categoricals", filter=Request.Default.class) public boolean group_split
protected Log.Tag.Sys logTag()
SharedTreeModelBuilder
logTag
in class SharedTreeModelBuilder<GBM.GBMModel>
protected GBM.GBMModel makeModel(Key outputKey, Key dataKey, Key testKey, int ntrees, java.lang.String[] names, java.lang.String[][] domains, java.lang.String[] cmDomain, float[] priorClassDist, float[] classDist)
makeModel
in class SharedTreeModelBuilder<GBM.GBMModel>
protected GBM.GBMModel makeModel(GBM.GBMModel model, double err, ConfusionMatrix cm, VarImp varimp, AUCData validAUC)
makeModel
in class SharedTreeModelBuilder<GBM.GBMModel>
protected GBM.GBMModel makeModel(GBM.GBMModel model, DTree[] ktrees, DTree.TreeModel.TreeStats tstats)
makeModel
in class SharedTreeModelBuilder<GBM.GBMModel>
protected GBM.GBMModel updateModel(GBM.GBMModel additionModel, GBM.GBMModel checkpoint, boolean overwriteCheckpoint)
updateModel
in class SharedTreeModelBuilder<GBM.GBMModel>
public static java.lang.String link(Key k, java.lang.String content)
protected void execImpl()
Func
public int gridParallelism()
gridParallelism
in class Job
protected RequestBuilders.Response redirect()
protected void initAlgo(GBM.GBMModel initialModel)
SharedTreeModelBuilder
initAlgo
in class SharedTreeModelBuilder<GBM.GBMModel>
protected void initWorkFrame(GBM.GBMModel initialModel, Frame fr)
SharedTreeModelBuilder
initWorkFrame
in class SharedTreeModelBuilder<GBM.GBMModel>
initialModel - initial model
fr - working frame which contains train data and additional columns prepared by this builder.
protected GBM.GBMModel buildModel(GBM.GBMModel model, Frame fr, java.lang.String[] names, java.lang.String[][] domains, Timer t_build)
SharedTreeModelBuilder
buildModel
in class SharedTreeModelBuilder<GBM.GBMModel>
model - initial model created by makeModel() method.
fr - training dataset which can contain additional temporary vectors prepared by buildModel() method.
names - names of columns in trainFr used for model training
domains - domains of columns in trainFr used for model training
t_build - timer to measure model building process
protected float score1(Chunk[] chks, float[] fs, int row)
score1
in class SharedTreeModelBuilder<GBM.GBMModel>
protected DTree.DecidedNode makeDecided(DTree.UndecidedNode udn, DHistogram[] hs)
makeDecided
in class SharedTreeModelBuilder<GBM.GBMModel>
protected VarImp doVarImpCalc(GBM.GBMModel model, DTree[] ktrees, int tid, Frame validationFrame, boolean scale)
doVarImpCalc
in class SharedTreeModelBuilder<GBM.GBMModel>
public void crossValidate(Frame[] splits, Frame[] cv_preds, long[] offsets, int i)
crossValidate
in class Job.ValidatedJob
splits - Frames containing train/test splits
cv_preds - Array of Frames to store the predictions for each cross-validation run
offsets - Array to store the offsets of starting row indices for each cross-validation run
i - Which fold of cross-validation to perform