public final class DataOptions extends Object implements com.oracle.labs.mlrg.olcut.config.Options
Modifier and Type | Class and Description |
---|---|
static class | DataOptions.Delimiter: The delimiters supported by CSV files in this options object. |
static class | DataOptions.InputFormat: The input formats supported by this options object. |
Modifier and Type | Field and Description |
---|---|
char | csvQuoteChar |
String | csvResponseName |
DataOptions.Delimiter | delimiter |
int | hashDim |
DataOptions.InputFormat | inputFormat |
int | minCount |
int | ngram |
Path | outputPath |
RowProcessor<?> | rowProcessor |
long | seed |
boolean | termCounting |
Path | testingPath |
Path | trainingPath |
Constructor and Description |
---|
DataOptions() |
Modifier and Type | Method and Description |
---|---|
String | getOptionsDescription() |
<T extends Output<T>> com.oracle.labs.mlrg.olcut.util.Pair<Dataset<T>,Dataset<T>> | load(OutputFactory<T> outputFactory) |
<T extends Output<T>> void | saveModel(Model<T> model) |
@Option(longName="hashing-dimension", usage="Hashing dimension used for standard text format.") public int hashDim
@Option(longName="ngram", usage="Ngram size to generate when using standard text format.") public int ngram
@Option(longName="term-counting", usage="Use term counts instead of boolean when using the standard text format.") public boolean termCounting
@Option(charName=102, longName="model-output-path", usage="Path to serialize model to.") public Path outputPath
@Option(charName=114, longName="seed", usage="RNG seed.") public long seed
@Option(charName=115, longName="input-format", usage="Loads the data using the specified format.") public DataOptions.InputFormat inputFormat
@Option(longName="csv-response-name", usage="Response name in the csv file.") public String csvResponseName
@Option(longName="csv-delimiter", usage="Delimiter") public DataOptions.Delimiter delimiter
@Option(longName="csv-quote-char", usage="Quote character in the CSV file.") public char csvQuoteChar
@Option(longName="columnar-row-processor", usage="The name of the row processor from the config file.") public RowProcessor<?> rowProcessor
@Option(longName="min-count", usage="Minimum cardinality of the features.") public int minCount
@Option(charName=117, longName="training-file", usage="Path to the training file.") public Path trainingPath
@Option(charName=118, longName="testing-file", usage="Path to the testing file.") public Path testingPath
public String getOptionsDescription()
Specified by: getOptionsDescription in interface com.oracle.labs.mlrg.olcut.config.Options
public <T extends Output<T>> com.oracle.labs.mlrg.olcut.util.Pair<Dataset<T>,Dataset<T>> load(OutputFactory<T> outputFactory) throws IOException
Throws: IOException
public <T extends Output<T>> void saveModel(Model<T> model) throws IOException
Throws: IOException
Copyright © 2015–2021 Oracle and/or its affiliates. All rights reserved.