public final class StratifiedSplit extends GeneratedMessageV3 implements StratifiedSplitOrBuilder
Assigns input data to the training, validation, and test sets so that the
distribution of values found in the categorical column (as specified by the
`key` field) is mirrored within each split. The fraction values determine
the relative sizes of the splits.
For example, if the specified column has three values, with 50% of the rows
having value "A", 25% value "B", and 25% value "C", and the split fractions
are specified as 80/10/10, then the training set will constitute 80% of the
input data, with about 50% of the training set rows having the value "A"
for the specified column, about 25% having the value "B", and about 25%
having the value "C".
Only the top 500 occurring values are used; any values not in the top
500 values are randomly assigned to a split. If fewer than three rows contain
a specific value, those rows are randomly assigned.
Supported only for tabular Datasets.
Protobuf type google.cloud.aiplatform.v1beta1.StratifiedSplit
Inherited Members
com.google.protobuf.GeneratedMessageV3.<ListT>makeMutableCopy(ListT)
Static Fields
public static final int KEY_FIELD_NUMBER
Field Value |
---|
Type | Description |
int | |
public static final int TEST_FRACTION_FIELD_NUMBER
Field Value |
---|
Type | Description |
int | |
public static final int TRAINING_FRACTION_FIELD_NUMBER
Field Value |
---|
Type | Description |
int | |
public static final int VALIDATION_FRACTION_FIELD_NUMBER
Field Value |
---|
Type | Description |
int | |
Static Methods
public static StratifiedSplit getDefaultInstance()
public static final Descriptors.Descriptor getDescriptor()
public static StratifiedSplit.Builder newBuilder()
public static StratifiedSplit.Builder newBuilder(StratifiedSplit prototype)
public static StratifiedSplit parseDelimitedFrom(InputStream input)
public static StratifiedSplit parseDelimitedFrom(InputStream input, ExtensionRegistryLite extensionRegistry)
public static StratifiedSplit parseFrom(byte[] data)
Parameter |
---|
Name | Description |
data | byte[]
|
public static StratifiedSplit parseFrom(byte[] data, ExtensionRegistryLite extensionRegistry)
public static StratifiedSplit parseFrom(ByteString data)
public static StratifiedSplit parseFrom(ByteString data, ExtensionRegistryLite extensionRegistry)
public static StratifiedSplit parseFrom(CodedInputStream input)
public static StratifiedSplit parseFrom(CodedInputStream input, ExtensionRegistryLite extensionRegistry)
public static StratifiedSplit parseFrom(InputStream input)
public static StratifiedSplit parseFrom(InputStream input, ExtensionRegistryLite extensionRegistry)
public static StratifiedSplit parseFrom(ByteBuffer data)
public static StratifiedSplit parseFrom(ByteBuffer data, ExtensionRegistryLite extensionRegistry)
public static Parser<StratifiedSplit> parser()
Methods
public boolean equals(Object obj)
Parameter |
---|
Name | Description |
obj | Object
|
Overrides
public StratifiedSplit getDefaultInstanceForType()
public String getKey()
Required. The key is a name of one of the Dataset's data columns.
The key provided must be for a categorical column.
string key = 4 [(.google.api.field_behavior) = REQUIRED];
Returns |
---|
Type | Description |
String | The key.
|
public ByteString getKeyBytes()
Required. The key is a name of one of the Dataset's data columns.
The key provided must be for a categorical column.
string key = 4 [(.google.api.field_behavior) = REQUIRED];
Returns |
---|
Type | Description |
ByteString | The bytes for key.
|
public Parser<StratifiedSplit> getParserForType()
Overrides
public int getSerializedSize()
Returns |
---|
Type | Description |
int | |
Overrides
public double getTestFraction()
The fraction of the input data that is to be used to evaluate the Model.
double test_fraction = 3;
Returns |
---|
Type | Description |
double | The testFraction.
|
public double getTrainingFraction()
The fraction of the input data that is to be used to train the Model.
double training_fraction = 1;
Returns |
---|
Type | Description |
double | The trainingFraction.
|
public final UnknownFieldSet getUnknownFields()
Overrides
public double getValidationFraction()
The fraction of the input data that is to be used to validate the Model.
double validation_fraction = 2;
Returns |
---|
Type | Description |
double | The validationFraction.
|
public int hashCode()
Returns |
---|
Type | Description |
int | |
Overrides
protected GeneratedMessageV3.FieldAccessorTable internalGetFieldAccessorTable()
Overrides
public final boolean isInitialized()
Overrides
public StratifiedSplit.Builder newBuilderForType()
protected StratifiedSplit.Builder newBuilderForType(GeneratedMessageV3.BuilderParent parent)
Overrides
protected Object newInstance(GeneratedMessageV3.UnusedPrivateParameter unused)
Overrides
public StratifiedSplit.Builder toBuilder()
public void writeTo(CodedOutputStream output)
Overrides