Class OcrConfig (2.45.0)

public final class OcrConfig extends GeneratedMessageV3 implements OcrConfigOrBuilder

Config for Document OCR.

Protobuf type google.cloud.documentai.v1.OcrConfig

Implements

OcrConfigOrBuilder

Static Fields

ADVANCED_OCR_OPTIONS_FIELD_NUMBER

public static final int ADVANCED_OCR_OPTIONS_FIELD_NUMBER
Field Value
TypeDescription
int

COMPUTE_STYLE_INFO_FIELD_NUMBER

public static final int COMPUTE_STYLE_INFO_FIELD_NUMBER
Field Value
TypeDescription
int

DISABLE_CHARACTER_BOXES_DETECTION_FIELD_NUMBER

public static final int DISABLE_CHARACTER_BOXES_DETECTION_FIELD_NUMBER
Field Value
TypeDescription
int

ENABLE_IMAGE_QUALITY_SCORES_FIELD_NUMBER

public static final int ENABLE_IMAGE_QUALITY_SCORES_FIELD_NUMBER
Field Value
TypeDescription
int

ENABLE_NATIVE_PDF_PARSING_FIELD_NUMBER

public static final int ENABLE_NATIVE_PDF_PARSING_FIELD_NUMBER
Field Value
TypeDescription
int

ENABLE_SYMBOL_FIELD_NUMBER

public static final int ENABLE_SYMBOL_FIELD_NUMBER
Field Value
TypeDescription
int

HINTS_FIELD_NUMBER

public static final int HINTS_FIELD_NUMBER
Field Value
TypeDescription
int

PREMIUM_FEATURES_FIELD_NUMBER

public static final int PREMIUM_FEATURES_FIELD_NUMBER
Field Value
TypeDescription
int

Static Methods

getDefaultInstance()

public static OcrConfig getDefaultInstance()
Returns
TypeDescription
OcrConfig

getDescriptor()

public static final Descriptors.Descriptor getDescriptor()
Returns
TypeDescription
Descriptor

newBuilder()

public static OcrConfig.Builder newBuilder()
Returns
TypeDescription
OcrConfig.Builder

newBuilder(OcrConfig prototype)

public static OcrConfig.Builder newBuilder(OcrConfig prototype)
Parameter
NameDescription
prototype OcrConfig
Returns
TypeDescription
OcrConfig.Builder

parseDelimitedFrom(InputStream input)

public static OcrConfig parseDelimitedFrom(InputStream input)
Parameter
NameDescription
input InputStream
Returns
TypeDescription
OcrConfig
Exceptions
TypeDescription
IOException

parseDelimitedFrom(InputStream input, ExtensionRegistryLite extensionRegistry)

public static OcrConfig parseDelimitedFrom(InputStream input, ExtensionRegistryLite extensionRegistry)
Parameters
NameDescription
input InputStream
extensionRegistry ExtensionRegistryLite
Returns
TypeDescription
OcrConfig
Exceptions
TypeDescription
IOException

parseFrom(byte[] data)

public static OcrConfig parseFrom(byte[] data)
Parameter
NameDescription
data byte[]
Returns
TypeDescription
OcrConfig
Exceptions
TypeDescription
InvalidProtocolBufferException

parseFrom(byte[] data, ExtensionRegistryLite extensionRegistry)

public static OcrConfig parseFrom(byte[] data, ExtensionRegistryLite extensionRegistry)
Parameters
NameDescription
data byte[]
extensionRegistry ExtensionRegistryLite
Returns
TypeDescription
OcrConfig
Exceptions
TypeDescription
InvalidProtocolBufferException

parseFrom(ByteString data)

public static OcrConfig parseFrom(ByteString data)
Parameter
NameDescription
data ByteString
Returns
TypeDescription
OcrConfig
Exceptions
TypeDescription
InvalidProtocolBufferException

parseFrom(ByteString data, ExtensionRegistryLite extensionRegistry)

public static OcrConfig parseFrom(ByteString data, ExtensionRegistryLite extensionRegistry)
Parameters
NameDescription
data ByteString
extensionRegistry ExtensionRegistryLite
Returns
TypeDescription
OcrConfig
Exceptions
TypeDescription
InvalidProtocolBufferException

parseFrom(CodedInputStream input)

public static OcrConfig parseFrom(CodedInputStream input)
Parameter
NameDescription
input CodedInputStream
Returns
TypeDescription
OcrConfig
Exceptions
TypeDescription
IOException

parseFrom(CodedInputStream input, ExtensionRegistryLite extensionRegistry)

public static OcrConfig parseFrom(CodedInputStream input, ExtensionRegistryLite extensionRegistry)
Parameters
NameDescription
input CodedInputStream
extensionRegistry ExtensionRegistryLite
Returns
TypeDescription
OcrConfig
Exceptions
TypeDescription
IOException

parseFrom(InputStream input)

public static OcrConfig parseFrom(InputStream input)
Parameter
NameDescription
input InputStream
Returns
TypeDescription
OcrConfig
Exceptions
TypeDescription
IOException

parseFrom(InputStream input, ExtensionRegistryLite extensionRegistry)

public static OcrConfig parseFrom(InputStream input, ExtensionRegistryLite extensionRegistry)
Parameters
NameDescription
input InputStream
extensionRegistry ExtensionRegistryLite
Returns
TypeDescription
OcrConfig
Exceptions
TypeDescription
IOException

parseFrom(ByteBuffer data)

public static OcrConfig parseFrom(ByteBuffer data)
Parameter
NameDescription
data ByteBuffer
Returns
TypeDescription
OcrConfig
Exceptions
TypeDescription
InvalidProtocolBufferException

parseFrom(ByteBuffer data, ExtensionRegistryLite extensionRegistry)

public static OcrConfig parseFrom(ByteBuffer data, ExtensionRegistryLite extensionRegistry)
Parameters
NameDescription
data ByteBuffer
extensionRegistry ExtensionRegistryLite
Returns
TypeDescription
OcrConfig
Exceptions
TypeDescription
InvalidProtocolBufferException

parser()

public static Parser<OcrConfig> parser()
Returns
TypeDescription
Parser<OcrConfig>

Methods

equals(Object obj)

public boolean equals(Object obj)
Parameter
NameDescription
obj Object
Returns
TypeDescription
boolean
Overrides

getAdvancedOcrOptions(int index)

public String getAdvancedOcrOptions(int index)

A list of advanced OCR options to further fine-tune OCR behavior. Current valid values are:

  • legacy_layout: a heuristic layout detection algorithm, which serves as an alternative to the current ML-based layout detection algorithm. Customers can choose the most suitable layout algorithm for their situation.

repeated string advanced_ocr_options = 5;

Parameter
NameDescription
index int

The index of the element to return.

Returns
TypeDescription
String

The advancedOcrOptions at the given index.

getAdvancedOcrOptionsBytes(int index)

public ByteString getAdvancedOcrOptionsBytes(int index)

A list of advanced OCR options to further fine-tune OCR behavior. Current valid values are:

  • legacy_layout: a heuristic layout detection algorithm, which serves as an alternative to the current ML-based layout detection algorithm. Customers can choose the most suitable layout algorithm for their situation.

repeated string advanced_ocr_options = 5;

Parameter
NameDescription
index int

The index of the value to return.

Returns
TypeDescription
ByteString

The bytes of the advancedOcrOptions at the given index.

getAdvancedOcrOptionsCount()

public int getAdvancedOcrOptionsCount()

A list of advanced OCR options to further fine-tune OCR behavior. Current valid values are:

  • legacy_layout: a heuristic layout detection algorithm, which serves as an alternative to the current ML-based layout detection algorithm. Customers can choose the most suitable layout algorithm for their situation.

repeated string advanced_ocr_options = 5;

Returns
TypeDescription
int

The count of advancedOcrOptions.

getAdvancedOcrOptionsList()

public ProtocolStringList getAdvancedOcrOptionsList()

A list of advanced OCR options to further fine-tune OCR behavior. Current valid values are:

  • legacy_layout: a heuristic layout detection algorithm, which serves as an alternative to the current ML-based layout detection algorithm. Customers can choose the most suitable layout algorithm for their situation.

repeated string advanced_ocr_options = 5;

Returns
TypeDescription
ProtocolStringList

A list containing the advancedOcrOptions.

getComputeStyleInfo() (deprecated)

public boolean getComputeStyleInfo()

Deprecated. google.cloud.documentai.v1.OcrConfig.compute_style_info is deprecated. See google/cloud/documentai/v1/document_io.proto;l=165

Turn on font identification model and return font style information. Deprecated, use PremiumFeatures.compute_style_info instead.

bool compute_style_info = 8 [deprecated = true];

Returns
TypeDescription
boolean

The computeStyleInfo.

getDefaultInstanceForType()

public OcrConfig getDefaultInstanceForType()
Returns
TypeDescription
OcrConfig

getDisableCharacterBoxesDetection()

public boolean getDisableCharacterBoxesDetection()

Turn off character box detector in OCR engine. Character box detection is enabled by default in OCR 2.0 (and later) processors.

bool disable_character_boxes_detection = 10;

Returns
TypeDescription
boolean

The disableCharacterBoxesDetection.

getEnableImageQualityScores()

public boolean getEnableImageQualityScores()

Enables intelligent document quality scores after OCR. Can help with diagnosing why OCR responses are of poor quality for a given input. Adds latency to the process call comparable to that of regular OCR.

bool enable_image_quality_scores = 4;

Returns
TypeDescription
boolean

The enableImageQualityScores.

getEnableNativePdfParsing()

public boolean getEnableNativePdfParsing()

Enables special handling for PDFs with existing text information. Results in better text extraction quality in such PDF inputs.

bool enable_native_pdf_parsing = 3;

Returns
TypeDescription
boolean

The enableNativePdfParsing.

getEnableSymbol()

public boolean getEnableSymbol()

Includes symbol-level OCR information if set to true.

bool enable_symbol = 6;

Returns
TypeDescription
boolean

The enableSymbol.

getHints()

public OcrConfig.Hints getHints()

Hints for the OCR model.

.google.cloud.documentai.v1.OcrConfig.Hints hints = 2;

Returns
TypeDescription
OcrConfig.Hints

The hints.

getHintsOrBuilder()

public OcrConfig.HintsOrBuilder getHintsOrBuilder()

Hints for the OCR model.

.google.cloud.documentai.v1.OcrConfig.Hints hints = 2;

Returns
TypeDescription
OcrConfig.HintsOrBuilder

getParserForType()

public Parser<OcrConfig> getParserForType()
Returns
TypeDescription
Parser<OcrConfig>
Overrides

getPremiumFeatures()

public OcrConfig.PremiumFeatures getPremiumFeatures()

Configurations for premium OCR features.

.google.cloud.documentai.v1.OcrConfig.PremiumFeatures premium_features = 11;

Returns
TypeDescription
OcrConfig.PremiumFeatures

The premiumFeatures.

getPremiumFeaturesOrBuilder()

public OcrConfig.PremiumFeaturesOrBuilder getPremiumFeaturesOrBuilder()

Configurations for premium OCR features.

.google.cloud.documentai.v1.OcrConfig.PremiumFeatures premium_features = 11;

Returns
TypeDescription
OcrConfig.PremiumFeaturesOrBuilder

getSerializedSize()

public int getSerializedSize()
Returns
TypeDescription
int
Overrides

hasHints()

public boolean hasHints()

Hints for the OCR model.

.google.cloud.documentai.v1.OcrConfig.Hints hints = 2;

Returns
TypeDescription
boolean

Whether the hints field is set.

hasPremiumFeatures()

public boolean hasPremiumFeatures()

Configurations for premium OCR features.

.google.cloud.documentai.v1.OcrConfig.PremiumFeatures premium_features = 11;

Returns
TypeDescription
boolean

Whether the premiumFeatures field is set.

hashCode()

public int hashCode()
Returns
TypeDescription
int
Overrides

internalGetFieldAccessorTable()

protected GeneratedMessageV3.FieldAccessorTable internalGetFieldAccessorTable()
Returns
TypeDescription
FieldAccessorTable
Overrides

isInitialized()

public final boolean isInitialized()
Returns
TypeDescription
boolean
Overrides

newBuilderForType()

public OcrConfig.Builder newBuilderForType()
Returns
TypeDescription
OcrConfig.Builder

newBuilderForType(GeneratedMessageV3.BuilderParent parent)

protected OcrConfig.Builder newBuilderForType(GeneratedMessageV3.BuilderParent parent)
Parameter
NameDescription
parent BuilderParent
Returns
TypeDescription
OcrConfig.Builder
Overrides

newInstance(GeneratedMessageV3.UnusedPrivateParameter unused)

protected Object newInstance(GeneratedMessageV3.UnusedPrivateParameter unused)
Parameter
NameDescription
unused UnusedPrivateParameter
Returns
TypeDescription
Object
Overrides

toBuilder()

public OcrConfig.Builder toBuilder()
Returns
TypeDescription
OcrConfig.Builder

writeTo(CodedOutputStream output)

public void writeTo(CodedOutputStream output)
Parameter
NameDescription
output CodedOutputStream
Overrides
Exceptions
TypeDescription
IOException