- 3.56.0 (latest)
- 3.55.0
- 3.54.0
- 3.53.0
- 3.52.0
- 3.50.0
- 3.49.0
- 3.48.0
- 3.47.0
- 3.46.0
- 3.45.0
- 3.44.0
- 3.43.0
- 3.42.0
- 3.41.0
- 3.40.0
- 3.38.0
- 3.37.0
- 3.36.0
- 3.35.0
- 3.34.0
- 3.33.0
- 3.32.0
- 3.31.0
- 3.30.0
- 3.29.0
- 3.28.0
- 3.25.0
- 3.24.0
- 3.23.0
- 3.22.0
- 3.21.0
- 3.20.0
- 3.19.0
- 3.18.0
- 3.17.0
- 3.16.0
- 3.15.0
- 3.14.0
- 3.13.0
- 3.12.0
- 3.11.0
- 3.10.0
- 3.9.0
- 3.8.0
- 3.7.0
- 3.6.0
- 3.5.0
- 3.4.2
- 3.3.0
- 3.2.0
- 3.0.0
- 2.9.8
- 2.8.9
- 2.7.4
- 2.5.3
- 2.4.0
public static final class PredictionServiceGrpc.PredictionServiceBlockingStub extends AbstractBlockingStub<PredictionServiceGrpc.PredictionServiceBlockingStub>
A stub to allow clients to do synchronous rpc calls to service PredictionService.
A service for online predictions and explanations.
Inheritance
java.lang.Object > io.grpc.stub.AbstractStub > io.grpc.stub.AbstractBlockingStub > PredictionServiceGrpc.PredictionServiceBlockingStub
Methods
build(Channel channel, CallOptions callOptions)
protected PredictionServiceGrpc.PredictionServiceBlockingStub build(Channel channel, CallOptions callOptions)
Parameters | |
---|---|
Name | Description |
channel |
io.grpc.Channel |
callOptions |
io.grpc.CallOptions |
Returns | |
---|---|
Type | Description |
PredictionServiceGrpc.PredictionServiceBlockingStub |
chatCompletions(ChatCompletionsRequest request)
public Iterator<HttpBody> chatCompletions(ChatCompletionsRequest request)
Exposes an OpenAI-compatible endpoint for chat completions.
Parameter | |
---|---|
Name | Description |
request |
ChatCompletionsRequest |
Returns | |
---|---|
Type | Description |
Iterator<com.google.api.HttpBody> |
countTokens(CountTokensRequest request)
public CountTokensResponse countTokens(CountTokensRequest request)
Perform token counting.
Parameter | |
---|---|
Name | Description |
request |
CountTokensRequest |
Returns | |
---|---|
Type | Description |
CountTokensResponse |
directPredict(DirectPredictRequest request)
public DirectPredictResponse directPredict(DirectPredictRequest request)
Perform a unary online prediction request to a gRPC model server for Vertex first-party products and frameworks.
Parameter | |
---|---|
Name | Description |
request |
DirectPredictRequest |
Returns | |
---|---|
Type | Description |
DirectPredictResponse |
directRawPredict(DirectRawPredictRequest request)
public DirectRawPredictResponse directRawPredict(DirectRawPredictRequest request)
Perform a unary online prediction request to a gRPC model server for custom containers.
Parameter | |
---|---|
Name | Description |
request |
DirectRawPredictRequest |
Returns | |
---|---|
Type | Description |
DirectRawPredictResponse |
explain(ExplainRequest request)
public ExplainResponse explain(ExplainRequest request)
Perform an online explanation. If deployed_model_id is specified, the corresponding DeployedModel must have explanation_spec populated. If deployed_model_id is not specified, all DeployedModels must have explanation_spec populated.
Parameter | |
---|---|
Name | Description |
request |
ExplainRequest |
Returns | |
---|---|
Type | Description |
ExplainResponse |
generateContent(GenerateContentRequest request)
public GenerateContentResponse generateContent(GenerateContentRequest request)
Generate content with multimodal inputs.
Parameter | |
---|---|
Name | Description |
request |
GenerateContentRequest |
Returns | |
---|---|
Type | Description |
GenerateContentResponse |
predict(PredictRequest request)
public PredictResponse predict(PredictRequest request)
Perform an online prediction.
Parameter | |
---|---|
Name | Description |
request |
PredictRequest |
Returns | |
---|---|
Type | Description |
PredictResponse |
rawPredict(RawPredictRequest request)
public HttpBody rawPredict(RawPredictRequest request)
Perform an online prediction with an arbitrary HTTP payload. The response includes the following HTTP headers:
- X-Vertex-AI-Endpoint-Id: ID of the Endpoint that served this prediction.
- X-Vertex-AI-Deployed-Model-Id: ID of the Endpoint's DeployedModel that served this prediction.
Parameter | |
---|---|
Name | Description |
request |
RawPredictRequest |
Returns | |
---|---|
Type | Description |
com.google.api.HttpBody |
serverStreamingPredict(StreamingPredictRequest request)
public Iterator<StreamingPredictResponse> serverStreamingPredict(StreamingPredictRequest request)
Perform a server-side streaming online prediction request for Vertex LLM streaming.
Parameter | |
---|---|
Name | Description |
request |
StreamingPredictRequest |
Returns | |
---|---|
Type | Description |
Iterator<StreamingPredictResponse> |
streamGenerateContent(GenerateContentRequest request)
public Iterator<GenerateContentResponse> streamGenerateContent(GenerateContentRequest request)
Generate content with multimodal inputs with streaming support.
Parameter | |
---|---|
Name | Description |
request |
GenerateContentRequest |
Returns | |
---|---|
Type | Description |
Iterator<GenerateContentResponse> |