public
static
interface
PredictionServiceGrpc
.
AsyncService
A service for online predictions and explanations.
Methods
directPredict(DirectPredictRequest request, StreamObserver<DirectPredictResponse> responseObserver)
public
default
void
directPredict
(
DirectPredictRequest
request
,
StreamObserver<DirectPredictResponse>
responseObserver
)
Perform a unary online prediction request to a gRPC model server for Vertex first-party products and frameworks.
request
responseObserver
io.grpc.stub.StreamObserver
< DirectPredictResponse
>
directRawPredict(DirectRawPredictRequest request, StreamObserver<DirectRawPredictResponse> responseObserver)
public
default
void
directRawPredict
(
DirectRawPredictRequest
request
,
StreamObserver<DirectRawPredictResponse>
responseObserver
)
Perform a unary online prediction request to a gRPC model server for custom containers.
request
responseObserver
io.grpc.stub.StreamObserver
< DirectRawPredictResponse
>
explain(ExplainRequest request, StreamObserver<ExplainResponse> responseObserver)
public
default
void
explain
(
ExplainRequest
request
,
StreamObserver<ExplainResponse>
responseObserver
)
Perform an online explanation. If deployed_model_id is specified, the corresponding DeployedModel must have explanation_spec populated. If deployed_model_id is not specified, all DeployedModels must have explanation_spec populated.
request
responseObserver
io.grpc.stub.StreamObserver
< ExplainResponse
>
generateContent(GenerateContentRequest request, StreamObserver<GenerateContentResponse> responseObserver)
public
default
void
generateContent
(
GenerateContentRequest
request
,
StreamObserver<GenerateContentResponse>
responseObserver
)
Generate content with multimodal inputs.
request
responseObserver
io.grpc.stub.StreamObserver
< GenerateContentResponse
>
predict(PredictRequest request, StreamObserver<PredictResponse> responseObserver)
public
default
void
predict
(
PredictRequest
request
,
StreamObserver<PredictResponse>
responseObserver
)
Perform an online prediction.
request
responseObserver
io.grpc.stub.StreamObserver
< PredictResponse
>
rawPredict(RawPredictRequest request, StreamObserver<HttpBody> responseObserver)
public
default
void
rawPredict
(
RawPredictRequest
request
,
StreamObserver<HttpBody>
responseObserver
)
Perform an online prediction with an arbitrary HTTP payload. The response includes the following HTTP headers:
- X-Vertex-AI-Endpoint-Id: ID of the Endpoint that served this prediction.
- X-Vertex-AI-Deployed-Model-Id: ID of the Endpoint's DeployedModel that served this prediction.
request
responseObserver
io.grpc.stub.StreamObserver
< com.google.api.HttpBody
>
serverStreamingPredict(StreamingPredictRequest request, StreamObserver<StreamingPredictResponse> responseObserver)
public
default
void
serverStreamingPredict
(
StreamingPredictRequest
request
,
StreamObserver<StreamingPredictResponse>
responseObserver
)
Perform a server-side streaming online prediction request for Vertex LLM streaming.
request
responseObserver
io.grpc.stub.StreamObserver
< StreamingPredictResponse
>
streamDirectPredict(StreamObserver<StreamDirectPredictResponse> responseObserver)
public
default
StreamObserver<StreamDirectPredictRequest>
streamDirectPredict
(
StreamObserver<StreamDirectPredictResponse>
responseObserver
)
Perform a streaming online prediction request to a gRPC model server for Vertex first-party products and frameworks.
responseObserver
io.grpc.stub.StreamObserver
< StreamDirectPredictResponse
>
streamDirectRawPredict(StreamObserver<StreamDirectRawPredictResponse> responseObserver)
public
default
StreamObserver<StreamDirectRawPredictRequest>
streamDirectRawPredict
(
StreamObserver<StreamDirectRawPredictResponse>
responseObserver
)
Perform a streaming online prediction request to a gRPC model server for custom containers.
responseObserver
io.grpc.stub.StreamObserver
< StreamDirectRawPredictResponse
>
streamGenerateContent(GenerateContentRequest request, StreamObserver<GenerateContentResponse> responseObserver)
public
default
void
streamGenerateContent
(
GenerateContentRequest
request
,
StreamObserver<GenerateContentResponse>
responseObserver
)
Generate content with multimodal inputs with streaming support.
request
responseObserver
io.grpc.stub.StreamObserver
< GenerateContentResponse
>
streamRawPredict(StreamRawPredictRequest request, StreamObserver<HttpBody> responseObserver)
public
default
void
streamRawPredict
(
StreamRawPredictRequest
request
,
StreamObserver<HttpBody>
responseObserver
)
Perform a streaming online prediction with an arbitrary HTTP payload.
request
responseObserver
io.grpc.stub.StreamObserver
< com.google.api.HttpBody
>
streamingPredict(StreamObserver<StreamingPredictResponse> responseObserver)
public
default
StreamObserver<StreamingPredictRequest>
streamingPredict
(
StreamObserver<StreamingPredictResponse>
responseObserver
)
Perform a streaming online prediction request for Vertex first-party products and frameworks.
responseObserver
io.grpc.stub.StreamObserver
< StreamingPredictResponse
>
streamingRawPredict(StreamObserver<StreamingRawPredictResponse> responseObserver)
public
default
StreamObserver<StreamingRawPredictRequest>
streamingRawPredict
(
StreamObserver<StreamingRawPredictResponse>
responseObserver
)
Perform a streaming online prediction request through gRPC.
responseObserver
io.grpc.stub.StreamObserver
< StreamingRawPredictResponse
>