Package inference
Class GRPCInferenceServiceGrpc.GRPCInferenceServiceFutureStub
java.lang.Object
io.grpc.stub.AbstractStub<GRPCInferenceServiceGrpc.GRPCInferenceServiceFutureStub>
io.grpc.stub.AbstractFutureStub<GRPCInferenceServiceGrpc.GRPCInferenceServiceFutureStub>
inference.GRPCInferenceServiceGrpc.GRPCInferenceServiceFutureStub
- Enclosing class:
GRPCInferenceServiceGrpc
public static final class GRPCInferenceServiceGrpc.GRPCInferenceServiceFutureStub
extends io.grpc.stub.AbstractFutureStub<GRPCInferenceServiceGrpc.GRPCInferenceServiceFutureStub>
A stub to allow clients to do ListenableFuture-style rpc calls to service GRPCInferenceService.
Proto service: InferenceService
Inference Server GRPC endpoints.
-
Nested Class Summary
Nested classes/interfaces inherited from class io.grpc.stub.AbstractStub
io.grpc.stub.AbstractStub.StubFactory<T extends io.grpc.stub.AbstractStub<T>> -
Method Summary
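Modifier and Type | Method | Description
protected GRPCInferenceServiceGrpc.GRPCInferenceServiceFutureStub | build(io.grpc.Channel channel, io.grpc.CallOptions callOptions) |
com.google.common.util.concurrent.ListenableFuture<GrpcService.CudaSharedMemoryRegisterResponse> | cudaSharedMemoryRegister(GrpcService.CudaSharedMemoryRegisterRequest request) |
com.google.common.util.concurrent.ListenableFuture<GrpcService.CudaSharedMemoryStatusResponse> | cudaSharedMemoryStatus(GrpcService.CudaSharedMemoryStatusRequest request) |
com.google.common.util.concurrent.ListenableFuture<GrpcService.CudaSharedMemoryUnregisterResponse> | cudaSharedMemoryUnregister(GrpcService.CudaSharedMemoryUnregisterRequest request) |
com.google.common.util.concurrent.ListenableFuture<GrpcService.LogSettingsResponse> | logSettings(GrpcService.LogSettingsRequest request) | Update and get the log settings of the Triton server.
com.google.common.util.concurrent.ListenableFuture<GrpcService.ModelConfigResponse> | modelConfig(GrpcService.ModelConfigRequest request) | Get model configuration.
com.google.common.util.concurrent.ListenableFuture<GrpcService.ModelInferResponse> | modelInfer(GrpcService.ModelInferRequest request) | Perform inference using a specific model.
com.google.common.util.concurrent.ListenableFuture<GrpcService.ModelMetadataResponse> | modelMetadata(GrpcService.ModelMetadataRequest request) | Get model metadata.
com.google.common.util.concurrent.ListenableFuture<GrpcService.ModelReadyResponse> | modelReady(GrpcService.ModelReadyRequest request) | Check readiness of a model in the inference server.
com.google.common.util.concurrent.ListenableFuture<GrpcService.ModelStatisticsResponse> | modelStatistics(GrpcService.ModelStatisticsRequest request) | Get the cumulative inference statistics for a model.
com.google.common.util.concurrent.ListenableFuture<GrpcService.RepositoryIndexResponse> | repositoryIndex(GrpcService.RepositoryIndexRequest request) | Get the index of model repository contents.
com.google.common.util.concurrent.ListenableFuture<GrpcService.RepositoryModelLoadResponse> | repositoryModelLoad(GrpcService.RepositoryModelLoadRequest request) | Load or reload a model from a repository.
com.google.common.util.concurrent.ListenableFuture<GrpcService.RepositoryModelUnloadResponse> | repositoryModelUnload(GrpcService.RepositoryModelUnloadRequest request) | Unload a model.
com.google.common.util.concurrent.ListenableFuture<GrpcService.ServerLiveResponse> | serverLive(GrpcService.ServerLiveRequest request) | Check liveness of the inference server.
com.google.common.util.concurrent.ListenableFuture<GrpcService.ServerMetadataResponse> | serverMetadata(GrpcService.ServerMetadataRequest request) | Get server metadata.
com.google.common.util.concurrent.ListenableFuture<GrpcService.ServerReadyResponse> | serverReady(GrpcService.ServerReadyRequest request) | Check readiness of the inference server.
com.google.common.util.concurrent.ListenableFuture<GrpcService.SystemSharedMemoryRegisterResponse> | systemSharedMemoryRegister(GrpcService.SystemSharedMemoryRegisterRequest request) |
com.google.common.util.concurrent.ListenableFuture<GrpcService.SystemSharedMemoryStatusResponse> | systemSharedMemoryStatus(GrpcService.SystemSharedMemoryStatusRequest request) |
com.google.common.util.concurrent.ListenableFuture<GrpcService.SystemSharedMemoryUnregisterResponse> | systemSharedMemoryUnregister(GrpcService.SystemSharedMemoryUnregisterRequest request) |
com.google.common.util.concurrent.ListenableFuture<GrpcService.TraceSettingResponse> | traceSetting(GrpcService.TraceSettingRequest request) | Update and get the trace setting of the Triton server.
Methods inherited from class io.grpc.stub.AbstractFutureStub
newStub, newStub
Methods inherited from class io.grpc.stub.AbstractStub
getCallOptions, getChannel, withCallCredentials, withChannel, withCompression, withDeadline, withDeadlineAfter, withExecutor, withInterceptors, withMaxInboundMessageSize, withMaxOutboundMessageSize, withOption, withWaitForReady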
-
Method Details
-
build
protected GRPCInferenceServiceGrpc.GRPCInferenceServiceFutureStub build(io.grpc.Channel channel, io.grpc.CallOptions callOptions)
- Specified by:
build in class io.grpc.stub.AbstractStub<GRPCInferenceServiceGrpc.GRPCInferenceServiceFutureStub>
-
serverLive
public com.google.common.util.concurrent.ListenableFuture<GrpcService.ServerLiveResponse> serverLive(GrpcService.ServerLiveRequest request)
RPC: ServerLive(ServerLiveRequest) returns (ServerLiveResponse)
Check liveness of the inference server.
-
serverReady
public com.google.common.util.concurrent.ListenableFuture<GrpcService.ServerReadyResponse> serverReady(GrpcService.ServerReadyRequest request)
RPC: ServerReady(ServerReadyRequest) returns (ServerReadyResponse)
Check readiness of the inference server.
-
modelReady
public com.google.common.util.concurrent.ListenableFuture<GrpcService.ModelReadyResponse> modelReady(GrpcService.ModelReadyRequest request)
RPC: ModelReady(ModelReadyRequest) returns (ModelReadyResponse)
Check readiness of a model in the inference server.
-
serverMetadata
public com.google.common.util.concurrent.ListenableFuture<GrpcService.ServerMetadataResponse> serverMetadata(GrpcService.ServerMetadataRequest request)
RPC: ServerMetadata(ServerMetadataRequest) returns (ServerMetadataResponse)
Get server metadata.
-
modelMetadata
public com.google.common.util.concurrent.ListenableFuture<GrpcService.ModelMetadataResponse> modelMetadata(GrpcService.ModelMetadataRequest request)
RPC: ModelMetadata(ModelMetadataRequest) returns (ModelMetadataResponse)
Get model metadata.
-
modelInfer
public com.google.common.util.concurrent.ListenableFuture<GrpcService.ModelInferResponse> modelInfer(GrpcService.ModelInferRequest request)
RPC: ModelInfer(ModelInferRequest) returns (ModelInferResponse)
Perform inference using a specific model.
-
modelConfig
public com.google.common.util.concurrent.ListenableFuture<GrpcService.ModelConfigResponse> modelConfig(GrpcService.ModelConfigRequest request)
RPC: ModelConfig(ModelConfigRequest) returns (ModelConfigResponse)
Get model configuration.
-
modelStatistics
public com.google.common.util.concurrent.ListenableFuture<GrpcService.ModelStatisticsResponse> modelStatistics(GrpcService.ModelStatisticsRequest request)
RPC: ModelStatistics(ModelStatisticsRequest) returns (ModelStatisticsResponse)
Get the cumulative inference statistics for a model.
-
repositoryIndex
public com.google.common.util.concurrent.ListenableFuture<GrpcService.RepositoryIndexResponse> repositoryIndex(GrpcService.RepositoryIndexRequest request)
RPC: RepositoryIndex(RepositoryIndexRequest) returns (RepositoryIndexResponse)
Get the index of model repository contents.
-
repositoryModelLoad
public com.google.common.util.concurrent.ListenableFuture<GrpcService.RepositoryModelLoadResponse> repositoryModelLoad(GrpcService.RepositoryModelLoadRequest request)
RPC: RepositoryModelLoad(RepositoryModelLoadRequest) returns (RepositoryModelLoadResponse)
Load or reload a model from a repository.
-
repositoryModelUnload
public com.google.common.util.concurrent.ListenableFuture<GrpcService.RepositoryModelUnloadResponse> repositoryModelUnload(GrpcService.RepositoryModelUnloadRequest request)
RPC: RepositoryModelUnload(RepositoryModelUnloadRequest) returns (RepositoryModelUnloadResponse)
Unload a model.
-
traceSetting
public com.google.common.util.concurrent.ListenableFuture<GrpcService.TraceSettingResponse> traceSetting(GrpcService.TraceSettingRequest request)
RPC: TraceSetting(TraceSettingRequest) returns (TraceSettingResponse)
Update and get the trace setting of the Triton server.
-
logSettings
public com.google.common.util.concurrent.ListenableFuture<GrpcService.LogSettingsResponse> logSettings(GrpcService.LogSettingsRequest request)
RPC: LogSettings(LogSettingsRequest) returns (LogSettingsResponse)
Update and get the log settings of the Triton server.
-