pub struct GrpcInferenceServiceClient<T> { /* private fields */ }
Expand description
@@ @@.. cpp:var:: service InferenceService @@ @@ Inference Server GRPC endpoints. @@
Implementations§
Source§impl<T> GrpcInferenceServiceClient<T>where
T: GrpcService<BoxBody>,
T::Error: Into<StdError>,
T::ResponseBody: Body<Data = Bytes> + Send + 'static,
<T::ResponseBody as Body>::Error: Into<StdError> + Send,
impl<T> GrpcInferenceServiceClient<T>where
T: GrpcService<BoxBody>,
T::Error: Into<StdError>,
T::ResponseBody: Body<Data = Bytes> + Send + 'static,
<T::ResponseBody as Body>::Error: Into<StdError> + Send,
pub fn new(inner: T) -> Self
pub fn with_interceptor<F>(
inner: T,
interceptor: F,
) -> GrpcInferenceServiceClient<InterceptedService<T, F>>where
F: Interceptor,
T::ResponseBody: Default,
T: Service<Request<BoxBody>, Response = Response<<T as GrpcService<BoxBody>>::ResponseBody>>,
<T as Service<Request<BoxBody>>>::Error: Into<StdError> + Send + Sync,
Sourcepub fn send_gzip(self) -> Self
pub fn send_gzip(self) -> Self
Compress requests with `gzip`.
This requires the server to support it; otherwise it might respond with an error.
Sourcepub fn accept_gzip(self) -> Self
pub fn accept_gzip(self) -> Self
Enable decompressing responses with `gzip`.
Sourcepub async fn server_live(
&mut self,
request: impl IntoRequest<ServerLiveRequest>,
) -> Result<Response<ServerLiveResponse>, Status>
pub async fn server_live( &mut self, request: impl IntoRequest<ServerLiveRequest>, ) -> Result<Response<ServerLiveResponse>, Status>
@@ .. cpp:var:: rpc ServerLive(ServerLiveRequest) returns @@ (ServerLiveResponse) @@ @@ Check liveness of the inference server. @@
Sourcepub async fn server_ready(
&mut self,
request: impl IntoRequest<ServerReadyRequest>,
) -> Result<Response<ServerReadyResponse>, Status>
pub async fn server_ready( &mut self, request: impl IntoRequest<ServerReadyRequest>, ) -> Result<Response<ServerReadyResponse>, Status>
@@ .. cpp:var:: rpc ServerReady(ServerReadyRequest) returns @@ (ServerReadyResponse) @@ @@ Check readiness of the inference server. @@
Sourcepub async fn model_ready(
&mut self,
request: impl IntoRequest<ModelReadyRequest>,
) -> Result<Response<ModelReadyResponse>, Status>
pub async fn model_ready( &mut self, request: impl IntoRequest<ModelReadyRequest>, ) -> Result<Response<ModelReadyResponse>, Status>
@@ .. cpp:var:: rpc ModelReady(ModelReadyRequest) returns @@ (ModelReadyResponse) @@ @@ Check readiness of a model in the inference server. @@
Sourcepub async fn server_metadata(
&mut self,
request: impl IntoRequest<ServerMetadataRequest>,
) -> Result<Response<ServerMetadataResponse>, Status>
pub async fn server_metadata( &mut self, request: impl IntoRequest<ServerMetadataRequest>, ) -> Result<Response<ServerMetadataResponse>, Status>
@@ .. cpp:var:: rpc ServerMetadata(ServerMetadataRequest) returns @@ (ServerMetadataResponse) @@ @@ Get server metadata. @@
Sourcepub async fn model_metadata(
&mut self,
request: impl IntoRequest<ModelMetadataRequest>,
) -> Result<Response<ModelMetadataResponse>, Status>
pub async fn model_metadata( &mut self, request: impl IntoRequest<ModelMetadataRequest>, ) -> Result<Response<ModelMetadataResponse>, Status>
@@ .. cpp:var:: rpc ModelMetadata(ModelMetadataRequest) returns @@ (ModelMetadataResponse) @@ @@ Get model metadata. @@
Sourcepub async fn model_infer(
&mut self,
request: impl IntoRequest<ModelInferRequest>,
) -> Result<Response<ModelInferResponse>, Status>
pub async fn model_infer( &mut self, request: impl IntoRequest<ModelInferRequest>, ) -> Result<Response<ModelInferResponse>, Status>
@@ .. cpp:var:: rpc ModelInfer(ModelInferRequest) returns @@ (ModelInferResponse) @@ @@ Perform inference using a specific model. @@
Sourcepub async fn model_stream_infer(
&mut self,
request: impl IntoStreamingRequest<Message = ModelInferRequest>,
) -> Result<Response<Streaming<ModelStreamInferResponse>>, Status>
pub async fn model_stream_infer( &mut self, request: impl IntoStreamingRequest<Message = ModelInferRequest>, ) -> Result<Response<Streaming<ModelStreamInferResponse>>, Status>
@@ .. cpp:var:: rpc ModelStreamInfer(stream ModelInferRequest) returns @@ (stream ModelStreamInferResponse) @@ @@ Perform streaming inference. @@
Sourcepub async fn model_config(
&mut self,
request: impl IntoRequest<ModelConfigRequest>,
) -> Result<Response<ModelConfigResponse>, Status>
pub async fn model_config( &mut self, request: impl IntoRequest<ModelConfigRequest>, ) -> Result<Response<ModelConfigResponse>, Status>
@@ .. cpp:var:: rpc ModelConfig(ModelConfigRequest) returns @@ (ModelConfigResponse) @@ @@ Get model configuration. @@
Sourcepub async fn model_statistics(
&mut self,
request: impl IntoRequest<ModelStatisticsRequest>,
) -> Result<Response<ModelStatisticsResponse>, Status>
pub async fn model_statistics( &mut self, request: impl IntoRequest<ModelStatisticsRequest>, ) -> Result<Response<ModelStatisticsResponse>, Status>
@@ .. cpp:var:: rpc ModelStatistics( @@ ModelStatisticsRequest) @@ returns (ModelStatisticsResponse) @@ @@ Get the cumulative inference statistics for a model. @@
Sourcepub async fn repository_index(
&mut self,
request: impl IntoRequest<RepositoryIndexRequest>,
) -> Result<Response<RepositoryIndexResponse>, Status>
pub async fn repository_index( &mut self, request: impl IntoRequest<RepositoryIndexRequest>, ) -> Result<Response<RepositoryIndexResponse>, Status>
@@ .. cpp:var:: rpc RepositoryIndex(RepositoryIndexRequest) returns @@ (RepositoryIndexResponse) @@ @@ Get the index of model repository contents. @@
Sourcepub async fn repository_model_load(
&mut self,
request: impl IntoRequest<RepositoryModelLoadRequest>,
) -> Result<Response<RepositoryModelLoadResponse>, Status>
pub async fn repository_model_load( &mut self, request: impl IntoRequest<RepositoryModelLoadRequest>, ) -> Result<Response<RepositoryModelLoadResponse>, Status>
@@ .. cpp:var:: rpc RepositoryModelLoad(RepositoryModelLoadRequest) returns @@ (RepositoryModelLoadResponse) @@ @@ Load or reload a model from a repository. @@
Sourcepub async fn repository_model_unload(
&mut self,
request: impl IntoRequest<RepositoryModelUnloadRequest>,
) -> Result<Response<RepositoryModelUnloadResponse>, Status>
pub async fn repository_model_unload( &mut self, request: impl IntoRequest<RepositoryModelUnloadRequest>, ) -> Result<Response<RepositoryModelUnloadResponse>, Status>
@@ .. cpp:var:: rpc RepositoryModelUnload(RepositoryModelUnloadRequest) @@ returns (RepositoryModelUnloadResponse) @@ @@ Unload a model. @@
@@ .. cpp:var:: rpc SystemSharedMemoryStatus( @@ SystemSharedMemoryStatusRequest) @@ returns (SystemSharedMemoryStatusResponse) @@ @@ Get the status of all registered system-shared-memory regions. @@
@@ .. cpp:var:: rpc SystemSharedMemoryRegister( @@ SystemSharedMemoryRegisterRequest) @@ returns (SystemSharedMemoryRegisterResponse) @@ @@ Register a system-shared-memory region. @@
@@ .. cpp:var:: rpc SystemSharedMemoryUnregister( @@ SystemSharedMemoryUnregisterRequest) @@ returns (SystemSharedMemoryUnregisterResponse) @@ @@ Unregister a system-shared-memory region. @@
@@ .. cpp:var:: rpc CudaSharedMemoryStatus( @@ CudaSharedMemoryStatusRequest) @@ returns (CudaSharedMemoryStatusResponse) @@ @@ Get the status of all registered CUDA-shared-memory regions. @@
@@ .. cpp:var:: rpc CudaSharedMemoryRegister( @@ CudaSharedMemoryRegisterRequest) @@ returns (CudaSharedMemoryRegisterResponse) @@ @@ Register a CUDA-shared-memory region. @@
@@ .. cpp:var:: rpc CudaSharedMemoryUnregister( @@ CudaSharedMemoryUnregisterRequest) @@ returns (CudaSharedMemoryUnregisterResponse) @@ @@ Unregister a CUDA-shared-memory region. @@
Sourcepub async fn trace_setting(
&mut self,
request: impl IntoRequest<TraceSettingRequest>,
) -> Result<Response<TraceSettingResponse>, Status>
pub async fn trace_setting( &mut self, request: impl IntoRequest<TraceSettingRequest>, ) -> Result<Response<TraceSettingResponse>, Status>
@@ .. cpp:var:: rpc TraceSetting(TraceSettingRequest) @@ returns (TraceSettingResponse) @@ @@ Update and get the trace setting of the Triton server. @@
Trait Implementations§
Source§impl<T: Clone> Clone for GrpcInferenceServiceClient<T>
impl<T: Clone> Clone for GrpcInferenceServiceClient<T>
Source§fn clone(&self) -> GrpcInferenceServiceClient<T>
fn clone(&self) -> GrpcInferenceServiceClient<T>
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from `source`. Read more
Auto Trait Implementations§
impl<T> Freeze for GrpcInferenceServiceClient<T>where
T: Freeze,
impl<T> RefUnwindSafe for GrpcInferenceServiceClient<T>where
T: RefUnwindSafe,
impl<T> Send for GrpcInferenceServiceClient<T>where
T: Send,
impl<T> Sync for GrpcInferenceServiceClient<T>where
T: Sync,
impl<T> Unpin for GrpcInferenceServiceClient<T>where
T: Unpin,
impl<T> UnwindSafe for GrpcInferenceServiceClient<T>where
T: UnwindSafe,
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Source§impl<T> CloneToUninit for T where
T: Clone,
impl<T> CloneToUninit for T where
T: Clone,
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoRequest<T> for T
impl<T> IntoRequest<T> for T
Source§fn into_request(self) -> Request<T>
fn into_request(self) -> Request<T>
Wrap the input message `T` in a `tonic::Request`