pub struct ModelRateLimiter {
pub resources: Vec<Resource>,
pub priority: u32,
}
Expand description
Message `ModelRateLimiter`: the specifications required by the rate limiter to properly schedule the inference requests across the different models and their instances.
Fields§
§resources: Vec<Resource>
`Resource resources` (repeated): The resources required to execute the request on a model instance. Resources are just names with a corresponding count. The execution of the instance will be blocked until the specified resources are available. By default an instance uses no rate-limiter resources.
priority: u32
`uint32 priority`: The optional weighting value to be used for prioritizing across instances. An instance with priority 2 will be given 1/2 the number of scheduling chances as an instance_group with priority 1. The default priority is 1. A priority value of 0 will be treated as priority 1.
Trait Implementations§
Source§impl Clone for ModelRateLimiter
impl Clone for ModelRateLimiter
Source§fn clone(&self) -> ModelRateLimiter
fn clone(&self) -> ModelRateLimiter
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from `source`. Read more
Source§impl Debug for ModelRateLimiter
impl Debug for ModelRateLimiter
Source§impl Default for ModelRateLimiter
impl Default for ModelRateLimiter
Source§impl Message for ModelRateLimiter
impl Message for ModelRateLimiter
Source§fn encoded_len(&self) -> usize
fn encoded_len(&self) -> usize
Source§fn encode<B>(&self, buf: &mut B) -> Result<(), EncodeError>
fn encode<B>(&self, buf: &mut B) -> Result<(), EncodeError>
Source§fn encode_to_vec(&self) -> Vec<u8> ⓘwhere
Self: Sized,
fn encode_to_vec(&self) -> Vec<u8> ⓘwhere
Self: Sized,
Source§fn encode_length_delimited<B>(&self, buf: &mut B) -> Result<(), EncodeError>
fn encode_length_delimited<B>(&self, buf: &mut B) -> Result<(), EncodeError>
Source§fn encode_length_delimited_to_vec(&self) -> Vec<u8> ⓘwhere
Self: Sized,
fn encode_length_delimited_to_vec(&self) -> Vec<u8> ⓘwhere
Self: Sized,
Source§fn decode<B>(buf: B) -> Result<Self, DecodeError>
fn decode<B>(buf: B) -> Result<Self, DecodeError>
Source§fn decode_length_delimited<B>(buf: B) -> Result<Self, DecodeError>
fn decode_length_delimited<B>(buf: B) -> Result<Self, DecodeError>
Source§fn merge<B>(&mut self, buf: B) -> Result<(), DecodeError>
fn merge<B>(&mut self, buf: B) -> Result<(), DecodeError>
Decodes an instance of the message from a buffer, and merges it into `self`. Read more
Source§fn merge_length_delimited<B>(&mut self, buf: B) -> Result<(), DecodeError>
fn merge_length_delimited<B>(&mut self, buf: B) -> Result<(), DecodeError>
Decodes a length-delimited instance of the message from buffer, and merges it into `self`.
Source§impl PartialEq for ModelRateLimiter
impl PartialEq for ModelRateLimiter
impl StructuralPartialEq for ModelRateLimiter
Auto Trait Implementations§
impl Freeze for ModelRateLimiter
impl RefUnwindSafe for ModelRateLimiter
impl Send for ModelRateLimiter
impl Sync for ModelRateLimiter
impl Unpin for ModelRateLimiter
impl UnwindSafe for ModelRateLimiter
Blanket Implementations§
Source§impl<T> BorrowMut<T> for Twhere
T: ?Sized,
impl<T> BorrowMut<T> for Twhere
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Source§impl<T> CloneToUninit for Twhere
T: Clone,
impl<T> CloneToUninit for Twhere
T: Clone,
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoRequest<T> for T
impl<T> IntoRequest<T> for T
Source§fn into_request(self) -> Request<T>
fn into_request(self) -> Request<T>
Wrap the input message `T` in a `tonic::Request`