Struct ModelInferRequest

Source

pub struct ModelInferRequest {
    pub model_name: String,
    pub model_version: String,
    pub id: String,
    pub parameters: HashMap<String, InferParameter>,
    pub inputs: Vec<InferInputTensor>,
    pub outputs: Vec<InferRequestedOutputTensor>,
    pub raw_input_contents: Vec<Vec<u8>>,
}

Expand description

`message ModelInferRequest` — Request message for ModelInfer.

Fields§

§model_name: String

`string model_name` — The name of the model to use for inferencing.

§model_version: String

`string model_version` — The version of the model to use for inference. If not given, the latest (most recent) version of the model is used.

§id: String

`string id` — Optional identifier for the request. If specified, it will be returned in the response.

§parameters: HashMap<String, InferParameter>

`map<string, InferParameter> parameters` — Optional inference parameters.

§inputs: Vec<InferInputTensor>

`InferInputTensor inputs` (repeated) — The input tensors for the inference.

§outputs: Vec<InferRequestedOutputTensor>

`InferRequestedOutputTensor outputs` (repeated) — The requested output tensors for the inference. Optional; if not specified, all outputs specified in the model config will be returned.

§raw_input_contents: Vec<Vec<u8>>

`bytes raw_input_contents` — The data contained in an input tensor can be represented in "raw" bytes form or in the repeated type that matches the tensor's data type. Using the "raw" bytes form will typically allow higher performance due to the way protobuf allocation and reuse interacts with gRPC. For example, see https://github.com/grpc/grpc/issues/23231.

To use the raw representation, `raw_input_contents` must be initialized with data for each tensor in the same order as `inputs`. For each tensor, the size of this content must match what is expected by the tensor's shape and data type. The raw data must be the flattened, one-dimensional, row-major order of the tensor elements without any stride or padding between the elements. Note that the FP16 and BF16 data types must be represented as raw content, as there is no specific data type for a 16-bit float type.

If this field is specified, then `InferInputTensor::contents` must not be specified for any input tensor.

Struct ModelInferRequest

Fields§

Trait Implementations§

impl Clone for ModelInferRequest

fn clone(&self) -> ModelInferRequest

fn clone_from(&mut self, source: &Self)

impl Debug for ModelInferRequest

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl Default for ModelInferRequest

fn default() -> Self

impl Message for ModelInferRequest

fn encoded_len(&self) -> usize

fn clear(&mut self)

fn encode<B>(&self, buf: &mut B) -> Result<(), EncodeError> where B: BufMut, Self: Sized,

fn encode_to_vec(&self) -> Vec<u8> ⓘ where Self: Sized,

fn encode_length_delimited<B>(&self, buf: &mut B) -> Result<(), EncodeError> where B: BufMut, Self: Sized,

fn encode_length_delimited_to_vec(&self) -> Vec<u8> ⓘ where Self: Sized,

fn decode<B>(buf: B) -> Result<Self, DecodeError> where B: Buf, Self: Default,

fn decode_length_delimited<B>(buf: B) -> Result<Self, DecodeError> where B: Buf, Self: Default,

fn merge<B>(&mut self, buf: B) -> Result<(), DecodeError> where B: Buf, Self: Sized,

fn merge_length_delimited<B>(&mut self, buf: B) -> Result<(), DecodeError> where B: Buf, Self: Sized,

impl PartialEq for ModelInferRequest

fn eq(&self, other: &ModelInferRequest) -> bool

fn ne(&self, other: &Rhs) -> bool

impl StructuralPartialEq for ModelInferRequest

Auto Trait Implementations§

impl Freeze for ModelInferRequest

impl RefUnwindSafe for ModelInferRequest

impl Send for ModelInferRequest

impl Sync for ModelInferRequest

impl Unpin for ModelInferRequest

impl UnwindSafe for ModelInferRequest

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoRequest<T> for T

fn into_request(self) -> Request<T>

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct ModelInferRequest

fn encode<B>(&self, buf: &mut B) -> Result<(), EncodeError>
where B: BufMut, Self: Sized,

fn encode_to_vec(&self) -> Vec<u8> ⓘ
where Self: Sized,

fn encode_length_delimited<B>(&self, buf: &mut B) -> Result<(), EncodeError>
where B: BufMut, Self: Sized,

fn encode_length_delimited_to_vec(&self) -> Vec<u8> ⓘ
where Self: Sized,

fn decode<B>(buf: B) -> Result<Self, DecodeError>
where B: Buf, Self: Default,

fn decode_length_delimited<B>(buf: B) -> Result<Self, DecodeError>
where B: Buf, Self: Default,

fn merge<B>(&mut self, buf: B) -> Result<(), DecodeError>
where B: Buf, Self: Sized,

fn merge_length_delimited<B>(&mut self, buf: B) -> Result<(), DecodeError>
where B: Buf, Self: Sized,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,