pub struct ChatCompletionRequest {
pub model: String,
pub messages: Vec<ChatMessage>,
pub temperature: Option<f32>,
pub max_tokens: Option<u32>,
pub top_p: Option<f32>,
pub frequency_penalty: Option<f32>,
pub presence_penalty: Option<f32>,
pub stop: Option<Vec<String>>,
pub user: Option<String>,
pub provider: Option<String>,
pub stream: Option<bool>,
pub logit_bias: Option<Value>,
pub logprobs: Option<bool>,
pub top_logprobs: Option<u32>,
pub n: Option<u32>,
pub response_format: Option<ResponseFormat>,
pub tools: Option<Vec<Tool>>,
pub tool_choice: Option<ToolChoice>,
}
Represents a request to create a chat completion.
Fields
model: String
The identifier of the model to use for the completion (e.g., “gpt-4o”, “claude-sonnet-4”).
messages: Vec<ChatMessage>
A list of messages that form the conversation history.
temperature: Option<f32>
The sampling temperature to use, between 0.0 and 2.0. Higher values will make the output more random, while lower values will make it more focused and deterministic.
max_tokens: Option<u32>
The maximum number of tokens to generate in the completion.
top_p: Option<f32>
The nucleus sampling parameter. The model considers the results of the tokens with top_p probability mass, so 0.1 means only the tokens comprising the top 10% probability mass are considered.
frequency_penalty: Option<f32>
A penalty applied to new tokens based on their frequency in the text so far. It decreases the model’s likelihood of repeating the same line verbatim.
presence_penalty: Option<f32>
A penalty applied to new tokens based on whether they appear in the text so far. It increases the model’s likelihood of talking about new topics.
stop: Option<Vec<String>>
A list of sequences that will cause the model to stop generating further tokens.
user: Option<String>
A unique identifier representing your end-user, which can help in monitoring and tracking conversations.
provider: Option<String>
A hint to the router about which provider to use for the model.
stream: Option<bool>
If set to true, the response will be streamed as a series of events.
logit_bias: Option<Value>
Modifies the likelihood of specified tokens appearing in the completion.
logprobs: Option<bool>
Whether to return log probabilities of the output tokens.
top_logprobs: Option<u32>
An integer between 0 and 20 specifying the number of most likely tokens to return at each token position.
n: Option<u32>
How many chat completion choices to generate for each input message.
response_format: Option<ResponseFormat>
An object specifying the format that the model must output.
tools: Option<Vec<Tool>>
A list of tools the model may call.
tool_choice: Option<ToolChoice>
Controls which (if any) tool is called by the model.
Implementations
impl ChatCompletionRequest
pub fn new(model: impl Into<String>, messages: Vec<ChatMessage>) -> Self
Creates a new ChatCompletionRequest with the given model and messages.
Arguments
model - The identifier of the model to use.
messages - The list of messages for the conversation.
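A minimal sketch of the call shape of new(). The struct and ChatMessage definitions below are simplified stand-ins for illustration, not the crate’s actual definitions:

```rust
// Simplified stand-ins for the crate's types (illustration only).
#[derive(Clone)]
struct ChatMessage {
    role: String,
    content: String,
}

struct ChatCompletionRequest {
    model: String,
    messages: Vec<ChatMessage>,
}

impl ChatCompletionRequest {
    // Mirrors the documented signature: any Into<String> works for `model`.
    fn new(model: impl Into<String>, messages: Vec<ChatMessage>) -> Self {
        ChatCompletionRequest {
            model: model.into(),
            messages,
        }
    }
}

fn main() {
    let messages = vec![ChatMessage {
        role: "user".into(),
        content: "Hello".into(),
    }];
    let req = ChatCompletionRequest::new("gpt-4o", messages);
    assert_eq!(req.model, "gpt-4o");
    assert_eq!(req.messages.len(), 1);
}
```

Because model takes impl Into<String>, both &str literals and owned Strings are accepted without an explicit conversion at the call site.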
pub fn with_temperature(self, temperature: f32) -> Self
Sets the temperature for the chat completion.
The temperature is clamped between 0.0 and 2.0.
Arguments
temperature - The sampling temperature.
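The clamping rule described above can be sketched with f32::clamp; this is an illustration of the documented behavior, not the crate’s code:

```rust
// Sketch of the documented clamping: values outside [0.0, 2.0]
// are pulled to the nearest bound before being stored.
fn clamp_temperature(t: f32) -> f32 {
    t.clamp(0.0, 2.0)
}

fn main() {
    assert_eq!(clamp_temperature(2.5), 2.0); // above range -> upper bound
    assert_eq!(clamp_temperature(-0.1), 0.0); // below range -> lower bound
    assert_eq!(clamp_temperature(0.7), 0.7); // in range -> unchanged
}
```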
pub fn with_max_tokens(self, max_tokens: u32) -> Self
Sets the maximum number of tokens to generate.
Arguments
max_tokens - The maximum number of tokens.
pub fn with_user(self, user: impl Into<String>) -> Self
Sets the user identifier for the chat completion.
Arguments
user - A unique identifier for the end-user.
pub fn with_provider(self, provider: impl Into<String>) -> Self
Sets the provider hint for the chat completion.
Arguments
provider - A hint to the router about which provider to use.
pub fn with_stream(self, stream: bool) -> Self
Enables or disables streaming for the response.
Arguments
stream - true to enable streaming, false to disable.
pub fn with_logit_bias(self, logit_bias: Value) -> Self
Sets the logit bias for the chat completion.
Arguments
logit_bias - A map of token IDs to bias values.
pub fn with_logprobs(self, logprobs: bool) -> Self
Enables or disables log probabilities for the response.
Arguments
logprobs - true to include log probabilities.
pub fn with_top_logprobs(self, top_logprobs: u32) -> Self
Sets the number of most likely tokens to return at each position.
Arguments
top_logprobs - The number of top log probabilities to return.
pub fn with_n(self, n: u32) -> Self
Sets the number of chat completion choices to generate.
Arguments
n - The number of completions to generate.
pub fn with_response_format(self, response_format: ResponseFormat) -> Self
Sets the response format for the chat completion.
Arguments
response_format - The format the model must output.
pub fn with_tools(self, tools: Vec<Tool>) -> Self
Sets the list of tools the model may call.
pub fn with_tool_choice(self, tool_choice: ToolChoice) -> Self
Sets the tool choice for the chat completion.
Arguments
tool_choice - Controls which tool the model uses.
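All of the with_* methods above follow the same consuming-builder pattern: each takes self by value, sets one optional field, and returns Self so calls can chain. A simplified stand-in (not the crate’s definition, and covering only two of the fields) showing the pattern:

```rust
// Simplified stand-in illustrating the consuming-builder pattern
// used by the with_* methods (illustration only).
#[derive(Default)]
struct Request {
    model: String,
    temperature: Option<f32>,
    max_tokens: Option<u32>,
}

impl Request {
    fn new(model: impl Into<String>) -> Self {
        Request {
            model: model.into(),
            ..Default::default()
        }
    }

    // Takes self by value and returns Self, enabling chaining.
    fn with_temperature(mut self, temperature: f32) -> Self {
        // Clamp to the documented [0.0, 2.0] range.
        self.temperature = Some(temperature.clamp(0.0, 2.0));
        self
    }

    fn with_max_tokens(mut self, max_tokens: u32) -> Self {
        self.max_tokens = Some(max_tokens);
        self
    }
}

fn main() {
    let req = Request::new("gpt-4o")
        .with_temperature(0.7)
        .with_max_tokens(256);
    assert_eq!(req.model, "gpt-4o");
    assert_eq!(req.temperature, Some(0.7));
    assert_eq!(req.max_tokens, Some(256));
}
```

Because every setter consumes and returns the request, unset fields stay None and are typically skipped during serialization.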
pub fn validate_openai_compatibility(&self) -> Result<(), String>
Validates that the request parameters are compatible with OpenAI standards.
This method checks parameter ranges and values to ensure they match OpenAI’s API specifications.
Returns
A Result indicating whether the request is valid for OpenAI compatibility.
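A hedged sketch of the kind of range checks such validation might perform, based on the ranges documented for the fields above (temperature in [0.0, 2.0], top_logprobs in [0, 20]); the crate’s actual rules may differ:

```rust
// Illustrative validation of two documented parameter ranges
// (not the crate's implementation).
fn validate(temperature: Option<f32>, top_logprobs: Option<u32>) -> Result<(), String> {
    if let Some(t) = temperature {
        // Documented range for temperature is [0.0, 2.0].
        if !(0.0..=2.0).contains(&t) {
            return Err(format!("temperature {t} out of range [0.0, 2.0]"));
        }
    }
    if let Some(k) = top_logprobs {
        // Documented maximum for top_logprobs is 20.
        if k > 20 {
            return Err(format!("top_logprobs {k} exceeds maximum of 20"));
        }
    }
    Ok(())
}

fn main() {
    assert!(validate(Some(0.5), Some(5)).is_ok());
    assert!(validate(Some(3.0), None).is_err());
    assert!(validate(None, Some(21)).is_err());
    assert!(validate(None, None).is_ok()); // unset fields are not checked
}
```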
Trait Implementations
impl Clone for ChatCompletionRequest
fn clone(&self) -> ChatCompletionRequest
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source.