Struct ModelPricing

Source

pub struct ModelPricing {
    pub input_per_million: f64,
    pub output_per_million: f64,
    pub cached_input_per_million: Option<f64>,
    pub cache_write_per_million: Option<f64>,
    pub batch_input_per_million: Option<f64>,
    pub batch_output_per_million: Option<f64>,
    pub flex_input_per_million: Option<f64>,
    pub flex_output_per_million: Option<f64>,
    pub prompt_cache_min_tokens: Option<u32>,
    pub effective_at: DateTime<Utc>,
}

Fields§

§input_per_million: f64

USD per 1M input tokens.

§output_per_million: f64

USD per 1M output tokens.

§cached_input_per_million: Option<f64>

USD per 1M cached input tokens (billed at roughly 10% of the standard input rate by Anthropic, OpenAI, and Gemini).

§cache_write_per_million: Option<f64>

USD per 1M cache-creation (cache-write) input tokens. Anthropic charges ~1.25× the base input rate for tokens written to the prompt cache. None for providers with no documented write premium (cost path unchanged).

§batch_input_per_million: Option<f64>

USD per 1M batch (async) input tokens. Providers with a batch tier (OpenAI / Anthropic / Gemini) bill async requests at ~50% of standard input. None for providers with no batch tier.

§batch_output_per_million: Option<f64>

USD per 1M batch (async) output tokens (~50% of standard output). None for providers with no batch tier.

§flex_input_per_million: Option<f64>

USD per 1M input tokens under OpenAI’s Flex service tier (service_tier: "flex") — a synchronous-but-slower tier billed at Batch API rates (~50% of standard). None for models/providers with no Flex tier; presence is the eligibility gate (only models that carry a Flex rate may be opted into service_tier=flex). See developers.openai.com/api/docs/guides/flex-processing.

§flex_output_per_million: Option<f64>

USD per 1M output tokens under the Flex service tier (~50% of standard output). None when the model has no Flex tier.

§prompt_cache_min_tokens: Option<u32>

Provider minimum prefix length, in tokens, before a cache_control breakpoint actually caches (shorter prefixes silently don’t cache). Anthropic varies this by model (2048–4096); None when not documented.

§effective_at: DateTime<Utc>

When this pricing took effect (for historical replay).

Struct ModelPricing Copy item path

Fields§

Implementations§

impl ModelPricing

pub fn cache_write_rate_per_million(&self, tier: CacheWriteTier) -> Option<f64>

pub fn flex_eligible(&self) -> bool

pub fn flex_rates_per_million(&self) -> Option<(f64, f64)>

Trait Implementations§

impl Clone for ModelPricing

fn clone(&self) -> ModelPricing

fn clone_from(&mut self, source: &Self)

impl Debug for ModelPricing

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl<'de> Deserialize<'de> for ModelPricing

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where __D: Deserializer<'de>,

impl Serialize for ModelPricing

fn serialize<__S>(&self, __serializer: __S) -> Result<__S::Ok, __S::Error> where __S: Serializer,

Auto Trait Implementations§

impl Freeze for ModelPricing

impl RefUnwindSafe for ModelPricing

impl Send for ModelPricing

impl Sync for ModelPricing

impl Unpin for ModelPricing

impl UnsafeUnpin for ModelPricing

impl UnwindSafe for ModelPricing

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> DeserializeOwned for T where T: for<'de> Deserialize<'de>,

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> PolicyExt for T where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P> where T: Sized + Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P> where T: Sized + Policy<B, E>, P: Policy<B, E>,

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct ModelPricing

fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where D: Deserializer<'de>,

fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
where S: Serializer,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T> DeserializeOwned for T
where T: for<'de> Deserialize<'de>,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,