openai_protocol/
rerank.rs1use std::collections::HashMap;
2
3use serde::{Deserialize, Serialize};
4use serde_json::Value;
5use validator::Validate;
6
7use super::common::{default_model, default_true, GenerationRequest, StringOrArray, UsageInfo};
8
/// Returns the literal `"rerank"` as an owned string.
///
/// Used as the serde default for [`RerankResponse::object`] and by
/// [`RerankResponse::new`].
fn default_rerank_object() -> String {
    String::from("rerank")
}
12
/// Returns the current wall-clock time as whole seconds since the Unix epoch.
///
/// If the system clock reports a time before the epoch, the elapsed duration
/// is treated as zero, so the function returns `0` instead of failing.
fn current_timestamp() -> i64 {
    let now = std::time::SystemTime::now();
    let since_epoch = match now.duration_since(std::time::UNIX_EPOCH) {
        Ok(elapsed) => elapsed,
        // Clock is set before 1970-01-01: fall back to a zero duration.
        Err(_) => std::time::Duration::from_secs(0),
    };
    since_epoch.as_secs() as i64
}
20
21#[derive(Debug, Clone, Deserialize, Serialize, Validate)]
26#[validate(schema(function = "validate_rerank_request"))]
27pub struct RerankRequest {
28 #[validate(custom(function = "validate_query"))]
30 pub query: String,
31
32 #[validate(custom(function = "validate_documents"))]
34 pub documents: Vec<String>,
35
36 #[serde(default = "default_model")]
38 pub model: String,
39
40 #[serde(skip_serializing_if = "Option::is_none")]
42 #[validate(range(min = 1))]
43 pub top_k: Option<usize>,
44
45 #[serde(default = "default_true")]
47 pub return_documents: bool,
48
49 pub rid: Option<StringOrArray>,
52
53 pub user: Option<String>,
55}
56
57impl GenerationRequest for RerankRequest {
58 fn get_model(&self) -> Option<&str> {
59 Some(&self.model)
60 }
61
62 fn is_stream(&self) -> bool {
63 false }
65
66 fn extract_text_for_routing(&self) -> String {
67 self.query.clone()
68 }
69}
70
71impl super::validated::Normalizable for RerankRequest {
72 }
74
75fn validate_query(query: &str) -> Result<(), validator::ValidationError> {
81 if query.trim().is_empty() {
82 return Err(validator::ValidationError::new("query cannot be empty"));
83 }
84 Ok(())
85}
86
87fn validate_documents(documents: &[String]) -> Result<(), validator::ValidationError> {
89 if documents.is_empty() {
90 return Err(validator::ValidationError::new(
91 "documents list cannot be empty",
92 ));
93 }
94 Ok(())
95}
96
97fn validate_rerank_request(req: &RerankRequest) -> Result<(), validator::ValidationError> {
99 if let Some(k) = req.top_k {
101 if k > req.documents.len() {
102 tracing::warn!(
104 "top_k ({}) is greater than number of documents ({})",
105 k,
106 req.documents.len()
107 );
108 }
109 }
110 Ok(())
111}
112
113impl RerankRequest {
114 pub fn effective_top_k(&self) -> usize {
116 self.top_k.unwrap_or(self.documents.len())
117 }
118}
119
120#[derive(Debug, Clone, Serialize, Deserialize)]
122pub struct RerankResult {
123 pub score: f32,
125
126 #[serde(skip_serializing_if = "Option::is_none")]
128 pub document: Option<String>,
129
130 pub index: usize,
132
133 #[serde(skip_serializing_if = "Option::is_none")]
135 pub meta_info: Option<HashMap<String, Value>>,
136}
137
138#[derive(Debug, Clone, Serialize, Deserialize)]
140pub struct RerankResponse {
141 pub results: Vec<RerankResult>,
143
144 pub model: String,
146
147 pub usage: Option<UsageInfo>,
149
150 #[serde(default = "default_rerank_object")]
152 pub object: String,
153
154 pub id: Option<StringOrArray>,
156
157 pub created: i64,
159}
160
161impl RerankResponse {
162 pub fn new(
164 results: Vec<RerankResult>,
165 model: String,
166 request_id: Option<StringOrArray>,
167 ) -> Self {
168 RerankResponse {
169 results,
170 model,
171 usage: None,
172 object: default_rerank_object(),
173 id: request_id,
174 created: current_timestamp(),
175 }
176 }
177
178 pub fn apply_top_k(&mut self, k: usize) {
180 self.results.truncate(k);
181 }
182
183 pub fn drop_documents(&mut self) {
185 for result in &mut self.results {
186 result.document = None;
187 }
188 }
189}
190
191#[derive(Debug, Clone, Serialize, Deserialize)]
194pub struct V1RerankReqInput {
195 pub query: String,
196 pub documents: Vec<String>,
197}
198
199impl From<V1RerankReqInput> for RerankRequest {
201 fn from(v1: V1RerankReqInput) -> Self {
202 RerankRequest {
203 query: v1.query,
204 documents: v1.documents,
205 model: default_model(),
206 top_k: None,
207 return_documents: true,
208 rid: None,
209 user: None,
210 }
211 }
212}