openai_struct/models/realtime_session_create_response_turn_detection.rs
1/*
2 * OpenAI API
3 *
4 * The OpenAI REST API. Please see https://platform.openai.com/docs/api-reference for more details.
5 *
6 * OpenAPI spec version: 2.3.0
7 *
8 * Generated by: https://github.com/swagger-api/swagger-codegen.git
9 */
10
11/// RealtimeSessionCreateResponseTurnDetection : Configuration for turn detection. Can be set to `null` to turn off. Server VAD means that the model will detect the start and end of speech based on audio volume and respond at the end of user speech.
12
13#[allow(unused_imports)]
14use serde_json::Value;
15
16#[derive(Debug, Serialize, Deserialize)]
17pub struct RealtimeSessionCreateResponseTurnDetection {
18 /// Amount of audio to include before the VAD detected speech (in milliseconds). Defaults to 300ms.
19 #[serde(rename = "prefix_padding_ms")]
20 pub prefix_padding_ms: Option<i32>,
21 /// Duration of silence to detect speech stop (in milliseconds). Defaults to 500ms. With shorter values the model will respond more quickly, but may jump in on short pauses from the user.
22 #[serde(rename = "silence_duration_ms")]
23 pub silence_duration_ms: Option<i32>,
24 /// Activation threshold for VAD (0.0 to 1.0), this defaults to 0.5. A higher threshold will require louder audio to activate the model, and thus might perform better in noisy environments.
25 #[serde(rename = "threshold")]
26 pub threshold: Option<f32>,
27 /// Type of turn detection, only `server_vad` is currently supported.
28 #[serde(rename = "type")]
29 pub _type: Option<String>,
30}