Skip to main content

audio_codec/
opus.rs

1use super::{Decoder, Encoder, PcmBuf, Sample};
2pub use opus_rs::Application as OpusApplication;
3use opus_rs::{Application, OpusDecoder as OpusDecoderRaw, OpusEncoder as OpusEncoderRaw};
4
5pub struct OpusDecoder {
6    decoder: OpusDecoderRaw,
7    sample_rate: u32,
8    channels: u16,
9    w_output_f32: Vec<f32>,
10    w_pcm_i16: Vec<i16>,
11}
12
13impl OpusDecoder {
14    /// Create a new Opus decoder instance
15    pub fn new(sample_rate: u32, channels: u16) -> Self {
16        let decoder = OpusDecoderRaw::new(sample_rate as i32, channels as usize)
17            .expect("Failed to create Opus decoder");
18
19        Self {
20            decoder,
21            sample_rate,
22            channels,
23            w_output_f32: Vec::new(),
24            w_pcm_i16: Vec::new(),
25        }
26    }
27
28    /// Create a default Opus decoder (48kHz, stereo)
29    pub fn new_default() -> Self {
30        Self::new(48000, 2)
31    }
32
33    pub fn decode_into(&mut self, data: &[u8], output: &mut [i16]) -> usize {
34        if data.is_empty() {
35            return 0;
36        }
37
38        // Detect the actual channel count from the Opus packet's TOC byte
39        // (bit 2 is the stereo flag per RFC 6716). opus-rs 0.1.19+ rejects
40        // decoding when the packet channel count doesn't match the decoder's,
41        // so we adapt the decoder here to avoid returning empty PCM.
42        let packet_channels = if data[0] & 0x04 != 0 { 2usize } else { 1 };
43        if self.channels as usize != packet_channels {
44            self.channels = packet_channels as u16;
45            self.decoder = OpusDecoderRaw::new(self.sample_rate as i32, packet_channels)
46                .expect("Failed to create Opus decoder");
47        }
48
49        let channels = usize::from(self.channels);
50        let frame_size = (self.sample_rate as usize * 20) / 1000;
51        let max_samples = frame_size * channels;
52        if self.w_output_f32.len() < max_samples {
53            self.w_output_f32.resize(max_samples, 0.0);
54        }
55
56        match self
57            .decoder
58            .decode(data, frame_size, &mut self.w_output_f32[..max_samples])
59        {
60            Ok(len) => {
61                let total_samples = len * channels;
62                if total_samples == 0 {
63                    return 0;
64                }
65
66                if self.w_pcm_i16.len() < total_samples {
67                    self.w_pcm_i16.resize(total_samples, 0);
68                }
69
70                for i in 0..total_samples {
71                    self.w_pcm_i16[i] =
72                        (self.w_output_f32[i] * 32768.0).clamp(-32768.0, 32767.0) as i16;
73                }
74
75                let n = total_samples.min(output.len());
76                output[..n].copy_from_slice(&self.w_pcm_i16[..n]);
77                n
78            }
79            Err(_) => 0,
80        }
81    }
82}
83
84impl Decoder for OpusDecoder {
85    fn decode(&mut self, data: &[u8]) -> PcmBuf {
86        let channels = usize::from(self.channels);
87        if channels == 0 || data.is_empty() {
88            return Vec::new();
89        }
90
91        let frame_size = (self.sample_rate as usize * 20) / 1000;
92        let max_samples = frame_size * channels;
93        let mut pcm = vec![0i16; max_samples];
94        let n = self.decode_into(data, &mut pcm);
95        pcm.truncate(n);
96        if channels == 2 {
97            pcm = pcm
98                .chunks_exact(2)
99                .map(|chunk| ((chunk[0] as i32 + chunk[1] as i32) / 2) as i16)
100                .collect();
101        }
102        pcm
103    }
104
105    fn sample_rate(&self) -> u32 {
106        self.sample_rate
107    }
108
109    fn channels(&self) -> u16 {
110        self.channels
111    }
112}
113
114pub struct OpusEncoder {
115    encoder: OpusEncoderRaw,
116    sample_rate: u32,
117    channels: u16,
118    w_input_f32: Vec<f32>,
119    w_packet: Vec<u8>,
120}
121
122impl OpusEncoder {
123    pub fn new_with_application(sample_rate: u32, channels: u16, application: Application) -> Self {
124        let encoder = OpusEncoderRaw::new(sample_rate as i32, channels as usize, application)
125            .expect("Failed to create Opus encoder");
126
127        Self {
128            encoder,
129            sample_rate,
130            channels,
131            w_input_f32: Vec::new(),
132            w_packet: vec![0u8; 1275],
133        }
134    }
135
136    /// Create a new Opus encoder instance.
137    ///
138    /// Keep backward-compatible defaults with pre-0.3.31 behavior:
139    /// - VoIP application
140    /// - caller can provide mono PCM even when encoder is configured as stereo;
141    ///   `encode()` duplicates mono samples to stereo.
142    pub fn new(sample_rate: u32, channels: u16) -> Self {
143        let mut enc = Self::new_with_application(sample_rate, channels, Application::Voip);
144        enc.encoder.bitrate_bps = if channels == 2 { 64000 } else { 48000 };
145        enc.encoder.complexity = 5;
146        enc.encoder.use_cbr = true;
147        enc
148    }
149
150    /// Create a default Opus encoder (48kHz, stereo)
151    pub fn new_default() -> Self {
152        Self::new(48000, 2)
153    }
154
155    /// Set the encoder bitrate in bits per second.
156    pub fn set_bitrate(&mut self, bitrate_bps: i32) {
157        self.encoder.bitrate_bps = bitrate_bps;
158    }
159
160    /// Set the encoder complexity (0-10).
161    pub fn set_complexity(&mut self, complexity: i32) {
162        self.encoder.complexity = complexity;
163    }
164
165    /// Enable or disable constant bitrate (CBR) mode.
166    pub fn set_cbr(&mut self, cbr: bool) {
167        self.encoder.use_cbr = cbr;
168    }
169
170    /// Encode into a caller-provided packet buffer.
171    ///
172    /// Returns `Some(bytes_written)` on success.
173    pub fn encode_into(&mut self, samples: &[Sample], output: &mut [u8]) -> Option<usize> {
174        let channels = usize::from(self.channels);
175        if samples.is_empty() || channels == 0 || samples.len() % channels != 0 {
176            return None;
177        }
178
179        let frame_size = samples.len() / channels;
180
181        if self.w_input_f32.len() < samples.len() {
182            self.w_input_f32.resize(samples.len(), 0.0);
183        }
184
185        for (dst, &s) in self.w_input_f32[..samples.len()]
186            .iter_mut()
187            .zip(samples.iter())
188        {
189            *dst = s as f32 / 32768.0;
190        }
191
192        self.encoder
193            .encode(&self.w_input_f32[..samples.len()], frame_size, output)
194            .ok()
195    }
196
197    fn encode_raw(&mut self, samples: &[Sample]) -> Vec<u8> {
198        let channels = usize::from(self.channels);
199        if samples.is_empty() || channels == 0 || samples.len() % channels != 0 {
200            return Vec::new();
201        }
202
203        let frame_size = samples.len() / channels;
204
205        if self.w_input_f32.len() < samples.len() {
206            self.w_input_f32.resize(samples.len(), 0.0);
207        }
208
209        for (dst, &s) in self.w_input_f32[..samples.len()]
210            .iter_mut()
211            .zip(samples.iter())
212        {
213            *dst = s as f32 / 32768.0;
214        }
215
216        match self.encoder.encode(
217            &self.w_input_f32[..samples.len()],
218            frame_size,
219            &mut self.w_packet,
220        ) {
221            Ok(len) => {
222                let mut out = Vec::with_capacity(len);
223                out.extend_from_slice(&self.w_packet[..len]);
224                out
225            }
226            Err(_) => Vec::new(),
227        }
228    }
229}
230
231impl Encoder for OpusEncoder {
232    fn encode(&mut self, samples: &[Sample]) -> Vec<u8> {
233        if self.channels == 2 {
234            let mut stereo_samples = Vec::with_capacity(samples.len() * 2);
235            for &sample in samples {
236                stereo_samples.push(sample);
237                stereo_samples.push(sample);
238            }
239            return self.encode_raw(&stereo_samples);
240        }
241        self.encode_raw(samples)
242    }
243
244    fn sample_rate(&self) -> u32 {
245        self.sample_rate
246    }
247
248    fn channels(&self) -> u16 {
249        self.channels
250    }
251}