transcode_audio/
transcode-audio.rs1extern crate ffmpeg_rs;
2use std::env;
3use std::path::Path;
4
5use ffmpeg_rs::{codec, filter, format, frame, media};
6use ffmpeg_rs::{rescale, Rescale};
7
8fn filter(
9 spec: &str,
10 decoder: &codec::decoder::Audio,
11 encoder: &codec::encoder::Audio,
12) -> Result<filter::Graph, ffmpeg_rs::Error> {
13 let mut filter = filter::Graph::new();
14
15 let args = format!(
16 "time_base={}:sample_rate={}:sample_fmt={}:channel_layout=0x{:x}",
17 decoder.time_base(),
18 decoder.rate(),
19 decoder.format().name(),
20 decoder.channel_layout().bits()
21 );
22
23 filter.add(&filter::find("abuffer").unwrap(), "in", &args)?;
24 filter.add(&filter::find("abuffersink").unwrap(), "out", "")?;
25
26 {
27 let mut out = filter.get("out").unwrap();
28
29 out.set_sample_format(encoder.format());
30 out.set_channel_layout(encoder.channel_layout());
31 out.set_sample_rate(encoder.rate());
32 }
33
34 filter.output("in", 0)?.input("out", 0)?.parse(spec)?;
35 filter.validate()?;
36
37 println!("{}", filter.dump());
38
39 if let Some(codec) = encoder.codec() {
40 if !codec
41 .capabilities()
42 .contains(ffmpeg_rs::codec::capabilities::Capabilities::VARIABLE_FRAME_SIZE)
43 {
44 filter
45 .get("out")
46 .unwrap()
47 .sink()
48 .set_frame_size(encoder.frame_size());
49 }
50 }
51
52 Ok(filter)
53}
54
55struct Transcoder {
56 stream: usize,
57 filter: filter::Graph,
58 decoder: codec::decoder::Audio,
59 encoder: codec::encoder::Audio,
60 in_time_base: ffmpeg_rs::Rational,
61 out_time_base: ffmpeg_rs::Rational,
62}
63
64fn transcoder<P: AsRef<Path>>(
65 ictx: &mut format::context::Input,
66 octx: &mut format::context::Output,
67 path: &P,
68 filter_spec: &str,
69) -> Result<Transcoder, ffmpeg_rs::Error> {
70 let input = ictx
71 .streams()
72 .best(media::Type::Audio)
73 .expect("could not find best audio stream");
74 let context = ffmpeg_rs::codec::context::Context::from_parameters(input.parameters())?;
75 let mut decoder = context.decoder().audio()?;
76 let codec = ffmpeg_rs::encoder::find(octx.format().codec(path, media::Type::Audio))
77 .expect("failed to find encoder")
78 .audio()?;
79 let global = octx
80 .format()
81 .flags()
82 .contains(ffmpeg_rs::format::flag::Flags::GLOBAL_HEADER);
83
84 decoder.set_parameters(input.parameters())?;
85
86 let mut output = octx.add_stream(codec)?;
87 let context = ffmpeg_rs::codec::context::Context::from_parameters(output.parameters())?;
88 let mut encoder = context.encoder().audio()?;
89
90 let channel_layout = codec
91 .channel_layouts()
92 .map(|cls| cls.best(decoder.channel_layout().channels()))
93 .unwrap_or(ffmpeg_rs::channel_layout::ChannelLayout::STEREO);
94
95 if global {
96 encoder.set_flags(ffmpeg_rs::codec::flag::Flags::GLOBAL_HEADER);
97 }
98
99 encoder.set_rate(decoder.rate() as i32);
100 encoder.set_channel_layout(channel_layout);
101 encoder.set_channels(channel_layout.channels());
102 encoder.set_format(
103 codec
104 .formats()
105 .expect("unknown supported formats")
106 .next()
107 .unwrap(),
108 );
109 encoder.set_bit_rate(decoder.bit_rate());
110 encoder.set_max_bit_rate(decoder.max_bit_rate());
111
112 encoder.set_time_base((1, decoder.rate() as i32));
113 output.set_time_base((1, decoder.rate() as i32));
114
115 let encoder = encoder.open_as(codec)?;
116 output.set_parameters(&encoder);
117
118 let filter = filter(filter_spec, &decoder, &encoder)?;
119
120 let in_time_base = decoder.time_base();
121 let out_time_base = output.time_base();
122
123 Ok(Transcoder {
124 stream: input.index(),
125 filter,
126 decoder,
127 encoder,
128 in_time_base,
129 out_time_base,
130 })
131}
132
133impl Transcoder {
134 fn send_frame_to_encoder(&mut self, frame: &ffmpeg_rs::Frame) {
135 self.encoder.send_frame(frame).unwrap();
136 }
137
138 fn send_eof_to_encoder(&mut self) {
139 self.encoder.send_eof().unwrap();
140 }
141
142 fn receive_and_process_encoded_packets(&mut self, octx: &mut format::context::Output) {
143 let mut encoded = ffmpeg_rs::Packet::empty();
144 while self.encoder.receive_packet(&mut encoded).is_ok() {
145 encoded.set_stream(0);
146 encoded.rescale_ts(self.in_time_base, self.out_time_base);
147 encoded.write_interleaved(octx).unwrap();
148 }
149 }
150
151 fn add_frame_to_filter(&mut self, frame: &ffmpeg_rs::Frame) {
152 self.filter.get("in").unwrap().source().add(frame).unwrap();
153 }
154
155 fn flush_filter(&mut self) {
156 self.filter.get("in").unwrap().source().flush().unwrap();
157 }
158
159 fn get_and_process_filtered_frames(&mut self, octx: &mut format::context::Output) {
160 let mut filtered = frame::Audio::empty();
161 while self
162 .filter
163 .get("out")
164 .unwrap()
165 .sink()
166 .frame(&mut filtered)
167 .is_ok()
168 {
169 self.send_frame_to_encoder(&filtered);
170 self.receive_and_process_encoded_packets(octx);
171 }
172 }
173
174 fn send_packet_to_decoder(&mut self, packet: &ffmpeg_rs::Packet) {
175 self.decoder.send_packet(packet).unwrap();
176 }
177
178 fn send_eof_to_decoder(&mut self) {
179 self.decoder.send_eof().unwrap();
180 }
181
182 fn receive_and_process_decoded_frames(&mut self, octx: &mut format::context::Output) {
183 let mut decoded = frame::Audio::empty();
184 while self.decoder.receive_frame(&mut decoded).is_ok() {
185 let timestamp = decoded.timestamp();
186 decoded.set_pts(timestamp);
187 self.add_frame_to_filter(&decoded);
188 self.get_and_process_filtered_frames(octx);
189 }
190 }
191}
192
193fn main() {
205 ffmpeg_rs::init().unwrap();
206
207 let input = env::args().nth(1).expect("missing input");
208 let output = env::args().nth(2).expect("missing output");
209 let filter = env::args().nth(3).unwrap_or_else(|| "anull".to_owned());
210 let seek = env::args().nth(4).and_then(|s| s.parse::<i64>().ok());
211
212 let mut ictx = format::input(&input).unwrap();
213 let mut octx = format::output(&output).unwrap();
214 let mut transcoder = transcoder(&mut ictx, &mut octx, &output, &filter).unwrap();
215
216 if let Some(position) = seek {
217 let position = position.rescale((1, 1), rescale::TIME_BASE);
219 ictx.seek(position, ..position).unwrap();
222 }
223
224 octx.set_metadata(ictx.metadata().to_owned());
225 octx.write_header().unwrap();
226
227 for (stream, mut packet) in ictx.packets() {
228 if stream.index() == transcoder.stream {
229 packet.rescale_ts(stream.time_base(), transcoder.in_time_base);
230 transcoder.send_packet_to_decoder(&packet);
231 transcoder.receive_and_process_decoded_frames(&mut octx);
232 }
233 }
234
235 transcoder.send_eof_to_decoder();
236 transcoder.receive_and_process_decoded_frames(&mut octx);
237
238 transcoder.flush_filter();
239 transcoder.get_and_process_filtered_frames(&mut octx);
240
241 transcoder.send_eof_to_encoder();
242 transcoder.receive_and_process_encoded_packets(&mut octx);
243
244 octx.write_trailer().unwrap();
245}