transcode_audio/
transcode-audio.rs

1extern crate ffmpeg_rs;
2use std::env;
3use std::path::Path;
4
5use ffmpeg_rs::{codec, filter, format, frame, media};
6use ffmpeg_rs::{rescale, Rescale};
7
8fn filter(
9    spec: &str,
10    decoder: &codec::decoder::Audio,
11    encoder: &codec::encoder::Audio,
12) -> Result<filter::Graph, ffmpeg_rs::Error> {
13    let mut filter = filter::Graph::new();
14
15    let args = format!(
16        "time_base={}:sample_rate={}:sample_fmt={}:channel_layout=0x{:x}",
17        decoder.time_base(),
18        decoder.rate(),
19        decoder.format().name(),
20        decoder.channel_layout().bits()
21    );
22
23    filter.add(&filter::find("abuffer").unwrap(), "in", &args)?;
24    filter.add(&filter::find("abuffersink").unwrap(), "out", "")?;
25
26    {
27        let mut out = filter.get("out").unwrap();
28
29        out.set_sample_format(encoder.format());
30        out.set_channel_layout(encoder.channel_layout());
31        out.set_sample_rate(encoder.rate());
32    }
33
34    filter.output("in", 0)?.input("out", 0)?.parse(spec)?;
35    filter.validate()?;
36
37    println!("{}", filter.dump());
38
39    if let Some(codec) = encoder.codec() {
40        if !codec
41            .capabilities()
42            .contains(ffmpeg_rs::codec::capabilities::Capabilities::VARIABLE_FRAME_SIZE)
43        {
44            filter
45                .get("out")
46                .unwrap()
47                .sink()
48                .set_frame_size(encoder.frame_size());
49        }
50    }
51
52    Ok(filter)
53}
54
55struct Transcoder {
56    stream: usize,
57    filter: filter::Graph,
58    decoder: codec::decoder::Audio,
59    encoder: codec::encoder::Audio,
60    in_time_base: ffmpeg_rs::Rational,
61    out_time_base: ffmpeg_rs::Rational,
62}
63
64fn transcoder<P: AsRef<Path>>(
65    ictx: &mut format::context::Input,
66    octx: &mut format::context::Output,
67    path: &P,
68    filter_spec: &str,
69) -> Result<Transcoder, ffmpeg_rs::Error> {
70    let input = ictx
71        .streams()
72        .best(media::Type::Audio)
73        .expect("could not find best audio stream");
74    let context = ffmpeg_rs::codec::context::Context::from_parameters(input.parameters())?;
75    let mut decoder = context.decoder().audio()?;
76    let codec = ffmpeg_rs::encoder::find(octx.format().codec(path, media::Type::Audio))
77        .expect("failed to find encoder")
78        .audio()?;
79    let global = octx
80        .format()
81        .flags()
82        .contains(ffmpeg_rs::format::flag::Flags::GLOBAL_HEADER);
83
84    decoder.set_parameters(input.parameters())?;
85
86    let mut output = octx.add_stream(codec)?;
87    let context = ffmpeg_rs::codec::context::Context::from_parameters(output.parameters())?;
88    let mut encoder = context.encoder().audio()?;
89
90    let channel_layout = codec
91        .channel_layouts()
92        .map(|cls| cls.best(decoder.channel_layout().channels()))
93        .unwrap_or(ffmpeg_rs::channel_layout::ChannelLayout::STEREO);
94
95    if global {
96        encoder.set_flags(ffmpeg_rs::codec::flag::Flags::GLOBAL_HEADER);
97    }
98
99    encoder.set_rate(decoder.rate() as i32);
100    encoder.set_channel_layout(channel_layout);
101    encoder.set_channels(channel_layout.channels());
102    encoder.set_format(
103        codec
104            .formats()
105            .expect("unknown supported formats")
106            .next()
107            .unwrap(),
108    );
109    encoder.set_bit_rate(decoder.bit_rate());
110    encoder.set_max_bit_rate(decoder.max_bit_rate());
111
112    encoder.set_time_base((1, decoder.rate() as i32));
113    output.set_time_base((1, decoder.rate() as i32));
114
115    let encoder = encoder.open_as(codec)?;
116    output.set_parameters(&encoder);
117
118    let filter = filter(filter_spec, &decoder, &encoder)?;
119
120    let in_time_base = decoder.time_base();
121    let out_time_base = output.time_base();
122
123    Ok(Transcoder {
124        stream: input.index(),
125        filter,
126        decoder,
127        encoder,
128        in_time_base,
129        out_time_base,
130    })
131}
132
133impl Transcoder {
134    fn send_frame_to_encoder(&mut self, frame: &ffmpeg_rs::Frame) {
135        self.encoder.send_frame(frame).unwrap();
136    }
137
138    fn send_eof_to_encoder(&mut self) {
139        self.encoder.send_eof().unwrap();
140    }
141
142    fn receive_and_process_encoded_packets(&mut self, octx: &mut format::context::Output) {
143        let mut encoded = ffmpeg_rs::Packet::empty();
144        while self.encoder.receive_packet(&mut encoded).is_ok() {
145            encoded.set_stream(0);
146            encoded.rescale_ts(self.in_time_base, self.out_time_base);
147            encoded.write_interleaved(octx).unwrap();
148        }
149    }
150
151    fn add_frame_to_filter(&mut self, frame: &ffmpeg_rs::Frame) {
152        self.filter.get("in").unwrap().source().add(frame).unwrap();
153    }
154
155    fn flush_filter(&mut self) {
156        self.filter.get("in").unwrap().source().flush().unwrap();
157    }
158
159    fn get_and_process_filtered_frames(&mut self, octx: &mut format::context::Output) {
160        let mut filtered = frame::Audio::empty();
161        while self
162            .filter
163            .get("out")
164            .unwrap()
165            .sink()
166            .frame(&mut filtered)
167            .is_ok()
168        {
169            self.send_frame_to_encoder(&filtered);
170            self.receive_and_process_encoded_packets(octx);
171        }
172    }
173
174    fn send_packet_to_decoder(&mut self, packet: &ffmpeg_rs::Packet) {
175        self.decoder.send_packet(packet).unwrap();
176    }
177
178    fn send_eof_to_decoder(&mut self) {
179        self.decoder.send_eof().unwrap();
180    }
181
182    fn receive_and_process_decoded_frames(&mut self, octx: &mut format::context::Output) {
183        let mut decoded = frame::Audio::empty();
184        while self.decoder.receive_frame(&mut decoded).is_ok() {
185            let timestamp = decoded.timestamp();
186            decoded.set_pts(timestamp);
187            self.add_frame_to_filter(&decoded);
188            self.get_and_process_filtered_frames(octx);
189        }
190    }
191}
192
193// Transcode the `best` audio stream of the input file into a the output file while applying a
194// given filter. If no filter was specified the stream gets copied (`anull` filter).
195//
196// Example 1: Transcode *.mp3 file to *.wmv while speeding it up
197// transcode-audio in.mp3 out.wmv "atempo=1.2"
198//
199// Example 2: Overlay an audio file
200// transcode-audio in.mp3 out.mp3 "amovie=overlay.mp3 [ov]; [in][ov] amerge [out]"
201//
202// Example 3: Seek to a specified position (in seconds)
203// transcode-audio in.mp3 out.mp3 anull 30
204fn main() {
205    ffmpeg_rs::init().unwrap();
206
207    let input = env::args().nth(1).expect("missing input");
208    let output = env::args().nth(2).expect("missing output");
209    let filter = env::args().nth(3).unwrap_or_else(|| "anull".to_owned());
210    let seek = env::args().nth(4).and_then(|s| s.parse::<i64>().ok());
211
212    let mut ictx = format::input(&input).unwrap();
213    let mut octx = format::output(&output).unwrap();
214    let mut transcoder = transcoder(&mut ictx, &mut octx, &output, &filter).unwrap();
215
216    if let Some(position) = seek {
217        // If the position was given in seconds, rescale it to ffmpegs base timebase.
218        let position = position.rescale((1, 1), rescale::TIME_BASE);
219        // If this seek was embedded in the transcoding loop, a call of `flush()`
220        // for every opened buffer after the successful seek would be advisable.
221        ictx.seek(position, ..position).unwrap();
222    }
223
224    octx.set_metadata(ictx.metadata().to_owned());
225    octx.write_header().unwrap();
226
227    for (stream, mut packet) in ictx.packets() {
228        if stream.index() == transcoder.stream {
229            packet.rescale_ts(stream.time_base(), transcoder.in_time_base);
230            transcoder.send_packet_to_decoder(&packet);
231            transcoder.receive_and_process_decoded_frames(&mut octx);
232        }
233    }
234
235    transcoder.send_eof_to_decoder();
236    transcoder.receive_and_process_decoded_frames(&mut octx);
237
238    transcoder.flush_filter();
239    transcoder.get_and_process_filtered_frames(&mut octx);
240
241    transcoder.send_eof_to_encoder();
242    transcoder.receive_and_process_encoded_packets(&mut octx);
243
244    octx.write_trailer().unwrap();
245}