1
0
Fork 0
mirror of https://github.com/alfg/mp4-rust.git synced 2025-01-03 00:48:40 +00:00

Add mpeg_aac_decoder example (#50)

* Add mpeg_aac_decoder example

* Convert mpeg_aac_decoder example to it's own package
This commit is contained in:
Kasper 2021-02-02 02:11:35 +01:00 committed by GitHub
parent b59758c7df
commit 335aa39f7c
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
4 changed files with 248 additions and 0 deletions

2
examples/mpeg_aac_decoder/.gitignore vendored Normal file
View file

@ -0,0 +1,2 @@
/Cargo.lock
/target

View file

@ -0,0 +1,9 @@
[package]
name = "mpeg_aac_decoder"
version = "0.1.0"
edition = "2018"
[dependencies]
mp4 = "0.8.1"
fdk-aac = "0.4.0"
rodio = { version = "0.13.0", default-features = false }

Binary file not shown.

View file

@ -0,0 +1,237 @@
use fdk_aac::dec::{Decoder, DecoderError, Transport};
use rodio::{OutputStream, Sink, Source};
use std::fs::File;
use std::io::{BufReader, Read, Seek};
use std::ops::Range;
use std::time::Duration;
fn main() {
let path = "audio_aac.m4a";
let file = File::open(path).expect("Error opening file");
let metadata = file.metadata().expect("Error getting file metadata");
let size = metadata.len();
let buf = BufReader::new(file);
let decoder = MpegAacDecoder::new(buf, size).expect("Error creating decoder");
let output_stream = OutputStream::try_default();
let (_stream, handle) = output_stream.expect("Error creating output stream");
let sink = Sink::try_new(&handle).expect("Error creating sink");
sink.append(decoder);
sink.play();
sink.set_volume(0.5);
sink.sleep_until_end();
}
pub struct MpegAacDecoder<R>
where
R: Read + Seek,
{
mp4_reader: mp4::Mp4Reader<R>,
decoder: Decoder,
current_pcm_index: usize,
current_pcm: Vec<i16>,
track_id: u32,
position: u32,
}
impl<R> MpegAacDecoder<R>
where
R: Read + Seek,
{
pub fn new(reader: R, size: u64) -> Result<MpegAacDecoder<R>, &'static str> {
let decoder = Decoder::new(Transport::Adts);
let mp4 = mp4::Mp4Reader::read_header(reader, size).or(Err("Error reading MPEG header"))?;
let mut track_id: Option<u32> = None;
{
for track in mp4.tracks().iter() {
let media_type = track.media_type().or(Err("Error getting media type"))?;
match media_type {
mp4::MediaType::AAC => {
track_id = Some(track.track_id());
break;
}
_ => {}
}
}
}
match track_id {
Some(track_id) => {
return Ok(MpegAacDecoder {
mp4_reader: mp4,
decoder: decoder,
current_pcm_index: 0,
current_pcm: Vec::new(),
track_id: track_id,
position: 1,
});
}
None => {
return Err("No aac track found");
}
}
}
}
impl<R> Iterator for MpegAacDecoder<R>
where
R: Read + Seek,
{
type Item = i16;
fn next(&mut self) -> Option<i16> {
if self.current_pcm_index == self.current_pcm.len() {
let mut pcm = vec![0; 8192];
let result = match self.decoder.decode_frame(&mut self.current_pcm) {
Err(DecoderError::NOT_ENOUGH_BITS) => {
let sample_result = self.mp4_reader.read_sample(self.track_id, self.position);
let sample = sample_result.expect("Error reading sample")?;
let tracks = self.mp4_reader.tracks();
let track = tracks.get(self.track_id as usize - 1).expect("No track ID");
let adts_header = construct_adts_header(track, &sample).expect("ADTS bytes");
let adts_bytes = mp4::Bytes::copy_from_slice(&adts_header);
let bytes = [adts_bytes, sample.bytes].concat();
self.position += 1;
let _bytes_read = match self.decoder.fill(&bytes) {
Ok(bytes_read) => bytes_read,
Err(_) => return None,
};
self.decoder.decode_frame(&mut pcm)
}
val => val,
};
if let Err(err) = result {
println!("DecoderError: {}", err);
return None;
}
let decoded_fram_size = self.decoder.decoded_frame_size();
if decoded_fram_size < pcm.len() {
let _ = pcm.split_off(decoded_fram_size);
}
self.current_pcm = pcm;
self.current_pcm_index = 0;
}
let value = self.current_pcm[self.current_pcm_index];
self.current_pcm_index += 1;
return Some(value);
}
}
impl<R> Source for MpegAacDecoder<R>
where
R: Read + Seek,
{
fn current_frame_len(&self) -> Option<usize> {
let frame_size: usize = self.decoder.decoded_frame_size();
Some(frame_size)
}
fn channels(&self) -> u16 {
let num_channels: i32 = self.decoder.stream_info().numChannels;
num_channels as _
}
fn sample_rate(&self) -> u32 {
let sample_rate: i32 = self.decoder.stream_info().sampleRate;
sample_rate as _
}
fn total_duration(&self) -> Option<Duration> {
return None;
}
}
fn get_bits(byte: u16, range: Range<u16>) -> u16 {
let shaved_left = byte << range.start - 1;
let moved_back = shaved_left >> range.start - 1;
let shave_right = moved_back >> 16 - range.end;
return shave_right;
}
fn get_bits_u8(byte: u8, range: Range<u8>) -> u8 {
let shaved_left = byte << range.start - 1;
let moved_back = shaved_left >> range.start - 1;
let shave_right = moved_back >> 8 - range.end;
return shave_right;
}
pub fn construct_adts_header(track: &mp4::Mp4Track, sample: &mp4::Mp4Sample) -> Option<Vec<u8>> {
// B: Only support 0 (MPEG-4)
// D: Only support 1 (without CRC)
// byte7 and byte9 not included without CRC
let adts_header_length = 7;
// AAAA_AAAA
let byte0 = 0b1111_1111;
// AAAA_BCCD
let byte1 = 0b1111_0001;
// EEFF_FFGH
let mut byte2 = 0b0000_0000;
let object_type = match track.audio_profile() {
Ok(mp4::AudioObjectType::AacMain) => 1,
Ok(mp4::AudioObjectType::AacLowComplexity) => 2,
Ok(mp4::AudioObjectType::AacScalableSampleRate) => 3,
Ok(mp4::AudioObjectType::AacLongTermPrediction) => 4,
Err(_) => return None,
};
let adts_object_type = object_type - 1;
byte2 = (byte2 << 2) | adts_object_type; // EE
let sample_freq_index = match track.sample_freq_index() {
Ok(mp4::SampleFreqIndex::Freq96000) => 0,
Ok(mp4::SampleFreqIndex::Freq88200) => 1,
Ok(mp4::SampleFreqIndex::Freq64000) => 2,
Ok(mp4::SampleFreqIndex::Freq48000) => 3,
Ok(mp4::SampleFreqIndex::Freq44100) => 4,
Ok(mp4::SampleFreqIndex::Freq32000) => 5,
Ok(mp4::SampleFreqIndex::Freq24000) => 6,
Ok(mp4::SampleFreqIndex::Freq22050) => 7,
Ok(mp4::SampleFreqIndex::Freq16000) => 8,
Ok(mp4::SampleFreqIndex::Freq12000) => 9,
Ok(mp4::SampleFreqIndex::Freq11025) => 10,
Ok(mp4::SampleFreqIndex::Freq8000) => 11,
Ok(mp4::SampleFreqIndex::Freq7350) => 12,
// 13-14 = reserved
// 15 = explicit frequency (forbidden in adts)
Err(_) => return None,
};
byte2 = (byte2 << 4) | sample_freq_index; // FFFF
byte2 = (byte2 << 1) | 0b1; // G
let channel_config = match track.channel_config() {
// 0 = for when channel config is sent via an inband PCE
Ok(mp4::ChannelConfig::Mono) => 1,
Ok(mp4::ChannelConfig::Stereo) => 2,
Ok(mp4::ChannelConfig::Three) => 3,
Ok(mp4::ChannelConfig::Four) => 4,
Ok(mp4::ChannelConfig::Five) => 5,
Ok(mp4::ChannelConfig::FiveOne) => 6,
Ok(mp4::ChannelConfig::SevenOne) => 7,
// 8-15 = reserved
Err(_) => return None,
};
byte2 = (byte2 << 1) | get_bits_u8(channel_config, 6..6); // H
// HHIJ_KLMM
let mut byte3 = 0b0000_0000;
byte3 = (byte3 << 2) | get_bits_u8(channel_config, 7..8); // HH
byte3 = (byte3 << 4) | 0b1111; // IJKL
let frame_length = adts_header_length + sample.bytes.len() as u16;
byte3 = (byte3 << 2) | get_bits(frame_length, 3..5) as u8; // MM
// MMMM_MMMM
let byte4 = get_bits(frame_length, 6..13) as u8;
// MMMO_OOOO
let mut byte5 = 0b0000_0000;
byte5 = (byte5 << 3) | get_bits(frame_length, 14..16) as u8;
byte5 = (byte5 << 5) | 0b11111; // OOOOO
// OOOO_OOPP
let mut byte6 = 0b0000_0000;
byte6 = (byte6 << 6) | 0b111111; // OOOOOO
byte6 = (byte6 << 2) | 0b00; // PP
return Some(vec![byte0, byte1, byte2, byte3, byte4, byte5, byte6]);
}