X-Git-Url: https://git.nihav.org/?p=nihav.git;a=blobdiff_plain;f=nihav-mpeg%2Fsrc%2Fcodecs%2Faac%2Fmod.rs;h=655b45ba5d9823597362d84a304742cbc85fd9a5;hp=de9fbe5e1882f901d8b917bc43545c89870bba83;hb=HEAD;hpb=9c3cd867ce7645f6f828675bd5d383033d6263f7 diff --git a/nihav-mpeg/src/codecs/aac/mod.rs b/nihav-mpeg/src/codecs/aac/mod.rs index de9fbe5..192b4e3 100644 --- a/nihav-mpeg/src/codecs/aac/mod.rs +++ b/nihav-mpeg/src/codecs/aac/mod.rs @@ -11,12 +11,18 @@ mod coeff_read; use coeff_read::*; mod info; use info::*; +#[allow(clippy::needless_range_loop)] +mod sbr; +use sbr::{SBRHeader, SBRCodebooks, SBRState, SBRChannel, SBRDSP, sbr_read_sce, sbr_read_cpe}; #[allow(clippy::excessive_precision)] mod tables; use tables::*; mod tools; use tools::*; +mod packetiser; +pub use packetiser::get_packetiser_adts; + const MAX_WINDOWS: usize = 8; const MAX_SFBS: usize = 64; @@ -62,7 +68,7 @@ impl ICSInfo { let ics_reserved_bit = br.read(1)?; validate!(ics_reserved_bit == 0); self.window_sequence = br.read(2)? as u8; - match self.prev_window_sequence { + /*match self.prev_window_sequence { ONLY_LONG_SEQUENCE | LONG_STOP_SEQUENCE => { if (self.window_sequence != ONLY_LONG_SEQUENCE) && (self.window_sequence != LONG_START_SEQUENCE) { @@ -76,7 +82,7 @@ impl ICSInfo { } }, _ => {}, - }; + };*/ self.window_shape = br.read_bool()?; self.window_groups = 1; if self.window_sequence == EIGHT_SHORT_SEQUENCE { @@ -181,6 +187,9 @@ impl ICS { fn get_intensity_dir(&self, g: usize, sfb: usize) -> bool { self.sfb_cb[g][sfb] == INTENSITY_HCB } + fn is_noise(&self, g: usize, sfb: usize) -> bool { + self.sfb_cb[g][sfb] == NOISE_HCB + } fn decode_scale_factor_data(&mut self, br: &mut BitReader, codebooks: &Codebooks) -> DecoderResult<()> { decode_scale_factor_data(br, &mut self.scales, self.global_gain, &self.info, &self.sfb_cb, codebooks) } @@ -288,6 +297,10 @@ struct ChannelPair { ms_mask_present: u8, ms_used: [[bool; MAX_SFBS]; MAX_WINDOWS], ics: [ICS; 2], + sbr_hdr: SBRHeader, + sbr_state: SBRState, + sbr_ch: [SBRChannel; 2], + do_sbr: bool, } impl ChannelPair { @@ -298,6 +311,10 @@ impl ChannelPair { ms_mask_present: 0, ms_used: [[false; MAX_SFBS]; MAX_WINDOWS], ics: [ICS::new(sbinfo), ICS::new(sbinfo)], + sbr_hdr: SBRHeader::new(), + sbr_state: SBRState::new(), + sbr_ch: [SBRChannel::new(), SBRChannel::new()], + do_sbr: false, } } fn decode_ga_sce(&mut self, br: &mut BitReader, codebooks: &Codebooks, m4atype: M4AType) -> DecoderResult<()> { @@ -317,12 +334,14 @@ impl ChannelPair { self.ms_used[g][sfb] = br.read_bool()?; } } + } else { + self.ms_used = [[false; MAX_SFBS]; MAX_WINDOWS]; } self.ics[1].info = self.ics[0].info; } self.ics[0].decode_ics(br, codebooks, m4atype, common_window, true)?; self.ics[1].decode_ics(br, codebooks, m4atype, common_window, true)?; - if common_window && self.ms_mask_present != 0 { + if common_window { let mut g = 0; for w in 0..self.ics[0].info.num_windows { if w > 0 && !self.ics[0].info.scale_factor_grouping[w - 1] { @@ -331,11 +350,11 @@ impl ChannelPair { for sfb in 0..self.ics[0].info.max_sfb { let start = w * 128 + self.ics[0].get_band_start(sfb); let end = w * 128 + self.ics[0].get_band_start(sfb + 1); - if self.ics[0].is_intensity(g, sfb) { + if self.ics[1].is_intensity(g, sfb) { let invert = (self.ms_mask_present == 1) && self.ms_used[g][sfb]; - let dir = self.ics[0].get_intensity_dir(g, sfb) ^ invert; - let scale = 0.5f32.powf(0.25 * (f32::from(self.ics[0].scales[g][sfb]) + f32::from(INTENSITY_SCALE_MIN))); - if !dir { + let dir = self.ics[1].get_intensity_dir(g, sfb) ^ invert; + let scale = 0.5f32.powf(0.25 * (f32::from(self.ics[1].scales[g][sfb]) + f32::from(INTENSITY_SCALE_MIN))); + if dir { for i in start..end { self.ics[1].coeffs[i] = scale * self.ics[0].coeffs[i]; } @@ -344,7 +363,7 @@ impl ChannelPair { self.ics[1].coeffs[i] = -scale * self.ics[0].coeffs[i]; } } - } else if (self.ms_mask_present == 2) || self.ms_used[g][sfb] { + } else if ((self.ms_mask_present == 2) || self.ms_used[g][sfb]) && !self.ics[0].is_noise(g, sfb) { for i in start..end { let tmp = self.ics[0].coeffs[i] - self.ics[1].coeffs[i]; self.ics[0].coeffs[i] += self.ics[1].coeffs[i]; @@ -356,14 +375,59 @@ impl ChannelPair { } Ok(()) } - fn synth_audio(&mut self, dsp: &mut DSP, abuf: &mut NABufferType, srate_idx: usize) { + fn decode_sbr(&mut self, buf: &[u8], has_crc: bool, cbs: &SBRCodebooks, srate: u32) -> DecoderResult<()> { + let mut br = BitReader::new(buf, BitReaderMode::BE); + if has_crc { + let _bs_sbr_crc_bits = br.read(10)?; + } + if br.read_bool()? { + if let Ok(hdr) = SBRHeader::read(&mut br) { + if self.sbr_hdr.differs_from(&hdr) { + self.do_sbr = self.sbr_state.init(&hdr, srate).is_ok(); + self.sbr_ch[0].reset(); + self.sbr_ch[1].reset(); + } + self.sbr_hdr = hdr; + } else { + self.do_sbr = false; + } + } + if self.do_sbr { + if !self.pair { + sbr_read_sce(&mut br, self.sbr_hdr.amp_res, &self.sbr_state, cbs, &mut self.sbr_ch[0])?; + } else { + sbr_read_cpe(&mut br, self.sbr_hdr.amp_res, &self.sbr_state, cbs, &mut self.sbr_ch)?; + } + } + + Ok(()) + } + fn synth_audio(&mut self, dsp: &mut DSP, abuf: &mut NABufferType, srate_idx: usize, upsample: bool) { let mut adata = abuf.get_abuf_f32().unwrap(); let output = adata.get_data_mut().unwrap(); let off0 = abuf.get_offset(self.channel); let off1 = abuf.get_offset(self.channel + 1); - self.ics[0].synth_channel(dsp, &mut output[off0..], srate_idx); - if self.pair { - self.ics[1].synth_channel(dsp, &mut output[off1..], srate_idx); + if !upsample { + self.ics[0].synth_channel(dsp, &mut output[off0..], srate_idx); + if self.pair { + self.ics[1].synth_channel(dsp, &mut output[off1..], srate_idx); + } + } else { + let mut tmp = [0.0; 1024]; + let nchannels = if self.pair { 2 } else { 1 }; + for ch in 0..nchannels { + let off = if ch == 0 { off0 } else { off1 }; + self.ics[ch].synth_channel(dsp, &mut tmp, srate_idx); + self.sbr_ch[ch].analysis(&mut dsp.sbr_dsp, &tmp); + if self.do_sbr { + self.sbr_ch[ch].hf_generate(&self.sbr_state); + self.sbr_ch[ch].hf_adjust(&self.sbr_state, &self.sbr_hdr); + } else { + self.sbr_ch[ch].bypass(); + } + self.sbr_ch[ch].synthesis(&mut dsp.sbr_dsp, &mut output[off..][..2048]); + self.sbr_ch[ch].update_frame(); + } } } } @@ -377,6 +441,7 @@ struct DSP { imdct_short: IMDCT, tmp: [f32; 2048], ew_buf: [f32; 1152], + sbr_dsp: SBRDSP, } const SHORT_WIN_POINT0: usize = 512 - 64; @@ -398,6 +463,7 @@ impl DSP { imdct_long: IMDCT::new(1024 * 2, true), imdct_short: IMDCT::new(128 * 2, true), tmp: [0.0; 2048], ew_buf: [0.0; 1152], + sbr_dsp: SBRDSP::new(), } } #[allow(clippy::cognitive_complexity)] @@ -419,9 +485,7 @@ impl DSP { self.ew_buf[w * 128 + i] += src[i] * short_win[i]; } } else { // to be left-windowed - for i in 0..128 { - self.ew_buf[i] = src[i]; - } + self.ew_buf[..128].copy_from_slice(&src[..128]); } for i in 0..128 { self.ew_buf[w * 128 + i + 128] += src[i + 128] * short_win[127 - i]; @@ -443,55 +507,45 @@ impl DSP { } }, EIGHT_SHORT_SEQUENCE => { - for i in 0..SHORT_WIN_POINT0 { - dst[i] = delay[i]; - } + dst[..SHORT_WIN_POINT0].copy_from_slice(&delay[..SHORT_WIN_POINT0]); for i in SHORT_WIN_POINT0..SHORT_WIN_POINT1 { let j = i - SHORT_WIN_POINT0; dst[i] = delay[i] + self.ew_buf[j] * left_short_win[j]; } - for i in SHORT_WIN_POINT1..1024 { - let j = i - SHORT_WIN_POINT0; - dst[i] = self.ew_buf[j]; - } + dst[SHORT_WIN_POINT1..1024].copy_from_slice( + &self.ew_buf[SHORT_WIN_POINT1-SHORT_WIN_POINT0..1024-SHORT_WIN_POINT0]); }, LONG_STOP_SEQUENCE => { - for i in 0..SHORT_WIN_POINT0 { - dst[i] = delay[i]; - } + dst[..SHORT_WIN_POINT0].copy_from_slice(&delay[..SHORT_WIN_POINT0]); for i in SHORT_WIN_POINT0..SHORT_WIN_POINT1 { dst[i] = delay[i] + self.tmp[i] * left_short_win[i - SHORT_WIN_POINT0]; } - for i in SHORT_WIN_POINT1..1024 { - dst[i] = self.tmp[i]; - } + dst[SHORT_WIN_POINT1..1024].copy_from_slice(&self.tmp[SHORT_WIN_POINT1..1024]); }, _ => unreachable!(""), }; // save delay match seq { ONLY_LONG_SEQUENCE | LONG_STOP_SEQUENCE => { - for i in 0..1024 { - delay[i] = self.tmp[i + 1024] * long_win[1023 - i]; + for (dst, (&src, &win)) in delay.iter_mut() + .zip(self.tmp[1024..].iter().zip(long_win.iter().rev())) { + *dst = src * win; } }, EIGHT_SHORT_SEQUENCE => { - for i in 0..SHORT_WIN_POINT1 { // last part is already windowed - delay[i] = self.ew_buf[i + 512+64]; - } - for i in SHORT_WIN_POINT1..1024 { - delay[i] = 0.0; + // last part is already windowed + delay[..SHORT_WIN_POINT1].copy_from_slice(&self.ew_buf[512+64..][..SHORT_WIN_POINT1]); + for el in delay[SHORT_WIN_POINT1..].iter_mut() { + *el = 0.0; } }, LONG_START_SEQUENCE => { - for i in 0..SHORT_WIN_POINT0 { - delay[i] = self.tmp[i + 1024]; - } + delay[..SHORT_WIN_POINT0].copy_from_slice(&self.tmp[1024..][..SHORT_WIN_POINT0]); for i in SHORT_WIN_POINT0..SHORT_WIN_POINT1 { delay[i] = self.tmp[i + 1024] * short_win[127 - (i - SHORT_WIN_POINT0)]; } - for i in SHORT_WIN_POINT1..1024 { - delay[i] = 0.0; + for el in delay[SHORT_WIN_POINT1..].iter_mut() { + *el = 0.0; } }, _ => unreachable!(""), @@ -507,6 +561,8 @@ struct AACDecoder { codebooks: Codebooks, dsp: DSP, sbinfo: GASubbandInfo, + sbr_cbs: SBRCodebooks, + upsample: bool, } impl AACDecoder { @@ -519,6 +575,8 @@ impl AACDecoder { codebooks: Codebooks::new(), dsp: DSP::new(), sbinfo: AAC_SUBBAND_INFO[0], + sbr_cbs: SBRCodebooks::new(), + upsample: false, } } fn set_pair(&mut self, pair_no: usize, channel: usize, pair: bool) -> DecoderResult<()> { @@ -564,8 +622,8 @@ impl AACDecoder { 4 => { // ID_DSE let _id = br.read(4)?; let align = br.read_bool()?; - let mut count = br.read(8)? as u32; - if count == 255 { count += br.read(8)? as u32; } + let mut count = br.read(8)?; + if count == 255 { count += br.read(8)?; } if align { br.align(); } br.skip(count * 8)?; // no SBR payload or such }, @@ -578,9 +636,28 @@ impl AACDecoder { count += br.read(8)? as usize; count -= 1; } - for _ in 0..count { - // ext payload + if count > 0 { + let extension_type = br.read(4)?; + match extension_type { + 0xD | 0xE => { // SBR data without or with CRC + let has_crc = extension_type == 0xE; + + let mut buf = [0; 256 + 16]; + for el in buf[..count - 1].iter_mut() { + *el = br.read(8)? as u8; + } + buf[count - 1] = br.read(4)? as u8; + if cur_pair > 0 { + self.pairs[cur_pair - 1].decode_sbr(&buf[..count], has_crc, &self.sbr_cbs, self.m4ainfo.srate * 2)?; + } + }, + _ => { + for _ in 0..count-1 { br.skip(8)?; + } + br.skip(4)?; + }, + }; } }, 7 => { // ID_TERM @@ -591,7 +668,7 @@ impl AACDecoder { } let srate_idx = GASubbandInfo::find_idx(self.m4ainfo.srate); for pair in 0..cur_pair { - self.pairs[pair].synth_audio(&mut self.dsp, abuf, srate_idx); + self.pairs[pair].synth_audio(&mut self.dsp, abuf, srate_idx, self.upsample); } Ok(()) } @@ -603,7 +680,6 @@ impl NADecoder for AACDecoder { let edata = info.get_extradata().unwrap(); validate!(edata.len() >= 2); -//print!("edata:"); for s in edata.iter() { print!(" {:02X}", *s);}println!(""); if (edata.len() > 12) && (&edata[4..8] == b"esds") { let mut mr = MemoryReader::new_read(edata.as_slice()); let mut br = ByteReader::new(&mut mr); @@ -665,8 +741,15 @@ impl NADecoder for AACDecoder { } self.sbinfo = GASubbandInfo::find(self.m4ainfo.srate); - let ainfo = NAAudioInfo::new(self.m4ainfo.srate, self.m4ainfo.channels as u8, - SND_F32P_FORMAT, self.m4ainfo.samples); + self.upsample = self.m4ainfo.srate < 32000; + let (srate, samples) = if !self.upsample { + (self.m4ainfo.srate, self.m4ainfo.samples) + } else { + (self.m4ainfo.srate * 2, self.m4ainfo.samples * 2) + }; + + let ainfo = NAAudioInfo::new(srate, self.m4ainfo.channels as u8, + SND_F32P_FORMAT, samples); self.info = info.replace_info(NACodecTypeInfo::Audio(ainfo)); if self.m4ainfo.channels >= DEFAULT_CHANNEL_MAP.len() { @@ -687,7 +770,8 @@ impl NADecoder for AACDecoder { let pktbuf = pkt.get_buffer(); let ainfo = self.info.get_properties().get_audio_info().unwrap(); - let mut abuf = alloc_audio_buffer(ainfo, self.m4ainfo.samples, self.chmap.clone())?; + let samples = if !self.upsample { self.m4ainfo.samples } else { self.m4ainfo.samples * 2 }; + let mut abuf = alloc_audio_buffer(ainfo, samples, self.chmap.clone())?; let mut br = BitReader::new(&pktbuf, BitReaderMode::BE); match self.m4ainfo.otype { @@ -726,6 +810,8 @@ mod test { use nihav_codec_support::test::dec_video::test_decode_audio; use crate::mpeg_register_all_decoders; use nihav_realmedia::realmedia_register_all_demuxers; + use std::io::Read; + #[test] fn test_aac() { let mut dmx_reg = RegisteredDemuxers::new(); @@ -737,6 +823,34 @@ mod test { let file = "assets/RV/rv40_weighted_mc_2.rmvb"; test_decode_audio("realmedia", file, Some(12000), None/*Some("aac")*/, &dmx_reg, &dec_reg); } + #[test] + fn test_aac_sbr() { + let mut dmx_reg = RegisteredDemuxers::new(); + nihav_commonfmt::generic_register_all_demuxers(&mut dmx_reg); + let mut dec_reg = RegisteredDecoders::new(); + mpeg_register_all_decoders(&mut dec_reg); + + let file = "assets/MPEG/SBRtestStereoAot29Sig0.mp4"; + test_decode_audio("mov", file, Some(400), None/*Some("aacsbr")*/, &dmx_reg, &dec_reg); + } + #[test] + fn test_adts_packetiser() { + let mut buf = [0; 4096]; + // sample obtained with yt-dlp -f 234 + let mut file = std::fs::File::open("assets/MPEG/Vf9Lvifxwk4.adts").unwrap(); + + let mut pkts = super::get_packetiser_adts(); + file.read_exact(&mut buf).unwrap(); + pkts.add_data(&buf); + let stream = pkts.parse_stream(0).unwrap(); + let mut frame_sizes = Vec::with_capacity(15); + while let Some(pkt) = pkts.get_packet(stream.clone()).unwrap() { + let frame_size = pkt.get_buffer().len(); + println!("pkt size {}", frame_size); + frame_sizes.push(frame_size); + } + assert_eq!(&frame_sizes, &[371, 372, 394, 402, 474, 400, 407, 399, 385]); + } } const DEFAULT_CHANNEL_MAP: [&str; 9] = [