nihav_itu: ignore high-profile extradata tail when it is not correct
[nihav.git] / nihav-itu / src / codecs / h264 / decoder_mt.rs
CommitLineData
11d7aef2
KS
1use nihav_core::codecs::*;
2use nihav_core::io::bitreader::*;
3
4use super::*;
5use super::dispatch::*;
6
cc818ce8
KS
7const AVG_BUF_VINFO: NAVideoInfo = NAVideoInfo { width: 32, height: 32, flipped: false, format: YUV420_FORMAT, bits: 12 };
8
11d7aef2
KS
9pub struct FrameDecoder {
10 pub slices: Vec<(SliceHeader, usize, SliceRefs, Vec<u8>)>,
11 pub cur_pic: PictureInfo,
12 sps: Arc<SeqParameterSet>,
13 pps: Arc<PicParameterSet>,
14 pub num_mbs: usize,
15 mc_dsp: H264MC,
16 dispatch: Shareable<ThreadDispatcher>,
17 sstate: SliceState,
18 cavlc_cb: Arc<CAVLCTables>,
19 ipcm_buf: [u8; 256 + 64 + 64],
20 is_mbaff: bool,
21 deblock_skip: bool,
22}
23
24impl FrameDecoder {
25 pub fn decode_slice(&mut self, hdr: &SliceHeader, hdr_size: usize, refs: &SliceRefs, nal: &[u8]) -> DecoderResult<usize> {
26 self.sstate.reset(self.sps.pic_width_in_mbs, self.sps.pic_height_in_mbs, hdr.first_mb_in_slice);
27
28 let mut full_size = nal.len() * 8;
29 for &byte in nal.iter().rev() {
30 if byte == 0 {
31 full_size -= 8;
32 } else {
33 full_size -= (byte.trailing_zeros() + 1) as usize;
34 break;
35 }
36 }
37 validate!(full_size > 0);
38
5f223cdb
KS
39 let sslice_refs = SimplifiedSliceRefs::new(refs);
40
11d7aef2 41 let mut br = BitReader::new(&nal[hdr_size / 8..], BitReaderMode::BE);
fe64781d
KS
42 let mut dst_pic = self.cur_pic.clone();
43 let mut dst_frm = NASimpleVideoFrame::from_video_buf(&mut dst_pic.buf).unwrap();
11d7aef2
KS
44 if !self.pps.entropy_coding_mode {
45 br.skip((hdr_size & 7) as u32)?;
fe64781d 46 self.decode_slice_cavlc(&mut br, full_size - (hdr_size & !7), hdr, &sslice_refs, &mut dst_frm)
11d7aef2
KS
47 } else {
48 let csrc = &nal[(hdr_size + 7) / 8..];
49 validate!(csrc.len() >= 2);
50 let mut cabac = CABAC::new(csrc, hdr.slice_type, hdr.slice_qp, hdr.cabac_init_idc as usize)?;
fe64781d 51 self.decode_slice_cabac(&mut cabac, hdr, &sslice_refs, &mut dst_frm)
11d7aef2
KS
52 }
53 }
fe64781d 54 fn decode_slice_cavlc(&mut self, br: &mut BitReader, full_size: usize, slice_hdr: &SliceHeader, refs: &SimplifiedSliceRefs, frm: &mut NASimpleVideoFrame<u8>) -> DecoderResult<usize> {
11d7aef2
KS
55 const INTRA_CBP: [u8; 48] = [
56 47, 31, 15, 0, 23, 27, 29, 30, 7, 11, 13, 14, 39, 43, 45, 46,
57 16, 3, 5, 10, 12, 19, 21, 26, 28, 35, 37, 42, 44, 1, 2, 4,
58 8, 17, 18, 20, 24, 6, 9, 22, 25, 32, 33, 34, 36, 40, 38, 41
59 ];
60 const INTER_CBP: [u8; 48] = [
61 0, 16, 1, 2, 4, 8, 32, 3, 5, 10, 12, 15, 47, 7, 11, 13,
62 14, 6, 9, 31, 35, 37, 42, 44, 33, 34, 36, 40, 39, 43, 45, 46,
63 17, 18, 20, 24, 19, 21, 26, 28, 23, 27, 29, 30, 22, 25, 38, 41
64 ];
65
e6aaad5c 66 let mut mb_idx = slice_hdr.first_mb_in_slice;
11d7aef2
KS
67 let mut mb_info = CurrentMBInfo { qp_y: slice_hdr.slice_qp, ..Default::default() };
68 let skip_type = if slice_hdr.slice_type.is_p() { MBType::PSkip } else { MBType::BSkip };
69 while br.tell() < full_size && mb_idx < self.num_mbs {
70 mb_info.coded = [false; 25];
71 mb_info.ref_l0 = [ZERO_REF; 4];
72 mb_info.ref_l1 = [ZERO_REF; 4];
73 mb_info.mv_l0 = [ZERO_MV; 16];
74 mb_info.mv_l1 = [ZERO_MV; 16];
75 mb_info.chroma_dc = [[0; 4]; 2];
76 mb_info.cbpy = 0;
77 mb_info.cbpc = 0;
78
79 if !slice_hdr.slice_type.is_intra() {
80 let mb_skip_run = br.read_ue()? as usize;
81 validate!(mb_idx + mb_skip_run <= self.num_mbs);
82 mb_info.mb_type = skip_type;
83 for _ in 0..mb_skip_run {
fe64781d 84 self.handle_macroblock(slice_hdr, &mut mb_info, refs, frm)?;
11d7aef2
KS
85 mb_idx += 1;
86 }
87 if mb_idx == self.num_mbs || br.tell() >= full_size {
88 break;
89 }
90 }
91 if br.tell() < full_size {
92 if self.is_mbaff && ((mb_idx & 1) == 0) {
93 let _mb_field_decoding = br.read_bool()?;
94 }
95 let mut mb_type = decode_mb_type_cavlc(br, slice_hdr)?;
96 mb_info.mb_type = mb_type;
97 mb_info.transform_size_8x8 = false;
98 if mb_type == MBType::PCM {
99 br.align();
100 for pix in self.ipcm_buf[..256 + 64 + 64].iter_mut() {
101 *pix = br.read(8)? as u8;
102 }
103 self.sstate.fill_ncoded(16);
104 } else {
105 if self.pps.transform_8x8_mode && mb_type == MBType::Intra4x4 {
106 mb_info.transform_size_8x8 = br.read_bool()?;
107 if mb_info.transform_size_8x8 {
108 mb_type = MBType::Intra8x8;
109 mb_info.mb_type = MBType::Intra8x8;
110 }
111 }
112 decode_mb_pred_cavlc(br, slice_hdr, mb_type, &mut self.sstate, &mut mb_info)?;
113 let (cbpy, cbpc) = if let MBType::Intra16x16(_, cbpy, cbpc) = mb_type {
114 (cbpy, cbpc)
115 } else {
116 let cbp_id = br.read_ue()? as usize;
117 validate!(cbp_id < INTRA_CBP.len());
118 let cbp = if mb_type == MBType::Intra4x4 || mb_type == MBType::Intra8x8 {
119 INTRA_CBP[cbp_id]
120 } else {
121 INTER_CBP[cbp_id]
122 };
123 if self.pps.transform_8x8_mode && (cbp & 0xF) != 0 && mb_info.can_have_8x8_tx(self.sps.direct_8x8_inference) {
124 mb_info.transform_size_8x8 = br.read_bool()?;
125 }
126 ((cbp & 0xF), (cbp >> 4))
127 };
128 mb_info.cbpy = cbpy;
129 mb_info.cbpc = cbpc;
130 self.sstate.get_cur_mb().cbp = (cbpc << 4) | cbpy;
131 if cbpy != 0 || cbpc != 0 || mb_type.is_intra16x16() {
132 let mb_qp_delta = br.read_se()?;
133 validate!(mb_qp_delta >= -26 && mb_qp_delta <= 25);
134 let new_qp = mb_qp_delta + i32::from(mb_info.qp_y);
135 mb_info.qp_y = if new_qp < 0 {
136 (new_qp + 52) as u8
137 } else if new_qp >= 52 {
138 (new_qp - 52) as u8
139 } else {
140 new_qp as u8
141 };
142 mb_info.coeffs = [[0; 16]; 25];
143 if self.pps.transform_8x8_mode {
144 mb_info.clear_coeffs8x8();
145 }
146 mb_info.chroma_dc = [[0; 4]; 2];
147 decode_residual_cavlc(br, &mut self.sstate, &mut mb_info, &self.cavlc_cb)?;
148 }
149 }
fe64781d 150 self.handle_macroblock(slice_hdr, &mut mb_info, refs, frm)?;
11d7aef2
KS
151 }
152 mb_idx += 1;
153 if let Ok(disp) = self.dispatch.read() {
154 disp.update_pos(self.cur_pic.full_id, mb_idx);
155 }
156 }
157 Ok(mb_idx)
158 }
fe64781d 159 fn decode_slice_cabac(&mut self, cabac: &mut CABAC, slice_hdr: &SliceHeader, refs: &SimplifiedSliceRefs, frm: &mut NASimpleVideoFrame<u8>) -> DecoderResult<usize> {
e6aaad5c 160 let mut mb_idx = slice_hdr.first_mb_in_slice;
11d7aef2
KS
161 let mut prev_mb_skipped = false;
162 let skip_type = if slice_hdr.slice_type.is_p() { MBType::PSkip } else { MBType::BSkip };
163 let mut last_qp_diff = false;
164
165 let mut mb_info = CurrentMBInfo { qp_y: slice_hdr.slice_qp, ..Default::default() };
166
167 while mb_idx < self.num_mbs {
168 mb_info.coded = [false; 25];
169 mb_info.ref_l0 = [ZERO_REF; 4];
170 mb_info.ref_l1 = [ZERO_REF; 4];
171 mb_info.mv_l0 = [ZERO_MV; 16];
172 mb_info.mv_l1 = [ZERO_MV; 16];
173 mb_info.chroma_dc = [[0; 4]; 2];
174 mb_info.cbpy = 0;
175 mb_info.cbpc = 0;
176 let mb_skip = cabac_decode_mbskip(cabac, &self.sstate, slice_hdr);
177 if !mb_skip {
178 if self.is_mbaff && (((mb_idx & 1) == 0) || (prev_mb_skipped && ((mb_idx & 1) == 1))) {
179 let _mb_field_decoding = cabac.decode_bit(70);
180 }
181 let mut mb_type = cabac_decode_mb_type(cabac, slice_hdr, &self.sstate);
182 mb_info.mb_type = mb_type;
183 mb_info.transform_size_8x8 = false;
184 if mb_type == MBType::PCM {
185 let ipcm_size = 256 + 64 + 64;
186 validate!(cabac.pos + ipcm_size <= cabac.src.len());
187 self.ipcm_buf[..ipcm_size].copy_from_slice(&cabac.src[cabac.pos..][..ipcm_size]);
188 cabac.pos += ipcm_size;
189 cabac.reinit()?;
190 last_qp_diff = false;
191 } else {
192 if self.pps.transform_8x8_mode && mb_type == MBType::Intra4x4 {
193 let mut ctx = 0;
194 if self.sstate.get_top_mb().transform_8x8 {
195 ctx += 1;
196 }
197 if self.sstate.get_left_mb().transform_8x8 {
198 ctx += 1;
199 }
200 mb_info.transform_size_8x8 = cabac.decode_bit(399 + ctx);
201 if mb_info.transform_size_8x8 {
202 mb_type = MBType::Intra8x8;
203 mb_info.mb_type = MBType::Intra8x8;
204 }
205 }
206 decode_mb_pred_cabac(cabac, slice_hdr, mb_type, &mut self.sstate, &mut mb_info);
207 let (cbpy, cbpc) = if let MBType::Intra16x16(_, cbpy, cbpc) = mb_type {
208 (cbpy, cbpc)
209 } else {
210 decode_cbp_cabac(cabac, &self.sstate)
211 };
212 if self.pps.transform_8x8_mode && cbpy != 0 && mb_info.can_have_8x8_tx(self.sps.direct_8x8_inference) {
213 let mut ctx = 0;
214 if self.sstate.get_top_mb().transform_8x8 {
215 ctx += 1;
216 }
217 if self.sstate.get_left_mb().transform_8x8 {
218 ctx += 1;
219 }
220 mb_info.transform_size_8x8 = cabac.decode_bit(399 + ctx);
221 }
222 if mb_type.is_intra() {
223 self.sstate.get_cur_mb().cmode = mb_info.chroma_ipred;
224 }
225 mb_info.cbpy = cbpy;
226 mb_info.cbpc = cbpc;
227 self.sstate.get_cur_mb().cbp = (cbpc << 4) | cbpy;
228 if cbpy != 0 || cbpc != 0 || mb_type.is_intra16x16() {
229 let mb_qp_delta = decode_mb_qp_delta_cabac(cabac, last_qp_diff as usize);
230 validate!(mb_qp_delta >= -26 && mb_qp_delta <= 25);
231 last_qp_diff = mb_qp_delta != 0;
232 let new_qp = mb_qp_delta + i32::from(mb_info.qp_y);
233 mb_info.qp_y = if new_qp < 0 {
234 (new_qp + 52) as u8
235 } else if new_qp >= 52 {
236 (new_qp - 52) as u8
237 } else {
238 new_qp as u8
239 };
240 mb_info.coeffs = [[0; 16]; 25];
241 if self.pps.transform_8x8_mode {
242 mb_info.clear_coeffs8x8();
243 }
244 mb_info.chroma_dc = [[0; 4]; 2];
245 decode_residual_cabac(cabac, &mut self.sstate, &mut mb_info);
246 } else {
247 last_qp_diff = false;
248 }
249 }
250 } else {
251 mb_info.mb_type = skip_type;
252 mb_info.transform_size_8x8 = false;
253 last_qp_diff = false;
254 }
fe64781d 255 self.handle_macroblock(slice_hdr, &mut mb_info, refs, frm)?;
11d7aef2
KS
256 prev_mb_skipped = mb_skip;
257 if !(self.is_mbaff && ((mb_idx & 1) == 0)) && cabac.decode_terminate() {
258 if let Ok(disp) = self.dispatch.read() {
259 disp.update_pos(self.cur_pic.full_id, mb_idx + 1);
260 }
261 return Ok(mb_idx + 1);
262 }
263 mb_idx += 1;
264 if let Ok(disp) = self.dispatch.read() {
265 disp.update_pos(self.cur_pic.full_id, mb_idx);
266 }
267 }
268 Err(DecoderError::InvalidData)
269 }
270 #[allow(clippy::cognitive_complexity)]
fe64781d 271 fn handle_macroblock(&mut self, slice_hdr: &SliceHeader, mb_info: &mut CurrentMBInfo, refs: &SimplifiedSliceRefs, frm: &mut NASimpleVideoFrame<u8>) -> DecoderResult<()> {
11d7aef2
KS
272 let qp_y = mb_info.qp_y;
273 let qpr = ((qp_y as i8) + self.pps.chroma_qp_index_offset).max(0).min(51) as usize;
274 let qp_u = CHROMA_QUANTS[qpr];
275 let qpb = ((qp_y as i8) + self.pps.second_chroma_qp_index_offset).max(0).min(51) as usize;
276 let qp_v = CHROMA_QUANTS[qpb];
277
278 let tx_bypass = qp_y == 0 && self.sps.qpprime_y_zero_transform_bypass;
279
280 self.sstate.get_cur_mb().mb_type = mb_info.mb_type.into();
281 if mb_info.mb_type != MBType::PCM {
282 self.sstate.get_cur_mb().qp_y = qp_y;
283 self.sstate.get_cur_mb().qp_u = qp_u;
284 self.sstate.get_cur_mb().qp_v = qp_v;
285 self.sstate.get_cur_mb().transform_8x8 = mb_info.transform_size_8x8;
286 }
287 let has_dc = mb_info.mb_type.is_intra16x16() && mb_info.coded[24];
288 if has_dc {
289 idct_luma_dc(&mut mb_info.coeffs[24], qp_y);
290 for i in 0..16 {
291 mb_info.coeffs[i][0] = mb_info.coeffs[24][i];
292 }
293 }
294 if !mb_info.transform_size_8x8 {
295 let quant_dc = !mb_info.mb_type.is_intra16x16();
fe64781d
KS
296 if quant_dc {
297 for i in 0..16 {
298 if mb_info.coded[i] {
299 if !tx_bypass {
300 idct(&mut mb_info.coeffs[i], qp_y);
301 }
302 } else if has_dc {
303 if !tx_bypass {
304 idct_dc(&mut mb_info.coeffs[i], qp_y, quant_dc);
305 }
306 mb_info.coded[i] = true;
11d7aef2 307 }
fe64781d
KS
308 }
309 } else {
310 for i in 0..16 {
311 if mb_info.coded[i] {
312 if !tx_bypass {
313 idct_skip_dc(&mut mb_info.coeffs[i], qp_y);
314 }
315 } else if has_dc {
316 if !tx_bypass {
317 idct_dc(&mut mb_info.coeffs[i], qp_y, quant_dc);
318 }
319 mb_info.coded[i] = true;
11d7aef2 320 }
11d7aef2
KS
321 }
322 }
323 } else {
324 for i in 0..4 {
325 if mb_info.coded[(i & 1) * 2 + (i & 2) * 4] && !tx_bypass {
326 dequant8x8(&mut mb_info.coeffs8x8[i].coeffs, &self.pps.scaling_list_8x8[!mb_info.mb_type.is_intra() as usize]);
327 idct8x8(&mut mb_info.coeffs8x8[i].coeffs, qp_y);
328 }
329 }
330 }
331 for chroma in 0..2 {
332 let qp_c = if chroma == 0 { qp_u } else { qp_v };
333 if mb_info.cbpc != 0 {
334 chroma_dc_transform(&mut mb_info.chroma_dc[chroma], qp_c);
335 }
336 for i in 0..4 {
337 let blk_no = 16 + chroma * 4 + i;
338 mb_info.coeffs[blk_no][0] = mb_info.chroma_dc[chroma][i];
339 if mb_info.coded[blk_no] {
fe64781d 340 idct_skip_dc(&mut mb_info.coeffs[blk_no], qp_c);
11d7aef2
KS
341 } else if mb_info.coeffs[blk_no][0] != 0 {
342 idct_dc(&mut mb_info.coeffs[blk_no], qp_c, false);
343 mb_info.coded[blk_no] = true;
344 }
345 }
346 }
347 if !self.pps.entropy_coding_mode || mb_info.mb_type.is_skip() || mb_info.mb_type.is_intra() {
348 self.sstate.reset_mb_mv();
349 }
350 if !mb_info.mb_type.is_intra() {
351 let temporal_mv = !slice_hdr.direct_spatial_mv_pred;
352 let cur_id = self.cur_pic.full_id as u16;
353 // wait for the reference macroblock MV to be available
354 if matches!(mb_info.mb_type, MBType::Direct | MBType::BSkip | MBType::B8x8) {
355 if let Some(ref_id) = refs.get_ref_id(0, mb_info.ref_l1[0].index()) {
356 wait_for_mb(&self.dispatch, &self.sstate, self.sstate.mb_x * 16, self.sstate.mb_y * 16, ZERO_MV, ref_id)?;
357 }
358 }
359 Self::pred_mv(&mut self.sstate, refs, mb_info, cur_id, temporal_mv, self.sps.direct_8x8_inference);
360 }
361 if !self.pps.constrained_intra_pred && mb_info.mb_type != MBType::Intra4x4 && mb_info.mb_type != MBType::Intra8x8 {
362 self.sstate.fill_ipred(IntraPredMode::DC);
363 }
364
365 let xpos = self.sstate.mb_x * 16;
366 let ypos = self.sstate.mb_y * 16;
11d7aef2
KS
367 if mb_info.mb_type != MBType::PCM {
368 let weight_mode = if self.pps.weighted_pred && slice_hdr.slice_type.is_p() {
369 1
370 } else if slice_hdr.slice_type.is_b() {
371 self.pps.weighted_bipred_idc
372 } else {
373 0
374 };
fe64781d 375 recon_mb_mt(frm, slice_hdr, mb_info, &mut self.sstate, refs, &mut self.mc_dsp, weight_mode, &self.dispatch)?;
11d7aef2
KS
376 } else {
377 for (dline, src) in frm.data[frm.offset[0] + xpos + ypos * frm.stride[0]..].chunks_mut(frm.stride[0]).take(16).zip(self.ipcm_buf.chunks(16)) {
378 dline[..16].copy_from_slice(src);
379 }
380 for (dline, src) in frm.data[frm.offset[1] + xpos/2 + ypos/2 * frm.stride[1]..].chunks_mut(frm.stride[1]).take(8).zip(self.ipcm_buf[256..].chunks(8)) {
381 dline[..8].copy_from_slice(src);
382 }
383 for (dline, src) in frm.data[frm.offset[2] + xpos/2 + ypos/2 * frm.stride[2]..].chunks_mut(frm.stride[2]).take(8).zip(self.ipcm_buf[256 + 64..].chunks(8)) {
384 dline[..8].copy_from_slice(src);
385 }
386 }
fe64781d 387 self.sstate.save_ipred_context(frm);
11d7aef2
KS
388
389 let mv_info = &mut self.cur_pic.mv_info;
390 let mb_pos = self.sstate.mb_x + self.sstate.mb_y * mv_info.mb_stride;
391 let mut mb = FrameMBInfo::new();
392 mb.mb_type = mb_info.mb_type.into();
393 for blk4 in 0..16 {
394 mb.mv[blk4] = self.sstate.get_cur_blk4(blk4).mv;
395 }
396 for blk8 in 0..4 {
397 mb.ref_poc[blk8] = refs.map_refs(self.sstate.get_cur_blk8(blk8).ref_idx);
398 mb.ref_idx[blk8] = self.sstate.get_cur_blk8(blk8).ref_idx;
399 }
400 mv_info.mbs[mb_pos] = mb;
401
402 let deblock_mode = slice_hdr.disable_deblocking_filter_idc;
403 if !self.deblock_skip && deblock_mode != 1 {
404 let is_s = slice_hdr.slice_type == SliceType::SI || slice_hdr.slice_type == SliceType::SP;
405 self.sstate.fill_deblock(refs, deblock_mode, is_s);
406 let mut frm = NASimpleVideoFrame::from_video_buf(&mut self.cur_pic.buf).unwrap();
407 let lf_alpha = slice_hdr.slice_alpha_c0_offset;
408 let lf_beta = slice_hdr.slice_beta_offset;
409 loop_filter_mb(&mut frm, &self.sstate, lf_alpha, lf_beta);
410 }
411 self.sstate.next_mb();
412 Ok(())
413 }
414
5f223cdb 415 fn pred_mv(sstate: &mut SliceState, frame_refs: &SimplifiedSliceRefs, mb_info: &mut CurrentMBInfo, cur_id: u16, temporal_mv: bool, direct_8x8: bool) {
11d7aef2
KS
416 let mb_type = mb_info.mb_type;
417 if !mb_type.is_4x4() {
418 let (pw, ph) = mb_type.size();
419 let mut xoff = 0;
420 let mut yoff = 0;
421 if mb_type == MBType::Direct || mb_type == MBType::BSkip {
422 sstate.predict_direct_mb(frame_refs, temporal_mv, direct_8x8, cur_id);
423 }
424 for part in 0..mb_type.num_parts() {
425 if !mb_type.is_l1(part) {
426 match mb_type {
427 MBType::PSkip => sstate.predict_pskip(),
428 MBType::BSkip | MBType::Direct => {
429 },
430 _ => {
431 sstate.predict(xoff, yoff, pw, ph, 0,
432 mb_info.mv_l0[part], mb_info.ref_l0[part]);
433 },
434 };
435 }
436 if !mb_type.is_l0(part) && mb_type != MBType::BSkip && mb_type != MBType::Direct {
437 sstate.predict(xoff, yoff, pw, ph, 1, mb_info.mv_l1[part], mb_info.ref_l1[part]);
438 }
439 if pw != 16 {
440 xoff += pw;
441 } else {
442 yoff += ph;
443 }
444 }
445 } else {
446 for part in 0..4 {
447 let sub_type = mb_info.sub_mb_type[part];
448 let mut xoff = (part & 1) * 8;
449 let mut yoff = (part & 2) * 4;
450 let orig_x = xoff;
451 let (pw, ph) = sub_type.size();
452 for subpart in 0..sub_type.num_parts() {
453 if sub_type != SubMBType::Direct8x8 {
454 if !sub_type.is_l1() {
455 sstate.predict(xoff, yoff, pw, ph, 0, mb_info.mv_l0[part * 4 + subpart], mb_info.ref_l0[part]);
456 }
457 if !sub_type.is_l0() {
458 sstate.predict(xoff, yoff, pw, ph, 1, mb_info.mv_l1[part * 4 + subpart], mb_info.ref_l1[part]);
459 }
460 } else {
461 for sblk in 0..4 {
462 sstate.predict_direct_sub(frame_refs, temporal_mv, direct_8x8, cur_id, (xoff / 4) + (sblk & 1) + (yoff / 4) * 4 + (sblk & 2) * 2);
463 }
464 }
465 xoff += pw;
466 if xoff == orig_x + 8 {
467 xoff -= 8;
468 yoff += ph;
469 }
470 }
471 }
472 }
473 }
474}
475
476struct H264MTDecoder {
477 info: NACodecInfoRef,
478 nal_len: u8,
479 dispatch: Shareable<ThreadDispatcher>,
480 frame_refs: FrameRefs,
481 skip_mode: FrameSkipMode,
482 sps: Vec<Arc<SeqParameterSet>>,
483 cur_sps: usize,
484 pps: Vec<Arc<PicParameterSet>>,
485 cur_pps: usize,
486 cur_fdec: Option<FrameDecoder>,
487 cavlc_cb: Arc<CAVLCTables>,
488 deblock_skip: bool,
489 max_last_poc: u32,
490 poc_base: u32,
cc818ce8 491 avg_pool: NAVideoBufferPool<u8>,
11d7aef2
KS
492}
493
494impl H264MTDecoder {
495 fn new() -> Self {
496 Self {
497 info: NACodecInfoRef::default(),
498 nal_len: 0,
499 dispatch: Arc::new(RwLock::new(ThreadDispatcher::new())),
500 frame_refs: FrameRefs::new(),
501 skip_mode: FrameSkipMode::default(),
502 sps: Vec::new(),
503 cur_sps: 0,
504 pps: Vec::new(),
505 cur_pps: 0,
506 cur_fdec: None,
507 cavlc_cb: Arc::new(CAVLCTables::new()),
508 deblock_skip: false,
509 max_last_poc: 0,
510 poc_base: 0,
cc818ce8 511 avg_pool: NAVideoBufferPool::new(8),
11d7aef2
KS
512 }
513 }
514 fn handle_nal(&mut self, src: Vec<u8>, supp: &mut NADecoderSupport, skip_decoding: bool, user_id: u32, time: NATimeInfo) -> DecoderResult<()> {
515 validate!(!src.is_empty());
516 validate!((src[0] & 0x80) == 0);
517 let nal_ref_idc = src[0] >> 5;
518 let nal_unit_type = src[0] & 0x1F;
519
520 let mut full_size = src.len() * 8;
521 for &byte in src.iter().rev() {
522 if byte == 0 {
523 full_size -= 8;
524 } else {
525 full_size -= (byte.trailing_zeros() + 1) as usize;
526 break;
527 }
528 }
529 validate!(full_size > 0);
530 match nal_unit_type {
531 1 | 5 if !skip_decoding => {
532 let is_idr = nal_unit_type == 5;
533 let mut br = BitReader::new(&src[..(full_size + 7)/8], BitReaderMode::BE);
534 br.skip(8)?;
535
536 let slice_hdr = parse_slice_header(&mut br, self.sps.as_slice(), self.pps.as_slice(), is_idr, nal_ref_idc)?;
537 let hdr_size = br.tell();
538 validate!(br.tell() < full_size);
539 let full_id;
540 if slice_hdr.first_mb_in_slice == 0 {
541 validate!(self.cur_fdec.is_none());
542 for (i, pps) in self.pps.iter().enumerate() {
543 if pps.pic_parameter_set_id == slice_hdr.pic_parameter_set_id {
544 self.cur_pps = i;
545 break;
546 }
547 }
548 for (i, sps) in self.sps.iter().enumerate() {
549 if sps.seq_parameter_set_id == self.pps[self.cur_pps].seq_parameter_set_id {
550 self.cur_sps = i;
551 break;
552 }
553 }
554
555 let mut cur_full_id = self.frame_refs.calc_picture_num(&slice_hdr, is_idr, nal_ref_idc, &self.sps[self.cur_sps]) + self.poc_base;
556 if is_idr {
557 if cur_full_id <= self.max_last_poc {
558 self.poc_base = self.max_last_poc + 2 - (cur_full_id - self.poc_base);
559 cur_full_id = self.max_last_poc + 2;
560 }
561 }
562 self.max_last_poc = self.max_last_poc.max(cur_full_id);
563 full_id = cur_full_id;
564
565 let sps = &self.sps[self.cur_sps];
566 if sps.chroma_format_idc != 1 || sps.bit_depth_luma != 8 || sps.bit_depth_chroma != 8 {
567 println!(" chroma fmt {} bits {}/{}", sps.chroma_format_idc, sps.bit_depth_luma, sps.bit_depth_chroma);
568 return Err(DecoderError::NotImplemented);
569 }
570
571 if is_idr {
572 self.frame_refs.clear_refs();
573 }
574
575 let width = sps.pic_width_in_mbs << 4;
576 let height = sps.pic_height_in_mbs << 4;
577 let num_mbs = sps.pic_width_in_mbs * sps.pic_height_in_mbs;
578
cc818ce8
KS
579 let avg_buf = if let Some(buf) = self.avg_pool.get_free() {
580 buf
581 } else {
582 let new_avg_buf = alloc_video_buffer(AVG_BUF_VINFO, 4).unwrap().get_vbuf().unwrap();
583 self.avg_pool.add_frame(new_avg_buf.clone());
584 new_avg_buf
585 };
11d7aef2
KS
586 let mut mc_dsp = H264MC::new(avg_buf);
587 mc_dsp.set_dimensions(width, height);
588
589 let is_mbaff = sps.mb_adaptive_frame_field && !slice_hdr.field_pic;
590 if is_mbaff {
591 println!("MBAFF");
592 return Err(DecoderError::NotImplemented);
593 }
594 if !sps.frame_mbs_only {
595 println!("PAFF?");
596 return Err(DecoderError::NotImplemented);
597 }
598
599 let cur_vinfo = supp.pool_u8.get_info();
600 let tmp_vinfo = NAVideoInfo::new(width, height, false, YUV420_FORMAT);
601 if cur_vinfo != Some(tmp_vinfo) {
602 supp.pool_u8.reset();
603 supp.pool_u8.prealloc_video(tmp_vinfo, 4)?;
604 }
605
606 let buf = if let Some(pic) = supp.pool_u8.get_free() {
607 pic
608 } else {
609 if supp.pool_u8.get_num_used() > 256 {
610 return Err(DecoderError::AllocError);
611 }
612 if let Ok(nbuf) = alloc_video_buffer(tmp_vinfo, 4) {
613 let vbuf = nbuf.get_vbuf().unwrap();
614 supp.pool_u8.add_frame(vbuf.clone());
615 vbuf
616 } else {
617 return Err(DecoderError::AllocError);
618 }
619 };
620
621 let cur_pic = PictureInfo {
622 id: slice_hdr.frame_num,
623 full_id, user_id, time,
624 pic_type: slice_hdr.slice_type.to_frame_type(),
625 buf,
626 cur_mb: 0,
627 is_ref: nal_ref_idc != 0,
628 is_idr,
629 long_term: get_long_term_id(is_idr, &slice_hdr),
630 mv_info: NABufferRef::new(FrameMV::new(sps.pic_width_in_mbs, sps.pic_height_in_mbs)),
631 };
632
633 self.cur_fdec = Some(FrameDecoder{
634 slices: Vec::new(),
635 sstate: SliceState::new(),
636 ipcm_buf: [0; 256 + 64 + 64],
637 //width, height,
638 num_mbs,
639 sps: Arc::clone(sps),
640 pps: Arc::clone(&self.pps[self.cur_pps]),
641 dispatch: Arc::clone(&self.dispatch),
642 cavlc_cb: Arc::clone(&self.cavlc_cb),
643 mc_dsp,
644 cur_pic,
645 is_mbaff,
646 deblock_skip: self.deblock_skip,
647 });
648 } else {
649 if let Some(ref mut fdec) = self.cur_fdec {
650 let new_type = slice_hdr.slice_type.to_frame_type();
651 let pic = &mut fdec.cur_pic;
652 pic.pic_type = match (pic.pic_type, new_type) {
653 (FrameType::I, _) => new_type,
654 (_, FrameType::B) => FrameType::B,
655 _ => pic.pic_type,
656 };
657 full_id = pic.full_id;
658 } else {
659 return Ok(());
660 }
661 }
662
663 let sps = &self.sps[self.cur_sps];
664
665 self.frame_refs.select_refs(sps, &slice_hdr, full_id);
666
667 if slice_hdr.adaptive_ref_pic_marking_mode {
668 self.frame_refs.apply_adaptive_marking(&slice_hdr.adaptive_ref_pic_marking, slice_hdr.frame_num, 1 << self.sps[self.cur_sps].log2_max_frame_num)?;
669 }
670 if let Some(ref mut fdec) = self.cur_fdec {
671 fdec.slices.push((slice_hdr, hdr_size, self.frame_refs.cur_refs.clone(), src));
672 }
673 },
674 2 => { // slice data partition A
675 //slice header
676 //slice id = read_ue()
677 //cat 2 slice data (all but MB layer residual)
678 return Err(DecoderError::NotImplemented);
679 },
680 3 => { // slice data partition B
681 //slice id = read_ue()
682 //if pps.redundant_pic_cnt_present { redundant_pic_cnt = read_ue() }
683 //cat 3 slice data (MB layer residual)
684 return Err(DecoderError::NotImplemented);
685 },
686 4 => { // slice data partition C
687 //slice id = read_ue()
688 //if pps.redundant_pic_cnt_present { redundant_pic_cnt = read_ue() }
689 //cat 4 slice data (MB layer residual)
690 return Err(DecoderError::NotImplemented);
691 },
692 6 => {}, //SEI
693 7 => {
694 let sps = parse_sps(&src[1..])?;
695 self.sps.push(Arc::new(sps));
696 },
697 8 => {
698 validate!(full_size >= 8 + 16);
699 let pps = parse_pps(&src[1..], self.sps.as_slice(), full_size - 8)?;
700 let mut found = false;
701 for stored_pps in self.pps.iter_mut() {
702 if stored_pps.pic_parameter_set_id == pps.pic_parameter_set_id {
703 *stored_pps = Arc::clone(&pps);
704 found = true;
705 break;
706 }
707 }
708 if !found {
709 self.pps.push(pps);
710 }
711 },
712 9 => { // access unit delimiter
713 },
714 10 => {}, //end of sequence
715 11 => {}, //end of stream
716 12 => {}, //filler
717 _ => {},
718 };
719
720 Ok(())
721 }
722}
723
724impl NADecoderMT for H264MTDecoder {
725 fn init(&mut self, supp: &mut NADecoderSupport, info: NACodecInfoRef, nthreads: usize) -> DecoderResult<()> {
726 if let NACodecTypeInfo::Video(vinfo) = info.get_properties() {
727 let fmt = YUV420_FORMAT;
728 let myinfo = NACodecTypeInfo::Video(NAVideoInfo::new(0, 0, false, fmt));
729 self.info = NACodecInfo::new_ref(info.get_name(), myinfo, info.get_extradata()).into_ref();
730
731 let edata = info.get_extradata().unwrap();
732//print!("edata:"); for &el in edata.iter() { print!(" {:02X}", el); } println!();
733 if edata.len() > 11 && &edata[0..4] == b"avcC" {
734 let mut mr = MemoryReader::new_read(edata.as_slice());
735 let mut br = ByteReader::new(&mut mr);
736
737 br.read_skip(4)?;
738 let version = br.read_byte()?;
739 validate!(version == 1);
740 let profile = br.read_byte()?;
741 let _compatibility = br.read_byte()?;
742 let _level = br.read_byte()?;
743 let b = br.read_byte()?;
744 validate!((b & 0xFC) == 0xFC);
745 self.nal_len = (b & 3) + 1;
746 let b = br.read_byte()?;
747 validate!((b & 0xE0) == 0xE0);
748 let num_sps = (b & 0x1F) as usize;
749 for _ in 0..num_sps {
750 let len = br.read_u16be()? as usize;
751 let offset = br.tell() as usize;
752 validate!((br.peek_byte()? & 0x1F) == 7);
753 let mut nal_buf = Vec::new();
754 let _size = unescape_nal(&edata[offset..][..len], &mut nal_buf);
755 self.handle_nal(nal_buf, supp, true, 0, NATimeInfo::new(None, None, None, 0, 0))?;
756 br.read_skip(len)?;
757 }
758 let num_pps = br.read_byte()? as usize;
759 for _ in 0..num_pps {
760 let len = br.read_u16be()? as usize;
761 let offset = br.tell() as usize;
762 validate!((br.peek_byte()? & 0x1F) == 8);
763 let mut nal_buf = Vec::new();
764 let _size = unescape_nal(&edata[offset..][..len], &mut nal_buf);
765 self.handle_nal(nal_buf, supp, true, 0, NATimeInfo::new(None, None, None, 0, 0))?;
766 br.read_skip(len)?;
767 }
768 if br.left() > 0 {
769 match profile {
770 100 | 110 | 122 | 144 => {
771 let b = br.read_byte()?;
e12dabcd
KS
772 // some encoders put something different here
773 if (b & 0xFC) != 0xFC {
774 return Ok(());
775 }
11d7aef2
KS
776 // b & 3 -> chroma format
777 let b = br.read_byte()?;
778 validate!((b & 0xF8) == 0xF8);
779 // b & 7 -> luma depth minus 8
780 let b = br.read_byte()?;
781 validate!((b & 0xF8) == 0xF8);
782 // b & 7 -> chroma depth minus 8
783 let num_spsext = br.read_byte()? as usize;
784 for _ in 0..num_spsext {
785 let len = br.read_u16be()? as usize;
786 // parse spsext
787 br.read_skip(len)?;
788 }
789 },
790 _ => {},
791 };
792 }
793 } else {
794 return Err(DecoderError::NotImplemented);
795 }
796
797 let mut width = vinfo.get_width();
798 let mut height = vinfo.get_height();
799
800 if (width == 0 || height == 0) && !self.sps.is_empty() {
801 width = self.sps[0].pic_width_in_mbs * 16;
802 height = self.sps[0].pic_height_in_mbs * 16;
803 }
804
805 let num_bufs = if !self.sps.is_empty() {
e6aaad5c 806 self.sps[0].num_ref_frames + 1
11d7aef2
KS
807 } else {
808 3
809 }.max(16 + 1);
810 if let Ok(ref mut sd) = self.dispatch.write() {
811 sd.max_threads = nthreads;
812 } else {
813 return Err(DecoderError::Bug);
814 }
815 supp.pool_u8.set_dec_bufs(num_bufs + nthreads);
816 supp.pool_u8.prealloc_video(NAVideoInfo::new(width, height, false, fmt), 4)?;
817
cc818ce8
KS
818 self.avg_pool.prealloc_video(AVG_BUF_VINFO, 4)?;
819
11d7aef2
KS
820 Ok(())
821 } else {
822 Err(DecoderError::InvalidData)
823 }
824 }
825 fn can_take_input(&mut self) -> bool {
826 if let Ok(ref sd) = self.dispatch.read() {
827 sd.can_decode_more()
828 } else {
829 false
830 }
831 }
832 fn queue_pkt(&mut self, supp: &mut NADecoderSupport, pkt: &NAPacket, user_id: u32) -> DecoderResult<bool> {
833 if !self.can_take_input() {
834 return Ok(false);
835 }
836
837 let src = pkt.get_buffer();
838
839 let mut mr = MemoryReader::new_read(&src);
840 let mut br = ByteReader::new(&mut mr);
841 let mut nal_buf = Vec::with_capacity(src.len());
842
843 if self.nal_len > 0 {
844 let mut skip_decoding = false;
845 if self.skip_mode != FrameSkipMode::None {
846 let mut pic_type = FrameType::I;
847 let mut is_ref = false;
848 while br.left() > 0 {
849 let size = match self.nal_len {
850 1 => br.read_byte()? as usize,
851 2 => br.read_u16be()? as usize,
852 3 => br.read_u24be()? as usize,
853 4 => br.read_u32be()? as usize,
854 _ => unreachable!(),
855 };
856 validate!(br.left() >= (size as i64));
857 let offset = br.tell() as usize;
858 let size = unescape_nal(&src[offset..][..size], &mut nal_buf);
859 validate!(size > 0);
860 let nal_ref_idc = nal_buf[0] >> 5;
861 let nal_unit_type = nal_buf[0] & 0x1F;
862 if nal_unit_type == 1 || nal_unit_type == 5 {
863 let mut bitr = BitReader::new(&nal_buf[1..], BitReaderMode::BE);
864 let (first_mb, slice_type) = parse_slice_header_minimal(&mut bitr)?;
865 if first_mb == 0 && nal_ref_idc != 0 {
866 is_ref = true;
867 }
868 let new_type = slice_type.to_frame_type();
869 pic_type = match (pic_type, new_type) {
870 (FrameType::I, _) => new_type,
871 (_, FrameType::B) => FrameType::B,
872 _ => pic_type,
873 };
874 }
875 br.read_skip(size)?;
876 }
877 match self.skip_mode {
878 FrameSkipMode::IntraOnly => {
879 skip_decoding = pic_type != FrameType::I;
880 },
881 FrameSkipMode::KeyframesOnly => {
882 if !is_ref {
883 skip_decoding = true;
884 }
885 },
886 _ => {},
887 };
888 br.seek(SeekFrom::Start(0))?;
889 }
890
891 let mut initial_ref_frames = Vec::new();
892 self.frame_refs.fill_ref_nums(&mut initial_ref_frames);
893
894 while br.left() > 0 {
895 let size = match self.nal_len {
896 1 => br.read_byte()? as usize,
897 2 => br.read_u16be()? as usize,
898 3 => br.read_u24be()? as usize,
899 4 => br.read_u32be()? as usize,
900 _ => unreachable!(),
901 };
902 validate!(br.left() >= (size as i64));
903 let offset = br.tell() as usize;
904 let mut cur_nal_buf = Vec::with_capacity(size);
905 let _size = unescape_nal(&src[offset..][..size], &mut cur_nal_buf);
906 self.handle_nal(cur_nal_buf, supp, skip_decoding, user_id, pkt.ts)?;
907 br.read_skip(size)?;
908 }
909 let mut fdec = None;
910 std::mem::swap(&mut fdec, &mut self.cur_fdec);
911 if let Some(fdc) = fdec {
912 let cpic = &fdc.cur_pic;
913 if cpic.is_ref {
914 self.frame_refs.add_short_term(cpic.clone(), self.sps[self.cur_sps].num_ref_frames);
915 }
916 if let Some(lt_idx) = cpic.long_term {
917 self.frame_refs.add_long_term(lt_idx, cpic.clone());
918 }
919 let mut ref_frames = Vec::new();
920 self.frame_refs.fill_ref_nums(&mut ref_frames);
921 queue_decoding(&mut self.dispatch, fdc, &initial_ref_frames, &ref_frames);
922 }
923 } else {
924//todo NAL detection
925 unimplemented!();
926 }
927 Ok(true)
928 }
929 fn has_output(&mut self) -> bool {
930 if let Ok(ref ds) = self.dispatch.read() {
931 ds.has_output()
932 } else {
933 panic!("can't peek into status");
934 }
935 }
936 fn get_frame(&mut self) -> (DecoderResult<NAFrameRef>, u32) {
937 match wait_for_one(&mut self.dispatch) {
938 Ok(cpic) => {
939 let bufinfo = NABufferType::Video(cpic.buf.clone());
940 let ftype = cpic.pic_type;
941 let dts = Some(u64::from(cpic.full_id));
942 let mut frm = NAFrame::new(cpic.time, ftype, cpic.is_idr, self.info.clone(), bufinfo);
943 if let (Some(mydts), None) = (dts, frm.get_dts()) {
944 frm.set_dts(Some(mydts));
945 }
946 frm.set_id(cpic.user_id as i64);
947 (Ok(frm.into_ref()), cpic.user_id)
948 },
949 Err((err, id)) => (Err(err), id),
950 }
951 }
952 fn flush(&mut self) {
953 clear_threads(&mut self.dispatch);
f2cb96ff 954 self.frame_refs.clear_refs();
11d7aef2
KS
955 }
956}
957
958impl NAOptionHandler for H264MTDecoder {
959 fn get_supported_options(&self) -> &[NAOptionDefinition] { DECODER_OPTIONS }
960 fn set_options(&mut self, options: &[NAOption]) {
961 for option in options.iter() {
962 for opt_def in DECODER_OPTIONS.iter() {
963 if opt_def.check(option).is_ok() {
964 match (option.name, &option.value) {
965 (FRAME_SKIP_OPTION, NAValue::String(ref strval)) => {
966 if let Ok(smode) = FrameSkipMode::from_str(strval) {
967 self.skip_mode = smode;
968 }
969 },
970 (DEBLOCK_SKIP_OPTION, NAValue::Bool(val)) => {
971 self.deblock_skip = *val;
972 },
973 _ => {},
974 }
975 }
976 }
977 }
978 }
979 fn query_option_value(&self, name: &str) -> Option<NAValue> {
980 match name {
981 FRAME_SKIP_OPTION => Some(NAValue::String(self.skip_mode.to_string())),
982 DEBLOCK_SKIP_OPTION => Some(NAValue::Bool(self.deblock_skip)),
983 _ => None,
984 }
985 }
986}
987
988pub fn get_decoder_mt() -> Box<dyn NADecoderMT + Send> {
989 Box::new(H264MTDecoder::new())
990}