h264: introduce frame pool for average block buffers in MT decoder
[nihav.git] / nihav-itu / src / codecs / h264 / decoder_mt.rs
CommitLineData
11d7aef2
KS
1use nihav_core::codecs::*;
2use nihav_core::io::bitreader::*;
3
4use super::*;
5use super::dispatch::*;
6
cc818ce8
KS
7const AVG_BUF_VINFO: NAVideoInfo = NAVideoInfo { width: 32, height: 32, flipped: false, format: YUV420_FORMAT, bits: 12 };
8
11d7aef2
KS
9pub struct FrameDecoder {
10 pub slices: Vec<(SliceHeader, usize, SliceRefs, Vec<u8>)>,
11 pub cur_pic: PictureInfo,
12 sps: Arc<SeqParameterSet>,
13 pps: Arc<PicParameterSet>,
14 pub num_mbs: usize,
15 mc_dsp: H264MC,
16 dispatch: Shareable<ThreadDispatcher>,
17 sstate: SliceState,
18 cavlc_cb: Arc<CAVLCTables>,
19 ipcm_buf: [u8; 256 + 64 + 64],
20 is_mbaff: bool,
21 deblock_skip: bool,
22}
23
24impl FrameDecoder {
25 pub fn decode_slice(&mut self, hdr: &SliceHeader, hdr_size: usize, refs: &SliceRefs, nal: &[u8]) -> DecoderResult<usize> {
26 self.sstate.reset(self.sps.pic_width_in_mbs, self.sps.pic_height_in_mbs, hdr.first_mb_in_slice);
27
28 let mut full_size = nal.len() * 8;
29 for &byte in nal.iter().rev() {
30 if byte == 0 {
31 full_size -= 8;
32 } else {
33 full_size -= (byte.trailing_zeros() + 1) as usize;
34 break;
35 }
36 }
37 validate!(full_size > 0);
38
39 let mut br = BitReader::new(&nal[hdr_size / 8..], BitReaderMode::BE);
40 if !self.pps.entropy_coding_mode {
41 br.skip((hdr_size & 7) as u32)?;
42 self.decode_slice_cavlc(&mut br, full_size - (hdr_size & !7), hdr, refs)
43 } else {
44 let csrc = &nal[(hdr_size + 7) / 8..];
45 validate!(csrc.len() >= 2);
46 let mut cabac = CABAC::new(csrc, hdr.slice_type, hdr.slice_qp, hdr.cabac_init_idc as usize)?;
47 self.decode_slice_cabac(&mut cabac, hdr, refs)
48 }
49 }
50 fn decode_slice_cavlc(&mut self, br: &mut BitReader, full_size: usize, slice_hdr: &SliceHeader, refs: &SliceRefs) -> DecoderResult<usize> {
51 const INTRA_CBP: [u8; 48] = [
52 47, 31, 15, 0, 23, 27, 29, 30, 7, 11, 13, 14, 39, 43, 45, 46,
53 16, 3, 5, 10, 12, 19, 21, 26, 28, 35, 37, 42, 44, 1, 2, 4,
54 8, 17, 18, 20, 24, 6, 9, 22, 25, 32, 33, 34, 36, 40, 38, 41
55 ];
56 const INTER_CBP: [u8; 48] = [
57 0, 16, 1, 2, 4, 8, 32, 3, 5, 10, 12, 15, 47, 7, 11, 13,
58 14, 6, 9, 31, 35, 37, 42, 44, 33, 34, 36, 40, 39, 43, 45, 46,
59 17, 18, 20, 24, 19, 21, 26, 28, 23, 27, 29, 30, 22, 25, 38, 41
60 ];
61
e6aaad5c 62 let mut mb_idx = slice_hdr.first_mb_in_slice;
11d7aef2
KS
63 let mut mb_info = CurrentMBInfo { qp_y: slice_hdr.slice_qp, ..Default::default() };
64 let skip_type = if slice_hdr.slice_type.is_p() { MBType::PSkip } else { MBType::BSkip };
65 while br.tell() < full_size && mb_idx < self.num_mbs {
66 mb_info.coded = [false; 25];
67 mb_info.ref_l0 = [ZERO_REF; 4];
68 mb_info.ref_l1 = [ZERO_REF; 4];
69 mb_info.mv_l0 = [ZERO_MV; 16];
70 mb_info.mv_l1 = [ZERO_MV; 16];
71 mb_info.chroma_dc = [[0; 4]; 2];
72 mb_info.cbpy = 0;
73 mb_info.cbpc = 0;
74
75 if !slice_hdr.slice_type.is_intra() {
76 let mb_skip_run = br.read_ue()? as usize;
77 validate!(mb_idx + mb_skip_run <= self.num_mbs);
78 mb_info.mb_type = skip_type;
79 for _ in 0..mb_skip_run {
80 self.handle_macroblock(slice_hdr, &mut mb_info, refs)?;
81 mb_idx += 1;
82 }
83 if mb_idx == self.num_mbs || br.tell() >= full_size {
84 break;
85 }
86 }
87 if br.tell() < full_size {
88 if self.is_mbaff && ((mb_idx & 1) == 0) {
89 let _mb_field_decoding = br.read_bool()?;
90 }
91 let mut mb_type = decode_mb_type_cavlc(br, slice_hdr)?;
92 mb_info.mb_type = mb_type;
93 mb_info.transform_size_8x8 = false;
94 if mb_type == MBType::PCM {
95 br.align();
96 for pix in self.ipcm_buf[..256 + 64 + 64].iter_mut() {
97 *pix = br.read(8)? as u8;
98 }
99 self.sstate.fill_ncoded(16);
100 } else {
101 if self.pps.transform_8x8_mode && mb_type == MBType::Intra4x4 {
102 mb_info.transform_size_8x8 = br.read_bool()?;
103 if mb_info.transform_size_8x8 {
104 mb_type = MBType::Intra8x8;
105 mb_info.mb_type = MBType::Intra8x8;
106 }
107 }
108 decode_mb_pred_cavlc(br, slice_hdr, mb_type, &mut self.sstate, &mut mb_info)?;
109 let (cbpy, cbpc) = if let MBType::Intra16x16(_, cbpy, cbpc) = mb_type {
110 (cbpy, cbpc)
111 } else {
112 let cbp_id = br.read_ue()? as usize;
113 validate!(cbp_id < INTRA_CBP.len());
114 let cbp = if mb_type == MBType::Intra4x4 || mb_type == MBType::Intra8x8 {
115 INTRA_CBP[cbp_id]
116 } else {
117 INTER_CBP[cbp_id]
118 };
119 if self.pps.transform_8x8_mode && (cbp & 0xF) != 0 && mb_info.can_have_8x8_tx(self.sps.direct_8x8_inference) {
120 mb_info.transform_size_8x8 = br.read_bool()?;
121 }
122 ((cbp & 0xF), (cbp >> 4))
123 };
124 mb_info.cbpy = cbpy;
125 mb_info.cbpc = cbpc;
126 self.sstate.get_cur_mb().cbp = (cbpc << 4) | cbpy;
127 if cbpy != 0 || cbpc != 0 || mb_type.is_intra16x16() {
128 let mb_qp_delta = br.read_se()?;
129 validate!(mb_qp_delta >= -26 && mb_qp_delta <= 25);
130 let new_qp = mb_qp_delta + i32::from(mb_info.qp_y);
131 mb_info.qp_y = if new_qp < 0 {
132 (new_qp + 52) as u8
133 } else if new_qp >= 52 {
134 (new_qp - 52) as u8
135 } else {
136 new_qp as u8
137 };
138 mb_info.coeffs = [[0; 16]; 25];
139 if self.pps.transform_8x8_mode {
140 mb_info.clear_coeffs8x8();
141 }
142 mb_info.chroma_dc = [[0; 4]; 2];
143 decode_residual_cavlc(br, &mut self.sstate, &mut mb_info, &self.cavlc_cb)?;
144 }
145 }
146 self.handle_macroblock(slice_hdr, &mut mb_info, refs)?;
147 }
148 mb_idx += 1;
149 if let Ok(disp) = self.dispatch.read() {
150 disp.update_pos(self.cur_pic.full_id, mb_idx);
151 }
152 }
153 Ok(mb_idx)
154 }
155 fn decode_slice_cabac(&mut self, cabac: &mut CABAC, slice_hdr: &SliceHeader, refs: &SliceRefs) -> DecoderResult<usize> {
e6aaad5c 156 let mut mb_idx = slice_hdr.first_mb_in_slice;
11d7aef2
KS
157 let mut prev_mb_skipped = false;
158 let skip_type = if slice_hdr.slice_type.is_p() { MBType::PSkip } else { MBType::BSkip };
159 let mut last_qp_diff = false;
160
161 let mut mb_info = CurrentMBInfo { qp_y: slice_hdr.slice_qp, ..Default::default() };
162
163 while mb_idx < self.num_mbs {
164 mb_info.coded = [false; 25];
165 mb_info.ref_l0 = [ZERO_REF; 4];
166 mb_info.ref_l1 = [ZERO_REF; 4];
167 mb_info.mv_l0 = [ZERO_MV; 16];
168 mb_info.mv_l1 = [ZERO_MV; 16];
169 mb_info.chroma_dc = [[0; 4]; 2];
170 mb_info.cbpy = 0;
171 mb_info.cbpc = 0;
172 let mb_skip = cabac_decode_mbskip(cabac, &self.sstate, slice_hdr);
173 if !mb_skip {
174 if self.is_mbaff && (((mb_idx & 1) == 0) || (prev_mb_skipped && ((mb_idx & 1) == 1))) {
175 let _mb_field_decoding = cabac.decode_bit(70);
176 }
177 let mut mb_type = cabac_decode_mb_type(cabac, slice_hdr, &self.sstate);
178 mb_info.mb_type = mb_type;
179 mb_info.transform_size_8x8 = false;
180 if mb_type == MBType::PCM {
181 let ipcm_size = 256 + 64 + 64;
182 validate!(cabac.pos + ipcm_size <= cabac.src.len());
183 self.ipcm_buf[..ipcm_size].copy_from_slice(&cabac.src[cabac.pos..][..ipcm_size]);
184 cabac.pos += ipcm_size;
185 cabac.reinit()?;
186 last_qp_diff = false;
187 } else {
188 if self.pps.transform_8x8_mode && mb_type == MBType::Intra4x4 {
189 let mut ctx = 0;
190 if self.sstate.get_top_mb().transform_8x8 {
191 ctx += 1;
192 }
193 if self.sstate.get_left_mb().transform_8x8 {
194 ctx += 1;
195 }
196 mb_info.transform_size_8x8 = cabac.decode_bit(399 + ctx);
197 if mb_info.transform_size_8x8 {
198 mb_type = MBType::Intra8x8;
199 mb_info.mb_type = MBType::Intra8x8;
200 }
201 }
202 decode_mb_pred_cabac(cabac, slice_hdr, mb_type, &mut self.sstate, &mut mb_info);
203 let (cbpy, cbpc) = if let MBType::Intra16x16(_, cbpy, cbpc) = mb_type {
204 (cbpy, cbpc)
205 } else {
206 decode_cbp_cabac(cabac, &self.sstate)
207 };
208 if self.pps.transform_8x8_mode && cbpy != 0 && mb_info.can_have_8x8_tx(self.sps.direct_8x8_inference) {
209 let mut ctx = 0;
210 if self.sstate.get_top_mb().transform_8x8 {
211 ctx += 1;
212 }
213 if self.sstate.get_left_mb().transform_8x8 {
214 ctx += 1;
215 }
216 mb_info.transform_size_8x8 = cabac.decode_bit(399 + ctx);
217 }
218 if mb_type.is_intra() {
219 self.sstate.get_cur_mb().cmode = mb_info.chroma_ipred;
220 }
221 mb_info.cbpy = cbpy;
222 mb_info.cbpc = cbpc;
223 self.sstate.get_cur_mb().cbp = (cbpc << 4) | cbpy;
224 if cbpy != 0 || cbpc != 0 || mb_type.is_intra16x16() {
225 let mb_qp_delta = decode_mb_qp_delta_cabac(cabac, last_qp_diff as usize);
226 validate!(mb_qp_delta >= -26 && mb_qp_delta <= 25);
227 last_qp_diff = mb_qp_delta != 0;
228 let new_qp = mb_qp_delta + i32::from(mb_info.qp_y);
229 mb_info.qp_y = if new_qp < 0 {
230 (new_qp + 52) as u8
231 } else if new_qp >= 52 {
232 (new_qp - 52) as u8
233 } else {
234 new_qp as u8
235 };
236 mb_info.coeffs = [[0; 16]; 25];
237 if self.pps.transform_8x8_mode {
238 mb_info.clear_coeffs8x8();
239 }
240 mb_info.chroma_dc = [[0; 4]; 2];
241 decode_residual_cabac(cabac, &mut self.sstate, &mut mb_info);
242 } else {
243 last_qp_diff = false;
244 }
245 }
246 } else {
247 mb_info.mb_type = skip_type;
248 mb_info.transform_size_8x8 = false;
249 last_qp_diff = false;
250 }
251 self.handle_macroblock(slice_hdr, &mut mb_info, refs)?;
252 prev_mb_skipped = mb_skip;
253 if !(self.is_mbaff && ((mb_idx & 1) == 0)) && cabac.decode_terminate() {
254 if let Ok(disp) = self.dispatch.read() {
255 disp.update_pos(self.cur_pic.full_id, mb_idx + 1);
256 }
257 return Ok(mb_idx + 1);
258 }
259 mb_idx += 1;
260 if let Ok(disp) = self.dispatch.read() {
261 disp.update_pos(self.cur_pic.full_id, mb_idx);
262 }
263 }
264 Err(DecoderError::InvalidData)
265 }
266 #[allow(clippy::cognitive_complexity)]
267 fn handle_macroblock(&mut self, slice_hdr: &SliceHeader, mb_info: &mut CurrentMBInfo, refs: &SliceRefs) -> DecoderResult<()> {
268 let qp_y = mb_info.qp_y;
269 let qpr = ((qp_y as i8) + self.pps.chroma_qp_index_offset).max(0).min(51) as usize;
270 let qp_u = CHROMA_QUANTS[qpr];
271 let qpb = ((qp_y as i8) + self.pps.second_chroma_qp_index_offset).max(0).min(51) as usize;
272 let qp_v = CHROMA_QUANTS[qpb];
273
274 let tx_bypass = qp_y == 0 && self.sps.qpprime_y_zero_transform_bypass;
275
276 self.sstate.get_cur_mb().mb_type = mb_info.mb_type.into();
277 if mb_info.mb_type != MBType::PCM {
278 self.sstate.get_cur_mb().qp_y = qp_y;
279 self.sstate.get_cur_mb().qp_u = qp_u;
280 self.sstate.get_cur_mb().qp_v = qp_v;
281 self.sstate.get_cur_mb().transform_8x8 = mb_info.transform_size_8x8;
282 }
283 let has_dc = mb_info.mb_type.is_intra16x16() && mb_info.coded[24];
284 if has_dc {
285 idct_luma_dc(&mut mb_info.coeffs[24], qp_y);
286 for i in 0..16 {
287 mb_info.coeffs[i][0] = mb_info.coeffs[24][i];
288 }
289 }
290 if !mb_info.transform_size_8x8 {
291 let quant_dc = !mb_info.mb_type.is_intra16x16();
292 for i in 0..16 {
293 if mb_info.coded[i] {
294 if !tx_bypass {
295 idct(&mut mb_info.coeffs[i], qp_y, quant_dc);
296 }
297 } else if has_dc {
298 if !tx_bypass {
299 idct_dc(&mut mb_info.coeffs[i], qp_y, quant_dc);
300 }
301 mb_info.coded[i] = true;
302 }
303 }
304 } else {
305 for i in 0..4 {
306 if mb_info.coded[(i & 1) * 2 + (i & 2) * 4] && !tx_bypass {
307 dequant8x8(&mut mb_info.coeffs8x8[i].coeffs, &self.pps.scaling_list_8x8[!mb_info.mb_type.is_intra() as usize]);
308 idct8x8(&mut mb_info.coeffs8x8[i].coeffs, qp_y);
309 }
310 }
311 }
312 for chroma in 0..2 {
313 let qp_c = if chroma == 0 { qp_u } else { qp_v };
314 if mb_info.cbpc != 0 {
315 chroma_dc_transform(&mut mb_info.chroma_dc[chroma], qp_c);
316 }
317 for i in 0..4 {
318 let blk_no = 16 + chroma * 4 + i;
319 mb_info.coeffs[blk_no][0] = mb_info.chroma_dc[chroma][i];
320 if mb_info.coded[blk_no] {
321 idct(&mut mb_info.coeffs[blk_no], qp_c, false);
322 } else if mb_info.coeffs[blk_no][0] != 0 {
323 idct_dc(&mut mb_info.coeffs[blk_no], qp_c, false);
324 mb_info.coded[blk_no] = true;
325 }
326 }
327 }
328 if !self.pps.entropy_coding_mode || mb_info.mb_type.is_skip() || mb_info.mb_type.is_intra() {
329 self.sstate.reset_mb_mv();
330 }
331 if !mb_info.mb_type.is_intra() {
332 let temporal_mv = !slice_hdr.direct_spatial_mv_pred;
333 let cur_id = self.cur_pic.full_id as u16;
334 // wait for the reference macroblock MV to be available
335 if matches!(mb_info.mb_type, MBType::Direct | MBType::BSkip | MBType::B8x8) {
336 if let Some(ref_id) = refs.get_ref_id(0, mb_info.ref_l1[0].index()) {
337 wait_for_mb(&self.dispatch, &self.sstate, self.sstate.mb_x * 16, self.sstate.mb_y * 16, ZERO_MV, ref_id)?;
338 }
339 }
340 Self::pred_mv(&mut self.sstate, refs, mb_info, cur_id, temporal_mv, self.sps.direct_8x8_inference);
341 }
342 if !self.pps.constrained_intra_pred && mb_info.mb_type != MBType::Intra4x4 && mb_info.mb_type != MBType::Intra8x8 {
343 self.sstate.fill_ipred(IntraPredMode::DC);
344 }
345
346 let xpos = self.sstate.mb_x * 16;
347 let ypos = self.sstate.mb_y * 16;
348 let mut frm = NASimpleVideoFrame::from_video_buf(&mut self.cur_pic.buf).unwrap();
349 if mb_info.mb_type != MBType::PCM {
350 let weight_mode = if self.pps.weighted_pred && slice_hdr.slice_type.is_p() {
351 1
352 } else if slice_hdr.slice_type.is_b() {
353 self.pps.weighted_bipred_idc
354 } else {
355 0
356 };
357 recon_mb_mt(&mut frm, slice_hdr, mb_info, &mut self.sstate, refs, &mut self.mc_dsp, weight_mode, &self.dispatch)?;
358 } else {
359 for (dline, src) in frm.data[frm.offset[0] + xpos + ypos * frm.stride[0]..].chunks_mut(frm.stride[0]).take(16).zip(self.ipcm_buf.chunks(16)) {
360 dline[..16].copy_from_slice(src);
361 }
362 for (dline, src) in frm.data[frm.offset[1] + xpos/2 + ypos/2 * frm.stride[1]..].chunks_mut(frm.stride[1]).take(8).zip(self.ipcm_buf[256..].chunks(8)) {
363 dline[..8].copy_from_slice(src);
364 }
365 for (dline, src) in frm.data[frm.offset[2] + xpos/2 + ypos/2 * frm.stride[2]..].chunks_mut(frm.stride[2]).take(8).zip(self.ipcm_buf[256 + 64..].chunks(8)) {
366 dline[..8].copy_from_slice(src);
367 }
368 }
369 self.sstate.save_ipred_context(&frm);
370
371 let mv_info = &mut self.cur_pic.mv_info;
372 let mb_pos = self.sstate.mb_x + self.sstate.mb_y * mv_info.mb_stride;
373 let mut mb = FrameMBInfo::new();
374 mb.mb_type = mb_info.mb_type.into();
375 for blk4 in 0..16 {
376 mb.mv[blk4] = self.sstate.get_cur_blk4(blk4).mv;
377 }
378 for blk8 in 0..4 {
379 mb.ref_poc[blk8] = refs.map_refs(self.sstate.get_cur_blk8(blk8).ref_idx);
380 mb.ref_idx[blk8] = self.sstate.get_cur_blk8(blk8).ref_idx;
381 }
382 mv_info.mbs[mb_pos] = mb;
383
384 let deblock_mode = slice_hdr.disable_deblocking_filter_idc;
385 if !self.deblock_skip && deblock_mode != 1 {
386 let is_s = slice_hdr.slice_type == SliceType::SI || slice_hdr.slice_type == SliceType::SP;
387 self.sstate.fill_deblock(refs, deblock_mode, is_s);
388 let mut frm = NASimpleVideoFrame::from_video_buf(&mut self.cur_pic.buf).unwrap();
389 let lf_alpha = slice_hdr.slice_alpha_c0_offset;
390 let lf_beta = slice_hdr.slice_beta_offset;
391 loop_filter_mb(&mut frm, &self.sstate, lf_alpha, lf_beta);
392 }
393 self.sstate.next_mb();
394 Ok(())
395 }
396
397 fn pred_mv(sstate: &mut SliceState, frame_refs: &SliceRefs, mb_info: &mut CurrentMBInfo, cur_id: u16, temporal_mv: bool, direct_8x8: bool) {
398 let mb_type = mb_info.mb_type;
399 if !mb_type.is_4x4() {
400 let (pw, ph) = mb_type.size();
401 let mut xoff = 0;
402 let mut yoff = 0;
403 if mb_type == MBType::Direct || mb_type == MBType::BSkip {
404 sstate.predict_direct_mb(frame_refs, temporal_mv, direct_8x8, cur_id);
405 }
406 for part in 0..mb_type.num_parts() {
407 if !mb_type.is_l1(part) {
408 match mb_type {
409 MBType::PSkip => sstate.predict_pskip(),
410 MBType::BSkip | MBType::Direct => {
411 },
412 _ => {
413 sstate.predict(xoff, yoff, pw, ph, 0,
414 mb_info.mv_l0[part], mb_info.ref_l0[part]);
415 },
416 };
417 }
418 if !mb_type.is_l0(part) && mb_type != MBType::BSkip && mb_type != MBType::Direct {
419 sstate.predict(xoff, yoff, pw, ph, 1, mb_info.mv_l1[part], mb_info.ref_l1[part]);
420 }
421 if pw != 16 {
422 xoff += pw;
423 } else {
424 yoff += ph;
425 }
426 }
427 } else {
428 for part in 0..4 {
429 let sub_type = mb_info.sub_mb_type[part];
430 let mut xoff = (part & 1) * 8;
431 let mut yoff = (part & 2) * 4;
432 let orig_x = xoff;
433 let (pw, ph) = sub_type.size();
434 for subpart in 0..sub_type.num_parts() {
435 if sub_type != SubMBType::Direct8x8 {
436 if !sub_type.is_l1() {
437 sstate.predict(xoff, yoff, pw, ph, 0, mb_info.mv_l0[part * 4 + subpart], mb_info.ref_l0[part]);
438 }
439 if !sub_type.is_l0() {
440 sstate.predict(xoff, yoff, pw, ph, 1, mb_info.mv_l1[part * 4 + subpart], mb_info.ref_l1[part]);
441 }
442 } else {
443 for sblk in 0..4 {
444 sstate.predict_direct_sub(frame_refs, temporal_mv, direct_8x8, cur_id, (xoff / 4) + (sblk & 1) + (yoff / 4) * 4 + (sblk & 2) * 2);
445 }
446 }
447 xoff += pw;
448 if xoff == orig_x + 8 {
449 xoff -= 8;
450 yoff += ph;
451 }
452 }
453 }
454 }
455 }
456}
457
458struct H264MTDecoder {
459 info: NACodecInfoRef,
460 nal_len: u8,
461 dispatch: Shareable<ThreadDispatcher>,
462 frame_refs: FrameRefs,
463 skip_mode: FrameSkipMode,
464 sps: Vec<Arc<SeqParameterSet>>,
465 cur_sps: usize,
466 pps: Vec<Arc<PicParameterSet>>,
467 cur_pps: usize,
468 cur_fdec: Option<FrameDecoder>,
469 cavlc_cb: Arc<CAVLCTables>,
470 deblock_skip: bool,
471 max_last_poc: u32,
472 poc_base: u32,
cc818ce8 473 avg_pool: NAVideoBufferPool<u8>,
11d7aef2
KS
474}
475
476impl H264MTDecoder {
477 fn new() -> Self {
478 Self {
479 info: NACodecInfoRef::default(),
480 nal_len: 0,
481 dispatch: Arc::new(RwLock::new(ThreadDispatcher::new())),
482 frame_refs: FrameRefs::new(),
483 skip_mode: FrameSkipMode::default(),
484 sps: Vec::new(),
485 cur_sps: 0,
486 pps: Vec::new(),
487 cur_pps: 0,
488 cur_fdec: None,
489 cavlc_cb: Arc::new(CAVLCTables::new()),
490 deblock_skip: false,
491 max_last_poc: 0,
492 poc_base: 0,
cc818ce8 493 avg_pool: NAVideoBufferPool::new(8),
11d7aef2
KS
494 }
495 }
496 fn handle_nal(&mut self, src: Vec<u8>, supp: &mut NADecoderSupport, skip_decoding: bool, user_id: u32, time: NATimeInfo) -> DecoderResult<()> {
497 validate!(!src.is_empty());
498 validate!((src[0] & 0x80) == 0);
499 let nal_ref_idc = src[0] >> 5;
500 let nal_unit_type = src[0] & 0x1F;
501
502 let mut full_size = src.len() * 8;
503 for &byte in src.iter().rev() {
504 if byte == 0 {
505 full_size -= 8;
506 } else {
507 full_size -= (byte.trailing_zeros() + 1) as usize;
508 break;
509 }
510 }
511 validate!(full_size > 0);
512 match nal_unit_type {
513 1 | 5 if !skip_decoding => {
514 let is_idr = nal_unit_type == 5;
515 let mut br = BitReader::new(&src[..(full_size + 7)/8], BitReaderMode::BE);
516 br.skip(8)?;
517
518 let slice_hdr = parse_slice_header(&mut br, self.sps.as_slice(), self.pps.as_slice(), is_idr, nal_ref_idc)?;
519 let hdr_size = br.tell();
520 validate!(br.tell() < full_size);
521 let full_id;
522 if slice_hdr.first_mb_in_slice == 0 {
523 validate!(self.cur_fdec.is_none());
524 for (i, pps) in self.pps.iter().enumerate() {
525 if pps.pic_parameter_set_id == slice_hdr.pic_parameter_set_id {
526 self.cur_pps = i;
527 break;
528 }
529 }
530 for (i, sps) in self.sps.iter().enumerate() {
531 if sps.seq_parameter_set_id == self.pps[self.cur_pps].seq_parameter_set_id {
532 self.cur_sps = i;
533 break;
534 }
535 }
536
537 let mut cur_full_id = self.frame_refs.calc_picture_num(&slice_hdr, is_idr, nal_ref_idc, &self.sps[self.cur_sps]) + self.poc_base;
538 if is_idr {
539 if cur_full_id <= self.max_last_poc {
540 self.poc_base = self.max_last_poc + 2 - (cur_full_id - self.poc_base);
541 cur_full_id = self.max_last_poc + 2;
542 }
543 }
544 self.max_last_poc = self.max_last_poc.max(cur_full_id);
545 full_id = cur_full_id;
546
547 let sps = &self.sps[self.cur_sps];
548 if sps.chroma_format_idc != 1 || sps.bit_depth_luma != 8 || sps.bit_depth_chroma != 8 {
549 println!(" chroma fmt {} bits {}/{}", sps.chroma_format_idc, sps.bit_depth_luma, sps.bit_depth_chroma);
550 return Err(DecoderError::NotImplemented);
551 }
552
553 if is_idr {
554 self.frame_refs.clear_refs();
555 }
556
557 let width = sps.pic_width_in_mbs << 4;
558 let height = sps.pic_height_in_mbs << 4;
559 let num_mbs = sps.pic_width_in_mbs * sps.pic_height_in_mbs;
560
cc818ce8
KS
561 let avg_buf = if let Some(buf) = self.avg_pool.get_free() {
562 buf
563 } else {
564 let new_avg_buf = alloc_video_buffer(AVG_BUF_VINFO, 4).unwrap().get_vbuf().unwrap();
565 self.avg_pool.add_frame(new_avg_buf.clone());
566 new_avg_buf
567 };
11d7aef2
KS
568 let mut mc_dsp = H264MC::new(avg_buf);
569 mc_dsp.set_dimensions(width, height);
570
571 let is_mbaff = sps.mb_adaptive_frame_field && !slice_hdr.field_pic;
572 if is_mbaff {
573 println!("MBAFF");
574 return Err(DecoderError::NotImplemented);
575 }
576 if !sps.frame_mbs_only {
577 println!("PAFF?");
578 return Err(DecoderError::NotImplemented);
579 }
580
581 let cur_vinfo = supp.pool_u8.get_info();
582 let tmp_vinfo = NAVideoInfo::new(width, height, false, YUV420_FORMAT);
583 if cur_vinfo != Some(tmp_vinfo) {
584 supp.pool_u8.reset();
585 supp.pool_u8.prealloc_video(tmp_vinfo, 4)?;
586 }
587
588 let buf = if let Some(pic) = supp.pool_u8.get_free() {
589 pic
590 } else {
591 if supp.pool_u8.get_num_used() > 256 {
592 return Err(DecoderError::AllocError);
593 }
594 if let Ok(nbuf) = alloc_video_buffer(tmp_vinfo, 4) {
595 let vbuf = nbuf.get_vbuf().unwrap();
596 supp.pool_u8.add_frame(vbuf.clone());
597 vbuf
598 } else {
599 return Err(DecoderError::AllocError);
600 }
601 };
602
603 let cur_pic = PictureInfo {
604 id: slice_hdr.frame_num,
605 full_id, user_id, time,
606 pic_type: slice_hdr.slice_type.to_frame_type(),
607 buf,
608 cur_mb: 0,
609 is_ref: nal_ref_idc != 0,
610 is_idr,
611 long_term: get_long_term_id(is_idr, &slice_hdr),
612 mv_info: NABufferRef::new(FrameMV::new(sps.pic_width_in_mbs, sps.pic_height_in_mbs)),
613 };
614
615 self.cur_fdec = Some(FrameDecoder{
616 slices: Vec::new(),
617 sstate: SliceState::new(),
618 ipcm_buf: [0; 256 + 64 + 64],
619 //width, height,
620 num_mbs,
621 sps: Arc::clone(sps),
622 pps: Arc::clone(&self.pps[self.cur_pps]),
623 dispatch: Arc::clone(&self.dispatch),
624 cavlc_cb: Arc::clone(&self.cavlc_cb),
625 mc_dsp,
626 cur_pic,
627 is_mbaff,
628 deblock_skip: self.deblock_skip,
629 });
630 } else {
631 if let Some(ref mut fdec) = self.cur_fdec {
632 let new_type = slice_hdr.slice_type.to_frame_type();
633 let pic = &mut fdec.cur_pic;
634 pic.pic_type = match (pic.pic_type, new_type) {
635 (FrameType::I, _) => new_type,
636 (_, FrameType::B) => FrameType::B,
637 _ => pic.pic_type,
638 };
639 full_id = pic.full_id;
640 } else {
641 return Ok(());
642 }
643 }
644
645 let sps = &self.sps[self.cur_sps];
646
647 self.frame_refs.select_refs(sps, &slice_hdr, full_id);
648
649 if slice_hdr.adaptive_ref_pic_marking_mode {
650 self.frame_refs.apply_adaptive_marking(&slice_hdr.adaptive_ref_pic_marking, slice_hdr.frame_num, 1 << self.sps[self.cur_sps].log2_max_frame_num)?;
651 }
652 if let Some(ref mut fdec) = self.cur_fdec {
653 fdec.slices.push((slice_hdr, hdr_size, self.frame_refs.cur_refs.clone(), src));
654 }
655 },
656 2 => { // slice data partition A
657 //slice header
658 //slice id = read_ue()
659 //cat 2 slice data (all but MB layer residual)
660 return Err(DecoderError::NotImplemented);
661 },
662 3 => { // slice data partition B
663 //slice id = read_ue()
664 //if pps.redundant_pic_cnt_present { redundant_pic_cnt = read_ue() }
665 //cat 3 slice data (MB layer residual)
666 return Err(DecoderError::NotImplemented);
667 },
668 4 => { // slice data partition C
669 //slice id = read_ue()
670 //if pps.redundant_pic_cnt_present { redundant_pic_cnt = read_ue() }
671 //cat 4 slice data (MB layer residual)
672 return Err(DecoderError::NotImplemented);
673 },
674 6 => {}, //SEI
675 7 => {
676 let sps = parse_sps(&src[1..])?;
677 self.sps.push(Arc::new(sps));
678 },
679 8 => {
680 validate!(full_size >= 8 + 16);
681 let pps = parse_pps(&src[1..], self.sps.as_slice(), full_size - 8)?;
682 let mut found = false;
683 for stored_pps in self.pps.iter_mut() {
684 if stored_pps.pic_parameter_set_id == pps.pic_parameter_set_id {
685 *stored_pps = Arc::clone(&pps);
686 found = true;
687 break;
688 }
689 }
690 if !found {
691 self.pps.push(pps);
692 }
693 },
694 9 => { // access unit delimiter
695 },
696 10 => {}, //end of sequence
697 11 => {}, //end of stream
698 12 => {}, //filler
699 _ => {},
700 };
701
702 Ok(())
703 }
704}
705
706impl NADecoderMT for H264MTDecoder {
707 fn init(&mut self, supp: &mut NADecoderSupport, info: NACodecInfoRef, nthreads: usize) -> DecoderResult<()> {
708 if let NACodecTypeInfo::Video(vinfo) = info.get_properties() {
709 let fmt = YUV420_FORMAT;
710 let myinfo = NACodecTypeInfo::Video(NAVideoInfo::new(0, 0, false, fmt));
711 self.info = NACodecInfo::new_ref(info.get_name(), myinfo, info.get_extradata()).into_ref();
712
713 let edata = info.get_extradata().unwrap();
714//print!("edata:"); for &el in edata.iter() { print!(" {:02X}", el); } println!();
715 if edata.len() > 11 && &edata[0..4] == b"avcC" {
716 let mut mr = MemoryReader::new_read(edata.as_slice());
717 let mut br = ByteReader::new(&mut mr);
718
719 br.read_skip(4)?;
720 let version = br.read_byte()?;
721 validate!(version == 1);
722 let profile = br.read_byte()?;
723 let _compatibility = br.read_byte()?;
724 let _level = br.read_byte()?;
725 let b = br.read_byte()?;
726 validate!((b & 0xFC) == 0xFC);
727 self.nal_len = (b & 3) + 1;
728 let b = br.read_byte()?;
729 validate!((b & 0xE0) == 0xE0);
730 let num_sps = (b & 0x1F) as usize;
731 for _ in 0..num_sps {
732 let len = br.read_u16be()? as usize;
733 let offset = br.tell() as usize;
734 validate!((br.peek_byte()? & 0x1F) == 7);
735 let mut nal_buf = Vec::new();
736 let _size = unescape_nal(&edata[offset..][..len], &mut nal_buf);
737 self.handle_nal(nal_buf, supp, true, 0, NATimeInfo::new(None, None, None, 0, 0))?;
738 br.read_skip(len)?;
739 }
740 let num_pps = br.read_byte()? as usize;
741 for _ in 0..num_pps {
742 let len = br.read_u16be()? as usize;
743 let offset = br.tell() as usize;
744 validate!((br.peek_byte()? & 0x1F) == 8);
745 let mut nal_buf = Vec::new();
746 let _size = unescape_nal(&edata[offset..][..len], &mut nal_buf);
747 self.handle_nal(nal_buf, supp, true, 0, NATimeInfo::new(None, None, None, 0, 0))?;
748 br.read_skip(len)?;
749 }
750 if br.left() > 0 {
751 match profile {
752 100 | 110 | 122 | 144 => {
753 let b = br.read_byte()?;
754 validate!((b & 0xFC) == 0xFC);
755 // b & 3 -> chroma format
756 let b = br.read_byte()?;
757 validate!((b & 0xF8) == 0xF8);
758 // b & 7 -> luma depth minus 8
759 let b = br.read_byte()?;
760 validate!((b & 0xF8) == 0xF8);
761 // b & 7 -> chroma depth minus 8
762 let num_spsext = br.read_byte()? as usize;
763 for _ in 0..num_spsext {
764 let len = br.read_u16be()? as usize;
765 // parse spsext
766 br.read_skip(len)?;
767 }
768 },
769 _ => {},
770 };
771 }
772 } else {
773 return Err(DecoderError::NotImplemented);
774 }
775
776 let mut width = vinfo.get_width();
777 let mut height = vinfo.get_height();
778
779 if (width == 0 || height == 0) && !self.sps.is_empty() {
780 width = self.sps[0].pic_width_in_mbs * 16;
781 height = self.sps[0].pic_height_in_mbs * 16;
782 }
783
784 let num_bufs = if !self.sps.is_empty() {
e6aaad5c 785 self.sps[0].num_ref_frames + 1
11d7aef2
KS
786 } else {
787 3
788 }.max(16 + 1);
789 if let Ok(ref mut sd) = self.dispatch.write() {
790 sd.max_threads = nthreads;
791 } else {
792 return Err(DecoderError::Bug);
793 }
794 supp.pool_u8.set_dec_bufs(num_bufs + nthreads);
795 supp.pool_u8.prealloc_video(NAVideoInfo::new(width, height, false, fmt), 4)?;
796
cc818ce8
KS
797 self.avg_pool.prealloc_video(AVG_BUF_VINFO, 4)?;
798
11d7aef2
KS
799 Ok(())
800 } else {
801 Err(DecoderError::InvalidData)
802 }
803 }
804 fn can_take_input(&mut self) -> bool {
805 if let Ok(ref sd) = self.dispatch.read() {
806 sd.can_decode_more()
807 } else {
808 false
809 }
810 }
811 fn queue_pkt(&mut self, supp: &mut NADecoderSupport, pkt: &NAPacket, user_id: u32) -> DecoderResult<bool> {
812 if !self.can_take_input() {
813 return Ok(false);
814 }
815
816 let src = pkt.get_buffer();
817
818 let mut mr = MemoryReader::new_read(&src);
819 let mut br = ByteReader::new(&mut mr);
820 let mut nal_buf = Vec::with_capacity(src.len());
821
822 if self.nal_len > 0 {
823 let mut skip_decoding = false;
824 if self.skip_mode != FrameSkipMode::None {
825 let mut pic_type = FrameType::I;
826 let mut is_ref = false;
827 while br.left() > 0 {
828 let size = match self.nal_len {
829 1 => br.read_byte()? as usize,
830 2 => br.read_u16be()? as usize,
831 3 => br.read_u24be()? as usize,
832 4 => br.read_u32be()? as usize,
833 _ => unreachable!(),
834 };
835 validate!(br.left() >= (size as i64));
836 let offset = br.tell() as usize;
837 let size = unescape_nal(&src[offset..][..size], &mut nal_buf);
838 validate!(size > 0);
839 let nal_ref_idc = nal_buf[0] >> 5;
840 let nal_unit_type = nal_buf[0] & 0x1F;
841 if nal_unit_type == 1 || nal_unit_type == 5 {
842 let mut bitr = BitReader::new(&nal_buf[1..], BitReaderMode::BE);
843 let (first_mb, slice_type) = parse_slice_header_minimal(&mut bitr)?;
844 if first_mb == 0 && nal_ref_idc != 0 {
845 is_ref = true;
846 }
847 let new_type = slice_type.to_frame_type();
848 pic_type = match (pic_type, new_type) {
849 (FrameType::I, _) => new_type,
850 (_, FrameType::B) => FrameType::B,
851 _ => pic_type,
852 };
853 }
854 br.read_skip(size)?;
855 }
856 match self.skip_mode {
857 FrameSkipMode::IntraOnly => {
858 skip_decoding = pic_type != FrameType::I;
859 },
860 FrameSkipMode::KeyframesOnly => {
861 if !is_ref {
862 skip_decoding = true;
863 }
864 },
865 _ => {},
866 };
867 br.seek(SeekFrom::Start(0))?;
868 }
869
870 let mut initial_ref_frames = Vec::new();
871 self.frame_refs.fill_ref_nums(&mut initial_ref_frames);
872
873 while br.left() > 0 {
874 let size = match self.nal_len {
875 1 => br.read_byte()? as usize,
876 2 => br.read_u16be()? as usize,
877 3 => br.read_u24be()? as usize,
878 4 => br.read_u32be()? as usize,
879 _ => unreachable!(),
880 };
881 validate!(br.left() >= (size as i64));
882 let offset = br.tell() as usize;
883 let mut cur_nal_buf = Vec::with_capacity(size);
884 let _size = unescape_nal(&src[offset..][..size], &mut cur_nal_buf);
885 self.handle_nal(cur_nal_buf, supp, skip_decoding, user_id, pkt.ts)?;
886 br.read_skip(size)?;
887 }
888 let mut fdec = None;
889 std::mem::swap(&mut fdec, &mut self.cur_fdec);
890 if let Some(fdc) = fdec {
891 let cpic = &fdc.cur_pic;
892 if cpic.is_ref {
893 self.frame_refs.add_short_term(cpic.clone(), self.sps[self.cur_sps].num_ref_frames);
894 }
895 if let Some(lt_idx) = cpic.long_term {
896 self.frame_refs.add_long_term(lt_idx, cpic.clone());
897 }
898 let mut ref_frames = Vec::new();
899 self.frame_refs.fill_ref_nums(&mut ref_frames);
900 queue_decoding(&mut self.dispatch, fdc, &initial_ref_frames, &ref_frames);
901 }
902 } else {
903//todo NAL detection
904 unimplemented!();
905 }
906 Ok(true)
907 }
908 fn has_output(&mut self) -> bool {
909 if let Ok(ref ds) = self.dispatch.read() {
910 ds.has_output()
911 } else {
912 panic!("can't peek into status");
913 }
914 }
915 fn get_frame(&mut self) -> (DecoderResult<NAFrameRef>, u32) {
916 match wait_for_one(&mut self.dispatch) {
917 Ok(cpic) => {
918 let bufinfo = NABufferType::Video(cpic.buf.clone());
919 let ftype = cpic.pic_type;
920 let dts = Some(u64::from(cpic.full_id));
921 let mut frm = NAFrame::new(cpic.time, ftype, cpic.is_idr, self.info.clone(), bufinfo);
922 if let (Some(mydts), None) = (dts, frm.get_dts()) {
923 frm.set_dts(Some(mydts));
924 }
925 frm.set_id(cpic.user_id as i64);
926 (Ok(frm.into_ref()), cpic.user_id)
927 },
928 Err((err, id)) => (Err(err), id),
929 }
930 }
931 fn flush(&mut self) {
932 clear_threads(&mut self.dispatch);
f2cb96ff 933 self.frame_refs.clear_refs();
11d7aef2
KS
934 }
935}
936
937impl NAOptionHandler for H264MTDecoder {
938 fn get_supported_options(&self) -> &[NAOptionDefinition] { DECODER_OPTIONS }
939 fn set_options(&mut self, options: &[NAOption]) {
940 for option in options.iter() {
941 for opt_def in DECODER_OPTIONS.iter() {
942 if opt_def.check(option).is_ok() {
943 match (option.name, &option.value) {
944 (FRAME_SKIP_OPTION, NAValue::String(ref strval)) => {
945 if let Ok(smode) = FrameSkipMode::from_str(strval) {
946 self.skip_mode = smode;
947 }
948 },
949 (DEBLOCK_SKIP_OPTION, NAValue::Bool(val)) => {
950 self.deblock_skip = *val;
951 },
952 _ => {},
953 }
954 }
955 }
956 }
957 }
958 fn query_option_value(&self, name: &str) -> Option<NAValue> {
959 match name {
960 FRAME_SKIP_OPTION => Some(NAValue::String(self.skip_mode.to_string())),
961 DEBLOCK_SKIP_OPTION => Some(NAValue::Bool(self.deblock_skip)),
962 _ => None,
963 }
964 }
965}
966
967pub fn get_decoder_mt() -> Box<dyn NADecoderMT + Send> {
968 Box::new(H264MTDecoder::new())
969}