replace vec.truncate(0) with vec.clear()
[nihav.git] / nihav-commonfmt / src / codecs / cinepakenc.rs
1 use nihav_core::codecs::*;
2 use nihav_core::io::byteio::*;
3 use nihav_codec_support::vq::*;
4
/// One codebook vector: four luma samples together with one U and one V sample.
#[derive(Clone, Copy, Debug, Default, PartialEq)]
struct YUVCode {
    /// Luma samples of the vector.
    y: [u8; 4],
    /// Chroma U sample.
    u: u8,
    /// Chroma V sample.
    v: u8,
}
11 impl VQElement for YUVCode {
12 fn dist(&self, rval: Self) -> u32 {
13 let mut ysum = 0;
14 for (y0, y1) in self.y.iter().zip(rval.y.iter()) {
15 let yd = i32::from(*y0) - i32::from(*y1);
16 ysum += yd * yd;
17 }
18 let ud = i32::from(self.u) - i32::from(rval.u);
19 let vd = i32::from(self.v) - i32::from(rval.v);
20 (ysum + ud * ud + vd * vd) as u32
21 }
22 fn min_cw() -> Self { YUVCode { y: [0; 4], u: 0, v: 0 } }
23 fn max_cw() -> Self { YUVCode { y: [255; 4], u: 255, v: 255 } }
24 fn min(&self, rval: Self) -> Self {
25 let mut ycode = YUVCode::default();
26 for i in 0..4 {
27 ycode.y[i] = self.y[i].min(rval.y[i]);
28 }
29 ycode.u = self.u.min(rval.u);
30 ycode.v = self.v.min(rval.v);
31 ycode
32 }
33 fn max(&self, rval: Self) -> Self {
34 let mut ycode = YUVCode::default();
35 for i in 0..4 {
36 ycode.y[i] = self.y[i].max(rval.y[i]);
37 }
38 ycode.u = self.u.max(rval.u);
39 ycode.v = self.v.max(rval.v);
40 ycode
41 }
42 fn num_components() -> usize { 6 }
43 fn sort_by_component(arr: &mut [Self], component: usize) {
44 let mut counts = [0; 256];
45 for entry in arr.iter() {
46 let idx = match component {
47 0 | 1 | 2 | 3 => entry.y[component],
48 4 => entry.u,
49 _ => entry.v,
50 } as usize;
51 counts[idx] += 1;
52 }
53 let mut offs = [0; 256];
54 for i in 0..255 {
55 offs[i + 1] = offs[i] + counts[i];
56 }
57 let mut dst = vec![YUVCode::default(); arr.len()];
58 for entry in arr.iter() {
59 let idx = match component {
60 0 | 1 | 2 | 3 => entry.y[component],
61 4 => entry.u,
62 _ => entry.v,
63 } as usize;
64 dst[offs[idx]] = *entry;
65 offs[idx] += 1;
66 }
67 arr.copy_from_slice(dst.as_slice());
68 }
69 fn max_dist_component(min: &Self, max: &Self) -> usize {
70 let mut comp = 0;
71 let mut diff = 0;
72 for i in 0..4 {
73 let d = u32::from(max.y[i]) - u32::from(min.y[i]);
74 if d > diff {
75 diff = d;
76 comp = i;
77 }
78 }
79 let ud = u32::from(max.u) - u32::from(min.u);
80 if ud > diff {
81 diff = ud;
82 comp = 4;
83 }
84 let vd = u32::from(max.v) - u32::from(min.v);
85 if vd > diff {
86 comp = 5;
87 }
88 comp
89 }
90 }
91
/// Running weighted sums of `YUVCode` components, used to compute a centroid.
#[derive(Default)]
struct YUVCodeSum {
    /// Weighted sum of each luma sample.
    ysum: [u64; 4],
    /// Weighted sum of the U sample.
    usum: u64,
    /// Weighted sum of the V sample.
    vsum: u64,
    /// Total weight accumulated so far.
    count: u64,
}
99
100 impl VQElementSum<YUVCode> for YUVCodeSum {
101 fn zero() -> Self { Self::default() }
102 fn add(&mut self, rval: YUVCode, count: u64) {
103 for i in 0..4 {
104 self.ysum[i] += u64::from(rval.y[i]) * count;
105 }
106 self.usum += u64::from(rval.u) * count;
107 self.vsum += u64::from(rval.v) * count;
108 self.count += count;
109 }
110 fn get_centroid(&self) -> YUVCode {
111 if self.count != 0 {
112 let mut ycode = YUVCode::default();
113 for i in 0..4 {
114 ycode.y[i] = ((self.ysum[i] + self.count / 2) / self.count) as u8;
115 }
116 ycode.u = ((self.usum + self.count / 2) / self.count) as u8;
117 ycode.v = ((self.vsum + self.count / 2) / self.count) as u8;
118 ycode
119 } else {
120 YUVCode::default()
121 }
122 }
123 }
124
125 struct RNG {
126 seed: u32,
127 }
128
129 impl RNG {
130 fn new() -> Self { Self { seed: 0x12345678 } }
131 fn next(&mut self) -> u8 {
132 let mut x = self.seed;
133 x ^= x.wrapping_shl(13);
134 x ^= x >> 17;
135 self.seed = x;
136 (self.seed >> 24) as u8
137 }
138 fn fill_entry(&mut self, entry: &mut YUVCode) {
139 for y in entry.y.iter_mut() {
140 *y = self.next();
141 }
142 entry.u = self.next();
143 entry.v = self.next();
144 }
145 }
146
147 const GRAY_FORMAT: NAPixelFormaton = NAPixelFormaton {
148 model: ColorModel::YUV(YUVSubmodel::YUVJ),
149 components: 1,
150 comp_info: [Some(NAPixelChromaton{h_ss: 0, v_ss: 0, packed: false, depth: 8, shift: 0, comp_offs: 0, next_elem: 1}), None, None, None, None],
151 elem_size: 1,
152 be: true,
153 alpha: false,
154 palette: false,
155 };
156
/// Collects single-bit flags into 32-bit words, most significant bit first.
struct MaskWriter {
    /// Completed mask words.
    masks: Vec<u32>,
    /// Word currently being filled.
    mask: u32,
    /// Number of bits already stored in `mask`.
    pos: u8,
}

impl MaskWriter {
    /// Creates an empty writer.
    fn new() -> Self {
        MaskWriter { masks: Vec::new(), mask: 0, pos: 0 }
    }
    /// Drops all stored words and any partially filled word.
    fn reset(&mut self) {
        self.masks.clear();
        self.mask = 0;
        self.pos = 0;
    }
    /// Appends one bit and stores the word once 32 bits were collected.
    fn put_bit(&mut self, bit: bool) {
        self.mask = (self.mask << 1) | u32::from(bit);
        self.pos += 1;
        if self.pos == 32 {
            self.flush();
        }
    }
    /// Appends a zero bit (block coded with one V1 index).
    fn put_v1(&mut self) {
        self.put_bit(false);
    }
    /// Appends a one bit (block coded with four V4 indices).
    fn put_v4(&mut self) {
        self.put_bit(true);
    }
    /// Appends the inter-frame flag: zero when the block is skipped, one when it is coded.
    fn put_inter(&mut self, skip: bool) {
        self.put_bit(!skip);
    }
    /// Stores the current word as is and starts a new one.
    fn flush(&mut self) {
        self.masks.push(self.mask);
        self.mask = 0;
        self.pos = 0;
    }
    /// Pads a partially filled word with zero bits and stores it; does nothing on a word boundary.
    fn end(&mut self) {
        if self.pos > 0 {
            // pos is in 1..=31 here, so the shift amount is always valid.
            self.mask <<= 32 - u32::from(self.pos);
            self.flush();
        }
    }
}
213
/// Codebook quantisation algorithm selected through the `quant_mode` option.
#[derive(Clone,Copy,PartialEq)]
enum QuantMode {
    /// ELBG quantiser seeded from the previous codebook.
    ELBG,
    /// Median cut followed by ELBG refinement.
    Hybrid,
    /// Median cut only.
    MedianCut,
}

/// Formats the mode as its option string (`"elbg"`, `"hybrid"` or `"mediancut"`).
///
/// `Display` is implemented instead of `ToString` directly; `to_string()` is still
/// available through the standard blanket implementation.
impl std::fmt::Display for QuantMode {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let name = match *self {
            QuantMode::ELBG => "elbg",
            QuantMode::Hybrid => "hybrid",
            QuantMode::MedianCut => "mediancut",
        };
        f.write_str(name)
    }
}
230
231 struct CinepakEncoder {
232 stream: Option<NAStreamRef>,
233 lastfrm: Option<NAVideoBufferRef<u8>>,
234 pkt: Option<NAPacket>,
235 frmcount: u8,
236 key_int: u8,
237 qmode: QuantMode,
238 quality: u8,
239 nstrips: usize,
240 cur_strip: usize,
241 v1_entries: Vec<YUVCode>,
242 v4_entries: Vec<YUVCode>,
243 v1_cb: Vec<[YUVCode; 256]>,
244 v4_cb: Vec<[YUVCode; 256]>,
245 v1_cur_cb: Vec<[YUVCode; 256]>,
246 v4_cur_cb: Vec<[YUVCode; 256]>,
247 v1_len: usize,
248 v4_len: usize,
249 v1_idx: Vec<u8>,
250 v4_idx: Vec<u8>,
251 grayscale: bool,
252 rng: RNG,
253 masks: MaskWriter,
254 skip_dist: Vec<u32>,
255 }
256
/// Averages four samples; the `+ 3` bias makes the division round up.
fn avg4(a: u8, b: u8, c: u8, d: u8) -> u8 {
    let total: u16 = [a, b, c, d].iter().map(|&px| u16::from(px)).sum();
    ((total + 3) >> 2) as u8
}
260
261 fn patch_size(bw: &mut ByteWriter, pos: u64) -> EncoderResult<()> {
262 let size = bw.tell() - pos;
263 bw.seek(SeekFrom::Current(-((size + 3) as i64)))?;
264 bw.write_u24be((size + 4) as u32)?;
265 bw.seek(SeekFrom::End(0))?;
266 Ok(())
267 }
268
269 impl CinepakEncoder {
270 fn new() -> Self {
271 Self {
272 stream: None,
273 pkt: None,
274 lastfrm: None,
275 frmcount: 0,
276 qmode: QuantMode::MedianCut,
277 key_int: 25,
278 quality: 0,
279 nstrips: 2,
280 cur_strip: 0,
281 v1_entries: Vec::new(),
282 v4_entries: Vec::new(),
283 v1_cb: Vec::with_capacity(2),
284 v4_cb: Vec::with_capacity(2),
285 v1_cur_cb: Vec::with_capacity(2),
286 v4_cur_cb: Vec::with_capacity(2),
287 v1_len: 0,
288 v4_len: 0,
289 grayscale: false,
290 rng: RNG::new(),
291 v1_idx: Vec::new(),
292 v4_idx: Vec::new(),
293 masks: MaskWriter::new(),
294 skip_dist: Vec::new(),
295 }
296 }
297 fn read_strip(&mut self, in_frm: &NAVideoBuffer<u8>, start: usize, end: usize) {
298 let ystride = in_frm.get_stride(0);
299 let mut yoff = in_frm.get_offset(0) + start * ystride;
300 let ustride = in_frm.get_stride(1);
301 let mut uoff = in_frm.get_offset(1) + start / 2 * ustride;
302 let vstride = in_frm.get_stride(2);
303 let mut voff = in_frm.get_offset(2) + start / 2 * vstride;
304 let (width, _) = in_frm.get_dimensions(0);
305 let data = in_frm.get_data();
306 self.v1_entries.clear();
307 self.v4_entries.clear();
308 for _ in (start..end).step_by(4) {
309 for x in (0..width).step_by(4) {
310 let mut yblk = [0; 16];
311 let mut ublk = [128; 4];
312 let mut vblk = [128; 4];
313 for j in 0..4 {
314 for i in 0..4 {
315 yblk[i + j * 4] = data[yoff + x + i + j * ystride];
316 }
317 }
318 if !self.grayscale {
319 for j in 0..2 {
320 for i in 0..2 {
321 ublk[i + j * 2] = data[uoff + x / 2 + i + j * ustride];
322 vblk[i + j * 2] = data[voff + x / 2 + i + j * vstride];
323 }
324 }
325 }
326 self.v1_entries.push(YUVCode {
327 y: [avg4(yblk[ 0], yblk[ 1], yblk[ 4], yblk[ 5]),
328 avg4(yblk[ 2], yblk[ 3], yblk[ 6], yblk[ 7]),
329 avg4(yblk[ 8], yblk[ 9], yblk[12], yblk[13]),
330 avg4(yblk[10], yblk[11], yblk[14], yblk[15])],
331 u: avg4(ublk[0], ublk[1], ublk[2], ublk[3]),
332 v: avg4(vblk[0], vblk[1], vblk[2], vblk[3]),
333 });
334 for i in 0..4 {
335 let yidx = (i & 1) * 2 + (i & 2) * 4;
336 self.v4_entries.push(YUVCode {
337 y: [ yblk[yidx], yblk[yidx + 1], yblk[yidx + 4], yblk[yidx + 5] ],
338 u: ublk[i],
339 v: vblk[i],
340 });
341 }
342 }
343 yoff += ystride * 4;
344 uoff += ustride * 2;
345 voff += vstride * 2;
346 }
347 }
348 fn find_nearest(codebook: &[YUVCode], code: YUVCode) -> (u8, u32) {
349 let mut min_dist = std::u32::MAX;
350 let mut idx = 0;
351 for (i, cw) in codebook.iter().enumerate() {
352 let dist = cw.dist(code);
353 if dist < min_dist {
354 min_dist = dist;
355 idx = i;
356 if dist == 0 {
357 break;
358 }
359 }
360 }
361 (idx as u8, min_dist)
362 }
363 fn can_update_cb(new_cb: &[YUVCode; 256], old_cb: &[YUVCode; 256], cb_size: usize) -> bool {
364 let mut skip_count = 0;
365 for (new, old) in new_cb.iter().zip(old_cb.iter()) {
366 if new == old {
367 skip_count += 1;
368 }
369 }
370 let full_size = cb_size * 256;
371 let upd_size = cb_size * (256 - skip_count) + 64;
372 upd_size < full_size
373 }
374 fn write_cb(bw: &mut ByteWriter, mut id: u8, new_cb: &[YUVCode; 256], old_cb: &[YUVCode; 256], grayscale: bool, update: bool) -> EncoderResult<()> {
375 if grayscale {
376 id |= 4;
377 }
378 if update {
379 id |= 1;
380 }
381 bw.write_byte(id)?;
382 bw.write_u24be(0)?;
383 let chunk_pos = bw.tell();
384 if !update {
385 for entry in new_cb.iter() {
386 bw.write_buf(&entry.y)?;
387 if !grayscale {
388 bw.write_byte(entry.u ^ 0x80)?;
389 bw.write_byte(entry.v ^ 0x80)?;
390 }
391 }
392 } else {
393 let mut end = 256;
394 for (i, (ncw, ocw)) in new_cb.iter().rev().zip(old_cb.iter().rev()).enumerate() {
395 if ncw == ocw {
396 end = i;
397 } else {
398 break;
399 }
400 }
401 for i in (0..end).step_by(32) {
402 let mut mask = 0;
403 for j in 0..32 {
404 mask <<= 1;
405 if new_cb[i + j] != old_cb[i + j] {
406 mask |= 1;
407 }
408 }
409 bw.write_u32be(mask)?;
410 for j in 0..32 {
411 if new_cb[i + j] == old_cb[i + j] { continue; }
412 bw.write_buf(&new_cb[i + j].y)?;
413 if !grayscale {
414 bw.write_byte(new_cb[i + j].u ^ 0x80)?;
415 bw.write_byte(new_cb[i + j].v ^ 0x80)?;
416 }
417 }
418 }
419 }
420 patch_size(bw, chunk_pos)?;
421 Ok(())
422 }
423 fn render_stripe(&mut self, intra: bool, start: usize, end: usize) {
424 if let Some(ref mut dst_frm) = self.lastfrm {
425 let ystride = dst_frm.get_stride(0);
426 let mut yoff = dst_frm.get_offset(0) + start * ystride;
427 let ustride = dst_frm.get_stride(1);
428 let mut uoff = dst_frm.get_offset(1) + start / 2 * ustride;
429 let vstride = dst_frm.get_stride(2);
430 let mut voff = dst_frm.get_offset(2) + start / 2 * vstride;
431 let (width, _) = dst_frm.get_dimensions(0);
432 let data = dst_frm.get_data_mut().unwrap();
433 let mut miter = self.masks.masks.iter();
434 let mut v1_iter = self.v1_idx.iter();
435 let mut v4_iter = self.v4_idx.iter();
436 let mut cur_mask = 0;
437 let mut cur_bit = 0;
438 for _ in (start..end).step_by(4) {
439 for x in (0..width).step_by(4) {
440 if cur_bit == 0 {
441 if !intra || !self.v1_idx.is_empty() {
442 cur_mask = *miter.next().unwrap();
443 } else {
444 cur_mask = 0xFFFFFFFF;
445 }
446 cur_bit = 1 << 31;
447 }
448 if !intra {
449 if (cur_mask & cur_bit) == 0 {
450 cur_bit >>= 1;
451 continue;
452 }
453 cur_bit >>= 1;
454 if cur_bit == 0 {
455 cur_mask = *miter.next().unwrap();
456 cur_bit = 1 << 31;
457 }
458 }
459 if (cur_mask & cur_bit) == 0 {
460 let idx = *v1_iter.next().unwrap() as usize;
461 let cb = &self.v1_cur_cb[self.cur_strip][idx];
462
463 let mut coff = yoff + x;
464 data[coff] = cb.y[0]; data[coff + 1] = cb.y[0];
465 data[coff + 2] = cb.y[1]; data[coff + 3] = cb.y[1];
466 coff += ystride;
467 data[coff] = cb.y[0]; data[coff + 1] = cb.y[0];
468 data[coff + 2] = cb.y[1]; data[coff + 3] = cb.y[1];
469 coff += ystride;
470 data[coff] = cb.y[2]; data[coff + 1] = cb.y[2];
471 data[coff + 2] = cb.y[3]; data[coff + 3] = cb.y[3];
472 coff += ystride;
473 data[coff] = cb.y[2]; data[coff + 1] = cb.y[2];
474 data[coff + 2] = cb.y[3]; data[coff + 3] = cb.y[3];
475
476 if !self.grayscale {
477 let mut coff = uoff + x / 2;
478 data[coff] = cb.u; data[coff + 1] = cb.u;
479 coff += ustride;
480 data[coff] = cb.u; data[coff + 1] = cb.u;
481
482 let mut coff = voff + x / 2;
483 data[coff] = cb.v; data[coff + 1] = cb.v;
484 coff += vstride;
485 data[coff] = cb.v; data[coff + 1] = cb.v;
486 }
487 } else {
488 let idx0 = *v4_iter.next().unwrap() as usize;
489 let cb0 = &self.v4_cur_cb[self.cur_strip][idx0];
490 let idx1 = *v4_iter.next().unwrap() as usize;
491 let cb1 = &self.v4_cur_cb[self.cur_strip][idx1];
492 let idx2 = *v4_iter.next().unwrap() as usize;
493 let cb2 = &self.v4_cur_cb[self.cur_strip][idx2];
494 let idx3 = *v4_iter.next().unwrap() as usize;
495 let cb3 = &self.v4_cur_cb[self.cur_strip][idx3];
496
497 let mut coff = yoff + x;
498 data[coff] = cb0.y[0]; data[coff + 1] = cb0.y[1];
499 data[coff + 2] = cb1.y[0]; data[coff + 3] = cb1.y[1];
500 coff += ystride;
501 data[coff] = cb0.y[2]; data[coff + 1] = cb0.y[3];
502 data[coff + 2] = cb1.y[2]; data[coff + 3] = cb1.y[3];
503 coff += ystride;
504 data[coff] = cb2.y[0]; data[coff + 1] = cb2.y[1];
505 data[coff + 2] = cb3.y[0]; data[coff + 3] = cb3.y[1];
506 coff += ystride;
507 data[coff] = cb2.y[2]; data[coff + 1] = cb2.y[3];
508 data[coff + 2] = cb3.y[2]; data[coff + 3] = cb3.y[3];
509
510 if !self.grayscale {
511 let mut coff = uoff + x / 2;
512 data[coff] = cb0.u; data[coff + 1] = cb1.u;
513 coff += ustride;
514 data[coff] = cb2.u; data[coff + 1] = cb3.u;
515
516 let mut coff = voff + x / 2;
517 data[coff] = cb0.v; data[coff + 1] = cb1.v;
518 coff += vstride;
519 data[coff] = cb2.v; data[coff + 1] = cb3.v;
520 }
521 }
522 cur_bit >>= 1;
523 }
524 yoff += ystride * 4;
525 uoff += ustride * 2;
526 voff += vstride * 2;
527 }
528 } else {
529 unreachable!();
530 }
531 }
532 fn calc_skip_dist(&mut self, in_frm: &NAVideoBuffer<u8>, start: usize, end: usize) {
533 self.skip_dist.clear();
534 if let Some(ref ref_frm) = self.lastfrm {
535 let rystride = ref_frm.get_stride(0);
536 let mut ryoff = ref_frm.get_offset(0) + start * rystride;
537 let rustride = ref_frm.get_stride(1);
538 let mut ruoff = ref_frm.get_offset(1) + start / 2 * rustride;
539 let rvstride = ref_frm.get_stride(2);
540 let mut rvoff = ref_frm.get_offset(2) + start / 2 * rvstride;
541 let (width, _) = ref_frm.get_dimensions(0);
542 let rdata = ref_frm.get_data();
543
544 let iystride = in_frm.get_stride(0);
545 let mut iyoff = in_frm.get_offset(0) + start * iystride;
546 let iustride = in_frm.get_stride(1);
547 let mut iuoff = in_frm.get_offset(1) + start / 2 * iustride;
548 let ivstride = in_frm.get_stride(2);
549 let mut ivoff = in_frm.get_offset(2) + start / 2 * ivstride;
550 let idata = in_frm.get_data();
551
552 for _ in (start..end).step_by(4) {
553 for x in (0..width).step_by(4) {
554 let mut dist = 0;
555 let mut roff = ryoff + x;
556 let mut ioff = iyoff + x;
557 for _ in 0..4 {
558 for i in 0..4 {
559 let d = i32::from(rdata[roff + i]) - i32::from(idata[ioff + i]);
560 dist += d * d;
561 }
562 roff += rystride;
563 ioff += iystride;
564 }
565 if !self.grayscale {
566 let mut roff = ruoff + x / 2;
567 let mut ioff = iuoff + x / 2;
568 let ud = i32::from(rdata[roff]) - i32::from(idata[ioff]);
569 dist += ud * ud;
570 let ud = i32::from(rdata[roff + 1]) - i32::from(idata[ioff + 1]);
571 dist += ud * ud;
572 roff += rustride; ioff += iustride;
573 let ud = i32::from(rdata[roff]) - i32::from(idata[ioff]);
574 dist += ud * ud;
575 let ud = i32::from(rdata[roff + 1]) - i32::from(idata[ioff + 1]);
576 dist += ud * ud;
577
578 let mut roff = rvoff + x / 2;
579 let mut ioff = ivoff + x / 2;
580 let vd = i32::from(rdata[roff]) - i32::from(idata[ioff]);
581 dist += vd * vd;
582 let vd = i32::from(rdata[roff + 1]) - i32::from(idata[ioff + 1]);
583 dist += vd * vd;
584 roff += rvstride; ioff += ivstride;
585 let vd = i32::from(rdata[roff]) - i32::from(idata[ioff]);
586 dist += vd * vd;
587 let vd = i32::from(rdata[roff + 1]) - i32::from(idata[ioff + 1]);
588 dist += vd * vd;
589 }
590 self.skip_dist.push(dist as u32);
591 }
592
593 iyoff += iystride * 4;
594 iuoff += iustride * 2;
595 ivoff += ivstride * 2;
596 ryoff += rystride * 4;
597 ruoff += rustride * 2;
598 rvoff += rvstride * 2;
599 }
600 } else {
601 unreachable!();
602 }
603 }
604 fn quant_vectors(&mut self) {
605 match self.qmode {
606 QuantMode::ELBG => {
607 let mut elbg_v1: ELBG<YUVCode, YUVCodeSum> = ELBG::new(&self.v1_cb[self.cur_strip]);
608 let mut elbg_v4: ELBG<YUVCode, YUVCodeSum> = ELBG::new(&self.v4_cb[self.cur_strip]);
609
610 for entry in self.v1_cb[self.cur_strip].iter_mut().skip(self.v1_len) {
611 self.rng.fill_entry(entry);
612 }
613 for entry in self.v4_cb[self.cur_strip].iter_mut().skip(self.v4_len) {
614 self.rng.fill_entry(entry);
615 }
616
617 self.v1_len = elbg_v1.quantise(&self.v1_entries, &mut self.v1_cur_cb[self.cur_strip]);
618 self.v4_len = elbg_v4.quantise(&self.v4_entries, &mut self.v4_cur_cb[self.cur_strip]);
619 },
620 QuantMode::Hybrid => {
621 quantise_median_cut::<YUVCode, YUVCodeSum>(&self.v1_entries, &mut self.v1_cur_cb[self.cur_strip]);
622 quantise_median_cut::<YUVCode, YUVCodeSum>(&self.v4_entries, &mut self.v4_cur_cb[self.cur_strip]);
623 let mut elbg_v1: ELBG<YUVCode, YUVCodeSum> = ELBG::new(&self.v1_cur_cb[self.cur_strip]);
624 let mut elbg_v4: ELBG<YUVCode, YUVCodeSum> = ELBG::new(&self.v4_cur_cb[self.cur_strip]);
625 self.v1_len = elbg_v1.quantise(&self.v1_entries, &mut self.v1_cur_cb[self.cur_strip]);
626 self.v4_len = elbg_v4.quantise(&self.v4_entries, &mut self.v4_cur_cb[self.cur_strip]);
627 },
628 QuantMode::MedianCut => {
629 self.v1_len = quantise_median_cut::<YUVCode, YUVCodeSum>(&self.v1_entries, &mut self.v1_cur_cb[self.cur_strip]);
630 self.v4_len = quantise_median_cut::<YUVCode, YUVCodeSum>(&self.v4_entries, &mut self.v4_cur_cb[self.cur_strip]);
631 },
632 };
633
634 for e in self.v1_cur_cb[self.cur_strip].iter_mut().skip(self.v1_len) { *e = YUVCode::default(); }
635 for e in self.v4_cur_cb[self.cur_strip].iter_mut().skip(self.v4_len) { *e = YUVCode::default(); }
636 }
637 fn encode_intra(&mut self, bw: &mut ByteWriter, in_frm: &NAVideoBuffer<u8>) -> EncoderResult<bool> {
638 let (width, height) = in_frm.get_dimensions(0);
639 let mut strip_h = (height / self.nstrips + 3) & !3;
640 if strip_h == 0 {
641 self.nstrips = 1;
642 strip_h = height;
643 }
644 let mut start_line = 0;
645 let mut end_line = strip_h;
646
647 bw.write_byte(0)?; // intra flag
648 bw.write_u24be(0)?; // frame size
649 let frame_data_pos = bw.tell();
650 bw.write_u16be(width as u16)?;
651 bw.write_u16be(height as u16)?;
652 bw.write_u16be(self.nstrips as u16)?;
653
654 self.cur_strip = 0;
655 for entry in self.v1_cb[self.cur_strip].iter_mut() {
656 self.rng.fill_entry(entry);
657 }
658 for entry in self.v4_cb[self.cur_strip].iter_mut() {
659 self.rng.fill_entry(entry);
660 }
661 while start_line < height {
662 self.read_strip(in_frm, start_line, end_line);
663
664 if self.cur_strip > 0 {
665 self.v1_cb[self.cur_strip] = self.v1_cb[self.cur_strip - 1];
666 self.v4_cb[self.cur_strip] = self.v4_cb[self.cur_strip - 1];
667 }
668 self.quant_vectors();
669 if self.grayscale {
670 for cw in self.v1_cur_cb[self.cur_strip].iter_mut() {
671 cw.u = 128;
672 cw.v = 128;
673 }
674 for cw in self.v4_cur_cb[self.cur_strip].iter_mut() {
675 cw.u = 128;
676 cw.v = 128;
677 }
678 }
679
680 self.v1_idx.clear();
681 self.v4_idx.clear();
682 self.masks.reset();
683
684 for (v1_entry, v4_entries) in self.v1_entries.iter().zip(self.v4_entries.chunks(4)) {
685 let (v1_idx, v1_dist) = Self::find_nearest(&self.v1_cur_cb[self.cur_strip][..self.v1_len], *v1_entry);
686 if v1_dist == 0 {
687 self.masks.put_v1();
688 self.v1_idx.push(v1_idx);
689 continue;
690 }
691 let (v40_idx, v40_dist) = Self::find_nearest(&self.v4_cur_cb[self.cur_strip][..self.v4_len], v4_entries[0]);
692 let (v41_idx, v41_dist) = Self::find_nearest(&self.v4_cur_cb[self.cur_strip][..self.v4_len], v4_entries[1]);
693 let (v42_idx, v42_dist) = Self::find_nearest(&self.v4_cur_cb[self.cur_strip][..self.v4_len], v4_entries[2]);
694 let (v43_idx, v43_dist) = Self::find_nearest(&self.v4_cur_cb[self.cur_strip][..self.v4_len], v4_entries[3]);
695 if v40_dist + v41_dist + v42_dist + v43_dist > v1_dist {
696 self.masks.put_v4();
697 self.v4_idx.push(v40_idx);
698 self.v4_idx.push(v41_idx);
699 self.v4_idx.push(v42_idx);
700 self.v4_idx.push(v43_idx);
701 } else {
702 self.masks.put_v1();
703 self.v1_idx.push(v1_idx);
704 }
705 }
706 self.masks.end();
707
708 let mut is_intra_strip = start_line == 0;
709 let (upd_v1, upd_v4) = if !is_intra_strip {
710 let cb_size = if self.grayscale { 4 } else { 6 };
711 (Self::can_update_cb(&self.v1_cur_cb[self.cur_strip], &self.v1_cb[self.cur_strip], cb_size),
712 Self::can_update_cb(&self.v4_cur_cb[self.cur_strip], &self.v4_cb[self.cur_strip], cb_size))
713 } else {
714 (false, false)
715 };
716 if !is_intra_strip && !upd_v1 && !upd_v4 {
717 is_intra_strip = true;
718 }
719 bw.write_byte(if is_intra_strip { 0x10 } else { 0x11 })?;
720 bw.write_u24be(0)?; // strip size
721 let strip_data_pos = bw.tell();
722 bw.write_u16be(0)?; // yoff
723 bw.write_u16be(0)?; // xoff
724 bw.write_u16be((end_line - start_line) as u16)?;
725 bw.write_u16be(width as u16)?;
726
727 Self::write_cb(bw, 0x20, &self.v4_cur_cb[self.cur_strip], &self.v4_cb[self.cur_strip], self.grayscale, upd_v4)?;
728 Self::write_cb(bw, 0x22, &self.v1_cur_cb[self.cur_strip], &self.v1_cb[self.cur_strip], self.grayscale, upd_v1)?;
729
730 self.render_stripe(true, start_line, end_line);
731
732 if self.v4_idx.is_empty() {
733 bw.write_byte(0x32)?;
734 bw.write_u24be((self.v1_idx.len() + 4) as u32)?;
735 bw.write_buf(self.v1_idx.as_slice())?;
736 } else {
737 bw.write_byte(0x30)?;
738 bw.write_u24be(0)?;
739 let chunk_pos = bw.tell();
740 let mut v1_pos = 0;
741 let mut v4_pos = 0;
742 for _ in 0..32 {
743 self.v1_idx.push(0);
744 self.v4_idx.push(0);
745 self.v4_idx.push(0);
746 self.v4_idx.push(0);
747 self.v4_idx.push(0);
748 }
749 for mask in self.masks.masks.iter() {
750 bw.write_u32be(*mask)?;
751 for j in (0..32).rev() {
752 if (mask & (1 << j)) == 0 {
753 bw.write_byte(self.v1_idx[v1_pos])?;
754 v1_pos += 1;
755 } else {
756 bw.write_byte(self.v4_idx[v4_pos])?;
757 bw.write_byte(self.v4_idx[v4_pos + 1])?;
758 bw.write_byte(self.v4_idx[v4_pos + 2])?;
759 bw.write_byte(self.v4_idx[v4_pos + 3])?;
760 v4_pos += 4;
761 }
762 }
763 }
764 patch_size(bw, chunk_pos)?;
765 }
766
767 patch_size(bw, strip_data_pos)?;
768
769 self.v1_cb[self.cur_strip].copy_from_slice(&self.v1_cur_cb[self.cur_strip]);
770 self.v4_cb[self.cur_strip].copy_from_slice(&self.v4_cur_cb[self.cur_strip]);
771 start_line = end_line;
772 end_line = (end_line + strip_h).min(height);
773
774 self.cur_strip += 1;
775 }
776 patch_size(bw, frame_data_pos)?;
777 Ok(true)
778 }
779 fn encode_inter(&mut self, bw: &mut ByteWriter, in_frm: &NAVideoBuffer<u8>) -> EncoderResult<bool> {
780 let (width, height) = in_frm.get_dimensions(0);
781 let mut strip_h = (height / self.nstrips + 3) & !3;
782 if strip_h == 0 {
783 self.nstrips = 1;
784 strip_h = height;
785 }
786 let mut start_line = 0;
787 let mut end_line = strip_h;
788
789 bw.write_byte(1)?; // intra flag
790 bw.write_u24be(0)?; // frame size
791 let frame_data_pos = bw.tell();
792 bw.write_u16be(width as u16)?;
793 bw.write_u16be(height as u16)?;
794 bw.write_u16be(self.nstrips as u16)?;
795
796 self.cur_strip = 0;
797 while start_line < height {
798 self.read_strip(in_frm, start_line, end_line);
799 self.calc_skip_dist(in_frm, start_line, end_line);
800
801 self.quant_vectors();
802 if self.grayscale {
803 for cw in self.v1_cur_cb[self.cur_strip].iter_mut() {
804 cw.u = 128;
805 cw.v = 128;
806 }
807 for cw in self.v4_cur_cb[self.cur_strip].iter_mut() {
808 cw.u = 128;
809 cw.v = 128;
810 }
811 }
812
813 self.v1_idx.clear();
814 self.v4_idx.clear();
815 self.masks.reset();
816
817 let mut skip_iter = self.skip_dist.iter();
818 for (v1_entry, v4_entries) in self.v1_entries.iter().zip(self.v4_entries.chunks(4)) {
819 let skip_dist = *skip_iter.next().unwrap();
820 if skip_dist == 0 {
821 self.masks.put_inter(true);
822 continue;
823 }
824 let (v1_idx, v1_dist) = Self::find_nearest(&self.v1_cur_cb[self.cur_strip][..self.v1_len], *v1_entry);
825 if skip_dist < v1_dist {
826 self.masks.put_inter(true);
827 continue;
828 } else {
829 self.masks.put_inter(false);
830 }
831 if v1_dist == 0 {
832 self.masks.put_v1();
833 self.v1_idx.push(v1_idx);
834 continue;
835 }
836 let (v40_idx, v40_dist) = Self::find_nearest(&self.v4_cur_cb[self.cur_strip][..self.v4_len], v4_entries[0]);
837 let (v41_idx, v41_dist) = Self::find_nearest(&self.v4_cur_cb[self.cur_strip][..self.v4_len], v4_entries[1]);
838 let (v42_idx, v42_dist) = Self::find_nearest(&self.v4_cur_cb[self.cur_strip][..self.v4_len], v4_entries[2]);
839 let (v43_idx, v43_dist) = Self::find_nearest(&self.v4_cur_cb[self.cur_strip][..self.v4_len], v4_entries[3]);
840 if v40_dist + v41_dist + v42_dist + v43_dist > v1_dist {
841 self.masks.put_v4();
842 self.v4_idx.push(v40_idx);
843 self.v4_idx.push(v41_idx);
844 self.v4_idx.push(v42_idx);
845 self.v4_idx.push(v43_idx);
846 } else {
847 self.masks.put_v1();
848 self.v1_idx.push(v1_idx);
849 }
850 }
851 self.masks.end();
852
853 let (upd_v1, upd_v4) = {
854 let cb_size = if self.grayscale { 4 } else { 6 };
855 (Self::can_update_cb(&self.v1_cur_cb[self.cur_strip], &self.v1_cb[self.cur_strip], cb_size),
856 Self::can_update_cb(&self.v4_cur_cb[self.cur_strip], &self.v4_cb[self.cur_strip], cb_size))
857 };
858 bw.write_byte(0x11)?;
859 bw.write_u24be(0)?; // strip size
860 let strip_data_pos = bw.tell();
861 bw.write_u16be(0)?; // yoff
862 bw.write_u16be(0)?; // xoff
863 bw.write_u16be((end_line - start_line) as u16)?;
864 bw.write_u16be(width as u16)?;
865
866 Self::write_cb(bw, 0x20, &self.v4_cur_cb[self.cur_strip], &self.v4_cb[self.cur_strip], self.grayscale, upd_v4)?;
867 Self::write_cb(bw, 0x22, &self.v1_cur_cb[self.cur_strip], &self.v1_cb[self.cur_strip], self.grayscale, upd_v1)?;
868
869 self.render_stripe(false, start_line, end_line);
870
871 bw.write_byte(0x31)?;
872 bw.write_u24be(0)?;
873 let chunk_pos = bw.tell();
874 let mut v1_pos = 0;
875 let mut v4_pos = 0;
876 for _ in 0..32 {
877 self.v1_idx.push(0);
878 self.v4_idx.push(0);
879 self.v4_idx.push(0);
880 self.v4_idx.push(0);
881 self.v4_idx.push(0);
882 }
883 let mut skip = true;
884 for mask in self.masks.masks.iter() {
885 bw.write_u32be(*mask)?;
886 if *mask == 0 { continue; }
887 let mut bit = 1 << 31;
888 while bit > 0 {
889 if skip {
890 skip = (mask & bit) == 0;
891 bit >>= 1;
892 } else {
893 if (mask & bit) == 0 {
894 bw.write_byte(self.v1_idx[v1_pos])?;
895 v1_pos += 1;
896 } else {
897 bw.write_byte(self.v4_idx[v4_pos])?;
898 bw.write_byte(self.v4_idx[v4_pos + 1])?;
899 bw.write_byte(self.v4_idx[v4_pos + 2])?;
900 bw.write_byte(self.v4_idx[v4_pos + 3])?;
901 v4_pos += 4;
902 }
903 bit >>= 1;
904 skip = true;
905 }
906 }
907 }
908 patch_size(bw, chunk_pos)?;
909
910 patch_size(bw, strip_data_pos)?;
911
912 self.v1_cb[self.cur_strip].copy_from_slice(&self.v1_cur_cb[self.cur_strip]);
913 self.v4_cb[self.cur_strip].copy_from_slice(&self.v4_cur_cb[self.cur_strip]);
914 start_line = end_line;
915 end_line = (end_line + strip_h).min(height);
916
917 self.cur_strip += 1;
918 }
919 patch_size(bw, frame_data_pos)?;
920 Ok(true)
921 }
922 }
923
924 impl NAEncoder for CinepakEncoder {
925 fn negotiate_format(&self, encinfo: &EncodeParameters) -> EncoderResult<EncodeParameters> {
926 match encinfo.format {
927 NACodecTypeInfo::None => {
928 let mut ofmt = EncodeParameters::default();
929 ofmt.format = NACodecTypeInfo::Video(NAVideoInfo::new(0, 0, true, YUV420_FORMAT));
930 Ok(ofmt)
931 },
932 NACodecTypeInfo::Audio(_) => Err(EncoderError::FormatError),
933 NACodecTypeInfo::Video(vinfo) => {
934 let pix_fmt = if vinfo.format == GRAY_FORMAT { GRAY_FORMAT } else { YUV420_FORMAT };
935 let outinfo = NAVideoInfo::new((vinfo.width + 3) & !3, (vinfo.height + 3) & !3, false, pix_fmt);
936 let mut ofmt = *encinfo;
937 ofmt.format = NACodecTypeInfo::Video(outinfo);
938 Ok(ofmt)
939 }
940 }
941 }
942 fn init(&mut self, stream_id: u32, encinfo: EncodeParameters) -> EncoderResult<NAStreamRef> {
943 match encinfo.format {
944 NACodecTypeInfo::None => Err(EncoderError::FormatError),
945 NACodecTypeInfo::Audio(_) => Err(EncoderError::FormatError),
946 NACodecTypeInfo::Video(vinfo) => {
947 if vinfo.format != YUV420_FORMAT && vinfo.format != GRAY_FORMAT {
948 return Err(EncoderError::FormatError);
949 }
950 if ((vinfo.width | vinfo.height) & 3) != 0 {
951 return Err(EncoderError::FormatError);
952 }
953 if (vinfo.width | vinfo.height) >= (1 << 16) {
954 return Err(EncoderError::FormatError);
955 }
956
957 let out_info = NAVideoInfo::new(vinfo.width, vinfo.height, false, vinfo.format);
958 let info = NACodecInfo::new("cinepak", NACodecTypeInfo::Video(out_info), None);
959 let mut stream = NAStream::new(StreamType::Video, stream_id, info, encinfo.tb_num, encinfo.tb_den, 0);
960 stream.set_num(stream_id as usize);
961 let stream = stream.into_ref();
962
963 self.stream = Some(stream.clone());
964 self.quality = encinfo.quality;
965 self.grayscale = vinfo.format != YUV420_FORMAT;
966 let num_blocks = vinfo.width / 2 * vinfo.height / 2;
967 self.v1_entries = Vec::with_capacity(num_blocks);
968 self.v4_entries = Vec::with_capacity(num_blocks * 4);
969 self.v1_idx = Vec::with_capacity(num_blocks);
970 self.v4_idx = Vec::with_capacity(num_blocks * 4);
971 self.skip_dist = Vec::with_capacity(vinfo.width / 4 * vinfo.height / 4);
972
973 let buf = alloc_video_buffer(out_info, 2)?;
974 self.lastfrm = Some(buf.get_vbuf().unwrap());
975
976 Ok(stream)
977 },
978 }
979 }
980 fn encode(&mut self, frm: &NAFrame) -> EncoderResult<()> {
981 let buf = frm.get_buffer();
982 if let Some(ref vbuf) = buf.get_vbuf() {
983 let cur_strips = self.v1_cb.len();
984 if cur_strips != self.nstrips {
985 self.frmcount = 0;
986 }
987 if cur_strips < self.nstrips {
988 for _ in cur_strips..self.nstrips {
989 self.v1_cb.push([YUVCode::default(); 256]);
990 self.v4_cb.push([YUVCode::default(); 256]);
991 self.v1_cur_cb.push([YUVCode::default(); 256]);
992 self.v4_cur_cb.push([YUVCode::default(); 256]);
993 }
994 }
995
996 let mut dbuf = Vec::with_capacity(4);
997 let mut gw = GrowableMemoryWriter::new_write(&mut dbuf);
998 let mut bw = ByteWriter::new(&mut gw);
999 let is_intra = if self.frmcount == 0 {
1000 self.encode_intra(&mut bw, vbuf)?
1001 } else {
1002 self.encode_inter(&mut bw, vbuf)?
1003 };
1004 self.pkt = Some(NAPacket::new(self.stream.clone().unwrap(), frm.ts, is_intra, dbuf));
1005 self.frmcount += 1;
1006 if self.frmcount == self.key_int {
1007 self.frmcount = 0;
1008 }
1009 Ok(())
1010 } else {
1011 Err(EncoderError::InvalidParameters)
1012 }
1013 }
1014 fn get_packet(&mut self) -> EncoderResult<Option<NAPacket>> {
1015 let mut npkt = None;
1016 std::mem::swap(&mut self.pkt, &mut npkt);
1017 Ok(npkt)
1018 }
1019 fn flush(&mut self) -> EncoderResult<()> {
1020 self.frmcount = 0;
1021 Ok(())
1022 }
1023 }
1024
1025 const ENCODER_OPTS: &[NAOptionDefinition] = &[
1026 NAOptionDefinition {
1027 name: KEYFRAME_OPTION, description: KEYFRAME_OPTION_DESC,
1028 opt_type: NAOptionDefinitionType::Int(Some(0), Some(128)) },
1029 NAOptionDefinition {
1030 name: "nstrips", description: "Number of strips per frame (0 - automatic)",
1031 opt_type: NAOptionDefinitionType::Int(Some(0), Some(16)) },
1032 NAOptionDefinition {
1033 name: "quant_mode", description: "Quantisation mode",
1034 opt_type: NAOptionDefinitionType::String(Some(&["elbg", "hybrid", "mediancut"])) },
1035 ];
1036
1037 impl NAOptionHandler for CinepakEncoder {
1038 fn get_supported_options(&self) -> &[NAOptionDefinition] { ENCODER_OPTS }
1039 fn set_options(&mut self, options: &[NAOption]) {
1040 for option in options.iter() {
1041 for opt_def in ENCODER_OPTS.iter() {
1042 if opt_def.check(option).is_ok() {
1043 match option.name {
1044 KEYFRAME_OPTION => {
1045 if let NAValue::Int(intval) = option.value {
1046 self.key_int = intval as u8;
1047 }
1048 },
1049 "nstrips" => {
1050 if let NAValue::Int(intval) = option.value {
1051 self.nstrips = intval as usize;
1052 }
1053 },
1054 "quant_mode" => {
1055 if let NAValue::String(ref str) = option.value {
1056 match str.as_str() {
1057 "elbg" => self.qmode = QuantMode::ELBG,
1058 "hybrid" => self.qmode = QuantMode::Hybrid,
1059 "mediancut" => self.qmode = QuantMode::MedianCut,
1060 _ => {},
1061 };
1062 }
1063 },
1064 _ => {},
1065 };
1066 }
1067 }
1068 }
1069 }
1070 fn query_option_value(&self, name: &str) -> Option<NAValue> {
1071 match name {
1072 KEYFRAME_OPTION => Some(NAValue::Int(i64::from(self.key_int))),
1073 "nstrips" => Some(NAValue::Int(self.nstrips as i64)),
1074 "quant_mode" => Some(NAValue::String(self.qmode.to_string())),
1075 _ => None,
1076 }
1077 }
1078 }
1079
1080 pub fn get_encoder() -> Box<dyn NAEncoder + Send> {
1081 Box::new(CinepakEncoder::new())
1082 }
1083
#[cfg(test)]
mod test {
    use nihav_core::codecs::*;
    use nihav_core::demuxers::*;
    use nihav_core::muxers::*;
    use crate::*;
    use nihav_codec_support::test::enc_video::*;

    /// Decodes the first frames of a sample AVI, re-encodes them with the Cinepak
    /// encoder using default options and compares the output MD5 with a stored value.
    #[test]
    fn test_cinepak_encoder() {
        // Everything the helper needs to demux, decode, encode and mux.
        let mut dmx_reg = RegisteredDemuxers::new();
        generic_register_all_demuxers(&mut dmx_reg);
        let mut dec_reg = RegisteredDecoders::new();
        generic_register_all_decoders(&mut dec_reg);
        let mut mux_reg = RegisteredMuxers::new();
        generic_register_all_muxers(&mut mux_reg);
        let mut enc_reg = RegisteredEncoders::new();
        generic_register_all_encoders(&mut enc_reg);

        // Target format: dimensions are left at zero in the request.
        let dst_vinfo = NAVideoInfo {
            width:   0,
            height:  0,
            format:  YUV420_FORMAT,
            flipped: true,
            bits:    12,
        };
        let enc_params = EncodeParameters {
            format:  NACodecTypeInfo::Video(dst_vinfo),
            quality: 0,
            bitrate: 0,
            tb_num:  0,
            tb_den:  0,
            flags:   0,
        };

        let dec_config = DecoderTestParams {
            demuxer:     "avi",
            in_name:     "assets/Misc/TalkingHead_352x288.avi",
            stream_type: StreamType::Video,
            limit:       Some(2),
            dmx_reg, dec_reg,
        };
        let enc_config = EncoderTestParams {
            muxer:    "avi",
            enc_name: "cinepak",
            out_name: "cinepak.avi",
            mux_reg, enc_reg,
        };

        let expected_md5: [u32; 4] = [0xd73cb3c7, 0x30d59f90, 0x1d6e0e28, 0x5b72cc0c];
        //test_encoding_to_file(&dec_config, &enc_config, enc_params, &[]);
        test_encoding_md5(&dec_config, &enc_config, enc_params, &[], &expected_md5);
    }
}