cac264b8c51301060a45e860085799f26a19ceed
[nihav.git] / nihav-duck / src / codecs / vpcommon.rs
1 use nihav_core::codecs::*;
2
/// Macroblock coding modes shared by the VP-family decoders.
///
/// The variants fall into three groups, which is exactly what
/// `VPMBType::get_ref_id` reports: `Intra`, the `Inter*` modes and the
/// `Golden*` modes.
///
/// The type is a plain field-less enum, so equality is total and `Eq` is
/// derived alongside `PartialEq`.
// NOTE(review): the per-variant motion vector semantics (no MV, explicit MV,
// nearest, near, four MVs) are inferred from the variant names only; confirm
// against the decoders that consume this type.
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
#[allow(dead_code)]
pub enum VPMBType {
    Intra,
    InterNoMV,
    InterMV,
    InterNearest,
    InterNear,
    InterFourMV,
    GoldenNoMV,
    GoldenMV,
    GoldenNearest,
    GoldenNear,
}
17
18 #[allow(dead_code)]
19 impl VPMBType {
20 pub fn is_intra(self) -> bool { self == VPMBType::Intra }
21 pub fn get_ref_id(self) -> u8 {
22 match self {
23 VPMBType::Intra => 0,
24 VPMBType::InterNoMV |
25 VPMBType::InterMV |
26 VPMBType::InterNearest |
27 VPMBType::InterNear |
28 VPMBType::InterFourMV => 1,
29 _ => 2,
30 }
31 }
32 }
33
34 impl Default for VPMBType {
35 fn default() -> Self { VPMBType::Intra }
36 }
37
38 #[derive(Default)]
39 pub struct VPShuffler {
40 lastframe: Option<NAVideoBufferRef<u8>>,
41 goldframe: Option<NAVideoBufferRef<u8>>,
42 }
43
44 impl VPShuffler {
45 pub fn new() -> Self { VPShuffler { lastframe: None, goldframe: None } }
46 pub fn clear(&mut self) { self.lastframe = None; self.goldframe = None; }
47 pub fn add_frame(&mut self, buf: NAVideoBufferRef<u8>) {
48 self.lastframe = Some(buf);
49 }
50 pub fn add_golden_frame(&mut self, buf: NAVideoBufferRef<u8>) {
51 self.goldframe = Some(buf);
52 }
53 pub fn get_last(&mut self) -> Option<NAVideoBufferRef<u8>> {
54 if let Some(ref frm) = self.lastframe {
55 Some(frm.clone())
56 } else {
57 None
58 }
59 }
60 pub fn get_golden(&mut self) -> Option<NAVideoBufferRef<u8>> {
61 if let Some(ref frm) = self.goldframe {
62 Some(frm.clone())
63 } else {
64 None
65 }
66 }
67 }
68
// IDCT multipliers: `CkS(8-k)` is cos(k * pi / 16) (equivalently
// sin((8 - k) * pi / 16)) scaled by 65536 and rounded to the nearest integer.
// They are meant to be used with `mul16`, which drops the 16 fractional bits.

/// cos(1 * pi / 16) * 65536
const C1S7: i32 = 64277;
/// cos(2 * pi / 16) * 65536
const C2S6: i32 = 60547;
/// cos(3 * pi / 16) * 65536
const C3S5: i32 = 54491;
/// cos(4 * pi / 16) * 65536
const C4S4: i32 = 46341;
/// cos(5 * pi / 16) * 65536
const C5S3: i32 = 36410;
/// cos(6 * pi / 16) * 65536
const C6S2: i32 = 25080;
/// cos(7 * pi / 16) * 65536
const C7S1: i32 = 12785;
76
/// Multiplies two 32-bit values and drops the low 16 bits of the product
/// (arithmetic shift, so negative products round towards negative infinity).
///
/// The multiplication wraps on overflow instead of panicking: the second IDCT
/// pass feeds intermediate values that are no longer limited to the `i16`
/// range, and a plain `a * b` would abort debug builds on such input while
/// silently wrapping in release builds. Wrapping explicitly gives the same
/// result in both build modes and matches `unquant`, which also wraps.
fn mul16(a: i32, b: i32) -> i32 {
    a.wrapping_mul(b) >> 16
}
80
/// One 8-point inverse DCT butterfly.
///
/// * `$s0..$s7` - input expressions (any integer type convertible to `i32`
///   with `i32::from`); some of them are evaluated more than once.
/// * `$d0..$d7` - output places; each receives one result cast to `$otype`.
/// * `$bias`    - value added to the even part before the final shift
///   (rounding term).
/// * `$shift`   - right shift applied to every output.
/// * `$otype`   - type the outputs are cast to with `as`.
///
/// The macro expands to a sequence of statements and relies on `mul16` and the
/// `CkSn` constants being in scope at the call site.
macro_rules! idct_step {
    ($s0:expr, $s1:expr, $s2:expr, $s3:expr, $s4:expr, $s5:expr, $s6:expr, $s7:expr,
     $d0:expr, $d1:expr, $d2:expr, $d3:expr, $d4:expr, $d5:expr, $d6:expr, $d7:expr,
     $bias:expr, $shift:expr, $otype:ty) => {
        // Odd part: inputs 1, 7, 3 and 5.
        let t_a = mul16(C1S7, i32::from($s1)) + mul16(C7S1, i32::from($s7));
        let t_b = mul16(C7S1, i32::from($s1)) - mul16(C1S7, i32::from($s7));
        let t_c = mul16(C3S5, i32::from($s3)) + mul16(C5S3, i32::from($s5));
        let t_d = mul16(C3S5, i32::from($s5)) - mul16(C5S3, i32::from($s3));
        let t_a1 = mul16(C4S4, t_a - t_c);
        let t_b1 = mul16(C4S4, t_b - t_d);
        let t_c = t_a + t_c;
        let t_d = t_b + t_d;
        // Even part: inputs 0, 4, 2 and 6.
        // Widen *before* adding/subtracting: with `i16` sources the sum or
        // difference of two coefficients does not always fit into `i16`.
        let t_e = mul16(C4S4, i32::from($s0) + i32::from($s4)) + $bias;
        let t_f = mul16(C4S4, i32::from($s0) - i32::from($s4)) + $bias;
        let t_g = mul16(C2S6, i32::from($s2)) + mul16(C6S2, i32::from($s6));
        let t_h = mul16(C6S2, i32::from($s2)) - mul16(C2S6, i32::from($s6));
        let t_e1 = t_e - t_g;
        let t_g = t_e + t_g;
        let t_a = t_f + t_a1;
        let t_f = t_f - t_a1;
        let t_b = t_b1 - t_h;
        let t_h = t_b1 + t_h;

        // Final butterflies combining the even and odd parts.
        $d0 = ((t_g + t_c) >> $shift) as $otype;
        $d7 = ((t_g - t_c) >> $shift) as $otype;
        $d1 = ((t_a + t_h) >> $shift) as $otype;
        $d2 = ((t_a - t_h) >> $shift) as $otype;
        $d3 = ((t_e1 + t_d) >> $shift) as $otype;
        $d4 = ((t_e1 - t_d) >> $shift) as $otype;
        $d5 = ((t_f + t_b) >> $shift) as $otype;
        $d6 = ((t_f - t_b) >> $shift) as $otype;
    }
}
114
115 pub fn vp_idct(coeffs: &mut [i16; 64]) {
116 let mut tmp = [0i32; 64];
117 for (src, dst) in coeffs.chunks(8).zip(tmp.chunks_mut(8)) {
118 idct_step!(src[0], src[1], src[2], src[3], src[4], src[5], src[6], src[7],
119 dst[0], dst[1], dst[2], dst[3], dst[4], dst[5], dst[6], dst[7], 0, 0, i32);
120 }
121 let src = &tmp;
122 let dst = coeffs;
123 for i in 0..8 {
124 idct_step!(src[0 * 8 + i], src[1 * 8 + i], src[2 * 8 + i], src[3 * 8 + i],
125 src[4 * 8 + i], src[5 * 8 + i], src[6 * 8 + i], src[7 * 8 + i],
126 dst[0 * 8 + i], dst[1 * 8 + i], dst[2 * 8 + i], dst[3 * 8 + i],
127 dst[4 * 8 + i], dst[5 * 8 + i], dst[6 * 8 + i], dst[7 * 8 + i], 8, 4, i16);
128 }
129 }
130
131 pub fn vp_idct_dc(coeffs: &mut [i16; 64]) {
132 let dc = ((mul16(C4S4, mul16(C4S4, i32::from(coeffs[0]))) + 8) >> 4) as i16;
133 for i in 0..64 {
134 coeffs[i] = dc;
135 }
136 }
137
/// Dequantises the AC coefficients in place.
///
/// Every coefficient except the first one (`coeffs[0]` is left untouched) is
/// multiplied by the entry of `qmat` at the same index; the multiplication
/// wraps on `i16` overflow.
pub fn unquant(coeffs: &mut [i16; 64], qmat: &[i16; 64]) {
    for (coef, &quant) in coeffs.iter_mut().zip(qmat.iter()).skip(1) {
        *coef = (*coef).wrapping_mul(quant);
    }
}
143
144 pub fn vp_put_block(coeffs: &mut [i16; 64], bx: usize, by: usize, plane: usize, frm: &mut NASimpleVideoFrame<u8>) {
145 vp_idct(coeffs);
146 let mut off = frm.offset[plane] + bx * 8 + by * 8 * frm.stride[plane];
147 for y in 0..8 {
148 for x in 0..8 {
149 frm.data[off + x] = (coeffs[x + y * 8] + 128).min(255).max(0) as u8;
150 }
151 off += frm.stride[plane];
152 }
153 }
154
155 pub fn vp_put_block_dc(coeffs: &mut [i16; 64], bx: usize, by: usize, plane: usize, frm: &mut NASimpleVideoFrame<u8>) {
156 vp_idct_dc(coeffs);
157 let dc = (coeffs[0] + 128).min(255).max(0) as u8;
158 let mut off = frm.offset[plane] + bx * 8 + by * 8 * frm.stride[plane];
159 for _ in 0..8 {
160 for x in 0..8 {
161 frm.data[off + x] = dc;
162 }
163 off += frm.stride[plane];
164 }
165 }
166
167 pub fn vp_add_block(coeffs: &mut [i16; 64], bx: usize, by: usize, plane: usize, frm: &mut NASimpleVideoFrame<u8>) {
168 vp_idct(coeffs);
169 let mut off = frm.offset[plane] + bx * 8 + by * 8 * frm.stride[plane];
170 for y in 0..8 {
171 for x in 0..8 {
172 frm.data[off + x] = (coeffs[x + y * 8] + (frm.data[off + x] as i16)).min(255).max(0) as u8;
173 }
174 off += frm.stride[plane];
175 }
176 }
177
178 pub fn vp_add_block_dc(coeffs: &mut [i16; 64], bx: usize, by: usize, plane: usize, frm: &mut NASimpleVideoFrame<u8>) {
179 vp_idct_dc(coeffs);
180 let dc = coeffs[0];
181 let mut off = frm.offset[plane] + bx * 8 + by * 8 * frm.stride[plane];
182 for _ in 0..8 {
183 for x in 0..8 {
184 frm.data[off + x] = (dc + (frm.data[off + x] as i16)).min(255).max(0) as u8;
185 }
186 off += frm.stride[plane];
187 }
188 }