core/scale: make sure that yuv2rgb kernel outputs to planar RGB
[nihav.git] / nihav-core / src / scale / colorcvt.rs
1 use super::*;
2 use super::kernel::Kernel;
3
/// Luma weight pairs `[kr, kb]`, one entry per colour matrix kind.
///
/// An entry is handed to `make_rgb2yuv`/`make_yuv2rgb` as `(kr, kb)`.
const YUV_PARAMS: &[[f32; 2]] = &[
    [0.333, 0.333],   // 0: RGB
    [0.2126, 0.0722], // 1: ITU-R BT709
    [0.333, 0.333],   // 2: unspecified
    [0.333, 0.333],   // 3: reserved
    [0.299, 0.114],   // 4: ITU-R BT601
    [0.299, 0.114],   // 5: ITU-R BT470
    [0.299, 0.114],   // 6: SMPTE 170M
    [0.212, 0.087],   // 7: SMPTE 240M
    [0.333, 0.333],   // 8: YCoCg
    [0.2627, 0.0593], // 9: ITU-R BT2020
    [0.2627, 0.0593], // 10: ITU-R BT2020
];

/// Chroma scaling factors `[eu, ev]` consumed by the `apply_pal_*` helpers.
const BT_PAL_COEFFS: [f32; 2] = [0.493, 0.877];

/// 2x2 mixing coefficients consumed by `apply_ntsc_rgb2yiq`:
/// the first pair builds the second matrix row, the last pair the third one.
const SMPTE_NTSC_COEFFS: &[f32; 4] = &[-0.268, 0.7358, 0.4127, 0.4778];
21
22 /*const RGB2YCOCG: [[f32; 3]; 3] = [
23 [ 0.25, 0.5, 0.25 ],
24 [ -0.25, 0.5, -0.25 ],
25 [ 0.5, 0.0, -0.5 ]
26 ];
27 const YCOCG2RGB: [[f32; 3]; 3] = [
28 [ 1.0, -1.0, 1.0 ],
29 [ 1.0, 1.0, 0.0 ],
30 [ 1.0, -1.0, -1.0 ]
31 ];
32
33 const XYZ2RGB: [[f32; 3]; 3] = [
34 [ 0.49, 0.31, 0.2 ],
35 [ 0.17697, 0.8124, 0.01063 ],
36 [ 0.0, 0.01, 0.99 ]
37 ];
38 const RGB2XYZ: [[f32; 3]; 3] = [
39 [ 2.364613, -0.89654, -0.46807 ],
40 [ -0.515167, 1.42641, 0.08876 ],
41 [ 0.0052, -0.01441, 1.00920 ]
42 ];*/
43
/// Fills `mat` with the RGB -> YCbCr matrix for the luma weights `kr` and `kb`.
///
/// Row 0 yields Y, row 1 Cb and row 2 Cr; every element of `mat` is overwritten.
fn make_rgb2yuv(kr: f32, kb: f32, mat: &mut [[f32; 3]; 3]) {
    let kg = 1.0 - kr - kb;
    let cb_norm = 1.0 - kb;
    let cr_norm = 1.0 - kr;

    // Y
    mat[0] = [kr, kg, kb];
    // Cb: the blue weight is pinned to 0.5, the others are scaled to match
    mat[1] = [-kr * 0.5 / cb_norm, -kg * 0.5 / cb_norm, 0.5];
    // Cr: the red weight is pinned to 0.5, the others are scaled to match
    mat[2] = [0.5, -kg * 0.5 / cr_norm, -kb * 0.5 / cr_norm];
}
58
/// Fills `mat` with the YCbCr -> RGB matrix for the luma weights `kr` and `kb`.
///
/// Row 0 yields R, row 1 G and row 2 B from a `(Y, Cb, Cr)` column;
/// every element of `mat` is overwritten.
fn make_yuv2rgb(kr: f32, kb: f32, mat: &mut [[f32; 3]; 3]) {
    let kg = 1.0 - kr - kb;
    let red_from_cr = 2.0 * (1.0 - kr);
    let blue_from_cb = 2.0 * (1.0 - kb);

    *mat = [
        // R
        [1.0, 0.0, red_from_cr],
        // G
        [1.0, -kb * 2.0 * (1.0 - kb) / kg, -kr * 2.0 * (1.0 - kr) / kg],
        // B
        [1.0, blue_from_cb, 0.0],
    ];
}
75
/// Rescales the chroma rows of an RGB -> YCbCr matrix with the factors `eu` and `ev`.
///
/// Row 0 (luma) is only read: its blue and red weights define the gains.
/// Row 1 is scaled for U and row 2 for V.
fn apply_pal_rgb2yuv(eu: f32, ev: f32, mat: &mut [[f32; 3]; 3]) {
    let one_minus_kb = 1.0 - mat[0][2];
    let one_minus_kr = 1.0 - mat[0][0];
    let u_gain = 2.0 * one_minus_kb * eu;
    let v_gain = 2.0 * one_minus_kr * ev;

    // U: the blue weight is set directly, the other two are rescaled
    mat[1] = [mat[1][0] * u_gain, mat[1][1] * u_gain, eu * one_minus_kb];
    // V: the red weight is set directly, the other two are rescaled
    mat[2] = [ev * one_minus_kr, mat[2][1] * v_gain, mat[2][2] * v_gain];
}
89
/// Rescales the chroma columns of a YCbCr -> RGB matrix with the factors `eu` and `ev`.
///
/// Only the four elements R/V, G/U, G/V and B/U are touched; both gains are
/// derived from the matrix values as they are on entry.
fn apply_pal_yuv2rgb(eu: f32, ev: f32, mat: &mut [[f32; 3]; 3]) {
    let u_gain = 1.0 / (mat[2][1] * eu);
    let v_gain = 1.0 / (mat[0][2] * ev);

    // (row, column, gain) for every element that has to be rescaled
    let updates = [
        (0, 2, v_gain), // R
        (1, 1, u_gain), // G
        (1, 2, v_gain),
        (2, 1, u_gain), // B
    ];
    for &(row, col, gain) in updates.iter() {
        mat[row][col] *= gain;
    }
}
102
/// Turns the chroma rows of an RGB -> YCbCr matrix into a mix controlled by `params`.
///
/// Rows 1 and 2 are first rescaled by gains taken from the luma row, then
/// combined: the new row 1 is `params[0] * u + params[1] * v` and the new row 2
/// is `params[2] * u + params[3] * v`. Row 0 is left untouched.
fn apply_ntsc_rgb2yiq(params: &[f32; 4], mat: &mut [[f32; 3]; 3]) {
    let u_gain = 2.0 * (1.0 - mat[0][2]);
    let v_gain = 2.0 * (1.0 - mat[0][0]);
    let [to_i_from_u, to_i_from_v, to_q_from_u, to_q_from_v] = *params;

    // Columns are independent, so scale and mix one column at a time.
    for col in 0..3 {
        let u = mat[1][col] * u_gain;
        let v = mat[2][col] * v_gain;
        mat[1][col] = to_i_from_u * u + to_i_from_v * v;
        mat[2][col] = to_q_from_u * u + to_q_from_v * v;
    }
}
117
/// Returns the signed cofactor of `mat` for the element at row `row`, column `col`.
///
/// The 2x2 determinant is taken over the two remaining rows and columns and
/// negated when `row + col` is odd.
fn subm_det(mat: &[[f32; 3]; 3], col: usize, row: usize) -> f32 {
    // Indices of the two rows/columns left after removing `row`/`col`.
    let row0 = if row == 0 { 1 } else { 0 };
    let row1 = if (row == 1) || (row0 == 1) { 2 } else { 1 };
    let col0 = if col == 0 { 1 } else { 0 };
    let col1 = if (col == 1) || (col0 == 1) { 2 } else { 1 };

    let det = mat[row0][col0] * mat[row1][col1] - mat[row0][col1] * mat[row1][col0];
    if ((col ^ row) & 1) == 0 {
        det
    } else {
        -det
    }
}

/// Replaces `mat` with its inverse, computed as adjugate divided by determinant.
///
/// The sign of the determinant is kept: dividing by its absolute value would
/// return the negated inverse for every matrix with a negative determinant.
/// A singular matrix (zero determinant) produces non-finite elements.
fn invert_matrix(mat: &mut [[f32; 3]; 3]) {
    // `dXY` ends up in `mat[X][Y]`, i.e. it is the cofactor of element (Y, X).
    let d00 = subm_det(mat, 0, 0);
    let d01 = subm_det(mat, 0, 1);
    let d02 = subm_det(mat, 0, 2);
    let d10 = subm_det(mat, 1, 0);
    let d11 = subm_det(mat, 1, 1);
    let d12 = subm_det(mat, 1, 2);
    let d20 = subm_det(mat, 2, 0);
    let d21 = subm_det(mat, 2, 1);
    let d22 = subm_det(mat, 2, 2);
    // Expansion of the determinant along the first row.
    let det = mat[0][0] * d00 + mat[0][1] * d10 + mat[0][2] * d20;
    let inv_det = 1.0 / det;

    *mat = [
        [inv_det * d00, inv_det * d01, inv_det * d02],
        [inv_det * d10, inv_det * d11, inv_det * d12],
        [inv_det * d20, inv_det * d21, inv_det * d22],
    ];
}
154
/// Multiplies `mat` by the column vector `(a, b, c)` and returns the three results.
fn matrix_mul(mat: &[[f32; 3]; 3], a: f32, b: f32, c: f32) -> (f32, f32, f32) {
    let dot = |row: &[f32; 3]| a * row[0] + b * row[1] + c * row[2];
    (dot(&mat[0]), dot(&mat[1]), dot(&mat[2]))
}
160
/// State of the RGB -> YUV conversion kernel.
#[derive(Default)]
struct RgbToYuv {
    /// 3x3 matrix applied to every `(R, G, B)` triple.
    matrix: [[f32; 3]; 3],
}

impl RgbToYuv {
    /// Creates a kernel with an all-zero matrix (the same value as `Default`).
    fn new() -> Self {
        Self { matrix: [[0.0; 3]; 3] }
    }
}
169
170 #[allow(clippy::many_single_char_names)]
171 impl Kernel for RgbToYuv {
172 fn init(&mut self, in_fmt: &ScaleInfo, dest_fmt: &ScaleInfo) -> ScaleResult<NABufferType> {
173 let mut df = dest_fmt.fmt;
174 //todo coeff selection
175 make_rgb2yuv(YUV_PARAMS[2][0], YUV_PARAMS[2][1], &mut self.matrix);
176 if let ColorModel::YUV(yuvsm) = df.get_model() {
177 match yuvsm {
178 YUVSubmodel::YCbCr => {},
179 YUVSubmodel::YIQ => { apply_ntsc_rgb2yiq(SMPTE_NTSC_COEFFS, &mut self.matrix); },
180 YUVSubmodel::YUVJ => { apply_pal_rgb2yuv(BT_PAL_COEFFS[0], BT_PAL_COEFFS[1], &mut self.matrix); },
181 };
182 } else {
183 return Err(ScaleError::InvalidArgument);
184 }
185 for i in 0..MAX_CHROMATONS {
186 if let Some(ref mut chr) = df.comp_info[i] {
187 chr.packed = false;
188 chr.comp_offs = i as u8;
189 chr.h_ss = 0;
190 chr.v_ss = 0;
191 }
192 }
193 println!(" [intermediate format {}]", df);
194 let res = alloc_video_buffer(NAVideoInfo::new(in_fmt.width, in_fmt.height, false, df), 3);
195 if res.is_err() { return Err(ScaleError::AllocError); }
196 Ok(res.unwrap())
197 }
198 fn process(&mut self, pic_in: &NABufferType, pic_out: &mut NABufferType) {
199 if let (Some(ref sbuf), Some(ref mut dbuf)) = (pic_in.get_vbuf(), pic_out.get_vbuf()) {
200 if dbuf.get_info().get_format().get_num_comp() < 3 {
201 return self.process_grayscale(sbuf, dbuf);
202 }
203 let istrides = [sbuf.get_stride(0), sbuf.get_stride(1), sbuf.get_stride(2)];
204 let dstrides = [dbuf.get_stride(0), dbuf.get_stride(1), dbuf.get_stride(2)];
205 let (w, h) = sbuf.get_dimensions(0);
206
207 let mut roff = sbuf.get_offset(0);
208 let mut goff = sbuf.get_offset(1);
209 let mut boff = sbuf.get_offset(2);
210 let mut yoff = dbuf.get_offset(0);
211 let mut uoff = dbuf.get_offset(1);
212 let mut voff = dbuf.get_offset(2);
213 let src = sbuf.get_data();
214 let dst = dbuf.get_data_mut().unwrap();
215 for _y in 0..h {
216 for x in 0..w {
217 let r = f32::from(src[roff + x]);
218 let g = f32::from(src[goff + x]);
219 let b = f32::from(src[boff + x]);
220 let (y, u, v) = matrix_mul(&self.matrix, r, g, b);
221
222 dst[yoff + x] = (y as i16).max(0).min(255) as u8;
223 dst[uoff + x] = ((u as i16).max(-128).min(128) + 128) as u8;
224 dst[voff + x] = ((v as i16).max(-128).min(128) + 128) as u8;
225 }
226 roff += istrides[0];
227 goff += istrides[1];
228 boff += istrides[2];
229 yoff += dstrides[0];
230 uoff += dstrides[1];
231 voff += dstrides[2];
232 }
233 }
234 }
235 }
236
237 impl RgbToYuv {
238 fn process_grayscale(&self, sbuf: &NAVideoBuffer<u8>, dbuf: &mut NAVideoBuffer<u8>) {
239 let istrides = [sbuf.get_stride(0), sbuf.get_stride(1), sbuf.get_stride(2)];
240 let ystride = dbuf.get_stride(0);
241 let (w, h) = sbuf.get_dimensions(0);
242
243 let mut roff = sbuf.get_offset(0);
244 let mut goff = sbuf.get_offset(1);
245 let mut boff = sbuf.get_offset(2);
246 let mut yoff = dbuf.get_offset(0);
247 let src = sbuf.get_data();
248 let dst = dbuf.get_data_mut().unwrap();
249 for _y in 0..h {
250 for x in 0..w {
251 let r = f32::from(src[roff + x]);
252 let g = f32::from(src[goff + x]);
253 let b = f32::from(src[boff + x]);
254 let (y, _u, _v) = matrix_mul(&self.matrix, r, g, b);
255
256 dst[yoff + x] = (y as i16).max(0).min(255) as u8;
257 }
258 roff += istrides[0];
259 goff += istrides[1];
260 boff += istrides[2];
261 yoff += ystride;
262 }
263 }
264 }
265
266 pub fn create_rgb2yuv() -> Box<dyn Kernel> {
267 Box::new(RgbToYuv::new())
268 }
269
/// State of the YUV -> RGB conversion kernel.
#[derive(Default)]
struct YuvToRgb {
    /// 3x3 matrix applied to every `(Y, U, V)` triple on the floating-point path.
    matrix: [[f32; 3]; 3],
    /// Luma lookup table indexed by the 8-bit sample; empty when tables are not in use.
    yscale: Vec<i16>,
    /// Red contribution indexed by the second chroma sample.
    r_chr: Vec<i16>,
    /// Green contribution indexed by the first chroma sample.
    g_u: Vec<i16>,
    /// Green contribution indexed by the second chroma sample.
    g_v: Vec<i16>,
    /// Blue contribution indexed by the first chroma sample.
    b_chr: Vec<i16>,
}

impl YuvToRgb {
    /// Creates a kernel with a zero matrix and empty tables (the same value as `Default`).
    fn new() -> Self {
        Self {
            matrix: [[0.0; 3]; 3],
            yscale: Vec::new(),
            r_chr: Vec::new(),
            g_u: Vec::new(),
            g_v: Vec::new(),
            b_chr: Vec::new(),
        }
    }
}
283
284 #[allow(clippy::many_single_char_names)]
285 impl Kernel for YuvToRgb {
286 fn init(&mut self, in_fmt: &ScaleInfo, dest_fmt: &ScaleInfo) -> ScaleResult<NABufferType> {
287 let mut df = dest_fmt.fmt;
288 df.palette = false;
289 if !df.is_unpacked() || df.get_max_depth() != 8 || df.get_total_depth() != df.get_num_comp() as u8 * 8 {
290 df = NAPixelFormaton {
291 model: ColorModel::RGB(RGBSubmodel::RGB), components: 3,
292 comp_info: [
293 Some(NAPixelChromaton{ h_ss: 0, v_ss: 0, packed: false, depth: 8, shift: 0, comp_offs: 0, next_elem: 1 }),
294 Some(NAPixelChromaton{ h_ss: 0, v_ss: 0, packed: false, depth: 8, shift: 0, comp_offs: 1, next_elem: 1 }),
295 Some(NAPixelChromaton{ h_ss: 0, v_ss: 0, packed: false, depth: 8, shift: 0, comp_offs: 2, next_elem: 1 }),
296 None, None],
297 elem_size: 3, be: false, alpha: false, palette: false };
298 if in_fmt.fmt.alpha && dest_fmt.fmt.alpha {
299 df.alpha = true;
300 df.components = 4;
301 df.comp_info[3] = Some(NAPixelChromaton{ h_ss: 0, v_ss: 0, packed: false, depth: 8, shift: 0, comp_offs: 3, next_elem: 1 });
302 }
303 }
304 //todo coeff selection
305 make_yuv2rgb(YUV_PARAMS[2][0], YUV_PARAMS[2][1], &mut self.matrix);
306 if let ColorModel::YUV(yuvsm) = in_fmt.fmt.get_model() {
307 match yuvsm {
308 YUVSubmodel::YCbCr => {},
309 YUVSubmodel::YIQ => {
310 make_rgb2yuv(YUV_PARAMS[2][0], YUV_PARAMS[2][1], &mut self.matrix);
311 apply_ntsc_rgb2yiq(SMPTE_NTSC_COEFFS, &mut self.matrix);
312 invert_matrix(&mut self.matrix);
313 },
314 YUVSubmodel::YUVJ => {
315 apply_pal_yuv2rgb(BT_PAL_COEFFS[0], BT_PAL_COEFFS[1], &mut self.matrix);
316 },
317 };
318 if yuvsm != YUVSubmodel::YIQ {
319 self.yscale = Vec::with_capacity(256);
320 self.r_chr = Vec::with_capacity(256);
321 self.g_u = Vec::with_capacity(256);
322 self.g_v = Vec::with_capacity(256);
323 self.b_chr = Vec::with_capacity(256);
324 for i in 0..256 {
325 let yval = i as i16; // todo limited range as well
326 self.yscale.push(yval);
327 let rval = (((i as f32) - 128.0) * self.matrix[0][2]) as i16;
328 self.r_chr.push(rval);
329 let uval = (((i as f32) - 128.0) * self.matrix[1][1]) as i16;
330 self.g_u.push(uval);
331 let vval = (((i as f32) - 128.0) * self.matrix[1][2]) as i16;
332 self.g_v.push(vval);
333 let bval = (((i as f32) - 128.0) * self.matrix[2][1]) as i16;
334 self.b_chr.push(bval);
335 }
336 }
337 } else {
338 return Err(ScaleError::InvalidArgument);
339 }
340 for i in 0..MAX_CHROMATONS {
341 if let Some(ref mut chr) = df.comp_info[i] {
342 chr.packed = false;
343 chr.comp_offs = i as u8;
344 }
345 }
346 println!(" [intermediate format {}]", df);
347 let res = alloc_video_buffer(NAVideoInfo::new(in_fmt.width, in_fmt.height, false, df), 3);
348 if res.is_err() { return Err(ScaleError::AllocError); }
349 Ok(res.unwrap())
350 }
351 fn process(&mut self, pic_in: &NABufferType, pic_out: &mut NABufferType) {
352 if let (Some(ref sbuf), Some(ref mut dbuf)) = (pic_in.get_vbuf(), pic_out.get_vbuf()) {
353 let istrides = [sbuf.get_stride(0), sbuf.get_stride(1), sbuf.get_stride(2)];
354 let dstrides = [dbuf.get_stride(0), dbuf.get_stride(1), dbuf.get_stride(2)];
355 let (w, h) = sbuf.get_dimensions(0);
356 if sbuf.get_info().get_format().get_num_comp() < 3 {
357 return self.process_grayscale(sbuf, dbuf);
358 }
359 let (sv0, sh0) = sbuf.get_info().get_format().get_chromaton(1).unwrap().get_subsampling();
360 let (sv1, sh1) = sbuf.get_info().get_format().get_chromaton(2).unwrap().get_subsampling();
361
362 let uhmask = (1 << sh0) - 1;
363 let vhmask = (1 << sh1) - 1;
364 let mut roff = dbuf.get_offset(0);
365 let mut goff = dbuf.get_offset(1);
366 let mut boff = dbuf.get_offset(2);
367 let mut yoff = sbuf.get_offset(0);
368 let mut uoff = sbuf.get_offset(1);
369 let mut voff = sbuf.get_offset(2);
370 let src = sbuf.get_data();
371 let dst = dbuf.get_data_mut().unwrap();
372 if self.yscale.len() > 0 {
373 for y in 0..h {
374 for x in 0..w {
375 let y = self.yscale[src[yoff + x] as usize];
376 let u = src[uoff + (x >> sv0)] as usize;
377 let v = src[voff + (x >> sv1)] as usize;
378 let r = y + self.r_chr[v];
379 let g = y + self.g_u[u] + self.g_v[v];
380 let b = y + self.b_chr[u];
381 dst[roff + x] = r.max(0).min(255) as u8;
382 dst[goff + x] = g.max(0).min(255) as u8;
383 dst[boff + x] = b.max(0).min(255) as u8;
384 }
385 roff += dstrides[0];
386 goff += dstrides[1];
387 boff += dstrides[2];
388 yoff += istrides[0];
389 if (y & uhmask) == uhmask {
390 uoff += istrides[1];
391 }
392 if (y & vhmask) == vhmask {
393 voff += istrides[2];
394 }
395 }
396 return;
397 }
398 for y in 0..h {
399 for x in 0..w {
400 let y = f32::from(src[yoff + x]);
401 let u = f32::from(i16::from(src[uoff + (x >> sv0)]) - 128);
402 let v = f32::from(i16::from(src[voff + (x >> sv1)]) - 128);
403
404 let (r, g, b) = matrix_mul(&self.matrix, y, u, v);
405 dst[roff + x] = (r as i16).max(0).min(255) as u8;
406 dst[goff + x] = (g as i16).max(0).min(255) as u8;
407 dst[boff + x] = (b as i16).max(0).min(255) as u8;
408 }
409 roff += dstrides[0];
410 goff += dstrides[1];
411 boff += dstrides[2];
412 yoff += istrides[0];
413 if (y & uhmask) == uhmask {
414 uoff += istrides[1];
415 }
416 if (y & vhmask) == vhmask {
417 voff += istrides[2];
418 }
419 }
420 }
421 }
422 }
423
424 impl YuvToRgb {
425 fn process_grayscale(&self, sbuf: &NAVideoBuffer<u8>, dbuf: &mut NAVideoBuffer<u8>) {
426 let ystride = sbuf.get_stride(0);
427 let dstrides = [dbuf.get_stride(0), dbuf.get_stride(1), dbuf.get_stride(2)];
428 let (w, h) = sbuf.get_dimensions(0);
429 let mut roff = dbuf.get_offset(0);
430 let mut goff = dbuf.get_offset(1);
431 let mut boff = dbuf.get_offset(2);
432 let mut yoff = sbuf.get_offset(0);
433 let src = sbuf.get_data();
434 let dst = dbuf.get_data_mut().unwrap();
435 if self.yscale.len() > 0 {
436 for _y in 0..h {
437 for x in 0..w {
438 let y = self.yscale[src[yoff + x] as usize];
439 let r = y + self.r_chr[128];
440 let g = y + self.g_u[128] + self.g_v[128];
441 let b = y + self.b_chr[128];
442 dst[roff + x] = r.max(0).min(255) as u8;
443 dst[goff + x] = g.max(0).min(255) as u8;
444 dst[boff + x] = b.max(0).min(255) as u8;
445 }
446 roff += dstrides[0];
447 goff += dstrides[1];
448 boff += dstrides[2];
449 yoff += ystride;
450 }
451 } else {
452 for _y in 0..h {
453 for x in 0..w {
454 let y = f32::from(src[yoff + x]);
455 let (r, g, b) = matrix_mul(&self.matrix, y, 0.0, 0.0);
456 dst[roff + x] = (r as i16).max(0).min(255) as u8;
457 dst[goff + x] = (g as i16).max(0).min(255) as u8;
458 dst[boff + x] = (b as i16).max(0).min(255) as u8;
459 }
460 roff += dstrides[0];
461 goff += dstrides[1];
462 boff += dstrides[2];
463 yoff += ystride;
464 }
465 }
466 }
467 }
468
469 pub fn create_yuv2rgb() -> Box<dyn Kernel> {
470 Box::new(YuvToRgb::new())
471 }