1 /*
2 * software YUV to RGB converter
3 *
4 * Copyright (C) 2009 Konstantin Shishkov
5 *
6 * 1,4,8bpp support and context / deglobalize stuff
7 * by Michael Niedermayer (michaelni@gmx.at)
8 *
9 * This file is part of FFmpeg.
10 *
11 * FFmpeg is free software; you can redistribute it and/or
12 * modify it under the terms of the GNU Lesser General Public
13 * License as published by the Free Software Foundation; either
14 * version 2.1 of the License, or (at your option) any later version.
15 *
16 * FFmpeg is distributed in the hope that it will be useful,
17 * but WITHOUT ANY WARRANTY; without even the implied warranty of
18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
19 * Lesser General Public License for more details.
20 *
21 * You should have received a copy of the GNU Lesser General Public
22 * License along with FFmpeg; if not, write to the Free Software
23 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
24 */
25
26 #include <stdio.h>
27 #include <stdlib.h>
28 #include <inttypes.h>
29
32 #include "config.h"
37
39 { 117504, 138453, 13954, 34903 }, /* no sequence_display_extension */
40 { 117504, 138453, 13954, 34903 }, /* ITU-R Rec. 709 (1990) */
41 { 104597, 132201, 25675, 53279 }, /* unspecified */
42 { 104597, 132201, 25675, 53279 }, /* reserved */
43 { 104448, 132798, 24759, 53109 }, /* FCC */
44 { 104597, 132201, 25675, 53279 }, /* ITU-R Rec. 624-4 System B, G */
45 { 104597, 132201, 25675, 53279 }, /* SMPTE 170M */
46 { 117579, 136230, 16907, 35559 } /* SMPTE 240M (1987) */
47 };
48
50 {
51 if (colorspace > 7 || colorspace < 0)
54 }
55
/*
 * Load the chroma sample pair at index i and select the lookup tables used
 * by the PUTRGB* macros.
 *
 * Reads pu[i] and pv[i] into U and V, then points r, g and b at the entries
 * of c->table_rV, c->table_gU (+ c->table_gV offset) and c->table_bU selected
 * by those values, biased by YUVRGB_TABLE_HEADROOM.
 *
 * The expansion site must have c, pu, pv, U, V, r, g and b in scope.
 * The argument is parenthesized and the body is a single statement, so the
 * macro is safe with expression arguments and inside unbraced if/else.
 */
#define LOADCHROMA(i)                                                     \
    do {                                                                  \
        U = pu[(i)];                                                      \
        V = pv[(i)];                                                      \
        r = (void *)c->table_rV[V + YUVRGB_TABLE_HEADROOM];               \
        g = (void *)(c->table_gU[U + YUVRGB_TABLE_HEADROOM] +             \
                     c->table_gV[V + YUVRGB_TABLE_HEADROOM]);             \
        b = (void *)c->table_bU[U + YUVRGB_TABLE_HEADROOM];               \
    } while (0)
62
/*
 * Emit two packed pixels for chroma position i.
 *
 * For each of the luma samples src[2*i] and src[2*i + 1], stores the sum of
 * the r, g and b table entries for that luma value into dst at the same
 * index. Y is used as scratch; r, g, b and Y must be in scope (r, g, b are
 * the tables selected by LOADCHROMA).
 *
 * Arguments are parenthesized so that an expression such as `0 + 1` indexes
 * correctly, and the body is one statement.
 */
#define PUTRGB(dst, src, i)                                 \
    do {                                                    \
        Y                    = (src)[2 * (i)];              \
        (dst)[2 * (i)]       = r[Y] + g[Y] + b[Y];          \
        Y                    = (src)[2 * (i) + 1];          \
        (dst)[2 * (i) + 1]   = r[Y] + g[Y] + b[Y];          \
    } while (0)
68
/*
 * Emit two 3-byte pixels in R, G, B byte order for chroma position i.
 *
 * The luma samples src[2*i] and src[2*i + 1] index the r, g and b tables;
 * the results go to dst[6*i + 0..2] and dst[6*i + 3..5] respectively.
 * Y is scratch; r, g, b and Y must be in scope.
 */
#define PUTRGB24(dst, src, i)                   \
    do {                                        \
        Y                  = (src)[2 * (i)];    \
        (dst)[6 * (i) + 0] = r[Y];              \
        (dst)[6 * (i) + 1] = g[Y];              \
        (dst)[6 * (i) + 2] = b[Y];              \
        Y                  = (src)[2 * (i) + 1];\
        (dst)[6 * (i) + 3] = r[Y];              \
        (dst)[6 * (i) + 4] = g[Y];              \
        (dst)[6 * (i) + 5] = b[Y];              \
    } while (0)
78
/*
 * Emit two 3-byte pixels in B, G, R byte order for chroma position i.
 *
 * Same as the RGB24 variant with the first and third byte swapped: the luma
 * samples src[2*i] and src[2*i + 1] index the b, g and r tables and the
 * results go to dst[6*i + 0..2] and dst[6*i + 3..5].
 * Y is scratch; r, g, b and Y must be in scope.
 */
#define PUTBGR24(dst, src, i)                   \
    do {                                        \
        Y                  = (src)[2 * (i)];    \
        (dst)[6 * (i) + 0] = b[Y];              \
        (dst)[6 * (i) + 1] = g[Y];              \
        (dst)[6 * (i) + 2] = r[Y];              \
        Y                  = (src)[2 * (i) + 1];\
        (dst)[6 * (i) + 3] = b[Y];              \
        (dst)[6 * (i) + 4] = g[Y];              \
        (dst)[6 * (i) + 5] = r[Y];              \
    } while (0)
88
/*
 * Emit two packed pixels with alpha for chroma position i.
 *
 * For each of the luma samples ysrc[2*i] and ysrc[2*i + 1], stores the sum
 * of the r, g and b table entries plus the matching alpha sample from asrc
 * shifted left by s bits.
 * Y is scratch; r, g, b and Y must be in scope.
 *
 * The alpha sample is widened to uint32_t before shifting: an 8-bit value
 * promotes to signed int, and shifting 128..255 left by 24 would overflow
 * it, which is undefined behaviour.
 */
#define PUTRGBA(dst, ysrc, asrc, i, s)                                        \
    do {                                                                      \
        Y                  = (ysrc)[2 * (i)];                                 \
        (dst)[2 * (i)]     = r[Y] + g[Y] + b[Y] +                             \
                             ((uint32_t)(asrc)[2 * (i)] << (s));              \
        Y                  = (ysrc)[2 * (i) + 1];                             \
        (dst)[2 * (i) + 1] = r[Y] + g[Y] + b[Y] +                             \
                             ((uint32_t)(asrc)[2 * (i) + 1] << (s));          \
    } while (0)
94
/*
 * Emit two 6-byte pixels in R, G, B component order for chroma position i.
 *
 * Each 8-bit table value is written to two consecutive bytes, so every
 * component occupies two bytes holding the same value. The luma samples
 * src[2*i] and src[2*i + 1] fill dst[12*i + 0..5] and dst[12*i + 6..11].
 * Y is scratch; r, g, b and Y must be in scope.
 */
#define PUTRGB48(dst, src, i)                                       \
    do {                                                            \
        Y                    = (src)[2 * (i)];                      \
        (dst)[12 * (i) +  0] = (dst)[12 * (i) +  1] = r[Y];         \
        (dst)[12 * (i) +  2] = (dst)[12 * (i) +  3] = g[Y];         \
        (dst)[12 * (i) +  4] = (dst)[12 * (i) +  5] = b[Y];         \
        Y                    = (src)[2 * (i) + 1];                  \
        (dst)[12 * (i) +  6] = (dst)[12 * (i) +  7] = r[Y];         \
        (dst)[12 * (i) +  8] = (dst)[12 * (i) +  9] = g[Y];         \
        (dst)[12 * (i) + 10] = (dst)[12 * (i) + 11] = b[Y];         \
    } while (0)
104
/*
 * Emit two 6-byte pixels in B, G, R component order for chroma position i.
 *
 * Each 8-bit table value is written to two consecutive bytes, so every
 * component occupies two bytes holding the same value. The luma samples
 * src[2*i] and src[2*i + 1] fill dst[12*i + 0..5] and dst[12*i + 6..11].
 * Y is scratch; r, g, b and Y must be in scope.
 */
#define PUTBGR48(dst, src, i)                                       \
    do {                                                            \
        Y                    = (src)[2 * (i)];                      \
        (dst)[12 * (i) +  0] = (dst)[12 * (i) +  1] = b[Y];         \
        (dst)[12 * (i) +  2] = (dst)[12 * (i) +  3] = g[Y];         \
        (dst)[12 * (i) +  4] = (dst)[12 * (i) +  5] = r[Y];         \
        Y                    = (src)[2 * (i) + 1];                  \
        (dst)[12 * (i) +  6] = (dst)[12 * (i) +  7] = b[Y];         \
        (dst)[12 * (i) +  8] = (dst)[12 * (i) +  9] = g[Y];         \
        (dst)[12 * (i) + 10] = (dst)[12 * (i) + 11] = r[Y];         \
    } while (0)
114
/*
 * Opening half of a generated converter function.
 *
 * Expands to the header of `static int func_name(SwsContext *c, src,
 * srcStride, srcSliceY, srcSliceH, dst, dstStride)` and the start of its
 * body, and deliberately leaves three scopes open: the function body, the
 * `for` loop over rows (two source rows per iteration) and the
 * `while (h_size--)` loop, where h_size is c->dstW >> 3. The matching
 * closing braces are supplied by the ENDYUV2RGBLINE / ENDYUV2RGBFUNC macros.
 *
 * func_name - name of the function to define
 * dst_type  - element type used for the dst_1/dst_2 row pointers and for
 *             the r/g/b table pointers
 * alpha     - when non-zero, pa_1/pa_2 are set up from src[3]/srcStride[3]
 *
 * Notes taken from the body:
 *  - when alpha is 0 and c->srcFormat is AV_PIX_FMT_YUV422P, srcStride[1]
 *    and srcStride[2] are doubled in place (the caller's array is modified);
 *  - dst_1/dst_2 address output rows (y + srcSliceY) and (y + srcSliceY + 1);
 *    py_1/py_2 address luma rows y and y + 1; pu/pv use row (y >> 1);
 *  - U, V and Y are declared inside the inner loop as scratch for the
 *    LOADCHROMA / PUTRGB* macros.
 */
115 #define YUV2RGBFUNC(func_name, dst_type, alpha) \
116 static int func_name(SwsContext *c, const uint8_t *src[], \
117 int srcStride[], int srcSliceY, int srcSliceH, \
118 uint8_t *dst[], int dstStride[]) \
119 { \
120 int y; \
121 \
122 if (!alpha && c->srcFormat == AV_PIX_FMT_YUV422P) { \
123 srcStride[1] *= 2; \
124 srcStride[2] *= 2; \
125 } \
126 for (y = 0; y < srcSliceH; y += 2) { \
127 dst_type *dst_1 = \
128 (dst_type *)(dst[0] + (y + srcSliceY) * dstStride[0]); \
129 dst_type *dst_2 = \
130 (dst_type *)(dst[0] + (y + srcSliceY + 1) * dstStride[0]); \
131 dst_type av_unused *r, *g, *b; \
132 const uint8_t *py_1 = src[0] + y * srcStride[0]; \
133 const uint8_t *py_2 = py_1 + srcStride[0]; \
134 const uint8_t *pu = src[1] + (y >> 1) * srcStride[1]; \
135 const uint8_t *pv = src[2] + (y >> 1) * srcStride[2]; \
136 const uint8_t av_unused *pa_1, *pa_2; \
137 unsigned int h_size = c->dstW >> 3; \
138 if (alpha) { \
139 pa_1 = src[3] + y * srcStride[3]; \
140 pa_2 = pa_1 + srcStride[3]; \
141 } \
142 while (h_size--) { \
143 int av_unused U, V, Y; \
144
/*
 * End of the inner `while (h_size--)` loop body opened by YUV2RGBFUNC.
 *
 * Advances the chroma pointers by 4 >> ss, the luma pointers by 8 >> ss and
 * both destination row pointers by dst_delta >> ss, closes the while loop,
 * then opens an `if (c->dstW & (4 >> ss))` block with fresh Y/U/V scratch
 * variables. That `if` block is left open for the code that follows.
 *
 * dst_delta - destination advance, in dst_type elements, before the shift
 * ss        - right-shift applied to every advance and to the width test
 */
145 #define ENDYUV2RGBLINE(dst_delta, ss) \
146 pu += 4 >> ss; \
147 pv += 4 >> ss; \
148 py_1 += 8 >> ss; \
149 py_2 += 8 >> ss; \
150 dst_1 += dst_delta >> ss; \
151 dst_2 += dst_delta >> ss; \
152 } \
153 if (c->dstW & (4 >> ss)) { \
154 int av_unused Y, U, V; \
155
/*
 * Closing half of a generated converter function.
 *
 * Closes two open scopes (presumably the `if` block opened by
 * ENDYUV2RGBLINE and the row loop opened by YUV2RGBFUNC), returns
 * srcSliceH, and closes the function body.
 */
156 #define ENDYUV2RGBFUNC() \
157 } \
158 } \
159 return srcSliceH; \
160 }
161
/*
 * Convenience terminator: ENDYUV2RGBLINE(dst_delta, 0) immediately followed
 * by ENDYUV2RGBFUNC(), i.e. the block opened by ENDYUV2RGBLINE is left empty.
 */
162 #define CLOSEYUV2RGBFUNC(dst_delta) \
163 ENDYUV2RGBLINE(dst_delta, 0) \
164 ENDYUV2RGBFUNC()
165
170
174
178
186
195
200
201 LOADCHROMA(1);
204
205 LOADCHROMA(2);
208
209 LOADCHROMA(3);
213 LOADCHROMA(0);
216
217 LOADCHROMA(1);
221 LOADCHROMA(0);
225
227 LOADCHROMA(0);
230
231 LOADCHROMA(1);
234
235 LOADCHROMA(2);
238
239 LOADCHROMA(3);
243 LOADCHROMA(0);
246
247 LOADCHROMA(1);
251 LOADCHROMA(0);
255
257 LOADCHROMA(0);
260
261 LOADCHROMA(1);
262 PUTRGBA(dst_2, py_2, pa_2, 1, 24);
263 PUTRGBA(dst_1, py_1, pa_1, 1, 24);
264
265 LOADCHROMA(2);
266 PUTRGBA(dst_1, py_1, pa_1, 2, 24);
267 PUTRGBA(dst_2, py_2, pa_2, 2, 24);
268
269 LOADCHROMA(3);
270 PUTRGBA(dst_2, py_2, pa_2, 3, 24);
271 PUTRGBA(dst_1, py_1, pa_1, 3, 24);
275 LOADCHROMA(0);
276 PUTRGBA(dst_1, py_1, pa_1, 0, 24);
277 PUTRGBA(dst_2, py_2, pa_2, 0, 24);
278
279 LOADCHROMA(1);
280 PUTRGBA(dst_2, py_2, pa_2, 1, 24);
281 PUTRGBA(dst_1, py_1, pa_1, 1, 24);
282 pa_1 += 4;
283 pa_2 += 4;
285 LOADCHROMA(0);
286 PUTRGBA(dst_1, py_1, pa_1, 0, 24);
287 PUTRGBA(dst_2, py_2, pa_2, 0, 24);
289
291 LOADCHROMA(0);
292 PUTRGBA(dst_1, py_1, pa_1, 0, 0);
293 PUTRGBA(dst_2, py_2, pa_2, 0, 0);
294
295 LOADCHROMA(1);
296 PUTRGBA(dst_2, py_2, pa_2, 1, 0);
297 PUTRGBA(dst_1, py_1, pa_1, 1, 0);
298
299 LOADCHROMA(2);
300 PUTRGBA(dst_1, py_1, pa_1, 2, 0);
301 PUTRGBA(dst_2, py_2, pa_2, 2, 0);
302
303 LOADCHROMA(3);
304 PUTRGBA(dst_2, py_2, pa_2, 3, 0);
305 PUTRGBA(dst_1, py_1, pa_1, 3, 0);
306 pa_1 += 8;
307 pa_2 += 8;
309 LOADCHROMA(0);
310 PUTRGBA(dst_1, py_1, pa_1, 0, 0);
311 PUTRGBA(dst_2, py_2, pa_2, 0, 0);
312
313 LOADCHROMA(1);
314 PUTRGBA(dst_2, py_2, pa_2, 1, 0);
315 PUTRGBA(dst_1, py_1, pa_1, 1, 0);
316 pa_1 += 4;
317 pa_2 += 4;
319 LOADCHROMA(0);
320 PUTRGBA(dst_1, py_1, pa_1, 0, 0);
321 PUTRGBA(dst_2, py_2, pa_2, 0, 0);
323
325 LOADCHROMA(0);
328
329 LOADCHROMA(1);
332
333 LOADCHROMA(2);
336
337 LOADCHROMA(3);
341 LOADCHROMA(0);
344
345 LOADCHROMA(1);
349 LOADCHROMA(0);
353
354 // only trivial mods from yuv2rgb_c_24_rgb
356 LOADCHROMA(0);
359
360 LOADCHROMA(1);
363
364 LOADCHROMA(2);
367
368 LOADCHROMA(3);
372 LOADCHROMA(0);
375
376 LOADCHROMA(1);
380 LOADCHROMA(0);
384
385 YUV2RGBFUNC(yuv2rgb_c_16_ordered_dither, uint16_t, 0)
389
/*
 * Emit two dithered packed pixels for chroma position i.
 *
 * Each table lookup is offset by a dither value: r uses d16, g uses e16 and
 * b uses f16, at index (0 + o) for the first pixel and (1 + o) for the
 * second. Y is scratch; r, g, b, Y, d16, e16 and f16 must be in scope.
 */
#define PUTRGB16(dst, src, i, o)                            \
    do {                                                    \
        Y                  = (src)[2 * (i)];                \
        (dst)[2 * (i)]     = r[Y + d16[0 + (o)]] +          \
                             g[Y + e16[0 + (o)]] +          \
                             b[Y + f16[0 + (o)]];           \
        Y                  = (src)[2 * (i) + 1];            \
        (dst)[2 * (i) + 1] = r[Y + d16[1 + (o)]] +          \
                             g[Y + e16[1 + (o)]] +          \
                             b[Y + f16[1 + (o)]];           \
    } while (0)
402
406
410
415
416 YUV2RGBFUNC(yuv2rgb_c_15_ordered_dither, uint16_t, 0)
419
/*
 * Emit two dithered packed pixels for chroma position i.
 *
 * First pixel: r uses d16[0 + o], g uses d16[1 + o], b uses e16[0 + o].
 * Second pixel: r uses d16[1 + o], g uses d16[0 + o], b uses e16[1 + o]
 * (the r and g dither indices are swapped between the two pixels).
 * Y is scratch; r, g, b, Y, d16 and e16 must be in scope.
 */
#define PUTRGB15(dst, src, i, o)                            \
    do {                                                    \
        Y                  = (src)[2 * (i)];                \
        (dst)[2 * (i)]     = r[Y + d16[0 + (o)]] +          \
                             g[Y + d16[1 + (o)]] +          \
                             b[Y + e16[0 + (o)]];           \
        Y                  = (src)[2 * (i) + 1];            \
        (dst)[2 * (i) + 1] = r[Y + d16[1 + (o)]] +          \
                             g[Y + d16[0 + (o)]] +          \
                             b[Y + e16[1 + (o)]];           \
    } while (0)
432
436
440
445
446 // r, g, b, dst_1, dst_2
447 YUV2RGBFUNC(yuv2rgb_c_12_ordered_dither, uint16_t, 0)
449
/*
 * Emit two dithered packed pixels for chroma position i.
 *
 * All three table lookups of a pixel share one dither value from d16:
 * index (0 + o) for the first pixel and (1 + o) for the second.
 * Y is scratch; r, g, b, Y and d16 must be in scope.
 */
#define PUTRGB12(dst, src, i, o)                            \
    do {                                                    \
        Y                  = (src)[2 * (i)];                \
        (dst)[2 * (i)]     = r[Y + d16[0 + (o)]] +          \
                             g[Y + d16[0 + (o)]] +          \
                             b[Y + d16[0 + (o)]];           \
        Y                  = (src)[2 * (i) + 1];            \
        (dst)[2 * (i) + 1] = r[Y + d16[1 + (o)]] +          \
                             g[Y + d16[1 + (o)]] +          \
                             b[Y + d16[1 + (o)]];           \
    } while (0)
459
463
467
471
476
477 // r, g, b, dst_1, dst_2
478 YUV2RGBFUNC(yuv2rgb_c_8_ordered_dither, uint8_t, 0)
481
/*
 * Emit two dithered 8-bit pixels for chroma position i.
 *
 * The r and g lookups are offset by d32 and the b lookup by d64, at index
 * (0 + o) for the first pixel and (1 + o) for the second.
 * Y is scratch; r, g, b, Y, d32 and d64 must be in scope.
 */
#define PUTRGB8(dst, src, i, o)                             \
    do {                                                    \
        Y                  = (src)[2 * (i)];                \
        (dst)[2 * (i)]     = r[Y + d32[0 + (o)]] +          \
                             g[Y + d32[0 + (o)]] +          \
                             b[Y + d64[0 + (o)]];           \
        Y                  = (src)[2 * (i) + 1];            \
        (dst)[2 * (i) + 1] = r[Y + d32[1 + (o)]] +          \
                             g[Y + d32[1 + (o)]] +          \
                             b[Y + d64[1 + (o)]];           \
    } while (0)
491
494 PUTRGB8(dst_2, py_2, 0, 0 + 8);
495
497 PUTRGB8(dst_2, py_2, 1, 2 + 8);
499
502 PUTRGB8(dst_2, py_2, 2, 4 + 8);
503
505 PUTRGB8(dst_2, py_2, 3, 6 + 8);
508
509 YUV2RGBFUNC(yuv2rgb_c_4_ordered_dither, uint8_t, 0)
513
/*
 * Emit two dithered 4-bit pixels packed into one byte for chroma position i.
 *
 * The first pixel (luma src[2*i]) is accumulated into acc; the second
 * (luma src[2*i + 1]) is shifted left by 4 and OR-ed in; the result is
 * stored in dst[i]. r and b lookups are offset by d128, g by d64, at index
 * (0 + o) for the first pixel and (1 + o) for the second.
 * Y and acc are scratch; r, g, b, Y, acc, d64 and d128 must be in scope.
 */
#define PUTRGB4D(dst, src, i, o)                            \
    do {                                                    \
        Y        = (src)[2 * (i)];                          \
        acc      = r[Y + d128[0 + (o)]] +                   \
                   g[Y +  d64[0 + (o)]] +                   \
                   b[Y + d128[0 + (o)]];                    \
        Y        = (src)[2 * (i) + 1];                      \
        acc     |= (r[Y + d128[1 + (o)]] +                  \
                    g[Y +  d64[1 + (o)]] +                  \
                    b[Y + d128[1 + (o)]]) << 4;             \
        (dst)[(i)] = acc;                                   \
    } while (0)
524
528
532
536
541
542 YUV2RGBFUNC(yuv2rgb_c_4b_ordered_dither, uint8_t, 0)
545
/*
 * Emit two dithered pixels, one per destination byte, for chroma position i.
 *
 * Same lookups as the packed 4-bit variant (r and b offset by d128, g by
 * d64; index (0 + o) for the first pixel and (1 + o) for the second), but
 * each pixel is stored in its own element: dst[2*i] and dst[2*i + 1].
 * Y is scratch; r, g, b, Y, d64 and d128 must be in scope.
 */
#define PUTRGB4DB(dst, src, i, o)                           \
    do {                                                    \
        Y                  = (src)[2 * (i)];                \
        (dst)[2 * (i)]     = r[Y + d128[0 + (o)]] +         \
                             g[Y +  d64[0 + (o)]] +         \
                             b[Y + d128[0 + (o)]];          \
        Y                  = (src)[2 * (i) + 1];            \
        (dst)[2 * (i) + 1] = r[Y + d128[1 + (o)]] +         \
                             g[Y +  d64[1 + (o)]] +         \
                             b[Y + d128[1 + (o)]];          \
    } while (0)
555
559
563
567
572
573 YUV2RGBFUNC(yuv2rgb_c_1_ordered_dither, uint8_t, 0)
577
/*
 * Append two dithered 1-bit pixels to the accumulator `out`.
 *
 * For each of the luma samples src[2*i] and src[2*i + 1], `out` is doubled
 * (shifted left by one) and the g table entry at (Y + d128[...]) is added,
 * using dither index (0 + o) for the first pixel and (1 + o) for the second.
 * Y is scratch; g, Y and d128 must be in scope, and `out` must be a
 * modifiable lvalue.
 */
#define PUTRGB1(out, src, i, o)                             \
    do {                                                    \
        Y      = (src)[2 * (i)];                            \
        (out) += (out) + g[Y + d128[0 + (o)]];              \
        Y      = (src)[2 * (i) + 1];                        \
        (out) += (out) + g[Y + d128[1 + (o)]];              \
    } while (0)
583
585 PUTRGB1(out_2, py_2, 0, 0 + 8);
586
587 PUTRGB1(out_2, py_2, 1, 2 + 8);
589
591 PUTRGB1(out_2, py_2, 2, 4 + 8);
592
593 PUTRGB1(out_2, py_2, 3, 6 + 8);
595
599
601 {
603
604 if (ARCH_BFIN)
606 if (ARCH_PPC)
608 if (HAVE_VIS)
610 if (ARCH_X86)
612
613 if (t)
615
617 "No accelerated colorspace conversion found from %s to %s.\n",
619
620 switch (c->dstFormat) {
623 return yuv2rgb_c_bgr48;
626 return yuv2rgb_c_48;
629 if (CONFIG_SWSCALE_ALPHA &&
isALPHA(c->srcFormat))
630 return yuva2argb_c;
633 return (CONFIG_SWSCALE_ALPHA &&
isALPHA(c->srcFormat)) ? yuva2rgba_c : yuv2rgb_c_32;
635 return yuv2rgb_c_24_rgb;
637 return yuv2rgb_c_24_bgr;
640 return yuv2rgb_c_16_ordered_dither;
643 return yuv2rgb_c_15_ordered_dither;
646 return yuv2rgb_c_12_ordered_dither;
649 return yuv2rgb_c_8_ordered_dither;
652 return yuv2rgb_c_4_ordered_dither;
655 return yuv2rgb_c_4b_ordered_dither;
657 return yuv2rgb_c_1_ordered_dither;
658 }
659 return NULL;
660 }
661
662 static void fill_table(uint8_t*
table[256 + 2*YUVRGB_TABLE_HEADROOM],
const int elemsize,
663 const int64_t inc, void *y_tab)
664 {
665 int i;
666 uint8_t *y_table = y_tab;
667
668 y_table -= elemsize * (inc >> 9);
669
671 int64_t
cb = av_clip(i-YUVRGB_TABLE_HEADROOM, 0, 255)*inc;
672 table[i] = y_table + elemsize * (cb >> 16);
673 }
674 }
675
676 static void fill_gv_table(
int table[256 + 2*YUVRGB_TABLE_HEADROOM],
const int elemsize,
const int64_t inc)
677 {
678 int i;
679 int off = -(inc >> 9);
680
682 int64_t
cb = av_clip(i-YUVRGB_TABLE_HEADROOM, 0, 255)*inc;
683 table[i] = elemsize * (off + (cb >> 16));
684 }
685 }
686
688 {
689 int r = (f + (1 << 15)) >> 16;
690
691 if (r < -0x7FFF)
692 return 0x8000;
693 else if (r > 0x7FFF)
694 return 0x7FFF;
695 else
697 }
698
702 {
723 uint8_t *y_table;
724 uint16_t *y_table16;
725 uint32_t *y_table32;
726 int i, base, rbase, gbase, bbase,
av_uninit(abase), needAlpha;
727 const int yoffs = fullRange ? 384 : 326;
728
729 int64_t crv = inv_table[0];
730 int64_t cbu = inv_table[1];
731 int64_t cgu = -inv_table[2];
732 int64_t cgv = -inv_table[3];
733 int64_t cy = 1 << 16;
734 int64_t oy = 0;
735 int64_t yb = 0;
736
737 if (!fullRange) {
738 cy = (cy * 255) / 219;
739 oy = 16 << 16;
740 } else {
741 crv = (crv * 224) / 255;
742 cbu = (cbu * 224) / 255;
743 cgu = (cgu * 224) / 255;
744 cgv = (cgv * 224) / 255;
745 }
746
753
754 c->
uOffset = 0x0400040004000400LL;
755 c->
vOffset = 0x0400040004000400LL;
762
769
770 //scale coefficients by cy
771 crv = ((crv << 16) + 0x8000) /
FFMAX(cy, 1);
772 cbu = ((cbu << 16) + 0x8000) /
FFMAX(cy, 1);
773 cgu = ((cgu << 16) + 0x8000) /
FFMAX(cy, 1);
774 cgv = ((cgv << 16) + 0x8000) /
FFMAX(cy, 1);
775
777
778 switch (bpp) {
779 case 1:
782 yb = -(384 << 16) - oy;
783 for (i = 0; i < 1024 - 110; i++) {
784 y_table[i + 110] = av_clip_uint8((yb + 0x8000) >> 16) >> 7;
785 yb += cy;
786 }
789 break;
790 case 4:
791 case 4 | 128:
792 rbase = isRgb ? 3 : 0;
793 gbase = 1;
794 bbase = isRgb ? 0 : 3;
797 yb = -(384 << 16) - oy;
798 for (i = 0; i < 1024 - 110; i++) {
799 int yval = av_clip_uint8((yb + 0x8000) >> 16);
800 y_table[i + 110] = (yval >> 7) << rbase;
801 y_table[i + 37 + 1024] = ((yval + 43) / 85) << gbase;
802 y_table[i + 110 + 2048] = (yval >> 7) << bbase;
803 yb += cy;
804 }
809 break;
810 case 8:
811 rbase = isRgb ? 5 : 0;
812 gbase = isRgb ? 2 : 3;
813 bbase = isRgb ? 0 : 6;
816 yb = -(384 << 16) - oy;
817 for (i = 0; i < 1024 - 38; i++) {
818 int yval = av_clip_uint8((yb + 0x8000) >> 16);
819 y_table[i + 16] = ((yval + 18) / 36) << rbase;
820 y_table[i + 16 + 1024] = ((yval + 18) / 36) << gbase;
821 y_table[i + 37 + 2048] = ((yval + 43) / 85) << bbase;
822 yb += cy;
823 }
828 break;
829 case 12:
830 rbase = isRgb ? 8 : 0;
831 gbase = 4;
832 bbase = isRgb ? 0 : 8;
835 yb = -(384 << 16) - oy;
836 for (i = 0; i < 1024; i++) {
837 uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
838 y_table16[i] = (yval >> 4) << rbase;
839 y_table16[i + 1024] = (yval >> 4) << gbase;
840 y_table16[i + 2048] = (yval >> 4) << bbase;
841 yb += cy;
842 }
843 if (isNotNe)
844 for (i = 0; i < 1024 * 3; i++)
850 break;
851 case 15:
852 case 16:
853 rbase = isRgb ? bpp - 5 : 0;
854 gbase = 5;
855 bbase = isRgb ? 0 : (bpp - 5);
858 yb = -(384 << 16) - oy;
859 for (i = 0; i < 1024; i++) {
860 uint8_t yval = av_clip_uint8((yb + 0x8000) >> 16);
861 y_table16[i] = (yval >> 3) << rbase;
862 y_table16[i + 1024] = (yval >> (18 - bpp)) << gbase;
863 y_table16[i + 2048] = (yval >> 3) << bbase;
864 yb += cy;
865 }
866 if (isNotNe)
867 for (i = 0; i < 1024 * 3; i++)
873 break;
874 case 24:
875 case 48:
878 yb = -(384 << 16) - oy;
879 for (i = 0; i < 1024; i++) {
880 y_table[i] = av_clip_uint8((yb + 0x8000) >> 16);
881 yb += cy;
882 }
887 break;
888 case 32:
889 case 64:
892 rbase = base + (isRgb ? 16 : 0);
893 gbase = base + 8;
894 bbase = base + (isRgb ? 0 : 16);
896 if (!needAlpha)
897 abase = (base + 24) & 31;
900 yb = -(384 << 16) - oy;
901 for (i = 0; i < 1024; i++) {
902 unsigned yval = av_clip_uint8((yb + 0x8000) >> 16);
903 y_table32[i] = (yval << rbase) +
904 (needAlpha ? 0 : (255
u << abase));
905 y_table32[i + 1024] = yval << gbase;
906 y_table32[i + 2048] = yval << bbase;
907 yb += cy;
908 }
913 break;
914 default:
917 return -1;
918 }
919 return 0;
920 }