Diff of /trunk/xvidcore/src/image/colorspace.c

-revision 433, Fri Sep  6 17:37:07 2002 UTC
+revision 1382, Mon Mar 22 22:36:25 2004 UTC
 Line 1
  /*****************************************************************************
   *
   *  XVID MPEG-4 VIDEO CODEC
-  *  - colorspace conversion module -
+  *  - Colorspace conversion functions -
   *
-  *  Copyright(C) 2002 Peter Ross <pross@xvid.org>
+  *  Copyright(C) 2001-2003 Peter Ross <pross@xvid.org>
-  *
-  *  This program is an implementation of a part of one or more MPEG-4
-  *  Video tools as specified in ISO/IEC 14496-2 standard.  Those intending
-  *  to use this software module in hardware or software products are
-  *  advised that its use may infringe existing patents or copyrights, and
-  *  any such use would be at such party's own risk.  The original
-  *  developer of this software module and his/her company, and subsequent
-  *  editors and their companies, will have no liability for use of this
-  *  software or modifications or derivatives thereof.
   *
   *  This program is free software; you can redistribute it and/or modify
   *  it under the terms of the GNU General Public License as published by
-Line 28
+Line 19
   *  along with this program; if not, write to the Free Software
   *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
   *
+  * $Id: colorspace.c,v 1.9 2004-03-22 22:36:23 edgomez Exp $
+  *
   ****************************************************************************/
- #include <string.h>                             // memcpy
+ #include <string.h>                             /* memcpy */
+ #include "../global.h"
  #include "colorspace.h"
- #include "../divx4.h"                   // DEC_PICTURE
- // function pointers
+ /* function pointers
+  *
+  * One global pointer per conversion routine. They are only declared here
+  * (no initialiser); the code that assigns them is not part of this view.
+  * packedFuncPtr and planarFuncPtr are not defined in this section of the
+  * file (presumably colorspace.h -- confirm).
+  * NOTE(review): the names ending in "i" pair up with the "...i_to_yv12_c"
+  * functions generated further down, which handle four rows per step and
+  * feed rows 0 and 2 / rows 1 and 3 into separate chroma rows -- presumably
+  * the interlaced variants; confirm against the header.
+  */
  /* input */
- color_inputFuncPtr rgb555_to_yv12;
+ packedFuncPtr rgb555_to_yv12;
- color_inputFuncPtr rgb565_to_yv12;
+ packedFuncPtr rgb565_to_yv12;
- color_inputFuncPtr rgb24_to_yv12;
+ packedFuncPtr bgr_to_yv12;
- color_inputFuncPtr rgb32_to_yv12;
+ packedFuncPtr bgra_to_yv12;
- color_inputFuncPtr yuv_to_yv12;
+ packedFuncPtr abgr_to_yv12;
- color_inputFuncPtr yuyv_to_yv12;
+ packedFuncPtr rgba_to_yv12;
- color_inputFuncPtr uyvy_to_yv12;
+ packedFuncPtr argb_to_yv12;
+ packedFuncPtr yuv_to_yv12;
+ packedFuncPtr yuyv_to_yv12;
+ packedFuncPtr uyvy_to_yv12;
+ packedFuncPtr rgb555i_to_yv12;
+ packedFuncPtr rgb565i_to_yv12;
+ packedFuncPtr bgri_to_yv12;
+ packedFuncPtr bgrai_to_yv12;
+ packedFuncPtr abgri_to_yv12;
+ packedFuncPtr rgbai_to_yv12;
+ packedFuncPtr argbi_to_yv12;
+ packedFuncPtr yuyvi_to_yv12;
+ packedFuncPtr uyvyi_to_yv12;
  /* output */
- color_outputFuncPtr yv12_to_rgb555;
+ packedFuncPtr yv12_to_rgb555;
- color_outputFuncPtr yv12_to_rgb565;
+ packedFuncPtr yv12_to_rgb565;
- color_outputFuncPtr yv12_to_rgb24;
+ packedFuncPtr yv12_to_bgr;
- color_outputFuncPtr yv12_to_rgb32;
+ packedFuncPtr yv12_to_bgra;
- color_outputFuncPtr yv12_to_yuv;
+ packedFuncPtr yv12_to_abgr;
- color_outputFuncPtr yv12_to_yuyv;
+ packedFuncPtr yv12_to_rgba;
- color_outputFuncPtr yv12_to_uyvy;
+ packedFuncPtr yv12_to_argb;
+ packedFuncPtr yv12_to_yuv;
+ packedFuncPtr yv12_to_yuyv;
+ packedFuncPtr yv12_to_uyvy;
+ packedFuncPtr yv12_to_rgb555i;
+ packedFuncPtr yv12_to_rgb565i;
+ packedFuncPtr yv12_to_bgri;
+ packedFuncPtr yv12_to_bgrai;
+ packedFuncPtr yv12_to_abgri;
+ packedFuncPtr yv12_to_rgbai;
+ packedFuncPtr yv12_to_argbi;
+ packedFuncPtr yv12_to_yuyvi;
+ packedFuncPtr yv12_to_uyvyi;
+ planarFuncPtr yv12_to_yv12;
+ int32_t RGB_Y_tab[256];   /* five 256-entry lookup tables; revision 433 filled them in colorspace_init(), the new-side initialiser is not visible in this view */
+ int32_t B_U_tab[256];
+ int32_t G_U_tab[256];
+ int32_t G_V_tab[256];
+ int32_t R_V_tab[256];
+ /********** generic colorspace macro **********
+  *
+  * MAKE_COLORSPACE(NAME,SIZE,PIXELS,VPIXELS,FUNC,C1,C2,C3,C4) expands to the
+  * definition of a function called NAME that walks one packed plane (x_ptr)
+  * and three planar planes (y_ptr, u_ptr, v_ptr) in lock-step. What is read
+  * and what is written is decided entirely by FUNC.
+  *
+  *   SIZE     bytes per packed pixel (x_ptr advances PIXELS*SIZE per step)
+  *   PIXELS   pixels covered horizontally by one FUNC expansion
+  *   VPIXELS  rows covered vertically by one FUNC expansion
+  *   FUNC     per-group worker macro; FUNC##_ROW is expanded once per row
+  *            group, before the inner loop
+  *   C1..C4   handed through unchanged to FUNC and FUNC##_ROW
+  *
+  * Generated function body:
+  *   - width is rounded up to an even value (fixed_width).
+  *   - x_dif, y_dif and uv_dif are the distances from the end of the
+  *     processed part of a row to the start of the next row.
+  *   - when vflip is non-zero, x_ptr is moved to the last row, x_dif is
+  *     recomputed for a negative stride and x_stride is negated, so the
+  *     packed plane is traversed bottom-up.
+  *   - after each row group the pointers additionally skip VPIXELS-1 packed
+  *     and luma rows and (VPIXELS/2)-1 chroma rows.
+  *
+  * NOTE(review): height is not rounded. The outer loop steps by VPIXELS
+  * while y < height, so a height that is not a multiple of VPIXELS lets FUNC
+  * address rows beyond height -- confirm that callers guarantee this.
+  * NOTE(review): VPIXELS is used without parentheses in (VPIXELS-1) and
+  * (VPIXELS/2); every instantiation visible in this file passes 2 or 4.
+  */
+ #define MAKE_COLORSPACE(NAME,SIZE,PIXELS,VPIXELS,FUNC,C1,C2,C3,C4) \
+ void    \
+ NAME(uint8_t * x_ptr, int x_stride,     \
+                                  uint8_t * y_ptr, uint8_t * u_ptr, uint8_t * v_ptr,     \
+                                  int y_stride, int uv_stride,   \
+                                  int width, int height, int vflip)      \
+ {       \
+         int fixed_width = (width + 1) & ~1;                             \
+         int x_dif = x_stride - (SIZE)*fixed_width;              \
+         int y_dif = y_stride - fixed_width;                             \
+         int uv_dif = uv_stride - (fixed_width / 2);             \
+         int x, y;                                                                               \
+         if (vflip) {                                                            \
+                 x_ptr += (height - 1) * x_stride;                       \
+                 x_dif = -(SIZE)*fixed_width - x_stride;         \
+                 x_stride = -x_stride;                                           \
+         }                                                                                               \
+         for (y = 0; y < height; y+=(VPIXELS)) {                 \
+                 FUNC##_ROW(SIZE,C1,C2,C3,C4);                           \
+                 for (x = 0; x < fixed_width; x+=(PIXELS)) {     \
+                         FUNC(SIZE,C1,C2,C3,C4);                         \
+                         x_ptr += (PIXELS)*(SIZE);                               \
+                         y_ptr += (PIXELS);                                              \
+                         u_ptr += (PIXELS)/2;                                    \
+                         v_ptr += (PIXELS)/2;                                    \
+                 }                                                                                       \
+                 x_ptr += x_dif + (VPIXELS-1)*x_stride;          \
+                 y_ptr += y_dif + (VPIXELS-1)*y_stride;          \
+                 u_ptr += uv_dif + ((VPIXELS/2)-1)*uv_stride;    \
+                 v_ptr += uv_dif + ((VPIXELS/2)-1)*uv_stride;    \
+         }                                                                                               \
+ }
- #define MIN(A,B)        ((A)<(B)?(A):(B))
+ /********** colorspace input (xxx_to_yv12) functions **********/
- #define MAX(A,B)        ((A)>(B)?(A):(B))
  /*      rgb -> yuv def's
-Line 87
+Line 154
  #define FIX_IN(x)               ((uint16_t) ((x) * (1L<<SCALEBITS_IN) + 0.5))
- int32_t RGB_Y_tab[256];
+ /* rgb16/rgb16i input */
- int32_t B_U_tab[256];
- int32_t G_U_tab[256];
- int32_t G_V_tab[256];
- int32_t R_V_tab[256];
- /* rgb555 -> yuv 4:2:0 planar
-  *
-  * Revision 433 implementation (every line of it is on the removed side).
-  *
-  * src is read as rows of `width` 16-bit pixels (src_stride = width * 2
-  * bytes), each pixel fetched through a uint16_t pointer cast. A negative
-  * height selects bottom-up input: height is made positive, src is moved
-  * to the last row and src_stride is negated.
-  *
-  * Each inner iteration handles one 2x2 pixel block: the four pixels are
-  * split into b/g/r with the 5-5-5 shifts and masks, each pixel gets its
-  * own luma byte in y_out, and the component sums r4/g4/b4 yield a single
-  * u_out and v_out byte (the "+ 2" in the shift count divides the sum of
-  * four pixels by four).
-  *
-  * The outer loop runs height / 2 times; after each pass src moves two
-  * rows, y_out moves to the row after next and u_out / v_out advance by
-  * uv_dif = (y_stride - width) / 2.
-  */
- void
- rgb555_to_yv12_c(uint8_t * y_out,
-                                  uint8_t * u_out,
-                                  uint8_t * v_out,
-                                  uint8_t * src,
-                                  int width,
-                                  int height,
-                                  int y_stride)
- {
-         int32_t src_stride = width * 2;
-         uint32_t y_dif = y_stride - width;
-         uint32_t uv_dif = (y_stride - width) / 2;
-         uint32_t x, y;
-         if (height < 0) {
-                 height = -height;
-                 src += (height - 1) * src_stride;
-                 src_stride = -src_stride;
-         }
-         for (y = height / 2; y; y--) {
-                 // process one 2x2 block per iteration
-                 for (x = 0; x < (uint32_t) width; x += 2) {
-                         int rgb, r, g, b, r4, g4, b4;
-                         rgb = *(uint16_t *) (src + x * 2);
-                         b4 = b = (rgb << 3) & 0xf8;
-                         g4 = g = (rgb >> 2) & 0xf8;
-                         r4 = r = (rgb >> 7) & 0xf8;
-                         y_out[0] =
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
-                         rgb = *(uint16_t *) (src + x * 2 + src_stride);
-                         b4 += b = (rgb << 3) & 0xf8;
-                         g4 += g = (rgb >> 2) & 0xf8;
-                         r4 += r = (rgb >> 7) & 0xf8;
-                         y_out[y_stride] =
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
-                         rgb = *(uint16_t *) (src + x * 2 + 2);
-                         b4 += b = (rgb << 3) & 0xf8;
-                         g4 += g = (rgb >> 2) & 0xf8;
-                         r4 += r = (rgb >> 7) & 0xf8;
-                         y_out[1] =
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
-                         rgb = *(uint16_t *) (src + x * 2 + src_stride + 2);
-                         b4 += b = (rgb << 3) & 0xf8;
-                         g4 += g = (rgb >> 2) & 0xf8;
-                         r4 += r = (rgb >> 7) & 0xf8;
-                         y_out[y_stride + 1] =
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
-                         *u_out++ =
-                                 (uint8_t) ((-FIX_IN(U_R_IN) * r4 - FIX_IN(U_G_IN) * g4 +
-                                                         FIX_IN(U_B_IN) * b4) >> (SCALEBITS_IN + 2)) +
-                                 U_ADD_IN;
-                         *v_out++ =
-                                 (uint8_t) ((FIX_IN(V_R_IN) * r4 - FIX_IN(V_G_IN) * g4 -
-                                                         FIX_IN(V_B_IN) * b4) >> (SCALEBITS_IN + 2)) +
-                                 V_ADD_IN;
-                         y_out += 2;
-                 }
-                 src += src_stride * 2;
-                 y_out += y_dif + y_stride;
-                 u_out += uv_dif;
-                 v_out += uv_dif;
-         }
- }
- /* rgb565_to_yuv_c
-         NOTE:   identical to rgb555 except for shift/mask
-                         not tested
-         (revision 433 code, removed side; the function defined below is
-         actually named rgb565_to_yv12_c)
-         5-6-5 extraction: b = (rgb << 3) & 0xf8, g = (rgb >> 3) & 0xfc,
-         r = (rgb >> 8) & 0xf8.
-         A negative height selects bottom-up input (src starts at the last
-         row and src_stride is negated).
-         Every 2x2 pixel block produces four y_out bytes and one
-         u_out / v_out pair computed from the component sums r4/g4/b4. */
- void
- rgb565_to_yv12_c(uint8_t * y_out,
-                                  uint8_t * u_out,
-                                  uint8_t * v_out,
-                                  uint8_t * src,
-                                  int width,
-                                  int height,
-                                  int y_stride)
- {
-         int32_t src_stride = width * 2;
-         uint32_t y_dif = y_stride - width;
-         uint32_t uv_dif = (y_stride - width) / 2;
-         uint32_t x, y;
-         if (height < 0) {
-                 height = -height;
-                 src += (height - 1) * src_stride;
-                 src_stride = -src_stride;
-         }
-         for (y = height / 2; y; y--) {
-                 // process one 2x2 block per iteration
-                 for (x = 0; x < (uint32_t) width; x += 2) {
-                         int rgb, r, g, b, r4, g4, b4;
-                         rgb = *(uint16_t *) (src + x * 2);
-                         b4 = b = (rgb << 3) & 0xf8;
-                         g4 = g = (rgb >> 3) & 0xfc;
-                         r4 = r = (rgb >> 8) & 0xf8;
-                         y_out[0] =
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
-                         rgb = *(uint16_t *) (src + x * 2 + src_stride);
-                         b4 += b = (rgb << 3) & 0xf8;
-                         g4 += g = (rgb >> 3) & 0xfc;
-                         r4 += r = (rgb >> 8) & 0xf8;
-                         y_out[y_stride] =
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
-                         rgb = *(uint16_t *) (src + x * 2 + 2);
-                         b4 += b = (rgb << 3) & 0xf8;
-                         g4 += g = (rgb >> 3) & 0xfc;
-                         r4 += r = (rgb >> 8) & 0xf8;
-                         y_out[1] =
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
-                         rgb = *(uint16_t *) (src + x * 2 + src_stride + 2);
-                         b4 += b = (rgb << 3) & 0xf8;
-                         g4 += g = (rgb >> 3) & 0xfc;
-                         r4 += r = (rgb >> 8) & 0xf8;
-                         y_out[y_stride + 1] =
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
-                         *u_out++ =
-                                 (uint8_t) ((-FIX_IN(U_R_IN) * r4 - FIX_IN(U_G_IN) * g4 +
-                                                         FIX_IN(U_B_IN) * b4) >> (SCALEBITS_IN + 2)) +
-                                 U_ADD_IN;
-                         *v_out++ =
-                                 (uint8_t) ((FIX_IN(V_R_IN) * r4 - FIX_IN(V_G_IN) * g4 -
-                                                         FIX_IN(V_B_IN) * b4) >> (SCALEBITS_IN + 2)) +
-                                 V_ADD_IN;
-                         y_out += 2;
-                 }
-                 src += src_stride * 2;
-                 y_out += y_dif + y_stride;
-                 u_out += uv_dif;
-                 v_out += uv_dif;
-         }
- }
+ #define MK_RGB555_B(RGB)  ((RGB) << 3) & 0xf8   /* MK_RGB555_B/_G/_R: move one 5-bit field of a 5-5-5 pixel (bits 0-4, 5-9, 10-14) into bits 3-7 of the result */
- /*      rgb24 -> yuv 4:2:0 planar
+ #define MK_RGB555_G(RGB)  ((RGB) >> 2) & 0xf8
+ #define MK_RGB555_R(RGB)  ((RGB) >> 7) & 0xf8
-         NOTE: always flips.
-         (revision 433 rgb24_to_yv12_c, removed side: starts at row
-         height - 2 of src and steps two rows upward after every pass,
-         3 bytes per pixel, bytes 0,1,2 read as b,g,r)
- */
+ #define MK_RGB565_B(RGB)  ((RGB) << 3) & 0xf8   /* 5-6-5 pixel: blue, bits 0-4 -> bits 3-7 */
+ #define MK_RGB565_G(RGB)  ((RGB) >> 3) & 0xfc   /* green, bits 5-10 -> bits 2-7. NOTE(review): none of these extractor macros wraps its expansion in outer parentheses */
- void
+ #define MK_RGB565_R(RGB)  ((RGB) >> 8) & 0xf8   /* 5-6-5 pixel: red, bits 11-15 -> bits 3-7 */
- rgb24_to_yv12_c(uint8_t * y_out,
-                                 uint8_t * u_out,
-                                 uint8_t * v_out,
+ #define READ_RGB16_Y(ROW, UVID, C1,C2,C3,C4)    /* two 16-bit pixels of packed row ROW: C1 is the extractor prefix (C1##_B/_G/_R); writes two luma bytes and adds r,g,b into the rUVID/gUVID/bUVID sums */ \
-                                 uint8_t * src,
+         rgb = *(uint16_t *) (x_ptr + ((ROW)*x_stride) + 0);     \
-                                 int width,
+         b##UVID += b = C1##_B(rgb);                             \
-                                 int height,
+         g##UVID += g = C1##_G(rgb);                             \
-                                 int stride)
+         r##UVID += r = C1##_R(rgb);                             \
- {
+         y_ptr[(ROW)*y_stride+0] =                               \
-         uint32_t width3 = (width << 1) + width; /* width * 3 */
+                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +   \
-         uint32_t src_dif = (width << 3) + width;        /* width3 * 3 */
+                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;        \
-         uint32_t y_dif = (stride << 1) - width;
+         rgb = *(uint16_t *) (x_ptr + ((ROW)*x_stride) + 2);     \
-         uint32_t uv_dif = (stride - width) >> 1;
+         b##UVID += b = C1##_B(rgb);                             \
-         uint32_t x, y;
+         g##UVID += g = C1##_G(rgb);                             \
+         r##UVID += r = C1##_R(rgb);                             \
-         src += (height - 2) * width3;
+         y_ptr[(ROW)*y_stride+1] =                               \
+                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +                   \
+                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
-         for (y = height >> 1; y; y--) {
-                 for (x = width >> 1; x; x--) {
+ #define READ_RGB16_UV(UV_ROW,UVID)      /* one U and one V byte in chroma row UV_ROW from the rUVID/gUVID/bUVID sums; the "+ 2" in the shift count divides the four-pixel sum by four */ \
-                         uint32_t r, g, b, r4, g4, b4;
+         u_ptr[(UV_ROW)*uv_stride] =                                                                                                             \
+                 (uint8_t) ((-FIX_IN(U_R_IN) * r##UVID - FIX_IN(U_G_IN) * g##UVID +                      \
-                         b4 = b = src[0];
+                                         FIX_IN(U_B_IN) * b##UVID) >> (SCALEBITS_IN + 2)) + U_ADD_IN;    \
-                         g4 = g = src[1];
+         v_ptr[(UV_ROW)*uv_stride] =                                                                                                             \
-                         r4 = r = src[2];
+                 (uint8_t) ((FIX_IN(V_R_IN) * r##UVID - FIX_IN(V_G_IN) * g##UVID -                       \
-                         y_out[stride + 0] =
+                                         FIX_IN(V_B_IN) * b##UVID) >> (SCALEBITS_IN + 2)) + V_ADD_IN;
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
+ #define RGB16_TO_YV12_ROW(SIZE,C1,C2,C3,C4) \
+         /* nothing */
-                         b4 += (b = src[3]);
+ #define RGB16_TO_YV12(SIZE,C1,C2,C3,C4) /* one 2x2 block: rows 0 and 1 both feed sum set 0, which yields chroma row 0 */ \
-                         g4 += (g = src[4]);
+         uint32_t rgb, r, g, b, r0, g0, b0;      \
-                         r4 += (r = src[5]);
+         r0 = g0 = b0 = 0;                                       \
-                         y_out[stride + 1] =
+         READ_RGB16_Y (0, 0, C1,C2,C3,C4)        \
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
+         READ_RGB16_Y (1, 0, C1,C2,C3,C4)        \
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
+         READ_RGB16_UV(0, 0)
-                         b4 += (b = src[width3 + 0]);
-                         g4 += (g = src[width3 + 1]);
+ #define RGB16I_TO_YV12_ROW(SIZE,C1,C2,C3,C4) \
-                         r4 += (r = src[width3 + 2]);
+         /* nothing */
-                         y_out[0] =
+ #define RGB16I_TO_YV12(SIZE,C1,C2,C3,C4)        /* one 2x4 block: rows 0 and 2 feed sum set 0 (chroma row 0), rows 1 and 3 feed sum set 1 (chroma row 1) */ \
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
+         uint32_t rgb, r, g, b, r0, g0, b0, r1, g1, b1;  \
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
+         r0 = g0 = b0 = r1 = g1 = b1 = 0;        \
+         READ_RGB16_Y (0, 0, C1,C2,C3,C4)        \
-                         b4 += (b = src[width3 + 3]);
+         READ_RGB16_Y (1, 1, C1,C2,C3,C4)        \
-                         g4 += (g = src[width3 + 4]);
+         READ_RGB16_Y (2, 0, C1,C2,C3,C4)        \
-                         r4 += (r = src[width3 + 5]);
+         READ_RGB16_Y (3, 1, C1,C2,C3,C4)        \
-                         y_out[1] =
+         READ_RGB16_UV(0, 0)                                     \
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
+         READ_RGB16_UV(1, 1)
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
-                         *u_out++ =
+ /* rgb/rgbi input
+  *
+  * READ_RGB_Y handles two byte-packed pixels of packed row ROW. SIZE is the
+  * number of bytes per pixel and C1, C2, C3 are the byte offsets of the
+  * red, green and blue components inside a pixel (C4 is accepted but not
+  * used). It writes two luma bytes and adds r,g,b into the sums selected by
+  * UVID. READ_RGB_UV turns one set of sums into a U and a V byte.
+  */
-                                 (uint8_t) ((-FIX_IN(U_R_IN) * r4 - FIX_IN(U_G_IN) * g4 +
-                                                         FIX_IN(U_B_IN) * b4) >> (SCALEBITS_IN + 2)) +
+ #define READ_RGB_Y(SIZE, ROW, UVID, C1,C2,C3,C4)        \
-                                 U_ADD_IN;
+         r##UVID += r = x_ptr[(ROW)*x_stride+(C1)];                                              \
+         g##UVID += g = x_ptr[(ROW)*x_stride+(C2)];                                              \
+         b##UVID += b = x_ptr[(ROW)*x_stride+(C3)];                                              \
-                         *v_out++ =
+         y_ptr[(ROW)*y_stride+0] =                                                                       \
-                                 (uint8_t) ((FIX_IN(V_R_IN) * r4 - FIX_IN(V_G_IN) * g4 -
+                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +   \
-                                                         FIX_IN(V_B_IN) * b4) >> (SCALEBITS_IN + 2)) +
+                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;        \
-                                 V_ADD_IN;
+         r##UVID += r = x_ptr[(ROW)*x_stride+(SIZE)+(C1)];                               \
+         g##UVID += g = x_ptr[(ROW)*x_stride+(SIZE)+(C2)];                               \
+         b##UVID += b = x_ptr[(ROW)*x_stride+(SIZE)+(C3)];                               \
-                         src += 6;
+         y_ptr[(ROW)*y_stride+1] =                                                                       \
-                         y_out += 2;
+                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +   \
-                 }
+                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
-                 src -= src_dif;
-                 y_out += y_dif;
+ #define READ_RGB_UV(UV_ROW,UVID)        \
-                 u_out += uv_dif;
+         u_ptr[(UV_ROW)*uv_stride] =                                                                                                             \
-                 v_out += uv_dif;
+                 (uint8_t) ((-FIX_IN(U_R_IN) * r##UVID - FIX_IN(U_G_IN) * g##UVID +                      \
-         }
+                                         FIX_IN(U_B_IN) * b##UVID) >> (SCALEBITS_IN + 2)) + U_ADD_IN;    \
- }
+         v_ptr[(UV_ROW)*uv_stride] =                                                                                                             \
+                 (uint8_t) ((FIX_IN(V_R_IN) * r##UVID - FIX_IN(V_G_IN) * g##UVID -                       \
+                                         FIX_IN(V_B_IN) * b##UVID) >> (SCALEBITS_IN + 2)) + V_ADD_IN;
- /*      rgb32 -> yuv 4:2:0 planar
-         NOTE: always flips
-         (revision 433 rgb32_to_yv12_c, removed side: 4 bytes per source
-         pixel, bytes 0,1,2 read as b,g,r; starts at row height - 2 of src
-         and steps two rows upward after every pass)
+ #define RGB_TO_YV12_ROW(SIZE,C1,C2,C3,C4) \
- */
+         /* nothing */
+ #define RGB_TO_YV12(SIZE,C1,C2,C3,C4)   /* one 2x2 block: rows 0 and 1 both feed sum set 0, which yields chroma row 0 */ \
- void
+         uint32_t r, g, b, r0, g0, b0;           \
- rgb32_to_yv12_c(uint8_t * y_out,
+         r0 = g0 = b0 = 0;                                       \
-                                 uint8_t * u_out,
+         READ_RGB_Y(SIZE, 0, 0, C1,C2,C3,C4)     \
-                                 uint8_t * v_out,
+         READ_RGB_Y(SIZE, 1, 0, C1,C2,C3,C4)     \
-                                 uint8_t * src,
+         READ_RGB_UV(     0, 0)
-                                 int width,
-                                 int height,
+ #define RGBI_TO_YV12_ROW(SIZE,C1,C2,C3,C4) \
-                                 int stride)
+         /* nothing */
- {
+ #define RGBI_TO_YV12(SIZE,C1,C2,C3,C4)  /* one 2x4 block: rows 0 and 2 feed sum set 0 (chroma row 0), rows 1 and 3 feed sum set 1 (chroma row 1) */ \
-         uint32_t width4 = (width << 2); /* width * 4 */
+         uint32_t r, g, b, r0, g0, b0, r1, g1, b1;       \
-         uint32_t src_dif = 3 * width4;
+         r0 = g0 = b0 = r1 = g1 = b1 = 0;        \
-         uint32_t y_dif = (stride << 1) - width;
+         READ_RGB_Y(SIZE, 0, 0, C1,C2,C3,C4)     \
-         uint32_t uv_dif = (stride - width) >> 1;
+         READ_RGB_Y(SIZE, 1, 1, C1,C2,C3,C4)     \
-         uint32_t x, y;
+         READ_RGB_Y(SIZE, 2, 0, C1,C2,C3,C4)     \
+         READ_RGB_Y(SIZE, 3, 1, C1,C2,C3,C4)     \
-         src += (height - 2) * width4;
+         READ_RGB_UV(     0, 0)                          \
+         READ_RGB_UV(     1, 1)
-         for (y = height >> 1; y; y--) {
-                 for (x = width >> 1; x; x--) {
-                         uint32_t r, g, b, r4, g4, b4;
+ /* yuyv/yuyvi input
+  *
+  * C1 and C3 are the byte offsets of the two luma samples inside a 4-byte
+  * group of two pixels, C2 and C4 the offsets of the U and V samples.
+  * READ_YUYV_Y copies the two luma bytes of packed row ROW unchanged.
+  * READ_YUYV_UV writes one U and one V byte into chroma row UV_ROW, each
+  * being the rounded mean, (a + b + 1) / 2, of packed rows ROW1 and ROW2.
+  */
-                         b4 = b = src[0];
+ #define READ_YUYV_Y(ROW,C1,C2,C3,C4)    \
-                         g4 = g = src[1];
+         y_ptr[(ROW)*y_stride+0] = x_ptr[(ROW)*x_stride+(C1)];   \
-                         r4 = r = src[2];
+         y_ptr[(ROW)*y_stride+1] = x_ptr[(ROW)*x_stride+(C3)];
-                         y_out[stride + 0] =
+ #define READ_YUYV_UV(UV_ROW,ROW1,ROW2,C1,C2,C3,C4) \
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
+         u_ptr[(UV_ROW)*uv_stride] = (x_ptr[(ROW1)*x_stride+(C2)] + x_ptr[(ROW2)*x_stride+(C2)] + 1) / 2;        \
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
+         v_ptr[(UV_ROW)*uv_stride] = (x_ptr[(ROW1)*x_stride+(C4)] + x_ptr[(ROW2)*x_stride+(C4)] + 1) / 2;
-                         b4 += (b = src[4]);
+ #define YUYV_TO_YV12_ROW(SIZE,C1,C2,C3,C4) \
-                         g4 += (g = src[5]);
+         /* nothing */
-                         r4 += (r = src[6]);
+ #define YUYV_TO_YV12(SIZE,C1,C2,C3,C4)  \
-                         y_out[stride + 1] =
+         READ_YUYV_Y (0,      C1,C2,C3,C4)       \
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
+         READ_YUYV_Y (1,      C1,C2,C3,C4)       \
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
+         READ_YUYV_UV(0, 0,1, C1,C2,C3,C4)
-                         b4 += (b = src[width4 + 0]);
+ #define YUYVI_TO_YV12_ROW(SIZE,C1,C2,C3,C4) \
-                         g4 += (g = src[width4 + 1]);
+         /* nothing */
-                         r4 += (r = src[width4 + 2]);
+ #define YUYVI_TO_YV12(SIZE,C1,C2,C3,C4) \
+         READ_YUYV_Y (0, C1,C2,C3,C4)    \
-                         y_out[0] =
+         READ_YUYV_Y (1, C1,C2,C3,C4)    \
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
+         READ_YUYV_Y (2, C1,C2,C3,C4)    \
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
+         READ_YUYV_Y (3, C1,C2,C3,C4)    \
+         READ_YUYV_UV(0, 0,2, C1,C2,C3,C4)       \
-                         b4 += (b = src[width4 + 4]);
+         READ_YUYV_UV(1, 1,3, C1,C2,C3,C4)
-                         g4 += (g = src[width4 + 5]);
-                         r4 += (r = src[width4 + 6]);
-                         y_out[1] =
+ MAKE_COLORSPACE(rgb555_to_yv12_c,  2,2,2, RGB16_TO_YV12,  MK_RGB555, 0,0,0)   /* arguments: NAME, SIZE, PIXELS, VPIXELS, FUNC, C1..C4; for the 16-bit formats C1 is the extractor macro prefix */
-                                 (uint8_t) ((FIX_IN(Y_R_IN) * r + FIX_IN(Y_G_IN) * g +
+ MAKE_COLORSPACE(rgb565_to_yv12_c,  2,2,2, RGB16_TO_YV12,  MK_RGB565, 0,0,0)
-                                                         FIX_IN(Y_B_IN) * b) >> SCALEBITS_IN) + Y_ADD_IN;
+ MAKE_COLORSPACE(bgr_to_yv12_c,     3,2,2, RGB_TO_YV12,    2,1,0, 0)
+ MAKE_COLORSPACE(bgra_to_yv12_c,    4,2,2, RGB_TO_YV12,    2,1,0, 0)
-                         *u_out++ =
+ MAKE_COLORSPACE(abgr_to_yv12_c,    4,2,2, RGB_TO_YV12,    3,2,1, 0)
-                                 (uint8_t) ((-FIX_IN(U_R_IN) * r4 - FIX_IN(U_G_IN) * g4 +
+ MAKE_COLORSPACE(rgba_to_yv12_c,    4,2,2, RGB_TO_YV12,    0,1,2, 0)
-                                                         FIX_IN(U_B_IN) * b4) >> (SCALEBITS_IN + 2)) +
+ MAKE_COLORSPACE(argb_to_yv12_c,    4,2,2, RGB_TO_YV12,    1,2,3, 0)
-                                 U_ADD_IN;
+ MAKE_COLORSPACE(yuyv_to_yv12_c,    2,2,2, YUYV_TO_YV12,   0,1,2,3)
+ MAKE_COLORSPACE(uyvy_to_yv12_c,    2,2,2, YUYV_TO_YV12,   1,0,3,2)
-                         *v_out++ =
-                                 (uint8_t) ((FIX_IN(V_R_IN) * r4 - FIX_IN(V_G_IN) * g4 -
+ MAKE_COLORSPACE(rgb555i_to_yv12_c, 2,2,4, RGB16I_TO_YV12, MK_RGB555, 0,0,0)
-                                                         FIX_IN(V_B_IN) * b4) >> (SCALEBITS_IN + 2)) +
+ MAKE_COLORSPACE(rgb565i_to_yv12_c, 2,2,4, RGB16I_TO_YV12, MK_RGB565, 0,0,0)
-                                 V_ADD_IN;
+ MAKE_COLORSPACE(bgri_to_yv12_c,    3,2,4, RGBI_TO_YV12,   2,1,0, 0)
+ MAKE_COLORSPACE(bgrai_to_yv12_c,   4,2,4, RGBI_TO_YV12,   2,1,0, 0)
-                         src += 8;
+ MAKE_COLORSPACE(abgri_to_yv12_c,   4,2,4, RGBI_TO_YV12,   3,2,1, 0)
-                         y_out += 2;
+ MAKE_COLORSPACE(rgbai_to_yv12_c,   4,2,4, RGBI_TO_YV12,   0,1,2, 0)
-                 }
+ MAKE_COLORSPACE(argbi_to_yv12_c,   4,2,4, RGBI_TO_YV12,   1,2,3, 0)
-                 src -= src_dif;
+ MAKE_COLORSPACE(yuyvi_to_yv12_c,   2,2,4, YUYVI_TO_YV12,  0,1,2,3)
-                 y_out += y_dif;
+ MAKE_COLORSPACE(uyvyi_to_yv12_c,   2,2,4, YUYVI_TO_YV12,  1,0,3,2)
-                 u_out += uv_dif;
-                 v_out += uv_dif;
-         }
- }
- /*      yuv planar -> yuv 4:2:0 planar
-         NOTE: does not flip
-         (revision 433 code, removed side)
-         src is consumed as one contiguous buffer with no row padding:
-         `height` rows of `width` luma bytes, then height / 2 rows of
-         width / 2 bytes copied to u_out, then the same amount copied to
-         v_out. The destination rows are `stride` bytes apart for luma and
-         stride / 2 bytes apart for both chroma planes. */
- void
- yuv_to_yv12_c(uint8_t * y_out,
-                           uint8_t * u_out,
-                           uint8_t * v_out,
-                           uint8_t * src,
-                           int width,
-                           int height,
-                           int stride)
- {
-         uint32_t stride2 = stride >> 1;
-         uint32_t width2 = width >> 1;
-         uint32_t y;
-         for (y = height; y; y--) {
-                 memcpy(y_out, src, width);
-                 src += width;
-                 y_out += stride;
-         }
-         for (y = height >> 1; y; y--) {
-                 memcpy(u_out, src, width2);
-                 src += width2;
-                 u_out += stride2;
-         }
-         for (y = height >> 1; y; y--) {
-                 memcpy(v_out, src, width2);
-                 src += width2;
-                 v_out += stride2;
-         }
- }
- /* yuyv (yuv2) packed -> yuv 4:2:0 planar
-    NOTE: does not flip
-    (revision 433 code, removed side)
-    Rows are handled in pairs. For the first row of a pair every 4-byte
-    group Y0 U Y1 V yields two luma bytes plus one U and one V byte; each
-    chroma byte is the truncated mean (>> 1, no rounding) of this row's
-    sample and the byte width2 = 2 * width further on, i.e. the same
-    position in the next packed row. For the second row only the luma
-    bytes are copied and the chroma bytes are skipped.
-    src is assumed to have no row padding (rows are width2 bytes apart). */
- void
- yuyv_to_yv12_c(uint8_t * y_out,
-                            uint8_t * u_out,
-                            uint8_t * v_out,
-                            uint8_t * src,
-                            int width,
-                            int height,
-                            int stride)
- {
-         uint32_t width2 = width + width;
-         uint32_t y_dif = stride - width;
-         uint32_t uv_dif = y_dif >> 1;
-         uint32_t x, y;
-         for (y = height >> 1; y; y--) {
-                 for (x = width >> 1; x; x--) {
-                         *y_out++ = *src++;
-                         //*u_out++ = *src++;
-                         *u_out++ = (*(src + width2) + *src) >> 1;
-                         src++;
-                         *y_out++ = *src++;
-                         //*v_out++ = *src++;
-                         *v_out++ = (*(src + width2) + *src) >> 1;
-                         src++;
-                 }
-                 y_out += y_dif;
-                 u_out += uv_dif;
-                 v_out += uv_dif;
-                 for (x = width >> 1; x; x--) {
-                         *y_out++ = *src++;
-                         src++;
-                         *y_out++ = *src++;
-                         src++;
-                 }
-                 y_out += y_dif;
-         }
- }
+ /********** colorspace output (yv12_to_xxx) functions **********/
- /* uyvy packed -> yuv 4:2:0 planar
-    NOTE: does not flip
-    (revision 433 code, removed side)
-    Rows are handled in pairs; each 4-byte group is U Y0 V Y1. For the
-    first row of a pair both luma bytes are copied, V is the truncated
-    mean (>> 1) of this row's sample and the one width2 = 2 * width bytes
-    further on (same position, next packed row), and the second row
-    contributes luma only.
-    NOTE(review): U is copied from the first row alone -- the averaging
-    statement for U is commented out -- so U and V are treated differently
-    here. */
- void
- uyvy_to_yv12_c(uint8_t * y_out,
-                            uint8_t * u_out,
-                            uint8_t * v_out,
-                            uint8_t * src,
-                            int width,
-                            int height,
-                            int stride)
- {
-         uint32_t width2 = width + width;
-         uint32_t y_dif = stride - width;
-         uint32_t uv_dif = y_dif >> 1;
-         uint32_t x, y;
-         for (y = height >> 1; y; y--) {
-                 for (x = width >> 1; x; x--) {
-                         *u_out++ = *src++;
-                         // *u_out++ = (*(src+width2) + *src++) >> 1;
-                         *y_out++ = *src++;
-                         //*v_out++ = *src++;
-                         *v_out++ = (*(src + width2) + *src) >> 1;
-                         src++;
-                         *y_out++ = *src++;
-                 }
-                 y_out += y_dif;
-                 u_out += uv_dif;;
-                 v_out += uv_dif;;
-                 for (x = width >> 1; x; x--) {
-                         src++;
-                         *y_out++ = *src++;
-                         src++;
-                         *y_out++ = *src++;
-                 }
-                 y_out += y_dif;
-         }
- }
  /*      yuv -> rgb def's */
-Line 563
+Line 322
  #define R_V_OUT                 1.596
  #define V_ADD_OUT               128
  #define SCALEBITS_OUT   13
  #define FIX_OUT(x)              ((uint16_t) ((x) * (1L<<SCALEBITS_OUT) + 0.5))
- /* initialize rgb lookup tables */
+ /* rgb16/rgb16i output */
- void
+ #define MK_RGB555(R,G,B)        \
- colorspace_init(void)
+         ((MAX(0,MIN(255, R)) << 7) & 0x7c00) | \
- {
-         int32_t i;
-         for (i = 0; i < 256; i++) {
-                 RGB_Y_tab[i] = FIX_OUT(RGB_Y_OUT) * (i - Y_ADD_OUT);
-                 B_U_tab[i] = FIX_OUT(B_U_OUT) * (i - U_ADD_OUT);
-                 G_U_tab[i] = FIX_OUT(G_U_OUT) * (i - U_ADD_OUT);
-                 G_V_tab[i] = FIX_OUT(G_V_OUT) * (i - V_ADD_OUT);
-                 R_V_tab[i] = FIX_OUT(R_V_OUT) * (i - V_ADD_OUT);
-         }
- }
- /* yuv 4:2:0 planar -> rgb555 + very simple error diffusion
- */
- #define MK_RGB555(R,G,B)        ((MAX(0,MIN(255, R)) << 7) & 0x7c00) | \
                                                          ((MAX(0,MIN(255, G)) << 2) & 0x03e0) | \
                                                          ((MAX(0,MIN(255, B)) >> 3) & 0x001f)
+ #define MK_RGB565(R,G,B)        \
- void
+         ((MAX(0,MIN(255, R)) << 8) & 0xf800) | \
- yv12_to_rgb555_c(uint8_t * dst,
-                                  int dst_stride,
-                                  uint8_t * y_src,
-                                  uint8_t * u_src,
-                                  uint8_t * v_src,
-                                  int y_stride,
-                                  int uv_stride,
-                                  int width,
-                                  int height)
- {
-         const uint32_t dst_dif = 4 * dst_stride - 2 * width;
-         int32_t y_dif = 2 * y_stride - width;
-         uint8_t *dst2 = dst + 2 * dst_stride;
-         uint8_t *y_src2 = y_src + y_stride;
-         uint32_t x, y;
-         if (height < 0) {
-                 height = -height;
-                 y_src += (height - 1) * y_stride;
-                 y_src2 = y_src - y_stride;
-                 u_src += (height / 2 - 1) * uv_stride;
-                 v_src += (height / 2 - 1) * uv_stride;
-                 y_dif = -width - 2 * y_stride;
-                 uv_stride = -uv_stride;
-         }
-         for (y = height / 2; y; y--) {
-                 int r, g, b;
-                 int r2, g2, b2;
-                 r = g = b = 0;
-                 r2 = g2 = b2 = 0;
-                 // process one 2x2 block per iteration
-                 for (x = 0; x < (uint32_t) width / 2; x++) {
-                         int u, v;
-                         int b_u, g_uv, r_v, rgb_y;
-                         u = u_src[x];
-                         v = v_src[x];
-                         b_u = B_U_tab[u];
-                         g_uv = G_U_tab[u] + G_V_tab[v];
-                         r_v = R_V_tab[v];
-                         rgb_y = RGB_Y_tab[*y_src];
-                         b = (b & 0x7) + ((rgb_y + b_u) >> SCALEBITS_OUT);
-                         g = (g & 0x7) + ((rgb_y - g_uv) >> SCALEBITS_OUT);
-                         r = (r & 0x7) + ((rgb_y + r_v) >> SCALEBITS_OUT);
-                         *(uint16_t *) dst = MK_RGB555(r, g, b);
-                         y_src++;
-                         rgb_y = RGB_Y_tab[*y_src];
-                         b = (b & 0x7) + ((rgb_y + b_u) >> SCALEBITS_OUT);
-                         g = (g & 0x7) + ((rgb_y - g_uv) >> SCALEBITS_OUT);
-                         r = (r & 0x7) + ((rgb_y + r_v) >> SCALEBITS_OUT);
-                         *(uint16_t *) (dst + 2) = MK_RGB555(r, g, b);
-                         y_src++;
-                         rgb_y = RGB_Y_tab[*y_src2];
-                         b2 = (b2 & 0x7) + ((rgb_y + b_u) >> SCALEBITS_OUT);
-                         g2 = (g2 & 0x7) + ((rgb_y - g_uv) >> SCALEBITS_OUT);
-                         r2 = (r2 & 0x7) + ((rgb_y + r_v) >> SCALEBITS_OUT);
-                         *(uint16_t *) (dst2) = MK_RGB555(r2, g2, b2);
-                         y_src2++;
-                         rgb_y = RGB_Y_tab[*y_src2];
-                         b2 = (b2 & 0x7) + ((rgb_y + b_u) >> SCALEBITS_OUT);
-                         g2 = (g2 & 0x7) + ((rgb_y - g_uv) >> SCALEBITS_OUT);
-                         r2 = (r2 & 0x7) + ((rgb_y + r_v) >> SCALEBITS_OUT);
-                         *(uint16_t *) (dst2 + 2) = MK_RGB555(r2, g2, b2);
-                         y_src2++;
-                         dst += 4;
-                         dst2 += 4;
-                 }
-                 dst += dst_dif;
-                 dst2 += dst_dif;
-                 y_src += y_dif;
-                 y_src2 += y_dif;
-                 u_src += uv_stride;
-                 v_src += uv_stride;
-         }
- }
- /* yuv 4:2:0 planar -> rgb565 + very simple error diffusion
-         NOTE:   identical to rgb555 except for shift/mask  */
- #define MK_RGB565(R,G,B)        ((MAX(0,MIN(255, R)) << 8) & 0xf800) | \
                                                          ((MAX(0,MIN(255, G)) << 3) & 0x07e0) | \
                                                          ((MAX(0,MIN(255, B)) >> 3) & 0x001f)
- void
+ /* WRITE_RGB16(ROW, UV_ROW, C1)
+  *
+  * Emits two horizontally adjacent 16-bit pixels into destination row ROW.
+  *   ROW    - row offset used for both the luma fetch (ROW * y_stride) and
+  *            the destination (ROW * x_stride), and the index into the
+  *            r[]/g[]/b[] accumulators
+  *   UV_ROW - suffix pasted onto b_u / g_uv / r_v to select which set of
+  *            precomputed chroma terms is used
+  *   C1     - packing macro applied to (r, g, b), e.g. MK_RGB555 / MK_RGB565
+  *
+  * The low three bits of the previous pixel's channel value are carried into
+  * the next pixel (very simple error diffusion).
+  *
+  * The expansion site must provide rgb_y, r[], g[], b[], y_ptr, x_ptr,
+  * y_stride, x_stride and the b_u<n> / g_uv<n> / r_v<n> locals.
+  *
+  * The luma index is (ROW)*y_stride so that each destination row is built
+  * from its own luma row, matching WRITE_RGB. */
+ #define WRITE_RGB16(ROW,UV_ROW,C1)      \
- yv12_to_rgb565_c(uint8_t * dst,
+         rgb_y = RGB_Y_tab[ y_ptr[(ROW)*y_stride + 0] ];                 \
-                                  int dst_stride,
+         b[ROW] = (b[ROW] & 0x7) + ((rgb_y + b_u##UV_ROW) >> SCALEBITS_OUT);     \
-                                  uint8_t * y_src,
+         g[ROW] = (g[ROW] & 0x7) + ((rgb_y - g_uv##UV_ROW) >> SCALEBITS_OUT);    \
-                                  uint8_t * u_src,
+         r[ROW] = (r[ROW] & 0x7) + ((rgb_y + r_v##UV_ROW) >> SCALEBITS_OUT);             \
-                                  uint8_t * v_src,
+         *(uint16_t *) (x_ptr+((ROW)*x_stride)+0) = C1(r[ROW], g[ROW], b[ROW]);  \
-                                  int y_stride,
+         rgb_y = RGB_Y_tab[ y_ptr[(ROW)*y_stride + 1] ];                         \
-                                  int uv_stride,
+         b[ROW] = (b[ROW] & 0x7) + ((rgb_y + b_u##UV_ROW) >> SCALEBITS_OUT);             \
-                                  int width,
+         g[ROW] = (g[ROW] & 0x7) + ((rgb_y - g_uv##UV_ROW) >> SCALEBITS_OUT);    \
-                                  int height)
+         r[ROW] = (r[ROW] & 0x7) + ((rgb_y + r_v##UV_ROW) >> SCALEBITS_OUT);             \
- {
+         *(uint16_t *) (x_ptr+((ROW)*x_stride)+2) = C1(r[ROW], g[ROW], b[ROW]);
-         const uint32_t dst_dif = 4 * dst_stride - 2 * width;
-         int32_t y_dif = 2 * y_stride - width;
+ #define YV12_TO_RGB16_ROW(SIZE,C1,C2,C3,C4) \
+         int r[2], g[2], b[2];                                   \
-         uint8_t *dst2 = dst + 2 * dst_stride;
+         r[0] = r[1] = g[0] = g[1] = b[0] = b[1] = 0;
-         uint8_t *y_src2 = y_src + y_stride;
+ #define YV12_TO_RGB16(SIZE,C1,C2,C3,C4)         \
-         uint32_t x, y;
+         int rgb_y;                                                                                              \
+         int b_u0 = B_U_tab[ u_ptr[0] ];                                                         \
-         if (height < 0) {                       // flip image?
+         int g_uv0 = G_U_tab[ u_ptr[0] ] + G_V_tab[ v_ptr[0] ];          \
-                 height = -height;
+         int r_v0 = R_V_tab[ v_ptr[0] ];                                                         \
-                 y_src += (height - 1) * y_stride;
+         WRITE_RGB16(0, 0, C1)                                                                           \
-                 y_src2 = y_src - y_stride;
+         WRITE_RGB16(1, 0, C1)
-                 u_src += (height / 2 - 1) * uv_stride;
-                 v_src += (height / 2 - 1) * uv_stride;
+ #define YV12_TO_RGB16I_ROW(SIZE,C1,C2,C3,C4) \
-                 y_dif = -width - 2 * y_stride;
+         int r[4], g[4], b[4];                                   \
-                 uv_stride = -uv_stride;
+         r[0] = r[1] = r[2] = r[3] = 0;                  \
-         }
+         g[0] = g[1] = g[2] = g[3] = 0;                  \
+         b[0] = b[1] = b[2] = b[3] = 0;
-         for (y = height / 2; y; y--) {
+ #define YV12_TO_RGB16I(SIZE,C1,C2,C3,C4)                \
-                 int r, g, b;
+         int rgb_y;                                                                                                      \
-                 int r2, g2, b2;
+         int b_u0 = B_U_tab[ u_ptr[0] ];                                                         \
+         int g_uv0 = G_U_tab[ u_ptr[0] ] + G_V_tab[ v_ptr[0] ];          \
-                 r = g = b = 0;
+         int r_v0 = R_V_tab[ v_ptr[0] ];                                                         \
-                 r2 = g2 = b2 = 0;
+     int b_u1 = B_U_tab[ u_ptr[uv_stride] ];                                             \
+         int g_uv1 = G_U_tab[ u_ptr[uv_stride] ] + G_V_tab[ v_ptr[uv_stride] ];  \
-                 // process one 2x2 block per iteration
+         int r_v1 = R_V_tab[ v_ptr[uv_stride] ];                                         \
-                 for (x = 0; x < (uint32_t) width / 2; x++) {
+     WRITE_RGB16(0, 0, C1)                                                                               \
-                         int u, v;
+         WRITE_RGB16(1, 1, C1)                                                                           \
-                         int b_u, g_uv, r_v, rgb_y;
+     WRITE_RGB16(2, 0, C1)                                                                               \
+         WRITE_RGB16(3, 1, C1)                                                                           \
-                         u = u_src[x];
-                         v = v_src[x];
+ /* rgb/rgbi output */
-                         b_u = B_U_tab[u];
-                         g_uv = G_U_tab[u] + G_V_tab[v];
+ #define WRITE_RGB(SIZE,ROW,UV_ROW,C1,C2,C3,C4)  \
-                         r_v = R_V_tab[v];
+         rgb_y = RGB_Y_tab[ y_ptr[(ROW)*y_stride + 0] ];                                         \
+         x_ptr[(ROW)*x_stride+(C3)] = MAX(0, MIN(255, (rgb_y + b_u##UV_ROW) >> SCALEBITS_OUT));  \
-                         rgb_y = RGB_Y_tab[*y_src];
+         x_ptr[(ROW)*x_stride+(C2)] = MAX(0, MIN(255, (rgb_y - g_uv##UV_ROW) >> SCALEBITS_OUT)); \
-                         b = (b & 0x7) + ((rgb_y + b_u) >> SCALEBITS_OUT);
+         x_ptr[(ROW)*x_stride+(C1)] = MAX(0, MIN(255, (rgb_y + r_v##UV_ROW) >> SCALEBITS_OUT));  \
-                         g = (g & 0x7) + ((rgb_y - g_uv) >> SCALEBITS_OUT);
+         if ((SIZE)>3) x_ptr[(ROW)*x_stride+(C4)] = 0;                                                                   \
-                         r = (r & 0x7) + ((rgb_y + r_v) >> SCALEBITS_OUT);
+         rgb_y = RGB_Y_tab[ y_ptr[(ROW)*y_stride + 1] ];                                                                 \
-                         *(uint16_t *) dst = MK_RGB565(r, g, b);
+         x_ptr[(ROW)*x_stride+(SIZE)+(C3)] = MAX(0, MIN(255, (rgb_y + b_u##UV_ROW) >> SCALEBITS_OUT));   \
+         x_ptr[(ROW)*x_stride+(SIZE)+(C2)] = MAX(0, MIN(255, (rgb_y - g_uv##UV_ROW) >> SCALEBITS_OUT));  \
-                         y_src++;
+         x_ptr[(ROW)*x_stride+(SIZE)+(C1)] = MAX(0, MIN(255, (rgb_y + r_v##UV_ROW) >> SCALEBITS_OUT));   \
-                         rgb_y = RGB_Y_tab[*y_src];
+         if ((SIZE)>3) x_ptr[(ROW)*x_stride+(SIZE)+(C4)] = 0;
-                         b = (b & 0x7) + ((rgb_y + b_u) >> SCALEBITS_OUT);
-                         g = (g & 0x7) + ((rgb_y - g_uv) >> SCALEBITS_OUT);
-                         r = (r & 0x7) + ((rgb_y + r_v) >> SCALEBITS_OUT);
+ #define YV12_TO_RGB_ROW(SIZE,C1,C2,C3,C4)       /* nothing */
-                         *(uint16_t *) (dst + 2) = MK_RGB565(r, g, b);
+ #define YV12_TO_RGB(SIZE,C1,C2,C3,C4)                           \
-                         y_src++;
+         int rgb_y;                                                                                              \
+         int b_u0 = B_U_tab[ u_ptr[0] ];                                                 \
-                         rgb_y = RGB_Y_tab[*y_src2];
+         int g_uv0 = G_U_tab[ u_ptr[0] ] + G_V_tab[ v_ptr[0] ];  \
-                         b2 = (b2 & 0x7) + ((rgb_y + b_u) >> SCALEBITS_OUT);
+         int r_v0 = R_V_tab[ v_ptr[0] ];                                                 \
-                         g2 = (g2 & 0x7) + ((rgb_y - g_uv) >> SCALEBITS_OUT);
+         WRITE_RGB(SIZE, 0, 0, C1,C2,C3,C4)                                              \
-                         r2 = (r2 & 0x7) + ((rgb_y + r_v) >> SCALEBITS_OUT);
+         WRITE_RGB(SIZE, 1, 0, C1,C2,C3,C4)
-                         *(uint16_t *) (dst2) = MK_RGB565(r2, g2, b2);
-                         y_src2++;
+ #define YV12_TO_RGBI_ROW(SIZE,C1,C2,C3,C4)      /* nothing */
+ #define YV12_TO_RGBI(SIZE,C1,C2,C3,C4)                          \
-                         rgb_y = RGB_Y_tab[*y_src2];
+         int rgb_y;                                                                                              \
-                         b2 = (b2 & 0x7) + ((rgb_y + b_u) >> SCALEBITS_OUT);
+         int b_u0 = B_U_tab[ u_ptr[0] ];                                                 \
-                         g2 = (g2 & 0x7) + ((rgb_y - g_uv) >> SCALEBITS_OUT);
+         int g_uv0 = G_U_tab[ u_ptr[0] ] + G_V_tab[ v_ptr[0] ];  \
-                         r2 = (r2 & 0x7) + ((rgb_y + r_v) >> SCALEBITS_OUT);
+         int r_v0 = R_V_tab[ v_ptr[0] ];                                                 \
-                         *(uint16_t *) (dst2 + 2) = MK_RGB565(r2, g2, b2);
+     int b_u1 = B_U_tab[ u_ptr[uv_stride] ];                                     \
-                         y_src2++;
+         int g_uv1 = G_U_tab[ u_ptr[uv_stride] ] + G_V_tab[ v_ptr[uv_stride] ];  \
+         int r_v1 = R_V_tab[ v_ptr[uv_stride] ];                                 \
-                         dst += 4;
+         WRITE_RGB(SIZE, 0, 0, C1,C2,C3,C4)              \
-                         dst2 += 4;
+         WRITE_RGB(SIZE, 1, 1, C1,C2,C3,C4)              \
-                 }
+         WRITE_RGB(SIZE, 2, 0, C1,C2,C3,C4)              \
+         WRITE_RGB(SIZE, 3, 1, C1,C2,C3,C4)
-                 dst += dst_dif;
-                 dst2 += dst_dif;
+ /* yuyv/yuyvi output */
-                 y_src += y_dif;
-                 y_src2 += y_dif;
+ #define WRITE_YUYV(ROW,UV_ROW,C1,C2,C3,C4)      \
+         x_ptr[(ROW)*x_stride+(C1)] = y_ptr[   (ROW)*y_stride +0];       \
-                 u_src += uv_stride;
+         x_ptr[(ROW)*x_stride+(C2)] = u_ptr[(UV_ROW)*uv_stride+0];       \
-                 v_src += uv_stride;
+         x_ptr[(ROW)*x_stride+(C3)] = y_ptr[   (ROW)*y_stride +1];       \
-         }
+         x_ptr[(ROW)*x_stride+(C4)] = v_ptr[(UV_ROW)*uv_stride+0];       \
- }
+ #define YV12_TO_YUYV_ROW(SIZE,C1,C2,C3,C4)      /* nothing */
+ #define YV12_TO_YUYV(SIZE,C1,C2,C3,C4)  \
+         WRITE_YUYV(0, 0, C1,C2,C3,C4)           \
- /* yuv 4:2:0 planar -> rgb24 */
+         WRITE_YUYV(1, 0, C1,C2,C3,C4)
- void
+ #define YV12_TO_YUYVI_ROW(SIZE,C1,C2,C3,C4) /* nothing */
- yv12_to_rgb24_c(uint8_t * dst,
+ #define YV12_TO_YUYVI(SIZE,C1,C2,C3,C4) \
-                                 int dst_stride,
+         WRITE_YUYV(0, 0, C1,C2,C3,C4)           \
-                                 uint8_t * y_src,
+         WRITE_YUYV(1, 1, C1,C2,C3,C4)           \
-                                 uint8_t * u_src,
+         WRITE_YUYV(2, 0, C1,C2,C3,C4)           \
-                                 uint8_t * v_src,
+         WRITE_YUYV(3, 1, C1,C2,C3,C4)
-                                 int y_stride,
-                                 int uv_stride,
-                                 int width,
+ MAKE_COLORSPACE(yv12_to_rgb555_c,  2,2,2, YV12_TO_RGB16,  MK_RGB555, 0,0,0)
-                                 int height)
+ MAKE_COLORSPACE(yv12_to_rgb565_c,  2,2,2, YV12_TO_RGB16,  MK_RGB565, 0,0,0)
- {
+ MAKE_COLORSPACE(yv12_to_bgr_c,     3,2,2, YV12_TO_RGB,    2,1,0, 0)
-         const uint32_t dst_dif = 6 * dst_stride - 3 * width;
+ MAKE_COLORSPACE(yv12_to_bgra_c,    4,2,2, YV12_TO_RGB,    2,1,0,3)
-         int32_t y_dif = 2 * y_stride - width;
+ MAKE_COLORSPACE(yv12_to_abgr_c,    4,2,2, YV12_TO_RGB,    3,2,1,0)
+ MAKE_COLORSPACE(yv12_to_rgba_c,    4,2,2, YV12_TO_RGB,    0,1,2,3)
-         uint8_t *dst2 = dst + 3 * dst_stride;
+ MAKE_COLORSPACE(yv12_to_argb_c,    4,2,2, YV12_TO_RGB,    1,2,3,0)
-         uint8_t *y_src2 = y_src + y_stride;
+ MAKE_COLORSPACE(yv12_to_yuyv_c,    2,2,2, YV12_TO_YUYV,   0,1,2,3)
-         uint32_t x, y;
+ MAKE_COLORSPACE(yv12_to_uyvy_c,    2,2,2, YV12_TO_YUYV,   1,0,3,2)
-         if (height < 0) {                       // flip image?
+ MAKE_COLORSPACE(yv12_to_rgb555i_c, 2,2,4, YV12_TO_RGB16I, MK_RGB555, 0,0,0)
-                 height = -height;
+ MAKE_COLORSPACE(yv12_to_rgb565i_c, 2,2,4, YV12_TO_RGB16I, MK_RGB565, 0,0,0)
-                 y_src += (height - 1) * y_stride;
+ MAKE_COLORSPACE(yv12_to_bgri_c,    3,2,4, YV12_TO_RGBI,   2,1,0, 0)
-                 y_src2 = y_src - y_stride;
+ MAKE_COLORSPACE(yv12_to_bgrai_c,   4,2,4, YV12_TO_RGBI,   2,1,0,3)
-                 u_src += (height / 2 - 1) * uv_stride;
+ MAKE_COLORSPACE(yv12_to_abgri_c,   4,2,4, YV12_TO_RGBI,   3,2,1,0)
-                 v_src += (height / 2 - 1) * uv_stride;
+ MAKE_COLORSPACE(yv12_to_rgbai_c,   4,2,4, YV12_TO_RGBI,   0,1,2,3)
-                 y_dif = -width - 2 * y_stride;
+ MAKE_COLORSPACE(yv12_to_argbi_c,   4,2,4, YV12_TO_RGBI,   1,2,3,0)
-                 uv_stride = -uv_stride;
+ MAKE_COLORSPACE(yv12_to_yuyvi_c,   2,2,4, YV12_TO_YUYVI,  0,1,2,3)
-         }
+ MAKE_COLORSPACE(yv12_to_uyvyi_c,   2,2,4, YV12_TO_YUYVI,  1,0,3,2)
-         for (y = height / 2; y; y--) {
-                 // process one 2x2 block per iteration
-                 for (x = 0; x < (uint32_t) width / 2; x++) {
+ /* yv12 to yv12 copy function */
-                         int u, v;
-                         int b_u, g_uv, r_v, rgb_y;
+ void
-                         int r, g, b;
+ yv12_to_yv12_c(uint8_t * y_dst, uint8_t * u_dst, uint8_t * v_dst,
+                                 int y_dst_stride, int uv_dst_stride,
-                         u = u_src[x];
+                                 uint8_t * y_src, uint8_t * u_src, uint8_t * v_src,
-                         v = v_src[x];
+                                 int y_src_stride, int uv_src_stride,
+                                 int width, int height, int vflip)
-                         b_u = B_U_tab[u];
+ {
-                         g_uv = G_U_tab[u] + G_V_tab[v];
+         int width2 = width / 2;
-                         r_v = R_V_tab[v];
+         int height2 = height / 2;
+         int y;
-                         rgb_y = RGB_Y_tab[*y_src];
-                         b = (rgb_y + b_u) >> SCALEBITS_OUT;
+         if (vflip) {
-                         g = (rgb_y - g_uv) >> SCALEBITS_OUT;
+                 y_src += (height - 1) * y_src_stride;
-                         r = (rgb_y + r_v) >> SCALEBITS_OUT;
+                 u_src += (height2 - 1) * uv_src_stride;
-                         dst[0] = MAX(0, MIN(255, b));
+                 v_src += (height2 - 1) * uv_src_stride;
-                         dst[1] = MAX(0, MIN(255, g));
+                 y_src_stride = -y_src_stride;
-                         dst[2] = MAX(0, MIN(255, r));
+                 uv_src_stride = -uv_src_stride;
-                         y_src++;
-                         rgb_y = RGB_Y_tab[*y_src];
-                         b = (rgb_y + b_u) >> SCALEBITS_OUT;
-                         g = (rgb_y - g_uv) >> SCALEBITS_OUT;
-                         r = (rgb_y + r_v) >> SCALEBITS_OUT;
-                         dst[3] = MAX(0, MIN(255, b));
-                         dst[4] = MAX(0, MIN(255, g));
-                         dst[5] = MAX(0, MIN(255, r));
-                         y_src++;
-                         rgb_y = RGB_Y_tab[*y_src2];
-                         b = (rgb_y + b_u) >> SCALEBITS_OUT;
-                         g = (rgb_y - g_uv) >> SCALEBITS_OUT;
-                         r = (rgb_y + r_v) >> SCALEBITS_OUT;
-                         dst2[0] = MAX(0, MIN(255, b));
-                         dst2[1] = MAX(0, MIN(255, g));
-                         dst2[2] = MAX(0, MIN(255, r));
-                         y_src2++;
-                         rgb_y = RGB_Y_tab[*y_src2];
-                         b = (rgb_y + b_u) >> SCALEBITS_OUT;
-                         g = (rgb_y - g_uv) >> SCALEBITS_OUT;
-                         r = (rgb_y + r_v) >> SCALEBITS_OUT;
-                         dst2[3] = MAX(0, MIN(255, b));
-                         dst2[4] = MAX(0, MIN(255, g));
-                         dst2[5] = MAX(0, MIN(255, r));
-                         y_src2++;
-                         dst += 6;
-                         dst2 += 6;
-                 }
-                 dst += dst_dif;
-                 dst2 += dst_dif;
-                 y_src += y_dif;
-                 y_src2 += y_dif;
-                 u_src += uv_stride;
-                 v_src += uv_stride;
-         }
- }
- /* yuv 4:2:0 planar -> rgb32
-
-    Converts one 2x2 block of pixels per inner iteration, sharing a single
-    chroma sample across the block. Each output pixel is four bytes: the
-    values computed as r, g, b followed by a zero byte.
-
-    dst_stride is expressed in pixels (it is multiplied by 4 here to obtain
-    bytes). A negative height requests a vertical flip: the source planes
-    are then read from the last row upwards while dst is written top-down.
-    An odd trailing row or column is not converted.
-
-    NOTE(review): v_src is declared before u_src here, whereas
-    yv12_to_rgb24_c declares u_src first. Presumably this is a deliberate
-    way to swap the red and blue channels for callers that pass the planes
-    positionally - confirm against the call sites. */
- void
- yv12_to_rgb32_c(uint8_t * dst,
-                                 int dst_stride,
-                                 uint8_t * y_src,
-                                 uint8_t * v_src,
-                                 uint8_t * u_src,
-                                 int y_stride,
-                                 int uv_stride,
-                                 int width,
-                                 int height)
- {
-         const uint32_t dst_dif = 8 * dst_stride - 4 * width;    /* bytes from the end of one row pair to the start of the next */
-         int32_t y_dif = 2 * y_stride - width;                   /* luma step from the end of a row to the row two below */
-         uint8_t *dst2 = dst + 4 * dst_stride;                   /* second output row of the pair */
-         uint8_t *y_src2 = y_src + y_stride;                     /* second luma row of the pair */
-         uint32_t x, y;
-         if (height < 0) {                       /* flip image? */
-                 height = -height;
-                 y_src += (height - 1) * y_stride;               /* start at the last luma row */
-                 y_src2 = y_src - y_stride;                      /* the pair's second row is the one above */
-                 u_src += (height / 2 - 1) * uv_stride;
-                 v_src += (height / 2 - 1) * uv_stride;
-                 y_dif = -width - 2 * y_stride;                  /* walk the luma plane upwards, two rows at a time */
-                 uv_stride = -uv_stride;
-         }
-         for (y = height / 2; y; y--) {
-                 /* process one 2x2 block per iteration */
-                 for (x = 0; x < (uint32_t) width / 2; x++) {
-                         int u, v;
-                         int b_u, g_uv, r_v, rgb_y;
-                         int r, g, b;
-                         u = u_src[x];
-                         v = v_src[x];
-                         b_u = B_U_tab[u];                       /* chroma terms are shared by all four pixels of the block */
-                         g_uv = G_U_tab[u] + G_V_tab[v];
-                         r_v = R_V_tab[v];
-                         rgb_y = RGB_Y_tab[*y_src];              /* top-left pixel */
-                         b = (rgb_y + b_u) >> SCALEBITS_OUT;
-                         g = (rgb_y - g_uv) >> SCALEBITS_OUT;
-                         r = (rgb_y + r_v) >> SCALEBITS_OUT;
-                         dst[0] = MAX(0, MIN(255, r));
-                         dst[1] = MAX(0, MIN(255, g));
-                         dst[2] = MAX(0, MIN(255, b));
-                         dst[3] = 0;
-                         y_src++;
-                         rgb_y = RGB_Y_tab[*y_src];              /* top-right pixel */
-                         b = (rgb_y + b_u) >> SCALEBITS_OUT;
-                         g = (rgb_y - g_uv) >> SCALEBITS_OUT;
-                         r = (rgb_y + r_v) >> SCALEBITS_OUT;
-                         dst[4] = MAX(0, MIN(255, r));
-                         dst[5] = MAX(0, MIN(255, g));
-                         dst[6] = MAX(0, MIN(255, b));
-                         dst[7] = 0;
-                         y_src++;
-                         rgb_y = RGB_Y_tab[*y_src2];             /* bottom-left pixel */
-                         b = (rgb_y + b_u) >> SCALEBITS_OUT;
-                         g = (rgb_y - g_uv) >> SCALEBITS_OUT;
-                         r = (rgb_y + r_v) >> SCALEBITS_OUT;
-                         dst2[0] = MAX(0, MIN(255, r));
-                         dst2[1] = MAX(0, MIN(255, g));
-                         dst2[2] = MAX(0, MIN(255, b));
-                         dst2[3] = 0;
-                         y_src2++;
-                         rgb_y = RGB_Y_tab[*y_src2];             /* bottom-right pixel */
-                         b = (rgb_y + b_u) >> SCALEBITS_OUT;
-                         g = (rgb_y - g_uv) >> SCALEBITS_OUT;
-                         r = (rgb_y + r_v) >> SCALEBITS_OUT;
-                         dst2[4] = MAX(0, MIN(255, r));
-                         dst2[5] = MAX(0, MIN(255, g));
-                         dst2[6] = MAX(0, MIN(255, b));
-                         dst2[7] = 0;
-                         y_src2++;
-                         dst += 8;
-                         dst2 += 8;
-                 }
-                 dst += dst_dif;
-                 dst2 += dst_dif;
-                 y_src += y_dif;
-                 y_src2 += y_dif;
-                 u_src += uv_stride;
-                 v_src += uv_stride;
-         }
- }
- /*      yuv 4:2:0 planar -> yuv planar */
- void
- yv12_to_yuv_c(uint8_t * dst,
-                           int dst_stride,
-                           uint8_t * y_src,
-                           uint8_t * u_src,
-                           uint8_t * v_src,
-                           int y_stride,
-                           int uv_stride,
-                           int width,
-                           int height)
- {
-         uint32_t dst_stride2 = dst_stride >> 1;
-         uint32_t width2 = width >> 1;
-         uint32_t y;
-         if (height < 0) {
-                 height = -height;
-                 y_src += (height - 1) * y_stride;
-                 u_src += (height / 2 - 1) * uv_stride;
-                 v_src += (height / 2 - 1) * uv_stride;
-                 y_stride = -y_stride;
-                 uv_stride = -uv_stride;
          }
          for (y = height; y; y--) {
-                 memcpy(dst, y_src, width);
+                 memcpy(y_dst, y_src, width);
-                 dst += dst_stride;
+                 y_src += y_src_stride;
-                 y_src += y_stride;
+                 y_dst += y_dst_stride;
          }
-         for (y = height >> 1; y; y--) {
+         for (y = height2; y; y--) {
-                 memcpy(dst, u_src, width2);
+                 memcpy(u_dst, u_src, width2);
-                 dst += dst_stride2;
+                 u_src += uv_src_stride;
-                 u_src += uv_stride;
+                 u_dst += uv_dst_stride;
          }
-         for (y = height >> 1; y; y--) {
+         for (y = height2; y; y--) {
-                 memcpy(dst, v_src, width2);
+                 memcpy(v_dst, v_src, width2);
-                 dst += dst_stride2;
+                 v_src += uv_src_stride;
-                 v_src += uv_stride;
+                 v_dst += uv_dst_stride;
          }
  }
+ /* initialize rgb lookup tables */
- /* yuv 4:2:0 planar -> yuyv packed (the original comment calls this
-    "yuv2"; presumably YUY2 is meant)
-
-    Writes four bytes per pixel pair in the order Y, U, Y, V. Every chroma
-    row is used for two consecutive output rows. dst_stride is expressed in
-    pixels (two bytes each). A negative height requests a vertical flip: the
-    source planes are then read from the last row upwards. */
- void
- yv12_to_yuyv_c(uint8_t * dst,
-                            int dst_stride,
-                            uint8_t * y_src,
-                            uint8_t * u_src,
-                            uint8_t * v_src,
-                            int y_stride,
-                            int uv_stride,
-                            int width,
-                            int height)
- {
-         const uint32_t dst_dif = 2 * (dst_stride - width);      /* padding bytes at the end of each output row */
-         uint32_t x, y;
-         if (height < 0) {                       /* flip: start at the last source rows and walk upwards */
-                 height = -height;
-                 y_src += (height - 1) * y_stride;
-                 u_src += (height / 2 - 1) * uv_stride;
-                 v_src += (height / 2 - 1) * uv_stride;
-                 y_stride = -y_stride;
-                 uv_stride = -uv_stride;
-         }
-         for (y = 0; y < (uint32_t) height; y++) {
-                 for (x = 0; x < (uint32_t) width / 2; x++) {    /* two pixels per iteration */
-                         dst[0] = y_src[2 * x];
-                         dst[1] = u_src[x];
-                         dst[2] = y_src[2 * x + 1];
-                         dst[3] = v_src[x];
-                         dst += 4;
-                 }
-                 dst += dst_dif;
-                 y_src += y_stride;
-                 if (y & 1) {                    /* advance chroma only after every second row */
-                         u_src += uv_stride;
-                         v_src += uv_stride;
-                 }
-         }
- }
- /* yuv 4:2:0 planar -> uyvy packed
-
-    Writes four bytes per pixel pair in the order U, Y, V, Y. Every chroma
-    row is used for two consecutive output rows. dst_stride is expressed in
-    pixels (two bytes each). A negative height requests a vertical flip: the
-    source planes are then read from the last row upwards. */
- void
- yv12_to_uyvy_c(uint8_t * dst,
-                            int dst_stride,
-                            uint8_t * y_src,
-                            uint8_t * u_src,
-                            uint8_t * v_src,
-                            int y_stride,
-                            int uv_stride,
-                            int width,
-                            int height)
- {
-         const uint32_t dst_dif = 2 * (dst_stride - width);      /* padding bytes at the end of each output row */
-         uint32_t x, y;
-         if (height < 0) {                       /* flip: start at the last source rows and walk upwards */
-                 height = -height;
-                 y_src += (height - 1) * y_stride;
-                 u_src += (height / 2 - 1) * uv_stride;
-                 v_src += (height / 2 - 1) * uv_stride;
-                 y_stride = -y_stride;
-                 uv_stride = -uv_stride;
-         }
-         for (y = 0; y < (uint32_t) height; y++) {
-                 for (x = 0; x < (uint32_t) width / 2; x++) {    /* two pixels per iteration */
-                         dst[0] = u_src[x];
-                         dst[1] = y_src[2 * x];
-                         dst[2] = v_src[x];
-                         dst[3] = y_src[2 * x + 1];
-                         dst += 4;
-                 }
-                 dst += dst_dif;
-                 y_src += y_stride;
-                 if (y & 1) {                    /* advance chroma only after every second row */
-                         u_src += uv_stride;
-                         v_src += uv_stride;
-                 }
-         }
- }
- /*      user yuv planar -> yuv 4:2:0 planar
-         NOTE: does not flip */
  void
- user_to_yuv_c(uint8_t * y_out,
+ colorspace_init(void)
-                           uint8_t * u_out,
-                           uint8_t * v_out,
-                           int stride,
-                           DEC_PICTURE * picture,
-                           int width,
-                           int height)
  {
-         uint32_t stride2 = stride >> 1;
+         int32_t i;
-         uint32_t width2 = width >> 1;
-         uint32_t y;
-         uint8_t *src;
-         src = picture->y;
-         for (y = height; y; y--) {
-                 memcpy(y_out, src, width);
-                 src += picture->stride_y;
-                 y_out += stride;
-         }
-         src = picture->u;
-         for (y = height >> 1; y; y--) {
-                 memcpy(u_out, src, width2);
-                 src += picture->stride_uv;
-                 u_out += stride2;
-         }
-         src = picture->v;
+         for (i = 0; i < 256; i++) {
-         for (y = height >> 1; y; y--) {
+                 RGB_Y_tab[i] = FIX_OUT(RGB_Y_OUT) * (i - Y_ADD_OUT);
-                 memcpy(v_out, src, width2);
+                 B_U_tab[i] = FIX_OUT(B_U_OUT) * (i - U_ADD_OUT);
-                 src += picture->stride_uv;
+                 G_U_tab[i] = FIX_OUT(G_U_OUT) * (i - U_ADD_OUT);
-                 v_out += stride2;
+                 G_V_tab[i] = FIX_OUT(G_V_OUT) * (i - V_ADD_OUT);
+                 R_V_tab[i] = FIX_OUT(R_V_OUT) * (i - V_ADD_OUT);
          }
  }

 Legend:
 - Removed from v.433
   changed lines
 + Added in v.1382

No admin address has been configured	ViewVC Help
Powered by ViewVC 1.0.4