Diff of /trunk/xvidcore/src/image/image.c

-revision 851, Sat Feb 15 15:22:19 2003 UTC
+revision 1959, Tue Mar  8 19:18:44 2011 UTC
 Line 1
  /**************************************************************************
   *
   *      XVID MPEG-4 VIDEO CODEC
-  *      image stuff
+  *  - Image management functions -
   *
-  *      This program is an implementation of a part of one or more MPEG-4
+  *  Copyright(C) 2001-2010 Peter Ross <pross@xvid.org>
-  *      Video tools as specified in ISO/IEC 14496-2 standard.  Those intending
-  *      to use this software module in hardware or software products are
-  *      advised that its use may infringe existing patents or copyrights, and
-  *      any such use would be at such party's own risk.  The original
-  *      developer of this software module and his/her company, and subsequent
-  *      editors and their companies, will have no liability for use of this
-  *      software or modifications or derivatives thereof.
   *
   *      This program is free software; you can redistribute it and/or modify
   *      it under the terms of the GNU General Public License as published by
-Line 24
+Line 17
   *
   *      You should have received a copy of the GNU General Public License
   *      along with this program; if not, write to the Free Software
-  *      Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+  *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
   *
-  *************************************************************************/
+  * $Id: image.c,v 1.48 2011-03-08 19:16:32 Isibaar Exp $
- /**************************************************************************
-  *
-  *      History:
   *
-  *  05.10.2002  support for interpolated images in qpel mode - Isibaar
+  ****************************************************************************/
-  *      01.05.2002      BFRAME image-based u,v interpolation
-  *  22.04.2002  added some B-frame support
-  *      14.04.2002      added image_dump_yuvpgm(), added image_mad()
-  *              XVID_CSP_USER input support
-  *  09.04.2002  PSNR calculations - Isibaar
-  *      06.04.2002      removed interlaced edging from U,V blocks (as per spec)
-  *  26.03.2002  interlacing support (field-based edging in set_edges)
-  *      26.01.2002      rgb555, rgb565
-  *      07.01.2001      commented u,v interpolation (not required for uv-block-based)
-  *  23.12.2001  removed #ifdefs, added function pointers + init_common()
-  *      22.12.2001      cpu #ifdefs
-  *  19.12.2001  image_dump(); useful for debugging
-  *       6.12.2001      inital version; (c)2001 peter ross <pross@cs.rmit.edu.au>
-  *
-  *************************************************************************/
  #include <stdlib.h>
- #include <string.h>                             // memcpy, memset
+ #include <string.h>                             /* memcpy, memset */
  #include <math.h>
  #include "../portab.h"
- #include "../global.h"                  // XVID_CSP_XXX's
+ #include "../global.h"                  /* XVID_CSP_XXX's */
- #include "../xvid.h"                    // XVID_CSP_XXX's
+ #include "../xvid.h"                    /* XVID_CSP_XXX's */
  #include "image.h"
  #include "colorspace.h"
  #include "interpolate8x8.h"
- #include "reduced.h"
- #include "../divx4.h"
  #include "../utils/mem_align.h"
+ #include "../motion/sad.h"
+ #include "../utils/emms.h"
- #include "font.h"               // XXX: remove later
+ #include "font.h"               /* XXX: remove later */
  #define SAFETY  64                      /* extra bytes added to the size of each y/u/v plane allocation below */
  #define EDGE_SIZE2  (EDGE_SIZE/2)       /* half of EDGE_SIZE; used for the u/v plane edge offsets */
-Line 76
+Line 49
  {
          const uint32_t edged_width2 = edged_width / 2;
          const uint32_t edged_height2 = edged_height / 2;
-         uint32_t i;
          image->y =
                  xvid_malloc(edged_width * (edged_height + 1) + SAFETY, CACHE_LINE);
          if (image->y == NULL) {
                  return -1;
          }
+         memset(image->y, 0, edged_width * (edged_height + 1) + SAFETY);
-         for (i = 0; i < edged_width * edged_height + SAFETY; i++) {
-                 image->y[i] = 0;
-         }
          image->u = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE);
          if (image->u == NULL) {
                  xvid_free(image->y);
+                 image->y = NULL;
                  return -1;
          }
+         memset(image->u, 0, edged_width2 * edged_height2 + SAFETY);
          image->v = xvid_malloc(edged_width2 * edged_height2 + SAFETY, CACHE_LINE);
          if (image->v == NULL) {
                  xvid_free(image->u);
+                 image->u = NULL;
                  xvid_free(image->y);
+                 image->y = NULL;
                  return -1;
          }
+         memset(image->v, 0, edged_width2 * edged_height2 + SAFETY);
          image->y += EDGE_SIZE * edged_width + EDGE_SIZE;
          image->u += EDGE_SIZE2 * edged_width2 + EDGE_SIZE2;
-Line 118
+Line 93
          if (image->y) {
                  xvid_free(image->y - (EDGE_SIZE * edged_width + EDGE_SIZE));
+                 image->y = NULL;
          }
          if (image->u) {
                  xvid_free(image->u - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2));
+                 image->u = NULL;
          }
          if (image->v) {
                  xvid_free(image->v - (EDGE_SIZE2 * edged_width2 + EDGE_SIZE2));
+                 image->v = NULL;
          }
  }
-Line 132
+Line 110
  image_swap(IMAGE * image1,
                     IMAGE * image2)
  {
-         uint8_t *tmp;
+     SWAP(uint8_t*, image1->y, image2->y);
+     SWAP(uint8_t*, image1->u, image2->u);
-         tmp = image1->y;
+     SWAP(uint8_t*, image1->v, image2->v);
-         image1->y = image2->y;
-         image2->y = tmp;
-         tmp = image1->u;
-         image1->u = image2->u;
-         image2->u = tmp;
-         tmp = image1->v;
-         image1->v = image2->v;
-         image2->v = tmp;
  }
-Line 159
+Line 127
          memcpy(image1->v, image2->v, edged_width * height / 4);
  }
+ /* The setedges bug was present in these BS versions. These are the
+  * bs_version thresholds checked by image_setedges(): width and height are
+  * rounded up to a multiple of 16 only when
+  * SETEDGES_BUG_BEFORE <= bs_version < SETEDGES_BUG_AFTER, or when
+  * bs_version >= SETEDGES_BUG_REFIXED. */
+ #define SETEDGES_BUG_BEFORE             18
+ #define SETEDGES_BUG_AFTER              57
+ #define SETEDGES_BUG_REFIXED            63
  void
  image_setedges(IMAGE * image,
                             uint32_t edged_width,
                             uint32_t edged_height,
                             uint32_t width,
-                            uint32_t height)
+                            uint32_t height,
+                            int bs_version)
  {
          const uint32_t edged_width2 = edged_width / 2;
-         const uint32_t width2 = width / 2;
+         uint32_t width2;
          uint32_t i;
          uint8_t *dst;
          uint8_t *src;
          dst = image->y - (EDGE_SIZE + EDGE_SIZE * edged_width);
          src = image->y;
+         /* According to Clause 7.6.4 of the Standard, padding starts at the width
+          * and height rounded up to multiples of 16 pixels. Old xvid versions did
+          * not respect this. */
+         if (bs_version >= SETEDGES_BUG_BEFORE &&
+                 bs_version <  SETEDGES_BUG_AFTER ||
+                 bs_version >= SETEDGES_BUG_REFIXED) {
+                 width  = (width+15)&~15;
+                 height = (height+15)&~15;
+         }
+         width2 = width/2;
          for (i = 0; i < EDGE_SIZE; i++) {
                  memset(dst, *src, EDGE_SIZE);
                  memcpy(dst + EDGE_SIZE, src, width);
-Line 202
+Line 185
          }
- //U
+         /* U */
          dst = image->u - (EDGE_SIZE2 + EDGE_SIZE2 * edged_width2);
          src = image->u;
-Line 230
+Line 213
          }
- // V
+         /* V */
          dst = image->v - (EDGE_SIZE2 + EDGE_SIZE2 * edged_width2);
          src = image->v;
-Line 258
+Line 241
          }
  }
- // bframe encoding requires image-based u,v interpolation
  void
- image_interpolate(const IMAGE * refn,
+ image_interpolate(const uint8_t * refn,
-                                   IMAGE * refh,
+                                   uint8_t * refh,
-                                   IMAGE * refv,
+                                   uint8_t * refv,
-                                   IMAGE * refhv,
+                                   uint8_t * refhv,
                                    uint32_t edged_width,
                                    uint32_t edged_height,
                                    uint32_t quarterpel,
                                    uint32_t rounding)
  {
-         const uint32_t offset = EDGE_SIZE2 * (edged_width + 1); // we only interpolate half of the edge area
+         const uint32_t offset = EDGE_SIZE2 * (edged_width + 1); /* we only interpolate half of the edge area */
          const uint32_t stride_add = 7 * edged_width;
- /*
- #ifdef BFRAMES
-         const uint32_t edged_width2 = edged_width / 2;
-         const uint32_t edged_height2 = edged_height / 2;
-         const uint32_t offset2 = EDGE_SIZE2 * (edged_width2 + 1);
-         const uint32_t stride_add2 = 7 * edged_width2;
- #endif
- */
-         uint8_t *n_ptr, *h_ptr, *v_ptr, *hv_ptr;
-         uint32_t x, y;
+         uint8_t *n_ptr;
+         uint8_t *h_ptr, *v_ptr, *hv_ptr;
+         uint32_t x, y;
-         n_ptr = refn->y;
+         n_ptr = (uint8_t*)refn;
-         h_ptr = refh->y;
+         h_ptr = refh;
-         v_ptr = refv->y;
+         v_ptr = refv;
-         hv_ptr = refhv->y;
          n_ptr -= offset;
          h_ptr -= offset;
          v_ptr -= offset;
-         hv_ptr -= offset;
+         /* Note: the hv pointer is initialized later, because the code can be
+          * optimized a bit by walking bottom-up in quarterpel mode and top-down
+          * in halfpel mode. */
          if(quarterpel) {
                  for (y = 0; y < (edged_height - EDGE_SIZE); y += 8) {
-Line 314
+Line 289
                          n_ptr += stride_add;
                  }
-                 h_ptr = refh->y;
+                 h_ptr = refh + (edged_height - EDGE_SIZE - EDGE_SIZE2)*edged_width - EDGE_SIZE2;
-                 h_ptr -= offset;
+                 hv_ptr = refhv + (edged_height - EDGE_SIZE - EDGE_SIZE2)*edged_width - EDGE_SIZE2;
                  for (y = 0; y < (edged_height - EDGE_SIZE); y = y + 8) {
+                         hv_ptr -= stride_add;
+                         h_ptr -= stride_add;
+                         hv_ptr -= EDGE_SIZE;
+                         h_ptr -= EDGE_SIZE;
                          for (x = 0; x < (edged_width - EDGE_SIZE); x = x + 8) {
+                                 hv_ptr -= 8;
+                                 h_ptr -= 8;
                                  interpolate8x8_6tap_lowpass_v(hv_ptr, h_ptr, edged_width, rounding);
-                                 hv_ptr += 8;
-                                 h_ptr += 8;
-                         }
-                         hv_ptr += EDGE_SIZE;
-                         h_ptr += EDGE_SIZE;
-                         hv_ptr += stride_add;
-                         h_ptr += stride_add;
                  }
          }
-         else {
+         } else {
+                 hv_ptr = refhv;
+                 hv_ptr -= offset;
                  for (y = 0; y < (edged_height - EDGE_SIZE); y += 8) {
                          for (x = 0; x < (edged_width - EDGE_SIZE); x += 8) {
-Line 356
+Line 332
                          n_ptr += stride_add;
                  }
          }
- /*
- #ifdef BFRAMES
-         n_ptr = refn->u;
-         h_ptr = refh->u;
-         v_ptr = refv->u;
-         hv_ptr = refhv->u;
-         n_ptr -= offset2;
-         h_ptr -= offset2;
-         v_ptr -= offset2;
-         hv_ptr -= offset2;
-         for (y = 0; y < edged_height2; y += 8) {
-                 for (x = 0; x < edged_width2; x += 8) {
-                         interpolate8x8_halfpel_h(h_ptr, n_ptr, edged_width2, rounding);
-                         interpolate8x8_halfpel_v(v_ptr, n_ptr, edged_width2, rounding);
-                         interpolate8x8_halfpel_hv(hv_ptr, n_ptr, edged_width2, rounding);
-                         n_ptr += 8;
-                         h_ptr += 8;
-                         v_ptr += 8;
-                         hv_ptr += 8;
-                 }
-                 h_ptr += stride_add2;
-                 v_ptr += stride_add2;
-                 hv_ptr += stride_add2;
-                 n_ptr += stride_add2;
-         }
-         n_ptr = refn->v;
-         h_ptr = refh->v;
-         v_ptr = refv->v;
-         hv_ptr = refhv->v;
-         n_ptr -= offset2;
-         h_ptr -= offset2;
-         v_ptr -= offset2;
-         hv_ptr -= offset2;
-         for (y = 0; y < edged_height2; y = y + 8) {
-                 for (x = 0; x < edged_width2; x = x + 8) {
-                         interpolate8x8_halfpel_h(h_ptr, n_ptr, edged_width2, rounding);
-                         interpolate8x8_halfpel_v(v_ptr, n_ptr, edged_width2, rounding);
-                         interpolate8x8_halfpel_hv(hv_ptr, n_ptr, edged_width2, rounding);
-                         n_ptr += 8;
-                         h_ptr += 8;
-                         v_ptr += 8;
-                         hv_ptr += 8;
-                 }
-                 h_ptr += stride_add2;
-                 v_ptr += stride_add2;
-                 hv_ptr += stride_add2;
-                 n_ptr += stride_add2;
-         }
- #endif
- */
-         /*
-            interpolate_halfpel_h(
-            refh->y - offset,
-            refn->y - offset,
-            edged_width, edged_height,
-            rounding);
-            interpolate_halfpel_v(
-            refv->y - offset,
-            refn->y - offset,
-            edged_width, edged_height,
-            rounding);
-            interpolate_halfpel_hv(
-            refhv->y - offset,
-            refn->y - offset,
-            edged_width, edged_height,
-            rounding);
-          */
-         /* uv-image-based compensation
-            offset = EDGE_SIZE2 * (edged_width / 2 + 1);
-            interpolate_halfpel_h(
-            refh->u - offset,
-            refn->u - offset,
-            edged_width / 2, edged_height / 2,
-            rounding);
-            interpolate_halfpel_v(
-            refv->u - offset,
-            refn->u - offset,
-            edged_width / 2, edged_height / 2,
-            rounding);
-            interpolate_halfpel_hv(
-            refhv->u - offset,
-            refn->u - offset,
-            edged_width / 2, edged_height / 2,
-            rounding);
-            interpolate_halfpel_h(
-            refh->v - offset,
-            refn->v - offset,
-            edged_width / 2, edged_height / 2,
-            rounding);
-            interpolate_halfpel_v(
-            refv->v - offset,
-            refn->v - offset,
-            edged_width / 2, edged_height / 2,
-            rounding);
-            interpolate_halfpel_hv(
-            refhv->v - offset,
-            refn->v - offset,
-            edged_width / 2, edged_height / 2,
-            rounding);
-          */
  }
-Line 512
+Line 371
  #undef IMG_V
          }
-         DPRINTF(DPRINTF_DEBUG,"chroma_optimized_pixels = %i/%i", pixels, width*height/4);
+         DPRINTF(XVID_DEBUG_DEBUG,"chroma_optimized_pixels = %i/%i\n", pixels, width*height/4);
  }
-Line 530
+Line 389
                                   uint8_t * y_ptr, uint8_t * u_ptr, uint8_t * v_ptr,
                                   int y_stride, int uv_stride,
                                   int width, int height, int vflip,
-                                  packedFunc * func_opt, packedFunc func_c, int size)
+                                  packedFunc * func_opt, packedFunc func_c,
+                  int size, int interlacing)
  {
-         int width_opt, width_c;
+         int width_opt, width_c, height_opt;
+     if (width<0 || width==1 || height==1) return; /* forget about it */
          if (func_opt != func_c && x_stride < size*((width+15)/16)*16)
          {
                  width_opt = width & (~15);
-                 width_c = width - width_opt;
+                 width_c = (width - width_opt) & (~1);
          }
-         else
+         else if (func_opt != func_c && !(width&1) && (size==3))
          {
-                 width_opt = width;
+         /* MMX reads 4 bytes per pixel for RGB/BGR */
+         width_opt = width - 2;
+         width_c = 2;
+     }
+     else {
+         /* Enforce the width to be divisible by two. */
+                 width_opt = width & (~1);
                  width_c = 0;
          }
+     /* packed conversions require height to be divisible by 2
+        (or even by 4 for interlaced conversion) */
+     if (interlacing)
+         height_opt = height & (~3);
+     else
+         height_opt = height & (~1);
          func_opt(x_ptr, x_stride,
                          y_ptr, u_ptr, v_ptr, y_stride, uv_stride,
-                         width_opt, height, vflip);
+                         width_opt, height_opt, vflip);
          if (width_c)
          {
                  func_c(x_ptr + size*width_opt, x_stride,
                          y_ptr + width_opt, u_ptr + width_opt/2, v_ptr + width_opt/2,
-                         y_stride, uv_stride, width_c, height, vflip);
+                         y_stride, uv_stride, width_c, height_opt, vflip);
          }
  }
-Line 564
+Line 439
                          uint32_t width,
                          int height,
                          uint32_t edged_width,
-                         uint8_t * src,
+                         uint8_t * src[4],
-                         int src_stride,
+                         int src_stride[4],
                          int csp,
                          int interlacing)
  {
          const int edged_width2 = edged_width/2;
          const int width2 = width/2;
          const int height2 = height/2;
-         //const int height_signed = (csp & XVID_CSP_VFLIP) ? -height : height;
+ #if 0
+         const int height_signed = (csp & XVID_CSP_VFLIP) ? -height : height;
+ #endif
-         //      int src_stride = width;
-         // --- xvid 2.1 compatiblity patch ---
-         // --- remove when xvid_dec_frame->stride equals real stride
-         /*
-         if ((csp & ~XVID_CSP_VFLIP) == XVID_CSP_RGB555 ||
-                 (csp & ~XVID_CSP_VFLIP) == XVID_CSP_RGB565 ||
-                 (csp & ~XVID_CSP_VFLIP) == XVID_CSP_YUY2 ||
-                 (csp & ~XVID_CSP_VFLIP) == XVID_CSP_YVYU ||
-                 (csp & ~XVID_CSP_VFLIP) == XVID_CSP_UYVY)
-         {
-                 src_stride *= 2;
-         }
-         else if ((csp & ~XVID_CSP_VFLIP) == XVID_CSP_RGB24)
-         {
-                 src_stride *= 3;
-         }
-         else if ((csp & ~XVID_CSP_VFLIP) == XVID_CSP_RGB32 ||
-                 (csp & ~XVID_CSP_VFLIP) == XVID_CSP_ABGR ||
-                 (csp & ~XVID_CSP_VFLIP) == XVID_CSP_RGBA)
-         {
-                 src_stride *= 4;
-         }
-         */
-         // ^--- xvid 2.1 compatiblity fix ---^
          switch (csp & ~XVID_CSP_VFLIP) {
          case XVID_CSP_RGB555:
                  safe_packed_conv(
-                         src, src_stride, image->y, image->u, image->v,
+                         src[0], src_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?rgb555i_to_yv12  :rgb555_to_yv12,
-                         interlacing?rgb555i_to_yv12_c:rgb555_to_yv12_c, 2);
+                         interlacing?rgb555i_to_yv12_c:rgb555_to_yv12_c, 2, interlacing);
                  break;
          case XVID_CSP_RGB565:
                  safe_packed_conv(
-                         src, src_stride, image->y, image->u, image->v,
+                         src[0], src_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?rgb565i_to_yv12  :rgb565_to_yv12,
-                         interlacing?rgb565i_to_yv12_c:rgb565_to_yv12_c, 2);
+                         interlacing?rgb565i_to_yv12_c:rgb565_to_yv12_c, 2, interlacing);
                  break;
-         case XVID_CSP_RGB24:
+         case XVID_CSP_BGR:
                  safe_packed_conv(
-                         src, src_stride, image->y, image->u, image->v,
+                         src[0], src_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?bgri_to_yv12  :bgr_to_yv12,
-                         interlacing?bgri_to_yv12_c:bgr_to_yv12_c, 3);
+                         interlacing?bgri_to_yv12_c:bgr_to_yv12_c, 3, interlacing);
                  break;
-         case XVID_CSP_RGB32:
+         case XVID_CSP_BGRA:
                  safe_packed_conv(
-                         src, src_stride, image->y, image->u, image->v,
+                         src[0], src_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?bgrai_to_yv12  :bgra_to_yv12,
-                         interlacing?bgrai_to_yv12_c:bgra_to_yv12_c, 4);
+                         interlacing?bgrai_to_yv12_c:bgra_to_yv12_c, 4, interlacing);
                  break;
          case XVID_CSP_ABGR :
                  safe_packed_conv(
-                         src, src_stride, image->y, image->u, image->v,
+                         src[0], src_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?abgri_to_yv12  :abgr_to_yv12,
-                         interlacing?abgri_to_yv12_c:abgr_to_yv12_c, 4);
+                         interlacing?abgri_to_yv12_c:abgr_to_yv12_c, 4, interlacing);
+                 break;
+         case XVID_CSP_RGB:
+                 safe_packed_conv(
+                         src[0], src_stride[0], image->y, image->u, image->v,
+                         edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
+                         interlacing?rgbi_to_yv12  :rgb_to_yv12,
+                         interlacing?rgbi_to_yv12_c:rgb_to_yv12_c, 3, interlacing);
                  break;
          case XVID_CSP_RGBA :
                  safe_packed_conv(
-                         src, src_stride, image->y, image->u, image->v,
+                         src[0], src_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?rgbai_to_yv12  :rgba_to_yv12,
-                         interlacing?rgbai_to_yv12_c:rgba_to_yv12_c, 4);
+                         interlacing?rgbai_to_yv12_c:rgba_to_yv12_c, 4, interlacing);
+                 break;
+         case XVID_CSP_ARGB:
+                 safe_packed_conv(
+                         src[0], src_stride[0], image->y, image->u, image->v,
+                         edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
+                         interlacing?argbi_to_yv12  : argb_to_yv12,
+                         interlacing?argbi_to_yv12_c: argb_to_yv12_c, 4, interlacing);
                  break;
          case XVID_CSP_YUY2:
                  safe_packed_conv(
-                         src, src_stride, image->y, image->u, image->v,
+                         src[0], src_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?yuyvi_to_yv12  :yuyv_to_yv12,
-                         interlacing?yuyvi_to_yv12_c:yuyv_to_yv12_c, 2);
+                         interlacing?yuyvi_to_yv12_c:yuyv_to_yv12_c, 2, interlacing);
                  break;
          case XVID_CSP_YVYU:             /* u/v swapped */
                  safe_packed_conv(
-                         src, src_stride, image->y, image->v, image->y,
+                         src[0], src_stride[0], image->y, image->v, image->u,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?yuyvi_to_yv12  :yuyv_to_yv12,
-                         interlacing?yuyvi_to_yv12_c:yuyv_to_yv12_c, 2);
+                         interlacing?yuyvi_to_yv12_c:yuyv_to_yv12_c, 2, interlacing);
                  break;
          case XVID_CSP_UYVY:
                  safe_packed_conv(
-                         src, src_stride, image->y, image->u, image->v,
+                         src[0], src_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?uyvyi_to_yv12  :uyvy_to_yv12,
-                         interlacing?uyvyi_to_yv12_c:uyvy_to_yv12_c, 2);
+                         interlacing?uyvyi_to_yv12_c:uyvy_to_yv12_c, 2, interlacing);
                  break;
-         case XVID_CSP_I420:
+         case XVID_CSP_I420:     /* YCbCr == YUV == internal colorspace for MPEG */
                  yv12_to_yv12(image->y, image->u, image->v, edged_width, edged_width2,
-                         src, src + src_stride*height, src + src_stride*height + (src_stride/2)*height2,
+                         src[0], src[0] + src_stride[0]*height, src[0] + src_stride[0]*height + (src_stride[0]/2)*height2,
-                         src_stride, src_stride/2, width, height, (csp & XVID_CSP_VFLIP));
+                         src_stride[0], src_stride[0]/2, width, height, (csp & XVID_CSP_VFLIP));
-                 break
+                 break;
-                         ;
-         case XVID_CSP_YV12:             /* u/v swapped */
+         case XVID_CSP_YV12: /* YCrCb == YVU == U and V plane swapped */
                  yv12_to_yv12(image->y, image->v, image->u, edged_width, edged_width2,
-                         src, src + src_stride*height, src + src_stride*height + (src_stride/2)*height2,
+                         src[0], src[0] + src_stride[0]*height, src[0] + src_stride[0]*height + (src_stride[0]/2)*height2,
-                         src_stride, src_stride/2, width, height, (csp & XVID_CSP_VFLIP));
+                         src_stride[0], src_stride[0]/2, width, height, (csp & XVID_CSP_VFLIP));
                  break;
-         case XVID_CSP_USER:
+         case XVID_CSP_PLANAR:  /* YCbCr with arbitrary pointers and different strides for Y and UV */
-                 {
-                         DEC_PICTURE * pic = (DEC_PICTURE*)src;
                          yv12_to_yv12(image->y, image->u, image->v, edged_width, edged_width2,
-                                 pic->y, pic->u, pic->v, pic->stride_y, pic->stride_y,
+                         src[0], src[1], src[2], src_stride[0], src_stride[1],  /* v: src_stride[2] not yet supported */
                                  width, height, (csp & XVID_CSP_VFLIP));
-                 }
                  break;
          case XVID_CSP_NULL:
-Line 759
+Line 622
                           uint32_t width,
                           int height,
                           uint32_t edged_width,
-                          uint8_t * dst,
+                          uint8_t * dst[4],
-                          uint32_t dst_stride,
+                          int dst_stride[4],
                           int csp,
                           int interlacing)
  {
-Line 773
+Line 636
          image_dump_yuvpgm(image, edged_width, width, height, "\\decode.pgm");
  */
-         // --- xvid 2.1 compatiblity patch ---
-         // --- remove when xvid_dec_frame->stride equals real stride
-         /*
-         if ((csp & ~XVID_CSP_VFLIP) == XVID_CSP_RGB555 ||
-                 (csp & ~XVID_CSP_VFLIP) == XVID_CSP_RGB565 ||
-                 (csp & ~XVID_CSP_VFLIP) == XVID_CSP_YUY2 ||
-                 (csp & ~XVID_CSP_VFLIP) == XVID_CSP_YVYU ||
-                 (csp & ~XVID_CSP_VFLIP) == XVID_CSP_UYVY)
-         {
-                 dst_stride *= 2;
-         }
-         else if ((csp & ~XVID_CSP_VFLIP) == XVID_CSP_RGB24)
-         {
-                 dst_stride *= 3;
-         }
-         else if ((csp & ~XVID_CSP_VFLIP) == XVID_CSP_RGB32 ||
-                 (csp & ~XVID_CSP_VFLIP) == XVID_CSP_ABGR ||
-                 (csp & ~XVID_CSP_VFLIP) == XVID_CSP_RGBA)
-         {
-                 dst_stride *= 4;
-         }
-         */
-         // ^--- xvid 2.1 compatiblity fix ---^
          switch (csp & ~XVID_CSP_VFLIP) {
          case XVID_CSP_RGB555:
                  safe_packed_conv(
-                         dst, dst_stride, image->y, image->u, image->v,
+                         dst[0], dst_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?yv12_to_rgb555i  :yv12_to_rgb555,
-                         interlacing?yv12_to_rgb555i_c:yv12_to_rgb555_c, 2);
+                         interlacing?yv12_to_rgb555i_c:yv12_to_rgb555_c, 2, interlacing);
                  return 0;
          case XVID_CSP_RGB565:
                  safe_packed_conv(
-                         dst, dst_stride, image->y, image->u, image->v,
+                         dst[0], dst_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?yv12_to_rgb565i  :yv12_to_rgb565,
-                         interlacing?yv12_to_rgb565i_c:yv12_to_rgb565_c, 2);
+                         interlacing?yv12_to_rgb565i_c:yv12_to_rgb565_c, 2, interlacing);
                  return 0;
-         case XVID_CSP_RGB24:
+     case XVID_CSP_BGR:
                  safe_packed_conv(
-                         dst, dst_stride, image->y, image->u, image->v,
+                         dst[0], dst_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?yv12_to_bgri  :yv12_to_bgr,
-                         interlacing?yv12_to_bgri_c:yv12_to_bgr_c, 3);
+                         interlacing?yv12_to_bgri_c:yv12_to_bgr_c, 3, interlacing);
                  return 0;
-         case XVID_CSP_RGB32:
+         case XVID_CSP_BGRA:
                  safe_packed_conv(
-                         dst, dst_stride, image->y, image->u, image->v,
+                         dst[0], dst_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?yv12_to_bgrai  :yv12_to_bgra,
-                         interlacing?yv12_to_bgrai_c:yv12_to_bgra_c, 4);
+                         interlacing?yv12_to_bgrai_c:yv12_to_bgra_c, 4, interlacing);
                  return 0;
          case XVID_CSP_ABGR:
                  safe_packed_conv(
-                         dst, dst_stride, image->y, image->u, image->v,
+                         dst[0], dst_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?yv12_to_abgri  :yv12_to_abgr,
-                         interlacing?yv12_to_abgri_c:yv12_to_abgr_c, 4);
+                         interlacing?yv12_to_abgri_c:yv12_to_abgr_c, 4, interlacing);
+                 return 0;
+         case XVID_CSP_RGB:
+                 safe_packed_conv(
+                         dst[0], dst_stride[0], image->y, image->u, image->v,
+                         edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
+                         interlacing?yv12_to_rgbi  :yv12_to_rgb,
+                         interlacing?yv12_to_rgbi_c:yv12_to_rgb_c, 3, interlacing);
                  return 0;
          case XVID_CSP_RGBA:
                  safe_packed_conv(
-                         dst, dst_stride, image->y, image->u, image->v,
+                         dst[0], dst_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?yv12_to_rgbai  :yv12_to_rgba,
-                         interlacing?yv12_to_rgbai_c:yv12_to_rgba_c, 4);
+                         interlacing?yv12_to_rgbai_c:yv12_to_rgba_c, 4, interlacing);
+                 return 0;
+         case XVID_CSP_ARGB:
+                 safe_packed_conv(
+                         dst[0], dst_stride[0], image->y, image->u, image->v,
+                         edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
+                         interlacing?yv12_to_argbi  :yv12_to_argb,
+                         interlacing?yv12_to_argbi_c:yv12_to_argb_c, 4, interlacing);
                  return 0;
          case XVID_CSP_YUY2:
                  safe_packed_conv(
-                         dst, dst_stride, image->y, image->u, image->v,
+                         dst[0], dst_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?yv12_to_yuyvi  :yv12_to_yuyv,
-                         interlacing?yv12_to_yuyvi_c:yv12_to_yuyv_c, 2);
+                         interlacing?yv12_to_yuyvi_c:yv12_to_yuyv_c, 2, interlacing);
                  return 0;
-         case XVID_CSP_YVYU:             // u,v swapped
+         case XVID_CSP_YVYU:             /* u,v swapped */
                  safe_packed_conv(
-                         dst, dst_stride, image->y, image->v, image->u,
+                         dst[0], dst_stride[0], image->y, image->v, image->u,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?yv12_to_yuyvi  :yv12_to_yuyv,
-                         interlacing?yv12_to_yuyvi_c:yv12_to_yuyv_c, 2);
+                         interlacing?yv12_to_yuyvi_c:yv12_to_yuyv_c, 2, interlacing);
                  return 0;
          case XVID_CSP_UYVY:
                  safe_packed_conv(
-                         dst, dst_stride, image->y, image->u, image->v,
+                         dst[0], dst_stride[0], image->y, image->u, image->v,
                          edged_width, edged_width2, width, height, (csp & XVID_CSP_VFLIP),
                          interlacing?yv12_to_uyvyi  :yv12_to_uyvy,
-                         interlacing?yv12_to_uyvyi_c:yv12_to_uyvy_c, 2);
+                         interlacing?yv12_to_uyvyi_c:yv12_to_uyvy_c, 2, interlacing);
                  return 0;
-         case XVID_CSP_I420:
+         case XVID_CSP_I420: /* YCbCr == YUV == internal colorspace for MPEG */
-                 yv12_to_yv12(dst, dst + dst_stride*height, dst + dst_stride*height + (dst_stride/2)*height2,
+                 yv12_to_yv12(dst[0], dst[0] + dst_stride[0]*height, dst[0] + dst_stride[0]*height + (dst_stride[0]/2)*height2,
-                         dst_stride, dst_stride/2,
+                         dst_stride[0], dst_stride[0]/2,
                          image->y, image->u, image->v, edged_width, edged_width2,
                          width, height, (csp & XVID_CSP_VFLIP));
                  return 0;
-         case XVID_CSP_YV12:             // u,v swapped
+         case XVID_CSP_YV12:     /* YCrCb == YVU == U and V plane swapped */
-                 yv12_to_yv12(dst, dst + dst_stride*height, dst + dst_stride*height + (dst_stride/2)*height2,
+                 yv12_to_yv12(dst[0], dst[0] + dst_stride[0]*height, dst[0] + dst_stride[0]*height + (dst_stride[0]/2)*height2,
-                         dst_stride, dst_stride/2,
+                         dst_stride[0], dst_stride[0]/2,
                          image->y, image->v, image->u, edged_width, edged_width2,
                          width, height, (csp & XVID_CSP_VFLIP));
                  return 0;
-         case XVID_CSP_USER:
+         case XVID_CSP_PLANAR:  /* YCbCr with arbitrary pointers and different strides for Y and UV */
-                 {
+                 yv12_to_yv12(dst[0], dst[1], dst[2],
-                         DEC_PICTURE * pic = (DEC_PICTURE*)dst;
+                         dst_stride[0], dst_stride[1],   /* v: dst_stride[2] not yet supported */
-                         pic->y = image->y;
+                         image->y, image->u, image->v, edged_width, edged_width2,
-                         pic->u = image->u;
+                         width, height, (csp & XVID_CSP_VFLIP));
-                         pic->v = image->v;
+                 return 0;
-                         pic->stride_y = edged_width;
-                         pic->stride_uv = edged_width / 2;
+         case XVID_CSP_INTERNAL :
-                 }
+                 dst[0] = image->y;
+                 dst[1] = image->u;
+                 dst[2] = image->v;
+                 dst_stride[0] = edged_width;
+                 dst_stride[1] = edged_width/2;
+                 dst_stride[2] = edged_width/2;
                  return 0;
          case XVID_CSP_NULL:
-         case XVID_CSP_EXTERN:
+         case XVID_CSP_SLICE:
                  return 0;
          }
-Line 944
+Line 802
          if (sse==0)
                  return 99.99F;
-         return 48.131F - 10*(float)log10((float)sse/(float)(pixels));   // log10(255*255)=4.8131
+         return 48.131F - 10*(float)log10((float)sse/(float)(pixels));   /* log10(255*255)=4.8131 */
  }
-Line 954
+Line 812
                     uint16_t width,
                     uint16_t height)
  {
-         int diff, x, y;
+         int y, bwidth, bheight;
          long sse=0;
-         for (y = 0; y < height; y++) {
+         bwidth  = width  & (~0x07);
+         bheight = height & (~0x07);
+         /* Compute the 8x8 integer part */
+         for (y = 0; y<bheight; y += 8) {
+                 int x;
+                 /* Compute sse for the band */
+                 for (x = 0; x<bwidth; x += 8)
+                         sse += sse8_8bit(orig  + x, recon + x, stride);
+                 /* remaining pixels of the 8 pixels high band */
+                 for (x = bwidth; x < width; x++) {
+                         int diff;
+                         diff = *(orig + 0*stride + x) - *(recon + 0*stride + x);
+                         sse += diff * diff;
+                         diff = *(orig + 1*stride + x) - *(recon + 1*stride + x);
+                         sse += diff * diff;
+                         diff = *(orig + 2*stride + x) - *(recon + 2*stride + x);
+                         sse += diff * diff;
+                         diff = *(orig + 3*stride + x) - *(recon + 3*stride + x);
+                         sse += diff * diff;
+                         diff = *(orig + 4*stride + x) - *(recon + 4*stride + x);
+                         sse += diff * diff;
+                         diff = *(orig + 5*stride + x) - *(recon + 5*stride + x);
+                         sse += diff * diff;
+                         diff = *(orig + 6*stride + x) - *(recon + 6*stride + x);
+                         sse += diff * diff;
+                         diff = *(orig + 7*stride + x) - *(recon + 7*stride + x);
+                         sse += diff * diff;
+                 }
+                 orig  += 8*stride;
+                 recon += 8*stride;
+         }
+         /* Compute the down rectangle sse */
+         for (y = bheight; y < height; y++) {
+                 int x;
                  for (x = 0; x < width; x++) {
+                         int diff;
                          diff = *(orig + x) - *(recon + x);
                          sse += diff * diff;
                  }
                  orig += stride;
                  recon += stride;
          }
-         return sse;
+         return (sse);
  }
- /*
+ void image_block_variance(IMAGE * orig_image,  /* writes rel_var8[0..5] of every macroblock in mbs from the y, u and v planes of orig_image */
+                                           uint16_t stride,  /* row pitch used to address the y plane; stride>>1 is used for the u/v row offsets */
+                                           MACROBLOCK *mbs,  /* macroblock array, indexed as mbs[x + y*mb_width] */
+                                           uint16_t mb_width,  /* number of macroblock columns visited */
+                                           uint16_t mb_height)  /* number of macroblock rows visited */
+ {
+         DECLARE_ALIGNED_MATRIX(sums, 1, 4, uint16_t, CACHE_LINE);  /* 4-entry scratch handed to blocksum8 and read back as sums[0..3] */
+         DECLARE_ALIGNED_MATRIX(squares, 1, 4, uint32_t, CACHE_LINE);  /* 4-entry scratch handed to blocksum8 and read back as squares[0..3] */
+         int x, y, i, j;
+         uint8_t *orig_y = orig_image->y;
+         uint8_t *orig_u = orig_image->u;
+         uint8_t *orig_v = orig_image->v;
+         for (y = 0; y < mb_height; y++) {
+                 for (x = 0; x < mb_width; x++) {
+                         MACROBLOCK *pMB = &mbs[x + y * mb_width];
+                         uint32_t var4[4];
+                         uint32_t sum = 0, square = 0;  /* NOTE(review): accumulated below but never read in this function */
+                         /* four 8x8 luma blocks of the 16x16 macroblock: j = block row, i = block column */
+                         for (j = 0; j < 2; j++) {
+                                 for (i = 0; i < 2; i++) {
+                                         int lsum = blocksum8(orig_y + ((y<<4) + (j<<3))*stride + (x<<4) + (i<<3),  /* presumably returns the pixel sum of the 8x8 block and fills sums[]/squares[] per 4x4 quadrant -- TODO confirm against blocksum8 */
+                                                                                  stride, sums, squares);
+                                         int lsquare = (squares[0] + squares[1] + squares[2] + squares[3])<<6;  /* 64 * (squares[0..3] total) */
+                                         sum += lsum;
+                                         square += lsquare;
+                                         var4[0] = (squares[0]<<4) - sums[0]*sums[0];  /* var4[k] = 16*squares[k] - sums[k]^2 */
+                                         var4[1] = (squares[1]<<4) - sums[1]*sums[1];
+                                         var4[2] = (squares[2]<<4) - sums[2]*sums[2];
+                                         var4[3] = (squares[3]<<4) - sums[3]*sums[3];
+                                         pMB->rel_var8[j*2 + i] = lsquare - lsum*lsum;  /* whole-block term, used as the divisor below */
+                                         if (pMB->rel_var8[j*2 + i])
+                                                 pMB->rel_var8[j*2 + i] = ((var4[0] + var4[1] + var4[2] + var4[3])<<8) /
+                                                                                                  pMB->rel_var8[j*2 + i]; /* 4*(Var(Di)/Var(D)) */
+                                         else
+                                                 pMB->rel_var8[j*2 + i] = 64;  /* whole-block term is zero: skip the division and store 64 */
+                                 }
+                         }
+                         /* 8x8 u block: same computation as for luma, result stored in rel_var8[4] */
+                         {
+                                 int lsum = blocksum8(orig_u + (y<<3)*(stride>>1) + (x<<3),  /* row offset uses the halved pitch stride>>1 */
+                                                                          stride, sums, squares);  /* NOTE(review): full stride is passed here although rows were addressed with stride>>1 -- confirm intended */
+                                 int lsquare = (squares[0] + squares[1] + squares[2] + squares[3])<<6;
+                                 sum += lsum;
+                                 square += lsquare;
+                                 var4[0] = (squares[0]<<4) - sums[0]*sums[0];
+                                 var4[1] = (squares[1]<<4) - sums[1]*sums[1];
+                                 var4[2] = (squares[2]<<4) - sums[2]*sums[2];
+                                 var4[3] = (squares[3]<<4) - sums[3]*sums[3];
+                                 pMB->rel_var8[4] = lsquare - lsum*lsum;
+                                 if (pMB->rel_var8[4])
+                                         pMB->rel_var8[4] = ((var4[0] + var4[1] + var4[2] + var4[3])<<8) /
+                                                                                  pMB->rel_var8[4]; /* 4*(Var(Di)/Var(D)) */
+                                 else
+                                         pMB->rel_var8[4] = 64;  /* zero divisor: store 64 */
+                         }
+                         /* 8x8 v block: same computation as for luma, result stored in rel_var8[5] */
+                         {
+                                 int lsum = blocksum8(orig_v + (y<<3)*(stride>>1) + (x<<3),  /* row offset uses the halved pitch stride>>1 */
+                                                                          stride, sums, squares);  /* NOTE(review): full stride is passed here as well -- confirm intended */
+                                 int lsquare = (squares[0] + squares[1] + squares[2] + squares[3])<<6;
+                                 sum += lsum;
+                                 square += lsquare;
+                                 var4[0] = (squares[0]<<4) - sums[0]*sums[0];
+                                 var4[1] = (squares[1]<<4) - sums[1]*sums[1];
+                                 var4[2] = (squares[2]<<4) - sums[2]*sums[2];
+                                 var4[3] = (squares[3]<<4) - sums[3]*sums[3];
+                                 pMB->rel_var8[5] = lsquare - lsum*lsum;
+                                 if (pMB->rel_var8[5])
+                                         pMB->rel_var8[5] = ((var4[0] + var4[1] + var4[2] + var4[3])<<8) /
+                                                                                  pMB->rel_var8[5]; /* 4*(Var(Di)/Var(D)) */
+                                 else
+                                         pMB->rel_var8[5] = 64;  /* zero divisor: store 64 */
+                         }
+                 }
+         }
+ }
+ #if 0
  #include <stdio.h>
  #include <string.h>
-Line 992
+Line 982
  }
- // dump image+edges to yuv pgm files
+ /* dump image+edges to yuv pgm files */
  int image_dump(IMAGE * image, uint32_t edged_width, uint32_t edged_height, char * path, int number)
  {
-Line 1015
+Line 1005
          return 0;
  }
- */
+ #endif
-Line 1080
+Line 1070
          for (y = 0; y < height; y++)
                  for (x = 0; x < width; x++)
-                         sum += ABS(img1->y[x + y * stride] - img2->y[x + y * stride]);
+                         sum += abs(img1->y[x + y * stride] - img2->y[x + y * stride]);
          for (y = 0; y < height2; y++)
                  for (x = 0; x < width2; x++)
-                         sum += ABS(img1->u[x + y * stride2] - img2->u[x + y * stride2]);
+                         sum += abs(img1->u[x + y * stride2] - img2->u[x + y * stride2]);
          for (y = 0; y < height2; y++)
                  for (x = 0; x < width2; x++)
-                         sum += ABS(img1->v[x + y * stride2] - img2->v[x + y * stride2]);
+                         sum += abs(img1->v[x + y * stride2] - img2->v[x + y * stride2]);
          return (float) sum / (width * height * 3 / 2);
  }
  void
- output_slice(IMAGE * cur, int std, int width, XVID_DEC_PICTURE* out_frm, int mbx, int mby,int mbl) {
+ output_slice(IMAGE * cur, int stride, int width, xvid_image_t* out_frm, int mbx, int mby,int mbl) {  /* copies 16 luma rows and 8 rows each of u and v, starting at macroblock (mbx,mby), from cur into the planes of out_frm */
    uint8_t *dY,*dU,*dV,*sY,*sU,*sV;
-   int std2 = std >> 1;
+   int stride2 = stride >> 1;  /* source row pitch used for the u and v planes */
    int w = mbl << 4, w2,i;  /* w = luma bytes copied per row: mbl macroblocks of 16 pixels */
    if(w > width)  /* never copy more than width bytes per luma row */
      w = width;
    w2 = w >> 1;  /* bytes copied per chroma row */
-   dY = (uint8_t*)out_frm->y + (mby << 4) * out_frm->stride_y + (mbx << 4);
+   dY = (uint8_t*)out_frm->plane[0] + (mby << 4) * out_frm->stride[0] + (mbx << 4);  /* destination: 16 luma rows per macroblock row, 16 luma columns per macroblock */
-   dU = (uint8_t*)out_frm->u + (mby << 3) * out_frm->stride_u + (mbx << 3);
+   dU = (uint8_t*)out_frm->plane[1] + (mby << 3) * out_frm->stride[1] + (mbx << 3);  /* plane[1] receives cur->u; 8 rows/columns per macroblock */
-   dV = (uint8_t*)out_frm->v + (mby << 3) * out_frm->stride_v + (mbx << 3);
+   dV = (uint8_t*)out_frm->plane[2] + (mby << 3) * out_frm->stride[2] + (mbx << 3);  /* plane[2] receives cur->v */
-   sY = cur->y + (mby << 4) * std + (mbx << 4);
+   sY = cur->y + (mby << 4) * stride + (mbx << 4);  /* matching source positions inside cur */
-   sU = cur->u + (mby << 3) * std2 + (mbx << 3);
+   sU = cur->u + (mby << 3) * stride2 + (mbx << 3);
-   sV = cur->v + (mby << 3) * std2 + (mbx << 3);
+   sV = cur->v + (mby << 3) * stride2 + (mbx << 3);
    for(i = 0 ; i < 16 ; i++) {  /* 16 luma rows, each with its own source and destination pitch */
      memcpy(dY,sY,w);
-     dY += out_frm->stride_y;
+     dY += out_frm->stride[0];
-     sY += std;
+     sY += stride;
    }
    for(i = 0 ; i < 8 ; i++) {  /* 8 rows of u */
      memcpy(dU,sU,w2);
-     dU += out_frm->stride_u;
+     dU += out_frm->stride[1];
-     sU += std2;
+     sU += stride2;
    }
    for(i = 0 ; i < 8 ; i++) {  /* 8 rows of v */
      memcpy(dV,sV,w2);
-     dV += out_frm->stride_v;
+     dV += out_frm->stride[2];
-     sV += std2;
+     sV += stride2;
    }
  }
-Line 1154
+Line 1144
          }
  }
+ /****************************************************************************/
- /* reduced resolution deblocking filter
+ static void (*deintl_core)(uint8_t *, int width, int height, const int stride) = 0;  /* deinterlacing routine in use; stays 0 until xvid_image_deinterlace selects one on its first call */
-         block = block size (16=rrv, 8=full resolution)
+ extern void xvid_deinterlace_sse(uint8_t *, int width, int height, const int stride);  /* alternative routine that xvid_image_deinterlace may install in deintl_core */
-         flags = XVID_DEC_YDEBLOCK|XVID_DEC_UVDEBLOCK
- */
- void
- image_deblock_rrv(IMAGE * img, int edged_width,
-                                 const MACROBLOCK * mbs, int mb_width, int mb_height, int mb_stride,
-                                 int block, int flags)
- {
-         const int edged_width2 = edged_width /2;
-         const int nblocks = block / 8;  /* skals code uses 8pixel block uints */
-         int i,j;
-         /* luma: j,i in block units */
+ #define CLIP_255(x)   ( ((x)&~255) ? ((-(x)) >> (8*sizeof((x))-1))&0xff : (x) )  /* clamp x to 0..255: negative -> 0, above 255 -> 255; relies on >> of a negative value being an arithmetic shift */
-         if ((flags & XVID_DEC_DEBLOCKY))
-         {
-                 for (j = 1; j < mb_height*2; j++)               /* horizontal deblocking */
-                 for (i = 0; i < mb_width*2; i++)
-                 {
-                         if (mbs[(j-1)/2*mb_stride + (i/2)].mode != MODE_NOT_CODED ||
-                                 mbs[(j+0)/2*mb_stride + (i/2)].mode != MODE_NOT_CODED)
-                         {
-                                 hfilter_31(img->y + (j*block - 1)*edged_width + i*block,
-                                                                   img->y + (j*block + 0)*edged_width + i*block, nblocks);
-                         }
-                 }
-                 for (j = 0; j < mb_height*2; j++)               /* vertical deblocking */
+ static void deinterlace_c(uint8_t *pix, int width, int height, const int bps)  /* filters rows 1,3,5,... of a width x height plane in place; bps = signed byte distance between consecutive rows */
-                 for (i = 1; i < mb_width*2; i++)
                  {
-                         if (mbs[(j/2)*mb_stride + (i-1)/2].mode != MODE_NOT_CODED ||
+   pix += bps;  /* start on row 1; row 0 is only read */
-                                 mbs[(j/2)*mb_stride + (i+0)/2].mode != MODE_NOT_CODED)
+   while(width-->0)  /* one column per iteration */
                          {
-                                 vfilter_31(img->y + (j*block)*edged_width + i*block - 1,
+     int p1 = pix[-bps];  /* p1 = row directly before the current one */
-                                                    img->y + (j*block)*edged_width + i*block + 0,
+     int p2 = pix[0];  /* p2 = current row, original value */
-                                                    edged_width, nblocks);
+     int p0 = p2;  /* p0 = row two before the current one; none exists yet, so p2 is reused */
+     int j = (height>>1) - 1;  /* rows filtered inside the loop; the last one is handled after it */
+     int V;
+     unsigned char *P = pix++;  /* P walks down this column while pix moves on to the next column */
+     while(j-->0)
+     {
+       const int  p3 = P[  bps];  /* row directly after the current one */
+       const int  p4 = P[2*bps];  /* row two after the current one */
+       V =  ((p1+p3+1)>>1) + ((p2 - ((p0+p4+1)>>1)) >> 2);  /* rounded average of the neighbouring rows plus a quarter of (current - rounded average of the rows two away) */
+       P[0] = CLIP_255( V );
+       p0 = p2;  /* slide the five-row window two rows further */
+       p1 = p3;
+       p2 = p4;
+       P += 2*bps;
                          }
+     V =  ((p1+p1+1)>>1) + ((p2 - ((p0+p2+1)>>1)) >> 2);  /* last filtered row: no rows follow, so p1 stands in for p3 and p2 for p4 */
+     P[0] = CLIP_255( V );
                  }
          }
+ #undef CLIP_255
+ int xvid_image_deinterlace(xvid_image_t* img, int width, int height, int bottom_first)  /* runs the deinterlacing routine in place on plane[0..2] of img; returns 1 when done, 0 when the input is rejected */
-         /* chroma */
-         if ((flags & XVID_DEC_DEBLOCKUV))
-         {
-                 for (j = 1; j < mb_height; j++)         /* horizontal deblocking */
-                 for (i = 0; i < mb_width; i++)
                  {
-                         if (mbs[(j-1)*mb_stride + i].mode != MODE_NOT_CODED ||
+         if (height&1)  /* odd heights are rejected */
-                                 mbs[(j+0)*mb_stride + i].mode != MODE_NOT_CODED)
+                 return 0;
-                         {
+         if (img->csp!=XVID_CSP_PLANAR && img->csp!=XVID_CSP_I420 && img->csp!=XVID_CSP_YV12)
-                                 hfilter_31(img->u + (j*block - 1)*edged_width2 + i*block,
+                 return 0;       /* any csp other than PLANAR, I420 or YV12 is not yet supported */
-                                                    img->u + (j*block + 0)*edged_width2 + i*block, nblocks);
+         if (deintl_core==0) {  /* first call: pick the implementation once and keep it in deintl_core */
-                                 hfilter_31(img->v + (j*block - 1)*edged_width2 + i*block,
+                 deintl_core = deinterlace_c;  /* C version unless replaced below */
-                                                    img->v + (j*block + 0)*edged_width2 + i*block, nblocks);
+ #if defined(ARCH_IS_IA32) || defined(ARCH_IS_X86_64)
-                         }
+                 {
+                         int cpu_flags = check_cpu_features();
+                         if (cpu_flags & XVID_CPU_MMX)  /* NOTE(review): tests the MMX flag but installs the routine named _sse -- confirm which cpu feature that routine really needs */
+                                 deintl_core = xvid_deinterlace_sse;
                  }
+ #endif
-                 for (j = 0; j < mb_height; j++)         /* vertical deblocking */
-                 for (i = 1; i < mb_width; i++)
-                 {
-                         if (mbs[j*mb_stride + i - 1].mode != MODE_NOT_CODED ||
-                                 mbs[j*mb_stride + i + 0].mode != MODE_NOT_CODED)
-                         {
-                                 vfilter_31(img->u + (j*block)*edged_width2 + i*block - 1,
-                                                    img->u + (j*block)*edged_width2 + i*block + 0,
-                                                    edged_width2, nblocks);
-                                 vfilter_31(img->v + (j*block)*edged_width2 + i*block - 1,
-                                                    img->v + (j*block)*edged_width2 + i*block + 0,
-                                                    edged_width2, nblocks);
                          }
+         if (!bottom_first) {  /* walk every plane from its first row using the positive strides */
+                 deintl_core(img->plane[0], width,    height,    img->stride[0]);
+                 deintl_core(img->plane[1], width>>1, height>>1, img->stride[1]);  /* planes 1 and 2 are processed at half width and half height */
+                 deintl_core(img->plane[2], width>>1, height>>1, img->stride[2]);
                  }
+         else {  /* bottom_first: start at the last row of every plane and pass negated strides, so the same routine runs bottom-up */
+                 deintl_core((uint8_t *)img->plane[0] + ( height    -1)*img->stride[0], width,    height,    -img->stride[0]);
+                 deintl_core((uint8_t *)img->plane[1] + ((height>>1)-1)*img->stride[1], width>>1, height>>1, -img->stride[1]);
+                 deintl_core((uint8_t *)img->plane[2] + ((height>>1)-1)*img->stride[2], width>>1, height>>1, -img->stride[2]);
          }
+         emms();  /* called after the core on every path; presumably clears MMX state left by the SIMD routine -- TODO confirm */
+         return 1;
  }

 Legend:



Removed from v.851
 


changed lines


 
Added in v.1959
 Legend:



Removed from v.851
 


changed lines


 
Added in v.1959
-Removed from v.851
+Added in v.1959

No admin address has been configured	ViewVC Help
Powered by ViewVC 1.0.4