Diff of /branches/dev-api-4/xvidcore/src/motion/ppc_asm/sad_altivec.c

-revision 98, Wed Apr  3 14:17:05 2002 UTC
+revision 430, Fri Sep  6 16:59:47 2002 UTC
 Line 1
- /*
+ /*****************************************************************************
+  *
+  *  XVID MPEG-4 VIDEO CODEC
+  *  - altivec sum of absolute difference (C version)
+  *
+  *  Copyright (C) 2002 Benjamin Herrenschmidt <benh@kernel.crashing.org>
+  *
+  *  This program is an implementation of a part of one or more MPEG-4
+  *  Video tools as specified in ISO/IEC 14496-2 standard.  Those intending
+  *  to use this software module in hardware or software products are
+  *  advised that its use may infringe existing patents or copyrights, and
+  *  any such use would be at such party's own risk.  The original
+  *  developer of this software module and his/her company, and subsequent
+  *  editors and their companies, will have no liability for use of this
+  *  software or modifications or derivatives thereof.
+  *
+  *  This program is free software; you can redistribute it and/or modify
+  *  it under the terms of the GNU General Public License as published by
+  *  the Free Software Foundation; either version 2 of the License, or
+  *  (at your option) any later version.
+  *
+  *  This program is distributed in the hope that it will be useful,
+  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+  *  GNU General Public License for more details.
+  *
+  *  You should have received a copy of the GNU General Public License
+  *  along with this program; if not, write to the Free Software
+  *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
+  *
+  *  $Id: sad_altivec.c,v 1.4 2002-09-06 16:59:47 chl Exp $
+  *
+  ****************************************************************************/
+ #define G_REG
+ #ifdef G_REG
+ register vector unsigned char perm0 asm("%v29");
+ register vector unsigned char perm1 asm("%v30");
+ register vector unsigned int zerovec asm("%v31");
+ #endif
-     Copyright (C) 2002 Benjamin Herrenschmidt <benh@kernel.crashing.org>
+ #include <stdio.h>
-     This program is free software; you can redistribute it and/or modify
+ #undef DEBUG
-     it under the terms of the GNU General Public License as published by
-     the Free Software Foundation; either version 2 of the License, or
-     (at your option) any later version.
-     This program is distributed in the hope that it will be useful,
-     but WITHOUT ANY WARRANTY; without even the implied warranty of
-     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-     GNU General Public License for more details.
-     You should have received a copy of the GNU General Public License
-     along with this program; if not, write to the Free Software
-     Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
-     $Id: sad_altivec.c,v 1.1 2002-04-03 14:17:05 canard Exp $
-     $Source: /home/xvid/cvs_copy/cvs-server-root/xvid/xvidcore/src/motion/ppc_asm/sad_altivec.c,v $
-     $Date: 2002-04-03 14:17:05 $
-     $Author: canard $
- */
+ static const vector unsigned char perms[2] = {
+         (vector unsigned char) (        /* Used when cur is aligned */
+                 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
+                 0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17),
+         (vector unsigned char) (        /* Used when cur is unaligned */
+                 0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
+                 0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f),
+ };
- #include <stdio.h>
+ #ifdef G_REG
+ void
+ sadInit_altivec(void)
+ {
+         perm0 = perms[0];
+         perm1 = perms[1];
+         zerovec = (vector unsigned int) (0);
+ }
+ static inline const vector unsigned char
+ get_perm(unsigned long i)
+ {
+         return i ? perm1 : perm0;
+ }
+ #define ZERODEF
+ #define ZEROVEC zerovec
+ #else
+ void
+ sadInit_altivec(void)
+ {
+ }
+ static inline const vector unsigned char
+ get_perm(unsigned long i)
+ {
+         return perms[i];
+ }
+ #define ZERODEF vector unsigned int zerovec = (vector unsigned int)(0)
+ #define ZEROVEC zerovec
+ #endif
- #undef DEBUG
  #define SAD16() \
  t1  = vec_perm(ref[0], ref[1], perm);  /* align current vector  */ \
-Line 47
+Line 104
  {
    vector unsigned char perm;
    vector unsigned char t1, t2, t3, t4 ;
-   vector unsigned int sad, zero;
+         vector unsigned int sad;
    vector signed int sumdiffs, best_vec;
    unsigned long result;
+         ZERODEF;
  #ifdef DEBUG
    if (((unsigned long)cur) & 0xf)
          fprintf(stderr, "sad16_altivec:incorrect align, cur: %x\n", cur);
-Line 60
+Line 119
          fprintf(stderr, "sad16_altivec:incorrect align, stride: %x\n", stride);
  #endif
    /* initialization */
-   zero = (vector unsigned int)(0);
+         sad = (vector unsigned int) (ZEROVEC);
-   sad  = (vector unsigned int)(0);
    stride >>= 4;
    perm = vec_lvsl(0, (unsigned char *)ref);
    *((unsigned long *)&best_vec) = best_sad;
-Line 73
+Line 131
    SAD16();
    SAD16();
    /* Temp sum for exit */
-   sumdiffs = vec_sums((vector signed int) sad, (vector signed int) zero);
+         sumdiffs = vec_sums((vector signed int) sad, (vector signed int) ZEROVEC);
    if (vec_all_ge(sumdiffs, best_vec))
          goto bail;
    SAD16();
    SAD16();
    SAD16();
    SAD16();
-   sumdiffs = vec_sums((vector signed int) sad, (vector signed int) zero);
+         sumdiffs = vec_sums((vector signed int) sad, (vector signed int) ZEROVEC);
    if (vec_all_ge(sumdiffs, best_vec))
          goto bail;
    SAD16();
-Line 93
+Line 151
    SAD16();
    /* sum all parts of difference into one 32 bit quantity */
-   sumdiffs = vec_sums((vector signed int) sad, (vector signed int) zero);
+         sumdiffs = vec_sums((vector signed int) sad, (vector signed int) ZEROVEC);
  bail:
    /* copy vector sum into unaligned result */
    sumdiffs = vec_splat( sumdiffs, 3 );
-Line 112
+Line 170
  sad = vec_sum4s(t5, sad);                /* accumulate sum of differences */ \
  cur += stride<<1; ref += stride<<1;
- static const vector unsigned char perms[2] = {
-         (vector unsigned char)( /* Used when cur is aligned */
-                 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
-                 0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17
-         ),
-         (vector unsigned char)( /* Used when cur is unaligned */
-                 0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
-                 0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f
-         ),
- };
  /*
   * This function assumes cur is 8 bytes aligned, stride is 16 bytes
   * aligned and ref is unaligned
-Line 133
+Line 180
                  unsigned long stride)
  {
    vector unsigned char t1, t2, t3, t4, t5, tp ;
-   vector unsigned int sad, zero;
+         vector unsigned int sad;
    vector signed int sumdiffs;
    vector unsigned char perm_cur;
    vector unsigned char perm_ref1, perm_ref2;
    unsigned long result;
+         ZERODEF;
  #ifdef DEBUG
    if (((unsigned long)cur) & 0x7)
          fprintf(stderr, "sad8_altivec:incorrect align, cur: %x\n", cur);
-Line 148
+Line 197
          fprintf(stderr, "sad8_altivec:incorrect align, stride: %x\n", stride);
  #endif
-   perm_cur = perms[(((unsigned long)cur)>>3) & 0x01];
+         perm_cur = get_perm((((unsigned long) cur) >> 3) & 0x01);
    perm_ref1 = vec_lvsl(0, (unsigned char *)ref);
-   perm_ref2 = perms[0];
+         perm_ref2 = get_perm(0);
    /* initialization */
-   zero = (vector unsigned int)(0);
+         sad = (vector unsigned int) (ZEROVEC);
-   sad  = (vector unsigned int)(0);
    stride >>= 4;
    /* perform sum of differences between current and previous */
-Line 164
+Line 212
    SAD8();
    /* sum all parts of difference into one 32 bit quantity */
-   sumdiffs = vec_sums((vector signed int) sad, (vector signed int) zero);
+         sumdiffs = vec_sums((vector signed int) sad, (vector signed int) ZEROVEC);
    /* copy vector sum into unaligned result */
    sumdiffs = vec_splat( sumdiffs, 3 );
-Line 188
+Line 236
                  unsigned long stride)
  {
    vector unsigned char t2,t3,t4, mn;
-   vector unsigned int mean, dev, zero;
+         vector unsigned int mean, dev;
    vector signed int sumdiffs;
-   vector unsigned char c0,c1,c2,c3,c4,c5,c6,c7,c8,c9,c10,c11,c12,c13,c14,c15;
+         vector unsigned char c0, c1, c2, c3, c4, c5, c6, c7, c8, c9, c10, c11, c12,
+                 c13, c14, c15;
    unsigned long result;
-   zero = (vector unsigned int)(0);
+         ZERODEF;
-   mean = (vector unsigned int)(0);
-   dev = (vector unsigned int)(0);
+         mean = (vector unsigned int) (ZEROVEC);
+         dev = (vector unsigned int) (ZEROVEC);
    stride >>= 4;
    MEAN16(0);
-Line 215
+Line 265
    MEAN16(14);
    MEAN16(15);
-   sumdiffs = vec_sums((vector signed int) mean, (vector signed int) zero);
+         sumdiffs = vec_sums((vector signed int) mean, (vector signed int) ZEROVEC);
-   mn = vec_perm((vector unsigned char)sumdiffs, (vector unsigned char)sumdiffs,
+         mn = vec_perm((vector unsigned char) sumdiffs,
-         (vector unsigned char)(14,14,14,14,14,14,14,14,14,14,14,14,14,14,14,14));
+                                   (vector unsigned char) sumdiffs, (vector unsigned char) (14,
+,
+,
+,
+,
+,
+,
+,
+,
+,
+,
+,
+,
+,
+,
+));
    DEV16(0);
    DEV16(1);
    DEV16(2);
-Line 236
+Line 301
    DEV16(15);
    /* sum all parts of difference into one 32 bit quantity */
-   sumdiffs = vec_sums((vector signed int) dev, (vector signed int) zero);
+         sumdiffs = vec_sums((vector signed int) dev, (vector signed int) ZEROVEC);
    /* copy vector sum into unaligned result */
    sumdiffs = vec_splat( sumdiffs, 3 );

 Legend:



Removed from v.98
 


changed lines


 
Added in v.430
 Legend:



Removed from v.98
 


changed lines


 
Added in v.430
-Removed from v.98
+Added in v.430

No admin address has been configured	ViewVC Help
Powered by ViewVC 1.0.4