Diff of /branches/dev-api-4/xvidcore/src/image/x86_asm/interpolate8x8_mmx.asm

-revision 886, Fri Feb 21 14:49:29 2003 UTC
+revision 1192, Tue Oct 28 22:23:03 2003 UTC
 Line 1
- ;/**************************************************************************
+ ;/*****************************************************************************
  ; *
  ; *     XVID MPEG-4 VIDEO CODEC
- ; *     mmx 8x8 block-based halfpel interpolation
+ ; *  - mmx 8x8 block-based halfpel interpolation -
+ ; *
+ ; *  Copyright(C) 2001 Peter Ross <pross@xvid.org>
+ ; *               2002 Michael Militzer <isibaar@xvid.org>
  ; *
  ; *     This program is free software; you can redistribute it and/or modify
  ; *     it under the terms of the GNU General Public License as published by
-Line 15
+Line 18
  ; *
  ; *     You should have received a copy of the GNU General Public License
  ; *     along with this program; if not, write to the Free Software
- ; *     Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
+ ; *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
  ; *
- ; *************************************************************************/
+ ; ****************************************************************************/
- ;/**************************************************************************
+ BITS 32
- ; *
- ; *     History:
- ; *
- ; * 05.10.2002  added some qpel mmx code - Isibaar
- ; * 06.07.2002  mmx cleanup - Isibaar
- ; *     22.12.2001      inital version; (c)2001 peter ross <pross@cs.rmit.edu.au>
- ; *
- ; *************************************************************************/
- bits 32
  %macro cglobal 1
          %ifdef PREFIX
-Line 41
+Line 33
          %endif
  %endmacro
- section .data
+ ;=============================================================================
+ ; Read only data
+ ;=============================================================================
- align 16
+ SECTION .rodata
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  ; (16 - r) rounding table
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
- rounding_lowpass_mmx
+ ALIGN 16
+ rounding_lowpass_mmx:
  times 4 dw 16
  times 4 dw 15
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  ; (1 - r) rounding table
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
- rounding1_mmx
+ rounding1_mmx:
  times 4 dw 1
  times 4 dw 0
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  ; (2 - r) rounding table
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
- rounding2_mmx
+ rounding2_mmx:
  times 4 dw 2
  times 4 dw 1
- mmx_one
+ mmx_one:
  times 8 db 1
- mmx_two
+ mmx_two:
  times 8 db 2
- mmx_three
+ mmx_three:
  times 8 db 3
- mmx_five
+ mmx_five:
  times 4 dw 5
- mmx_mask
+ mmx_mask:
  times 8 db 254
- mmx_mask2
+ mmx_mask2:
  times 8 db 252
- section .text
+ ;=============================================================================
+ ; Code
+ ;=============================================================================
+ SECTION .text
+ cglobal interpolate8x8_halfpel_h_mmx
+ cglobal interpolate8x8_halfpel_v_mmx
+ cglobal interpolate8x8_halfpel_hv_mmx
+ cglobal interpolate8x8_avg4_mmx
+ cglobal interpolate8x8_avg2_mmx
+ cglobal interpolate8x8_6tap_lowpass_h_mmx
+ cglobal interpolate8x8_6tap_lowpass_v_mmx
  %macro  CALC_AVG 6
          punpcklbw %3, %6
-Line 100
+Line 107
          psrlw %1, 1                     ; mm01 >>= 1
          psrlw %2, 1
  %endmacro
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  ;
  ; void interpolate8x8_halfpel_h_mmx(uint8_t * const dst,
  ;                                               const uint8_t * const src,
  ;                                               const uint32_t stride,
  ;                                               const uint32_t rounding);
  ;
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  %macro COPY_H_MMX 0
                  movq mm0, [esi]
-Line 131
+Line 137
                  add edi, edx            ; dst += stride
  %endmacro
- align 16
+ ALIGN 16
- cglobal interpolate8x8_halfpel_h_mmx
+ interpolate8x8_halfpel_h_mmx:
- interpolate8x8_halfpel_h_mmx
                  push    esi
                  push    edi
                  mov     eax, [esp + 8 + 16]             ; rounding
- interpolate8x8_halfpel_h_mmx.start
                  movq mm7, [rounding1_mmx + eax * 8]
                  mov     edi, [esp + 8 + 4]              ; dst
-Line 164
+Line 167
                  ret
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  ;
  ; void interpolate8x8_halfpel_v_mmx(uint8_t * const dst,
  ;                                               const uint8_t * const src,
  ;                                               const uint32_t stride,
  ;                                               const uint32_t rounding);
  ;
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  %macro COPY_V_MMX 0
                  movq mm0, [esi]
-Line 191
+Line 194
                  add edi, edx            ; dst += stride
  %endmacro
- align 16
+ ALIGN 16
- cglobal interpolate8x8_halfpel_v_mmx
+ interpolate8x8_halfpel_v_mmx:
- interpolate8x8_halfpel_v_mmx
                  push    esi
                  push    edi
                  mov     eax, [esp + 8 + 16]             ; rounding
- interpolate8x8_halfpel_v_mmx.start
                  movq mm7, [rounding1_mmx + eax * 8]
                  mov     edi, [esp + 8 + 4]              ; dst
-Line 225
+Line 226
                  ret
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  ;
  ; void interpolate8x8_halfpel_hv_mmx(uint8_t * const dst,
  ;                                               const uint8_t * const src,
-Line 233
+Line 234
  ;                                               const uint32_t rounding);
  ;
  ;
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  %macro COPY_HV_MMX 0
                  ; current row
                  movq mm0, [esi]
                  movq mm2, [esi + 1]
 Line 253
                  paddusw mm1, mm3
                  ; next row
                  movq mm4, [esi + edx]
                  movq mm2, [esi + edx + 1]
-Line 269
+Line 268
                  paddusw mm5, mm3
                  ; add current + next row
                  paddusw mm0, mm4                ; mm01 += mm45
                  paddusw mm1, mm5
                  paddusw mm0, mm7                ; mm01 += rounding2
-Line 285
+Line 283
                  add edi, edx            ; dst += stride
  %endmacro
- align 16
+ ALIGN 16
- cglobal interpolate8x8_halfpel_hv_mmx
+ interpolate8x8_halfpel_hv_mmx:
- interpolate8x8_halfpel_hv_mmx
                  push    esi
                  push    edi
                  mov     eax, [esp + 8 + 16]             ; rounding
- interpolate8x8_halfpel_hv_mmx.start
                  movq mm7, [rounding2_mmx + eax * 8]
-Line 320
+Line 316
                  ret
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  ;
  ; void interpolate8x8_avg2_mmx(uint8_t const *dst,
  ;                                                          const uint8_t * const src1,
-Line 329
+Line 325
  ;                                                          const uint32_t rounding,
  ;                                                          const uint32_t height);
  ;
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  %macro AVG2_MMX_RND0 0
          movq    mm0, [eax]                      ; src1 -> mm0
-Line 425
+Line 421
          movq    [ecx+edx], mm4
  %endmacro
- align 16
+ ALIGN 16
- cglobal interpolate8x8_avg2_mmx
+ interpolate8x8_avg2_mmx:
- interpolate8x8_avg2_mmx
          push ebx
-Line 496
+Line 491
          ret
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  ;
  ; void interpolate8x8_avg4_mmx(uint8_t const *dst,
  ;                                                          const uint8_t * const src1,
-Line 506
+Line 501
  ;                                                          const uint32_t stride,
  ;                                                          const uint32_t rounding);
  ;
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  %macro AVG4_MMX_RND0 0
          movq    mm0, [eax]                      ; src1 -> mm0
-Line 618
+Line 613
          movq    [ecx], mm0                      ; (src1 + src2 + src3 + src4 + 2) / 4 -> dst
  %endmacro
- align 16
+ ALIGN 16
- cglobal interpolate8x8_avg4_mmx
+ interpolate8x8_avg4_mmx:
- interpolate8x8_avg4_mmx
          push ebx
          push edi
-Line 685
+Line 679
          ret
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  ;
  ; void interpolate8x8_6tap_lowpass_h_mmx(uint8_t const *dst,
  ;                                                                            const uint8_t * const src,
  ;                                                                            const uint32_t stride,
  ;                                                                            const uint32_t rounding);
  ;
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  %macro LOWPASS_6TAP_H_MMX 0
          movq    mm0, [eax]
-Line 763
+Line 757
          movq    [ecx], mm0
  %endmacro
- align 16
+ ALIGN 16
- cglobal interpolate8x8_6tap_lowpass_h_mmx
+ interpolate8x8_6tap_lowpass_h_mmx:
- interpolate8x8_6tap_lowpass_h_mmx
          mov     eax, [esp + 16]                 ; rounding
-Line 795
+Line 788
          ret
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  ;
  ; void interpolate8x8_6tap_lowpass_v_mmx(uint8_t const *dst,
  ;                                                                                const uint8_t * const src,
  ;                                                                                const uint32_t stride,
  ;                                                                            const uint32_t rounding);
  ;
- ;===========================================================================
+ ;-----------------------------------------------------------------------------
  %macro LOWPASS_6TAP_V_MMX 0
          movq    mm0, [eax]
-Line 874
+Line 867
          movq    [ecx], mm0
  %endmacro
- align 16
+ ALIGN 16
- cglobal interpolate8x8_6tap_lowpass_v_mmx
+ interpolate8x8_6tap_lowpass_v_mmx:
- interpolate8x8_6tap_lowpass_v_mmx
          push ebx

 Legend:
-Removed from v.886
 changed lines (shown as a "-" line followed by its "+" replacement)
+Added in v.1192

No admin address has been configured
ViewVC Help
Powered by ViewVC 1.0.4