20 |
* along with this program ; if not, write to the Free Software |
* along with this program ; if not, write to the Free Software |
21 |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
22 |
* |
* |
23 |
* $Id: decoder.c,v 1.64 2004-07-26 19:32:28 edgomez Exp $ |
* $Id: decoder.c,v 1.65 2004-08-10 21:58:55 edgomez Exp $ |
24 |
* |
* |
25 |
****************************************************************************/ |
****************************************************************************/ |
26 |
|
|
62 |
#include "image/postprocessing.h" |
#include "image/postprocessing.h" |
63 |
#include "utils/mem_align.h" |
#include "utils/mem_align.h" |
64 |
|
|
|
#ifdef ARCH_IS_IA32 |
|
|
#define interpolate16x16_quarterpel new_interpolate16x16_quarterpel |
|
|
#define interpolate8x8_quarterpel new_interpolate8x8_quarterpel |
|
|
#endif |
|
|
|
|
65 |
static int |
static int |
66 |
decoder_resize(DECODER * dec) |
decoder_resize(DECODER * dec) |
67 |
{ |
{ |
1110 |
|
|
1111 |
if(dec->quarterpel) { |
if(dec->quarterpel) { |
1112 |
if(!direct) { |
if(!direct) { |
1113 |
interpolate16x16_quarterpel(dec->tmp.y, backward.y, dec->qtmp.y, dec->qtmp.y + 64, |
interpolate16x16_add_quarterpel(dec->cur.y, backward.y, dec->qtmp.y, dec->qtmp.y + 64, |
1114 |
dec->qtmp.y + 128, 16*x_pos, 16*y_pos, |
dec->qtmp.y + 128, 16*x_pos, 16*y_pos, |
1115 |
pMB->b_mvs[0].x, pMB->b_mvs[0].y, stride, 0); |
pMB->b_mvs[0].x, pMB->b_mvs[0].y, stride, 0); |
1116 |
} else { |
} else { |
1117 |
interpolate8x8_quarterpel(dec->tmp.y, backward.y, dec->qtmp.y, dec->qtmp.y + 64, |
interpolate8x8_add_quarterpel(dec->cur.y, backward.y, dec->qtmp.y, dec->qtmp.y + 64, |
1118 |
dec->qtmp.y + 128, 16*x_pos, 16*y_pos, |
dec->qtmp.y + 128, 16*x_pos, 16*y_pos, |
1119 |
pMB->b_mvs[0].x, pMB->b_mvs[0].y, stride, 0); |
pMB->b_mvs[0].x, pMB->b_mvs[0].y, stride, 0); |
1120 |
interpolate8x8_quarterpel(dec->tmp.y, backward.y, dec->qtmp.y, dec->qtmp.y + 64, |
interpolate8x8_add_quarterpel(dec->cur.y, backward.y, dec->qtmp.y, dec->qtmp.y + 64, |
1121 |
dec->qtmp.y + 128, 16*x_pos + 8, 16*y_pos, |
dec->qtmp.y + 128, 16*x_pos + 8, 16*y_pos, |
1122 |
pMB->b_mvs[1].x, pMB->b_mvs[1].y, stride, 0); |
pMB->b_mvs[1].x, pMB->b_mvs[1].y, stride, 0); |
1123 |
interpolate8x8_quarterpel(dec->tmp.y, backward.y, dec->qtmp.y, dec->qtmp.y + 64, |
interpolate8x8_add_quarterpel(dec->cur.y, backward.y, dec->qtmp.y, dec->qtmp.y + 64, |
1124 |
dec->qtmp.y + 128, 16*x_pos, 16*y_pos + 8, |
dec->qtmp.y + 128, 16*x_pos, 16*y_pos + 8, |
1125 |
pMB->b_mvs[2].x, pMB->b_mvs[2].y, stride, 0); |
pMB->b_mvs[2].x, pMB->b_mvs[2].y, stride, 0); |
1126 |
interpolate8x8_quarterpel(dec->tmp.y, backward.y, dec->qtmp.y, dec->qtmp.y + 64, |
interpolate8x8_add_quarterpel(dec->cur.y, backward.y, dec->qtmp.y, dec->qtmp.y + 64, |
1127 |
dec->qtmp.y + 128, 16*x_pos + 8, 16*y_pos + 8, |
dec->qtmp.y + 128, 16*x_pos + 8, 16*y_pos + 8, |
1128 |
pMB->b_mvs[3].x, pMB->b_mvs[3].y, stride, 0); |
pMB->b_mvs[3].x, pMB->b_mvs[3].y, stride, 0); |
1129 |
} |
} |
1130 |
} else { |
} else { |
1131 |
interpolate8x8_switch(dec->tmp.y, backward.y, 16 * x_pos, 16 * y_pos, |
interpolate8x8_add_switch(dec->cur.y, backward.y, 16 * x_pos, 16 * y_pos, |
1132 |
pMB->b_mvs[0].x, pMB->b_mvs[0].y, stride, 0); |
pMB->b_mvs[0].x, pMB->b_mvs[0].y, stride, 0); |
1133 |
interpolate8x8_switch(dec->tmp.y, backward.y, 16 * x_pos + 8, |
interpolate8x8_add_switch(dec->cur.y, backward.y, 16 * x_pos + 8, |
1134 |
16 * y_pos, pMB->b_mvs[1].x, pMB->b_mvs[1].y, stride, 0); |
16 * y_pos, pMB->b_mvs[1].x, pMB->b_mvs[1].y, stride, 0); |
1135 |
interpolate8x8_switch(dec->tmp.y, backward.y, 16 * x_pos, |
interpolate8x8_add_switch(dec->cur.y, backward.y, 16 * x_pos, |
1136 |
16 * y_pos + 8, pMB->b_mvs[2].x, pMB->b_mvs[2].y, stride, 0); |
16 * y_pos + 8, pMB->b_mvs[2].x, pMB->b_mvs[2].y, stride, 0); |
1137 |
interpolate8x8_switch(dec->tmp.y, backward.y, 16 * x_pos + 8, |
interpolate8x8_add_switch(dec->cur.y, backward.y, 16 * x_pos + 8, |
1138 |
16 * y_pos + 8, pMB->b_mvs[3].x, pMB->b_mvs[3].y, stride, 0); |
16 * y_pos + 8, pMB->b_mvs[3].x, pMB->b_mvs[3].y, stride, 0); |
1139 |
} |
} |
1140 |
|
|
1141 |
interpolate8x8_switch(dec->tmp.u, backward.u, 8 * x_pos, 8 * y_pos, |
interpolate8x8_add_switch(dec->cur.u, backward.u, 8 * x_pos, 8 * y_pos, |
1142 |
b_uv_dx, b_uv_dy, stride2, 0); |
b_uv_dx, b_uv_dy, stride2, 0); |
1143 |
interpolate8x8_switch(dec->tmp.v, backward.v, 8 * x_pos, 8 * y_pos, |
interpolate8x8_add_switch(dec->cur.v, backward.v, 8 * x_pos, 8 * y_pos, |
1144 |
b_uv_dx, b_uv_dy, stride2, 0); |
b_uv_dx, b_uv_dy, stride2, 0); |
1145 |
|
|
|
interpolate8x8_avg2(dec->cur.y + (16 * y_pos * stride) + 16 * x_pos, |
|
|
dec->cur.y + (16 * y_pos * stride) + 16 * x_pos, |
|
|
dec->tmp.y + (16 * y_pos * stride) + 16 * x_pos, |
|
|
stride, 0, 8); |
|
|
|
|
|
interpolate8x8_avg2(dec->cur.y + (16 * y_pos * stride) + 16 * x_pos + 8, |
|
|
dec->cur.y + (16 * y_pos * stride) + 16 * x_pos + 8, |
|
|
dec->tmp.y + (16 * y_pos * stride) + 16 * x_pos + 8, |
|
|
stride, 0, 8); |
|
|
|
|
|
interpolate8x8_avg2(dec->cur.y + ((16 * y_pos + 8) * stride) + 16 * x_pos, |
|
|
dec->cur.y + ((16 * y_pos + 8) * stride) + 16 * x_pos, |
|
|
dec->tmp.y + ((16 * y_pos + 8) * stride) + 16 * x_pos, |
|
|
stride, 0, 8); |
|
|
|
|
|
interpolate8x8_avg2(dec->cur.y + ((16 * y_pos + 8) * stride) + 16 * x_pos + 8, |
|
|
dec->cur.y + ((16 * y_pos + 8) * stride) + 16 * x_pos + 8, |
|
|
dec->tmp.y + ((16 * y_pos + 8) * stride) + 16 * x_pos + 8, |
|
|
stride, 0, 8); |
|
|
|
|
|
interpolate8x8_avg2(dec->cur.u + (8 * y_pos * stride2) + 8 * x_pos, |
|
|
dec->cur.u + (8 * y_pos * stride2) + 8 * x_pos, |
|
|
dec->tmp.u + (8 * y_pos * stride2) + 8 * x_pos, |
|
|
stride2, 0, 8); |
|
|
|
|
|
interpolate8x8_avg2(dec->cur.v + (8 * y_pos * stride2) + 8 * x_pos, |
|
|
dec->cur.v + (8 * y_pos * stride2) + 8 * x_pos, |
|
|
dec->tmp.v + (8 * y_pos * stride2) + 8 * x_pos, |
|
|
stride2, 0, 8); |
|
|
|
|
1146 |
stop_comp_timer(); |
stop_comp_timer(); |
1147 |
|
|
1148 |
if (cbp) |
if (cbp) |