You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
765 lines
22 KiB
765 lines
22 KiB
/* File: sv_h263_me4.c */
|
|
/*****************************************************************************
|
|
** Copyright (c) Digital Equipment Corporation, 1995, 1997 **
|
|
** **
|
|
** All Rights Reserved. Unpublished rights reserved under the copyright **
|
|
** laws of the United States. **
|
|
** **
|
|
** The software contained on this media is proprietary to and embodies **
|
|
** the confidential technology of Digital Equipment Corporation. **
|
|
** Possession, use, duplication or dissemination of the software and **
|
|
** media is authorized only pursuant to a valid written license from **
|
|
** Digital Equipment Corporation. **
|
|
** **
|
|
** RESTRICTED RIGHTS LEGEND Use, duplication, or disclosure by the U.S. **
|
|
** Government is subject to restrictions as set forth in Subparagraph **
|
|
** (c)(1)(ii) of DFARS 252.227-7013, or in FAR 52.227-19, as applicable. **
|
|
******************************************************************************/
|
|
|
|
#include "sv_h263.h"
|
|
#include "proto.h"
|
|
#ifndef USE_C
|
|
#include "perr.h"
|
|
#endif
|
|
|
|
#define THREEBYEIGHT .375
|
|
#define THREEBYFOUR .75
|
|
#define MINUSONEBYEIGHT -0.125
|
|
|
|
#define FIVEBY32 0.15625
|
|
#define FIFTEENBY16 0.9375
|
|
#define MINUSTHREEBY32 -0.09375
|
|
|
|
#define SEVENBY16 0.4375
|
|
#define TWENTYONEBY32 0.65625
|
|
|
|
/**********************************************************************
|
|
*
|
|
* Name: MotionEstimation
|
|
* Description: Estimate all motionvectors for one MB
|
|
*
|
|
* Input: pointers to current an previous image,
|
|
* pointers to current slice and current MB
|
|
* Returns:
|
|
* Side effects: motion vector information in MB changed
|
|
*
|
|
***********************************************************************/
|
|
|
|
|
|
void sv_H263ME_2levels_7_pihp(SvH263CompressInfo_t *H263Info,
|
|
unsigned char *curr, unsigned char *prev, int x_curr,
|
|
int y_curr, int xoff, int yoff, int seek_dist,
|
|
H263_MotionVector *MV[6][H263_MBR+1][H263_MBC+2], int *SAD_0)
|
|
{
|
|
|
|
int Min_FRAME[5];
|
|
H263_MotionVector MVFrame[5];
|
|
unsigned char *aa,*ii;
|
|
unsigned char *adv_search_area = NULL, *zero_area = NULL;
|
|
int sxy,i,k,j,l;
|
|
int ihigh,ilow,jhigh,jlow,h_length,v_length;
|
|
int adv_ihigh,adv_ilow,adv_jhigh,adv_jlow,adv_h_length,adv_v_length;
|
|
int xmax,ymax,block,sad,lx;
|
|
int adv_x_curr, adv_y_curr,xvec,yvec;
|
|
|
|
unsigned char *act_block_subs2, *search_area_subs2, *adv_search_area_subs2;
|
|
int h_lenby2,v_lenby2,adv_h_lenby2,adv_v_lenby2;
|
|
int xlevel1,ylevel1,sxylevel1;
|
|
int xlevel1_block[4], ylevel1_block[4];
|
|
/*
|
|
int level0_x_curr,level0_y_curr,sxylevel0;
|
|
*/
|
|
int start_x, start_y, stop_x, stop_y, new_x, new_y;
|
|
int AE[5];
|
|
H263_Point search[5];
|
|
H263_Point half[5];
|
|
int pym1,pxm1,pxp1,pyp1;
|
|
int pym05,pxm05,pxp05,pyp05;
|
|
int AE_minx, AE_miny, min_posx, min_posy, min_hposx, min_hposy;
|
|
|
|
|
|
xmax = H263Info->pels;
|
|
ymax = H263Info->lines;
|
|
sxy = seek_dist;
|
|
if (!H263Info->long_vectors) {
|
|
/* Maximum normal search range centered around _zero-vector_ */
|
|
sxy = mmin(15, sxy);
|
|
}
|
|
else {
|
|
/* Maximum extended search range centered around _predictor_ */
|
|
sxy = mmin(15 - (2*H263_DEF_8X8_WIN+1), sxy);
|
|
|
|
/* NB! */
|
|
|
|
/* It is only possible to transmit motion vectors within
|
|
a 15x15 window around the motion vector predictor
|
|
for any 8x8 or 16x16 block */
|
|
|
|
/* The reason for the search window's reduction above with
|
|
2*DEF_8X8_WIN+1 is that the 8x8 search may change the MV
|
|
predictor for some of the blocks within the macroblock. When we
|
|
impose the limitation above, we are sure that any 8x8 vector we
|
|
might find is possible to transmit */
|
|
|
|
/* We have found that with OBMC, DEF_8X8_WIN should be quite small
|
|
for two reasons: (i) a good filtering effect, and (ii) not too
|
|
many bits used for transferring the vectors. As can be seen
|
|
above this is also useful to avoid a large limitation on the MV
|
|
search range */
|
|
|
|
/* It is possible to make sure the motion vectors found are legal
|
|
in other less limiting ways than above, but this would be more
|
|
complicated as well as time-consuming. Any good suggestions for
|
|
improvement is welcome, though */
|
|
#ifdef USE_C
|
|
xoff = mmin(16,mmax(-16,xoff));
|
|
yoff = mmin(16,mmax(-16,yoff));
|
|
#else
|
|
xoff = sv_H263lim_S(xoff,-16,16);
|
|
yoff = sv_H263lim_S(yoff,-16,16);
|
|
#endif
|
|
|
|
/* in case xoff or yoff is odd */
|
|
xoff= 2 * ((xoff)>>1);
|
|
yoff= 2 * ((yoff)>>1);
|
|
|
|
/* There is no need to check if (xoff + x_curr) points outside
|
|
the picture, since the Extended Motion Vector Range is
|
|
always used together with the Unrestricted MV mode */
|
|
}
|
|
|
|
|
|
lx = (H263Info->mv_outside_frame ? H263Info->pels + (H263Info->long_vectors?64:32) : H263Info->pels);
|
|
|
|
ilow = x_curr + xoff - sxy;
|
|
ihigh = x_curr + xoff + sxy;
|
|
|
|
jlow = y_curr + yoff - sxy;
|
|
jhigh = y_curr + yoff + sxy;
|
|
|
|
if (!H263Info->mv_outside_frame) {
|
|
if (ilow<0) ilow = 0;
|
|
if (ihigh>xmax-16) ihigh = xmax-16;
|
|
if (jlow<0) jlow = 0;
|
|
if (jhigh>ymax-16) jhigh = ymax-16;
|
|
}
|
|
|
|
h_length = ihigh - ilow + 16;
|
|
v_length = jhigh - jlow + 16;
|
|
|
|
/* subsampled version for ME level 1 */
|
|
h_lenby2 = (h_length-1)>>1;
|
|
v_lenby2 = (v_length-1)>>1;
|
|
act_block_subs2 = sv_H263LoadSubs2Area(curr, x_curr, y_curr, 8, 8, H263Info->pels);
|
|
search_area_subs2 = sv_H263LoadSubs2Area(prev, ilow, jlow, h_lenby2, v_lenby2, lx);
|
|
|
|
for (k = 0; k < 5; k++) {
|
|
Min_FRAME[k] = INT_MAX;
|
|
MVFrame[k].x = 0;
|
|
MVFrame[k].y = 0;
|
|
MVFrame[k].x_half = 0;
|
|
MVFrame[k].y_half = 0;
|
|
}
|
|
|
|
/* match for zero (or [xoff,yoff]) motion vector on subsampled images */
|
|
ii = search_area_subs2 + ((x_curr+xoff-ilow)>>1) + ((y_curr+yoff-jlow)>>1)*h_lenby2;
|
|
#ifdef USE_C
|
|
Min_FRAME[0] = sv_H263MySADBlock(ii, act_block_subs2, h_lenby2, 8, Min_FRAME[0]);
|
|
#else
|
|
Min_FRAME[0] = sv_H263PError8x8_S(ii,act_block_subs2,h_lenby2,8,Min_FRAME[0]);
|
|
#endif
|
|
|
|
MVFrame[0].x = (short)xoff;
|
|
MVFrame[0].y = (short)yoff;
|
|
|
|
/*** Spiral search (+-7) on subsampled images ***/
|
|
|
|
sxylevel1 = (sxy-1)>>1;
|
|
|
|
for (l = 1; l <= sxylevel1; l++) {
|
|
i = x_curr + xoff - 2*l;
|
|
j = y_curr + yoff - 2*l;
|
|
for (k = 0; k < 8*l; k++) {
|
|
if (i>=ilow && i<=ihigh && j>=jlow && j<=jhigh) {
|
|
|
|
/* 8x8 integer pel MV */
|
|
ii = search_area_subs2 + ((i-ilow)>>1) + ((j-jlow)>>1)*h_lenby2;
|
|
#ifdef USE_C
|
|
sad = sv_H263MySADBlock(ii, act_block_subs2, h_lenby2, 8, Min_FRAME[0]);
|
|
#else
|
|
sad = sv_H263PError8x8_S(ii,act_block_subs2,h_lenby2,8,Min_FRAME[0]);
|
|
#endif
|
|
if (sad < Min_FRAME[0]) {
|
|
MVFrame[0].x = i - x_curr;
|
|
MVFrame[0].y = j - y_curr;
|
|
Min_FRAME[0] = sad;
|
|
}
|
|
|
|
}
|
|
if (k<2*l) i+=2;
|
|
else if (k<4*l) j+=2;
|
|
else if (k<6*l) i-=2;
|
|
else j-=2;
|
|
}
|
|
}
|
|
|
|
/* motion vectors after level1 */
|
|
xlevel1=MVFrame[0].x;
|
|
ylevel1=MVFrame[0].y;
|
|
|
|
/* reset */
|
|
Min_FRAME[0] = INT_MAX;
|
|
MVFrame[0].x = 0;
|
|
MVFrame[0].y = 0;
|
|
|
|
/* Zero vector search*/
|
|
if (x_curr-ilow < 0 || y_curr-jlow < 0 ||
|
|
x_curr-ilow+H263_MB_SIZE > h_length || y_curr-jlow+H263_MB_SIZE > v_length) {
|
|
/* in case the zero vector is outside the loaded area in search_area */
|
|
|
|
zero_area = sv_H263LoadSubs2Area(prev, x_curr, y_curr, 8, 8, lx);
|
|
#ifdef USE_C
|
|
*SAD_0 = 4*sv_H263MySADBlock(zero_area, act_block_subs2, 8, 8, Min_FRAME[0]) -
|
|
H263_PREF_NULL_VEC;
|
|
#else
|
|
*SAD_0 = 4*sv_H263PError8x8_S(zero_area, act_block_subs2, 8, 8, Min_FRAME[0]) -
|
|
H263_PREF_NULL_VEC;
|
|
#endif
|
|
ScFree(zero_area);
|
|
}
|
|
else {
|
|
/* the zero vector is within search_area */
|
|
|
|
ii = search_area_subs2 + ((x_curr-ilow)>>1) + ((y_curr-jlow)>>1)*h_lenby2;
|
|
#ifdef USE_C
|
|
*SAD_0 = 4*sv_H263MySADBlock(ii, act_block_subs2, h_lenby2, 8, Min_FRAME[0]) -
|
|
H263_PREF_NULL_VEC;
|
|
#else
|
|
*SAD_0 = 4*sv_H263PError8x8_S(ii, act_block_subs2, h_lenby2, 8, Min_FRAME[0]) -
|
|
H263_PREF_NULL_VEC;
|
|
#endif
|
|
}
|
|
|
|
/*** +-1 search on full-resolution images done by polynomial interpolation ***/
|
|
|
|
start_x = -1;
|
|
stop_x = 1;
|
|
start_y = -1;
|
|
stop_y = 1;
|
|
|
|
new_x = x_curr + xlevel1;
|
|
new_y = y_curr + ylevel1;
|
|
|
|
/* Make sure that no addressing is outside the frame */
|
|
if (!H263Info->mv_outside_frame) {
|
|
if ((new_x) <= (ilow+1))
|
|
start_x = 0;
|
|
if ((new_y) <= (jlow+1))
|
|
start_y = 0;
|
|
if ((new_x) >= (ihigh-1))
|
|
stop_x = 0;
|
|
if ((new_y) >= (jhigh-1))
|
|
stop_y = 0;
|
|
}
|
|
|
|
/* 1 */
|
|
/* 2 0 3 */
|
|
/* 4 */
|
|
|
|
search[0].x = 0; search[0].y = 0;
|
|
search[1].x = 0; search[1].y = (short)start_y;
|
|
search[2].x = (short)start_x; search[2].y = 0;
|
|
search[3].x = (short)stop_x; search[3].y = 0;
|
|
search[4].x = 0; search[4].y = (short)stop_y;
|
|
|
|
half[0].x = 0; half[0].y = 0;
|
|
half[1].x = 0; half[1].y = (short)start_y;
|
|
half[2].x = (short)start_x; half[2].y = 0;
|
|
half[3].x = (short)stop_x; half[3].y = 0;
|
|
half[4].x = 0; half[4].y = (short)stop_y;
|
|
|
|
for (l = 0; l < 5 ; l++) {
|
|
AE[l] = INT_MAX;
|
|
i = new_x + 2*search[l].x;
|
|
j = new_y + 2*search[l].y;
|
|
/* 8x8 integer pel MV */
|
|
ii = search_area_subs2 + ((i-ilow)>>1) + ((j-jlow)>>1)*h_lenby2;
|
|
#ifdef USE_C
|
|
AE[l] = sv_H263MySADBlock(ii, act_block_subs2, h_lenby2, 8, INT_MAX);
|
|
#else
|
|
AE[l] = sv_H263PEr8_init_S(ii, act_block_subs2, h_lenby2, 8);
|
|
#endif
|
|
}
|
|
|
|
/* 1D polynomial interpolation along x and y respectively */
|
|
|
|
AE_minx = AE[0];
|
|
min_posx = 0;
|
|
min_hposx = 0;
|
|
|
|
pxm1 = (int)(THREEBYEIGHT * (double) AE[2]
|
|
+ THREEBYFOUR * (double) AE[0]
|
|
+ MINUSONEBYEIGHT * (double) AE[3]) ;
|
|
|
|
if (pxm1<AE_minx) {
|
|
AE_minx = pxm1;
|
|
min_posx = 2;
|
|
}
|
|
|
|
pxp1 = (int)(MINUSONEBYEIGHT * (double) AE[2]
|
|
+ THREEBYFOUR * (double) AE[0]
|
|
+ THREEBYEIGHT * (double) AE[3]);
|
|
|
|
if (pxp1<AE_minx) {
|
|
AE_minx = pxp1;
|
|
min_posx = 3;
|
|
}
|
|
|
|
switch(min_posx) {
|
|
|
|
case 0: /* now check +- 1/2 */
|
|
pxm05 = (int)( FIVEBY32 * (double) AE[2]
|
|
+ FIFTEENBY16 * (double) AE[0]
|
|
+ MINUSTHREEBY32 * (double) AE[3]);
|
|
|
|
if (pxm05<AE_minx) {
|
|
AE_minx = pxm05;
|
|
min_hposx = 2;
|
|
}
|
|
|
|
pxp05 = (int)( MINUSTHREEBY32 * (double) AE[2]
|
|
+ FIFTEENBY16 * (double) AE[0]
|
|
+ FIVEBY32 * (double) AE[3]);
|
|
|
|
if (pxp05<AE_minx) {
|
|
AE_minx = pxp05;
|
|
min_hposx = 3;
|
|
}
|
|
break;
|
|
|
|
case 2: /* now check -3/2 -1/2 */
|
|
pxp05 = (int)(FIVEBY32 * AE[2]
|
|
+ FIFTEENBY16 * AE[0]
|
|
+ MINUSTHREEBY32 * AE[3]);
|
|
|
|
if (pxp05<AE_minx) {
|
|
AE_minx = pxp05;
|
|
min_hposx = 3;
|
|
}
|
|
break;
|
|
|
|
case 3: /* now check +1/2 +3/2 */
|
|
pxm05 = (int)( MINUSTHREEBY32 * (double)AE[2]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ FIVEBY32 * (double)AE[3]);
|
|
|
|
if (pxm05<AE_minx) {
|
|
AE_minx = pxm05;
|
|
min_hposx = 2;
|
|
}
|
|
break;
|
|
}
|
|
|
|
/* along y */
|
|
|
|
AE_miny = AE[0];
|
|
min_posy = 0;
|
|
min_hposy = 0;
|
|
|
|
pym1 = (int)(THREEBYEIGHT * (double)AE[1]
|
|
+ THREEBYFOUR * (double)AE[0]
|
|
+ MINUSONEBYEIGHT * (double)AE[4]);
|
|
|
|
if (pym1<AE_miny) {
|
|
AE_miny = pym1;
|
|
min_posy = 1;
|
|
}
|
|
|
|
pyp1 = (int)( MINUSONEBYEIGHT * (double)AE[1]
|
|
+ THREEBYFOUR * (double)AE[0]
|
|
+ THREEBYEIGHT * (double)AE[4]);
|
|
|
|
if (pyp1<AE_miny) {
|
|
AE_miny = pyp1;
|
|
min_posy = 4;
|
|
}
|
|
|
|
switch(min_posy) {
|
|
|
|
case 0: /* +- 1/2 */
|
|
pym05 = (int)( FIVEBY32 * (double)AE[1]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ MINUSTHREEBY32 * (double)AE[4]);
|
|
|
|
if (pym05<AE_miny) {
|
|
AE_miny = pym05;
|
|
min_hposy = 1;
|
|
}
|
|
|
|
pyp05 = (int)(MINUSTHREEBY32 * (double)AE[1]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ FIVEBY32 * (double)AE[4]);
|
|
|
|
if (pyp05<AE_miny) {
|
|
AE_miny = pyp05;
|
|
min_hposy = 4;
|
|
}
|
|
break;
|
|
|
|
case 1: /* -3/2 -1/2 */
|
|
pyp05 = (int)(FIVEBY32 * (double)AE[1]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ MINUSTHREEBY32 * (double)AE[4]);
|
|
|
|
if (pyp05<AE_miny) {
|
|
AE_miny = pyp05;
|
|
min_hposy = 4;
|
|
}
|
|
break;
|
|
|
|
case 4: /* +1/2 +3/2 */
|
|
pym05 = (int)( MINUSTHREEBY32 * (double)AE[1]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ FIVEBY32 * (double)AE[4]);
|
|
|
|
if (pym05<AE_miny) {
|
|
AE_miny = pym05;
|
|
min_hposy = 1;
|
|
}
|
|
break;
|
|
|
|
}
|
|
|
|
/* Store optimal values */
|
|
Min_FRAME[0] = (AE_minx<AE_miny ? 4*AE_minx : 4*AE_miny);
|
|
MVFrame[0].x = new_x + search[min_posx].x - x_curr;
|
|
MVFrame[0].y = new_y + search[min_posy].y - y_curr;
|
|
MVFrame[0].x_half = half[min_hposx].x;
|
|
MVFrame[0].y_half = half[min_hposy].y;
|
|
|
|
if (H263Info->advanced) {
|
|
|
|
/* Center the 8x8 search around the 16x16 vector. This is
|
|
different than in TMN5 where the 8x8 search is also a full
|
|
search. The reasons for this is: (i) it is faster, and (ii) it
|
|
generally gives better results because of a better OBMC
|
|
filtering effect and less bits spent for vectors, and (iii) if
|
|
the Extended MV Range is used, the search range around the
|
|
motion vector predictor will be less limited */
|
|
|
|
xvec = MVFrame[0].x;
|
|
yvec = MVFrame[0].y;
|
|
|
|
if (!H263Info->long_vectors) {
|
|
if (xvec > 15 - H263_DEF_8X8_WIN) { xvec = 15 - H263_DEF_8X8_WIN ;}
|
|
if (yvec > 15 - H263_DEF_8X8_WIN) { yvec = 15 - H263_DEF_8X8_WIN ;}
|
|
|
|
if (xvec < -15 + H263_DEF_8X8_WIN) { xvec = -15 + H263_DEF_8X8_WIN ;}
|
|
if (yvec < -15 + H263_DEF_8X8_WIN) { yvec = -15 + H263_DEF_8X8_WIN ;}
|
|
}
|
|
|
|
adv_x_curr = x_curr + xvec;
|
|
adv_y_curr = y_curr + yvec;
|
|
|
|
sxy = H263_DEF_8X8_WIN;
|
|
|
|
adv_ilow = adv_x_curr - sxy;
|
|
adv_ihigh = adv_x_curr + sxy;
|
|
|
|
adv_jlow = adv_y_curr - sxy;
|
|
adv_jhigh = adv_y_curr + sxy;
|
|
|
|
adv_h_length = adv_ihigh - adv_ilow + 16;
|
|
adv_v_length = adv_jhigh - adv_jlow + 16;
|
|
|
|
/* BUG
|
|
adv_h_lenby2 = (adv_h_length-1)>>1;
|
|
adv_v_lenby2 = (adv_v_length-1)>>1;
|
|
*/
|
|
adv_h_lenby2 = (adv_h_length)>>1;
|
|
adv_v_lenby2 = (adv_v_length)>>1;
|
|
/*
|
|
adv_search_area_subs2 = sv_H263LoadSubs2Area(prev, adv_ilow, adv_jlow,
|
|
adv_h_lenby2, adv_v_lenby2, lx);
|
|
*/
|
|
adv_search_area_subs2 = sv_H263LoadSubs2Area(prev, adv_ilow, adv_jlow,
|
|
adv_h_length, adv_v_length, lx);
|
|
|
|
for (block = 0; block < 4; block++) {
|
|
ii = adv_search_area_subs2 + ((adv_x_curr-adv_ilow)>>1) + ((block&1)<<2) +
|
|
(((adv_y_curr-adv_jlow)>>1) + ((block&2)<<1) )*adv_h_lenby2;
|
|
aa = act_block_subs2 + ((block&1)<<2) + ((block&2)<<1)*8;
|
|
/*
|
|
Min_FRAME[block+1] = sv_H263MySADSubBlock(ii,aa,adv_h_lenby2,Min_FRAME[block+1]);
|
|
*/
|
|
Min_FRAME[block+1] = sv_H263MySADSubBlock(ii,aa,adv_h_length,Min_FRAME[block+1]);
|
|
|
|
MVFrame[block+1].x = MVFrame[0].x;
|
|
MVFrame[block+1].y = MVFrame[0].y;
|
|
}
|
|
|
|
/* Spiral search */
|
|
sxylevel1 = (sxy-1)>>1;
|
|
|
|
for (l = 1; l <= sxylevel1; l++) {
|
|
i = adv_x_curr - 2*l;
|
|
j = adv_y_curr - 2*l;
|
|
for (k = 0; k < 8*l; k++) {
|
|
if (i>=adv_ilow && i<=adv_ihigh && j>=adv_jlow && j<=adv_jhigh) {
|
|
|
|
/* 8x8 integer pel MVs */
|
|
for (block = 0; block < 4; block++) {
|
|
ii = adv_search_area_subs2 + ((i-adv_ilow)>>1) + ((block&1)<<2) +
|
|
(((j-adv_jlow)>>1) + ((block&2)<<1) )*adv_h_lenby2;
|
|
aa = act_block_subs2 + ((block&1)<<2) + ((block&2)<<1)*8;
|
|
/*
|
|
sad = sv_H263MySADSubBlock(ii, aa, adv_h_lenby2, Min_FRAME[block+1]);
|
|
*/
|
|
sad = sv_H263MySADSubBlock(ii, aa, adv_h_length, Min_FRAME[block+1]);
|
|
|
|
if (sad < Min_FRAME[block+1]) {
|
|
MVFrame[block+1].x = i - x_curr;
|
|
MVFrame[block+1].y = j - y_curr;
|
|
Min_FRAME[block+1] = sad;
|
|
}
|
|
}
|
|
|
|
}
|
|
if (k<2*l) i++;
|
|
else if (k<4*l) j++;
|
|
else if (k<6*l) i--;
|
|
else j--;
|
|
}
|
|
}
|
|
|
|
for (block = 0; block < 4; block++) {
|
|
xlevel1_block[block] = MVFrame[block+1].x;
|
|
ylevel1_block[block] = MVFrame[block+1].y;
|
|
|
|
/* reset */
|
|
Min_FRAME[block+1] = INT_MAX;
|
|
MVFrame[block+1].x = 0;
|
|
MVFrame[block+1].y = 0;
|
|
}
|
|
|
|
/* +-1 search on full resolution on full-resolution images */
|
|
/* by polynomial interpolation */
|
|
|
|
for (block = 0; block < 4; block++) {
|
|
start_x = -1;
|
|
stop_x = 1;
|
|
start_y = -1;
|
|
stop_y = 1;
|
|
|
|
adv_x_curr = x_curr + xlevel1_block[block];
|
|
adv_y_curr = y_curr + ylevel1_block[block];
|
|
|
|
/* 1 */
|
|
/* 2 0 3 */
|
|
/* 4 */
|
|
|
|
search[0].x = 0; search[0].y = 0;
|
|
search[1].x = 0; search[1].y = (short)start_y;
|
|
search[2].x = (short)start_x; search[2].y = 0;
|
|
search[3].x = (short)stop_x; search[3].y = 0;
|
|
search[4].x = 0; search[4].y = (short)stop_y;
|
|
|
|
half[0].x = 0; half[0].y = 0;
|
|
half[1].x = 0; half[1].y = (short)start_y;
|
|
half[2].x = (short)start_x; half[2].y = 0;
|
|
half[3].x = (short)stop_x; half[3].y = 0;
|
|
half[4].x = 0; half[4].y = (short)stop_y;
|
|
|
|
for (l = 0; l < 5 ; l++) {
|
|
AE[l] = INT_MAX;
|
|
i = adv_x_curr + 2*search[l].x;
|
|
j = adv_y_curr + 2*search[l].y;
|
|
/* 8x8 integer pel MV */
|
|
ii = adv_search_area_subs2 + ((i-adv_ilow)>>1) + ((block&1)<<2) +
|
|
(((j-adv_jlow)>>1) + ((block&2)<<1) )*adv_h_lenby2;
|
|
aa = act_block_subs2 + ((block&1)<<2) + ((block&2)<<1)*8;
|
|
/*
|
|
AE[l] = sv_H263MySADSubBlock(ii, aa, adv_h_lenby2, INT_MAX);
|
|
*/
|
|
AE[l] = sv_H263MySADSubBlock(ii, aa, adv_h_length, INT_MAX);
|
|
|
|
}
|
|
|
|
/* 1D polynomial interpolation along x and y respectively */
|
|
|
|
AE_minx = AE[0];
|
|
min_posx = 0;
|
|
min_hposx = 0;
|
|
|
|
pxm1 = (int)( THREEBYEIGHT * (double)AE[2]
|
|
+ THREEBYFOUR * (double)AE[0]
|
|
+ MINUSONEBYEIGHT * (double)AE[3]);
|
|
|
|
if (pxm1<AE_minx) {
|
|
AE_minx = pxm1;
|
|
min_posx = 2;
|
|
}
|
|
|
|
pxp1 = (int)( MINUSONEBYEIGHT * (double)AE[2]
|
|
+ THREEBYFOUR * (double)AE[0]
|
|
+ THREEBYEIGHT * (double)AE[3]);
|
|
|
|
if (pxp1<AE_minx) {
|
|
AE_minx = pxp1;
|
|
min_posx = 3;
|
|
}
|
|
|
|
switch(min_posx) {
|
|
|
|
case 0: /* now check +- 1/2 */
|
|
pxm05 = (int) (FIVEBY32 * (double)AE[2]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ MINUSTHREEBY32 * (double)AE[3]);
|
|
|
|
if (pxm05<AE_minx) {
|
|
AE_minx = pxm05;
|
|
min_hposx = 2;
|
|
}
|
|
|
|
pxp05 = (int)(MINUSTHREEBY32 * (double)AE[2]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ FIVEBY32 * (double)AE[3]);
|
|
|
|
if (pxp05<AE_minx) {
|
|
AE_minx = pxp05;
|
|
min_hposx = 3;
|
|
}
|
|
break;
|
|
|
|
case 2: /* now check -3/2 -1/2 */
|
|
pxp05 = (int)( FIVEBY32 * (double)AE[2]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ MINUSTHREEBY32 * (double)AE[3]);
|
|
|
|
if (pxp05<AE_minx) {
|
|
AE_minx = pxp05;
|
|
min_hposx = 3;
|
|
}
|
|
break;
|
|
|
|
case 3: /* now check +1/2 +3/2 */
|
|
pxm05 = (int)(MINUSTHREEBY32 * (double)AE[2]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ FIVEBY32 * (double)AE[3]);
|
|
|
|
if (pxm05<AE_minx) {
|
|
AE_minx = pxm05;
|
|
min_hposx = 2;
|
|
}
|
|
break;
|
|
}
|
|
|
|
/* along y */
|
|
|
|
AE_miny = AE[0];
|
|
min_posy = 0;
|
|
min_hposy = 0;
|
|
|
|
pym1 = (int)(THREEBYEIGHT * (double)AE[1]
|
|
+ THREEBYFOUR * (double)AE[0]
|
|
+ MINUSONEBYEIGHT * (double)AE[4]);
|
|
|
|
if (pym1<AE_miny) {
|
|
AE_miny = pym1;
|
|
min_posy = 1;
|
|
}
|
|
|
|
pyp1 = (int)(MINUSONEBYEIGHT * (double)AE[1] +
|
|
+ THREEBYFOUR * (double)AE[0]
|
|
+ THREEBYEIGHT * (double)AE[4]);
|
|
|
|
if (pyp1<AE_miny) {
|
|
AE_miny = pyp1;
|
|
min_posy = 4;
|
|
}
|
|
|
|
switch(min_posy) {
|
|
|
|
case 0: /* +- 1/2 */
|
|
pym05 = (int)(FIVEBY32 * (double)AE[1]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ MINUSTHREEBY32 * (double)AE[4]);
|
|
|
|
if (pym05<AE_miny) {
|
|
AE_miny = pym05;
|
|
min_hposy = 1;
|
|
}
|
|
|
|
pyp05 = (int)(MINUSTHREEBY32 * (double)AE[1]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ FIVEBY32 * (double)AE[4]);
|
|
|
|
if (pyp05<AE_miny) {
|
|
AE_miny = pyp05;
|
|
min_hposy = 4;
|
|
}
|
|
break;
|
|
|
|
case 1: /* -3/2 -1/2 */
|
|
pyp05 = (int)(FIVEBY32 * (double)AE[1]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ MINUSTHREEBY32 * (double)AE[4]);
|
|
|
|
if (pyp05<AE_miny) {
|
|
AE_miny = pyp05;
|
|
min_hposy = 4;
|
|
}
|
|
break;
|
|
|
|
case 4: /* +1/2 +3/2 */
|
|
pym05 = (int)(MINUSTHREEBY32 * (double)AE[1]
|
|
+ FIFTEENBY16 * (double)AE[0]
|
|
+ FIVEBY32 * (double)AE[4]);
|
|
|
|
if (pym05<AE_miny) {
|
|
AE_miny = pym05;
|
|
min_hposy = 1;
|
|
}
|
|
break;
|
|
|
|
}
|
|
|
|
/* Store optimal values */
|
|
Min_FRAME[block+1] = (AE_minx<AE_miny ? 4*AE_minx : 4*AE_miny);
|
|
MVFrame[block+1].x = adv_x_curr + search[min_posx].x - x_curr;
|
|
MVFrame[block+1].y = adv_y_curr + search[min_posy].y - y_curr;
|
|
MVFrame[block+1].x_half = half[min_hposx].x;
|
|
MVFrame[block+1].y_half = half[min_hposy].y;
|
|
|
|
}
|
|
}
|
|
|
|
i = x_curr/H263_MB_SIZE+1;
|
|
j = y_curr/H263_MB_SIZE+1;
|
|
|
|
if (!H263Info->advanced) {
|
|
MV[0][j][i]->x = MVFrame[0].x;
|
|
MV[0][j][i]->y = MVFrame[0].y;
|
|
MV[0][j][i]->x_half = MVFrame[0].x_half;
|
|
MV[0][j][i]->y_half = MVFrame[0].y_half;
|
|
MV[0][j][i]->min_error = (short)Min_FRAME[0];
|
|
}
|
|
else {
|
|
for (k = 0; k < 5; k++) {
|
|
MV[k][j][i]->x = MVFrame[k].x;
|
|
MV[k][j][i]->y = MVFrame[k].y;
|
|
MV[k][j][i]->x_half = MVFrame[k].x_half;
|
|
MV[k][j][i]->y_half = MVFrame[k].y_half;
|
|
MV[k][j][i]->min_error = (short)Min_FRAME[k];
|
|
}
|
|
}
|
|
|
|
ScFree(act_block_subs2);
|
|
ScFree(search_area_subs2);
|
|
|
|
if (H263Info->advanced)
|
|
ScFree(adv_search_area);
|
|
return;
|
|
}
|
|
|
|
|