📄 fast_me.c
字号:
best_x = cand_x;
best_y = cand_y;
}
iXMinNow = best_x;
iYMinNow = best_y;
for (m = 0; m < 4; m++)
{
cand_x = iXMinNow + Diamond_x[m];
cand_y = iYMinNow + Diamond_y[m];
SEARCH_ONE_PIXEL
}
if(center_x != pic_pix_x || center_y != pic_pix_y)
{
cand_x = pic_pix_x ;
cand_y = pic_pix_y ;
SEARCH_ONE_PIXEL
iXMinNow = best_x;
iYMinNow = best_y;
for (m = 0; m < 4; m++)
{
cand_x = iXMinNow + Diamond_x[m];
cand_y = iYMinNow + Diamond_y[m];
SEARCH_ONE_PIXEL
}
}
if(blocktype>1)
{
cand_x = pic_pix_x + (pred_MV_uplayer[0]/4);
cand_y = pic_pix_y + (pred_MV_uplayer[1]/4);
SEARCH_ONE_PIXEL
if ((min_mcost-pred_SAD_uplayer)<pred_SAD_uplayer*betaThird)
goto third_step;
else if((min_mcost-pred_SAD_uplayer)<pred_SAD_uplayer*betaSec)
goto sec_step;
}
//prediction using the motion vector of the last reference
if (img->field_picture)
{
if ((list==0 && ref>1) || (img->type == B_SLICE && list == 0 && (ref==0 ||ref==1 ) ))
//Notes: for interlace case, ref==1 should be added
{
cand_x = pic_pix_x + pred_MV_ref[0]/4;
cand_y = pic_pix_y + pred_MV_ref[1]/4;
SEARCH_ONE_PIXEL
}
}
else
{
if ((list==0 && ref > 0) || (img->type == B_SLICE && list == 0 && ref==0 ))
//Notes: for interlace case, ref==1 should be added
{
cand_x = pic_pix_x + pred_MV_ref[0]/4;
cand_y = pic_pix_y + pred_MV_ref[1]/4;
SEARCH_ONE_PIXEL
}
}
//small local search
iXMinNow = best_x;
iYMinNow = best_y;
for (m = 0; m < 4; m++)
{
cand_x = iXMinNow + Diamond_x[m];
cand_y = iYMinNow + Diamond_y[m];
SEARCH_ONE_PIXEL
}
//early termination algorithm, refer to JVT-G016
EARLY_TERMINATION
if(blocktype>6)
goto sec_step;
else
goto first_step;
first_step: //Unsymmetrical-cross search
iXMinNow = best_x;
iYMinNow = best_y;
for(i=1;i<=search_range/2;i++)
{
search_step = 2*i - 1;
cand_x = iXMinNow + search_step;
cand_y = iYMinNow ;
SEARCH_ONE_PIXEL
cand_x = iXMinNow - search_step;
cand_y = iYMinNow ;
SEARCH_ONE_PIXEL
}
for(i=1;i<=search_range/4;i++)
{
search_step = 2*i - 1;
cand_x = iXMinNow ;
cand_y = iYMinNow + search_step;
SEARCH_ONE_PIXEL
cand_x = iXMinNow ;
cand_y = iYMinNow - search_step;
SEARCH_ONE_PIXEL
}
//early termination algorithm, refer to JVT-G016
EARLY_TERMINATION
iXMinNow = best_x;
iYMinNow = best_y;
// Uneven Multi-Hexagon-grid Search
for(pos=1;pos<25;pos++)
{
cand_x = iXMinNow + spiral_search_x[pos];
cand_y = iYMinNow + spiral_search_y[pos];
SEARCH_ONE_PIXEL
}
//early termination alogrithm, refer to JVT-G016
for(i=1;i<=search_range/4; i++)
{
for (m = 0; m < 16; m++)
{
cand_x = iXMinNow + Big_Hexagon_x[m]*i;
cand_y = iYMinNow + Big_Hexagon_y[m]*i;
SEARCH_ONE_PIXEL1(1)
}
}
sec_step: //Extended Hexagon-based Search
iXMinNow = best_x;
iYMinNow = best_y;
for(i=0;i<search_range;i++)
{
iAbort = 1;
for (m = 0; m < 6; m++)
{
cand_x = iXMinNow + Hexagon_x[m];
cand_y = iYMinNow + Hexagon_y[m];
SEARCH_ONE_PIXEL1(0)
}
if(iAbort)
break;
iXMinNow = best_x;
iYMinNow = best_y;
}
third_step: // the third step with a small search pattern
iXMinNow = best_x;
iYMinNow = best_y;
for(i=0;i<search_range;i++)
{
iAbort = 1;
for (m = 0; m < 4; m++)
{
cand_x = iXMinNow + Diamond_x[m];
cand_y = iYMinNow + Diamond_y[m];
SEARCH_ONE_PIXEL1(0)
}
if(iAbort)
break;
iXMinNow = best_x;
iYMinNow = best_y;
}
*mv_x = best_x - pic_pix_x;
*mv_y = best_y - pic_pix_y;
return min_mcost;
}
/*!
************************************************************************
* \brief
* Functions for fast fractional pel motion estimation.
* 1. int AddUpSADQuarter() returns the SATD of a fractional-pel MV
* 2. int FastSubPelBlockMotionSearch() performs the fast fractional-pel ME
* \authors
* Zhibo Chen
* Dept.of EE, Tsinghua Univ.
* \date
* 2003.4
************************************************************************
*/
/*!
 ************************************************************************
 * \brief
 *    Accumulates the matching cost of one candidate vector, walking the
 *    block in 4x4 sub-blocks.
 *
 *    For each 4x4 sub-block the 16 differences between the original
 *    samples (orig_pic) and the reference samples are collected. The
 *    reference samples are fetched through get_line() at coordinates
 *    (4*x + cand_mv_x, 4*y + cand_mv_y) and read with a stride of 4, and
 *    consecutive rows are 4 apart in the reference y coordinate
 *    (presumably a 4x upsampled plane addressed in quarter-sample
 *    units -- confirm against the caller).
 *
 *    - useABT == 0: SATD() of every 4x4 difference block is added to the
 *      running cost; the walk stops as soon as the cost exceeds
 *      min_mcost.
 *    - useABT != 0: the differences are only stored, as 8x8 tiles of 64
 *      ints each, and find_SATD() is evaluated once at the end. No early
 *      stop happens in this mode.
 *
 * \param pic_pix_x, pic_pix_y
 *    Not read by this function.
 * \param blocksize_x, blocksize_y
 *    Block dimensions in samples; traversed in steps of 4.
 * \param cand_mv_x, cand_mv_y
 *    Offsets added to 4*x / 4*y to form the reference coordinates.
 * \param ref_picture
 *    Reference picture; supplies size_x, size_y and the sample planes
 *    imgY_ups / imgY_ups_w.
 * \param orig_pic
 *    Rows of the original block, indexed [y][x].
 * \param Mvmcost
 *    Initial value of the accumulated cost.
 * \param min_mcost
 *    Threshold for the early stop (non-ABT mode only).
 * \param useABT
 *    Selects the deferred find_SATD() path when non-zero.
 * \param blocktype
 *    Forwarded to find_SATD(); a value of 3 changes the tile offset used
 *    for rows 8 and above from 128 to 64.
 * \return
 *    The accumulated cost. In non-ABT mode this may be a partial sum
 *    that is already larger than min_mcost.
 ************************************************************************
 */
int AddUpSADQuarter(int pic_pix_x,int pic_pix_y,int blocksize_x,int blocksize_y,
int cand_mv_x,int cand_mv_y, StorablePicture *ref_picture, pel_t** orig_pic,
int Mvmcost, int min_mcost,int useABT, int blocktype)
{
  int residual[16];               /* differences of the current 4x4 sub-block */
  int abt_residual[MB_PIXELS];    /* tiled differences for the ABT path       */
  int cost = Mvmcost;
  int stop = 0;
  int blk_x, blk_y;
  int lower_rows_offset = (128 - 64 * (blocktype == 3));
  int ref_width  = ((ref_picture->size_x + 2*IMG_PAD_SIZE - 1)<<2);
  int ref_height = ((ref_picture->size_y + 2*IMG_PAD_SIZE - 1)<<2);
  pel_t **ref_plane;
  int weighting_active = ( (active_pps->weighted_pred_flag && (img->type == P_SLICE || img->type == SP_SLICE)) ||
                           (active_pps->weighted_bipred_idc && (img->type == B_SLICE)));

  /* Search on the weighted plane only when weighting is active for this
     slice type and weighted-reference ME is enabled in the input config. */
  ref_plane = ref_picture->imgY_ups;
  if (weighting_active && input->UseWeightedReferenceME)
  {
    ref_plane = ref_picture->imgY_ups_w;
  }

  for (blk_y = 0; blk_y < blocksize_y && !stop; blk_y += 4)
  {
    int tile_row_base = (blk_y > 7) * lower_rows_offset;
    int ref_y_base    = (blk_y << 2) + cand_mv_y;

    for (blk_x = 0; blk_x < blocksize_x; blk_x += 4)
    {
      int ref_x = (blk_x << 2) + cand_mv_x;
      int row;

      /* Fetch one reference line per row and consume it before asking for
         the next one, exactly in top-to-bottom order. */
      for (row = 0; row < 4; row++)
      {
        int    ref_y = ref_y_base + (row << 2);
        pel_t *src   = orig_pic [blk_y + row];
        pel_t *ref   = get_line (ref_plane, ref_y, ref_x, ref_height, ref_width);
        int   *out   = residual + (row << 2);

        out[0] = src[blk_x    ] - ref[0];
        out[1] = src[blk_x + 1] - ref[4];
        out[2] = src[blk_x + 2] - ref[8];
        out[3] = src[blk_x + 3] - ref[12];
      }

      if (useABT)
      {
        /* Store the 4x4 differences into the tiled buffer: tiles hold 64
           ints with a row stride of 8. */
        int dst_base = (blk_x & 0x7) + (blk_x > 7) * 64 + tile_row_base;
        int src_off  = 0;
        int line;

        for (line = blk_y; line < BLOCK_SIZE + blk_y; line++)
        {
          memcpy(&(abt_residual[dst_base + ((line & 0x7) << 3)]), &residual[src_off], BLOCK_SIZE*sizeof(int));
          src_off += BLOCK_SIZE;
        }
      }
      else
      {
        cost += SATD (residual, input->hadamard);
        if (cost > min_mcost)
        {
          /* Already worse than the best known cost: give up on this candidate. */
          stop = 1;
          break;
        }
      }
    }
  }

  if (useABT)
  {
    cost += find_SATD (abt_residual, blocktype);
  }

  return cost;
}
int // ==> minimum motion cost after search
FastSubPelBlockMotionSearch (pel_t** orig_pic, // <-- original pixel values for the AxB block
short ref, // <-- reference frame (0... or -1 (backward))
int list,
int pic_pix_x, // <-- absolute x-coordinate of regarded AxB block
int pic_pix_y, // <-- absolute y-coordinate of regarded AxB block
int blocktype, // <-- block type (1-16x16 ... 7-4x4)
short pred_mv_x, // <-- motion vector predictor (x) in sub-pel units
short pred_mv_y, // <-- motion vector predictor (y) in sub-pel units
short* mv_x, // <--> in: search center (x) / out: motion vector (x) - in pel units
short* mv_y, // <--> in: search center (y) / out: motion vector (y) - in pel units
int search_pos2, // <-- search positions for half-pel search (default: 9)
int search_pos4, // <-- search positions for quarter-pel search (default: 9)
int min_mcost, // <-- minimum motion cost (cost for center or huge value)
int lambda_factor,
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -