📄 estimation_gmc.c
字号:
/*****************************************************************************
*
* XVID MPEG-4 VIDEO CODEC
* - Global Motion Estimation -
*
* Copyright(C) 2003 Christoph Lampert <gruel@web.de>
*
* This program is free software ; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation ; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY ; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program ; if not, write to the Free Software
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
*
* $Id: estimation_gmc.c,v 1.5 2004/12/05 04:53:01 syskin Exp $
*
****************************************************************************/
#include <assert.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <math.h>
#include "../encoder.h"
#include "../prediction/mbprediction.h"
#include "estimation.h"
#include "motion.h"
#include "sad.h"
#include "gmc.h"
#include "../utils/emms.h"
#include "motion_inlines.h"
static void
CheckCandidate16I(const int x, const int y, SearchData * const data, const unsigned int Direction)
{
int sad;
const uint8_t * Reference;
if ( (x > data->max_dx) || ( x < data->min_dx)
|| (y > data->max_dy) || (y < data->min_dy) ) return;
Reference = GetReference(x, y, data);
sad = sad16(data->Cur, Reference, data->iEdgedWidth, 256*4096);
if (sad < data->iMinSAD[0]) {
data->iMinSAD[0] = sad;
data->currentMV[0].x = x; data->currentMV[0].y = y;
data->dir = Direction;
}
}
static __inline void
GMEanalyzeMB ( const uint8_t * const pCur,
const uint8_t * const pRef,
const uint8_t * const pRefH,
const uint8_t * const pRefV,
const uint8_t * const pRefHV,
const int x,
const int y,
const MBParam * const pParam,
MACROBLOCK * const pMBs,
SearchData * const Data)
{
MACROBLOCK * const pMB = &pMBs[x + y * pParam->mb_width];
Data->iMinSAD[0] = MV_MAX_ERROR;
Data->predMV = get_pmv2(pMBs, pParam->mb_width, 0, x, y, 0);
get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 4,
pParam->width, pParam->height, 16, 1);
Data->Cur = pCur + 16*(x + y * pParam->edged_width);
Data->RefP[0] = pRef + 16*(x + y * pParam->edged_width);
Data->RefP[1] = pRefV + 16*(x + y * pParam->edged_width);
Data->RefP[2] = pRefH + 16*(x + y * pParam->edged_width);
Data->RefP[3] = pRefHV + 16*(x + y * pParam->edged_width);
Data->currentMV[0].x = Data->currentMV[0].y = 0;
CheckCandidate16I(0, 0, Data, 255);
if ( (Data->predMV.x !=0) || (Data->predMV.y != 0) )
CheckCandidate16I(Data->predMV.x, Data->predMV.y, Data, 255);
xvid_me_DiamondSearch(Data->currentMV[0].x, Data->currentMV[0].y, Data, 255, CheckCandidate16I);
xvid_me_SubpelRefine(Data->currentMV[0], Data, CheckCandidate16I, 0);
/* for QPel halfpel positions are worse than in halfpel mode :( */
/* if (Data->qpel) {
Data->currentQMV->x = 2*Data->currentMV->x;
Data->currentQMV->y = 2*Data->currentMV->y;
Data->qpel_precision = 1;
get_range(&Data->min_dx, &Data->max_dx, &Data->min_dy, &Data->max_dy, x, y, 4,
pParam->width, pParam->height, iFcode, 2, 0);
SubpelRefine(Data);
}
*/
pMB->mvs[0] = pMB->mvs[1] = pMB->mvs[2] = pMB->mvs[3] = Data->currentMV[0];
pMB->sad16 = Data->iMinSAD[0];
pMB->mode = MODE_INTER;
pMB->sad16 += 10*d_mv_bits(pMB->mvs[0].x, pMB->mvs[0].y, Data->predMV, Data->iFcode, 0);
return;
}
void
GMEanalysis(const MBParam * const pParam,
const FRAMEINFO * const current,
const FRAMEINFO * const reference,
const IMAGE * const pRefH,
const IMAGE * const pRefV,
const IMAGE * const pRefHV)
{
uint32_t x, y;
MACROBLOCK * const pMBs = current->mbs;
const IMAGE * const pCurrent = ¤t->image;
const IMAGE * const pReference = &reference->image;
SearchData Data;
memset(&Data, 0, sizeof(SearchData));
Data.iEdgedWidth = pParam->edged_width;
Data.rounding = pParam->m_rounding_type;
Data.iFcode = current->fcode;
if (sadInit) (*sadInit) ();
for (y = 0; y < pParam->mb_height; y ++) {
for (x = 0; x < pParam->mb_width; x ++) {
GMEanalyzeMB(pCurrent->y, pReference->y, pRefH->y, pRefV->y, pRefHV->y, x, y, pParam, pMBs, &Data);
}
}
return;
}
WARPPOINTS
GlobalMotionEst(MACROBLOCK * const pMBs,
const MBParam * const pParam,
const FRAMEINFO * const current,
const FRAMEINFO * const reference,
const IMAGE * const pRefH,
const IMAGE * const pRefV,
const IMAGE * const pRefHV)
{
const int deltax=8; /* upper bound for difference between a MV and it's neighbour MVs */
const int deltay=8;
const unsigned int gradx=512; /* lower bound for gradient in MB (ignore "flat" blocks) */
const unsigned int grady=512;
double sol[4] = { 0., 0., 0., 0. };
WARPPOINTS gmc;
uint32_t mx, my;
int MBh = pParam->mb_height;
int MBw = pParam->mb_width;
const int minblocks = 9; /* was = /MBh*MBw/32+3 */ /* just some reasonable number 3% + 3 */
const int maxblocks = MBh*MBw/4; /* just some reasonable number 3% + 3 */
int num=0;
int oldnum;
gmc.duv[0].x = gmc.duv[0].y = gmc.duv[1].x = gmc.duv[1].y = gmc.duv[2].x = gmc.duv[2].y = 0;
GMEanalysis(pParam,current, reference, pRefH, pRefV, pRefHV);
/* block based ME isn't done, yet, so do a quick presearch */
/* filter mask of all blocks */
for (my = 0; my < (uint32_t)MBh; my++)
for (mx = 0; mx < (uint32_t)MBw; mx++)
{
const int mbnum = mx + my * MBw;
pMBs[mbnum].mcsel = 0;
}
for (my = 1; my < (uint32_t)MBh-1; my++) /* ignore boundary blocks */
for (mx = 1; mx < (uint32_t)MBw-1; mx++) /* theirs MVs are often wrong */
{
const int mbnum = mx + my * MBw;
MACROBLOCK *const pMB = &pMBs[mbnum];
const VECTOR mv = pMB->mvs[0];
/* don't use object boundaries */
if ( (abs(mv.x - (pMB-1)->mvs[0].x) < deltax)
&& (abs(mv.y - (pMB-1)->mvs[0].y) < deltay)
&& (abs(mv.x - (pMB+1)->mvs[0].x) < deltax)
&& (abs(mv.y - (pMB+1)->mvs[0].y) < deltay)
&& (abs(mv.x - (pMB-MBw)->mvs[0].x) < deltax)
&& (abs(mv.y - (pMB-MBw)->mvs[0].y) < deltay)
&& (abs(mv.x - (pMB+MBw)->mvs[0].x) < deltax)
&& (abs(mv.y - (pMB+MBw)->mvs[0].y) < deltay) )
{ const int iEdgedWidth = pParam->edged_width;
const uint8_t *const pCur = current->image.y + 16*(my*iEdgedWidth + mx);
if ( (sad16 ( pCur, pCur+1 , iEdgedWidth, 65536) >= gradx )
&& (sad16 ( pCur, pCur+iEdgedWidth, iEdgedWidth, 65536) >= grady ) )
{ pMB->mcsel = 1;
num++;
}
/* only use "structured" blocks */
}
}
emms();
/* further filtering would be possible, but during iteration, remaining
outliers usually are removed, too */
if (num>= minblocks)
do { /* until convergence */
double DtimesF[4];
double a,b,c,n,invdenom;
double meanx,meany;
a = b = c = n = 0;
DtimesF[0] = DtimesF[1] = DtimesF[2] = DtimesF[3] = 0.;
for (my = 1; my < (uint32_t)MBh-1; my++)
for (mx = 1; mx < (uint32_t)MBw-1; mx++)
{
const int mbnum = mx + my * MBw;
const VECTOR mv = pMBs[mbnum].mvs[0];
if (!pMBs[mbnum].mcsel)
continue;
n++;
a += 16*mx+8;
b += 16*my+8;
c += (16*mx+8)*(16*mx+8)+(16*my+8)*(16*my+8);
DtimesF[0] += (double)mv.x;
DtimesF[1] += (double)mv.x*(16*mx+8) + (double)mv.y*(16*my+8);
DtimesF[2] += (double)mv.x*(16*my+8) - (double)mv.y*(16*mx+8);
DtimesF[3] += (double)mv.y;
}
invdenom = a*a+b*b-c*n;
/* Solve the system: sol = (D'*E*D)^{-1} D'*E*F */
/* D'*E*F has been calculated in the same loop as matrix */
sol[0] = -c*DtimesF[0] + a*DtimesF[1] + b*DtimesF[2];
sol[1] = a*DtimesF[0] - n*DtimesF[1] + b*DtimesF[3];
sol[2] = b*DtimesF[0] - n*DtimesF[2] - a*DtimesF[3];
sol[3] = b*DtimesF[1] - a*DtimesF[2] - c*DtimesF[3];
sol[0] /= invdenom;
sol[1] /= invdenom;
sol[2] /= invdenom;
sol[3] /= invdenom;
meanx = meany = 0.;
oldnum = 0;
for (my = 1; my < (uint32_t)MBh-1; my++)
for (mx = 1; mx < (uint32_t)MBw-1; mx++)
{
const int mbnum = mx + my * MBw;
const VECTOR mv = pMBs[mbnum].mvs[0];
if (!pMBs[mbnum].mcsel)
continue;
oldnum++;
meanx += fabs(( sol[0] + (16*mx+8)*sol[1] + (16*my+8)*sol[2] ) - (double)mv.x );
meany += fabs(( sol[3] - (16*mx+8)*sol[2] + (16*my+8)*sol[1] ) - (double)mv.y );
}
if (4*meanx > oldnum) /* better fit than 0.25 (=1/4pel) is useless */
meanx /= oldnum;
else
meanx = 0.25;
if (4*meany > oldnum)
meany /= oldnum;
else
meany = 0.25;
num = 0;
for (my = 0; my < (uint32_t)MBh; my++)
for (mx = 0; mx < (uint32_t)MBw; mx++)
{
const int mbnum = mx + my * MBw;
const VECTOR mv = pMBs[mbnum].mvs[0];
if (!pMBs[mbnum].mcsel)
continue;
if ( ( fabs(( sol[0] + (16*mx+8)*sol[1] + (16*my+8)*sol[2] ) - (double)mv.x ) > meanx )
|| ( fabs(( sol[3] - (16*mx+8)*sol[2] + (16*my+8)*sol[1] ) - (double)mv.y ) > meany ) )
pMBs[mbnum].mcsel=0;
else
num++;
}
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -