📄 pixel.c
字号:
return pixel_satd_wxh( pix1, i_stride_pix1, pix2, i_stride_pix2, width, height ); \
}
/* Instantiate one SATD entry point per block size, from 16x16 down to 4x4.
 * As the visible tail of PIXEL_SATD_C shows, each generated function returns
 * pixel_satd_wxh() called with its pixel/stride arguments plus the width and
 * height listed here. */
PIXEL_SATD_C( x264_pixel_satd_16x16, 16, 16 )
PIXEL_SATD_C( x264_pixel_satd_16x8, 16, 8 )
PIXEL_SATD_C( x264_pixel_satd_8x16, 8, 16 )
PIXEL_SATD_C( x264_pixel_satd_8x8, 8, 8 )
PIXEL_SATD_C( x264_pixel_satd_8x4, 8, 4 )
PIXEL_SATD_C( x264_pixel_satd_4x8, 4, 8 )
PIXEL_SATD_C( x264_pixel_satd_4x4, 4, 4 )
/****************************************************************************
* pixel_sa8d_WxH: sum of 8x8 Hadamard transformed differences
****************************************************************************/
/* SA8D_1D: one 8-point, unnormalised Hadamard butterfly pass.
 * The caller supplies SRC(n) to read input n and DST(n, value) to consume
 * output n.  All eight inputs are read into temporaries before the first
 * DST is issued, so SRC and DST may refer to the same storage.
 * The expansion is a single brace-enclosed block (no trailing semicolon). */
#define SA8D_1D {\
    /* stage 1: combine inputs that are four apart */\
    const int s0 = SRC(0) + SRC(4), d0 = SRC(0) - SRC(4);\
    const int s1 = SRC(1) + SRC(5), d1 = SRC(1) - SRC(5);\
    const int s2 = SRC(2) + SRC(6), d2 = SRC(2) - SRC(6);\
    const int s3 = SRC(3) + SRC(7), d3 = SRC(3) - SRC(7);\
    /* stage 2: combine stage-1 terms that are two apart */\
    const int t0 = s0 + s2, t2 = s0 - s2;\
    const int t1 = s1 + s3, t3 = s1 - s3;\
    const int t4 = d0 + d2, t6 = d0 - d2;\
    const int t5 = d1 + d3, t7 = d1 - d3;\
    /* stage 3: combine neighbours and hand each result to DST */\
    DST(0, t0 + t1);\
    DST(1, t0 - t1);\
    DST(2, t2 + t3);\
    DST(3, t2 - t3);\
    DST(4, t4 + t5);\
    DST(5, t4 - t5);\
    DST(6, t6 + t7);\
    DST(7, t6 - t7);\
}
/*
 * Raw 8x8-Hadamard cost of an i_width x i_height area, processed in 8x8 tiles.
 *
 * pix1/i_pix1, pix2/i_pix2: the two pixel planes and their strides.
 * i_width, i_height:        area size; tiles are taken in steps of 8 both ways.
 *
 * For each tile, pixel_sub_wxh() (defined elsewhere; presumably stores the
 * per-pixel difference pix1 - pix2 - confirm) fills an 8x8 int16_t buffer.
 * SA8D_1D is then applied along the second index in place, and afterwards
 * along the first index with the absolute value of every output accumulated.
 *
 * Returns the unscaled sum over all tiles.
 */
static inline int pixel_sa8d_wxh( uint8_t *pix1, int i_pix1, uint8_t *pix2, int i_pix2,
                                  int i_width, int i_height )
{
    int16_t tile[8][8];
    int total = 0;
    int row, col;

    /* advance both planes by eight rows after each band of tiles */
    for( row = 0; row < i_height; row += 8, pix1 += 8 * i_pix1, pix2 += 8 * i_pix2 )
    {
        for( col = 0; col < i_width; col += 8 )
        {
            int n;

            pixel_sub_wxh( &tile[0][0], 8, pix1 + col, i_pix1, pix2 + col, i_pix2 );

            /* first pass: transform tile[n][0..7] in place */
#define SRC(x) tile[n][x]
#define DST(x,rhs) tile[n][x] = (rhs)
            for( n = 0; n < 8; n++ )
                SA8D_1D
#undef SRC
#undef DST

            /* second pass: transform tile[0..7][n] and sum magnitudes */
#define SRC(x) tile[x][n]
#define DST(x,rhs) total += abs(rhs)
            for( n = 0; n < 8; n++ )
                SA8D_1D
#undef SRC
#undef DST
        }
    }

    return total;
}
/* PIXEL_SA8D_C( width, height ): emit x264_pixel_sa8d_<width>x<height>, which
 * takes the raw pixel_sa8d_wxh() sum for that block size, adds 2 and shifts
 * right by 2 (a rounded divide by four). */
#define PIXEL_SA8D_C( width, height ) \
static int x264_pixel_sa8d_##width##x##height( uint8_t *pix1, int i_stride_pix1, \
                                               uint8_t *pix2, int i_stride_pix2 ) \
{ \
    const int i_raw = pixel_sa8d_wxh( pix1, i_stride_pix1, \
                                      pix2, i_stride_pix2, width, height ); \
    return ( i_raw + 2 ) >> 2; \
}

PIXEL_SA8D_C( 16, 16 )
PIXEL_SA8D_C( 16, 8 )
PIXEL_SA8D_C( 8, 16 )
PIXEL_SA8D_C( 8, 8 )
/* SAD_X( size ): emit x264_pixel_sad_x3_<size> and x264_pixel_sad_x4_<size>.
 * Each calls x264_pixel_sad_<size> once per candidate, in argument order,
 * comparing fenc (stride FENC_STRIDE) against that candidate (stride i_stride)
 * and storing the result in the matching scores[] slot. */
#define SAD_X( size ) \
static void x264_pixel_sad_x3_##size( uint8_t *fenc, uint8_t *pix0, uint8_t *pix1, uint8_t *pix2, int i_stride, int scores[3] )\
{\
    uint8_t *const cand[3] = { pix0, pix1, pix2 };\
    int k;\
    for( k = 0; k < 3; k++ )\
        scores[k] = x264_pixel_sad_##size( fenc, FENC_STRIDE, cand[k], i_stride );\
}\
static void x264_pixel_sad_x4_##size( uint8_t *fenc, uint8_t *pix0, uint8_t *pix1, uint8_t *pix2, uint8_t *pix3, int i_stride, int scores[4] )\
{\
    uint8_t *const cand[4] = { pix0, pix1, pix2, pix3 };\
    int k;\
    for( k = 0; k < 4; k++ )\
        scores[k] = x264_pixel_sad_##size( fenc, FENC_STRIDE, cand[k], i_stride );\
}

/* multi-candidate wrappers around the x264_pixel_sad_<size> functions */
SAD_X( 16x16 )
SAD_X( 16x8 )
SAD_X( 8x16 )
SAD_X( 8x8 )
SAD_X( 8x4 )
SAD_X( 4x8 )
SAD_X( 4x4 )

/* same wrappers around the _vis SAD functions, only when ARCH_UltraSparc is defined */
#ifdef ARCH_UltraSparc
SAD_X( 16x16_vis )
SAD_X( 16x8_vis )
SAD_X( 8x16_vis )
SAD_X( 8x8_vis )
#endif
/****************************************************************************
* x264_pixel_init:
****************************************************************************/
/*
 * Fill *pixf with the pixel-metric function pointers to use for the given cpu flags.
 *
 * cpu:  bitmask tested against the X264_CPU_* flags below.
 * pixf: table to populate; it is zeroed first, so any slot not assigned here
 *       (or by x264_pixel_altivec_init) stays zero.
 *
 * The plain C functions are installed first.  Every later section that is both
 * compiled in (HAVE_* / ARCH_* macros) and enabled by its cpu test overwrites
 * individual slots, so the last assignment to a slot wins.
 */
void x264_pixel_init( int cpu, x264_pixel_function_t *pixf )
{
/* Start from an all-zero table. */
memset( pixf, 0, sizeof(*pixf) );
/* INIT( name, cpu ): set the seven block-size slots (16x16 down to 4x4) of
 * pixf->name to the functions x264_pixel_<name>_<size><cpu>. */
#define INIT( name, cpu ) \
pixf->name[PIXEL_16x16] = x264_pixel_##name##_16x16##cpu;\
pixf->name[PIXEL_16x8] = x264_pixel_##name##_16x8##cpu;\
pixf->name[PIXEL_8x16] = x264_pixel_##name##_8x16##cpu;\
pixf->name[PIXEL_8x8] = x264_pixel_##name##_8x8##cpu;\
pixf->name[PIXEL_8x4] = x264_pixel_##name##_8x4##cpu;\
pixf->name[PIXEL_4x8] = x264_pixel_##name##_4x8##cpu;\
pixf->name[PIXEL_4x4] = x264_pixel_##name##_4x4##cpu;
/* Defaults with an empty suffix, i.e. the unsuffixed functions. */
INIT( sad, );
INIT( sad_x3, );
INIT( sad_x4, );
INIT( ssd, );
INIT( satd, );
/* sa8d is only set for the four sizes that are multiples of 8 in both
 * dimensions, so it is assigned by hand instead of through INIT. */
pixf->sa8d[PIXEL_16x16]= x264_pixel_sa8d_16x16;
pixf->sa8d[PIXEL_16x8] = x264_pixel_sa8d_16x8;
pixf->sa8d[PIXEL_8x16] = x264_pixel_sa8d_8x16;
pixf->sa8d[PIXEL_8x8] = x264_pixel_sa8d_8x8;
#ifdef HAVE_MMXEXT
/* MMX flag: replace all seven ssd slots. */
if( cpu&X264_CPU_MMX )
{
INIT( ssd, _mmx );
}
/* MMXEXT flag: replace sad, sad_x3, sad_x4 and satd for all seven sizes, and
 * set sad_pde plus the intra_* entries, which have no default above. */
if( cpu&X264_CPU_MMXEXT )
{
INIT( sad, _mmxext );
INIT( sad_x3, _mmxext );
INIT( sad_x4, _mmxext );
INIT( satd, _mmxext );
pixf->sad_pde[PIXEL_16x16] = x264_pixel_sad_pde_16x16_mmxext;
pixf->sad_pde[PIXEL_16x8 ] = x264_pixel_sad_pde_16x8_mmxext;
pixf->sad_pde[PIXEL_8x16 ] = x264_pixel_sad_pde_8x16_mmxext;
/* The mmxext sa8d functions are referenced only when ARCH_X86 is defined. */
#ifdef ARCH_X86
pixf->sa8d[PIXEL_16x16] = x264_pixel_sa8d_16x16_mmxext;
pixf->sa8d[PIXEL_8x8] = x264_pixel_sa8d_8x8_mmxext;
pixf->intra_sa8d_x3_8x8 = x264_intra_sa8d_x3_8x8_mmxext;
#endif
pixf->intra_satd_x3_16x16 = x264_intra_satd_x3_16x16_mmxext;
pixf->intra_satd_x3_8x8c = x264_intra_satd_x3_8x8c_mmxext;
pixf->intra_satd_x3_4x4 = x264_intra_satd_x3_4x4_mmxext;
}
#endif
#ifdef HAVE_SSE2
// disable on AMD processors since it is slower
/* The 3DNow flag serves as the "AMD" test here: these sse2 sad/satd
 * overrides are skipped whenever X264_CPU_3DNOW is set. */
if( (cpu&X264_CPU_SSE2) && !(cpu&X264_CPU_3DNOW) )
{
pixf->sad[PIXEL_16x16] = x264_pixel_sad_16x16_sse2;
pixf->sad[PIXEL_16x8 ] = x264_pixel_sad_16x8_sse2;
pixf->satd[PIXEL_16x16]= x264_pixel_satd_16x16_sse2;
pixf->satd[PIXEL_16x8] = x264_pixel_satd_16x8_sse2;
pixf->satd[PIXEL_8x16] = x264_pixel_satd_8x16_sse2;
pixf->satd[PIXEL_8x8] = x264_pixel_satd_8x8_sse2;
pixf->satd[PIXEL_8x4] = x264_pixel_satd_8x4_sse2;
/* The sse2 sad_x3/sad_x4 functions are referenced only when ARCH_X86 is defined. */
#ifdef ARCH_X86
pixf->sad_x3[PIXEL_16x16] = x264_pixel_sad_x3_16x16_sse2;
pixf->sad_x3[PIXEL_16x8 ] = x264_pixel_sad_x3_16x8_sse2;
pixf->sad_x4[PIXEL_16x16] = x264_pixel_sad_x4_16x16_sse2;
pixf->sad_x4[PIXEL_16x8 ] = x264_pixel_sad_x4_16x8_sse2;
#endif
}
// these are faster on both Intel and AMD
if( cpu&X264_CPU_SSE2 )
{
pixf->ssd[PIXEL_16x16] = x264_pixel_ssd_16x16_sse2;
pixf->ssd[PIXEL_16x8] = x264_pixel_ssd_16x8_sse2;
/* The sse2 sa8d functions are referenced only when ARCH_X86_64 is defined. */
#ifdef ARCH_X86_64
pixf->sa8d[PIXEL_16x16] = x264_pixel_sa8d_16x16_sse2;
pixf->sa8d[PIXEL_8x8] = x264_pixel_sa8d_8x8_sse2;
pixf->intra_sa8d_x3_8x8 = x264_intra_sa8d_x3_8x8_sse2;
#endif
}
#endif
#ifdef ARCH_PPC
/* AltiVec flag: hand the table to x264_pixel_altivec_init (defined elsewhere). */
if( cpu&X264_CPU_ALTIVEC )
{
x264_pixel_altivec_init( pixf );
}
#endif
#ifdef ARCH_UltraSparc
/* No cpu flag is tested here: when ARCH_UltraSparc is defined, the _vis
 * functions always replace sad, sad_x3 and sad_x4 for the four sizes
 * 8x8, 8x16, 16x8 and 16x16. */
pixf->sad[PIXEL_8x8] = x264_pixel_sad_8x8_vis;
pixf->sad[PIXEL_8x16] = x264_pixel_sad_8x16_vis;
pixf->sad[PIXEL_16x8] = x264_pixel_sad_16x8_vis;
pixf->sad[PIXEL_16x16] = x264_pixel_sad_16x16_vis;
pixf->sad_x3[PIXEL_8x8] = x264_pixel_sad_x3_8x8_vis;
pixf->sad_x3[PIXEL_8x16] = x264_pixel_sad_x3_8x16_vis;
pixf->sad_x3[PIXEL_16x8] = x264_pixel_sad_x3_16x8_vis;
pixf->sad_x3[PIXEL_16x16] = x264_pixel_sad_x3_16x16_vis;
pixf->sad_x4[PIXEL_8x8] = x264_pixel_sad_x4_8x8_vis;
pixf->sad_x4[PIXEL_8x16] = x264_pixel_sad_x4_8x16_vis;
pixf->sad_x4[PIXEL_16x8] = x264_pixel_sad_x4_16x8_vis;
pixf->sad_x4[PIXEL_16x16] = x264_pixel_sad_x4_16x16_vis;
#endif
}
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -