📄 dsputil.c
字号:
src+= stride;
}
#endif
}
STATIC_FUNC void avg_h264_chroma_mc8_c(uint8_t *dst/*align 8*/, uint8_t *src/*align 1*/, int stride, int h, int x, int y)
{
const int A=(8-x)*(8-y);
const int B=( x)*(8-y);
const int C=(8-x)*( y);
const int D=( x)*( y);
int i;
assert(x<8 && y<8 && x>=0 && y>=0);
for(i=0; i<h; i++)
{
dst[0] = (dst[0] + (((A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1])+32)>>6) + 1)>>1;
dst[1] = (dst[1] + (((A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2])+32)>>6) + 1)>>1;
dst[2] = (dst[2] + (((A*src[2] + B*src[3] + C*src[stride+2] + D*src[stride+3])+32)>>6) + 1)>>1;
dst[3] = (dst[3] + (((A*src[3] + B*src[4] + C*src[stride+3] + D*src[stride+4])+32)>>6) + 1)>>1;
dst[4] = (dst[4] + (((A*src[4] + B*src[5] + C*src[stride+4] + D*src[stride+5])+32)>>6) + 1)>>1;
dst[5] = (dst[5] + (((A*src[5] + B*src[6] + C*src[stride+5] + D*src[stride+6])+32)>>6) + 1)>>1;
dst[6] = (dst[6] + (((A*src[6] + B*src[7] + C*src[stride+6] + D*src[stride+7])+32)>>6) + 1)>>1;
dst[7] = (dst[7] + (((A*src[7] + B*src[8] + C*src[stride+7] + D*src[stride+8])+32)>>6) + 1)>>1;
dst+= stride;
src+= stride;
}
}
#endif /* ] */
#endif /* ] */
STATIC_FUNC void put_no_rnd_h264_chroma_mc8_c(uint8_t *dst/*align 8*/, uint8_t *src/*align 1*/, int stride, int h, int x, int y){
const int A=(8-x)*(8-y);
const int B=( x)*(8-y);
const int C=(8-x)*( y);
const int D=( x)*( y);
int i;
assert(x<8 && y<8 && x>=0 && y>=0);
for(i=0; i<h; i++)
{
dst[0] = (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1] + 32 - 4) >> 6;
dst[1] = (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2] + 32 - 4) >> 6;
dst[2] = (A*src[2] + B*src[3] + C*src[stride+2] + D*src[stride+3] + 32 - 4) >> 6;
dst[3] = (A*src[3] + B*src[4] + C*src[stride+3] + D*src[stride+4] + 32 - 4) >> 6;
dst[4] = (A*src[4] + B*src[5] + C*src[stride+4] + D*src[stride+5] + 32 - 4) >> 6;
dst[5] = (A*src[5] + B*src[6] + C*src[stride+5] + D*src[stride+6] + 32 - 4) >> 6;
dst[6] = (A*src[6] + B*src[7] + C*src[stride+6] + D*src[stride+7] + 32 - 4) >> 6;
dst[7] = (A*src[7] + B*src[8] + C*src[stride+7] + D*src[stride+8] + 32 - 4) >> 6;
dst+= stride;
src+= stride;
}
}
STATIC_FUNC inline void copy_block2(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h)
{
int i;
for(i=0; i<h; i++)
{
ST16(dst , LD16(src ));
dst+=dstStride;
src+=srcStride;
}
}
STATIC_FUNC inline void copy_block4(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h)
{
int i;
for(i=0; i<h; i++)
{
ST32(dst , LD32(src ));
dst+=dstStride;
src+=srcStride;
}
}
STATIC_FUNC inline void copy_block8(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h)
{
int i;
for(i=0; i<h; i++)
{
ST32(dst , LD32(src ));
ST32(dst+4 , LD32(src+4 ));
dst+=dstStride;
src+=srcStride;
}
}
STATIC_FUNC inline void copy_block16(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h)
{
int i;
for(i=0; i<h; i++)
{
ST32(dst , LD32(src ));
ST32(dst+4 , LD32(src+4 ));
ST32(dst+8 , LD32(src+8 ));
ST32(dst+12, LD32(src+12));
dst+=dstStride;
src+=srcStride;
}
}
STATIC_FUNC void put_h264_qpel2_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride)
{
const int h=2;
uint8_t *cm = cropTbl + MAX_NEG_CROP;
int i;
for(i=0; i<h; i++)
{
const int srcB= src[-2];
const int srcA= src[-1];
const int src0= src[0 ];
const int src1= src[1];
const int src2= src[2 ];
const int src3= src[3 ];
const int src4= src[4 ];
dst[0] = cm[(((src0+src1)*20 - (srcA+src2)*5 + (srcB+src3))+16)>>5];
dst[1] = cm[(((src1+src2)*20 - (src0+src3)*5 + (srcA+src4))+16)>>5];
dst+=dstStride;
src+=srcStride;
}
}
STATIC_FUNC void put_h264_qpel2_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride)
{
const int w=2;
uint8_t *cm = cropTbl + MAX_NEG_CROP;
int i;
for(i=0; i<w; i++)
{
const int srcB= src[-2*srcStride];
const int srcA= src[-1*srcStride];
const int src0= src[0 *srcStride];
const int src1= src[1 *srcStride];
const int src2= src[2 *srcStride];
const int src3= src[3 *srcStride];
const int src4= src[4 *srcStride];
dst[0*dstStride] = cm[(((src0+src1)*20 - (srcA+src2)*5 + (srcB+src3))+16)>>5];
dst[1*dstStride] = cm[(((src1+src2)*20 - (src0+src3)*5 + (srcA+src4))+16)>>5];
dst++;
src++;
}
}
STATIC_FUNC void put_h264_qpel2_hv_lowpass(uint8_t *dst, int16_t *tmp, uint8_t *src, int dstStride, int tmpStride, int srcStride)
{
const int h=2;
const int w=2;
uint8_t *cm = cropTbl + MAX_NEG_CROP;
int i;
src -= 2*srcStride;
for(i=0; i<h+5; i++)
{
const int srcB= src[-2];
const int srcA= src[-1];
const int src0= src[0 ];
const int src1= src[1 ];
const int src2= src[2];
const int src3= src[3];
const int src4= src[4];
tmp[0]= (src0+src1)*20 - (srcA+src2)*5 + (srcB+src3);
tmp[1]= (src1+src2)*20 - (src0+src3)*5 + (srcA+src4);
tmp+=tmpStride;
src+=srcStride;
}
tmp -= tmpStride*(h+5-2);
for(i=0; i<w; i++)
{
const int tmpB= tmp[-2*tmpStride];
const int tmpA= tmp[-1*tmpStride];
const int tmp0= tmp[0 *tmpStride];
const int tmp1= tmp[1 *tmpStride];
const int tmp2= tmp[2 *tmpStride];
const int tmp3= tmp[3 *tmpStride];
const int tmp4= tmp[4 *tmpStride];
dst[0*dstStride] = cm[(((tmp0+tmp1)*20 - (tmpA+tmp2)*5 + (tmpB+tmp3))+512)>>10];
dst[1*dstStride] = cm[(((tmp1+tmp2)*20 - (tmp0+tmp3)*5 + (tmpA+tmp4))+512)>>10];
dst++;
tmp++;
}
}
STATIC_FUNC void put_h264_qpel4_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride)
{
const int h=4;
uint8_t *cm = cropTbl + MAX_NEG_CROP;
int i;
for(i=0; i<h; i++)
{
const int srcB= src[-2];
const int srcA= src[-1];
const int src0= src[0 ];
const int src1= src[1 ];
const int src2= src[2 ];
const int src3= src[3 ];
const int src4= src[4 ];
const int src5= src[5 ];
const int src6= src[6 ];
dst[0] = cm[(((src0+src1)*20 - (srcA+src2)*5 + (srcB+src3))+16)>>5];
dst[1] = cm[(((src1+src2)*20 - (src0+src3)*5 + (srcA+src4))+16)>>5];
dst[2] = cm[(((src2+src3)*20 - (src1+src4)*5 + (src0+src5))+16)>>5];
dst[3] = cm[(((src3+src4)*20 - (src2+src5)*5 + (src1+src6))+16)>>5];
dst+=dstStride;
src+=srcStride;
}
}
#ifdef USE_ASM_VERSION /* [ */
//use ASM functions in asm_dsputil.s
extern void put_h264_qpel4_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride);
extern void put_h264_qpel4_hv_lowpass(uint8_t *dst, int16_t *tmp, uint8_t *src, int dstStride, int tmpStride, int srcStride);
extern void put_h264_qpel8_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride);
extern void put_h264_qpel8_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride);
extern void put_h264_qpel8_hv_lowpass(uint8_t *dst, int16_t *tmp, uint8_t *src, int dstStride, int tmpStride, int srcStride);
#else /* ] [ */
STATIC_FUNC void put_h264_qpel4_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride)
{
const int w=4;
uint8_t *cm = cropTbl + MAX_NEG_CROP;
int i;
for(i=0; i<w; i++)
{
const int srcB= src[-2*srcStride];
const int srcA= src[-1*srcStride];
const int src0= src[0 *srcStride];
const int src1= src[1 *srcStride];
const int src2= src[2 *srcStride];
const int src3= src[3 *srcStride];
const int src4= src[4 *srcStride];
const int src5= src[5 *srcStride];
const int src6= src[6 *srcStride];
dst[0*dstStride] = cm[(((src0+src1)*20 - (srcA+src2)*5 + (srcB+src3))+16)>>5];
dst[1*dstStride] = cm[(((src1+src2)*20 - (src0+src3)*5 + (srcA+src4))+16)>>5];
dst[2*dstStride] = cm[(((src2+src3)*20 - (src1+src4)*5 + (src0+src5))+16)>>5];
dst[3*dstStride] = cm[(((src3+src4)*20 - (src2+src5)*5 + (src1+src6))+16)>>5];
dst++;
src++;
}
}
STATIC_FUNC void put_h264_qpel4_hv_lowpass(uint8_t *dst, int16_t *tmp, uint8_t *src, int dstStride, int tmpStride, int srcStride)
{
const int h=4;
const int w=4;
uint8_t *cm = cropTbl + MAX_NEG_CROP;
int i;
src -= 2*srcStride;
for(i=0; i<h+5; i++)
{
const int srcB= src[-2];
const int srcA= src[-1];
const int src0= src[0 ];
const int src1= src[1 ];
const int src2= src[2 ];
const int src3= src[3 ];
const int src4= src[4 ];
const int src5= src[5 ];
const int src6= src[6 ];
tmp[0]= (src0+src1)*20 - (srcA+src2)*5 + (srcB+src3);
tmp[1]= (src1+src2)*20 - (src0+src3)*5 + (srcA+src4);
tmp[2]= (src2+src3)*20 - (src1+src4)*5 + (src0+src5);
tmp[3]= (src3+src4)*20 - (src2+src5)*5 + (src1+src6);
tmp+=tmpStride;
src+=srcStride;
}
tmp -= tmpStride*(h+5-2);
for(i=0; i<w; i++)
{
const int tmpB= tmp[-2*tmpStride];
const int tmpA= tmp[-1*tmpStride];
const int tmp0= tmp[0 *tmpStride];
const int tmp1= tmp[1 *tmpStride];
const int tmp2= tmp[2 *tmpStride];
const int tmp3= tmp[3 *tmpStride];
const int tmp4= tmp[4 *tmpStride];
const int tmp5= tmp[5 *tmpStride];
const int tmp6= tmp[6 *tmpStride];
dst[0*dstStride] = cm[(((tmp0+tmp1)*20 - (tmpA+tmp2)*5 + (tmpB+tmp3))+512)>>10];
dst[1*dstStride] = cm[(((tmp1+tmp2)*20 - (tmp0+tmp3)*5 + (tmpA+tmp4))+512)>>10];
dst[2*dstStride] = cm[(((tmp2+tmp3)*20 - (tmp1+tmp4)*5 + (tmp0+tmp5))+512)>>10];
dst[3*dstStride] = cm[(((tmp3+tmp4)*20 - (tmp2+tmp5)*5 + (tmp1+tmp6))+512)>>10];
dst++;
tmp++;
}
}
STATIC_FUNC void put_h264_qpel8_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride)
{
const int h=8;
uint8_t *cm = cropTbl + MAX_NEG_CROP;
int i;
for (i=0; i<h; i++)
{
const srcB= src[-2];
const srcA= src[-1];
const src0= src[0 ];
const src1= src[1 ];
const src2= src[2 ];
const src3= src[3];
const src4= src[4 ];
const src5= src[5 ];
const src6= src[6 ];
const src7= src[7 ];
const src8= src[8 ];
const src9= src[9 ];
const src10=src[10];
dst[0] = cm[(((src0+src1)*20 - (srcA+src2)*5 + (srcB+src3))+16)>>5];
dst[1] = cm[(((src1+src2)*20 - (src0+src3)*5 + (srcA+src4))+16)>>5];
dst[2] = cm[(((src2+src3)*20 - (src1+src4)*5 + (src0+src5))+16)>>5];
dst[3] = cm[(((src3+src4)*20 - (src2+src5)*5 + (src1+src6))+16)>>5];
dst[4] = cm[(((src4+src5)*20 - (src3+src6)*5 + (src2+src7))+16)>>5];
dst[5] = cm[(((src5+src6)*20 - (src4+src7)*5 + (src3+src8))+16)>>5];
dst[6] = cm[(((src6+src7)*20 - (src5+src8)*5 + (src4+src9))+16)>>5];
dst[7] = cm[(((src7+src8)*20 - (src6+src9)*5 + (src5+src10))+16)>>5];
dst+=dstStride;
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -