📄 dsputil.h

📁 ffmpeg源码分析
💻 H
📖 第 1 页 / 共 2 页
字号:
上一页 12
    /**     * idct input permutation.     * several optimized IDCTs need a permutated input (relative to the normal order of the reference     * IDCT)     * this permutation must be performed before the idct_put/add, note, normally this can be merged     * with the zigzag/alternate scan<br>     * an example to avoid confusion:     * - (->decode coeffs -> zigzag reorder -> dequant -> reference idct ->...)     * - (x -> referece dct -> reference idct -> x)     * - (x -> referece dct -> simple_mmx_perm = idct_permutation -> simple_idct_mmx -> x)     * - (->decode coeffs -> zigzag reorder -> simple_mmx_perm -> dequant -> simple_idct_mmx ->...)     */    uint8_t idct_permutation[64];    int idct_permutation_type;#define FF_NO_IDCT_PERM 1#define FF_LIBMPEG2_IDCT_PERM 2#define FF_SIMPLE_IDCT_PERM 3#define FF_TRANSPOSE_IDCT_PERM 4#define FF_PARTTRANS_IDCT_PERM 5    int (*try_8x8basis)(int16_t rem[64], int16_t weight[64], int16_t basis[64], int scale);    void (*add_8x8basis)(int16_t rem[64], int16_t basis[64], int scale);#define BASIS_SHIFT 16#define RECON_SHIFT 6    void (*h264_idct_add)(uint8_t *dst, DCTELEM *block, int stride);    void (*h264_idct8_add)(uint8_t *dst, DCTELEM *block, int stride);    void (*h264_idct_dc_add)(uint8_t *dst, DCTELEM *block, int stride);    void (*h264_idct8_dc_add)(uint8_t *dst, DCTELEM *block, int stride);    /* snow wavelet */    void (*vertical_compose97i)(DWTELEM *b0, DWTELEM *b1, DWTELEM *b2, DWTELEM *b3, DWTELEM *b4, DWTELEM *b5, int width);    void (*horizontal_compose97i)(DWTELEM *b, int width);    void (*inner_add_yblock)(uint8_t *obmc, const int obmc_stride, uint8_t * * block, int b_w, int b_h, int src_x, int src_y, int src_stride, slice_buffer * sb, int add, uint8_t * dst8);    void (*prefetch)(void *mem, int stride, int h);    void (*shrink[4])(uint8_t *dst, int dst_wrap, const uint8_t *src, int src_wrap, int width, int height);} DSPContext;void dsputil_static_init(void);void dsputil_init(DSPContext* p, AVCodecContext *avctx);/** * permute block according to permuatation. * @param last last non zero element in scantable order */void ff_block_permute(DCTELEM *block, uint8_t *permutation, const uint8_t *scantable, int last);void ff_set_cmp(DSPContext* c, me_cmp_func *cmp, int type);#define         BYTE_VEC32(c)   ((c)*0x01010101UL)static inline uint32_t rnd_avg32(uint32_t a, uint32_t b){    return (a | b) - (((a ^ b) & ~BYTE_VEC32(0x01)) >> 1);}static inline uint32_t no_rnd_avg32(uint32_t a, uint32_t b){    return (a & b) + (((a ^ b) & ~BYTE_VEC32(0x01)) >> 1);}static inline int get_penalty_factor(int lambda, int lambda2, int type){    switch(type&0xFF){    default:    case FF_CMP_SAD:        return lambda>>FF_LAMBDA_SHIFT;    case FF_CMP_DCT:        return (3*lambda)>>(FF_LAMBDA_SHIFT+1);    case FF_CMP_W53:        return (4*lambda)>>(FF_LAMBDA_SHIFT);    case FF_CMP_W97:        return (2*lambda)>>(FF_LAMBDA_SHIFT);    case FF_CMP_SATD:    case FF_CMP_DCT264:        return (2*lambda)>>FF_LAMBDA_SHIFT;    case FF_CMP_RD:    case FF_CMP_PSNR:    case FF_CMP_SSE:    case FF_CMP_NSSE:        return lambda2>>FF_LAMBDA_SHIFT;    case FF_CMP_BIT:        return 1;    }}/** * Empty mmx state. * this must be called between any dsp function and float/double code. * for example sin(); dsp->idct_put(); emms_c(); cos() */#define emms_c()/* should be defined by architectures supporting   one or more MultiMedia extension */int mm_support(void);#ifdef __GNUC__  #define DECLARE_ALIGNED_16(t,v)       t v __attribute__ ((aligned (16)))#else  #define DECLARE_ALIGNED_16(t,v)      __declspec(align(16)) t v#endif#if defined(HAVE_MMX)#undef emms_c#define MM_MMX    0x0001 /* standard MMX */#define MM_3DNOW  0x0004 /* AMD 3DNOW */#define MM_MMXEXT 0x0002 /* SSE integer functions or AMD MMX ext */#define MM_SSE    0x0008 /* SSE functions */#define MM_SSE2   0x0010 /* PIV SSE2 functions */#define MM_3DNOWEXT  0x0020 /* AMD 3DNowExt */extern int mm_flags;void add_pixels_clamped_mmx(const DCTELEM *block, uint8_t *pixels, int line_size);void put_pixels_clamped_mmx(const DCTELEM *block, uint8_t *pixels, int line_size);void put_signed_pixels_clamped_mmx(const DCTELEM *block, uint8_t *pixels, int line_size);static inline void emms(void){    __asm __volatile ("emms;":::"memory");}#define emms_c() \{\    if (mm_flags & MM_MMX)\        emms();\}#ifdef __GNUC__  #define DECLARE_ALIGNED_8(t,v)       t v __attribute__ ((aligned (8)))#else  #define DECLARE_ALIGNED_8(t,v)      __declspec(align(8)) t v#endif#define STRIDE_ALIGN 8void dsputil_init_mmx(DSPContext* c, AVCodecContext *avctx);void dsputil_init_pix_mmx(DSPContext* c, AVCodecContext *avctx);#elif defined(ARCH_ARMV4L)/* This is to use 4 bytes read to the IDCT pointers for some 'zero'   line optimizations */#define DECLARE_ALIGNED_8(t,v)    t v __attribute__ ((aligned (4)))#define STRIDE_ALIGN 4#define MM_IWMMXT    0x0100 /* XScale IWMMXT */extern int mm_flags;void dsputil_init_armv4l(DSPContext* c, AVCodecContext *avctx);#elif defined(HAVE_MLIB)/* SPARC/VIS IDCT needs 8-byte aligned DCT blocks */#define DECLARE_ALIGNED_8(t,v)    t v __attribute__ ((aligned (8)))#define STRIDE_ALIGN 8void dsputil_init_mlib(DSPContext* c, AVCodecContext *avctx);#elif defined(ARCH_SPARC)/* SPARC/VIS IDCT needs 8-byte aligned DCT blocks */#define DECLARE_ALIGNED_8(t,v)    t v __attribute__ ((aligned (8)))#define STRIDE_ALIGN 8void dsputil_init_vis(DSPContext* c, AVCodecContext *avctx);#elif defined(ARCH_ALPHA)#define DECLARE_ALIGNED_8(t,v)    t v __attribute__ ((aligned (8)))#define STRIDE_ALIGN 8void dsputil_init_alpha(DSPContext* c, AVCodecContext *avctx);#elif defined(ARCH_POWERPC)#define MM_ALTIVEC    0x0001 /* standard AltiVec */extern int mm_flags;#if defined(HAVE_ALTIVEC) && !defined(CONFIG_DARWIN)#define pixel altivec_pixel#include <altivec.h>#undef pixel#endif#define DECLARE_ALIGNED_8(t,v)    t v __attribute__ ((aligned (16)))#define STRIDE_ALIGN 16void dsputil_init_ppc(DSPContext* c, AVCodecContext *avctx);#elif defined(HAVE_MMI)#define DECLARE_ALIGNED_8(t,v)    t v __attribute__ ((aligned (16)))#define STRIDE_ALIGN 16void dsputil_init_mmi(DSPContext* c, AVCodecContext *avctx);#elif defined(ARCH_SH4)#define DECLARE_ALIGNED_8(t,v)    t v __attribute__ ((aligned (8)))#define STRIDE_ALIGN 8void dsputil_init_sh4(DSPContext* c, AVCodecContext *avctx);#else#define DECLARE_ALIGNED_8(t,v)    t v __attribute__ ((aligned (8)))#define STRIDE_ALIGN 8#endif#ifdef __GNUC__struct unaligned_64 { uint64_t l; } __attribute__((packed));struct unaligned_32 { uint32_t l; } __attribute__((packed));struct unaligned_16 { uint16_t l; } __attribute__((packed));#define LD16(a) (((const struct unaligned_16 *) (a))->l)#define LD32(a) (((const struct unaligned_32 *) (a))->l)#define LD64(a) (((const struct unaligned_64 *) (a))->l)#define ST16(a, b) (((struct unaligned_16 *) (a))->l) = (b)#define ST32(a, b) (((struct unaligned_32 *) (a))->l) = (b)#else /* __GNUC__ */#define LD16(a) (*((uint16_t*)(a)))#define LD32(a) (*((uint32_t*)(a)))#define LD64(a) (*((uint64_t*)(a)))#define ST16(a, b) *((uint16_t*)(a)) = (b)#define ST32(a, b) *((uint32_t*)(a)) = (b)#endif /* !__GNUC__ *//* PSNR */void get_psnr(uint8_t *orig_image[3], uint8_t *coded_image[3],              int orig_linesize[3], int coded_linesize,              AVCodecContext *avctx);/* FFT computation *//* NOTE: soon integer code will be added, so you must use the   FFTSample type */typedef float FFTSample;typedef struct FFTComplex {    FFTSample re, im;} FFTComplex;typedef struct FFTContext {    int nbits;    int inverse;    uint16_t *revtab;    FFTComplex *exptab;    FFTComplex *exptab1; /* only used by SSE code */    void (*fft_calc)(struct FFTContext *s, FFTComplex *z);} FFTContext;int ff_fft_init(FFTContext *s, int nbits, int inverse);void ff_fft_permute(FFTContext *s, FFTComplex *z);void ff_fft_calc_c(FFTContext *s, FFTComplex *z);void ff_fft_calc_sse(FFTContext *s, FFTComplex *z);void ff_fft_calc_3dn(FFTContext *s, FFTComplex *z);void ff_fft_calc_3dn2(FFTContext *s, FFTComplex *z);void ff_fft_calc_altivec(FFTContext *s, FFTComplex *z);static inline void ff_fft_calc(FFTContext *s, FFTComplex *z){    s->fft_calc(s, z);}void ff_fft_end(FFTContext *s);/* MDCT computation */typedef struct MDCTContext {    int n;  /* size of MDCT (i.e. number of input data * 2) */    int nbits; /* n = 2^nbits */    /* pre/post rotation tables */    FFTSample *tcos;    FFTSample *tsin;    FFTContext fft;} MDCTContext;int ff_mdct_init(MDCTContext *s, int nbits, int inverse);void ff_imdct_calc(MDCTContext *s, FFTSample *output,                const FFTSample *input, FFTSample *tmp);void ff_mdct_calc(MDCTContext *s, FFTSample *out,               const FFTSample *input, FFTSample *tmp);void ff_mdct_end(MDCTContext *s);#define WARPER8_16(name8, name16)\static int name16(void /*MpegEncContext*/ *s, uint8_t *dst, uint8_t *src, int stride, int h){\    return name8(s, dst           , src           , stride, h)\          +name8(s, dst+8         , src+8         , stride, h);\}#define WARPER8_16_SQ(name8, name16)\static int name16(void /*MpegEncContext*/ *s, uint8_t *dst, uint8_t *src, int stride, int h){\    int score=0;\    score +=name8(s, dst           , src           , stride, 8);\    score +=name8(s, dst+8         , src+8         , stride, 8);\    if(h==16){\        dst += 8*stride;\        src += 8*stride;\        score +=name8(s, dst           , src           , stride, 8);\        score +=name8(s, dst+8         , src+8         , stride, 8);\    }\    return score;\}#endif
上一页 12
💿 文件大小 2612 K
👤 上传用户 xiaoy2000
📂 所属分类其他
🏷️ 相关标签

#ffmpeg #源码分析
⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -