📄 h264.c
字号:
/* * H.26L/H.264/AVC/JVT/14496-10/... encoder/decoder * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at> * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with this library; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA * */ /** * @file h264.c * H.264 / AVC / MPEG4 part10 codec. * @author Michael Niedermayer <michaelni@gmx.at> */#include "common.h"#include "dsputil.h"#include "avcodec.h"#include "mpegvideo.h"#include "h264data.h"#include "golomb.h"#undef NDEBUG#include <assert.h>#define interlaced_dct interlaced_dct_is_a_bad_name#define mb_intra mb_intra_isnt_initalized_see_mb_type#define LUMA_DC_BLOCK_INDEX 25#define CHROMA_DC_BLOCK_INDEX 26#define CHROMA_DC_COEFF_TOKEN_VLC_BITS 8#define COEFF_TOKEN_VLC_BITS 8#define TOTAL_ZEROS_VLC_BITS 9#define CHROMA_DC_TOTAL_ZEROS_VLC_BITS 3#define RUN_VLC_BITS 3#define RUN7_VLC_BITS 6#define MAX_SPS_COUNT 32#define MAX_PPS_COUNT 256#define MAX_MMCO_COUNT 66/** * Sequence parameter set */typedef struct SPS{ int profile_idc; int level_idc; int log2_max_frame_num; ///< log2_max_frame_num_minus4 + 4 int poc_type; ///< pic_order_cnt_type int log2_max_poc_lsb; ///< log2_max_pic_order_cnt_lsb_minus4 int delta_pic_order_always_zero_flag; int offset_for_non_ref_pic; int offset_for_top_to_bottom_field; int poc_cycle_length; ///< num_ref_frames_in_pic_order_cnt_cycle int ref_frame_count; ///< num_ref_frames int gaps_in_frame_num_allowed_flag; int mb_width; ///< frame_width_in_mbs_minus1 + 1 int mb_height; ///< frame_height_in_mbs_minus1 + 1 int frame_mbs_only_flag; int mb_aff; ///<mb_adaptive_frame_field_flag int direct_8x8_inference_flag; int crop; ///< frame_cropping_flag int crop_left; ///< frame_cropping_rect_left_offset int crop_right; ///< frame_cropping_rect_right_offset int crop_top; ///< frame_cropping_rect_top_offset int crop_bottom; ///< frame_cropping_rect_bottom_offset int vui_parameters_present_flag; AVRational sar; short offset_for_ref_frame[256]; //FIXME dyn aloc?}SPS;/** * Picture parameter set */typedef struct PPS{ int sps_id; int cabac; ///< entropy_coding_mode_flag int pic_order_present; ///< pic_order_present_flag int slice_group_count; ///< num_slice_groups_minus1 + 1 int mb_slice_group_map_type; int ref_count[2]; ///< num_ref_idx_l0/1_active_minus1 + 1 int weighted_pred; ///< weighted_pred_flag int weighted_bipred_idc; int init_qp; ///< pic_init_qp_minus26 + 26 int init_qs; ///< pic_init_qs_minus26 + 26 int chroma_qp_index_offset; int deblocking_filter_parameters_present; ///< deblocking_filter_parameters_present_flag int constrained_intra_pred; ///< constrained_intra_pred_flag int redundant_pic_cnt_present; ///< redundant_pic_cnt_present_flag}PPS;/** * Memory management control operation opcode. */typedef enum MMCOOpcode{ MMCO_END=0, MMCO_SHORT2UNUSED, MMCO_LONG2UNUSED, MMCO_SHORT2LONG, MMCO_SET_MAX_LONG, MMCO_RESET, MMCO_LONG,} MMCOOpcode;/** * Memory management control operation. */typedef struct MMCO{ MMCOOpcode opcode; int short_frame_num; int long_index;} MMCO;/** * H264Context */typedef struct H264Context{ MpegEncContext s; int nal_ref_idc; int nal_unit_type;#define NAL_SLICE 1#define NAL_DPA 2#define NAL_DPB 3#define NAL_DPC 4#define NAL_IDR_SLICE 5#define NAL_SEI 6#define NAL_SPS 7#define NAL_PPS 8#define NAL_PICTURE_DELIMITER 9#define NAL_FILTER_DATA 10 uint8_t *rbsp_buffer; int rbsp_buffer_size; int chroma_qp; //QPc int prev_mb_skiped; //FIXME remove (IMHO not used) //prediction stuff int chroma_pred_mode; int intra16x16_pred_mode; int8_t intra4x4_pred_mode_cache[5*8]; int8_t (*intra4x4_pred_mode)[8]; void (*pred4x4 [9+3])(uint8_t *src, uint8_t *topright, int stride);//FIXME move to dsp? void (*pred8x8 [4+3])(uint8_t *src, int stride); void (*pred16x16[4+3])(uint8_t *src, int stride); unsigned int topleft_samples_available; unsigned int top_samples_available; unsigned int topright_samples_available; unsigned int left_samples_available; /** * non zero coeff count cache. * is 64 if not available. */ uint8_t non_zero_count_cache[6*8]; uint8_t (*non_zero_count)[16]; /** * Motion vector cache. */ int16_t mv_cache[2][5*8][2]; int8_t ref_cache[2][5*8];#define LIST_NOT_USED -1 //FIXME rename?#define PART_NOT_AVAILABLE -2 /** * is 1 if the specific list MV&references are set to 0,0,-2. */ int mv_cache_clean[2]; int block_offset[16+8]; int chroma_subblock_offset[16]; //FIXME remove uint16_t *mb2b_xy; //FIXME are these 4 a good idea? uint16_t *mb2b8_xy; int b_stride; int b8_stride; int halfpel_flag; int thirdpel_flag; int unknown_svq3_flag; int next_slice_index; SPS sps_buffer[MAX_SPS_COUNT]; SPS sps; ///< current sps PPS pps_buffer[MAX_PPS_COUNT]; /** * current pps */ PPS pps; //FIXME move tp Picture perhaps? (->no) do we need that? int slice_num; uint8_t *slice_table_base; uint8_t *slice_table; ///< slice_table_base + mb_stride + 1 int slice_type; int slice_type_fixed; //interlacing specific flags int mb_field_decoding_flag; int sub_mb_type[4]; //POC stuff int poc_lsb; int poc_msb; int delta_poc_bottom; int delta_poc[2]; int frame_num; int prev_poc_msb; ///< poc_msb of the last reference pic for POC type 0 int prev_poc_lsb; ///< poc_lsb of the last reference pic for POC type 0 int frame_num_offset; ///< for POC type 2 int prev_frame_num_offset; ///< for POC type 2 int prev_frame_num; ///< frame_num of the last pic for POC type 1/2 /** * frame_num for frames or 2*frame_num for field pics. */ int curr_pic_num; /** * max_frame_num or 2*max_frame_num for field pics. */ int max_pic_num; //Weighted pred stuff int luma_log2_weight_denom; int chroma_log2_weight_denom; int luma_weight[2][16]; int luma_offset[2][16]; int chroma_weight[2][16][2]; int chroma_offset[2][16][2]; //deblock int disable_deblocking_filter_idc; int slice_alpha_c0_offset_div2; int slice_beta_offset_div2; int redundant_pic_count; int direct_spatial_mv_pred; /** * num_ref_idx_l0/1_active_minus1 + 1 */ int ref_count[2];// FIXME split for AFF Picture *short_ref[16]; Picture *long_ref[16]; Picture default_ref_list[2][32]; Picture ref_list[2][32]; //FIXME size? Picture field_ref_list[2][32]; //FIXME size? /** * memory management control operations buffer. */ MMCO mmco[MAX_MMCO_COUNT]; int mmco_index; int long_ref_count; ///< number of actual long term references int short_ref_count; ///< number of actual short term references //data partitioning GetBitContext intra_gb; GetBitContext inter_gb; GetBitContext *intra_gb_ptr; GetBitContext *inter_gb_ptr; DCTELEM mb[16*24] __align8;}H264Context;static VLC coeff_token_vlc[4];static VLC chroma_dc_coeff_token_vlc;static VLC total_zeros_vlc[15];static VLC chroma_dc_total_zeros_vlc[3];static VLC run_vlc[6];static VLC run7_vlc;static void svq3_luma_dc_dequant_idct_c(DCTELEM *block, int qp);static void svq3_add_idct_c(uint8_t *dst, DCTELEM *block, int stride, int qp, int dc);static inline uint32_t pack16to32(int a, int b){#ifdef WORDS_BIGENDIAN return (b&0xFFFF) + (a<<16);#else return (a&0xFFFF) + (b<<16);#endif}/** * fill a rectangle. * @param h height of the recatangle, should be a constant * @param w width of the recatangle, should be a constant * @param size the size of val (1 or 4), should be a constant */static inline void fill_rectangle(void *vp, int w, int h, int stride, uint32_t val, int size){ //FIXME ensure this IS inlined uint8_t *p= (uint8_t*)vp; assert(size==1 || size==4); w *= size; stride *= size; //FIXME check what gcc generates for 64 bit on x86 and possible write a 32 bit ver of it if(w==2 && h==2){ *(uint16_t*)(p + 0)= *(uint16_t*)(p + stride)= size==4 ? val : val*0x0101; }else if(w==2 && h==4){ *(uint16_t*)(p + 0*stride)= *(uint16_t*)(p + 1*stride)= *(uint16_t*)(p + 2*stride)= *(uint16_t*)(p + 3*stride)= size==4 ? val : val*0x0101; }else if(w==4 && h==1){ *(uint32_t*)(p + 0*stride)= size==4 ? val : val*0x01010101; }else if(w==4 && h==2){ *(uint32_t*)(p + 0*stride)= *(uint32_t*)(p + 1*stride)= size==4 ? val : val*0x01010101; }else if(w==4 && h==4){ *(uint32_t*)(p + 0*stride)= *(uint32_t*)(p + 1*stride)= *(uint32_t*)(p + 2*stride)= *(uint32_t*)(p + 3*stride)= size==4 ? val : val*0x01010101; }else if(w==8 && h==1){ *(uint32_t*)(p + 0)= *(uint32_t*)(p + 4)= size==4 ? val : val*0x01010101; }else if(w==8 && h==2){ *(uint32_t*)(p + 0 + 0*stride)= *(uint32_t*)(p + 4 + 0*stride)= *(uint32_t*)(p + 0 + 1*stride)= *(uint32_t*)(p + 4 + 1*stride)= size==4 ? val : val*0x01010101; }else if(w==8 && h==4){ *(uint64_t*)(p + 0*stride)= *(uint64_t*)(p + 1*stride)= *(uint64_t*)(p + 2*stride)= *(uint64_t*)(p + 3*stride)= size==4 ? val*0x0100000001ULL : val*0x0101010101010101ULL; }else if(w==16 && h==2){ *(uint64_t*)(p + 0+0*stride)= *(uint64_t*)(p + 8+0*stride)= *(uint64_t*)(p + 0+1*stride)= *(uint64_t*)(p + 8+1*stride)= size==4 ? val*0x0100000001ULL : val*0x0101010101010101ULL; }else if(w==16 && h==4){ *(uint64_t*)(p + 0+0*stride)= *(uint64_t*)(p + 8+0*stride)= *(uint64_t*)(p + 0+1*stride)= *(uint64_t*)(p + 8+1*stride)= *(uint64_t*)(p + 0+2*stride)= *(uint64_t*)(p + 8+2*stride)= *(uint64_t*)(p + 0+3*stride)= *(uint64_t*)(p + 8+3*stride)= size==4 ? val*0x0100000001ULL : val*0x0101010101010101ULL; }else assert(0);}static inline void fill_caches(H264Context *h, int mb_type){ MpegEncContext * const s = &h->s; const int mb_xy= s->mb_x + s->mb_y*s->mb_stride; int topleft_xy, top_xy, topright_xy, left_xy[2]; int topleft_type, top_type, topright_type, left_type[2]; int left_block[4]; int i; //wow what a mess, why didnt they simplify the interlacing&intra stuff, i cant imagine that these complex rules are worth it if(h->sps.mb_aff){ //FIXME topleft_xy = 0; /* avoid warning */ top_xy = 0; /* avoid warning */ topright_xy = 0; /* avoid warning */ }else{ topleft_xy = mb_xy-1 - s->mb_stride; top_xy = mb_xy - s->mb_stride;
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -