H.264从SPS中提取视频宽高

H.264有两种封装模式:

(1)annexb模式:传统模式,使用start code来分隔NAL, SPS和PPS是在ES流的头部;

(2)mp4模式:没有start code,使用NALU长度(固定字节,通常为4个字节)来分隔NAL。AVCodecContext的extradata内部保存着分隔的字节数,SPS和PPS;

1. 找到SPS

视频的宽高保存在SPS中。那么提取宽高首先要找到SPS。annexb模式直接读取视频数据,根据NAL type找到SPS即可。mp4模式应该从extradata中找到SPS。

mp4格式的extradata格式如下图:

H.264从SPS中提取视频宽高

FFMpeg中解析extradata的函数是ff_h264_decode_extradata()。注意第5字节的最后2位,表示的就是NAL size的字节数-1。在AVCC格式中,每个NAL前面都会有NAL size字段。NAL size可能是1字节、2字节或4字节(4字节较常见),解析extradata重要目的就是确认这个值,之后2个字节是SPS长度,长度之后就是SPS。

2. 从SPS中提取宽高

以下代码是网上常见的,但是很明显写的有问题,宽高不一定非要是16的倍数。

        width=(pic_width_in_mbs_minus1+)*;
height=(pic_height_in_map_units_minus1+)*;

当宽高不是16整数倍时,frame_cropping_flag值为1,frame_mbs_only_flag为1以下为修正的代码:

#include <stdio.h>
#include <stdint.h>
#include <string.h>
#include <math.h> typedef unsigned int UINT;
typedef unsigned char BYTE;
typedef unsigned long DWORD; UINT Ue(BYTE *pBuff, UINT nLen, UINT &nStartBit)
{
//计算0bit的个数
UINT nZeroNum = ;
while (nStartBit < nLen * )
{
if (pBuff[nStartBit / ] & (0x80 >> (nStartBit % ))) //&:按位与,%取余
{
break;
}
nZeroNum++;
nStartBit++;
}
nStartBit ++; //计算结果
DWORD dwRet = ;
for (UINT i=; i<nZeroNum; i++)
{
dwRet <<= ;
if (pBuff[nStartBit / ] & (0x80 >> (nStartBit % )))
{
dwRet += ;
}
nStartBit++;
}
return ( << nZeroNum) - + dwRet;
} int Se(BYTE *pBuff, UINT nLen, UINT &nStartBit)
{
int UeVal=Ue(pBuff,nLen,nStartBit);
double k=UeVal;
int nValue=ceil(k/);//ceil函数:ceil函数的作用是求不小于给定实数的最小整数。ceil(2)=ceil(1.2)=cei(1.5)=2.00
if (UeVal % ==)
nValue=-nValue;
return nValue;
} DWORD u(UINT BitCount,BYTE * buf,UINT &nStartBit)
{
DWORD dwRet = ;
for (UINT i=; i<BitCount; i++)
{
dwRet <<= ;
if (buf[nStartBit / ] & (0x80 >> (nStartBit % )))
{
dwRet += ;
}
nStartBit++;
}
return dwRet;
} /**
* H264的NAL起始码防竞争机制
*
* @param buf SPS数据内容
*
* @无返回值
*/
void de_emulation_prevention(BYTE* buf,unsigned int* buf_size)
{
int i=,j=;
BYTE* tmp_ptr=NULL;
unsigned int tmp_buf_size=;
int val=; tmp_ptr=buf;
tmp_buf_size=*buf_size;
for(i=;i<(tmp_buf_size-);i++)
{
//check for 0x000003
val=(tmp_ptr[i]^0x00) +(tmp_ptr[i+]^0x00)+(tmp_ptr[i+]^0x03);
if(val==)
{
//kick out 0x03
for(j=i+;j<tmp_buf_size-;j++)
tmp_ptr[j]=tmp_ptr[j+]; //and so we should devrease bufsize
(*buf_size)--;
}
} return;
} /**
* 解码SPS,获取视频图像宽、高信息
*
* @param buf SPS数据内容
* @param nLen SPS数据的长度
* @param width 图像宽度
* @param height 图像高度 * @成功则返回1 , 失败则返回0
*/
int h264_decode_sps(BYTE * buf,unsigned int nLen,int &width,int &height,int &fps)
{
UINT StartBit=;
fps=;
de_emulation_prevention(buf,&nLen); int forbidden_zero_bit=u(,buf,StartBit);
int nal_ref_idc=u(,buf,StartBit);
int nal_unit_type=u(,buf,StartBit);
if(nal_unit_type==)
{
int profile_idc=u(,buf,StartBit);
int constraint_set0_flag=u(,buf,StartBit);//(buf[1] & 0x80)>>7;
int constraint_set1_flag=u(,buf,StartBit);//(buf[1] & 0x40)>>6;
int constraint_set2_flag=u(,buf,StartBit);//(buf[1] & 0x20)>>5;
int constraint_set3_flag=u(,buf,StartBit);//(buf[1] & 0x10)>>4;
int reserved_zero_4bits=u(,buf,StartBit);
int level_idc=u(,buf,StartBit); int seq_parameter_set_id=Ue(buf,nLen,StartBit); if( profile_idc == || profile_idc == ||
profile_idc == || profile_idc == )
{
int chroma_format_idc=Ue(buf,nLen,StartBit);
if( chroma_format_idc == )
int residual_colour_transform_flag=u(,buf,StartBit);
int bit_depth_luma_minus8=Ue(buf,nLen,StartBit);
int bit_depth_chroma_minus8=Ue(buf,nLen,StartBit);
int qpprime_y_zero_transform_bypass_flag=u(,buf,StartBit);
int seq_scaling_matrix_present_flag=u(,buf,StartBit); int seq_scaling_list_present_flag[];
if( seq_scaling_matrix_present_flag )
{
for( int i = ; i < ; i++ ) {
seq_scaling_list_present_flag[i]=u(,buf,StartBit);
}
}
}
int log2_max_frame_num_minus4=Ue(buf,nLen,StartBit);
int pic_order_cnt_type=Ue(buf,nLen,StartBit);
if( pic_order_cnt_type == )
int log2_max_pic_order_cnt_lsb_minus4=Ue(buf,nLen,StartBit);
else if( pic_order_cnt_type == )
{
int delta_pic_order_always_zero_flag=u(,buf,StartBit);
int offset_for_non_ref_pic=Se(buf,nLen,StartBit);
int offset_for_top_to_bottom_field=Se(buf,nLen,StartBit);
int num_ref_frames_in_pic_order_cnt_cycle=Ue(buf,nLen,StartBit); int *offset_for_ref_frame=new int[num_ref_frames_in_pic_order_cnt_cycle];
for( int i = ; i < num_ref_frames_in_pic_order_cnt_cycle; i++ )
offset_for_ref_frame[i]=Se(buf,nLen,StartBit);
delete [] offset_for_ref_frame;
}
int num_ref_frames=Ue(buf,nLen,StartBit);
int gaps_in_frame_num_value_allowed_flag=u(,buf,StartBit);
int pic_width_in_mbs_minus1=Ue(buf,nLen,StartBit);
int pic_height_in_map_units_minus1=Ue(buf,nLen,StartBit); //width=(pic_width_in_mbs_minus1+1)*16;
//height=(pic_height_in_map_units_minus1+1)*16; int frame_mbs_only_flag=u(,buf,StartBit);
if(!frame_mbs_only_flag)
int mb_adaptive_frame_field_flag=u(,buf,StartBit); int direct_8x8_inference_flag=u(,buf,StartBit);
int frame_cropping_flag=u(,buf,StartBit);
int frame_crop_left_offset=;
int frame_crop_right_offset=;
int frame_crop_top_offset=;
int frame_crop_bottom_offset=;
if(frame_cropping_flag)
{
frame_crop_left_offset=Ue(buf,nLen,StartBit);
frame_crop_right_offset=Ue(buf,nLen,StartBit);
frame_crop_top_offset=Ue(buf,nLen,StartBit);
frame_crop_bottom_offset=Ue(buf,nLen,StartBit);
} width = ((pic_width_in_mbs_minus1 +)*) - frame_crop_left_offset* - frame_crop_right_offset*;
height= (( - frame_mbs_only_flag)* (pic_height_in_map_units_minus1 +) * ) - (frame_crop_top_offset * ) - (frame_crop_bottom_offset * ); int vui_parameter_present_flag=u(,buf,StartBit);
if(vui_parameter_present_flag)
{
int aspect_ratio_info_present_flag=u(,buf,StartBit);
if(aspect_ratio_info_present_flag)
{
int aspect_ratio_idc=u(,buf,StartBit);
if(aspect_ratio_idc==)
{
int sar_width=u(,buf,StartBit);
int sar_height=u(,buf,StartBit);
}
}
int overscan_info_present_flag=u(,buf,StartBit);
if(overscan_info_present_flag)
int overscan_appropriate_flagu=u(,buf,StartBit);
int video_signal_type_present_flag=u(,buf,StartBit);
if(video_signal_type_present_flag)
{
int video_format=u(,buf,StartBit);
int video_full_range_flag=u(,buf,StartBit);
int colour_description_present_flag=u(,buf,StartBit);
if(colour_description_present_flag)
{
int colour_primaries=u(,buf,StartBit);
int transfer_characteristics=u(,buf,StartBit);
int matrix_coefficients=u(,buf,StartBit);
}
}
int chroma_loc_info_present_flag=u(,buf,StartBit);
if(chroma_loc_info_present_flag)
{
int chroma_sample_loc_type_top_field=Ue(buf,nLen,StartBit);
int chroma_sample_loc_type_bottom_field=Ue(buf,nLen,StartBit);
}
int timing_info_present_flag=u(,buf,StartBit);
if(timing_info_present_flag)
{
int num_units_in_tick=u(,buf,StartBit);
int time_scale=u(,buf,StartBit);
fps=time_scale/(*num_units_in_tick);
}
}
return true;
}
else
return false;
}

参考资料:

1. http://www.latelee.org/my-study/get-width-height-framerate-from-bitstream.html

2. https://blog.csdn.net/yue_huang/article/details/75126155

上一篇:HDU5086:Revenge of Segment Tree(规律题)


下一篇:详解Maple中的基础工具栏