視音頻數據處理入門:H.264視頻碼流解析
=====================================================
視音頻數據處理入門系列文章:
視音頻數據處理入門:RGB、YUV像素數據處理函數
視音頻數據處理入門:PCM音頻採樣數據處理測試
視音頻數據處理入門:H.264視頻碼流解析
視音頻數據處理入門:AAC音頻碼流解析
視音頻數據處理入門:FLV封裝格式解析
視音頻數據處理入門:UDP-RTP協議解析
=====================================================
前兩篇文章介紹的YUV/RGB處理程序以及PCM處理程序都屬於視音頻原始數據的處理程序。從本文開始介紹視音頻碼流的處理程序。本文介紹的程序是視頻碼流處理程序。視頻碼流在視頻播放器中的位置如下所示。

本文中的程序是一個H.264碼流解析程序。該程序可以從H.264碼流中分析得到它的基本單元NALU,並且可以簡單解析NALU首部的字段。通過修改該程序可以實現不同的H.264碼流處理功能。
原理
H.264原始碼流(又稱爲「裸流」)是由一個一個的NALU組成的。它們的結構如下圖所示。

其中每個NALU之間通過startcode(起始碼)進行分隔,起始碼分成兩種:0x000001(3Byte)或者0x00000001(4Byte)。如果NALU對應的Slice爲一幀的開始就用0x00000001,否則就用0x000001。
H.264碼流解析的步驟就是首先從碼流中搜索0x000001和0x00000001,分離出NALU;然後再分析NALU的各個字段。本文的程序即實現了上述的兩個步驟。
代碼
整個程序位於simplest_h264_parser()函數中,如下所示。
- #include <stdio.h>
- #include <stdlib.h>
- #include <string.h>
-
/*
 * Values of the 5-bit nal_unit_type field of a NALU header
 * (the low five bits of the first NALU byte), as named in
 * ITU-T H.264 Table 7-1.
 */
typedef enum {
    NALU_TYPE_SLICE = 1,   /*  1: coded slice of a non-IDR picture */
    NALU_TYPE_DPA,         /*  2: coded slice data partition A     */
    NALU_TYPE_DPB,         /*  3: coded slice data partition B     */
    NALU_TYPE_DPC,         /*  4: coded slice data partition C     */
    NALU_TYPE_IDR,         /*  5: coded slice of an IDR picture    */
    NALU_TYPE_SEI,         /*  6: supplemental enhancement info    */
    NALU_TYPE_SPS,         /*  7: sequence parameter set           */
    NALU_TYPE_PPS,         /*  8: picture parameter set            */
    NALU_TYPE_AUD,         /*  9: access unit delimiter            */
    NALU_TYPE_EOSEQ,       /* 10: end of sequence                  */
    NALU_TYPE_EOSTREAM,    /* 11: end of stream                    */
    NALU_TYPE_FILL         /* 12: filler data                      */
} NaluType;
-
/*
 * Values of the 2-bit nal_ref_idc field of a NALU header, i.e.
 * (first NALU byte & 0x60) >> 5.
 */
typedef enum {
    NALU_PRIORITY_DISPOSABLE = 0,
    NALU_PRIORITY_LOW        = 1,
    /* Historical misspelling; kept so existing code keeps compiling. */
    NALU_PRIRITY_LOW         = NALU_PRIORITY_LOW,
    NALU_PRIORITY_HIGH       = 2,
    NALU_PRIORITY_HIGHEST    = 3
} NaluPriority;
-
-
/* One NAL unit as extracted from an Annex B byte stream by GetAnnexbNALU(). */
typedef struct
{
    int          startcodeprefix_len; /* start code length in bytes: 3 or 4            */
    unsigned int len;                 /* NALU length in bytes, start code excluded     */
    unsigned int max_size;            /* capacity of buf in bytes                      */
    int          forbidden_bit;       /* first byte & 0x80 (stored unshifted)          */
    int          nal_reference_idc;   /* first byte & 0x60 (stored unshifted)          */
    int          nal_unit_type;       /* first byte & 0x1f, see NaluType               */
    char        *buf;                 /* NALU bytes (header byte first), caller-owned  */
} NALU_t;
-
/* Input stream shared by simplest_h264_parser() (opens it) and GetAnnexbNALU() (reads it). */
FILE *h264bitstream = NULL;

/* Result (1 = match) of the latest 3-byte start-code check done by GetAnnexbNALU(). */
int info2 = 0;
/* Result (1 = match) of the latest 4-byte start-code check done by GetAnnexbNALU(). */
int info3 = 0;
-
/*
 * Test for the 3-byte start code 0x000001.
 * Buf must point to at least 3 readable bytes.
 * Returns 1 when Buf[0..2] == 00 00 01, otherwise 0.
 */
static int FindStartCode2(unsigned char *Buf)
{
    return (Buf[0] == 0 && Buf[1] == 0 && Buf[2] == 1) ? 1 : 0;
}
-
/*
 * Test for the 4-byte start code 0x00000001.
 * Buf must point to at least 4 readable bytes.
 * Returns 1 when Buf[0..3] == 00 00 00 01, otherwise 0.
 */
static int FindStartCode3(unsigned char *Buf)
{
    return (Buf[0] == 0 && Buf[1] == 0 && Buf[2] == 0 && Buf[3] == 1) ? 1 : 0;
}
-
-
- int GetAnnexbNALU (NALU_t *nalu){
- int pos = 0;
- int StartCodeFound, rewind;
- unsigned char *Buf;
-
- if ((Buf = (unsigned char*)calloc (nalu->max_size , sizeof(char))) == NULL)
- printf ("GetAnnexbNALU: Could not allocate Buf memory\n");
-
- nalu->startcodeprefix_len=3;
-
- if (3 != fread (Buf, 1, 3, h264bitstream)){
- free(Buf);
- return 0;
- }
- info2 = FindStartCode2 (Buf);
- if(info2 != 1) {
- if(1 != fread(Buf+3, 1, 1, h264bitstream)){
- free(Buf);
- return 0;
- }
- info3 = FindStartCode3 (Buf);
- if (info3 != 1){
- free(Buf);
- return -1;
- }
- else {
- pos = 4;
- nalu->startcodeprefix_len = 4;
- }
- }
- else{
- nalu->startcodeprefix_len = 3;
- pos = 3;
- }
- StartCodeFound = 0;
- info2 = 0;
- info3 = 0;
-
- while (!StartCodeFound){
- if (feof (h264bitstream)){
- nalu->len = (pos-1)-nalu->startcodeprefix_len;
- memcpy (nalu->buf, &Buf[nalu->startcodeprefix_len], nalu->len);
- nalu->forbidden_bit = nalu->buf[0] & 0x80;
- nalu->nal_reference_idc = nalu->buf[0] & 0x60;
- nalu->nal_unit_type = (nalu->buf[0]) & 0x1f;
- free(Buf);
- return pos-1;
- }
- Buf[pos++] = fgetc (h264bitstream);
- info3 = FindStartCode3(&Buf[pos-4]);
- if(info3 != 1)
- info2 = FindStartCode2(&Buf[pos-3]);
- StartCodeFound = (info2 == 1 || info3 == 1);
- }
-
-
-
- rewind = (info3 == 1)? -4 : -3;
-
- if (0 != fseek (h264bitstream, rewind, SEEK_CUR)){
- free(Buf);
- printf("GetAnnexbNALU: Cannot fseek in the bit stream file");
- }
-
-
-
-
-
- nalu->len = (pos+rewind)-nalu->startcodeprefix_len;
- memcpy (nalu->buf, &Buf[nalu->startcodeprefix_len], nalu->len);
- nalu->forbidden_bit = nalu->buf[0] & 0x80;
- nalu->nal_reference_idc = nalu->buf[0] & 0x60;
- nalu->nal_unit_type = (nalu->buf[0]) & 0x1f;
- free(Buf);
-
- return (pos+rewind);
- }
-
- int simplest_h264_parser(char *url){
-
- NALU_t *n;
- int buffersize=100000;
-
-
- FILE *myout=stdout;
-
- h264bitstream=fopen(url, "rb+");
- if (h264bitstream==NULL){
- printf("Open file error\n");
- return 0;
- }
-
- n = (NALU_t*)calloc (1, sizeof (NALU_t));
- if (n == NULL){
- printf("Alloc NALU Error\n");
- return 0;
- }
-
- n->max_size=buffersize;
- n->buf = (char*)calloc (buffersize, sizeof (char));
- if (n->buf == NULL){
- free (n);
- printf ("AllocNALU: n->buf");
- return 0;
- }
-
- int data_offset=0;
- int nal_num=0;
- printf("-----+-------- NALU Table ------+---------+\n");
- printf(" NUM | POS | IDC | TYPE | LEN |\n");
- printf("-----+---------+--------+-------+---------+\n");
-
- while(!feof(h264bitstream))
- {
- int data_lenth;
- data_lenth=GetAnnexbNALU(n);
-
- char type_str[20]={0};
- switch(n->nal_unit_type){
- case NALU_TYPE_SLICE:sprintf(type_str,"SLICE");break;
- case NALU_TYPE_DPA:sprintf(type_str,"DPA");break;
- case NALU_TYPE_DPB:sprintf(type_str,"DPB");break;
- case NALU_TYPE_DPC:sprintf(type_str,"DPC");break;
- case NALU_TYPE_IDR:sprintf(type_str,"IDR");break;
- case NALU_TYPE_SEI:sprintf(type_str,"SEI");break;
- case NALU_TYPE_SPS:sprintf(type_str,"SPS");break;
- case NALU_TYPE_PPS:sprintf(type_str,"PPS");break;
- case NALU_TYPE_AUD:sprintf(type_str,"AUD");break;
- case NALU_TYPE_EOSEQ:sprintf(type_str,"EOSEQ");break;
- case NALU_TYPE_EOSTREAM:sprintf(type_str,"EOSTREAM");break;
- case NALU_TYPE_FILL:sprintf(type_str,"FILL");break;
- }
- char idc_str[20]={0};
- switch(n->nal_reference_idc>>5){
- case NALU_PRIORITY_DISPOSABLE:sprintf(idc_str,"DISPOS");break;
- case NALU_PRIRITY_LOW:sprintf(idc_str,"LOW");break;
- case NALU_PRIORITY_HIGH:sprintf(idc_str,"HIGH");break;
- case NALU_PRIORITY_HIGHEST:sprintf(idc_str,"HIGHEST");break;
- }
-
- fprintf(myout,"%5d| %8d| %7s| %6s| %8d|\n",nal_num,data_offset,idc_str,type_str,n->len);
-
- data_offset=data_offset+data_lenth;
-
- nal_num++;
- }
-
-
- if (n){
- if (n->buf){
- free(n->buf);
- n->buf=NULL;
- }
- free (n);
- }
- return 0;
- }
上文中的函數調用方法如下所示。
- simplest_h264_parser("sintel.h264");
結果
本程序的輸入爲一個H.264原始碼流(裸流)的文件路徑,輸出爲該碼流的NALU統計數據,如下圖所示。

下載
Simplest mediadata test
項目主頁
SourceForge:https://sourceforge.net/projects/simplest-mediadata-test/
Github:https://github.com/leixiaohua1020/simplest_mediadata_test
開源中國:http://git.oschina.net/leixiaohua1020/simplest_mediadata_test
CSDN下載地址:http://download.csdn.net/detail/leixiaohua1020/9422409
本項目包含以下幾種視音頻數據解析示例:
(1)像素數據處理程序。包含RGB和YUV像素格式處理的函數。
(2)音頻採樣數據處理程序。包含PCM音頻採樣格式處理的函數。
(3)H.264碼流分析程序。能夠分離並解析NALU。
(4)AAC碼流分析程序。能夠分離並解析ADTS幀。
(5)FLV封裝格式分析程序。能夠將FLV中的MP3音頻碼流分離出來。
(6)UDP-RTP協議分析程序。能夠分析UDP/RTP/MPEG-TS數據包。
雷霄驊 (Lei Xiaohua)
leixiaohua1020@126.com
http://blog.csdn.net/leixiaohua1020