【多媒体封装格式详解】---MP4【4】-mandagod-ChinaUnix博客

Ryan's&nbsp;Blogmanda.blog.chinaunix.net

首页　| 　博文目录　| 　关于我

mandagod

博客访问： 682073
博文数量： 160
博客积分： 2384
博客等级：大尉
技术积分： 1366
用户组：普通用户
注册时间： 2008-12-01 11:35

文章分类

全部博文（160）

Java（2）
Android（33）
面试相关（18）
多媒体技术（17）
嵌入式webserver（0）
算法与数据结构（3）
随意杂记（5）
Linux-ARM Embedd（14）
Linux内核（6）
Linux工具配置（20）
OpenOffice（8）
未分配的博文（34）

文章存档

2015年（45）

2014年（36）

2012年（28）

2011年（37）

2010年（2）

2009年（10）

2008年（2）

我的朋友

相关博文

【多媒体封装格式详解】---MP4【4】

分类：其他平台

2015-05-29 11:30:02

前面介绍过的几种格式flv、mkv、asf等。他们音视频的数据包一般都是按照文件的顺序交叉安放。你解析完头部信息后。剩下的一般就按照文件顺序一个数据包一个数据包的解析就行了。但是MP4完全不是这种概念。他的媒体信息和数据是分开存放的。就是你想获得数据之前必须要解析出每个帧数据所有的位置。mp4存放这个帧信息的是放在stbl这个box里。而真实的数据放在mdat中。接下来就讲讲stbl与mdat的对应关系。

Sample Table Box(stbl)

来一张典型的stbl结构图：

常见子box

stts: Decoding Time to Sample Box 时间戳和Sample映射表
stsd: Sample Description Box
stsz, stz2: Sample Size Boxes 每个Sample大小的表。
stsc: Sample to chunk 的映射表。
‘stco’, ‘co64’: Chunk位置偏移表
stss：关键帧index。

1.解析stsd可获得coding类型、视频宽高、音频samplesize、channelcount这些和解码器有关信息。

[cpp]view plaincopy
			
			aligned(8) class SampleDescriptionBox (unsigned int(32) handler_type)  
		
			extends FullBox('stsd', 0, 0){  
		
			int i ;  
		
			unsigned int(32) entry_count;  
		
			for (i = 1 ; i u entry_count ; i++){  
		
			switch (handler_type){  
		
			case ‘soun’: // for audio tracks  
		
			AudioSampleEntry();  
		
			break;  
		
			case ‘vide’: // for video tracks  
		
			VisualSampleEntry();  
		
			break;  
		
			case ‘hint’: // Hint track  
		
			HintSampleEntry();  
		
			break;  
		
			}  
		
			}  
		
			}

[cpp]view plaincopy
			
			aligned(8) abstract class SampleEntry (unsigned int(32) format)  
		
			extends Box(format){  
		
			const unsigned int(8)[6] reserved = 0;  
		
			unsigned int(16) data_reference_index;  
		
			}  
		
			class HintSampleEntry() extends SampleEntry (protocol) {  
		
			unsigned int(8) data [];  
		
			}  
		
			// Visual Sequences  
		
			class VisualSampleEntry(codingname) extends SampleEntry (codingname){  
		
			unsigned int(16) pre_defined = 0;  
		
			const unsigned int(16) reserved = 0;  
		
			unsigned int(32)[3] pre_defined = 0;  
		
			unsigned int(16) width;  
		
			unsigned int(16) height;  
		
			template unsigned int(32) horizresolution = 0x00480000; // 72 dpi  
		
			template unsigned int(32) vertresolution = 0x00480000; // 72 dpi  
		
			const unsigned int(32) reserved = 0;  
		
			template unsigned int(16) frame_count = 1;  
		
			string[32] compressorname;  
		
			template unsigned int(16) depth = 0x0018;  
		
			int(16) pre_defined = -1;  
		
			}  
		
			// Audio Sequences  
		
			class AudioSampleEntry(codingname) extends SampleEntry (codingname){  
		
			const unsigned int(32)[2] reserved = 0;  
		
			template unsigned int(16) channelcount = 2;  
		
			template unsigned int(16) samplesize = 16;  
		
			unsigned int(16) pre_defined = 0;  
		
			const unsigned int(16) reserved = 0 ;  
		
			template unsigned int(32) samplerate = {timescale of media}<<16;  
		
			}

2.解析stsz box 可以获得一个sample size的表

[cpp]view plaincopy
			
			aligned(8) class SampleSizeBox extends FullBox(‘stsz’, version = 0, 0) {  
		
			unsigned int(32) sample_size;  
		
			unsigned int(32) sample_count;  
		
			if (sample_size==0) {  
		
			for (i=1; i u sample_count; i++) {  
		
			unsigned int(32) entry_size;  
		
			}  
		
			}  
		
			}

3.解析stts

[cpp]view plaincopy
			
			aligned(8) class TimeToSampleBox  
		
			extends FullBox(’stts’, version = 0, 0) {  
		
			unsigned int(32) entry_count;  
		
			int i;  
		
			for (i=0; i < entry_count; i++) {  
		
			unsigned int(32) sample_count;  
		
			unsigned int(32) sample_delta;  
		
			}  
		
			}

4.解析stsc 还原Sample 与chunk的映射表

Sample 是存储的最基本单元，mp4把Sample 存在chunk中。chunk的长度、chunk的大小、chunk中Sample的数量及大小都是不定的。

通过解析这部分box来还原这个映射表。

[cpp]view plaincopy
			
			aligned(8) class SampleToChunkBox  
		
			extends FullBox(‘stsc’, version = 0, 0) {  
		
			unsigned int(32) entry_count;  
		
			for (i=1; i u entry_count; i++) {  
		
			unsigned int(32) first_chunk;  
		
			unsigned int(32) samples_per_chunk;  
		
			unsigned int(32) sample_description_index;  
		
			}  
		
			}

每个entry 表示着一组数据，entry_count 表示这数量。这一组其实是相同类型的chunk。

first_chunk 表示这一组相同类型的chunk中的第一个chunk数。

这些chunk 中包含的Sample 数量，即samples_per_chunk 是一致的。

每个Sample 可以通过sample_description_index 去stsd box 找到描述信息。

看ffmpeg中mov_read_stsc() 它把这些数据放在一个结构体数组中备用。

[cpp]view plaincopy
			
			static int mov_read_stsc(MOVContext *c, AVIOContext *pb, MOVAtom atom)  
		
			{  
		
			    AVStream *st;  
		
			    MOVStreamContext *sc;  
		
			    unsigned int i, entries;  
		
			    if (c->fc->nb_streams < 1)  
		
			        return 0;  
		
			    st = c->fc->streams[c->fc->nb_streams-1];  
		
			    sc = st->priv_data;  
		
			    avio_r8(pb); /* version */  
		
			    avio_rb24(pb); /* flags */  
		
			    entries = avio_rb32(pb);  
		
			    av_dlog(c->fc, "track[%i].stsc.entries = %i\n", c->fc->nb_streams-1, entries);  
		
			    if (!entries)  
		
			        return 0;  
		
			    if (entries >= UINT_MAX / sizeof(*sc->stsc_data))  
		
			        return AVERROR_INVALIDDATA;  
		
			    sc->stsc_data = av_malloc(entries * sizeof(*sc->stsc_data));  
		
			    if (!sc->stsc_data)  
		
			        return AVERROR(ENOMEM);  
		
			    for (i = 0; i < entries && !pb->eof_reached; i++) {  
		
			        sc->stsc_data[i].first = avio_rb32(pb);  
		
			        sc->stsc_data[i].count = avio_rb32(pb);  
		
			        sc->stsc_data[i].id = avio_rb32(pb);  
		
			    }  
		
			    sc->stsc_count = i;  
		
			    if (pb->eof_reached)  
		
			        return AVERROR_EOF;  
		
			    return 0;  
		
			}

在获得完整的映射表，我们还需要chunk总个数信息。这些信息放在‘stco’, ‘co64’中。

5.解析‘stco’, ‘co64’

“stco”定义了每个thunk在媒体流中的位置。位置有两种可能，32位的和64位的，后者对非常大的电影很有用。

32位

[cpp]view plaincopy
			
			aligned(8) class ChunkOffsetBox  
		
			extends FullBox(‘stco’, version = 0, 0) {  
		
			unsigned int(32) entry_count;  
		
			for (i=1; i u entry_count; i++) {  
		
			unsigned int(32) chunk_offset;  
		
			}  
		
			}

64位

[cpp]view plaincopy
			
			aligned(8) class ChunkLargeOffsetBox  
		
			extends FullBox(‘co64’, version = 0, 0) {  
		
			unsigned int(32) entry_count;  
		
			for (i=1; i u entry_count; i++) {  
		
			unsigned int(64) chunk_offset;  
		
			}  
		
			}

从这个box我们就可以获得 chunk 的总数量，entry_count。

1.解析‘stco’, ‘co64’我们有了chunk 表，知道了chunk 的总数及每个chunk所在文件的位置。

2.解析stsc 配合着上面的chunk表，我们就能弄个Sample与chunk的关系表。我们也就能获得每个Sample的位置信息。

3.配合上面的stts 时间表和解码器信息等。搞出ES流已经不成问题了。

4.想获得关键帧的index，需要解析stss’

[cpp]view plaincopy
			
			aligned(8) class SyncSampleBox  
		
			extends FullBox(‘stss’, version = 0, 0) {  
		
			unsigned int(32) entry_count;  
		
			int i;  
		
			for (i=0; i < entry_count; i++) {  
		
			unsigned int(32) sample_number;  
		
			}  
		
			}

阅读(2416) | 评论(0) | 转发(0) |

上一篇：【多媒体封装格式详解】---MP4【3】

下一篇：【多媒体基础知识】 ---常见音频编码格式总结

给主人留下些什么吧！~~

感谢所有关心和支持过ChinaUnix的朋友们

16024965号-6