ffmpeg源码分析--11.mov的mov_read_header

最新推荐文章于 2024-05-15 11:29:46 发布

wangcong02345

最新推荐文章于 2024-05-15 11:29:46 发布

阅读量2.8k

点赞数

分类专栏：音视频

本文链接：https://blog.csdn.net/wangcong02345/article/details/52441835

版权

音视频专栏收录该内容

39 篇文章 5 订阅

订阅专栏

avformat_open_input
s->iformat->read_header(s)
--> mov_read_header

mov_read_default
-->mov_read_trak
-->mov_build_index

 
  static void mov_build_index(MOVContext *mov, AVStream *st)
 
 {
 
     MOVStreamContext *sc = st->priv_data;
 
     int64_t current_offset;
 
     int64_t current_dts = 0;
 
     uint64_t stream_size = 0;
     /*从媒体文件中读到video_trak的elst, sound_trak没有这个elst
  
        0000 0001               -->edit_count=1
 
     0014 6595               -->segment duration=0x146595
 
     0000 03e9               -->media time=0x3e9=1001  ;;这个就是video的开始时间，负的
 
     0001 0000               -->rate=0x1000,rate/65536=1.0
     */
     //下面这个if,因为只有video的elst_count=1,所以只是得出video的start_time
 
     if (sc->elst_count) {                                             //video:elst_count=1,sound:elst_count=0
         int i, edit_start_index = 0, unsupported = 0;
 
         int64_t empty_duration = 0; // empty duration of the first edit list entry
 
         int64_t start_time = 0; // start time of the media
 
         for (i = 0; i < sc->elst_count; i++) {
 
             const MOVElst *e = &sc->elst_data[i];                     
 
             if (i == 0 && e->time == -1) {                          //video:e->time=1001          
 
                 empty_duration = e->duration;
                 edit_start_index = 1;
 
             } else if (i == edit_start_index && e->time >= 0) {
 
                 start_time = e->time;                               //所以video的开始时间是1001,start_time=1001
 
             } else
                 unsupported = 1;
 
         }
 
         if ((empty_duration || start_time) && mov->time_scale > 0) {     //empty_duration=0
             if (empty_duration)
 
                 empty_duration = av_rescale(empty_duration, sc->time_scale, mov->time_scale);  //empty_duration=0
 
             sc->time_offset = start_time - empty_duration;                   //video:sc->time_offset=1001; sound:sc->time_offet=0
             current_dts = -sc->time_offset;                                  //video:current_dts=-1001;  sound:current_dts=0;
 
             if (sc->ctts_count>0 && sc->stts_count>0 &&
 
                 sc->ctts_data[0].duration / FFMAX(sc->stts_data[0].duration, 1) > 16) {
 
                 sc->wrong_dts = 1;
                 st->codec->has_b_frames = 1;
 
             }
 
         }
 
     }
 
     /* only use old uncompressed audio chunk demuxing when stts specifies it */
 
     if (!(st->codec->codec_type == AVMEDIA_TYPE_AUDIO &&
 
           sc->stts_count == 1 && sc->stts_data[0].duration == 1)) {
 
         unsigned int current_sample = 0;
 
         unsigned int stts_sample = 0;
 
         unsigned int sample_size;
 
         unsigned int distance = 0;
 
         unsigned int rap_group_index = 0;
 
         unsigned int rap_group_sample = 0;
 
         int64_t last_dts = 0;
 
         int64_t dts_correction = 0;
 
         int rap_group_present = sc->rap_group_count && sc->rap_group;
 
         int key_off = (sc->keyframe_count && sc->keyframes[0] > 0) || (sc->stps_count && sc->stps_data[0] > 0);
 
         current_dts -= sc; 
 
         last_dts = current_dts;                                         //video的current_dts=1001,sound的current_dts=0
 
         av_reallocp_array(&st->index_entries, st->nb_index_entries + sc->sample_count, sizeof(*st->index_entries));  //分配空间
         st->index_entries_allocated_size = (st->nb_index_entries + sc->sample_count) * sizeof(*st->index_entries);
 
         for (i = 0; i < sc->chunk_count; i++) {  //这个sc->chunk_count就是从"stco"中读取的video_chuk_cnt=0x4e56,sound_chunk_count=0xe10c
 
             int64_t next_offset = i+1 < sc->chunk_count ? sc->chunk_offsets[i+1] : INT64_MAX;
 
             current_offset = sc->chunk_offsets[i];          //chunk_offset表出自"stco",video与sound各自都有各自的"stco"
 
             while (stsc_index + 1 < sc->stsc_count &&  i + 1 == sc->stsc_data[stsc_index + 1].first)    //video与sound的stsc_count=1，所以stsc_index=0且一直为0
                 stsc_index++;
 
             for (j = 0; j < sc->stsc_data[stsc_index].count; j++) {
 
                 int keyframe = 0;
 
                 if (!sc->keyframe_absent && (!sc->keyframe_count || current_sample+key_off == sc->keyframes[stss_index])) {
 
                     keyframe = 1;
 
                     if (stss_index + 1 < sc->keyframe_count)
 
                         stss_index++;                                    //stss_index=0且一直为0
 
                 } else if (sc->stps_count && current_sample+key_off == sc->stps_data[stps_index]) {
 
                     keyframe = 1;
 
                     if (stps_index + 1 < sc->stps_count)
 
                         stps_index++;                            
 
                 }
 
                 if (sc->keyframe_absent && !sc->stps_count && !rap_group_present && (st->codec->codec_type == AVMEDIA_TYPE_AUDIO || (i==0 && j==0)))
                     keyframe = 1;
                 if (keyframe)
 
                     distance = 0;
 
                 sample_size = sc->stsz_sample_size > 0 ? sc->stsz_sample_size : sc->sample_sizes[current_sample];
 
                 if (sc->pseudo_stream_id == -1 ||
 
                    sc->stsc_data[stsc_index].id - 1 == sc->pseudo_stream_id) {
 
                     AVIndexEntry *e = &st->index_entries[st->nb_index_entries++];
 
                     e->pos = current_offset;
 
                     e->timestamp = current_dts;                                   //这个timestamp就是dts,计算过程就是start_time累加sample_duration
 
                     e->size = sample_size;
 
                     e->min_distance = distance;
 
                     e->flags = keyframe ? AVINDEX_KEYFRAME : 0;                    
                     if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO && st->nb_index_entries < 100)
 
                         ff_rfps_add_frame(mov->fc, st, current_dts);
 
                 }
 
                 current_offset += sample_size;
 
                 stream_size += sample_size;
 
                 if (sc->stts_data[stts_index].duration < 0) {                    
                     dts_correction += sc->stts_data[stts_index].duration - 1;
 
                     sc->stts_data[stts_index].duration = 1;
 
                 }
 
                 current_dts += sc->stts_data[stts_index].duration;
 
                 if (!dts_correction || current_dts + dts_correction > last_dts) {
 
                     current_dts += dts_correction;
 
                     dts_correction = 0;
 
                 } else {
 
                     dts_correction += current_dts - last_dts - 1;
                     current_dts = last_dts + 1;
 
                 }
 
                 last_dts = current_dts;
 
                 distance++;
 
                 stts_sample++;
 
                 current_sample++;
 
                 if (stts_index + 1 < sc->stts_count && stts_sample == sc->stts_data[stts_index].count) {
 
                     stts_sample = 0;              //对于video来说有很多个stts的entries，所以这个stts_index是累加的
 
                     stts_index++;                 //但对于sounde来说只有一个stts的entries，所以这个stts_index是不加的，一直为0
 
                 }
 
             }
 
         }
 
         if (st->duration > 0)
 
             st->codec->bit_rate = stream_size*8*sc->time_scale/st->duration;   //每条trak的bit_rate的计算
     } else {                                                        //video的0x7f0bb=520379,audio的bit_rate=0x14ec7=85703
         //这个else没有用到
     }
 
 }

video的dts的由来:
AVIndex stream=0, sample=0x0, offset=0x30, dts=-1001, size=0x1333, distance=0, keyframe=1
AVIndex stream=0, sample=0x1, offset=0x137d, dts=0x0, size=0xf6f, distance=1, keyframe=0
AVIndex stream=0, sample=0x2, offset=0x253c, dts=0xbbb, size=0x991, distance=2, keyframe=0
AVIndex stream=0, sample=0x3, offset=0x3143, dts=0x138d, size=0x9ab, distance=3, keyframe=0
AVIndex stream=0, sample=0x4, offset=0x3ca7, dts=0x1776, size=0x8e4, distance=4, keyframe=0

第0个dts就是从 video_trak的elst中解析出来的media time=0x3e9=1001 ，
然后把这个值 current_dts = -sc->time_offset; 取了个负值，所以dts_0 =-1001
以后的dts就是dts_0与sample_duration(在stts中)累加

00 020b a873 7474 73 -->stts的长度=0x20ba8,type=stts
00 0000 00 -->stts的version与flag
00 0041 73 -->entries=0x4173=16755 ::剩下的就是sample_count与sample_duration的entry
00 0000 01 -->sample_count=0x01 ::sample_count=1, sample_duration=1001
00 0003 e9 -->sample_duration=0x3e9
00 0000 01 -->sample_count=0x1 ::sample_count=1, sample_duration=3003
00 000b bb -->sample_duration=0xbbb
...

sound的dts的由来:
sc->chunk_count=0xe10c
AVIndex stream=1, sample=0x0, offset=0x1363, dts=0x0, size=0x1a, distance=0, keyframe=1
AVIndex stream=1, sample=0x1, offset=0x22ec, dts=0x400, size=0x9, distance=0, keyframe=1
AVIndex stream=1, sample=0x2, offset=0x22f5, dts=0x800, size=0x9, distance=0, keyframe=1
AVIndex stream=1, sample=0x3, offset=0x22fe, dts=0xc00, size=0xa1, distance=0, keyframe=1
AVIndex stream=1, sample=0x4, offset=0x239f, dts=0x1000, size=0xc9, distance=0, keyframe=1
sound没有elst这个box,所以 current_dts = 0，所以dts_0 =0
以后的dts就是dts_0与 sample_duration( 在stts中 )累加
但sounde只有一个stts的entries，所以这个sample_duration=0x400,恒定的

00 0000 1873 7474 73 -->stts的长度=0x18，type=stts
00 0000 00 -->stts的version与flag
00 0000 01 -->entries=0x01
00 00e1 0c -->sample_count=0xe10c=67612
00 0004 00 -->sample_duration=0x400

 
  static int mov_read_header(AVFormatContext *s)
 
 {
 
     MOVContext *mov = s->priv_data;
 
     AVIOContext *pb = s->pb;
 
     int j, err;
 
     MOVAtom atom = { AV_RL32("root") };
 
     int i;
 
     mov->fc = s;
 
     mov->trak_index = -1;
 
     /* .mov and .mp4 aren't streamable anyway (only progressive download if moov is before mdat) */
 
     if (pb->seekable)
 
         atom.size = avio_size(pb);
 
     else
 
         atom.size = INT64_MAX;
 
     /* check MOV header */
 
     do {
 
         if (mov->moov_retry)
 
             avio_seek(pb, 0, SEEK_SET);
 
         if ((err = mov_read_default(mov, pb, atom)) < 0) {
 
             av_log(s, AV_LOG_ERROR, "error reading header\n");
 
             mov_read_close(s);
 
             return err;
 
         }
 
     } while (pb->seekable && !mov->found_moov && !mov->moov_retry++);
 
     if (!mov->found_moov) {
 
         av_log(s, AV_LOG_ERROR, "moov atom not found\n");
 
         mov_read_close(s);
 
         return AVERROR_INVALIDDATA;
 
     }
 
     if (pb->seekable) {
         if (mov->chapter_track > 0 && !mov->ignore_chapters)
 
             mov_read_chapters(s);
 
         for (i = 0; i < s->nb_streams; i++)
 
             if (s->streams[i]->codec->codec_tag == AV_RL32("tmcd"))
 
                 mov_read_timecode_track(s, s->streams[i]);
 
     }
 
     /* copy timecode metadata from tmcd tracks to the related video streams */
 
     for (i = 0; i < s->nb_streams; i++) {
 
         AVStream *st = s->streams[i];
 
         MOVStreamContext *sc = st->priv_data;
 
         if (sc->timecode_track > 0) {
 
             AVDictionaryEntry *tcr;
 
             int tmcd_st_id = -1;
 
             for (j = 0; j < s->nb_streams; j++)
 
                 if (s->streams[j]->id == sc->timecode_track)
 
                     tmcd_st_id = j;
 
             if (tmcd_st_id < 0 || tmcd_st_id == i)
 
                 continue;
 
             tcr = av_dict_get(s->streams[tmcd_st_id]->metadata, "timecode", NULL, 0);
 
             if (tcr)
 
                 av_dict_set(&st->metadata, "timecode", tcr->value, 0);
 
         }
 
     }
 
     export_orphan_timecode(s);
 
     for (i = 0; i < s->nb_streams; i++) {
 
         AVStream *st = s->streams[i];
 
         MOVStreamContext *sc = st->priv_data;
 
         fix_timescale(mov, sc);
 
         if(st->codec->codec_type == AVMEDIA_TYPE_AUDIO && st->codec->codec_id == AV_CODEC_ID_AAC) {
 
             st->skip_samples = sc->start_pad;
 
         }
 
         if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO && sc->nb_frames_for_fps > 0 && sc->duration_for_fps > 0)
 
             av_reduce(&st->avg_frame_rate.num, &st->avg_frame_rate.den,
 
                     sc->time_scale*(int64_t)sc->nb_frames_for_fps, sc->duration_for_fps, INT_MAX);
 
         if (st->codec->codec_type == AVMEDIA_TYPE_SUBTITLE) {
 
             if (st->codec->width <= 0 || st->codec->height <= 0) {
 
                 st->codec->width = sc->width;
 
                 st->codec->height = sc->height;
 
             }
 
             if (st->codec->codec_id == AV_CODEC_ID_DVD_SUBTITLE) {
 
                 if ((err = mov_rewrite_dvd_sub_extradata(st)) < 0)
 
                     return err;
 
             }
 
         }
 
         if (mov->handbrake_version && mov->handbrake_version <= 1000000*0 + 1000*10 + 2 && st->codec->codec_id == AV_CODEC_ID_MP3) {
             st->need_parsing = AVSTREAM_PARSE_FULL;
         }
 
     }
 
     if (mov->trex_data) {
 
         for (i = 0; i < s->nb_streams; i++) {
 
             AVStream *st = s->streams[i];
 
             MOVStreamContext *sc = st->priv_data;
 
             if (st->duration > 0)
 
                 st->codec->bit_rate = sc->data_size * 8 * sc->time_scale / st->duration;
 
         }
 
     }
 
     if (mov->use_mfra_for > 0) {
 
         for (i = 0; i < s->nb_streams; i++) {
 
             AVStream *st = s->streams[i];
 
             MOVStreamContext *sc = st->priv_data;
 
             if (sc->duration_for_fps > 0) {
 
                 st->codec->bit_rate = sc->data_size * 8 * sc->time_scale /
 
                     sc->duration_for_fps;
 
             }
 
         }
 
     }
 
     for (i = 0; i < mov->bitrates_count && i < s->nb_streams; i++) {
 
         if (mov->bitrates[i]) {
 
             s->streams[i]->codec->bit_rate = mov->bitrates[i];
 
         }
 
     }
 
     ff_rfps_calculate(s);
 
     for (i = 0; i < s->nb_streams; i++) {
 
         AVStream *st = s->streams[i];
 
         MOVStreamContext *sc = st->priv_data;
 
         switch (st->codec->codec_type) {
 
             case AVMEDIA_TYPE_AUDIO:
 
                 err = ff_replaygain_export(st, s->metadata);
 
                 if (err < 0) {
 
                     mov_read_close(s);
 
                     return err;
 
                 }
 
                 break;
 
             case AVMEDIA_TYPE_VIDEO:
 
                 if (sc->display_matrix) {
 
                     AVPacketSideData *sd, *tmp;
 
                     tmp = av_realloc_array(st->side_data,
 
                             st->nb_side_data + 1, sizeof(*tmp));
 
                     if (!tmp)
 
                         return AVERROR(ENOMEM);
 
                     st->side_data = tmp;
 
                     st->nb_side_data++;
 
                     sd = &st->side_data[st->nb_side_data - 1];
 
                     sd->type = AV_PKT_DATA_DISPLAYMATRIX;
 
                     sd->size = sizeof(int32_t) * 9;
 
                     sd->data = (uint8_t*)sc->display_matrix;
 
                     sc->display_matrix = NULL;
 
                 }
 
                 break;
 
         }
 
     }
 
     ff_configure_buffers_for_index(s, AV_TIME_BASE);
 
     return 0;
 
 }

 
  static int mov_read_default(MOVContext *c, AVIOContext *pb, MOVAtom atom)
 
 {
 
     int64_t total_size = 0;
 
     MOVAtom a;
 
     int i;
 
     if (c->atom_depth > 10) {
 
         return AVERROR_INVALIDDATA;
     }
 
     c->atom_depth ++;
 
     if (atom.size < 0)
 
         atom.size = INT64_MAX;
 
     while (total_size + 8 <= atom.size && !avio_feof(pb)) {
 
         int (*parse)(MOVContext*, AVIOContext*, MOVAtom) = NULL;
 
         a.size = atom.size;
 
         a.type=0;
 
         if (atom.size >= 8) {
 
             a.size = avio_rb32(pb);
 
             a.type = avio_rl32(pb);
 
             if (a.type == MKTAG('f','r','e','e') &&
 
                     a.size >= 8 &&
 
                     c->moov_retry) {
 
                 uint8_t buf[8];
 
                 uint32_t *type = (uint32_t *)buf + 1;
 
                 if (avio_read(pb, buf, 8) != 8)
 
                     return AVERROR_INVALIDDATA;
 
                 avio_seek(pb, -8, SEEK_CUR);
 
                 if (*type == MKTAG('m','v','h','d') ||
 
                         *type == MKTAG('c','m','o','v')) {
 
                     a.type = MKTAG('m','o','o','v');
                 }
 
             }
 
             if (atom.type != MKTAG('r','o','o','t') && atom.type != MKTAG('m','o','o','v'))
             {
 
                 if (a.type == MKTAG('t','r','a','k') || a.type == MKTAG('m','d','a','t'))
 
                 {
 
                     avio_skip(pb, -8);
                     c->atom_depth --;
 
                     return 0;
 
                 }
 
             }
 
             total_size += 8;
 
             if (a.size == 1 && total_size + 8 <= atom.size) { /* 64 bit extended size */
 
                 a.size = avio_rb64(pb) - 8;
 
                 total_size += 8;
 
             }
 
         }
 
         if (a.size == 0) {
             a.size = atom.size - total_size + 8;
 
         }
 
         a.size -= 8;
 
         if (a.size < 0)
 
             break;
 
         a.size = FFMIN(a.size, atom.size - total_size);
 
         for (i = 0; mov_default_parse_table[i].type; i++)
 
             if (mov_default_parse_table[i].type == a.type) {
 
                 parse = mov_default_parse_table[i].parse;         //匹配type,调用各个box的读函数
 
                 break;
 
             }
 
         if (!parse && (atom.type == MKTAG('u','d','t','a') ||
                     atom.type == MKTAG('i','l','s','t')))
 
             parse = mov_read_udta_string;
 
         if (!parse && c->found_hdlr_mdta &&
 
                 atom.type == MKTAG('m','e','t','a') &&
 
                 a.type == MKTAG('k','e','y','s')) {
 
             parse = mov_read_keys;
 
         }
 
         if (!parse) { /* skip leaf atoms data */
 
             avio_skip(pb, a.size);
 
         } else {
 
             int64_t start_pos = avio_tell(pb);
 
             int64_t left;
 
             int err = parse(c, pb, a);
 
             if (err < 0) {
 
                 c->atom_depth --;
 
                 return err;
 
             }
 
             if (c->found_moov && c->found_mdat &&
 
                     ((!pb->seekable || c->fc->flags & AVFMT_FLAG_IGNIDX || c->fragment_index_complete) ||
 
                      start_pos + a.size == avio_size(pb))) {
 
                 if (!pb->seekable || c->fc->flags & AVFMT_FLAG_IGNIDX || c->fragment_index_complete)
 
                     c->next_root_atom = start_pos + a.size;
 
                 c->atom_depth --;
 
                 return 0;
 
             }
 
             left = a.size - avio_tell(pb) + start_pos;
 
             if (left > 0) 
 
                 avio_skip(pb, left);
 
             else if (left < 0) {            
                 avio_seek(pb, left, SEEK_CUR);
 
             }
 
         }
 
         total_size += a.size;
 
     }
 
     if (total_size < atom.size && atom.size < 0x7ffff)
 
         avio_skip(pb, atom.size - total_size);
 
     c->atom_depth --;
 
     return 0;
 
 }

所以box有如下:

 
  type='ftyp' ,parent='root',sz=32 8 102119991
 
 type='free' ,parent='root',sz=8 40 102119991
 
 type='mdat' ,parent='root',sz=101281678 48 102119991
 
 type='moov' ,parent='root',sz=838273 101281726 102119991
 
 type='mvhd' ,parent='moov',sz=108 8 838265
 
 type='trak' ,parent='moov',sz=376733 116 838265
 
 type='tkhd' ,parent='trak',sz=92 8 376725
 
 type='edts' ,parent='trak',sz=36 100 376725
 
 type='elst' ,parent='edts',sz=28 8 28
 
 type='mdia' ,parent='trak',sz=376597 136 376725
 
 type='mdhd' ,parent='mdia',sz=32 8 376589
 
 type='hdlr' ,parent='mdia',sz=45 40 376589
 
 type='minf' ,parent='mdia',sz=376512 85 376589
 
 type='vmhd' ,parent='minf',sz=20 8 376504
 
 type='dinf' ,parent='minf',sz=36 28 376504
 
 type='dref' ,parent='dinf',sz=28 8 28
 
 type='stbl' ,parent='minf',sz=376448 64 376504
 
 type='stsd' ,parent='stbl',sz=148 8 376440
 
 type='avcC' ,parent='stsd',sz=46 8 46
 
 type='stts' ,parent='stbl',sz=134056 156 376440
 
 type='stss' ,parent='stbl',sz=516 134212 376440
 
 type='ctts' ,parent='stbl',sz=81224 134728 376440
 
 type='stsc' ,parent='stbl',sz=28 215952 376440
 
 type='stsz' ,parent='stbl',sz=80236 215980 376440
 
 type='stco' ,parent='stbl',sz=80232 296216 376440
 
 type='trak' ,parent='moov',sz=461328 376849 838265
 
 type='tkhd' ,parent='trak',sz=92 8 461320
 
 type='mdia' ,parent='trak',sz=461228 100 461320
 
 type='mdhd' ,parent='mdia',sz=32 8 461220
 
 type='hdlr' ,parent='mdia',sz=45 40 461220
 
 type='minf' ,parent='mdia',sz=461143 85 461220
 
 type='smhd' ,parent='minf',sz=16 8 461135
 
 type='dinf' ,parent='minf',sz=36 24 461135
 
 type='dref' ,parent='dinf',sz=28 8 28
 
 type='stbl' ,parent='minf',sz=461083 60 461135
 
 type='stsd' ,parent='stbl',sz=91 8 461075
 
 type='esds' ,parent='stsd',sz=39 8 39
 
 type='stts' ,parent='stbl',sz=24 99 461075
 
 type='stsc' ,parent='stbl',sz=28 123 461075
 
 type='stsz' ,parent='stbl',sz=230468 151 461075
 
 type='stco' ,parent='stbl',sz=230464 230619 461075
 
 type='udta' ,parent='moov',sz=96 838177 838265
 
 type='meta' ,parent='udta',sz=88 8 88
 
 type='hdlr' ,parent='meta',sz=33 8 76
 
 type='ilst' ,parent='meta',sz=43 41 76
 
 type='?too' ,parent='ilst',sz=35 8 35