据传输媒体的质量不同,MPEG-2中定义了两种复合信息流:传送流(TS:TransportStream)和节目流(PS:ProgramStream)
PS文件分为3层:ps层(Program Stream)、pes层(Packet Elemental Stream)、es层(Elementary Stream)。es层就是音视频数据,pes层是在音视频数据上加了时间戳等对数据帧的说明信息,ps层是在pes层上加入了数据流识别和传输的必要信息。
1.Ps和Ts的区别
2.Ps文件结构
一个完整的MPEG-2文件就是一个PS流文件。使用Elecard StreamAnalyzer打开一个MPEG-2文件,得到下面信息。
2.1.Ps层
Ps层主要由pack header和数据组成,pack header中各个bit的意义如下
我们可以通过分析一个示例文件来了解它
scr += packet_size * 90000LL / (mux_rate * 50LL);
struct pack_header { unsigned char pack_start_code[4]; unsigned char system_clock_reference_base21 : 2; unsigned char marker_bit : 1; unsigned char system_clock_reference_base1 : 3; unsigned char fix_bit : 2; unsigned char system_clock_reference_base22; unsigned char system_clock_reference_base31 : 2; unsigned char marker_bit1 : 1; unsigned char system_clock_reference_base23 : 5; unsigned char system_clock_reference_base32; unsigned char system_clock_reference_extension1 : 2; unsigned char marker_bit2 : 1; unsigned char system_clock_reference_base33 : 5; unsigned char marker_bit3 : 1; unsigned char system_clock_reference_extension2 : 7; unsigned char program_mux_rate1; unsigned char program_mux_rate2; unsigned char marker_bit5 : 1; unsigned char marker_bit4 : 1; unsigned char program_mux_rate3 : 6; unsigned char pack_stuffing_length : 3; unsigned char reserved : 5; pack_header() { pack_start_code[0] = 0x00; pack_start_code[1] = 0x00; pack_start_code[2] = 0x01; pack_start_code[3] = 0xBA; fix_bit = 0x01; marker_bit = 0x01; marker_bit1 = 0x01; marker_bit2 = 0x01; marker_bit3 = 0x01; marker_bit4 = 0x01; marker_bit5 = 0x01; reserved = 0x1F; pack_stuffing_length = 0x00; system_clock_reference_extension1 = 0; system_clock_reference_extension2 = 0; } void getSystem_clock_reference_base(UINT64 &_ui64SCR) { _ui64SCR = (system_clock_reference_base1 << 30) | (system_clock_reference_base21 << 28) | (system_clock_reference_base22 << 20) | (system_clock_reference_base23 << 15) | (system_clock_reference_base31 << 13) | (system_clock_reference_base32 << 5) | (system_clock_reference_base33); } void setSystem_clock_reference_base(UINT64 _ui64SCR) { system_clock_reference_base1 = (_ui64SCR >> 30) & 0x07; system_clock_reference_base21 = (_ui64SCR >> 28) & 0x03; system_clock_reference_base22 = (_ui64SCR >> 20) & 0xFF; system_clock_reference_base23 = (_ui64SCR >> 15) & 0x1F; system_clock_reference_base31 = (_ui64SCR >> 13) & 0x03; system_clock_reference_base32 = (_ui64SCR >> 5) & 0xFF; system_clock_reference_base33 = _ui64SCR & 0x1F; } void getProgram_mux_rate(unsigned int &_uiMux_rate) { _uiMux_rate = (program_mux_rate1 << 14) | (program_mux_rate2 << 6) | program_mux_rate3; } void setProgram_mux_rate(unsigned int _uiMux_rate) { program_mux_rate1 = (_uiMux_rate >> 14) & 0xFF; program_mux_rate2 = (_uiMux_rate >> 6) & 0xFF; program_mux_rate3 = _uiMux_rate & 0x3F; } };
这样的好处是可以直接通过
pack_header header; header.setProgram_mux_rate(25200); header.setSystem_clock_reference_base(0); os.write((char *)&header, sizeof(header));
来写入文件,但是不方便抽象成类,所以就参考ffmpeg使用了put_bits的方式
class PackHeader : public HeaderBase { public: UINT64 SCRBase; UINT8 SCRExt; UINT32 programMuxRate; UINT8 stuffingLength; PackHeader(); virtual ~PackHeader(); int Serialize(); };
然后在类中加一个序列化函数,来将整个类序列化
int PackHeader::Serialize() { int calcBinaryBitLen = 32 //pack_start_code + 2 // '01' + 3 //system_clock_reference_base [32..30] + 1 //marker_bit + 15 //system_clock_reference_base [29..15] + 1 //marker_bit + 15 //system_clock_reference_base [14..0] + 1 //marker_bit + 9 //system_clock_reference_extension + 1 //marker_bit + 22 // program_mux_rate + 1 //marker_bit + 1 //marker_bit + 5 //reserved + 3; //pack_stuffing_length if (stuffingLength > 0) { for (int i = 0; i < stuffingLength; i++) { calcBinaryBitLen += 8; } } if ((calcBinaryBitLen / 8) > binaryLen) { if (binary) delete[] binary; binary = new BYTE[calcBinaryBitLen / 8]; } binaryLen = calcBinaryBitLen / 8; BYTE* p = binary; bits_buffer_t bw; bits_initwrite(&bw, binaryLen, p); bits_write(&bw, 32, PACK_HEADER_START_CODE); //pack_start_code bits_write(&bw, 2, 0x1); // '01' bits_write(&bw, 3, (SCRBase >> 30) & 0x07); //system_clock_reference_base [32..30] bits_write(&bw, 1, 1); //marker_bit bits_write(&bw, 15, (SCRBase >> 15) & 0x7FFF); //system_clock_reference_base [29..15] bits_write(&bw, 1, 1); //marker_bit bits_write(&bw, 15, SCRBase & 0x7FFF); //system_clock_reference_base [14..0] bits_write(&bw, 1, 1); //marker_bit bits_write(&bw, 9, SCRExt); //system_clock_reference_extension bits_write(&bw, 1, 1); //marker_bit bits_write(&bw, 22, programMuxRate & 0x3FFFFF); // program_mux_rate bits_write(&bw, 1, 1); //marker_bit bits_write(&bw, 1, 1); //marker_bit bits_write(&bw, 5, 0x1F); //reserved bits_write(&bw, 3, stuffingLength & 0x07); //pack_stuffing_length if (stuffingLength > 0) { for (int i = 0; i < stuffingLength; i++) { bits_write(&bw, 8, 0xFF); //stuffing } } return 1; }
对于DVD而言,一般开始的pack里面还有一个System header
我们也可以通过分析一个示例文件来了解它
2.2.Pes层
Pes层由编码的音频或视频数据(es)加上Pes头组成的,Pes头主要是通过PTS和DTS来提供音视频同步的信息,Pes头的各个bit的意义如下所示
Pes头之后紧跟着的就是编码的音频或视频数据(es)了,对于DVD而言,一个program pack的大小问0x800,所以一帧MPEG-2视频被分在多个Pes包里,不够一个包的就写在下一帧的第一个pack里,或在Pes Header后面填充FF(PES_header_data_length要加上填充的字节数)。