ffmpeg解码音频的两种方式（一）av_parser_parse解析器

最新推荐文章于 2025-03-20 15:23:03 发布
且行且探索
最新推荐文章于 2025-03-20 15:23:03 发布
阅读量4.2k
点赞数
分类专栏： FFMPEG
本文链接：https://blog.csdn.net/encoder1234/article/details/78832618
版权
FFMPEG 专栏收录该内容
16 篇文章
订阅专栏
使用ffmpeg解析器（av_parser_parse2）从裸音频流中自动提取单帧数据，解码后重采样为PCM并通过SDL播放：
#include "stdafx.h"
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
extern "C"
{
#include "libavcodec/avcodec.h"
#include "libavformat/avformat.h"
#include "libswresample/swresample.h"
//SDL
#include "sdl/SDL.h"
#include "sdl/SDL_thread.h"
};

#define MAX_AUDIO_FRAME_SIZE 192000 // 1 second of 48khz 32bit audio

//Output PCM
#define OUTPUT_PCM 1
//Use SDL
#define USE_SDL 1

// Playback state shared between the decoding code and the SDL audio callback.
static  Uint8  *audio_chunk;	// start of the PCM buffer currently queued for playback
static  Uint32  audio_len;	// bytes of that buffer not yet handed to SDL
static  Uint8  *audio_pos;	// next byte of that buffer to hand to SDL

/*
 * SDL audio callback: fills `stream` with up to `len` bytes of pending PCM.
 *
 * udata  - user pointer registered with the audio spec (not used here)
 * stream - device buffer to fill
 * len    - size of `stream` in bytes
 *
 * The buffer is cleared first (SDL 2.0 does not pre-clear it), so whatever
 * part is not covered by pending data stays silent.
 */
void  fill_audio(void *udata,Uint8 *stream,int len){
	SDL_memset(stream, 0, len);

	if(audio_len!=0){
		// Never hand out more than what is still pending.
		if(len>audio_len)
			len=audio_len;

		SDL_MixAudio(stream,audio_pos,len,SDL_MIX_MAXVOLUME);

		// Consume the bytes that were just mixed.
		audio_pos += len;
		audio_len -= len;
	}
}
//-----------------

// Scratch buffer that holds the text produced by av_get_err().
static char err_buf[128] = {0};

/*
 * Asks av_strerror() to describe `errnum` and returns the result.
 *
 * The returned pointer refers to the shared static buffer above, so each
 * call overwrites the text produced by the previous one.
 */
static char* av_get_err(int errnum)
{
    av_strerror(errnum, err_buf, sizeof err_buf);
    return err_buf;
}

int nWriteBytes=0;
int _tmain(int argc, _TCHAR* argv[])
{
	AVFormatContext	*pFormatCtx;
	int				i, audioStream;
	AVCodecContext	*pCodecCtx;
	AVCodec			*pCodec;
	AVCodecParserContext * pParser;

	//char url[]="WavinFlag.aac";
	//char url[]="1.mp2";
	char url[]="2.mp3";

	av_register_all();
	pCodec=avcodec_find_decoder(AV_CODEC_ID_MP3/*AV_CODEC_ID_AAC*/);//AV_CODEC_ID_MP2
	if(pCodec==NULL){
		printf("Codec not found.\n");
		return -1;
	}

	pCodecCtx = avcodec_alloc_context3(pCodec);

	// Open codec
	if(avcodec_open2(pCodecCtx, pCodec,NULL)<0){
		printf("Could not open codec.\n");
		return -1;
	}

	pParser = av_parser_init(/*AV_CODEC_ID_AAC*/AV_CODEC_ID_MP3);
	if(!pParser){
		printf("av_parser_init AV_CODEC_ID_MP3 failed.\n");
		return -1;
	}

	FILE *pFile=NULL;
	FILE *pInFile = NULL;
#if OUTPUT_PCM
	pFile=fopen("output.pcm", "wb");
	pInFile=fopen(url, "rb");
#endif
	
	//Out Audio Param
	uint64_t out_channel_layout=AV_CH_LAYOUT_STEREO;
	int out_nb_samples=/*1024*/1152;
	AVSampleFormat out_sample_fmt=AV_SAMPLE_FMT_S16;
	int out_sample_rate=44100;
	int out_channels=av_get_channel_layout_nb_channels(out_channel_layout);
	//输出内存大小
	int out_buffer_size=av_samples_get_buffer_size(NULL,out_channels ,out_nb_samples,out_sample_fmt, 1);

	uint8_t *out_buffer=(uint8_t *)av_malloc(MAX_AUDIO_FRAME_SIZE*2);
	
	AVFrame *pFrame = av_frame_alloc();
	avcodec_get_frame_defaults(pFrame);

//SDL------------------
#if USE_SDL
	//Init
	if(SDL_Init(SDL_INIT_VIDEO | SDL_INIT_AUDIO | SDL_INIT_TIMER)) {  
		printf( "Could not initialize SDL - %s\n", SDL_GetError()); 
		return -1;
	}
	//SDL_AudioSpec
	SDL_AudioSpec wanted_spec;
	wanted_spec.freq = out_sample_rate; 
	wanted_spec.format = AUDIO_S16SYS; 
	wanted_spec.channels = out_channels; 
	wanted_spec.silence = 0; 
	wanted_spec.samples = out_nb_samples/*pCodecCtx->frame_size*/; 
	wanted_spec.callback = fill_audio; 
	wanted_spec.userdata = pCodecCtx; 
		
	if (SDL_OpenAudio(&wanted_spec, NULL)<0){ 
		printf("can't open audio.\n"); 
		return -1; 
	} 
#endif
	printf("Bitrate:\t %3d\n", pFormatCtx->bit_rate);
	//printf("Decoder Name:\t %s\n", pCodecCtx->codec->long_name);
	//printf("Channels:\t %d\n", pCodecCtx->channels);
	//printf("Sample per Second\t %d \n", pCodecCtx->sample_rate);

	uint32_t ret,len = 0;
	int got_picture;
	int index = 0;
	struct SwrContext *au_convert_ctx;
	au_convert_ctx = swr_alloc();
	//au_convert_ctx=swr_alloc_set_opts(au_convert_ctx,out_channel_layout, out_sample_fmt, out_sample_rate,
	//	pCodecCtx->channel_layout,pCodecCtx->sample_fmt , pCodecCtx->sample_rate,0, NULL);
	//swr_init(au_convert_ctx);
	
	int data_size = 0;
	int size = 0;
	int cnt=0;
	int offset=0;

	//FILE *myout=fopen("output_log.txt","wb+");
	FILE *myout=stdout;

	unsigned char *aacframe=(unsigned char *)malloc(1024*5);
	unsigned char *aacbuffer=(unsigned char *)malloc(1024*1024);

	FILE *ifile = fopen(url, "rb");
	if(!ifile){
		printf("Open file error");
		return -1;
	}

	printf(" aac 帧: NUM - Profile - Frequency - Size |\n");
	
	while(!feof(ifile)){
		data_size = fread(aacbuffer+offset, 1, 1024*1024-offset, ifile);
		unsigned char* input_data = aacbuffer+offset;

		uint8_t *pParserBufOut = NULL;
		int pParserOutLength = 0;

		while(data_size>0){
			int nParserLen = av_parser_parse2(pParser, pCodecCtx, &pParserBufOut, &pParserOutLength,
												(uint8_t *)input_data, data_size,0, 0, 0);			
			if(nParserLen>0){
				input_data += nParserLen;
				data_size  -= nParserLen;

				if(pParserOutLength>0){
					AVPacket avpkt;
					av_init_packet(&avpkt);
					avpkt.data = (uint8_t *)pParserBufOut;  
					avpkt.size = pParserOutLength;

					//此处不需要循环，每次解析的都是一个es流的一个单帧，直接解码成功
					while(avpkt.size>0){
						ret = avcodec_decode_audio4( pCodecCtx, pFrame,&got_picture, &avpkt);
						if ( ret < 0 ) {
							printf("Error in decoding audio frame.\n");
							return -1;
						}
						//printf("avcodec_decode_audio4 %s \n", av_get_err(ret));
						//if(AVERROR_INVALIDDATA==ret){
						//	continue;
						//}

						//需要解码后初始化，否则pCodecCtx的参数尚未获取到（纯净版不用预先指定参数）
						static bool bSwrInit=false;
						if(!bSwrInit){
							au_convert_ctx=swr_alloc_set_opts(au_convert_ctx,out_channel_layout, out_sample_fmt, out_sample_rate,
								pCodecCtx->channel_layout,pCodecCtx->sample_fmt , pCodecCtx->sample_rate,0, NULL);
							swr_init(au_convert_ctx);
							bSwrInit=true;
						}
						
						if(got_picture > 0){					
							int nBytes = swr_convert(au_convert_ctx,&out_buffer, MAX_AUDIO_FRAME_SIZE,(const uint8_t **)pFrame->data , pFrame->nb_samples);
							if(nBytes<0){
								printf("swr_convert failed \n");
								return 0;
							}
							nWriteBytes = av_samples_get_buffer_size(NULL, out_channels, nBytes, out_sample_fmt, 1);
							if(nWriteBytes<0){
								printf("av_samples_get_buffer_size failed \n");
								return 0;
							}
							fwrite(out_buffer, 1, nWriteBytes, pFile);
						}

						//设置音频数据缓冲,PCM数据
						audio_chunk = (Uint8 *) out_buffer; 
						//设置音频数据长度
						audio_len = nWriteBytes;
						audio_pos = audio_chunk;
						//回放音频数据 
						SDL_PauseAudio(0);
						while(audio_len>0)//等待直到音频数据播放完毕! 
							SDL_Delay(1); 
	
						avpkt.data+=ret;
						avpkt.size-=ret;
					}
					av_free_packet(&avpkt);
				}
			}
		}		
	}
	fclose(ifile);
	free(aacbuffer);
	fclose(pFile);

#if USE_SDL
	SDL_CloseAudio();//关闭音频设备 
	SDL_Quit();
#endif
	
	swr_free(&au_convert_ctx);
	av_free(out_buffer);
	avcodec_close(pCodecCtx);
	av_parser_close(pParser);
	
	return 0;
}