ffmpeg音频转码，采用swr_convert重取样

最新推荐文章于 2023-06-29 20:14:07 发布
wishfly
最新推荐文章于 2023-06-29 20:14:07 发布
阅读量2.9k
点赞数 1
1、概述：

和上一篇音频转码流程一样，只是把filter重取样改为了swr_convert重取样，理解本例子对AVFrame中data如何存储音频数据有更好的理解。
2、代码：

[cpp]view plaincopy 
    
 /* 
 *最简单的音频转码器（只处理音频） 
 *缪国凯 Mickel 
 *821486004@qq.com 
 *本程序实现从一个视频格式转码到另一个视频格式，只处理音频，视频忽略，若有多个音频流，只处理第一个,采用swr_convert重取样 
 *2015-5-8 
 */  
   
   
 #include "stdafx.h"  
   
 #ifdef __cplusplus  
 extern"C"  
 {  
 #endif  
 #include <libavformat/avformat.h>  
 #include "libavcodec/avcodec.h"  
 #include "libavfilter/avfiltergraph.h"  
 #include "libavfilter/buffersink.h"  
 #include "libavfilter/buffersrc.h"  
 #include "libavutil/avutil.h"  
 #include "libavutil/opt.h"  
 #include "libavutil/pixdesc.h"  
 #include "libswresample\swresample.h"  
 #include "libavutil\fifo.h"  
   
   
 #pragma comment(lib, "avcodec.lib")  
 #pragma comment(lib, "avformat.lib")  
 #pragma comment(lib, "avutil.lib")  
     //#pragma comment(lib, "avdevice.lib")  
 #pragma comment(lib, "avfilter.lib")  
     //#pragma comment(lib, "postproc.lib")  
 #pragma comment(lib, "swresample.lib")  
     //#pragma comment(lib, "swscale.lib")  
 #ifdef __cplusplus  
 };  
 #endif  
   
 #define BUF_SIZE_20K 2048000  
 #define BUF_SIZE_1K 1024000  
   
 SwrContext* pSwrCtx = NULL;  
 AVStream *out_stream = NULL;  
 AVFormatContext *in_fmt_ctx = NULL, *out_fmt_ctx = NULL;  
 int audio_index = -1;  
   
 void initSwr()  
 {  
     if (out_fmt_ctx->streams[0]->codec->channels != in_fmt_ctx->streams[audio_index]->codec->channels  
         || out_fmt_ctx->streams[0]->codec->sample_rate != in_fmt_ctx->streams[audio_index]->codec->sample_rate  
         || out_fmt_ctx->streams[0]->codec->sample_fmt != in_fmt_ctx->streams[audio_index]->codec->sample_fmt)  
     {  
         if ( NULL == pSwrCtx )   
         {  
             pSwrCtx = swr_alloc();  
         }  
 #if LIBSWRESAMPLE_VERSION_MINOR >= 17    // 根据版本不同，选用适当函数  
         av_opt_set_int(pSwrCtx, "ich", in_fmt_ctx->streams[audio_index]->codec->channels, 0);  
         av_opt_set_int(pSwrCtx, "och", out_fmt_ctx->streams[0]->codec->channels, 0);  
         av_opt_set_int(pSwrCtx, "in_sample_rate",  in_fmt_ctx->streams[audio_index]->codec->sample_rate, 0);  
         av_opt_set_int(pSwrCtx, "out_sample_rate",  out_fmt_ctx->streams[0]->codec->sample_rate, 0);  
         av_opt_set_sample_fmt(pSwrCtx, "in_sample_fmt", in_fmt_ctx->streams[audio_index]->codec->sample_fmt, 0);  
         av_opt_set_sample_fmt(pSwrCtx, "out_sample_fmt", out_fmt_ctx->streams[0]->codec->sample_fmt, 0);  
   
 #else  
         pSwrCtx = swr_alloc_set_opts(pSwrCtx,             
             out_fmt_ctx->streams[0]->codec->channel_layout,   
             out_fmt_ctx->streams[0]->codec->sample_fmt,   
             out_fmt_ctx->streams[0]->codec->->sample_rate,  
             in_fmt_ctx->streams[audio_index]->codec->channel_layout,   
             in_fmt_ctx->streams[audio_index]->codec->sample_fmt,   
             in_fmt_ctx->streams[audio_index]->codec->sample_rate,  
             0, NULL);  
 #endif  
         swr_init(pSwrCtx);  
     }  
 }  
   
 //setup_array函数摘自ffmpeg例程  
 static void setup_array(uint8_t* out[SWR_CH_MAX], AVFrame* in_frame, int format, int samples)  
 {  
     if (av_sample_fmt_is_planar((AVSampleFormat)format))   
     {  
         int i;int plane_size = av_get_bytes_per_sample((AVSampleFormat)(format & 0xFF)) * samples;format &= 0xFF;  
           
         //从decoder出来的frame中的data数据不是连续分布的，所以不能这样写：  
         in_frame->data[0]+i*plane_size;  
         for (i = 0; i < in_frame->channels; i++)  
         {  
             out[i] = in_frame->data[i];  
         }  
     }   
     else  
     {  
         out[0] = in_frame->data[0];  
     }  
 }  
   
 int TransSample(AVFrame *in_frame, AVFrame *out_frame)  
 {  
     int ret;  
     int max_dst_nb_samples = 4096;  
     //int64_t dst_nb_samples;  
     int64_t src_nb_samples = in_frame->nb_samples;  
     out_frame->pts = in_frame->pts;  
     uint8_t* paudiobuf;  
     int decode_size, input_size, len;  
     if (pSwrCtx != NULL)   
     {  
         out_frame->nb_samples = av_rescale_rnd(swr_get_delay(pSwrCtx, out_fmt_ctx->streams[0]->codec->sample_rate) + src_nb_samples,  
             out_fmt_ctx->streams[0]->codec->sample_rate, in_fmt_ctx->streams[audio_index]->codec->sample_rate, AV_ROUND_UP);  
   
         ret = av_samples_alloc(out_frame->data,   
             &out_frame->linesize[0],   
             out_fmt_ctx->streams[0]->codec->channels,   
             out_frame->nb_samples,   
             out_fmt_ctx->streams[0]->codec->sample_fmt, 0);  
           
         if (ret < 0)  
         {  
             av_log(NULL, AV_LOG_WARNING, "[%s.%d %s() Could not allocate samples Buffer\n", __FILE__, __LINE__, __FUNCTION__);  
             return -1;  
         }  
           
         max_dst_nb_samples = out_frame->nb_samples;  
         //输入也可能是分平面的，所以要做如下处理  
         uint8_t* m_ain[SWR_CH_MAX];  
         setup_array(m_ain, in_frame, in_fmt_ctx->streams[audio_index]->codec->sample_fmt, src_nb_samples);  
           
         //注意这里，out_count和in_count是samples单位，不是byte  
         //所以这样av_get_bytes_per_sample(in_fmt_ctx->streams[audio_index]->codec->sample_fmt) * src_nb_samples是错的  
         len = swr_convert(pSwrCtx, out_frame->data, out_frame->nb_samples, (const uint8_t**)m_ain, src_nb_samples);  
         if (len < 0)  
         {  
             char errmsg[BUF_SIZE_1K];  
             av_strerror(len, errmsg, sizeof(errmsg));  
             av_log(NULL, AV_LOG_WARNING, "[%s:%d] swr_convert!(%d)(%s)", __FILE__, __LINE__, len, errmsg);  
             return -1;  
         }  
     }  
     else  
     {  
         printf("pSwrCtx with out init!\n");  
         return -1;  
     }  
     return 0;  
 }  
   
 int flush_encoder(AVFormatContext *fmt_ctx, unsigned int stream_index)  
 {  
     int ret;  
     int got_frame;  
     AVPacket enc_pkt;  
     if (!(fmt_ctx->streams[stream_index]->codec->codec->capabilities &CODEC_CAP_DELAY))  
     {  
         return 0;  
     }  
       
     int i = 0;  
     while(1)  
     {  
         enc_pkt.data = NULL;  
         enc_pkt.size = 0;  
         av_init_packet(&enc_pkt);  
         ret = avcodec_encode_audio2(out_fmt_ctx->streams[stream_index]->codec, &enc_pkt,NULL, &got_frame);  
         if (ret < 0)  
             break;  
           
         if (!got_frame)  
             break;  
           
         /* prepare packet for muxing */  
         enc_pkt.stream_index = stream_index;  
           
         enc_pkt.dts = av_rescale_q_rnd(enc_pkt.dts,out_fmt_ctx->streams[stream_index]->codec->time_base,  
             out_fmt_ctx->streams[stream_index]->time_base,(AVRounding)(AV_ROUND_NEAR_INF|AV_ROUND_PASS_MINMAX));  
           
         enc_pkt.pts = av_rescale_q_rnd(enc_pkt.pts,out_fmt_ctx->streams[stream_index]->codec->time_base,  
             out_fmt_ctx->streams[stream_index]->time_base,(AVRounding)(AV_ROUND_NEAR_INF|AV_ROUND_PASS_MINMAX));  
           
         enc_pkt.duration = av_rescale_q(enc_pkt.duration,out_fmt_ctx->streams[stream_index]->codec->time_base,  
             out_fmt_ctx->streams[stream_index]->time_base);  
           
         /* mux encoded frame */  
         ret = av_interleaved_write_frame(out_fmt_ctx, &enc_pkt);  
           
         av_free_packet(&enc_pkt);  
           
         if (ret < 0)  
         {  
             break;  
         }  
         i++;  
     }  
       
     printf("flusher write %d frame", i);  
       
     return ret;  
 }  
   
 int _tmain(int argc, _TCHAR* argv[])  
 {  
     AVFrame *frame, *frame_out;  
     AVPacket pkt_in, pkt_out;  
     int ret;  
       
     if (argc < 3)  
     {  
         printf("error in input param");  
         getchar();  
         return -1;  
     }  
       
     av_register_all();  
     avfilter_register_all();  
       
     //input  
     if (avformat_open_input(&in_fmt_ctx, argv[1], NULL, NULL) < 0)  
     {  
         printf("can not open input file context");  
         goto end;  
     }  
       
     if (avformat_find_stream_info(in_fmt_ctx, NULL) < 0)  
     {  
         printf("can not find input stream info!\n");  
         goto end;  
     }  
       
     //output  
     avformat_alloc_output_context2(&out_fmt_ctx, NULL, NULL, argv[2]);  
     if (!out_fmt_ctx)  
     {  
         printf("can not alloc output context!\n");  
         goto end;  
     }  
       
     //open decoder & new out stream & open encoder  
     for (int i = 0; i < in_fmt_ctx->nb_streams; i++)  
     {  
         if (in_fmt_ctx->streams[i]->codec->codec_type == AVMEDIA_TYPE_AUDIO)  
         {  
             //open decoder  
             if(0 > avcodec_open2(in_fmt_ctx->streams[i]->codec, avcodec_find_decoder(in_fmt_ctx->streams[i]->codec->codec_id), NULL))  
             {  
                 printf("can not find or open decoder!\n");  
                 goto end;  
             }  
             audio_index = i;  
               
             //new stream  
             out_stream = avformat_new_stream(out_fmt_ctx, NULL);  
             if (!out_stream)  
             {  
                 printf("can not new stream for output!\n");  
                 goto end;  
             }  
             //set codec context param  
             //use default audio encoder  
             out_stream->codec->codec = avcodec_find_encoder(out_fmt_ctx->oformat->audio_codec);  
             //use the input audio encoder  
             //  
             out_stream->codec->codec = avcodec_find_encoder(in_fmt_ctx->streams[i]->codec->codec_id);  
             out_stream->codec->sample_rate = in_fmt_ctx->streams[i]->codec->sample_rate;  
             out_stream->codec->channel_layout = in_fmt_ctx->streams[i]->codec->channel_layout;  
             out_stream->codec->channels = av_get_channel_layout_nb_channels(out_stream->codec->channel_layout);  
               
             // take first format from list of supported formats  
             out_stream->codec->sample_fmt = out_stream->codec->codec->sample_fmts[0];  
             AVRational time_base={1, out_stream->codec->sample_rate};  
             out_stream->codec->time_base = time_base;  
               
             //open encoder  
             if (!out_stream->codec->codec)  
             {  
                 printf("can not find the encoder!\n");  
                 goto end;  
             }  
             if ((avcodec_open2(out_stream->codec, out_stream->codec->codec, NULL)) < 0)  
             {  
                 printf("can not open the encoder\n");  
                 goto end;  
             }  
             if (out_fmt_ctx->oformat->flags & AVFMT_GLOBALHEADER)  
                 out_stream->codec->flags |= CODEC_FLAG_GLOBAL_HEADER;  
             break;  
         }  
     }  
     //dump input info  
     av_dump_format(in_fmt_ctx, 0, argv[1], 0);  
     //dump output info  
     av_dump_format(out_fmt_ctx, 0, argv[2], 1);  
     if (-1 == audio_index)  
     {  
         printf("found no audio stream in input file!\n");  
         goto end;  
     }  
     if (!(out_fmt_ctx->oformat->flags & AVFMT_NOFILE))  
     {  
         if(avio_open(&out_fmt_ctx->pb, argv[2], AVIO_FLAG_WRITE) < 0)  
         {  
             printf("can not open output file handle!\n");  
             goto end;  
         }  
     }  
       
     if(avformat_write_header(out_fmt_ctx, NULL) < 0)  
     {  
         printf("can not write the header of the output file!\n");  
         goto end;  
     }  
     //  
     initSwr();  
     int got_frame, got_picture;  
     int frame_index = 0;  
     int i = 0;  
       
     for(int i = 0; ;i++)  
     {  
         pkt_in.data = NULL;  
         pkt_in.size = 0;  
         got_frame = -1;  
         got_picture = -1;  
         if (av_read_frame(in_fmt_ctx, &pkt_in) < 0)  
         {  
             break;  
         }  
   
         if (pkt_in.stream_index != audio_index)  
         {  
             continue;  
         }  
           
         frame = av_frame_alloc();  
           
         if ((ret = avcodec_decode_audio4(in_fmt_ctx->streams[audio_index]->codec, frame, &got_frame, &pkt_in)) < 0)  
         {  
             av_frame_free(&frame);  
             printf("can not decoder a frame");  
             break;  
         }  
           
         av_free_packet(&pkt_in);  
           
         if (got_frame)  
         {  
             frame->pts = av_frame_get_best_effort_timestamp(frame);  
             frame_out = av_frame_alloc();  
             if (0 != TransSample(frame, frame_out))  
             {  
                 printf("can not swr the audio data!\n");  
                 break;  
             }  
               
             av_init_packet(&pkt_out);  
             int ret = avcodec_encode_audio2(out_fmt_ctx->streams[0]->codec, &pkt_out, frame_out, &got_picture);  
               
             av_free(frame_out->data[0]);  
             av_frame_free(&frame_out);  
               
             if (got_picture )   
             {  
                 pkt_out.stream_index = out_stream->index;  
                 pkt_out.dts = av_rescale_q_rnd(pkt_out.dts,  
                     out_fmt_ctx->streams[out_stream->index]->codec->time_base,  
                     out_fmt_ctx->streams[out_stream->index]->time_base,  
                     (AVRounding)(AV_ROUND_NEAR_INF|AV_ROUND_PASS_MINMAX));  
                 pkt_out.pts = av_rescale_q_rnd(pkt_out.pts,  
                     out_fmt_ctx->streams[out_stream->index]->codec->time_base,  
                     out_fmt_ctx->streams[out_stream->index]->time_base,  
                     (AVRounding)(AV_ROUND_NEAR_INF|AV_ROUND_PASS_MINMAX));  
                 pkt_out.duration = av_rescale_q(pkt_out.duration,  
                     out_fmt_ctx->streams[out_stream->index]->codec->time_base,  
                     out_fmt_ctx->streams[out_stream->index]->time_base);  
                   
                 av_log(NULL, AV_LOG_DEBUG, "Muxing frame\n");  
                   
                 /* mux encoded frame */  
                 ret = av_interleaved_write_frame(out_fmt_ctx, &pkt_out);  
                 av_free_packet(&pkt_out);  
                   
                 if (ret < 0)  
                 {  
                     printf("write a frame failed!\n");  
                     break;  
                 }  
                   
                 printf("success write a frame:index %d\n", frame_index++);  
             }  
         }  
     }  
   
     ret = flush_encoder(out_fmt_ctx, out_stream->index);  
     if (ret < 0)  
     {  
         printf("Flushing encoder failed");  
         return -1;  
     }  
       
     //write file trailer      
     av_write_trailer(out_fmt_ctx);  
       
     //clean  
     avcodec_close(out_stream->codec);  
     avcodec_close(in_fmt_ctx->streams[audio_index]->codec);  
   
 end:  
     avformat_close_input(&in_fmt_ctx);  
     if (out_fmt_ctx && !(out_fmt_ctx->oformat->flags & AVFMT_NOFILE))  
     {  
         avio_close(out_fmt_ctx->pb);  
     }  
     avformat_free_context(out_fmt_ctx);  
     getchar();  
     return 0;  
 }  
 
    
  

 

 

 
http://blog.csdn.net/dancing_night/article/details/45642107
 
wishfly
关注
1
点赞
踩
1

收藏

觉得还不错? 一键收藏
0
评论
ffmpeg音频转码，采用swr_convert重取样

1、概述：和上一篇音频转码流程一样，只是把filter重取样改为了swr_convert重取样，理解本例子对AVFrame中data如何存储音频数据有更好的理解。2、代码：[cpp] view plain copy /* *最简单的音频转码器（只处理音频） *缪国凯 Mickel *[email protected] *本程
复制链接

扫一扫