FFmpeg 混音学习【三】两路混流完整代码

最新推荐文章于 2024-07-18 16:08:26 发布
HiddenTrackMJ
最新推荐文章于 2024-07-18 16:08:26 发布
阅读量2k
点赞数 2
分类专栏： FFmpeg学习记录文章标签： ffmpeg c++ filter aac
本文链接：https://blog.csdn.net/qq_37984341/article/details/107404909
版权
FFmpeg学习记录专栏收录该内容
4 篇文章 2 订阅
订阅专栏
前言

本文是简单的混流实现，输入为两个媒体文件（音频或带音频的视频文件），输出为混流后的aac文件。
完整代码

/*
 * Copyright (c) 2010 Nicolas George
 * Copyright (c) 2011 Stefano Sabatini
 * Copyright (c) 2012 ClÃ©ment BÅ“sch
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */

/**
 * @file
 * API example for audio decoding and filtering
 * @example filtering_audio.c
 */

extern "C" {
#include <libavcodec/avcodec.h>
#include <libavfilter/avfiltergraph.h>
#include <libavfilter/buffersink.h>
#include <libavfilter/buffersrc.h>
#include <libavformat/avformat.h>
#include <libavutil/opt.h>
}
//#include <unistd.h>

#include <string>
#include <iostream>

#define ENABLE_FILTERS 1

static const char* filter_descr ="[in0][in1]amix=inputs=2[out]";  

static AVFormatContext* fmt_ctx1;
static AVFormatContext* fmt_ctx2;

static AVCodecContext* dec_ctx1;
static AVCodecContext* dec_ctx2;

AVFilterContext* buffersink_ctx;
AVFilterContext* buffersrc_ctx1;
AVFilterContext* buffersrc_ctx2;

AVFormatContext* ofmt_ctx;
AVCodecContext* enc_ctx;  //输出文件的codec
int pkt_count = 0;
AVFrame* frame;

AVFilterGraph* filter_graph;
static int audio_stream_index_1 = -1;
static int audio_stream_index_2 = -1;


static int open_input_file_1(const char* filename) {
  int ret;
  AVCodec* dec;

  if ((ret = avformat_open_input(&fmt_ctx1, filename, NULL, NULL)) < 0) {
    av_log(NULL, AV_LOG_ERROR, "Cannot open input file\n");
    return ret;
  }

  if ((ret = avformat_find_stream_info(fmt_ctx1, NULL)) < 0) {
    av_log(NULL, AV_LOG_ERROR, "Cannot find stream information\n");
    return ret;
  }

  /* select the audio stream */
  ret = av_find_best_stream(fmt_ctx1, AVMEDIA_TYPE_AUDIO, -1, -1, &dec, 0);
  if (ret < 0) {
    av_log(NULL, AV_LOG_ERROR,
           "Cannot find an audio stream in the input file\n");
    return ret;
  }
  audio_stream_index_1 = ret;
  dec_ctx1 = fmt_ctx1->streams[audio_stream_index_1]->codec;
  av_opt_set_int(dec_ctx1, "refcounted_frames", 1, 0);

  /* init the audio decoder */
  if ((ret = avcodec_open2(dec_ctx1, dec, NULL)) < 0) {
    av_log(NULL, AV_LOG_ERROR, "Cannot open audio decoder\n");
    return ret;
  }

  return 0;
}

static int open_input_file_2(const char* filename) {
  int ret;
  AVCodec* dec;

  if ((ret = avformat_open_input(&fmt_ctx2, filename, NULL, NULL)) < 0) {
    av_log(NULL, AV_LOG_ERROR, "Cannot open input file\n");
    return ret;
  }

  if ((ret = avformat_find_stream_info(fmt_ctx2, NULL)) < 0) {
    av_log(NULL, AV_LOG_ERROR, "Cannot find stream information\n");
    return ret;
  }

  /* select the audio stream */
  ret = av_find_best_stream(fmt_ctx2, AVMEDIA_TYPE_AUDIO, -1, -1, &dec, 0);
  if (ret < 0) {
    av_log(NULL, AV_LOG_ERROR,
           "Cannot find an audio stream in the input file\n");
    return ret;
  }
  audio_stream_index_2 = ret;
  dec_ctx2 = fmt_ctx2->streams[audio_stream_index_2]->codec;
  av_opt_set_int(dec_ctx2, "refcounted_frames", 1, 0);

  /* init the audio decoder */
  if ((ret = avcodec_open2(dec_ctx2, dec, NULL)) < 0) {
    av_log(NULL, AV_LOG_ERROR, "Cannot open audio decoder\n");
    return ret;
  }

  return 0;
}

int encode_write_frame(AVFrame* filt_frame, unsigned int stream_index) {
  int ret;
  I_LOG("Write frame {}", filt_frame->nb_samples);
  ret = avcodec_send_frame(enc_ctx, filt_frame);
  if (ret < 0) {
    E_LOG("Error while sending a frame to the encoder: {}", ret);
    return -1;
  }

  while (ret >= 0) {
    AVPacket pkt;
    av_init_packet(&pkt);
    ret = avcodec_receive_packet(enc_ctx, &pkt);
    if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF)
      break;
    else if (ret < 0) {
      E_LOG("Error while encoding a frame: {}", ret);
      return -1;
    }

    /* rescale output packet timestamp values from codec to stream timebase */
    av_packet_rescale_ts(&pkt, enc_ctx->time_base,
                         ofmt_ctx->streams[stream_index]->time_base);
    pkt.stream_index = stream_index;

    /* Write the compressed frame to the media file. */
    // log_packet(fmt_ctx, &pkt);

    pkt.pts = pkt_count * ofmt_ctx->streams[stream_index]->codec->frame_size;
    pkt.dts = pkt.pts;
    pkt.duration = ofmt_ctx->streams[stream_index]->codec->frame_size;

    pkt.pts = av_rescale_q_rnd(
        pkt.pts, ofmt_ctx->streams[stream_index]->codec->time_base,
        ofmt_ctx->streams[stream_index]->time_base,
        (AVRounding)(AV_ROUND_NEAR_INF | AV_ROUND_PASS_MINMAX));
    pkt.dts = pkt.pts;
    pkt.duration = av_rescale_q_rnd(
        pkt.duration, ofmt_ctx->streams[stream_index]->codec->time_base,
        ofmt_ctx->streams[stream_index]->time_base,
        (AVRounding)(AV_ROUND_NEAR_INF | AV_ROUND_PASS_MINMAX));

    ret = av_interleaved_write_frame(ofmt_ctx, &pkt);
    ++pkt_count;
    av_packet_unref(&pkt);
    if (ret < 0) {
      E_LOG("Error while writing output packet: {}", ret);
      return -1;
    }
  }
  return ret;
}

int open_output_file(const char* filename) {
  AVStream* out_stream;
  AVCodec* encoder;
  int ret;
  ofmt_ctx = NULL;
  avformat_alloc_output_context2(&ofmt_ctx, NULL, NULL, filename);
  if (!ofmt_ctx) {
    av_log(NULL, AV_LOG_ERROR, "Could not create output context\n");
    return AVERROR_UNKNOWN;
  }
  {
    out_stream = avformat_new_stream(ofmt_ctx, NULL);
    out_stream->index = 0;
    if (!out_stream) {
      av_log(NULL, AV_LOG_ERROR, "Failed allocating output stream\n");
      return AVERROR_UNKNOWN;
    }

    encoder = avcodec_find_encoder(AV_CODEC_ID_AAC);
    enc_ctx = avcodec_alloc_context3(encoder);
    if (!enc_ctx) {
      E_LOG("Could not alloc an encoding context\n");
      return -1;
    }
    enc_ctx = out_stream->codec;
    enc_ctx->codec_type = AVMEDIA_TYPE_AUDIO;
    enc_ctx->sample_rate = 48000;
    enc_ctx->channels = 2;
    enc_ctx->channel_layout = 3;
    enc_ctx->sample_fmt = AV_SAMPLE_FMT_FLTP;
    // enc_ctx->bit_rate = 320000;
    enc_ctx->codec_tag = 0;
    AVRational ar = {1, enc_ctx->sample_rate};
    enc_ctx->time_base = ar;

    ret = avcodec_open2(enc_ctx, encoder, NULL);
    if (ret < 0) {
      av_log(NULL, AV_LOG_ERROR, "Cannot open audio encoder for stream \n");
      return ret;
    }

    ret = avcodec_parameters_from_context(out_stream->codecpar, enc_ctx);
    if (ret < 0) {
      E_LOG("Could not copy the stream parameters\n");
      return ret;
    }

    if (ofmt_ctx->oformat->flags & AVFMT_GLOBALHEADER)
      enc_ctx->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
  }

  av_dump_format(ofmt_ctx, 0, filename, 1);

  // if (!(ofmt_ctx->oformat->flags & AVFMT_NOFILE)) {
  ret = avio_open(&ofmt_ctx->pb, filename, AVIO_FLAG_WRITE);
  if (ret < 0) {
    av_log(NULL, AV_LOG_ERROR, "Could not open output file '%s'", filename);
    return ret;
  }
  // }
  /* init Mixer, write output file header */
  ret = avformat_write_header(ofmt_ctx, NULL);
  if (ret < 0) {
    av_log(NULL, AV_LOG_ERROR, "Error occurred when opening output file\n");
    return ret;
  }
  return 0;
}

static int init_filters(const char* filters_descr) {
  char args1[512];
  char args2[512];
  int ret = 0;
  const AVFilter* abuffersrc1 = avfilter_get_by_name("abuffer");
  const AVFilter* abuffersrc2 = avfilter_get_by_name("abuffer");
  const AVFilter* abuffersink = avfilter_get_by_name("abuffersink");

  AVFilterInOut* outputs1 = avfilter_inout_alloc();
  AVFilterInOut* outputs2 = avfilter_inout_alloc();
  AVFilterInOut* inputs = avfilter_inout_alloc();

  static const enum AVSampleFormat out_sample_fmts[] = {
      AV_SAMPLE_FMT_FLTP  ,// dec_ctx1->sample_fmt,
      (enum AVSampleFormat) - 1};  //{AV_SAMPLE_FMT_S16}
  static const int64_t out_channel_layouts[] =
      //{dec_ctx1->channel_layout,  -1};
      {3, -1};
  static const int out_sample_rates[] = {48000, -1};//{dec_ctx1->sample_rate, -1};
  const AVFilterLink* outlink;

  AVRational time_base_1 = fmt_ctx1->streams[audio_stream_index_1]->time_base;
  AVRational time_base_2 = fmt_ctx2->streams[audio_stream_index_2]->time_base;

  filter_graph = avfilter_graph_alloc();
  if (!outputs1 || !inputs || !filter_graph) {
    ret = AVERROR(ENOMEM);
    goto end;
  }

  /* buffer audio source: the decoded frames from the decoder will be inserted
   * here. */
  if (!dec_ctx1->channel_layout)
    dec_ctx1->channel_layout =
        av_get_default_channel_layout(dec_ctx1->channels);
  snprintf(
      args1, sizeof(args1),
      "time_base=%d/%d:sample_rate=%d:sample_fmt=%s:channel_layout=0x%" PRIx64,
      time_base_1.num, time_base_1.den, dec_ctx1->sample_rate,
      av_get_sample_fmt_name(dec_ctx1->sample_fmt), dec_ctx1->channel_layout);
  ret = avfilter_graph_create_filter(&buffersrc_ctx1, abuffersrc1, "in1", args1,
                                     NULL, filter_graph);
  if (ret < 0) {
    av_log(NULL, AV_LOG_ERROR, "Cannot create audio buffer source\n");
    goto end;
  }

#if (ENABLE_FILTERS)
  /* buffer audio source: the decoded frames from the decoder will be inserted
   * here. */
  if (!dec_ctx2->channel_layout)
    dec_ctx2->channel_layout =
        av_get_default_channel_layout(dec_ctx2->channels);
  snprintf(
      args2, sizeof(args2),
      "time_base=%d/%d:sample_rate=%d:sample_fmt=%s:channel_layout=0x%" PRIx64,
      time_base_2.num, time_base_2.den, dec_ctx2->sample_rate,
      av_get_sample_fmt_name(dec_ctx2->sample_fmt), dec_ctx2->channel_layout);
  ret = avfilter_graph_create_filter(&buffersrc_ctx2, abuffersrc1, "in2", args2,
                                     NULL, filter_graph);
  if (ret < 0) {
    av_log(NULL, AV_LOG_ERROR, "Cannot create audio buffer source\n");
    goto end;
  }
#endif
  /* buffer audio sink: to terminate the filter chain. */
  ret = avfilter_graph_create_filter(&buffersink_ctx, abuffersink, "out", NULL,
                                     NULL, filter_graph);
  if (ret < 0) {
    av_log(NULL, AV_LOG_ERROR, "Cannot create audio buffer sink\n");
    goto end;
  }

  ret = av_opt_set_int_list(buffersink_ctx, "sample_fmts", out_sample_fmts, -1,
                            AV_OPT_SEARCH_CHILDREN);
  if (ret < 0) {
    av_log(NULL, AV_LOG_ERROR, "Cannot set output sample format\n");
    goto end;
  }

  ret = av_opt_set_int_list(buffersink_ctx, "channel_layouts",
                            out_channel_layouts, -1, AV_OPT_SEARCH_CHILDREN);
  if (ret < 0) {
    av_log(NULL, AV_LOG_ERROR, "Cannot set output channel layout\n");
    goto end;
  }

  ret = av_opt_set_int_list(buffersink_ctx, "sample_rates", out_sample_rates,
                            -1, AV_OPT_SEARCH_CHILDREN);
  if (ret < 0) {
    av_log(NULL, AV_LOG_ERROR, "Cannot set output sample rate\n");
    goto end;
  }

  /*
   * Set the endpoints for the filter graph. The filter_graph will
   * be linked to the graph described by filters_descr.
   */

  /*
   * The buffer source output must be connected to the input pad of
   * the first filter described by filters_descr; since the first
   * filter input label is not specified, it is set to "in" by
   * default.
   */
  outputs1->name = av_strdup("in0");
  outputs1->filter_ctx = buffersrc_ctx1;
  outputs1->pad_idx = 0;
#if (ENABLE_FILTERS)
  outputs1->next = outputs2;

  outputs2->name = av_strdup("in1");
  outputs2->filter_ctx = buffersrc_ctx2;
  outputs2->pad_idx = 0;
  outputs2->next = NULL;
#else
  outputs1->next = NULL;
#endif
  /*
   * The buffer sink input must be connected to the output pad of
   * the last filter described by filters_descr; since the last
   * filter output label is not specified, it is set to "out" by
   * default.
   */
  inputs->name = av_strdup("out");
  inputs->filter_ctx = buffersink_ctx;
  inputs->pad_idx = 0;
  inputs->next = NULL;

  AVFilterInOut* filter_outputs[2];
  filter_outputs[0] = outputs1;
#if (ENABLE_FILTERS)
  filter_outputs[1] = outputs2;
#endif

  if ((ret = avfilter_graph_parse_ptr(filter_graph, filters_descr, &inputs,
                                      &outputs1, NULL)) < 0)  // filter_outputs
  {
    av_log(NULL, AV_LOG_ERROR, "parse ptr fail, ret: %d\n", ret);
    goto end;
  }

  if ((ret = avfilter_graph_config(filter_graph, NULL)) < 0) {
    av_log(NULL, AV_LOG_ERROR, "config graph fail, ret: %d\n", ret);
    goto end;
  }

  /* Print summary of the sink buffer
   * Note: args buffer is reused to store channel layout string */
  outlink = buffersink_ctx->inputs[0];
  av_get_channel_layout_string(args1, sizeof(args1), -1,
                               outlink->channel_layout);
  av_log(NULL, AV_LOG_INFO, "Output: srate:%dHz fmt:%s chlayout:%s\n",
         (int)outlink->sample_rate,
         (char*)av_x_if_null(
             av_get_sample_fmt_name((enum AVSampleFormat)outlink->format), "?"),
         args1);

end:
  avfilter_inout_free(&inputs);
  avfilter_inout_free(&outputs1);

  return ret;
}

int main(int argc, char** argv) {
  int ret;
  AVFrame* frame = av_frame_alloc();
  AVFrame* filt_frame = av_frame_alloc();
  int got_frame;

  if (!frame || !filt_frame) {
    perror("Could not allocate frame");
    exit(1);
  }
  /*
  if (argc != 2) {
      fprintf(stderr, "Usage: %s file | %s\n", argv[0], player);
      exit(1);
  }
  */


  if ((ret = open_input_file_1("./recv.aac")) < 0) { //打开第一个输入文件
    av_log(NULL, AV_LOG_ERROR, "open input file fail, ret: %d\n", ret);
    goto end;
  }
  if ((ret = open_input_file_2("./trip.aac")) < 0) { //打开第二个输入文件
    av_log(NULL, AV_LOG_ERROR, "open input file fail, ret: %d\n", ret);
    goto end;
  }
  if ((ret = init_filters(filter_descr)) < 0) {      //初始化filter
    av_log(NULL, AV_LOG_ERROR, "init filters fail, ret: %d\n", ret);
    goto end;
  }

  if ((ret = open_output_file("./AAC/mix.aac")) < 0) return ret; //打开输出文件

  AVPacket packet0, packet;
  AVPacket _packet0, _packet;

  /* read all packets */
  packet0.data = NULL;
  packet.data = NULL;

  _packet0.data = NULL;
  _packet.data = NULL;
  while (1) {
    if (!packet0.data) {
      if ((ret = av_read_frame(fmt_ctx1, &packet)) < 0) break;
      packet0 = packet;
    }

    if (packet.stream_index == audio_stream_index_1) {
      got_frame = 0;
      ret = avcodec_decode_audio4(dec_ctx1, frame, &got_frame, &packet);
      if (ret < 0) {
        av_log(NULL, AV_LOG_ERROR, "Error decoding audio\n");
        continue;
      }
      packet.size -= ret;
      packet.data += ret;

      if (got_frame) {
        /* push the audio data from decoded frame into the filtergraph */
        if (av_buffersrc_add_frame_flags(buffersrc_ctx1, frame, 0) < 0) {
          av_log(NULL, AV_LOG_ERROR,
                 "Error while feeding the audio filtergraph\n");
          break;
        }
      }

      if (packet.size <= 0) av_packet_unref(&packet0);
    } else {
      /* discard non-wanted packets */
      av_packet_unref(&packet0);
    }

    if (!_packet0.data) {
      if ((ret = av_read_frame(fmt_ctx2, &_packet)) < 0) break;
      _packet0 = _packet;
    }

    if (_packet.stream_index == audio_stream_index_2) {
      got_frame = 0;
      ret = avcodec_decode_audio4(dec_ctx2, frame, &got_frame, &_packet);
      if (ret < 0) {
        av_log(NULL, AV_LOG_ERROR, "Error decoding audio\n");
        continue;
      }
      _packet.size -= ret;
      _packet.data += ret;

      if (got_frame) {
        /* push the audio data from decoded frame into the filtergraph */
        if (av_buffersrc_add_frame_flags(buffersrc_ctx2, frame, 0) < 0) {
          av_log(NULL, AV_LOG_ERROR,
                 "Error while feeding the audio filtergraph\n");
          break;
        }
      }

      if (_packet.size <= 0) av_packet_unref(&_packet0);
    } else {
      /* discard non-wanted packets */
      av_packet_unref(&_packet0);
    }
    /* pull filtered audio from the filtergraph */
    if (got_frame) {
      while (1) {
        ret = av_buffersink_get_frame(buffersink_ctx, filt_frame);
        if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF) break;
        if (ret < 0) {
          av_log(NULL, AV_LOG_ERROR, "buffersink get frame fail, ret: %d\n",
                 ret);
          goto end;
        }
        encode_write_frame(filt_frame, 0);
        av_frame_unref(filt_frame);
      }
    }
  }
end:
  avfilter_graph_free(&filter_graph);
  avcodec_close(dec_ctx1);
  avformat_close_input(&fmt_ctx1);
  avcodec_close(dec_ctx2);
  avformat_close_input(&fmt_ctx2);
  av_frame_free(&frame);
  av_frame_free(&filt_frame);

  if (ret < 0 && ret != AVERROR_EOF) {
    fprintf(stderr, "Error occurred: %s\n",ret);
    exit(1);
  }

  av_write_trailer(ofmt_ctx);
  if (ofmt_ctx && !(ofmt_ctx->oformat->flags & AVFMT_NOFILE))
    avio_closep(&ofmt_ctx->pb);
  avformat_free_context(ofmt_ctx);
  return 0;
}
转载请注明本文url，引用请注明出处，谢谢支持！！！

HiddenTrackMJ
关注
2
点赞
踩
9

收藏

觉得还不错? 一键收藏
3
评论
FFmpeg 混音学习【三】两路混流完整代码

前言本文是简单的混流实现，输入为两个媒体文件（音频或带音频的视频文件），输出为混流后的aac文件。完整代码/* * Copyright (c) 2010 Nicolas George * Copyright (c) 2011 Stefano Sabatini * Copyright (c) 2012 ClÃ©ment BÅ“sch * * Permission is hereby granted, free of charge, to any person obtaining a copy
复制链接

扫一扫