PCM 编码为AAC

最新推荐文章于 2024-05-11 12:56:21 发布

jaygno

最新推荐文章于 2024-05-11 12:56:21 发布

阅读量1.9k

点赞数

分类专栏：音视频文章标签： ffmpeg 编码

本文链接：https://blog.csdn.net/gyj072001/article/details/78414904

版权

音视频专栏收录该内容

8 篇文章 2 订阅

订阅专栏

PCM 编码为AAC

简介

ffmpeg version 3.4 Copyright (c) 2003-2017 the FFmpeg developers

built with Apple LLVM version 7.3.0 (clang-703.0.31)

configuration: --prefix=/usr/local/media/ffmpeg_34 --enable-gpl --enable-avresample --disable-x86asm --disable-encoder=aac --disable-decoder=aac --enable-libfdk_aac --enable-nonfree --extra-cflags=-I/usr/local/media/libfdkaac/include/ --extra-ldflags=-L/usr/local/media/libfdkaac/lib --extra-cflags=-I/usr/local/media/libx264/include/ --extra-ldflags=-L/usr/local/media/libx264/lib

由于音频数据在采样率、format有多种参数格式， ffmpeg自带的AAC支持有限，本例采样率8000就不支持，需要用fdkaac第三方库，本例编码依赖库为libfdk_aac.

AAC

AAC 封装格式

AAC音频格式有ADIF和ADTS：

ADIF：Audio Data Interchange Format 音频数据交换格式。这种格式的特征是可以确定的找到这个音频数据的开始，不需进行在音频数据流中间开始的解码，即它的解码必须在明确定义的开始处进行。故这种格式常用在磁盘文件中。

ADTS：Audio Data Transport Stream 音频数据传输流。这种格式的特征是它是一个有同步字的比特流，解码可以在这个流中任何位置开始。它的特征类似于mp3数据流格式。

简单说，ADTS可以在任意帧解码，也就是说它每一帧都有头信息。ADIF只有一个统一的头，所以必须得到所有的数据后解码。且这两种的header的格式也是不同的，目前一般编码后的和抽取出的都是ADTS格式的音频流。

ADTS是帧序列，本身具备流特征，在音频流的传输与处理方面更加合适。

/**
 * 添加ADTS头部
 *
 * @param packet    ADTS header 的 byte[]，长度为7
 * @param packetLen 该帧的长度，包括header的长度
 */
private void addADTStoPacket(byte[] packet, int packetLen) {
    int profile = 2; // AAC LC
    int freqIdx = 3; // 48000Hz
    int chanCfg = 2; // 2 Channel

    packet[0] = (byte) 0xFF;
    packet[1] = (byte) 0xF9;
    packet[2] = (byte) (((profile - 1) << 6) + (freqIdx << 2) + (chanCfg >> 2));
    packet[3] = (byte) (((chanCfg & 3) << 6) + (packetLen >> 11));
    packet[4] = (byte) ((packetLen & 0x7FF) >> 3);
    packet[5] = (byte) (((packetLen & 7) << 5) + 0x1F);
    packet[6] = (byte) 0xFC;
}

其中profile表示使用哪个级别的AAC，在MPEG-2 AAC中定义了3种：

aac profile

AAC编解码

AAC 编解码器初始化时，nb_samples 固定为 1024。每次编码需要的样本数由av_samples_get_buffer_size计算得出，需要足够的数据，才能编码成功。

源码

#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <math.h>

#include <libavcodec/avcodec.h>

#include <libavutil/opt.h>
#include <libavutil/channel_layout.h>
#include <libavutil/common.h>
#include <libavutil/imgutils.h>
#include <libavutil/mathematics.h>
#include <libavutil/samplefmt.h>
#include <libavutil/frame.h>
#include <libavformat/avformat.h>
#include <libswscale/swscale.h>

#include <libavutil/channel_layout.h>
#include <libavutil/common.h>
#include <libavutil/frame.h>
#include <libavutil/samplefmt.h>


static int write_aac_header(FILE* fp, AVPacket* pkt);

/* check that a given sample format is supported by the encoder */
static int check_sample_fmt(const AVCodec *codec, enum AVSampleFormat sample_fmt)
{
    const enum AVSampleFormat *p = codec->sample_fmts;

    while (*p != AV_SAMPLE_FMT_NONE) {
        if (*p == sample_fmt)
            return 1;
        p++;
    }
    return 0;
}

static void encode(AVCodecContext *ctx, AVFrame *frame, AVPacket *pkt,
                   FILE *output)
{
    int ret;

    /* send the frame for encoding */
    ret = avcodec_send_frame(ctx, frame);
    if (ret < 0) {
        fprintf(stderr, "Error sending the frame to the encoder\n");
        exit(1);
    }

    fprintf(stdout, "Sending the frame to the encoder\n");

    /* read all the available output packets (in general there may be any
     * number of them */
    while (ret >= 0) {
        ret = avcodec_receive_packet(ctx, pkt);
        if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF)
            return;
        else if (ret < 0) {
            fprintf(stderr, "Error encoding audio frame\n");
            exit(1);
        }

        write_aac_header(output, pkt);
        fwrite(pkt->data, 1, pkt->size, output);
        fprintf(stdout, "write %d\n", pkt->size);
        av_packet_unref(pkt);
    }

    return;
}


//AAC有两种封装格式，分别是ADIF ADTS，多与流媒体一般使用ADTS格式。见：
//http://www.jianshu.com/p/839b11e0638b aac freqIdx

char aac_adts_header[7] = {0};
int chanCfg = 1;            //MPEG-4 Audio Channel Configuration. 1 Channel front-center

static int init_aac_header() {
    int profile = 2;   //AAC LC
    int freqIdx = 11;   //8000HZ

    aac_adts_header[0] = (char)0xFF;      // 11111111     = syncword
    aac_adts_header[1] = (char)0xF1;      // 1111 1 00 1  = syncword MPEG-2 Layer CRC
    aac_adts_header[2] = (char)(((profile - 1) << 6) + (freqIdx << 2) + (chanCfg >> 2));
    aac_adts_header[6] = (char)0xFC;

    return 0;
}

static int write_aac_header(FILE* fp, AVPacket* pkt) {
    aac_adts_header[3] = (char)(((chanCfg & 3) << 6) + ((7 + pkt->size) >> 11));
    aac_adts_header[4] = (char)(((7 + pkt->size) & 0x7FF) >> 3);
    aac_adts_header[5] = (char)((((7 + pkt->size) & 7) << 5) + 0x1F);

    fwrite(aac_adts_header, 7, 1, fp);

    return 0;
}

int main(int argc, char **argv){
    AVFrame *frame;
    AVCodec *codec = NULL;
    AVPacket *pkt;
    AVCodecContext *codecContext;
    int readSize=0;
    FILE * fileIn,*fileOut;
    int frameCount=0;
    /* register all the codecs */
    av_register_all();

    init_aac_header();

    if(argc!=3){
        fprintf(stdout,"usage:./a.out xxx.pcm xxx.aac\n");
        return -1;
    }

    fileIn =fopen(argv[1],"r+");
    if (fileIn == NULL) {
        fprintf(stderr, "fopen failed %s\n", argv[1]);
        exit(1);
    }

    //3.读出来的数据，我们需要编码，因此需要编码器
    //下面的函数找到h.264类型的编码器
    /* find the mpeg1 video encoder */
    codec = avcodec_find_encoder(AV_CODEC_ID_AAC);
    if (!codec){
        fprintf(stderr, "Codec not found\n");
        exit(1);
    }

    //有了编码器，我们还需要编码器的上下文环境，用来控制编码的过程
    codecContext = avcodec_alloc_context3(codec);//分配AVCodecContext实例
    if (!codecContext){
        fprintf(stderr, "Could not allocate video codec context\n");
        return -1;
    }

    /* put sample parameters */
    codecContext->bit_rate = 64000;

    /* check that the encoder supports s16 pcm input */
    codecContext->sample_fmt = AV_SAMPLE_FMT_S16;
    if (!check_sample_fmt(codec, codecContext->sample_fmt)) {
        fprintf(stderr, "Encoder does not support sample format %s",
                av_get_sample_fmt_name(codecContext->sample_fmt));
        exit(1);
    }

    codecContext->sample_rate = 8000;
    codecContext->channel_layout = AV_CH_LAYOUT_MONO;
    codecContext->channels = av_get_channel_layout_nb_channels(codecContext->channel_layout);

    /* select other audio parameters supported by the encoder */
    //准备好了编码器和编码器上下文环境，现在可以打开编码器了
    //根据编码器上下文打开编码器
    if (avcodec_open2(codecContext, codec, NULL) < 0){
        fprintf(stderr, "Could not open codec\n");
        return -1;
    }

    /* packet for holding encoded output */
    pkt = av_packet_alloc();
    if (!pkt) {
        fprintf(stderr, "could not allocate the packet\n");
        exit(1);
    }

    //读出的一帧数据保存在AVFrame中。
    frame  = av_frame_alloc();
    if (!frame) {
        fprintf(stderr, "Could not allocate audio frame\n");
        exit(1);
    }

    frame->nb_samples = codecContext->frame_size;;
    frame->format = codecContext->sample_fmt;
    frame->channel_layout = codecContext->channel_layout;

    /* allocate the data buffers */
    int ret = av_frame_get_buffer(frame, 0);
    if (ret < 0) {
        fprintf(stderr, "Could not allocate audio data buffers\n");
        exit(1);
    }

    int data_size = av_samples_get_buffer_size(NULL, codecContext->channels, frame->nb_samples, frame->format, 0);

    //4.准备输出文件
    fileOut= fopen(argv[2],"w+");
    //下面开始编码
    while(1){
        //读一帧数据出来
        //frame->pts = 1;
        readSize = fread(frame->data[0], 1,data_size,fileIn);
        if(readSize == 0){
            fprintf(stdout,"end of file\n");
            frameCount++;
            break;
        }

        encode(codecContext, frame, pkt, fileOut);
    }

    //flush
    encode(codecContext, NULL, pkt, fileOut);

    fclose(fileIn);
    fclose(fileOut);
    av_frame_free(&frame);
    av_packet_free(&pkt);
    avcodec_free_context(&codecContext);
    return 0;
}

源码下载

GITHUB ： https://github.com/jaygno/pcm_2_aac

参考资料

FFmpeg(2016)PCM编码AAC
AAC ADTS结构分析
 AAC 格式简介
 Android音视频处理之AAC编码

jaygno

关注

0
点赞
踩
4

收藏

觉得还不错? 一键收藏
0
评论
PCM 编码为AAC

PCM 编码为AAC简介ffmpeg version 3.4 Copyright (c) 2003-2017 the FFmpeg developersbuilt with Apple LLVM version 7.3.0 (clang-703.0.31)configuration: --prefix=/usr/local/media/ffmpeg_34 --enable-gpl --enable-
复制链接

扫一扫