extern "C"
{
#include <libavcodec/avcodec.h>
#include <libavformat/avformat.h>
#include <libswscale/swscale.h>
#include <libswresample/swresample.h>
#include <libavutil/avstring.h>
#include <libavutil/pixfmt.h>
#include <libavutil/log.h>
};
#include <stdio.h>
#include <math.h>
#include <SDL.h>
#include <SDL_thread.h>
#pragma comment(lib, "libmingwex.lib")
#pragma comment(lib, "libgcc.lib")
#pragma comment(lib, "avformat.lib")
#pragma comment(lib, "avutil.lib")
#pragma comment(lib, "avcodec.lib")
#pragma comment(lib, "swresample.lib")
#pragma comment(lib, "SDL.lib")
#pragma comment(lib, "SDLmain.lib")
/* Value requested for SDL_AudioSpec.samples when the audio device is opened. */
#define SDL_AUDIO_BUFFER_SIZE 1024
/* Upper bound (bytes of queued packet payload) above which the reader thread
 * stops reading new packets and sleeps briefly. */
#define MAX_AUDIOQ_SIZE (1 * 1024 * 1024)
/* Application-defined SDL event ids. In the code visible here only
 * FF_QUIT_EVENT is actually posted and handled. */
#define FF_ALLOC_EVENT (SDL_USEREVENT)
#define FF_REFRESH_EVENT (SDL_USEREVENT + 1)
#define FF_QUIT_EVENT (SDL_USEREVENT + 2)
/*
 * FIFO of demuxed packets, implemented as a singly linked list of
 * AVPacketList nodes. All accesses in this file happen with `mutex` held;
 * `cond` is signalled on every put and waited on by a blocking get.
 */
typedef struct PacketQueue {
AVPacketList *first_pkt, *last_pkt; /* head (next to dequeue) and tail (last enqueued); NULL when empty */
int nb_packets; /* number of nodes currently queued */
int size; /* sum of pkt.size over all queued packets, in bytes */
SDL_mutex *mutex; /* guards every field of the queue */
SDL_cond *cond; /* signalled by packet_queue_put, waited on by packet_queue_get */
} PacketQueue;
/*
 * Complete player state shared between the main thread, the reader thread
 * (decode_thread) and the SDL audio callback.
 */
typedef struct VideoState {
char filename[1024]; /* input path, copied in by main() */
AVFormatContext *ic; /* demuxer context, set by decode_thread after a successful open */
AVCodecContext *pCodecCtx; /* codec context of the selected stream (set in stream_component_open) */
AVCodec *pCodec; /* decoder found for pCodecCtx (set in stream_component_open) */
int videoStream, audioStream; /* audioStream: index of the opened audio stream, -1 if none; videoStream is not used in the code visible here */
AVStream *audio_st; /* the opened audio stream */
AVFrame *audio_frame; /* decode target, allocated lazily and reused by audio_decode_frame */
PacketQueue audioq; /* audio packets waiting to be decoded */
unsigned int audio_buf_size; /* number of valid bytes in audio_buf */
unsigned int audio_buf_index; /* bytes of audio_buf already handed to SDL */
AVPacket audio_pkt; /* packet currently being decoded */
uint8_t *audio_pkt_data; /* read position inside audio_pkt */
int audio_pkt_size; /* bytes of audio_pkt not yet consumed by the decoder */
uint8_t *audio_buf; /* current PCM data: either audio_buf2 or audio_frame->data[0] */
uint8_t *audio_buf1; /* not referenced in the code visible here */
DECLARE_ALIGNED(16,uint8_t,audio_buf2)[AVCODEC_MAX_AUDIO_FRAME_SIZE * 4]; /* output buffer of the resampler */
enum AVSampleFormat audio_src_fmt; /* audio_src_*: input parameters compared against each decoded frame to decide whether the resampler must be (re)built */
enum AVSampleFormat audio_tgt_fmt; /* audio_tgt_*: output parameters handed to the resampler, derived from the opened SDL spec */
int audio_src_channels;
int audio_tgt_channels;
int64_t audio_src_channel_layout;
int64_t audio_tgt_channel_layout;
int audio_src_freq;
int audio_tgt_freq;
struct SwrContext *swr_ctx; /* resampler; NULL while decoded audio already matches the source parameters */
SDL_Thread *parse_tid; /* handle of the reader thread created in main() */
int quit; /* set to 1 by main() to ask the other threads to stop */
} VideoState;
/* Set by decode_thread; read by packet_queue_get to observe the quit flag. */
VideoState *global_video_state;
/*
 * Reset *q to an empty queue and create the SDL mutex and condition
 * variable that protect it.
 */
void packet_queue_init(PacketQueue *q)
{
    memset(q, 0, sizeof(*q));

    q->mutex = SDL_CreateMutex();
    q->cond = SDL_CreateCond();
}
/*
 * Append *pkt to the tail of the queue and wake one waiting consumer.
 *
 * The packet is first made self-contained with av_dup_packet(): a packet
 * returned by av_read_frame() may reference demuxer-owned memory that is
 * only valid until the next read, while queued packets are consumed much
 * later by the audio callback.
 *
 * Returns 0 on success. Returns -1 if the packet data could not be
 * duplicated or the list node could not be allocated; in that case the
 * queue is unchanged and the caller still owns *pkt.
 */
int packet_queue_put(PacketQueue *q, AVPacket *pkt) {
    AVPacketList *node;

    if (av_dup_packet(pkt) < 0) {
        return -1;
    }

    node = (AVPacketList *)av_malloc(sizeof(*node));
    if (!node) {
        return -1;
    }
    node->pkt = *pkt;   /* the queue stores list nodes, each holding a packet by value */
    node->next = NULL;

    SDL_LockMutex(q->mutex);
    if (!q->last_pkt) {
        /* queue was empty: the new node is also the head */
        q->first_pkt = node;
    } else {
        q->last_pkt->next = node;
    }
    q->last_pkt = node;
    q->nb_packets++;
    q->size += node->pkt.size;
    SDL_CondSignal(q->cond);
    SDL_UnlockMutex(q->mutex);
    return 0;
}
/*
 * Remove the packet at the head of the queue and copy it into *pkt.
 *
 * If the queue is empty and `block` is non-zero, waits on the queue's
 * condition variable until a packet arrives; if `block` is zero, returns
 * immediately.
 *
 * Returns 1 when a packet was dequeued, 0 when the queue was empty in
 * non-blocking mode, and -1 when global_video_state->quit is set.
 */
static int packet_queue_get(PacketQueue *q, AVPacket *pkt, int block) {
    int status = -1;    /* value returned when the quit flag ends the loop */

    SDL_LockMutex(q->mutex);
    while (!global_video_state->quit) {
        AVPacketList *head = q->first_pkt;

        if (head == NULL) {
            if (!block) {
                status = 0;
                break;
            }
            /* releases the mutex while waiting; quit is re-checked on wake-up */
            SDL_CondWait(q->cond, q->mutex);
            continue;
        }

        /* unlink the head node (first in, first out) */
        q->first_pkt = head->next;
        if (q->first_pkt == NULL) {
            q->last_pkt = NULL;
        }
        q->nb_packets -= 1;
        q->size -= head->pkt.size;

        *pkt = head->pkt;
        av_free(head);
        status = 1;
        break;
    }
    SDL_UnlockMutex(q->mutex);

    return status;
}
/*
 * Discard every queued packet: free each packet's payload and its list
 * node, then reset the queue to the empty state. The mutex and condition
 * variable are kept.
 */
static void packet_queue_flush(PacketQueue *q) {
    AVPacketList *node;

    SDL_LockMutex(q->mutex);

    node = q->first_pkt;
    while (node != NULL) {
        AVPacketList *following = node->next;   /* read before the node is freed */

        av_free_packet(&node->pkt);
        av_freep(&node);
        node = following;
    }

    q->first_pkt = NULL;
    q->last_pkt = NULL;
    q->size = 0;
    q->nb_packets = 0;

    SDL_UnlockMutex(q->mutex);
}
/*
 * Decode the next audio frame and expose it through is->audio_buf.
 *
 * Packets are pulled from is->audioq (blocking). When the decoded frame's
 * format, channel layout or sample rate differs from the recorded source
 * parameters, a resampler is (re)built and the frame is converted into
 * is->audio_buf2; otherwise is->audio_buf points directly at the frame data.
 *
 * Returns the number of bytes available in is->audio_buf, or a negative
 * value when quitting, when the queue reports quit, or when the frame
 * cannot be allocated.
 */
int audio_decode_frame(VideoState *is) {
    int len1, len2, decoded_data_size;
    AVPacket *pkt = &is->audio_pkt;
    int got_frame = 0;
    int64_t dec_channel_layout;
    int wanted_nb_samples, resampled_data_size;

    for (;;) {
        /* Drain the current packet; it may contain more than one frame. */
        while (is->audio_pkt_size > 0) {
            AVPacket pkt_temp;

            if (!is->audio_frame) {
                if (!(is->audio_frame = avcodec_alloc_frame())) {
                    return AVERROR(ENOMEM);
                }
            } else {
                /* a reused AVFrame must be reset to its default values */
                avcodec_get_frame_defaults(is->audio_frame);
            }

            /*
             * Feed the decoder only the not-yet-consumed part of the packet.
             * A shallow copy is used so that the original packet keeps the
             * pointer needed to free it later.
             */
            pkt_temp = *pkt;
            pkt_temp.data = is->audio_pkt_data;
            pkt_temp.size = is->audio_pkt_size;

            len1 = avcodec_decode_audio4(is->audio_st->codec, is->audio_frame, &got_frame, &pkt_temp);
            if (len1 < 0) {
                /* error: skip the rest of this packet */
                is->audio_pkt_size = 0;
                break;
            }
            is->audio_pkt_data += len1;
            is->audio_pkt_size -= len1;
            if (!got_frame) {
                continue;
            }

            decoded_data_size = av_samples_get_buffer_size(NULL,
                                    is->pCodecCtx->channels,
                                    is->audio_frame->nb_samples,
                                    AVSampleFormat(is->audio_frame->format), 1);

            /* use the codec's layout only if it agrees with its channel count */
            dec_channel_layout = (is->pCodecCtx->channel_layout && is->pCodecCtx->channels
                                  == av_get_channel_layout_nb_channels(is->pCodecCtx->channel_layout))
                                 ? is->pCodecCtx->channel_layout
                                 : av_get_default_channel_layout(is->pCodecCtx->channels);
            wanted_nb_samples = is->audio_frame->nb_samples;

            /* decoded audio differs from the recorded source parameters: rebuild the resampler */
            if (is->audio_frame->format != is->audio_src_fmt ||
                dec_channel_layout != is->audio_src_channel_layout ||
                is->pCodecCtx->sample_rate != is->audio_src_freq ||
                (wanted_nb_samples != is->audio_frame->nb_samples && !is->swr_ctx)) {
                if (is->swr_ctx) swr_free(&is->swr_ctx);
                is->swr_ctx = swr_alloc_set_opts(NULL,
                                                 is->audio_tgt_channel_layout,
                                                 is->audio_tgt_fmt,
                                                 is->audio_tgt_freq,
                                                 dec_channel_layout,
                                                 AVSampleFormat(is->audio_frame->format),
                                                 is->pCodecCtx->sample_rate,
                                                 0, NULL);
                if (!is->swr_ctx || swr_init(is->swr_ctx) < 0) {
                    fprintf(stderr, "swr_init() failed\n");
                    break;
                }
                /* remember what the resampler was configured for */
                is->audio_src_channel_layout = dec_channel_layout;
                is->audio_src_channels = is->audio_st->codec->channels;
                is->audio_src_freq = is->audio_st->codec->sample_rate;
                is->audio_src_fmt = is->audio_st->codec->sample_fmt;
            }

            if (is->swr_ctx) {
                const uint8_t **in = (const uint8_t **)is->audio_frame->extended_data;
                uint8_t *out[] = { is->audio_buf2 };
                /* capacity of audio_buf2 in samples per channel */
                const int out_capacity = (int)(sizeof(is->audio_buf2)
                                               / is->audio_tgt_channels
                                               / av_get_bytes_per_sample(is->audio_tgt_fmt));

                if (wanted_nb_samples != is->audio_frame->nb_samples) {
                    swr_compensate(is->swr_ctx, (wanted_nb_samples - is->audio_frame->nb_samples)
                                   * is->audio_tgt_freq / is->pCodecCtx->sample_rate,
                                   wanted_nb_samples * is->audio_tgt_freq / is->pCodecCtx->sample_rate);
                }
                len2 = swr_convert(is->swr_ctx, out, out_capacity,
                                   in, is->audio_frame->nb_samples);
                if (len2 < 0) {
                    fprintf(stderr, "swr_convert() failed\n");
                    break;
                }
                if (len2 == out_capacity) {
                    fprintf(stderr, "warning: audio buffer is probably too small\n");
                    swr_init(is->swr_ctx);
                }
                is->audio_buf = is->audio_buf2;
                resampled_data_size = len2 * is->audio_tgt_channels * av_get_bytes_per_sample(is->audio_tgt_fmt);
            } else {
                /* no conversion needed: play straight from the frame */
                resampled_data_size = decoded_data_size;
                is->audio_buf = is->audio_frame->data[0];
            }
            /* We have data, return it and come back for more later */
            return resampled_data_size;
        }

        /* current packet exhausted (or abandoned): release it and fetch the next one */
        if (pkt->data) av_free_packet(pkt);
        memset(pkt, 0, sizeof(*pkt));
        if (is->quit) return -1;
        if (packet_queue_get(&is->audioq, pkt, 1) < 0) return -1;
        is->audio_pkt_data = pkt->data;
        is->audio_pkt_size = pkt->size;
    }
}
/*
 * SDL audio callback: fill `stream` with exactly `len` bytes of PCM.
 *
 * userdata is the VideoState registered in stream_component_open. Data is
 * taken from is->audio_buf; whenever that buffer is exhausted another frame
 * is decoded. If decoding fails, a 1024-byte block of silence is played
 * instead.
 */
void audio_callback(void *userdata, Uint8 *stream, int len) {
    VideoState *is = (VideoState *)userdata;
    int len1, audio_data_size;

    printf("audio callback 1 len=%d\n",len);
    while (len > 0) {
        if (is->audio_buf_index >= is->audio_buf_size) {
            /* everything decoded so far has been played: decode one more frame */
            audio_data_size = audio_decode_frame(is);
            if (audio_data_size < 0) {
                /*
                 * Silence. audio_buf may still be NULL (nothing decoded yet)
                 * or may point at a frame buffer shorter than 1024 bytes, so
                 * redirect it to the embedded buffer before clearing.
                 */
                is->audio_buf = is->audio_buf2;
                is->audio_buf_size = 1024;
                memset(is->audio_buf, 0, is->audio_buf_size);
            } else {
                is->audio_buf_size = audio_data_size;
            }
            is->audio_buf_index = 0;
            printf("audio callback 2 (audio_buf_size,audio_buf_index) = (%d,%d)\n",
                   (int)is->audio_buf_size, (int)is->audio_buf_index);
        }
        /* copy as much as is available, but no more than SDL asked for */
        len1 = is->audio_buf_size - is->audio_buf_index;
        if (len1 > len) {
            len1 = len;
        }
        memcpy(stream, (uint8_t *)is->audio_buf + is->audio_buf_index, len1);
        len -= len1;
        stream += len1;
        is->audio_buf_index += len1;
        printf("audio callback 3 (len1,len,audio_buf_index) = (%d,%d,%d)\n",
               len1, len, (int)is->audio_buf_index);
    }
}
/*
 * Open the SDL audio device and the decoder for stream `stream_index` of
 * is->ic, record the source/target audio parameters in *is and, for an
 * audio stream, initialise the packet queue and start playback.
 *
 * Returns 0 on success and -1 on failure (bad index, invalid stream
 * parameters, no usable audio device configuration, unsupported codec).
 * On failure after the audio device was opened, the device is closed again.
 */
int stream_component_open(VideoState *is, int stream_index) {
    AVFormatContext *ic = is->ic;
    AVCodecContext *codecCtx;
    AVCodec *codec;
    SDL_AudioSpec wanted_spec, spec;
    int64_t wanted_channel_layout;
    int wanted_nb_channels;
    /* fallback channel count to try when opening with N channels fails (0 = give up) */
    const int next_nb_channels[] = {0, 0, 1 ,6, 2, 6, 4, 6};

    if (stream_index < 0 || stream_index >= ic->nb_streams) {
        return -1;
    }
    codecCtx = ic->streams[stream_index]->codec;
    is->pCodecCtx = codecCtx;

    /* request the default layout for the stream's channel count */
    wanted_nb_channels = codecCtx->channels;
    wanted_channel_layout = av_get_default_channel_layout(wanted_nb_channels);
    wanted_channel_layout &= ~AV_CH_LAYOUT_STEREO_DOWNMIX;

    wanted_spec.channels = av_get_channel_layout_nb_channels(wanted_channel_layout);
    wanted_spec.freq = codecCtx->sample_rate;
    if (wanted_spec.freq <= 0 || wanted_spec.channels <= 0) {
        fprintf(stderr, "Invalid sample rate or channel count!\n");
        return -1;
    }
    wanted_spec.format = AUDIO_S16SYS;
    wanted_spec.silence = 0;
    wanted_spec.samples = SDL_AUDIO_BUFFER_SIZE;
    wanted_spec.callback = audio_callback;
    wanted_spec.userdata = is;

    /* retry with fewer/different channel counts until the device opens */
    while (SDL_OpenAudio(&wanted_spec, &spec) < 0) {
        fprintf(stderr, "SDL_OpenAudio (%d channels): %s\n", wanted_spec.channels, SDL_GetError());
        wanted_spec.channels = next_nb_channels[FFMIN(7, wanted_spec.channels)];
        if (!wanted_spec.channels) {
            fprintf(stderr, "No more channel combinations to try, audio open failed\n");
            return -1;
        }
        wanted_channel_layout = av_get_default_channel_layout(wanted_spec.channels);
    }
    if (spec.format != AUDIO_S16SYS) {
        fprintf(stderr, "SDL advised audio format %d is not supported!\n", spec.format);
        SDL_CloseAudio();
        return -1;
    }
    if (spec.channels != wanted_spec.channels) {
        wanted_channel_layout = av_get_default_channel_layout(spec.channels);
        if (!wanted_channel_layout) {
            fprintf(stderr, "SDL advised channel count %d is not supported!\n", spec.channels);
            SDL_CloseAudio();
            return -1;
        }
    }

    fprintf(stderr, "%d: wanted_spec.format = %d\n", __LINE__, wanted_spec.format);
    fprintf(stderr, "%d: wanted_spec.samples = %d\n", __LINE__, wanted_spec.samples);
    fprintf(stderr, "%d: wanted_spec.channels = %d\n", __LINE__, wanted_spec.channels);
    fprintf(stderr, "%d: wanted_spec.freq = %d\n", __LINE__, wanted_spec.freq);
    fprintf(stderr, "%d: spec.format = %d\n", __LINE__, spec.format);
    fprintf(stderr, "%d: spec.samples = %d\n", __LINE__, spec.samples);
    fprintf(stderr, "%d: spec.channels = %d\n", __LINE__, spec.channels);
    fprintf(stderr, "%d: spec.freq = %d\n", __LINE__, spec.freq);

    /* source parameters start out equal to the target (device) parameters */
    is->audio_src_fmt = is->audio_tgt_fmt = AV_SAMPLE_FMT_S16;
    is->audio_src_freq = is->audio_tgt_freq = spec.freq;
    is->audio_src_channel_layout = is->audio_tgt_channel_layout = wanted_channel_layout;
    is->audio_src_channels = is->audio_tgt_channels = spec.channels;

    codec = avcodec_find_decoder(codecCtx->codec_id);
    is->pCodec = codec;
    if (!codec || (avcodec_open2(codecCtx, codec, NULL) < 0)) {
        fprintf(stderr, "Unsupported codec!\n");
        SDL_CloseAudio();
        return -1;
    }
    ic->streams[stream_index]->discard = AVDISCARD_DEFAULT;

    switch (codecCtx->codec_type) {
    case AVMEDIA_TYPE_AUDIO:
        is->audioStream = stream_index;
        is->audio_st = ic->streams[stream_index];
        is->audio_buf_size = 0;
        is->audio_buf_index = 0;
        memset(&is->audio_pkt, 0, sizeof(is->audio_pkt));
        packet_queue_init(&is->audioq);
        SDL_PauseAudio(0);  /* un-pause: SDL starts invoking audio_callback */
        break;
    default:
        break;
    }
    return 0;
}
/*
static void stream_component_close(VideoState *is, int stream_index) {
AVFormatContext *oc = is->;
AVCodecContext *avctx;
if(stream_index < 0 || stream_index >= ic->nb_streams) return;
avctx = ic->streams[stream_index]->codec;
}
*/
/*
 * Reader thread entry point. `arg` is the VideoState created by main().
 *
 * Opens is->filename, opens the first audio stream found, then reads
 * packets and queues those belonging to that stream until end of file, an
 * I/O error, or is->quit. After the read loop ends it idles until is->quit
 * is set. On every exit path an FF_QUIT_EVENT is posted so the main loop
 * is never left waiting.
 *
 * Returns -1 if the input could not be opened or probed, 0 otherwise.
 */
static int decode_thread(void *arg) {
    VideoState *is = (VideoState *)arg;
    AVFormatContext *ic = NULL;
    AVPacket pkt1, *packet = &pkt1;
    int ret, i, audio_index = -1;
    int result = 0;

    is->audioStream = -1;
    global_video_state = is;

    if (avformat_open_input(&ic, is->filename, NULL, NULL) != 0) {
        fprintf(stderr, "%s: could not open input\n", is->filename);
        result = -1;
        goto fail;
    }
    is->ic = ic;
    if (avformat_find_stream_info(ic, NULL) < 0) {
        fprintf(stderr, "%s: could not find stream information\n", is->filename);
        result = -1;
        goto fail;
    }
    av_dump_format(ic, 0, is->filename, 0);

    /* pick the first audio stream */
    for (i = 0; i < ic->nb_streams; i++) {
        if (ic->streams[i]->codec->codec_type == AVMEDIA_TYPE_AUDIO && audio_index < 0) {
            audio_index = i;
            break;
        }
    }
    if (audio_index >= 0) {
        stream_component_open(is, audio_index);
    }
    /* audioStream is only set when the stream was opened successfully */
    if (is->audioStream < 0) {
        fprintf(stderr, "%s: could not open codecs\n", is->filename);
        goto fail;
    }

    /* main read loop */
    for (;;) {
        if (is->quit) break;
        if (is->audioq.size > MAX_AUDIOQ_SIZE) {
            /* queue is full enough: let the audio callback catch up */
            SDL_Delay(10);
            continue;
        }
        ret = av_read_frame(is->ic, packet);
        if (ret < 0) {
            if (ret == AVERROR_EOF || url_feof(is->ic->pb)) {
                break;
            }
            if (is->ic->pb && is->ic->pb->error) {
                break;
            }
            continue;
        }
        if (packet->stream_index == is->audioStream) {
            if (packet_queue_put(&is->audioq, packet) < 0) {
                /* the queue did not take the packet, so it is still ours to free */
                av_free_packet(packet);
            }
        } else {
            av_free_packet(packet);
        }
    }

    /* reading is finished; stay alive until asked to quit */
    while (!is->quit) {
        SDL_Delay(100);
    }

fail: {
        /* tell the main loop to shut down */
        SDL_Event event;
        event.type = FF_QUIT_EVENT;
        event.user.data1 = is;
        SDL_PushEvent(&event);
    }
    return result;
}
int main(int argc, char *argv[])
{
SDL_Event event;
VideoState *is;
is = (VideoState *)av_mallocz(sizeof(VideoState));
//if (argc < 2) {
// fprintf(stderr, "Usage: test <file>\n");
// exit(1);
//}
argv[1]="test.mp4";
av_register_all();//注册编解码库
if (SDL_Init(SDL_INIT_AUDIO)) { //初始化音频SDL
fprintf(stderr, "Could not initialize SDL - %s\n", SDL_GetError());
exit(1);
}
av_strlcpy(is->filename,argv[1], sizeof(is->filename));
is->parse_tid = SDL_CreateThread(decode_thread, is);
if (!is->parse_tid) {
av_free(is);
return -1;
}
for(;;) {
SDL_WaitEvent(&event);
switch(event.type) {
case FF_QUIT_EVENT:
case SDL_QUIT://退出
is->quit = 1;
SDL_Quit();
exit(0);
break;
default:
break;
}
}
return 0;
}