前面的文章虽然实现了播放器,但是架构是混乱的,这一篇我们做一个结构清晰的播放器。
播放器架构图
解复用、视频解码、音频解码都是很耗时的
所以我们都要新建线程来完成。
由于音频数据是由音频设备通过回调主动拉取的,所以不需要我们自己再创建音频线程。
解复用后的数据要放在队列中,所以我们新建了一个队列,用来存放解复用后的AVPacket,音频放在音频队列,视频放在视频队列。
由于解复用、视频解码、音频解码在不同的线程。所以对队列的操作也是多线程对于数据的操作,要用到SDL锁。
/*
 * FIFO of demuxed packets, filled by packet_queue_put() and drained by
 * packet_queue_get(). The list and counters are protected by `mutex`.
 */
typedef struct PacketQueue
{
    AVPacketList *first_pkt; /* head: next node handed out by packet_queue_get() */
    AVPacketList *last_pkt;  /* tail: node most recently appended by packet_queue_put() */
    int nb_packets;          /* number of nodes currently linked */
    int size;                /* sum of pkt.size over the linked nodes */
    SDL_mutex *mutex;        /* held while the list or counters are touched */
    SDL_cond *cond;          /* signalled by packet_queue_put() after each append */
    int total;               /* incremented by decode_thread() for each packet it queues */
    int end;                 /* set by decode_thread() once reading stops; makes a blocking get return -1 on an empty queue */
    int useCout;             /* incremented by audio_decode_frame() for each packet it dequeues */
    int flash;               /* set once the NULL (flush) packet has been sent to the decoder */
} PacketQueue;
/*
 * Put *q into its initial state: every field zeroed, then a fresh mutex and
 * condition variable created for it.
 */
void packet_queue_init(PacketQueue *q)
{
    /* Empty list, zero counters, all flags cleared. */
    memset(q, 0, sizeof(*q));

    q->mutex = SDL_CreateMutex();
    q->cond = SDL_CreateCond();
}
/*
 * Append a new reference to srcpkt at the tail of the queue and wake one
 * waiting consumer.
 *
 * The queue node takes its own reference on the packet via av_packet_ref();
 * the caller keeps ownership of srcpkt and may unref it after this returns.
 *
 * Returns 0 on success, -1 if the node cannot be allocated or the packet
 * cannot be referenced (the queue is left untouched in that case).
 */
int packet_queue_put(PacketQueue *q, AVPacket *srcpkt)
{
    AVPacketList *node = av_mallocz(sizeof(*node));

    if (!node)
        return -1;

    /*
     * Reference directly into the node. Going through a temporary
     * av_packet_alloc() packet and copying the struct would leak that
     * temporary on every call.
     */
    if (av_packet_ref(&node->pkt, srcpkt) < 0)
    {
        av_free(node);
        return -1;
    }
    node->next = NULL;

    SDL_LockMutex(q->mutex);
    if (!q->last_pkt)
        q->first_pkt = node;
    else
        q->last_pkt->next = node;
    q->last_pkt = node;
    q->nb_packets++;
    q->size += node->pkt.size;
    SDL_CondSignal(q->cond);
    SDL_UnlockMutex(q->mutex);
    return 0;
}
/*
 * Remove the packet at the head of the queue and move it into *pkt.
 *
 * block != 0: wait on the queue's condition variable while the queue is
 *             empty and q->end is not set.
 * block == 0: return immediately when the queue is empty.
 *
 * Returns 1 when a packet was stored in *pkt (the caller now owns it),
 * 0 when the queue is empty in non-blocking mode, and -1 when the global
 * quit flag is set or the queue is empty with q->end set.
 */
int packet_queue_get(PacketQueue *q, AVPacket *pkt, int block)
{
    int result = 0;
    int finished = 0;

    SDL_LockMutex(q->mutex);
    while (!finished)
    {
        AVPacketList *head;

        /* The quit flag is checked first on every pass, including after a wake-up. */
        if (global_video_state->quit)
        {
            fprintf(stderr, "quit from queue_get\n");
            result = -1;
            finished = 1;
            continue;
        }

        head = q->first_pkt;
        if (head != NULL)
        {
            /* Unlink the head node and hand its packet to the caller. */
            q->first_pkt = head->next;
            if (q->first_pkt == NULL)
                q->last_pkt = NULL;
            q->nb_packets--;
            q->size -= head->pkt.size;
            *pkt = head->pkt;
            av_free(head);
            result = 1;
            finished = 1;
        }
        else if (!block)
        {
            result = 0;
            finished = 1;
        }
        else if (q->end)
        {
            result = -1;
            finished = 1;
        }
        else
        {
            fprintf(stderr, "queue is empty, so wait a moment and wait a cond signal\n");
            SDL_CondWait(q->cond, q->mutex);
        }
    }
    SDL_UnlockMutex(q->mutex);
    return result;
}
从代码中我们可以看到,取元素的过程中,如果队列里没有元素了(并且解复用尚未结束),就会通过条件变量的等待函数阻塞,等待新的数据入队。
/* Excerpt from packet_queue_get(): the queue is empty, the caller asked to
 * block, and q->end is not set, so wait on the queue's condition variable. */
else if(!(q->end))
{
fprintf(stderr, "queue is empty, so wait a moment and wait a cond signal\n");
SDL_CondWait(q->cond, q->mutex);
}
对于音频来说,最重要的参数是采样大小(位深)、采样率和声道数。在重采样的时候,采样个数也非常重要:一般情况下,重采样后的采样个数要和输入的采样个数相等。
下面是音频解码的操作:
/* Excerpt from stream_component_open(): for an audio stream, describe the
 * wanted output (codec sample rate, signed 16-bit samples, out_channel
 * channels, out_nb_samples samples per callback) and open the SDL audio
 * device with audio_callback as the data source. */
if (codecCtx->codec_type == AVMEDIA_TYPE_AUDIO)
{
// Set audio settings from codec info
wanted_spec.freq = codecCtx->sample_rate;
wanted_spec.format = AUDIO_S16SYS;
wanted_spec.channels = out_channel;
wanted_spec.silence = 0;
wanted_spec.samples = out_nb_samples;
wanted_spec.callback = audio_callback;
wanted_spec.userdata = is;
if (SDL_OpenAudio(&wanted_spec, &spec) < 0)
{
fprintf(stderr, "SDL_OpenAudio: %s\n", SDL_GetError());
return -1;
}
}
我们通过代码可以知道,音频设备播放会从audio_callback获取播放数据。
/*
 * SDL audio callback: fill `stream` with exactly `len` bytes.
 *
 * userdata is the VideoState passed in the audio spec. Data is taken from
 * is->audio_buf; whenever that buffer is exhausted it is refilled through
 * audio_decode_frame(). If decoding fails, a fixed block of silence is used
 * instead so the device keeps running.
 */
void audio_callback(void *userdata, Uint8 *stream, int len)
{
    VideoState *is = (VideoState *)userdata;

    /* Start from silence; SDL_MixAudio() below mixes into this buffer. */
    SDL_memset(stream, 0, len);

    while (len > 0)
    {
        int chunk;

        if (is->audio_buf_index >= is->audio_buf_size)
        {
            /* We have already sent all our data; get more */
            int audio_size = audio_decode_frame(is, is->audio_buf, sizeof(is->audio_buf));

            if (audio_size < 0)
            {
                /* If error, output silence */
                is->audio_buf_size = 1024 * 2 * 2;
                memset(is->audio_buf, 0, is->audio_buf_size);
            }
            else
            {
                is->audio_buf_size = audio_size;
            }
            is->audio_buf_index = 0;
        }

        chunk = is->audio_buf_size - is->audio_buf_index;
        /* %u matches the unsigned buffer counters; %p requires a void pointer. */
        fprintf(stderr, "stream addr:%p, audio_buf_index:%u, audio_buf_size:%u, len1:%d, len:%d\n",
                (void *)stream,
                is->audio_buf_index,
                is->audio_buf_size,
                chunk,
                len);
        if (chunk > len)
            chunk = len;

        SDL_MixAudio(stream, (uint8_t *)is->audio_buf + is->audio_buf_index, chunk, SDL_MIX_MAXVOLUME);
        len -= chunk;
        stream += chunk;
        is->audio_buf_index += chunk;
    }
}
我们会从audio_decode_frame获取解码后的数据
ffmpeg 解码是通过avcodec_send_packet和avcodec_receive_frame来完成的。他们不是一一对应出现的。一个AVPacket中可能包含多个frame。所以一般写代码是这样的
avcodec_send_packet
while(avcodec_receive_frame == 0){
}
我们audio_decode_frame的逻辑是这样的
伪代码
if(avcodec_receive_frame == 0){
return size;
}
从队列中获取AVPacket
avcodec_send_packet
if(avcodec_receive_frame == 0){
return size;
}
return -1;
真正代码
/*
 * Decode one audio frame and resample it into audio_buf.
 *
 * Order of operations:
 *   1. try to receive a frame still pending in the decoder;
 *   2. otherwise take one packet from is->audioq (blocking) and send it, or,
 *      when the queue reports end/quit, send the NULL flush packet once;
 *   3. receive a frame and convert it with is->audio_swr_ctx.
 *
 * buf_size is the capacity of audio_buf in bytes and bounds the conversion.
 *
 * Returns the number of bytes written to audio_buf, or a negative value when
 * quitting, on decode/convert errors, or when the decoder has no frame
 * (including end of stream).
 */
int audio_decode_frame(VideoState *is, uint8_t *audio_buf, int buf_size)
{
    /*
     * Reused across calls and never freed. It is allocated with
     * av_frame_alloc() and filled only by avcodec_receive_frame(), which
     * releases the previous contents itself; pre-allocating buffers with
     * av_frame_get_buffer() on every call would leak the previous frame.
     */
    static AVFrame *frame = NULL;
    AVPacket pkt;
    int bytes_per_frame = av_get_bytes_per_sample(out_format) * out_channel;
    int converted;
    int ret;

    if (is->quit)
        return -1;
    if (bytes_per_frame <= 0)
        return -1;
    if (!frame)
    {
        frame = av_frame_alloc();
        if (!frame)
            return -1;
    }

    /* A previously sent packet may still hold undelivered frames. */
    ret = avcodec_receive_frame(is->audio_ctx, frame);
    if (ret != 0)
    {
        av_init_packet(&pkt);
        pkt.data = NULL;
        pkt.size = 0;

        if (packet_queue_get(&(is->audioq), &pkt, 1) < 0)
        {
            /* No more packets: flush the decoder exactly once. */
            if (!is->audioq.flash)
            {
                av_log(NULL, AV_LOG_ERROR, "flash audio\n");
                is->audioq.flash = 1;
                if (avcodec_send_packet(is->audio_ctx, NULL) < 0)
                    return -1;
            }
        }
        else
        {
            ++(is->audioq.useCout);
            ret = avcodec_send_packet(is->audio_ctx, &pkt);
            /* The decoder keeps its own reference; ours can go now. */
            av_packet_unref(&pkt);
            if (ret < 0)
            {
                printf("decode error");
                return -1;
            }
        }

        ret = avcodec_receive_frame(is->audio_ctx, frame);
        if (ret < 0)
            return ret;
    }

    /* Report what swr_convert() actually produced, bounded by the buffer. */
    converted = swr_convert(is->audio_swr_ctx,
                            &audio_buf,
                            buf_size / bytes_per_frame,
                            (const uint8_t **)frame->extended_data,
                            frame->nb_samples);
    if (converted < 0)
        return -1;
    return converted * bytes_per_frame;
}
当队列中没有AVPacket时,并且是已经把多媒体文件读完了,我们就要avcodec_send_packet(NULL)用来刷新缓存,告知解码器文件已经读完了。
/* Excerpt from audio_decode_frame(): packet_queue_get() returned a negative
 * value, so no packet was obtained. The first time this happens the NULL
 * packet is sent to the decoder and `flash` is set; later passes skip
 * straight to receiving frames. */
if (packet_queue_get(&(is->audioq), &pkt, 1) < 0 )
{
if(is->audioq.flash){
goto __RECEIVE;
}
av_log(NULL, AV_LOG_ERROR, "flash audio\n");
is->audioq.flash = 1;
ret = avcodec_send_packet(is->audio_ctx, NULL);
if (ret < 0)
{
return -1;
}
goto __RECEIVE;
}
视频解码与渲染
在主线程中,我们通过定时器来触发视频渲染:如果视频的帧率是25帧,那么我们就每隔1000/25=40ms执行一次渲染。视频解码是很耗时的,所以我们要启动一个线程来对视频进行解码。解码后我们要根据需求把AVFrame缩放、转换为YUV格式的数据。解码流程同音频解码流程。解码后的数据放在解码后的视频帧队列中。渲染函数每隔40ms就从这个队列中取一帧数据进行渲染。
渲染代码
/*
 * Arm a one-shot SDL timer that calls sdl_refresh_timer_cb(is) after `delay`
 * milliseconds. A failure is reported, because without the timer no further
 * refresh event will be generated.
 */
static void schedule_refresh(VideoState *is, int delay)
{
    /* SDL_AddTimer() returns 0 when the timer could not be created. */
    if (SDL_AddTimer(delay, sdl_refresh_timer_cb, is) == 0)
        fprintf(stderr, "SDL_AddTimer: %s\n", SDL_GetError());
}
/*
 * SDL timer callback: post an FF_REFRESH_EVENT whose user.data1 carries
 * `opaque`, so the refresh is handled by the event loop. Returns 0 so the
 * timer does not repeat.
 */
static Uint32 sdl_refresh_timer_cb(Uint32 interval, void *opaque)
{
    SDL_Event event;

    (void)interval;
    /* Clear the whole event first so no uninitialised fields are queued. */
    SDL_memset(&event, 0, sizeof(event));
    event.type = FF_REFRESH_EVENT;
    event.user.data1 = opaque;
    SDL_PushEvent(&event);
    return 0; /* 0 means stop timer */
}
/*
 * Handle one refresh event: show the next queued picture, if any, and arm
 * the timer for the following refresh.
 *
 * userdata is the VideoState. Delays used: 100 ms while there is no video
 * stream yet, 1 ms while the picture queue is empty, REFRESH_TIME otherwise.
 */
void video_refresh_timer(void *userdata)
{
    VideoState *is = (VideoState *)userdata;

    if (!is->video_st)
    {
        schedule_refresh(is, 100);
        return;
    }

    if (is->pictq_size == 0)
    {
        /* Nothing decoded yet: poll the queue again as soon as possible. */
        schedule_refresh(is, 1);
        return;
    }

    /* Fixed frame interval; no timestamp-based synchronisation is done here. */
    schedule_refresh(is, REFRESH_TIME);

    /* show the picture! */
    video_display(is);

    /* Advance the read index, wrapping at the end of the ring. */
    is->pictq_rindex++;
    if (is->pictq_rindex == VIDEO_PICTURE_QUEUE_SIZE)
        is->pictq_rindex = 0;

    /* Release the slot and wake a producer waiting in queue_picture(). */
    SDL_LockMutex(is->pictq_mutex);
    is->pictq_size--;
    SDL_CondSignal(is->pictq_cond);
    SDL_UnlockMutex(is->pictq_mutex);
}
视频解码代码同音频解码类似,视频解码后会放在frame队列中,等待渲染函数去获取。
int video_thread(void *arg)
{
VideoState *is = (VideoState *)arg;
static AVPacket pkt;
static AVFrame pFrame;
int ret = 0;
av_init_packet(&pkt);
pkt.data = NULL;
pkt.size = 0;
for (;;)
{
if (pkt.data)
av_packet_unref(&pkt);
if (packet_queue_get(&is->videoq, &pkt, 1) < 0)
{
if(is->videoq.flash){
goto __RECEIVE;
}
av_log(NULL, AV_LOG_ERROR, "flash audio\n");
is->videoq.flash = 1;
ret = avcodec_send_packet(is->video_ctx, NULL);
if (ret < 0)
{
goto __ERROR;
}
goto __RECEIVE;
}
ret = avcodec_send_packet(is->video_ctx, &pkt);
if (ret != 0)
{
printf("decode error");
goto __ERROR;
}
__RECEIVE:
ret = avcodec_receive_frame(is->video_ctx, &pFrame);
if (ret != 0)
{
continue;
}
ret = queue_picture(is, &pFrame);
if (ret < 0)
{
goto __ERROR;
}
}
__ERROR:
if (pkt.data)
{
av_packet_unref(&pkt);
}
return ret;
}
/*
 * Convert a decoded frame with is->sws_ctx and store it in the next free
 * slot of the picture queue.
 *
 * Blocks while the queue is full and is->quit is not set. The slot's buffer
 * is (re)allocated through alloc_picture() when it does not exist yet or the
 * video size changed.
 *
 * Returns 0 on success (also when the slot has no buffer and the frame is
 * dropped), -1 when quitting.
 */
int queue_picture(VideoState *is, AVFrame *pFrame)
{
    VideoPicture *vp;

    /* wait until we have space for a new pic */
    SDL_LockMutex(is->pictq_mutex);
    while (is->pictq_size >= VIDEO_PICTURE_QUEUE_SIZE &&
           !is->quit)
    {
        SDL_CondWait(is->pictq_cond, is->pictq_mutex);
    }
    SDL_UnlockMutex(is->pictq_mutex);

    if (is->quit)
    {
        fprintf(stderr, "quit from queue_picture....\n");
        return -1;
    }

    // windex is set to 0 initially
    vp = &is->pictq[is->pictq_windex];

    /* allocate or resize the buffer! */
    if (!vp->yuv_frame ||
        vp->width != is->video_ctx->width ||
        vp->height != is->video_ctx->height)
    {
        vp->allocated = 0;
        alloc_picture(is);
        if (is->quit)
        {
            fprintf(stderr, "quit from queue_picture2....\n");
            return -1;
        }
    }

    /* We have a place to put our picture on the queue */
    if (vp->yuv_frame)
    {
        // Convert the image into YUV format that SDL uses
        sws_scale(is->sws_ctx,
                  (uint8_t const *const *)pFrame->data,
                  pFrame->linesize,
                  0,
                  is->video_ctx->height,
                  vp->yuv_frame->data,
                  vp->yuv_frame->linesize);

        /* Advance the write index, wrapping at the end of the ring. */
        if (++is->pictq_windex == VIDEO_PICTURE_QUEUE_SIZE)
        {
            is->pictq_windex = 0;
        }

        /* now we inform our display thread that we have a pic ready */
        SDL_LockMutex(is->pictq_mutex);
        is->pictq_size++;
        SDL_UnlockMutex(is->pictq_mutex);
    }
    return 0;
}
我们要在播放过程中能够关闭视频播放器,所以我们要在main函数中放入等待事件的函数。
/* Excerpt from main(): the event loop. A quit event sets is->quit, signals
 * the audio-queue and picture-queue condition variables and leaves the loop;
 * a refresh event runs video_refresh_timer(). */
for (;;)
{
SDL_WaitEvent(&event);
switch (event.type)
{
case FF_QUIT_EVENT:
case SDL_QUIT:
fprintf(stderr, "receive a QUIT event: %d\n", event.type);
is->quit = 1;
SDL_CondSignal(is->audioq.cond);
SDL_CondSignal(is->pictq_cond);
goto __QUIT;
break;
case FF_REFRESH_EVENT:
//fprintf(stderr, "receive a refresh event: %d\n", event.type);
video_refresh_timer(event.user.data1);
break;
default:
break;
}
}
如何关闭所有的线程呢?
我们收到关闭事件后,重置一个全局变量quit,其他线程能够尽快检测到这个变量quit,如果quit==1,就退出当前执行的线程。
/* Excerpt from main(): on quit, set the shared flag first, then signal the
 * condition variables so that waiting threads re-check it. */
case SDL_QUIT:
fprintf(stderr, "receive a QUIT event: %d\n", event.type);
is->quit = 1;
SDL_CondSignal(is->audioq.cond);
SDL_CondSignal(is->pictq_cond);
goto __QUIT;
break;
播放后,我们一定不要忘了释放资源。
下面是完整代码:
#include <stdio.h>
#include <assert.h>
#include <math.h>
#include <SDL2/SDL.h>
#include <libavcodec/avcodec.h>
#include <libavformat/avformat.h>
#include <libswscale/swscale.h>
#include <libswresample/swresample.h>
#include <libavutil/samplefmt.h>
#include <libavutil/imgutils.h>
#include <libavutil/mem.h>
/* Size basis of VideoState.audio_buf (the buffer is 3/2 of this value). */
#define MAX_AUDIO_FRAME_SIZE 192000
/* Demuxing pauses while a queue holds more than these many bytes. */
#define MAX_AUDIOQ_SIZE (5 * 16 * 1024)
#define MAX_VIDEOQ_SIZE (5 * 256 * 1024)
/* Application-defined SDL event types. */
#define FF_REFRESH_EVENT SDL_USEREVENT
/* Parenthesised so the macro expands safely inside larger expressions. */
#define FF_QUIT_EVENT (SDL_USEREVENT + 1)
/* Delay in milliseconds between two displayed pictures. */
#define REFRESH_TIME 45
/* Number of slots in VideoState.pictq. */
#define VIDEO_PICTURE_QUEUE_SIZE 1
/* Pixel format given to the frames allocated in alloc_picture(). */
static enum AVPixelFormat out_yuv_foramt = AV_PIX_FMT_YUV420P;
/*
 * FIFO of demuxed packets, filled by packet_queue_put() and drained by
 * packet_queue_get(). The list and counters are protected by `mutex`.
 */
typedef struct PacketQueue
{
    AVPacketList *first_pkt; /* head: next node handed out by packet_queue_get() */
    AVPacketList *last_pkt;  /* tail: node most recently appended by packet_queue_put() */
    int nb_packets;          /* number of nodes currently linked */
    int size;                /* sum of pkt.size over the linked nodes */
    SDL_mutex *mutex;        /* held while the list or counters are touched */
    SDL_cond *cond;          /* signalled by packet_queue_put() after each append */
    int total;               /* incremented by decode_thread() for each packet it queues */
    int end;                 /* set by decode_thread() once reading stops; makes a blocking get return -1 on an empty queue */
    int useCout;             /* incremented by audio_decode_frame() for each packet it dequeues */
    int flash;               /* set once the NULL (flush) packet has been sent to the decoder */
} PacketQueue;
/* One slot of the decoded-picture queue (VideoState.pictq). */
typedef struct VideoPicture
{
    AVFrame *yuv_frame; /* converted picture; created by alloc_picture() */
    int width;          /* video width the buffer was allocated for */
    int height;         /* video height the buffer was allocated for */
    int allocated;      /* set to 1 by alloc_picture(), cleared before reallocation */
} VideoPicture;
/*
 * Whole-player state shared by the main thread, the demux thread, the video
 * decoding thread and the SDL audio callback.
 */
typedef struct VideoState
{
    char filename[1024];         /* path of the media file to open */
    AVFormatContext *pFormatCtx; /* opened input */
    int videoStream;             /* index of the selected video stream, -1 if none */
    int audioStream;             /* index of the selected audio stream, -1 if none */

    /* audio */
    AVStream *audio_st;
    AVCodecContext *audio_ctx;   /* audio decoder */
    PacketQueue audioq;          /* demuxed audio packets */
    uint8_t audio_buf[(MAX_AUDIO_FRAME_SIZE * 3) / 2]; /* resampled audio awaiting playback */
    unsigned int audio_buf_size;  /* valid bytes in audio_buf */
    unsigned int audio_buf_index; /* bytes of audio_buf already handed to SDL */
    struct SwrContext *audio_swr_ctx; /* resampler used by audio_decode_frame() */

    /* video */
    AVStream *video_st;
    AVCodecContext *video_ctx;   /* video decoder */
    PacketQueue videoq;          /* demuxed video packets */
    struct SwsContext *sws_ctx;  /* pixel converter used by queue_picture() */
    VideoPicture pictq[VIDEO_PICTURE_QUEUE_SIZE]; /* ring of converted pictures */
    int pictq_size;              /* pictures currently queued */
    int pictq_rindex;            /* next slot to display */
    int pictq_windex;            /* next slot to fill */

    /* threading */
    SDL_mutex *pictq_mutex;      /* held while pictq_size is changed */
    SDL_cond *pictq_cond;        /* signalled when a picture slot is released */
    SDL_Thread *parse_tid;       /* decode_thread */
    SDL_Thread *video_tid;       /* video_thread */
    int quit;                    /* set to 1 to ask every thread to stop */
} VideoState;
//SDL_mutex *texture_mutex;
/* SDL objects used by video_display(); created in main(). */
SDL_Window *win;
SDL_Renderer *renderer;
SDL_Texture *texture;
/* Set by init_VideoState(); read by packet_queue_get() for the quit flag. */
VideoState *global_video_state;
/* Output audio format requested from the resampler and from SDL. */
static Uint8 out_channel = 2;
static enum AVSampleFormat out_format = AV_SAMPLE_FMT_S16;
static int out_nb_samples = 0; // normally the output sample count should equal the input sample count
static int out_sample_rate = 0;
/* Destination pixel format passed to sws_getContext(). */
static enum AVPixelFormat out_pix_foramt = AV_PIX_FMT_YUV420P;
/*
 * Put *q into its initial state: every field zeroed, then a fresh mutex and
 * condition variable created for it.
 */
void packet_queue_init(PacketQueue *q)
{
    /* Empty list, zero counters, all flags cleared. */
    memset(q, 0, sizeof(*q));

    q->mutex = SDL_CreateMutex();
    q->cond = SDL_CreateCond();
}
/*
 * Append a new reference to srcpkt at the tail of the queue and wake one
 * waiting consumer.
 *
 * The queue node takes its own reference on the packet via av_packet_ref();
 * the caller keeps ownership of srcpkt and may unref it after this returns.
 *
 * Returns 0 on success, -1 if the node cannot be allocated or the packet
 * cannot be referenced (the queue is left untouched in that case).
 */
int packet_queue_put(PacketQueue *q, AVPacket *srcpkt)
{
    AVPacketList *node = av_mallocz(sizeof(*node));

    if (!node)
        return -1;

    /*
     * Reference directly into the node. Going through a temporary
     * av_packet_alloc() packet and copying the struct would leak that
     * temporary on every call.
     */
    if (av_packet_ref(&node->pkt, srcpkt) < 0)
    {
        av_free(node);
        return -1;
    }
    node->next = NULL;

    SDL_LockMutex(q->mutex);
    if (!q->last_pkt)
        q->first_pkt = node;
    else
        q->last_pkt->next = node;
    q->last_pkt = node;
    q->nb_packets++;
    q->size += node->pkt.size;
    SDL_CondSignal(q->cond);
    SDL_UnlockMutex(q->mutex);
    return 0;
}
/*
 * Remove the packet at the head of the queue and move it into *pkt.
 *
 * block != 0: wait on the queue's condition variable while the queue is
 *             empty and q->end is not set.
 * block == 0: return immediately when the queue is empty.
 *
 * Returns 1 when a packet was stored in *pkt (the caller now owns it),
 * 0 when the queue is empty in non-blocking mode, and -1 when the global
 * quit flag is set or the queue is empty with q->end set.
 */
int packet_queue_get(PacketQueue *q, AVPacket *pkt, int block)
{
    int result = 0;
    int finished = 0;

    SDL_LockMutex(q->mutex);
    while (!finished)
    {
        AVPacketList *head;

        /* The quit flag is checked first on every pass, including after a wake-up. */
        if (global_video_state->quit)
        {
            fprintf(stderr, "quit from queue_get\n");
            result = -1;
            finished = 1;
            continue;
        }

        head = q->first_pkt;
        if (head != NULL)
        {
            /* Unlink the head node and hand its packet to the caller. */
            q->first_pkt = head->next;
            if (q->first_pkt == NULL)
                q->last_pkt = NULL;
            q->nb_packets--;
            q->size -= head->pkt.size;
            *pkt = head->pkt;
            av_free(head);
            result = 1;
            finished = 1;
        }
        else if (!block)
        {
            result = 0;
            finished = 1;
        }
        else if (q->end)
        {
            result = -1;
            finished = 1;
        }
        else
        {
            fprintf(stderr, "queue is empty, so wait a moment and wait a cond signal\n");
            SDL_CondWait(q->cond, q->mutex);
        }
    }
    SDL_UnlockMutex(q->mutex);
    return result;
}
/*
 * Decode one audio frame and resample it into audio_buf.
 *
 * Order of operations:
 *   1. try to receive a frame still pending in the decoder;
 *   2. otherwise take one packet from is->audioq (blocking) and send it, or,
 *      when the queue reports end/quit, send the NULL flush packet once;
 *   3. receive a frame and convert it with is->audio_swr_ctx.
 *
 * buf_size is the capacity of audio_buf in bytes and bounds the conversion.
 *
 * Returns the number of bytes written to audio_buf, or a negative value when
 * quitting, on decode/convert errors, or when the decoder has no frame
 * (including end of stream).
 */
int audio_decode_frame(VideoState *is, uint8_t *audio_buf, int buf_size)
{
    /*
     * Reused across calls and never freed. It is allocated with
     * av_frame_alloc() and filled only by avcodec_receive_frame(), which
     * releases the previous contents itself; pre-allocating buffers with
     * av_frame_get_buffer() on every call would leak the previous frame.
     */
    static AVFrame *frame = NULL;
    AVPacket pkt;
    int bytes_per_frame = av_get_bytes_per_sample(out_format) * out_channel;
    int converted;
    int ret;

    if (is->quit)
        return -1;
    if (bytes_per_frame <= 0)
        return -1;
    if (!frame)
    {
        frame = av_frame_alloc();
        if (!frame)
            return -1;
    }

    /* A previously sent packet may still hold undelivered frames. */
    ret = avcodec_receive_frame(is->audio_ctx, frame);
    if (ret != 0)
    {
        av_init_packet(&pkt);
        pkt.data = NULL;
        pkt.size = 0;

        if (packet_queue_get(&(is->audioq), &pkt, 1) < 0)
        {
            /* No more packets: flush the decoder exactly once. */
            if (!is->audioq.flash)
            {
                av_log(NULL, AV_LOG_ERROR, "flash audio\n");
                is->audioq.flash = 1;
                if (avcodec_send_packet(is->audio_ctx, NULL) < 0)
                    return -1;
            }
        }
        else
        {
            ++(is->audioq.useCout);
            ret = avcodec_send_packet(is->audio_ctx, &pkt);
            /* The decoder keeps its own reference; ours can go now. */
            av_packet_unref(&pkt);
            if (ret < 0)
            {
                printf("decode error");
                return -1;
            }
        }

        ret = avcodec_receive_frame(is->audio_ctx, frame);
        if (ret < 0)
            return ret;
    }

    /* Report what swr_convert() actually produced, bounded by the buffer. */
    converted = swr_convert(is->audio_swr_ctx,
                            &audio_buf,
                            buf_size / bytes_per_frame,
                            (const uint8_t **)frame->extended_data,
                            frame->nb_samples);
    if (converted < 0)
        return -1;
    return converted * bytes_per_frame;
}
/*
 * SDL audio callback: fill `stream` with exactly `len` bytes.
 *
 * userdata is the VideoState passed in the audio spec. Data is taken from
 * is->audio_buf; whenever that buffer is exhausted it is refilled through
 * audio_decode_frame(). If decoding fails, a fixed block of silence is used
 * instead so the device keeps running.
 */
void audio_callback(void *userdata, Uint8 *stream, int len)
{
    VideoState *is = (VideoState *)userdata;

    /* Start from silence; SDL_MixAudio() below mixes into this buffer. */
    SDL_memset(stream, 0, len);

    while (len > 0)
    {
        int chunk;

        if (is->audio_buf_index >= is->audio_buf_size)
        {
            /* We have already sent all our data; get more */
            int audio_size = audio_decode_frame(is, is->audio_buf, sizeof(is->audio_buf));

            if (audio_size < 0)
            {
                /* If error, output silence */
                is->audio_buf_size = 1024 * 2 * 2;
                memset(is->audio_buf, 0, is->audio_buf_size);
            }
            else
            {
                is->audio_buf_size = audio_size;
            }
            is->audio_buf_index = 0;
        }

        chunk = is->audio_buf_size - is->audio_buf_index;
        /* %u matches the unsigned buffer counters; %p requires a void pointer. */
        fprintf(stderr, "stream addr:%p, audio_buf_index:%u, audio_buf_size:%u, len1:%d, len:%d\n",
                (void *)stream,
                is->audio_buf_index,
                is->audio_buf_size,
                chunk,
                len);
        if (chunk > len)
            chunk = len;

        SDL_MixAudio(stream, (uint8_t *)is->audio_buf + is->audio_buf_index, chunk, SDL_MIX_MAXVOLUME);
        len -= chunk;
        stream += chunk;
        is->audio_buf_index += chunk;
    }
}
/*
 * SDL timer callback: post an FF_REFRESH_EVENT whose user.data1 carries
 * `opaque`, so the refresh is handled by the event loop. Returns 0 so the
 * timer does not repeat.
 */
static Uint32 sdl_refresh_timer_cb(Uint32 interval, void *opaque)
{
    SDL_Event event;

    (void)interval;
    /* Clear the whole event first so no uninitialised fields are queued. */
    SDL_memset(&event, 0, sizeof(event));
    event.type = FF_REFRESH_EVENT;
    event.user.data1 = opaque;
    SDL_PushEvent(&event);
    return 0; /* 0 means stop timer */
}
/*
 * Arm a one-shot SDL timer that calls sdl_refresh_timer_cb(is) after `delay`
 * milliseconds. A failure is reported, because without the timer no further
 * refresh event will be generated.
 */
static void schedule_refresh(VideoState *is, int delay)
{
    /* SDL_AddTimer() returns 0 when the timer could not be created. */
    if (SDL_AddTimer(delay, sdl_refresh_timer_cb, is) == 0)
        fprintf(stderr, "SDL_AddTimer: %s\n", SDL_GetError());
}
/*
 * Upload the picture at the queue's read index to the global texture and
 * present it. Does nothing when that slot has no frame.
 *
 * The destination rectangle starts at (0, 0) and has the decoder's video
 * width and height.
 */
void video_display(VideoState *is)
{
    VideoPicture *vp = &is->pictq[is->pictq_rindex];
    SDL_Rect rect;

    if (!vp->yuv_frame)
        return;

    /* Planes 0, 1 and 2 of the frame are passed as Y, U and V. */
    SDL_UpdateYUVTexture(texture, NULL,
                         vp->yuv_frame->data[0], vp->yuv_frame->linesize[0],
                         vp->yuv_frame->data[1], vp->yuv_frame->linesize[1],
                         vp->yuv_frame->data[2], vp->yuv_frame->linesize[2]);

    rect.x = 0;
    rect.y = 0;
    rect.w = is->video_ctx->width;
    rect.h = is->video_ctx->height;

    SDL_RenderClear(renderer);
    SDL_RenderCopy(renderer, texture, NULL, &rect);
    SDL_RenderPresent(renderer);
}
/*
 * Handle one refresh event: show the next queued picture, if any, and arm
 * the timer for the following refresh.
 *
 * userdata is the VideoState. Delays used: 100 ms while there is no video
 * stream yet, 1 ms while the picture queue is empty, REFRESH_TIME otherwise.
 */
void video_refresh_timer(void *userdata)
{
    VideoState *is = (VideoState *)userdata;

    if (!is->video_st)
    {
        schedule_refresh(is, 100);
        return;
    }

    if (is->pictq_size == 0)
    {
        /* Nothing decoded yet: poll the queue again as soon as possible. */
        schedule_refresh(is, 1);
        return;
    }

    /* Fixed frame interval; no timestamp-based synchronisation is done here. */
    schedule_refresh(is, REFRESH_TIME);

    /* show the picture! */
    video_display(is);

    /* Advance the read index, wrapping at the end of the ring. */
    is->pictq_rindex++;
    if (is->pictq_rindex == VIDEO_PICTURE_QUEUE_SIZE)
        is->pictq_rindex = 0;

    /* Release the slot and wake a producer waiting in queue_picture(). */
    SDL_LockMutex(is->pictq_mutex);
    is->pictq_size--;
    SDL_CondSignal(is->pictq_cond);
    SDL_UnlockMutex(is->pictq_mutex);
}
void alloc_picture(void *userdata)
{
VideoState *is = (VideoState *)userdata;
VideoPicture *vp;
vp = &is->pictq[is->pictq_windex];
if (vp->yuv_frame)
{ //free space if vp->pict is not NULL
av_frame_free(&(vp->yuv_frame));
free(vp->yuv_frame);
}
// Allocate a place to put our YUV image on that screen
//SDL_LockMutex(texture_mutex);
vp->yuv_frame = av_frame_alloc();
vp->yuv_frame->width = is->video_ctx->width;
vp->yuv_frame->height = is->video_ctx->height;
vp->yuv_frame->format = out_yuv_foramt;
av_frame_get_buffer(vp->yuv_frame, 32);
vp->width = is->video_ctx->width;
vp->height = is->video_ctx->height;
vp->allocated = 1;
}
/*
 * Convert a decoded frame with is->sws_ctx and store it in the next free
 * slot of the picture queue.
 *
 * Blocks while the queue is full and is->quit is not set. The slot's buffer
 * is (re)allocated through alloc_picture() when it does not exist yet or the
 * video size changed.
 *
 * Returns 0 on success (also when the slot has no buffer and the frame is
 * dropped), -1 when quitting.
 */
int queue_picture(VideoState *is, AVFrame *pFrame)
{
    VideoPicture *vp;

    /* wait until we have space for a new pic */
    SDL_LockMutex(is->pictq_mutex);
    while (is->pictq_size >= VIDEO_PICTURE_QUEUE_SIZE &&
           !is->quit)
    {
        SDL_CondWait(is->pictq_cond, is->pictq_mutex);
    }
    SDL_UnlockMutex(is->pictq_mutex);

    if (is->quit)
    {
        fprintf(stderr, "quit from queue_picture....\n");
        return -1;
    }

    // windex is set to 0 initially
    vp = &is->pictq[is->pictq_windex];

    /* allocate or resize the buffer! */
    if (!vp->yuv_frame ||
        vp->width != is->video_ctx->width ||
        vp->height != is->video_ctx->height)
    {
        vp->allocated = 0;
        alloc_picture(is);
        if (is->quit)
        {
            fprintf(stderr, "quit from queue_picture2....\n");
            return -1;
        }
    }

    /* We have a place to put our picture on the queue */
    if (vp->yuv_frame)
    {
        // Convert the image into YUV format that SDL uses
        sws_scale(is->sws_ctx,
                  (uint8_t const *const *)pFrame->data,
                  pFrame->linesize,
                  0,
                  is->video_ctx->height,
                  vp->yuv_frame->data,
                  vp->yuv_frame->linesize);

        /* Advance the write index, wrapping at the end of the ring. */
        if (++is->pictq_windex == VIDEO_PICTURE_QUEUE_SIZE)
        {
            is->pictq_windex = 0;
        }

        /* now we inform our display thread that we have a pic ready */
        SDL_LockMutex(is->pictq_mutex);
        is->pictq_size++;
        SDL_UnlockMutex(is->pictq_mutex);
    }
    return 0;
}
int video_thread(void *arg)
{
VideoState *is = (VideoState *)arg;
static AVPacket pkt;
static AVFrame pFrame;
int ret = 0;
av_init_packet(&pkt);
pkt.data = NULL;
pkt.size = 0;
for (;;)
{
if (pkt.data)
av_packet_unref(&pkt);
if (packet_queue_get(&is->videoq, &pkt, 1) < 0)
{
if(is->videoq.flash){
goto __RECEIVE;
}
av_log(NULL, AV_LOG_ERROR, "flash audio\n");
is->videoq.flash = 1;
ret = avcodec_send_packet(is->video_ctx, NULL);
if (ret < 0)
{
goto __ERROR;
}
goto __RECEIVE;
}
ret = avcodec_send_packet(is->video_ctx, &pkt);
if (ret != 0)
{
printf("decode error");
goto __ERROR;
}
__RECEIVE:
ret = avcodec_receive_frame(is->video_ctx, &pFrame);
if (ret != 0)
{
continue;
}
ret = queue_picture(is, &pFrame);
if (ret < 0)
{
goto __ERROR;
}
}
__ERROR:
if (pkt.data)
{
av_packet_unref(&pkt);
}
return ret;
}
/*
 * Open the decoder for stream `stream_index` and start its consumer.
 *
 * Audio: creates the resampler (input format -> out_format / out_channel /
 * out_sample_rate), opens the SDL audio device with audio_callback as the
 * source, initialises is->audioq and unpauses playback.
 * Video: creates the pixel converter, initialises is->videoq and starts
 * video_thread.
 *
 * Every context is stored in `is` before the consumer is started, so the
 * consumer never sees a half-initialised state. On failure everything
 * created here is released again.
 *
 * Returns 0 on success, -1 on failure.
 */
int stream_component_open(VideoState *is, int stream_index)
{
    AVFormatContext *pFormatCtx = is->pFormatCtx;
    AVCodecParameters *codec_par = NULL;
    AVCodecContext *codecCtx = NULL;
    AVCodec *codec = NULL;
    struct SwrContext *audio_convert_ctx = NULL;
    struct SwsContext *sws_ctx = NULL;
    SDL_AudioSpec wanted_spec;

    if (stream_index < 0 || (unsigned int)stream_index >= pFormatCtx->nb_streams)
    {
        return -1;
    }

    codec_par = pFormatCtx->streams[stream_index]->codecpar;
    if (stream_index == is->audioStream)
    {
        out_nb_samples = codec_par->frame_size;
        out_sample_rate = codec_par->sample_rate;
    }

    /* Check the decoder before anything is allocated for it. */
    codec = avcodec_find_decoder(codec_par->codec_id);
    if (!codec)
    {
        fprintf(stderr, "Unsupported codec!\n");
        return -1;
    }
    codecCtx = avcodec_alloc_context3(codec);
    if (!codecCtx)
    {
        fprintf(stderr, "Could not allocate codec context\n");
        return -1;
    }
    if (avcodec_parameters_to_context(codecCtx, codec_par) < 0)
    {
        fprintf(stderr, "Could not copy codec parameters\n");
        goto fail;
    }
    if (avcodec_open2(codecCtx, codec, NULL) < 0)
    {
        fprintf(stderr, "Unsupported codec!\n");
        goto fail;
    }

    switch (codecCtx->codec_type)
    {
    case AVMEDIA_TYPE_AUDIO:
    {
        int64_t out_channel_layout = av_get_default_channel_layout(out_channel);
        int64_t in_channel_layout = av_get_default_channel_layout(codecCtx->channels);

        /* Use the returned pointer: it is NULL when the options are rejected. */
        audio_convert_ctx = swr_alloc_set_opts(NULL,
                                               out_channel_layout,
                                               out_format,
                                               out_sample_rate,
                                               in_channel_layout,
                                               codecCtx->sample_fmt,
                                               codecCtx->sample_rate,
                                               0,
                                               NULL);
        if (!audio_convert_ctx)
        {
            printf("Failed to swr_alloc\n");
            goto fail;
        }
        fprintf(stderr, "swr opts: out_channel_layout:%lld, out_sample_fmt:%d, out_sample_rate:%d, in_channel_layout:%lld, in_sample_fmt:%d, in_sample_rate:%d\n",
                (long long)out_channel_layout,
                out_format,
                out_sample_rate,
                (long long)in_channel_layout,
                codecCtx->sample_fmt,
                codecCtx->sample_rate);
        if (swr_init(audio_convert_ctx) < 0)
        {
            fprintf(stderr, "Failed to swr_init\n");
            goto fail;
        }

        // Set audio settings from codec info
        SDL_memset(&wanted_spec, 0, sizeof(wanted_spec));
        wanted_spec.freq = codecCtx->sample_rate;
        wanted_spec.format = AUDIO_S16SYS;
        wanted_spec.channels = out_channel;
        wanted_spec.silence = 0;
        wanted_spec.samples = out_nb_samples;
        wanted_spec.callback = audio_callback;
        wanted_spec.userdata = is;
        /*
         * Passing NULL for the obtained spec makes SDL deliver exactly the
         * requested format to the callback (converting internally if the
         * device differs); this code never adapts to a changed spec.
         */
        if (SDL_OpenAudio(&wanted_spec, NULL) < 0)
        {
            fprintf(stderr, "SDL_OpenAudio: %s\n", SDL_GetError());
            goto fail;
        }

        is->audio_st = pFormatCtx->streams[stream_index];
        is->audio_ctx = codecCtx;
        is->audio_swr_ctx = audio_convert_ctx;
        is->audio_buf_size = 0;
        is->audio_buf_index = 0;
        packet_queue_init(&is->audioq);
        /* Start the callback only after everything it uses is in place. */
        SDL_PauseAudio(0);
        break;
    }
    case AVMEDIA_TYPE_VIDEO:
        sws_ctx = sws_getContext(codecCtx->width,
                                 codecCtx->height,
                                 codecCtx->pix_fmt,
                                 codecCtx->width,
                                 codecCtx->height,
                                 out_pix_foramt,
                                 SWS_BILINEAR,
                                 NULL, NULL, NULL);
        if (!sws_ctx)
        {
            fprintf(stderr, "Could not create the scaling context\n");
            goto fail;
        }

        is->video_st = pFormatCtx->streams[stream_index];
        is->video_ctx = codecCtx;
        is->sws_ctx = sws_ctx;
        packet_queue_init(&is->videoq);
        /* Start the thread only after everything it uses is in place. */
        is->video_tid = SDL_CreateThread(video_thread, "video_thread", is);
        if (!is->video_tid)
        {
            /* The contexts stay stored in `is`; its owner releases them. */
            fprintf(stderr, "SDL_CreateThread: %s\n", SDL_GetError());
            return -1;
        }
        break;
    default:
        /* Neither audio nor video: nothing will ever use this context. */
        avcodec_free_context(&codecCtx);
        break;
    }
    return 0;

fail:
    swr_free(&audio_convert_ctx);
    avcodec_free_context(&codecCtx);
    return -1;
}
int decode_thread(void *arg)
{
VideoState *is = arg;
AVPacket packet;
av_init_packet(&packet);
packet.data = NULL;
packet.size = 0;
if (is->audioStream >= 0)
{
stream_component_open(is, is->audioStream);
}
if (is->videoStream >= 0)
{
stream_component_open(is, is->videoStream);
}
fprintf(stderr, "video context: width=%d, height=%d\n", is->video_ctx->width, is->video_ctx->height);
// main decode loop
for (;;)
{
if (is->quit)
{
SDL_CondSignal(is->videoq.cond);
SDL_CondSignal(is->audioq.cond);
break;
}
// seek stuff goes here
if (is->audioq.size > MAX_AUDIOQ_SIZE ||
is->videoq.size > MAX_VIDEOQ_SIZE)
{
SDL_Delay(10);
continue;
}
int ret = av_read_frame(is->pFormatCtx, &packet);
fprintf(stderr, "av_read_frame, ret :%s\n", av_err2str(ret));
if (ret < 0)
{
break;
}
// Is this a packet from the video stream?
if (packet.stream_index == is->videoStream)
{
packet_queue_put(&is->videoq, &packet);
++(is->videoq.total);
fprintf(stderr, "put video queue, size :%d\n", is->videoq.total);
}
else if (packet.stream_index == is->audioStream)
{
packet_queue_put(&is->audioq, &packet);
++(is->audioq.total);
fprintf(stderr, "put audio queue, size :%d\n", is->audioq.total);
}
av_packet_unref(&packet);
}
is->audioq.end = 1;
is->videoq.end = 1;
/* all done - wait for it */
while (!is->quit)
{
SDL_Delay(100);
}
fail:
if (1)
{
SDL_Event event;
event.type = FF_QUIT_EVENT;
event.user.data1 = is;
SDL_PushEvent(&event);
}
return 0;
}
/*
 * Open is->filename, read its stream information and select the best video
 * and audio streams. Also registers `is` as global_video_state.
 *
 * Returns 0 when the file was opened and both stream kinds were found,
 * -1 otherwise. The opened input, if any, is left in is->pFormatCtx.
 */
int init_VideoState(VideoState *is)
{
    AVFormatContext *fmt = NULL;

    is->videoStream = -1;
    is->audioStream = -1;
    global_video_state = is;

    /* Open the input; nothing is stored when this fails. */
    if (avformat_open_input(&fmt, is->filename, NULL, NULL) != 0)
        return -1;
    is->pFormatCtx = fmt;

    /* Read enough of the file to know its streams. */
    if (avformat_find_stream_info(fmt, NULL) < 0)
        return -1;

    /* Dump information about the file onto standard error. */
    av_dump_format(fmt, 0, is->filename, 0);

    /* Let libavformat pick the stream of each kind. */
    is->videoStream = av_find_best_stream(fmt, AVMEDIA_TYPE_VIDEO, -1, -1, NULL, -1);
    is->audioStream = av_find_best_stream(fmt, AVMEDIA_TYPE_AUDIO, -1, -1, NULL, -1);
    if (is->videoStream >= 0 && is->audioStream >= 0)
        return 0;

    av_log(NULL, AV_LOG_ERROR, "%s: could not open codecs\n", is->filename);
    return -1;
}
/*
 * Program entry: play the media file named by argv[1].
 *
 * Initialises SDL, opens the file, creates the window, renderer and texture
 * sized to the video stream, starts the demux thread and then runs the event
 * loop until a quit event arrives. Returns 0 after a normal quit, a negative
 * value when set-up fails.
 */
int main(int argc, char *argv[])
{
    int ret = -1;
    SDL_Event event;
    VideoState *is;
    AVCodecParameters *video_paramters;

    if (argc < 2)
    {
        fprintf(stderr, "Usage: test <file>\n");
        exit(1);
    }
    av_log_set_level(AV_LOG_INFO);

    //big struct, it's core
    is = av_mallocz(sizeof(VideoState));
    if (!is)
    {
        fprintf(stderr, "Could not allocate the player state\n");
        exit(1);
    }

    if (SDL_Init(SDL_INIT_VIDEO | SDL_INIT_AUDIO | SDL_INIT_TIMER))
    {
        fprintf(stderr, "Could not initialize SDL - %s\n", SDL_GetError());
        exit(1);
    }

    /* Bounded, always terminated copy; never reads past the end of argv[1]. */
    snprintf(is->filename, sizeof(is->filename), "%s", argv[1]);
    is->pictq_mutex = SDL_CreateMutex();
    is->pictq_cond = SDL_CreateCond();

    ret = init_VideoState(is);
    if (ret < 0)
    {
        goto cleanup;
    }

    video_paramters = is->pFormatCtx->streams[is->videoStream]->codecpar;
    win = SDL_CreateWindow("Media Player",
                           SDL_WINDOWPOS_UNDEFINED,
                           SDL_WINDOWPOS_UNDEFINED,
                           video_paramters->width,
                           video_paramters->height,
                           SDL_WINDOW_OPENGL | SDL_WINDOW_RESIZABLE);
    renderer = win ? SDL_CreateRenderer(win, -1, 0) : NULL;
    texture = renderer ? SDL_CreateTexture(renderer,
                                           SDL_PIXELFORMAT_IYUV,
                                           SDL_TEXTUREACCESS_STREAMING,
                                           video_paramters->width,
                                           video_paramters->height)
                       : NULL;
    if (!texture)
    {
        fprintf(stderr, "Could not create window/renderer/texture - %s\n", SDL_GetError());
        ret = -1;
        goto cleanup;
    }

    //set timer
    schedule_refresh(is, 40);

    is->parse_tid = SDL_CreateThread(decode_thread, "decode_thread", is);
    if (!is->parse_tid)
    {
        /* `is` must stay valid: the clean-up below still reads it. */
        fprintf(stderr, "SDL_CreateThread: %s\n", SDL_GetError());
        ret = -1;
        goto cleanup;
    }

    for (;;)
    {
        SDL_WaitEvent(&event);
        switch (event.type)
        {
        case FF_QUIT_EVENT:
        case SDL_QUIT:
            fprintf(stderr, "receive a QUIT event: %d\n", event.type);
            is->quit = 1;
            /* Wake every thread that may be waiting so it sees the flag. */
            SDL_CondSignal(is->audioq.cond);
            SDL_CondSignal(is->videoq.cond);
            SDL_CondSignal(is->pictq_cond);
            ret = 0;
            goto cleanup;
        case FF_REFRESH_EVENT:
            video_refresh_timer(event.user.data1);
            break;
        default:
            break;
        }
    }

cleanup:
    SDL_Delay(20);
    SDL_Quit();

    /*
     * NOTE(review): the worker threads are not joined here, only given the
     * short delay above; `is` itself is deliberately not freed because a
     * thread may still read is->quit.
     */
    swr_free(&is->audio_swr_ctx);
    sws_freeContext(is->sws_ctx);
    is->sws_ctx = NULL;
    avcodec_free_context(&is->audio_ctx);
    avcodec_free_context(&is->video_ctx);
    /* Closes the input, frees the context and resets the pointer. */
    avformat_close_input(&is->pFormatCtx);
    return ret;
}