最新（2.4.4）FFmpeg音频播放 ----- 关键点swr_convert

最新推荐文章于 2024-04-18 15:24:35 发布

奚华

最新推荐文章于 2024-04-18 15:24:35 发布

阅读量1.2w

点赞数 1

分类专栏： ffmpeg 文章标签： ffmpeg audio codec

本文链接：https://blog.csdn.net/a907763895/article/details/42016039

版权

ffmpeg 专栏收录该内容

1 篇文章 0 订阅

订阅专栏

ffmpeg 版本：2014-12-02 通过 git clone 获取，版本接近 2.4.4，介于 2.4.4 和 2.5.1 之间

SDL版本：SDL 1.2（Centos 6.5软件库的相应版本）

有些旧的 ffmpeg 音频播放示例会出现部分音频可以播放、部分音频不能播放的情况。其中一个需要考虑的原因和注意点，是 avcodec_decode_audio4 等类似函数解码得到的 AVFrame 的格式是否正是我们（SDL）所需要的。本例代码用来解决该问题，关键点在于 swr_convert 函数，代码及注释如下：

#include <libavcodec/avcodec.h>
#include <libavformat/avformat.h>
#include <libswscale/swscale.h>
#include <libswresample/swresample.h>
#include <libavutil/avstring.h>
#include <libavutil/pixfmt.h>
#include <libavutil/log.h>
#include <SDL/SDL.h>
#include <SDL/SDL_thread.h>
#include <stdio.h>
#include <math.h>

/* Value requested for SDL_AudioSpec.samples when the audio device is opened. */
#define SDL_AUDIO_BUFFER_SIZE 1024 
/* The demux loop pauses reading while the audio queue holds more bytes than this. */
#define MAX_AUDIOQ_SIZE (1 * 1024 * 1024)
/* Custom SDL event codes; of these, only FF_QUIT_EVENT is referenced in this file. */
#define FF_ALLOC_EVENT   (SDL_USEREVENT)
#define FF_REFRESH_EVENT (SDL_USEREVENT + 1)
#define FF_QUIT_EVENT (SDL_USEREVENT + 2)

// This constant existed in older FFmpeg releases; it is copied here for local use.
#define AVCODEC_MAX_AUDIO_FRAME_SIZE 192000 // 1 second of 48khz 32bit audio

/**
 * Singly linked FIFO of demuxed packets.
 *
 * packet_queue_put() appends at the tail and packet_queue_get() removes from
 * the head; both hold `mutex` while they touch the list and its counters.
 */
typedef struct PacketQueue {
	AVPacketList *first_pkt; /* head node: the next one packet_queue_get() hands out */
	AVPacketList *last_pkt;  /* tail node: packet_queue_put() links new nodes after it */
	int nb_packets;          /* number of nodes currently linked */
	int size;                /* running sum of pkt.size over the linked nodes */
	SDL_mutex *mutex;        /* taken by put/get around every list update */
	SDL_cond *cond;          /* signalled by put after each append; get waits on it */
} PacketQueue;

/**
 * All state of the player, shared by main(), the demux thread and the SDL
 * audio callback. main() allocates it zero-filled with av_mallocz().
 */
typedef struct VideoState {
	/* Input path, copied from argv[1] and passed to avformat_open_input(). */
	char filename[1024];
	/* Demuxer context; assigned by decode_thread() once the input is open. */
	AVFormatContext *ic;
	/* audioStream: index of the opened audio stream, -1 until one is opened.
	 * videoStream is not referenced anywhere else in this file. */
	int videoStream, audioStream;
	/* The stream selected by stream_component_open(). */
	AVStream *audio_st;
	/* Decode target, allocated on first use and reused for every frame. */
	AVFrame *audio_frame;
	/* Packets waiting to be decoded by the audio callback. */
	PacketQueue audioq;
	/* Number of playable bytes currently available at audio_buf. */
	unsigned int audio_buf_size;
	/* Number of those bytes already copied into SDL's stream buffer. */
	unsigned int audio_buf_index;
	/* Packet currently being decoded, plus a cursor (data/size) tracking the
	 * part of its payload that the decoder has not consumed yet. */
	AVPacket audio_pkt;
	uint8_t *audio_pkt_data;
	int audio_pkt_size;
	/* Current playback buffer: audio_buf2 after resampling, otherwise the
	 * decoded frame's data[0]. */
	uint8_t *audio_buf;
	/* Not referenced anywhere else in this file. */
	uint8_t *audio_buf1;
	/* Output buffer handed to swr_convert(). */
	DECLARE_ALIGNED(16,uint8_t,audio_buf2) [AVCODEC_MAX_AUDIO_FRAME_SIZE * 4];
	/* audio_src_*: parameters the current resampler was configured for (they
	 * start out equal to the target so matching input needs no resampler).
	 * audio_tgt_*: the format obtained from SDL that playback must match. */
	enum AVSampleFormat audio_src_fmt;
	enum AVSampleFormat audio_tgt_fmt;
	int audio_src_channels;
	int audio_tgt_channels;
	int64_t audio_src_channel_layout;
	int64_t audio_tgt_channel_layout;
	int audio_src_freq;
	int audio_tgt_freq;
	/* Resampler; NULL while decoded frames can be played without conversion. */
	struct SwrContext *swr_ctx;
	/* Handle of the thread running decode_thread(). */
	SDL_Thread *parse_tid;
	/* Set to 1 by main() on a quit event; polled by the other threads. */
	int quit;
} VideoState;

/* Assigned by decode_thread(); packet_queue_get() reads its quit flag. */
VideoState *global_video_state;

/**
 * Reset a queue to the empty state and create its synchronisation objects.
 *
 * @param q queue to initialise; any previous contents are overwritten
 */
void packet_queue_init(PacketQueue *q)
{
	/* Zero everything first so the list pointers and counters start empty. */
	memset(q, 0, sizeof *q);

	q->mutex = SDL_CreateMutex();
	q->cond = SDL_CreateCond();
}

/**
 * Append a packet to the tail of the queue and wake one waiting consumer.
 *
 * The queue keeps a shallow copy of *pkt, so the payload must stay valid
 * after the demuxer reads its next packet. av_dup_packet() guarantees that:
 * it gives the packet its own copy of the data when the demuxer handed out a
 * buffer that is only valid until the next av_read_frame() call.
 *
 * @param q   queue previously set up by packet_queue_init()
 * @param pkt packet to enqueue; on success the queue owns its payload
 * @return 0 on success, -1 if the payload could not be duplicated or the
 *         list node could not be allocated (the caller still owns pkt then)
 */
int packet_queue_put(PacketQueue *q, AVPacket *pkt) {
	AVPacketList *node;

	if (av_dup_packet(pkt) < 0) {
		return -1;
	}

	node = av_malloc(sizeof(*node));
	if (!node) {
		return -1;
	}
	node->pkt = *pkt;
	node->next = NULL;

	SDL_LockMutex(q->mutex);

	/* An empty queue has no tail, so the new node becomes the head too. */
	if (!q->last_pkt) {
		q->first_pkt = node;
	} else {
		q->last_pkt->next = node;
	}

	q->last_pkt = node;
	q->nb_packets++;
	q->size += node->pkt.size;
	SDL_CondSignal(q->cond);
	SDL_UnlockMutex(q->mutex);
	return 0;
}

/**
 * Remove the packet at the head of the queue.
 *
 * @param q     queue to read from
 * @param pkt   receives a copy of the dequeued packet
 * @param block non-zero: wait on the queue's condition variable until a
 *              packet arrives; zero: return immediately when empty
 * @return 1 if a packet was stored in *pkt, 0 if the queue was empty and
 *         block was zero, -1 if global_video_state->quit was set
 */
static int packet_queue_get(PacketQueue *q, AVPacket *pkt, int block)
{
	AVPacketList *head;
	int status = -1; /* result when the loop ends because quit was set */

	SDL_LockMutex(q->mutex);

	while (!global_video_state->quit) {
		head = q->first_pkt;

		if (head != NULL) {
			/* Unlink the head; the tail is cleared once the list empties. */
			q->first_pkt = head->next;
			if (q->first_pkt == NULL) {
				q->last_pkt = NULL;
			}
			q->nb_packets -= 1;
			q->size -= head->pkt.size;

			*pkt = head->pkt;
			av_free(head);

			status = 1;
			break;
		}

		if (!block) {
			status = 0;
			break;
		}

		/* Releases the mutex while waiting and re-acquires it on wake-up. */
		SDL_CondWait(q->cond, q->mutex);
	}

	SDL_UnlockMutex(q->mutex);

	return status;
}

/**
 * Decode the next audio frame and leave playable samples in is->audio_buf.
 *
 * Packets are pulled (blocking) from is->audioq. One packet may contain
 * several frames, so the undecoded remainder is tracked in
 * is->audio_pkt_data / is->audio_pkt_size and the decoder is always fed from
 * that cursor. If the decoded frame does not match the format negotiated with
 * SDL (is->audio_tgt_*), it is converted with swr_convert() into
 * is->audio_buf2; otherwise the frame's own buffer is used directly.
 *
 * @param is player state
 * @return number of bytes available at is->audio_buf (may be 0), or a
 *         negative value on allocation failure or when the player is quitting
 */
int audio_decode_frame(VideoState *is) {
	AVPacket *pkt = &is->audio_pkt;

	for (;;) {
		while (is->audio_pkt_size > 0) {
			AVPacket pkt_temp;
			AVFrame *frame;
			int64_t dec_channel_layout;
			int len1, got_frame = 0;
			int resampled_data_size;

			if (!is->audio_frame) {
				if (!(is->audio_frame = av_frame_alloc())) {
					return AVERROR(ENOMEM);
				}
			} else {
				av_frame_unref(is->audio_frame);
			}
			frame = is->audio_frame;

			/*
			 * Feed the decoder only the part of the packet it has not seen
			 * yet. A shallow copy is used so that *pkt keeps its original
			 * data pointer for av_free_packet() below.
			 */
			pkt_temp = *pkt;
			pkt_temp.data = is->audio_pkt_data;
			pkt_temp.size = is->audio_pkt_size;

			len1 = avcodec_decode_audio4(is->audio_st->codec, frame,
					&got_frame, &pkt_temp);
			if (len1 < 0) {
				/* error, skip the rest of this packet */
				is->audio_pkt_size = 0;
				break;
			}

			is->audio_pkt_data += len1;
			is->audio_pkt_size -= len1;

			if (!got_frame) {
				if (len1 == 0) {
					/* No progress at all: drop the packet instead of spinning. */
					is->audio_pkt_size = 0;
					break;
				}
				continue;
			}
			/* From here on a complete frame is available. */

			/* Channel layout of the frame, e.g. stereo; fall back to the
			 * default layout when the reported one does not match the
			 * channel count. */
			dec_channel_layout =
					(frame->channel_layout
							&& frame->channels
									== av_get_channel_layout_nb_channels(
											frame->channel_layout)) ?
							frame->channel_layout :
							av_get_default_channel_layout(frame->channels);

			/*
			 * (Re)build the resampler whenever the frame's sample format,
			 * channel layout or sample rate differs from what the current
			 * setup expects. The expected values start out equal to the SDL
			 * target, so input that already matches never needs a resampler.
			 */
			if (frame->format != is->audio_src_fmt
					|| dec_channel_layout != is->audio_src_channel_layout
					|| frame->sample_rate != is->audio_src_freq) {
				if (is->swr_ctx) {
					swr_free(&is->swr_ctx);
				}
				is->swr_ctx = swr_alloc_set_opts(NULL,
						is->audio_tgt_channel_layout, is->audio_tgt_fmt,
						is->audio_tgt_freq, dec_channel_layout,
						frame->format, frame->sample_rate,
						0, NULL);
				if (!is->swr_ctx || swr_init(is->swr_ctx) < 0) {
					fprintf(stderr, "swr_init() failed\n");
					/*
					 * Keep "no resampler" and "source == target" in step so
					 * a later frame is never played through unconverted or
					 * pushed through a half-initialised context.
					 */
					if (is->swr_ctx) {
						swr_free(&is->swr_ctx);
					}
					is->audio_src_fmt = is->audio_tgt_fmt;
					is->audio_src_freq = is->audio_tgt_freq;
					is->audio_src_channels = is->audio_tgt_channels;
					is->audio_src_channel_layout =
							is->audio_tgt_channel_layout;
					break;
				}
				/* Remember the parameters of the frame that was compared, so
				 * the next identical frame reuses this resampler. */
				is->audio_src_channel_layout = dec_channel_layout;
				is->audio_src_channels = frame->channels;
				is->audio_src_freq = frame->sample_rate;
				is->audio_src_fmt = frame->format;
			}

			if (is->swr_ctx) {
				/*
				 * Convert the frame to the format SDL was opened with. Older
				 * samples that skip this step only play files whose audio
				 * already happens to be AV_SAMPLE_FMT_S16.
				 * swr_convert() returns the number of samples per channel.
				 */
				const uint8_t **in = (const uint8_t **) frame->extended_data;
				uint8_t *out[] = { is->audio_buf2 };
				int bytes_per_sample = av_get_bytes_per_sample(
						is->audio_tgt_fmt);
				int out_capacity = sizeof(is->audio_buf2)
						/ is->audio_tgt_channels / bytes_per_sample;
				int len2 = swr_convert(is->swr_ctx, out, out_capacity, in,
						frame->nb_samples);

				if (len2 < 0) {
					fprintf(stderr, "swr_convert() failed\n");
					break;
				}
				if (len2 == out_capacity) {
					fprintf(stderr,
							"warning: audio buffer is probably too small\n");
					swr_init(is->swr_ctx);
				}
				is->audio_buf = is->audio_buf2;

				/* samples per channel x channels x bytes per sample */
				resampled_data_size = len2 * is->audio_tgt_channels
						* bytes_per_sample;
			} else {
				/* Frame already matches the SDL format: play it in place. */
				resampled_data_size = av_samples_get_buffer_size(NULL,
						frame->channels, frame->nb_samples, frame->format, 1);
				is->audio_buf = frame->data[0];
			}
			// We have data, return it and come back for more later
			return resampled_data_size;
		}

		/* Current packet is exhausted: release it and fetch the next one. */
		if (pkt->data)
			av_free_packet(pkt);
		memset(pkt, 0, sizeof(*pkt));
		if (is->quit)
			return -1;
		if (packet_queue_get(&is->audioq, pkt, 1) < 0)
			return -1;

		is->audio_pkt_data = pkt->data;
		is->audio_pkt_size = pkt->size;
	}
}

/**
 * SDL audio callback: fill `stream` with exactly `len` bytes of audio.
 *
 * Bytes are served from is->audio_buf; whenever that buffer is used up a new
 * frame is decoded with audio_decode_frame(). If decoding fails, a short
 * block of silence is played instead.
 *
 * @param userdata the VideoState registered in SDL_AudioSpec.userdata
 * @param stream   destination buffer owned by SDL
 * @param len      number of bytes SDL wants
 */
void audio_callback(void *userdata, Uint8 *stream, int len) {
	enum { SILENCE_BYTES = 1024 };
	VideoState *is = (VideoState *) userdata;

	while (len > 0) {
		int chunk;

		if (is->audio_buf_index >= is->audio_buf_size) {
			int audio_data_size = audio_decode_frame(is);

			if (audio_data_size < 0) {
				/*
				 * Silence. Point audio_buf at the player's own scratch
				 * buffer first: after a failed decode audio_buf may still be
				 * NULL or refer to frame data shorter than SILENCE_BYTES.
				 */
				is->audio_buf = is->audio_buf2;
				is->audio_buf_size = SILENCE_BYTES;
				memset(is->audio_buf, 0, is->audio_buf_size);
			} else {
				is->audio_buf_size = audio_data_size;
			}
			is->audio_buf_index = 0;
		}

		/* Copy as much as is buffered, but never more than SDL asked for. */
		chunk = is->audio_buf_size - is->audio_buf_index;
		if (chunk > len) {
			chunk = len;
		}

		memcpy(stream, (uint8_t *) is->audio_buf + is->audio_buf_index, chunk);
		len -= chunk;
		stream += chunk;
		is->audio_buf_index += chunk;
	}
}

/**
 * Open the SDL audio device and the decoder for one audio stream.
 *
 * The device is requested with the stream's sample rate and channel count in
 * signed 16-bit native-endian format; if SDL rejects the channel count,
 * smaller fallbacks are tried. The format actually obtained is stored in
 * is->audio_tgt_* (and mirrored into is->audio_src_*), the packet queue is
 * initialised and playback is started.
 *
 * @param is           player state; is->ic must be an opened format context
 * @param stream_index index into is->ic->streams
 * @return 0 on success, -1 on failure (the audio device is closed again if it
 *         had already been opened)
 */
int stream_component_open(VideoState *is, int stream_index) {
	AVFormatContext *ic = is->ic;
	AVCodecContext *codecCtx;
	AVCodec *codec;
	SDL_AudioSpec wanted_spec, spec;
	int64_t wanted_channel_layout;
	/* Fallback channel counts, indexed by the count that just failed. */
	const int next_nb_channels[] = { 0, 0, 1, 6, 2, 6, 4, 6 };

	if (stream_index < 0 || (unsigned int) stream_index >= ic->nb_streams) {
		return -1;
	}

	codecCtx = ic->streams[stream_index]->codec;
	if (codecCtx->codec_type != AVMEDIA_TYPE_AUDIO) {
		/* Refuse before any device or decoder has been opened. */
		return -1;
	}

	wanted_channel_layout = av_get_default_channel_layout(codecCtx->channels);
	wanted_channel_layout &= ~AV_CH_LAYOUT_STEREO_DOWNMIX;

	wanted_spec.channels = av_get_channel_layout_nb_channels(
			wanted_channel_layout);
	wanted_spec.freq = codecCtx->sample_rate;
	if (wanted_spec.freq <= 0 || wanted_spec.channels <= 0) {
		fprintf(stderr, "Invalid sample rate or channel count!\n");
		return -1;
	}
	wanted_spec.format = AUDIO_S16SYS;
	wanted_spec.silence = 0;
	wanted_spec.samples = SDL_AUDIO_BUFFER_SIZE;
	wanted_spec.callback = audio_callback;
	wanted_spec.userdata = is;

	while (SDL_OpenAudio(&wanted_spec, &spec) < 0) {
		fprintf(stderr, "SDL_OpenAudio (%d channels): %s\n",
				wanted_spec.channels, SDL_GetError());
		wanted_spec.channels = next_nb_channels[FFMIN(7, wanted_spec.channels)];
		if (!wanted_spec.channels) {
			fprintf(stderr,
					"No more channel combinations to try, audio open failed\n");
			return -1;
		}
		wanted_channel_layout = av_get_default_channel_layout(
				wanted_spec.channels);
	}

	/* From here on the device is open and must be closed on failure. */
	if (spec.format != AUDIO_S16SYS) {
		fprintf(stderr, "SDL advised audio format %d is not supported!\n",
				spec.format);
		SDL_CloseAudio();
		return -1;
	}
	if (spec.channels != wanted_spec.channels) {
		wanted_channel_layout = av_get_default_channel_layout(spec.channels);
		if (!wanted_channel_layout) {
			fprintf(stderr, "SDL advised channel count %d is not supported!\n",
					spec.channels);
			SDL_CloseAudio();
			return -1;
		}
	}

	fprintf(stderr, "%d: wanted_spec.format = %d\n", __LINE__,
			wanted_spec.format);
	fprintf(stderr, "%d: wanted_spec.samples = %d\n", __LINE__,
			wanted_spec.samples);
	fprintf(stderr, "%d: wanted_spec.channels = %d\n", __LINE__,
			wanted_spec.channels);
	fprintf(stderr, "%d: wanted_spec.freq = %d\n", __LINE__, wanted_spec.freq);

	fprintf(stderr, "%d: spec.format = %d\n", __LINE__, spec.format);
	fprintf(stderr, "%d: spec.samples = %d\n", __LINE__, spec.samples);
	fprintf(stderr, "%d: spec.channels = %d\n", __LINE__, spec.channels);
	fprintf(stderr, "%d: spec.freq = %d\n", __LINE__, spec.freq);

	/*
	 * Target = what SDL will play. The "source" side starts out identical,
	 * so audio_decode_frame() only builds a resampler for frames that differ.
	 */
	is->audio_src_fmt = is->audio_tgt_fmt = AV_SAMPLE_FMT_S16;
	is->audio_src_freq = is->audio_tgt_freq = spec.freq;
	is->audio_src_channel_layout = is->audio_tgt_channel_layout =
			wanted_channel_layout;
	is->audio_src_channels = is->audio_tgt_channels = spec.channels;

	codec = avcodec_find_decoder(codecCtx->codec_id);
	if (!codec || (avcodec_open2(codecCtx, codec, NULL) < 0)) {
		fprintf(stderr, "Unsupported codec!\n");
		SDL_CloseAudio();
		return -1;
	}
	ic->streams[stream_index]->discard = AVDISCARD_DEFAULT;

	is->audioStream = stream_index;
	is->audio_st = ic->streams[stream_index];
	is->audio_buf_size = 0;
	is->audio_buf_index = 0;
	memset(&is->audio_pkt, 0, sizeof(is->audio_pkt));
	packet_queue_init(&is->audioq);
	/* Un-pause the device: SDL starts invoking audio_callback(). */
	SDL_PauseAudio(0);

	return 0;
}

/**
 * Demux thread: open the input, start audio playback and feed the audio
 * packet queue until end of file, an I/O error, or a quit request.
 *
 * Whenever the thread finishes - including when the input cannot be opened
 * or probed - it posts FF_QUIT_EVENT so that the event loop in main() is
 * notified.
 *
 * @param arg the VideoState shared with main()
 * @return -1 if the input could not be opened or probed, 0 otherwise
 */
static int decode_thread(void *arg) {
	VideoState *is = (VideoState *) arg;
	AVFormatContext *ic = NULL;
	AVPacket pkt1, *packet = &pkt1;
	int ret, audio_index = -1;
	int status = 0;
	unsigned int i;

	is->audioStream = -1;
	global_video_state = is;
	if (avformat_open_input(&ic, is->filename, NULL, NULL) != 0) {
		fprintf(stderr, "%s: could not open input\n", is->filename);
		status = -1;
		goto fail;
	}
	is->ic = ic;
	if (avformat_find_stream_info(ic, NULL) < 0) {
		fprintf(stderr, "%s: could not find stream information\n",
				is->filename);
		status = -1;
		goto fail;
	}
	av_dump_format(ic, 0, is->filename, 0);

	/* Pick the first audio stream. */
	for (i = 0; i < ic->nb_streams; i++) {
		if (ic->streams[i]->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
			audio_index = (int) i;
			break;
		}
	}
	if (audio_index >= 0) {
		stream_component_open(is, audio_index);
	}
	/* audioStream is only set when stream_component_open() succeeded. */
	if (is->audioStream < 0) {
		fprintf(stderr, "%s: could not open codecs\n", is->filename);
		goto fail;
	}

	// main decode loop
	for (;;) {
		if (is->quit)
			break;
		/* Back off while the consumer still has plenty of data queued. */
		if (is->audioq.size > MAX_AUDIOQ_SIZE) {
			SDL_Delay(10);
			continue;
		}
		ret = av_read_frame(is->ic, packet);
		if (ret < 0) {
			if (ret == AVERROR_EOF
					|| (is->ic->pb && url_feof(is->ic->pb))) {
				break;
			}
			if (is->ic->pb && is->ic->pb->error) {
				break;
			}
			continue;
		}

		if (packet->stream_index == is->audioStream) {
			if (packet_queue_put(&is->audioq, packet) < 0) {
				/* The queue did not take ownership: release the packet. */
				av_free_packet(packet);
			}
		} else {
			av_free_packet(packet);
		}
	}

	/* Keep the thread alive so queued audio can finish playing. */
	while (!is->quit) {
		SDL_Delay(100);
	}

	fail: {
		SDL_Event event;
		event.type = FF_QUIT_EVENT;
		event.user.data1 = is;
		SDL_PushEvent(&event);
	}

	return status;
}

int main(int argc, char *argv[]) {
	SDL_Event event;
	VideoState *is;

	is = (VideoState *) av_mallocz(sizeof(VideoState));

	if (argc < 2) {
		fprintf(stderr, "Usage: test <file>\n");
		exit(1);
	}

	av_register_all();

	if (SDL_Init(SDL_INIT_AUDIO)) {
		fprintf(stderr, "Could not initialize SDL - %s\n", SDL_GetError());
		exit(1);
	}

	av_strlcpy(is->filename, argv[1], sizeof(is->filename));

	is->parse_tid = SDL_CreateThread(decode_thread, is);
	if (!is->parse_tid) {
		av_free(is);
		return -1;
	}

	for (;;) {
		SDL_WaitEvent(&event);
		switch (event.type) {
		case FF_QUIT_EVENT:
		case SDL_QUIT:
			is->quit = 1;
			SDL_Quit();
			exit(0);
			break;
		default:
			break;
		}
	}
	return 0;
}

FFmpeg版本逐渐更新，代码功能更加丰富和易于使用，掌握音视频基础概念结合ffmpeg就可以方便使用！

奚华

关注

1
点赞
踩
11

收藏

觉得还不错? 一键收藏
0
评论
最新（2.44）FFmpeg音频播放 ----- 关键点swr_convert

关于音频转换 swr_convert：有些旧的 ffmpeg 音频播放示例会出现部分音频可以播放、部分音频不能播放的情况，其中一个需要考虑的原因和注意点，是 avcodec_decode_audio4 等类似函数解码得到的 AVFrame 的格式是否正是我们(SDL)
复制链接

扫一扫