FFMPEG学习----分离视音频里的PCM数据

/**

*  参考于：http://blog.csdn.net/leixiaohua1020/article/details/46890259

*/

#include <stdio.h>

#include <string.h>

extern "C"

{

#include "libavcodec/avcodec.h"

#include "libavformat/avformat.h"

#include "libswresample/swresample.h"

};

#pragma comment(lib, "avcodec.lib")

#pragma comment(lib, "avformat.lib")

#pragma comment(lib, "swresample.lib")

#pragma comment(lib, "avutil.lib")

// Output buffer size in bytes: 1 second of 48 kHz audio at 4 bytes per sample frame (e.g. 16-bit stereo)

#define MAX_AUDIO_FRAME_SIZE 192000

int main(int argc, char* argv[])

{

	AVFormatContext		*pFormatCtx = NULL;

	AVCodecContext		*pCodecCtx = NULL;

	AVCodec				*pCodec = NULL;

	AVPacket			packet;

	AVFrame				*pAudioFrame = NULL;

	uint8_t				*buffer = NULL;

	struct SwrContext	*audio_convert_ctx = NULL;

	int					got_picture;

	int					audioIndex;

	char filepath[1024] = "";

	printf("Usage: program.exe *.mp3\n");

	if (argc == 2)

	{

		strcpy(filepath, argv[1]);

	}

	else

	{

		printf("Could not find a audio file\n");

		return -1;

	}

	FILE *fp_pcm = fopen("output.pcm", "wb+");

	if (fp_pcm == NULL)

	{

		printf("FILE open error");

		return -1;

	}

	av_register_all();

	if (avformat_open_input(&pFormatCtx, filepath, NULL, NULL) != 0)

	{

		printf("Couldn't open an input stream.\n");

		return -1;

	}

	if (avformat_find_stream_info(pFormatCtx, NULL) < 0)

	{

		printf("Couldn't find stream information.\n");

		return -1;

	}

	audioIndex = -1;

	for (int i = 0; i < pFormatCtx->nb_streams; i++)

	{

		if (pFormatCtx->streams[i]->codec->codec_type == AVMEDIA_TYPE_AUDIO)

		{

			audioIndex = i;

			break;

		}

	}

	if (audioIndex == -1)

	{

		printf("Couldn't find a audio stream.\n");

		return -1;

	}

	pCodecCtx = pFormatCtx->streams[audioIndex]->codec;

	pCodec = avcodec_find_decoder(pCodecCtx->codec_id);

	if (pCodec == NULL)

	{

		printf("Codec not found.\n");

		return -1;

	}

	if (avcodec_open2(pCodecCtx, pCodec, NULL) < 0)

	{

		printf("Could not open codec.\n");

		return -1;

	}

	pAudioFrame = av_frame_alloc();

	if (pAudioFrame == NULL)

	{

		printf("Could not alloc AVFrame\n");

		return -1;

	}

	//音频输出参数

	uint64_t out_channel_layout = AV_CH_LAYOUT_STEREO;//声道格式

	AVSampleFormat out_sample_fmt = AV_SAMPLE_FMT_S16;//采样格式

	int out_nb_samples = pCodecCtx->frame_size;//nb_samples: AAC-1024 MP3-1152

	int out_sample_rate = 44100;//采样率

	int out_nb_channels = av_get_channel_layout_nb_channels(out_channel_layout);//根据声道格式返回声道个数

	int out_buffer_size = av_samples_get_buffer_size(NULL, out_nb_channels, out_nb_samples, out_sample_fmt, 1);

	buffer = (uint8_t *)av_malloc(MAX_AUDIO_FRAME_SIZE);

	/**

	* 函数声明：struct SwrContext *swr_alloc(void);

	* Allocate SwrContext.

	*

	* If you use this function you will need to set the parameters (manually or

	* with swr_alloc_set_opts()) before calling swr_init().

	*

	* @see swr_alloc_set_opts(), swr_init(), swr_free()

	* @return NULL on error, allocated context otherwise

	*/

	audio_convert_ctx = swr_alloc();

	if (audio_convert_ctx == NULL)

	{

		printf("Could not allocate SwrContext\n");

		return -1;

	}

	/**

	* 函数声明：struct SwrContext *swr_alloc_set_opts(

	* struct SwrContext *s,int64_t out_ch_layout, enum AVSampleFormat out_sample_fmt, int out_sample_rate,

	* int64_t  in_ch_layout, enum AVSampleFormat  in_sample_fmt, int  in_sample_rate,

	* int log_offset, void *log_ctx);

	*

	* Allocate SwrContext if needed and set/reset common parameters.

	*

	* This function does not require s to be allocated with swr_alloc(). On the

	* other hand, swr_alloc() can use swr_alloc_set_opts() to set the parameters

	* on the allocated context.

	*

	* @param s               existing Swr context if available, or NULL if not

	* @param out_ch_layout   output channel layout (AV_CH_LAYOUT_*)

	* @param out_sample_fmt  output sample format (AV_SAMPLE_FMT_*).

	* @param out_sample_rate output sample rate (frequency in Hz)

	* @param in_ch_layout    input channel layout (AV_CH_LAYOUT_*)

	* @param in_sample_fmt   input sample format (AV_SAMPLE_FMT_*).

	* @param in_sample_rate  input sample rate (frequency in Hz)

	* @param log_offset      logging level offset

	* @param log_ctx         parent logging context, can be NULL

	*

	* @see swr_init(), swr_free()

	* @return NULL on error, allocated context otherwise

	*/

	/*

	int64_t in_channel_layout = av_get_default_channel_layout(pCodecCtx->channels);//根据声道数返回默认输入声道格式

	swr_alloc_set_opts(audio_convert_ctx, out_channel_layout, out_sample_fmt, out_sample_rate,

		in_channel_layout, pCodecCtx->sample_fmt, pCodecCtx->sample_rate, 0, NULL);

	*/

	swr_alloc_set_opts(audio_convert_ctx, out_channel_layout, out_sample_fmt,out_sample_rate,

		pCodecCtx->channel_layout, pCodecCtx->sample_fmt, pCodecCtx->sample_rate, 0, NULL);

	/**

	* 函数声明：int swr_init(struct SwrContext *s);

	* Initialize context after user parameters have been set.

	* @note The context must be configured using the AVOption API.

	*

	* @see av_opt_set_int()

	* @see av_opt_set_dict()

	*

	* @param[in,out]   s Swr context to initialize

	* @return AVERROR error code in case of failure.

	*/

	swr_init(audio_convert_ctx);

	int	index = 0;//计数器

	while (av_read_frame(pFormatCtx, &packet) >= 0)

	{

		if (packet.stream_index == audioIndex)

		{

			if (avcodec_decode_audio4(pCodecCtx, pAudioFrame, &got_picture, &packet) < 0)

			{

				printf("Error in decoding audio frame.\n");

				return -1;

			}

			if (got_picture)

			{

				/** Convert audio.

				* 函数声明：int swr_convert(struct SwrContext *s, uint8_t **out, int out_count,

				*                           const uint8_t **in, int in_count);

				* in and in_count can be set to 0 to flush the last few samples out at the

				* end.

				*

				* If more input is provided than output space, then the input will be buffered.

				* You can avoid this buffering by using swr_get_out_samples() to retrieve an

				* upper bound on the required number of output samples for the given number of

				* input samples. Conversion will run directly without copying whenever possible.

				*

				* @param s         allocated Swr context, with parameters set

				* @param out       output buffers, only the first one need be set in case of packed audio

				* @param out_count amount of space available for output in samples per channel

				* @param in        input buffers, only the first one need to be set in case of packed audio

				* @param in_count  number of input samples available in one channel

				*

				* @return number of samples output per channel, negative value on error

				*/

				swr_convert(audio_convert_ctx, &buffer, MAX_AUDIO_FRAME_SIZE, (const uint8_t **)pAudioFrame->data, pAudioFrame->nb_samples);

				printf("index:%5d\t pts:%lld\t packet size:%d\n", index, packet.pts, packet.size);

				//Write PCM

				fwrite(buffer, 1, out_buffer_size, fp_pcm);

				index++;

			}

		}

		av_free_packet(&packet);

	}

	fclose(fp_pcm);

	swr_free(&audio_convert_ctx);

	av_free(buffer);

	av_frame_free(&pAudioFrame);

	avcodec_close(pCodecCtx);

	avformat_close_input(&pFormatCtx);

	return 0;

}

与解析视频里的YUV/RGB（http://blog.csdn.net/x_iya/article/details/52248929）相同的是，解析出音频的AVFrame同样需要转换。

由于ffmpeg较新的版本（貌似从2.1开始）使用avcodec_decode_audio4函数来解码音频，解码得到的数据类型可能为float 32bit（4字节），而播放器播放的格式一般为S16（signed 16bit），因此需要对解码得到的数据进行转换。ffmpeg已经帮我们做好了这件事，只需调用API即可，这个函数就是：swr_convert

输出：

使用Audacity打开（注意参数）

问题：

1.有些格式的视频不符合标准，获得的pCodecCtx->frame_size为0

雷老师，我使用wmv格式的视频进行测试，结果得不到正确的pcm文件，文件大小始终为0。发现是out_nb_samples = pCodecCtx->frame_size出了问题：其中pCodecCtx->frame_size为0，导致av_samples_get_buffer_size算出的大小是负数。问过有经验的组长，他告诉我有些格式的视频不符合标准，不能从文件头中获取到信息，要在读入一帧后获取，也就是在ret = avcodec_decode_audio4(pCodecCtx, pFrame, &got_picture, packet);之后，从pFrame中获取信息。

发现错误，重新修改程序，就能得到数据了。

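2.对于采样率为48000Hz的视频，解析为采样率为44100Hz的pcm时出现杂音，将out_sample_rate设置为

int out_sample_rate = 48000;则没有问题。原因是：重采样后每次swr_convert实际输出的样本数（即其返回值）与frame_size不再相等，如果仍按固定的out_buffer_size写入文件，就会写入多余或残缺的数据。更稳妥的做法是按swr_convert的返回值计算实际需要写入的字节数。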

FFMPEG学习----分离视音频里的PCM数据的更多相关文章

FFMPEG学习----分离视频里的H.264与YUV数据
#include <stdio.h> extern "C" { #include "libavcodec/avcodec.h" #include & ...
FFmpeg学习4：音频格式转换
前段时间,在学习试用FFmpeg播放音频的时候总是有杂音,网上的很多教程是基于之前版本的FFmpeg的,而新的FFmepg3中audio增加了平面(planar)格式,而SDL播放音频是不支持平面格式 ...
基于FFmpeg的音频编码（PCM数据编码成AAC android）
概述在Android上实现录音,并利用 FFmpeg将PCM数据编码成AAC. 详细代码下载:http://www.demodashi.com/demo/10512.html 之前做的一个demo ...
FFmpeg学习5：多线程播放视音频
在前面的学习中,视频和音频的播放是分开进行的.这主要是为了学习的方便,经过一段时间的学习,对FFmpeg的也有了一定的了解,本文就介绍了如何使用多线程同时播放音频和视频(未实现同步),并对前面的学习 ...
最简单的基于FFmpeg的封装格式处理：视音频分离器（demuxer）
===================================================== 最简单的基于FFmpeg的封装格式处理系列文章列表: 最简单的基于FFmpeg的封装格式处理 ...
最简单的基于FFmpeg的封装格式处理：视音频分离器简化版（demuxer-simple）
===================================================== 最简单的基于FFmpeg的封装格式处理系列文章列表: 最简单的基于FFmpeg的封装格式处理 ...
FFmpeg学习6：视音频同步
在上一篇文章中,视频和音频是各自独立播放的,并不同步.本文主要描述了如何以音频的播放时长为基准,将视频同步到音频上以实现视音频的同步播放的.主要有以下几个方面的内容视音频同步的简单介绍 DTS 和 ...
[总结]FFMPEG视音频编解码零基础学习方法--转
ffmpeg编解码学习目录(?)[-] ffmpeg程序的使用ffmpegexeffplayexeffprobeexe 1 ffmpegexe 2 ffplayexe 3 ffprobeexe ...
FFMPEG视音频编解码零基础学习方法－b
感谢大神分享,虽然现在还看不懂,留着大家一起看啦 PS:有不少人不清楚“FFmpeg”应该怎么读.它读作“ef ef em peg” 0. 背景知识本章主要介绍一下FFMPEG都用在了哪里(在这里仅 ...

随机推荐

POJ2186 Popular Cows 题解强连通分量
题目链接:http://poj.org/problem?id=2186 题目大意: 每头牛都想成为牛群中的红人. 给定N头牛的牛群和M个有序对(A, B),(A, B)表示牛A认为牛B是红人: 该关系 ...
开源工具abaplint的介绍
长期以来,SAP提供的标准ABAP开发工具是我们对代码进行检查的唯一方式.这意味着我们只能对ABAP服务器上的ABAP代码做出分析,而离线代码则成为了纯粹的文本,开发者无法对其进行检查.abaplin ...
你的java服务挂了吗
问题背景最近测试环境服务总是崩溃,运维小哥全部重启后还是崩溃,查看了服务运行情况占用内存确实挺高的,看来是时候优化一波jvm参数了. 优化前 top $(ps -e | grep java | aw ...
JVM系列五（javac 编译器）.
一.概述我们都知道 *.java 文件要首先被编译成 *.class 文件才能被 JVM 认识,这部分的工作主要由 Javac 来完成,类似于 Javac 这样的我们称之为前端编译器: 但是 *.c ...
BFS小记
题目:求从S走到G点所需步数 #S######.#......#..#.#.##.##.#.#........##.##.####....#....#.#######.#....#......#### ...
假设检验的Python实现
结合假设检验的理论知识,本文使用Python对实际数据进行假设检验. 导入测试数据从线上下载测试数据文件,数据链接:https://pan.baidu.com/s/1t4SKF6U2yyjT365F ...
linux下文件解压缩中文乱码问题的解决
将带中文文件名的压缩文件上传到服务器,使用unzip解压后,文件名乱码: 临时解决方法: 通过unzip行命令解压,指定字符集unzip -O CP936 xxx.zip (用GBK, GB18030 ...
Frogger POJ - 2253（求两个石头之间”所有通路中最长边中“的最小边）
题意题目主要说的是,有两只青蛙,在两个石头上,他们之间也有一些石头,一只青蛙要想到达另一只青蛙所在地方,必须跳在石头上.题目中给出了两只青蛙的初始位置,以及剩余石头的位置,问一只青蛙到达另一只青 ...
python异常（理论知识）
异常程序在运行过程当中,不可避免的会出现一些错误,比如: 使用了没有赋值过的变量使用了不存在的索引除0 ... 这些错误在程序中,我们称其为异常. 程序运行过程中,一旦出现异常将会导致程序立即终 ...
MQ队列及常见操作
一. 创建MQ队列管理器 1.1准备工作到所安装websphere mq的机子上,进入/opt/mm/bin目录下,查询相关mq的情况,通过命令行./dspmq. 创建mq队列管理器的的时候要用mq ...

FFMPEG学习----分离视音频里的PCM数据

FFMPEG学习----分离视音频里的PCM数据的更多相关文章

随机推荐

热门专题