ffmpeg音频重采样代码抽取

更新时间:2023-05-03 13:05:59 阅读：评论：0

ffmpeg⾳频重采样代码抽取

本篇博⽂针对的是ffmpeg4.0.1版本进⾏（⾳频重采样代码都能分离出来，其他部分不是肯定可以嘛，往后ffmpeg就可以分⽽⾷之，我们可以把它变成我们⾃⼰的代码）

ffmpeg解压缩之后会有⼀个doc⽬录，此⽬录中有⽰例程序，就在doc/examples。

要想编译examples中的测试程序，可以先编译整个ffmpeg（⽣成主要的库，如：libavcodec.a libavdevice.a libavfilter.a libavformat.a libavutil.a libswresample.a libswscale.a。当然动态库静态库都是可以配置的，我选择默认静态库编译），然后在ffmpeg主⽬录中执⾏make examples即可（make examplesclean可以清除编译⽂件）。

针对于resampleaudio.c这个⽂件，编译完了之后，直接执⾏./resampleaudio out即可（out⽂件查看代码可以知道它的采样率为44100，channel为3，格式为signed16bit），使⽤audacity⼯具导⼊查看如下：

其中前两个通道左右声道都是由正⽞波产⽣，正⽞波是代码中写好的src_data数据，查看resampleaudio.c的fill_samples函数就能知道，如下：

static void fill_samples(double*dst,int nb_samples,int nb_channels,int sample_rate,double*t)

{

int i, j;

double tincr =1.0/ sample_rate,*dstp = dst;

const double c =2* M_PI *440.0;

/* generate sin tone with 440Hz frequency and duplicated channels */

for(i =0; i < nb_samples; i++){

*dstp =sin(c **t);//这就是正⽞波⽣成的采样点赋值的地⽅（为什么没有输⼊源数据？因为代码中已经⾃⼰产⽣了数据）

for(j =1; j < nb_channels; j++)

dstp[j]= dstp[0];

dstp += nb_channels;

*t += tincr;

}

你刚开始看上⾯的波形可能会觉得那⾥是正⽞波，⼀点⼉也看不出来，其实放⼤之后就可以看到了，如下：

数据时间为10s，代码中是通过do{} while（t<10）来控制的，为什么t<10就是10s，你仔细看fill_samp

les函数⾥⾯代码实现就能知道，对于这个⽰例程序，程序中写死了最终输出数据的采样率为44100，也就是说1s秒钟会有44100个采样点，tincr = 1.0 /

sample_rate，什么时候t会等于1（也就是1s），那就要t⾃加sample_rate（44100）次才是⼀秒的数据量。由于nb_samples程序中写死了是1024（其实就是1024个采样点），1024对应于src_date采样率48000的数据量，通过程序执⾏时的打印看出*t=0重复出现了46次，其它都⼀样（*t=1,2,3…），我们计算⼀下就知道了48000/1024=46（46.875），⽽每次输⼊1024个采样点同样会输出941个采样点，这941个采样点对应的是dst_data的44100采样率数据，再次计

算，44100/941=46（46.865037194473963868225292242295），这就对上了。

程序中核⼼函数，也就是实际进⾏采样率转换的函数就是swr_convert函数，我们只需要会使⽤这个函数就⾏，与之相关的函数还有如下：（1）swr_alloc 创建resample context

（2）av_opt_t_int av_opt_t_sample_fmt 设置相关属性（通道，采样率，格式）

（3）swr_init 初始化resample context

（4）av_get_channel_layout_nb_channels av_samples_alloc_array_and_samples 分配内存

（5）fill_samples 填充数据

（6）swr_convert 转换采样率

（7）av_samples_get_buffer_size 获取转换之后的buffer⼤⼩，之后就是写⼊数据到⽂件中

⾮常符合我们⽇常实际开发中的代码逻辑：创建，初始化，设置参数，分配内存，进⾏数据处理，结果输出这个过程。

好了，代码也看了，也能正常运⾏，下⾯就是修改代码了，来个简单的，我要输⼊数据为48000，格式为signed16bit，通道为1（单声道），输出采样率为44100，格式为sig七月份是什么星座 ned16bit，通道为1的数据，怎么搞？很简单，就是上⾯的fill_samples函数，你把数据填到⾥⾯就可以了，具体修改如下：

static int fill_samples(short*dst,int nb_samples,int nb_channels,int src_sample_rate,int dst_sample_rate,double*t, FILE* src_file)

{

int i, j;

int ret =0;

double tincr =1.0/ src_sample_rate;

short* dstp = dst;

const double c =2* M_PI *440.0;

/* generate sin tone with 440Hz frequency and duplicated channels */

/*for (i = 0; i < nb_samples; i++) {

*dstp = sin(c * *t);

for (j = 1; j < nb_channels; j++)

dstp[j] = dstp[0];

dstp += nb_channels;

*t += tincr;

}*/

ret =fread(dst,2, nb_samples, src_file);

if(ret ==0){

printf("read complete, end \n");

return0;

}el if(ret <0){

printf("\n");

return-1;

}

printf("---- ret = %d\n", ret);

//memcpy(dst, );

for(j =1; j < nb_channels; j++)

dstp[j]= dstp[0];

return ret;

}

int main(int argc,char**argv)

{

int64_t src_ch_layout = AV_CH_LAYO排骨怎么炒才好吃 UT_MONO, dst_ch_layout = AV_CH_LAYOUT_MONO;

int src_rate =48000, dst_rate =44100;

uint8_t **src_data =NULL,**dst_data =NULL;

int src_nb_channels =0, dst_nb_channels =0;

int src_linesize, dst_linesize;

int src_nb_samples =1024, dst_nb_samples, max_dst_nb_samples;

enum AVSampleFormat src_sample_fmt = AV_SAMPLE_FMT_S16, dst_sample_fmt = AV_SAMPLE_FMT_S16; const char*dst_filename =NULL;

const char*src_filename =NULL;

FILE *dst_file;

FILE *src_file;

int dst_bufsize;

const char*fmt;

struct SwrContext *swr_ctx;

double t;

int ret;

if(argc !=3){

fprintf(stderr,"Usage: %s output_file\n"

"API example program to show how to resample an audio stream with libswresample.\n"

"This program generates a ries of audio frames, resamples them to a specified "

"output format and rate and saves them to an output file named output_file.\n",

argv[0]);

exit(1);

}

dst_filename = argv[1];

src_filename = argv[2];

dst_file =fopen(dst_filename,"wb");

if(!dst_file){

fprintf(stderr,"Could not open destination file %s\n", dst_filename);

exit(1);

}

src_file =fopen(src_filename,"rb");

if(!src_file){

fprintf(stderr,"Could not open destination file %s\n", src_filename);

exit(1);

}

/* create resampler context */

swr_ctx =swr_alloc();

if(!swr_ctx)生产的英语 {

fprintf(stderr,"Could not allocate resampler context\n");

ret =AVERROR(ENOMEM);

goto end;

}

/* t options */

av_opt_t_int(swr_ctx,"in_channel_layout", src_ch_layout,0);

av_opt_t_int(swr_ctx,"in_sample_rate", src_rate,0);

av_opt_t_sample_fmt(swr_ctx,"in_sample_fmt", src_sample_fmt,0);

av_蜂蜡 opt_t_int(swr_ctx,"out_channel_layout", dst_ch_layout,0);

av_opt_t_int(swr_ctx,"out_sample_rate", dst_rate,0);

av_opt_t_sample_fmt(swr_ctx,"out_sample_fmt", dst_sample_fmt,0);

* initialize the resampling context */

if((ret =swr_init(swr_ctx))<0){

fprintf(stderr,"Failed to initialize the resampling context\n");

goto end;

}

/* allocate source and destination samples buffers */

src_nb_channels =av_get_channel_layout_nb_channels(src_ch_layout);

ret =av_samples_alloc_array_and_samples(&src_data,&src_linesize, src_nb_channels,

src_nb_samples, src_sample_fmt,0);

if(ret <0){

fprintf(stderr,"Could not allocate source samples\n");

goto end;

}

/* compute t朗诵腔 he number of converted samples: buffering is avoided

* ensuring that the output buffer will contain at least all the

* converted input samples */

max_dst_nb_samples = dst_nb_samples =

av_rescale_rnd(src_nb_samples, dst_rate, src_rate, AV_ROUND_UP);

/* buffer is going to be directly written to a rawaudio file, no alignment */

dst_nb_channels =av_get_channel_layout_nb_channels(dst_ch_layout);

ret =av_samples_alloc_array_and_samples(&dst_data,&dst_linesize, dst_nb_channels,

dst_nb_samples, dst_sample_fmt,0);

if(ret <0){

fprintf(stderr,"Could not allocate destination samples\n");

goto end;

}

t =0;

do{

/* generate synthetic audio */

if(fill_samples((short*)src_data[0], src_nb_samples, src_nb_channels, src_rate, dst_rate,&t, src_file)<=0) break;

/* comput跑步节奏音乐 e destination number of samples */

dst_nb_samples =av_rescale_rnd(swr_get_delay(swr_ctx, src_rate)+

src_nb_samples, dst_rate, src_rate, AV_ROUND_UP);

if(dst_nb_samples > max_dst_nb_samples){

av_freep(&dst_data[0]);

ret =av_samples_alloc(dst_data,&dst_linesize, dst_nb_channels,

dst_nb_samples, dst_sample_fmt,1);

if(ret <0)

break;

max_dst_nb_samples = dst_nb_samples;

}

/* convert to destination format */

ret =swr_convert(swr_ctx, dst_data, dst_nb_samples,(const uint8_t **)src_data, src_nb_samples);

if(ret <0){

fprintf(stderr,"Error while converting\n");

goto end;

}

dst_bufsize =av_samples_get_buffer_size(&dst_linesize新生儿支气管肺炎 , dst_nb_channels,

ret, dst_sample_fmt,1);

if(dst_bufsize <0){

fprintf(stderr,"Could not get sample buffer size\n");

goto end;

}

printf("t:%f in:%d out:%d\n", t, src_nb_samples, ret);

fwrite(dst_data[0],1, dst_bufsize, dst_file);

}while(1);

if((ret =get_format_from_sample_fmt(&fmt, dst_sample_fmt))<0)

goto end;

fprintf(stderr,"Resampling succeeded. Play the output file with the command:\n"

"ffplay -f %s -channel_layout %"PRId64" -channels %d -ar %d %s\n",

fmt, dst_ch_layout, dst_nb_channels, dst_rate, dst_filename);

end:

fclo(dst_file);

fclo(src_file);

if(src_data)

av动物图片 _freep(&src_data[0]);

av_freep(&src_data);

if(dst_data)

av_freep(&dst_data[0]);

av_freep(&dst_data);

swr_free(&swr_ctx);

return ret <0;

}

修改之后编译运⾏：

./resampleaudio out say_48.pcm (say_48.pcm为采样率为48000，signed16bit，单声道格式)

结果如下，上图：

这个能实现，其他的所有格式转换都可以，直接修改代码即可，那怎么进⾏⼆次开发（此处就针对于⾳频重采样代码），单独编译resampleaudio.c⽂件如下：

gcc resampling_audio.c -o resampling_audio -I …/…/_install_gcc/include/ -L …/…/_install_gcc/lib/ -lswresample -lavutil -lm -lrt

…/…/_install_gcc/include/为编译ffmpeg之后的头⽂件安装⽬录，…/…/_install_gcc/lib/为编译ffmpeg之后的库⽂件安装⽬录，由此可以看出要编译resampling_audio.c需要⽤到libavutil和libswresample的库，好，那下⾯就把这⼀块⼉代码直接从程序中抽出来，让我们能单独编译resampling_audio.c这个⽂件，⽽不⽤依赖库⽂件。

。。。。。。

。。。。。

。。。。。。

本文发布于:2023-05-03 13:05:59，感谢您对本站的认可！

本文链接：https://www.wtabcd.cn/fanwen/fan/82/520816.html

上一篇：FL水果软件教程简单教学

下一篇：江畔独步寻花的板书

标签：代码采样率编译

留言与评论（共有 0 条评论）