使用libavcodec将mp3音频文件解码为pcm音频采样数据【[mp3float @ 0x561c1ec49940] Header missing】

一.打开和关闭输入文件和输出文件

　　想要解决上面提到的问题，我们需要对mp3文件的格式有个大致了解，为了方便讲解，我这里画了个示意图：

ID3V2	包含了作者，作曲，专辑等信息，长度不固定，扩展了 ID3V1 的信息量。
Frame	一系列的帧，个数由文件大小和帧长决定
ID3V1	包含了作者，作曲，专辑等信息，长度为 128BYTE

　　由于av_parser_parse2()这个方法的输入必须是只包含音频编码数据的“裸流”，所以，我们在读取mp3文件的时候，必须跳过ID3V2标签部分，从Frame开始。所以，我们就必须知道ID3V2标签的总长度。下面，我画了个ID3V2标签头的示意图，方便讲解。

File ID(3)

Version(2)

Flags(1)

Size(4)

　　ID3V2标签头固定为10byte，其中，Size部分的值是指除ID3V2标签头之外数据的总长度。需要注意的是，在实际计算长度的时候，这4个字节的最高位需要舍弃，也就是说，只用到了28bit，即：0xxxxxxx0xxxxxxx0xxxxxxx0xxxxxxx

#define AUDIO_INBUF_SIZE 20480

#define AUDIO_REFILL_THRESH 4096

static FILE* input_file= nullptr;

static FILE* output_file= nullptr;

static const AVCodec* codec= nullptr;

static AVCodecContext* codec_ctx= nullptr;

static AVPacket* pkt= nullptr;

static AVFrame* frame= nullptr;

static AVCodecParserContext* parser= nullptr;

static enum AVCodecID audio_codec_id;

void close_input_output_files(){

    if(input_file!= nullptr){

        fclose(input_file);

        input_file= nullptr;

    }

    if(output_file!= nullptr){

        fclose(output_file);

        output_file= nullptr;

    }

}

int32_t open_input_output_files(const char* input_name,const char* output_name){

    if(strlen(input_name)==0||strlen(output_name)==0){

        cout<<"Error:empty input or output file name."<<endl;

        return -1;

    }

    close_input_output_files();

    input_file=fopen(input_name,"rb");//rb：读取一个二进制文件，该文件必须存在

    if(input_file==nullptr){

        cerr<<"Error:failed to open input file."<<endl;

        return -1;

    }

    output_file=fopen(output_name,"wb");//wb:打开或新建一个二进制文件，只允许写

    if(output_file== nullptr){

        cout<<"Error:failed to open output file."<<endl;

        return -1;

    }

    uint8_t ID3V2_Header[10];

    fread(ID3V2_Header,10,1,input_file);

    long ID3V2_Size=((ID3V2_Header[6]&0x7f)<<21)+((ID3V2_Header[7]&0x7f)<<14)+((ID3V2_Header[8]&0x7f)<<7)+(ID3V2_Header[9]&0x7f)+10;

    fseek(input_file,ID3V2_Size,SEEK_SET);

    return 0;

}

二.音频解码器的初始化以及销毁

int32_t init_audio_decoder(const char* audio_codec){

    if(strcasecmp(audio_codec,"MP3")==0){

        audio_codec_id=AV_CODEC_ID_MP3;

        cout<<"Select codec id:MP3"<<endl;

    }

    else if(strcasecmp(audio_codec,"AAC")==0){

        audio_codec_id=AV_CODEC_ID_AAC;

        cout<<"Select codec id:AAC"<<endl;

    }

    else{

        cerr<<"Error:invalid audio format."<<endl;

        return -1;

    }

    codec=avcodec_find_decoder(audio_codec_id);

    if(!codec){

        cerr<<"Error:could not find codec."<<endl;

        return -1;

    }

    parser= av_parser_init(codec->id);

    if(!parser){

        cerr<<"Error:could not init parser."<<endl;

        return -1;

    }

    codec_ctx= avcodec_alloc_context3(codec);

    if(!codec_ctx){

        cerr<<"Error:could not alloc codec_ctx."<<endl;

        return -1;

    }

    int32_t result=avcodec_open2(codec_ctx,codec, nullptr);

    if(result<0){

        cerr<<"Error:could not open codec."<<endl;

        return -1;

    }

    frame=av_frame_alloc();

    if(!frame){

        cerr<<"Error:could not alloc frame."<<endl;

        return -1;

    }

    pkt=av_packet_alloc();

    if(!pkt){

        cerr<<"Error:could not alloc packet."<<endl;

        return -1;

    }

    return 0;

}

void destroy_audio_decoder(){

    av_parser_close(parser);

    avcodec_free_context(&codec_ctx);

    av_frame_free(&frame);

    av_packet_free(&pkt);

}

三.解码循环体

　　解码循环体至少需要实现以下三个功能：

　　　　1.从输入源中循环获取码流包

　　　　2.将当前帧传入解码器，获取输出的音频采样数据

　　　　3.输出解码获取的音频采样数据到输出文件

　　从输入源中读取音频数据到缓存：　

int32_t read_data_to_buf(uint8_t* buf,int32_t size,int32_t& out_size){

    int32_t read_size=fread(buf,1,size,input_file);

    if(read_size==0){

        cerr<<"Error:read_data_to_buf failed."<<endl;

        return -1;

    }

    out_size=read_size;

    return 0;

}

　　解码循环体：　　

int32_t end_of_input_file(){

    return feof(input_file);

}

static int32_t decode_packet(bool flushing){

    int32_t result=0;

    result= avcodec_send_packet(codec_ctx,flushing? nullptr:pkt);

    if(result<0){

        cerr<<"Error:avcodec_send_packet failed,result:"<<result<<endl;

        return -1;

    }

    while(result>=0){

        result= avcodec_receive_frame(codec_ctx,frame);

        if(result==AVERROR(EAGAIN)||result==AVERROR_EOF){

            return 1;

        }

        else if(result<0){

            cerr<<"Error:avcodec_receive_frame failed."<<endl;

            return -1;

        }

        if(flushing){

            cout<<"flushing:";

        }

        write_samples_to_pcm(frame,codec_ctx);

        cout<<"frame->nb_samples:"<<frame->nb_samples<<",frame->channels:"<<frame->channels<<endl;

    }

    return 0;

}

int32_t audio_decoding(){

    uint8_t inbuf[AUDIO_INBUF_SIZE+AV_INPUT_BUFFER_PADDING_SIZE]={0};

    int32_t result=0;

    uint8_t* data= nullptr;

    int32_t data_size=0;

    while(!end_of_input_file()){

        result= read_data_to_buf(inbuf,AUDIO_INBUF_SIZE,data_size);

        if(result<0){

            cerr<<"Error:read_data_to_buf failed."<<endl;

            return -1;

        }

        data=inbuf;

        while(data_size>0){

            result=av_parser_parse2(parser,codec_ctx,&pkt->data,&pkt->size,data,data_size,AV_NOPTS_VALUE,AV_NOPTS_VALUE,0);

            if(result<0){

                cerr<<"Error:av_parser_parse2 failed."<<endl;

                return -1;

            }

            data+=result;

            data_size-=result;

            if(pkt->size){

                cout<<"Parsed packet size:"<<pkt->size<<endl;

                decode_packet(false);

            }

            if (data_size < AUDIO_REFILL_THRESH) {

                memmove(inbuf, data, data_size);

                data = inbuf;

                int len = fread(data + data_size, 1,AUDIO_INBUF_SIZE - data_size, input_file);

                if (len > 0)

                    data_size += len;

            }

        }

    }

    decode_packet(true);

    return 0;

}

　　输出解码的音频采样数据：　　

int32_t write_samples_to_pcm(AVFrame* frame,AVCodecContext* codec_ctx){

    int data_size= av_get_bytes_per_sample(codec_ctx->sample_fmt);

    if(data_size<0){

        cerr<<"Error:failed to calculate data size."<<endl;

        return -1;

    }

    for(int i=0;i<frame->nb_samples;i++){

        for(int ch=0;ch<codec_ctx->channels;ch++){

            fwrite(frame->data[ch]+i*data_size,1,data_size,output_file);

        }

    }

    return 0;

}

　　最终，main函数的实现如下：

int main(){

    const char* input_file_name="../input.mp3";

    const char* output_file_name="../output.pcm";

    const char* codec_name="MP3";

    int32_t result= open_input_output_files(input_file_name,output_file_name);

    if(result<0){

        return result;

    }

    result=init_audio_decoder(codec_name);

    if(result<0){

        return result;

    }

    result=audio_decoding();

    if(result<0){

        return result;

    }

    destroy_audio_decoder();

    close_input_output_files();

    return 0;

}

　　解码完成后，可以使用ffplay播放output.pcm文件：

　　ffplay -ar 44100 -ac 2 -f f32le -i output.pcm

使用libavcodec将mp3音频文件解码为pcm音频采样数据【[mp3float @ 0x561c1ec49940] Header missing】的更多相关文章

视音频数据处理入门：PCM音频采样数据处理
===================================================== 视音频数据处理入门系列文章: 视音频数据处理入门:RGB.YUV像素数据处理视音频数据处理 ...
解析WAV音频文件----》生成WAV音频文件头
前言:请各大网友尊重本人原创知识分享,谨记本人博客:南国以南i WAV音频文件介绍: WAV文件是在PC机平台上很常见的.最经典的多媒体音频文件,最早于1991年8月出现在Windows3.1操作系统 ...
C# NAudio录音和播放音频文件及实时绘制音频波形图（从音频流数据获取，而非设备获取）
下午写了一篇关于NAudio的录音.播放和波形图的博客,不太满意,感觉写的太乱,又总结了下 NAudio是个相对成熟.开源的C#音频开发工具,它包含录音.播放录音.格式转换.混音调整等功能.本次介绍主 ...
android MediaCodec 音频编解码的实现——转码
原文地址:http://blog.csdn.net/tinsanmr/article/details/51049179 从今天开始每周不定期更新博客,把这一周在工作与学习中遇到的问题做个总结.俗话说 ...
FFMPEG视音频编解码零基础学习方法－b
感谢大神分享,虽然现在还看不懂,留着大家一起看啦 PS:有不少人不清楚“FFmpeg”应该怎么读.它读作“ef ef em peg” 0. 背景知识本章主要介绍一下FFMPEG都用在了哪里(在这里仅 ...
[总结]FFMPEG视音频编解码零基础学习方法
在CSDN上的这一段日子,接触到了很多同行业的人,尤其是使用FFMPEG进行视音频编解码的人,有的已经是有多年经验的“大神”,有的是刚开始学习的初学者.在和大家探讨的过程中,我忽然发现了一个问题:在“ ...
[转载] FFMPEG视音频编解码零基础学习方法
在CSDN上的这一段日子,接触到了很多同行业的人,尤其是使用FFMPEG进行视音频编解码的人,有的已经是有多年经验的“大神”,有的是刚开始学习的初学者.在和大家探讨的过程中,我忽然发现了一个问题:在“ ...
视音频编解码基本术语及解释&MediaInfo
MEDIA INFO 下载: https://mediaarea.net/en/MediaInfo/Download/Windows 摘要: 整理了一些基本视音频术语,用于入门和查询 ...
[总结]FFMPEG视音频编解码零基础学习方法【转】
本文转载自:http://blog.csdn.net/leixiaohua1020/article/details/15811977 在CSDN上的这一段日子,接触到了很多同行业的人,尤其是使用FFM ...
(原创)speex与wav格式音频文件的互相转换(二)
之前写过了如何将speex与wav格式的音频互相转换,如果没有看过的请看一下连接 http://www.cnblogs.com/dongweiq/p/4515186.html 虽然自己实现了相关的压缩 ...

随机推荐

Numpy数组乘法
Numpy数组乘法元素级乘法 numpy.multiply() 或 * : 数组对应位置元素相乘 import numpy as np # 一维数组 a = np.array([1, 2, 3, 4 ...
Vulnhub Development Walkthrough
Vulnhub Development Walkthrough Recon 首先使用netdiscover进行二层Arp扫描. ┌──(kali㉿kali)-[~] └─$ sudo netdisco ...
mysql+proxysql+replication-manager的主从半同步复制+高可用+读写分离
环境: AlmaLinux release 9.1 MySQL Community Server Ver 8.0.33 Replication Manager v2.2.40 for MariaDB ...
笔记：C++学习之旅---IO库
笔记:C++学习之旅---IO库 C++的输入输出分为三种: (1)基于控制台的I/O (2)基于文件的I/O (3)基于字符串的I/O 练习8.4 编写函数,以读模式打开一个文 ...
vue导入Excel数据并展示成表格
前言: 用到的库参考链接: FileReader:https://developer.mozilla.org/zh-CN/docs/Web/API/FileReader 这个在之前的下载exce ...
CSS 点击穿透pointer-events
在项目中,当需要展示一个元素在最顶层,但又不想让它影响下层的交互,可以pointer-events:none pointer-events介绍 pointer-events: auto | none ...
【解决方法】查找比较组时报错：An object (User, Group, or Built-in security principal) with the following nameca..
目录-快速跳转问题描述原因分析: 解决方案: 附言: 问题描述操作环境与场景: 在 VM 内 Windows 2019 中,在组策略管理中,对GPO进行组查找时报错: An object (Us ...
docker常用命令之帮助启动类命令和镜像命令
docker安装之后,启动时会报如下错误: Job for docker.service failed because start of the service was attempted too o ...
MySQL 中读写分离数据延迟
MySQL 中读写分离可能遇到的问题前言读写分离的架构基于客户端实现读写分离基于中间代理实现读写分离 MySQL 中如何保证主从数据一致循环复制问题主从同步延迟主从同步延迟的原因主从延 ...
SpringBoot自定义注解+AOP+redis实现防接口幂等性重复提交，从概念到实战
本文为千锋教育技术团独家创作,更多技术类知识干货,点个关注持续追更~ 接口幂等性是Web开发中非常重要的一个概念,它可以保证多次调用同一个接口不会对结果产生影响.如果你想了解更多关于接口幂等性的知识, ...

使用libavcodec将mp3音频文件解码为pcm音频采样数据【[mp3float @ 0x561c1ec49940] Header missing】

使用libavcodec将mp3音频文件解码为pcm音频采样数据【[mp3float @ 0x561c1ec49940] Header missing】的更多相关文章

随机推荐

热门专题