如何将mp4文件解复用并且解码为单独的.yuv图像序列以及.pcm音频采样数据？

一.初始化解复用器

　　在音视频的解复用的过程中，有一个非常重要的结构体AVFormatContext,即输入文件的上下文句柄结构，代表当前打开的输入文件或流。我们可以将输入文件的路径以及AVFormatContext **format_ctx 传入函数avformat_open_input(),就可以打开对应的音视频文件或流。接下来再调用avformat_find_stream_info()函数去解析输入文件中的音视频流信息，打开对应的解码器，读取文件头的信息进行解码，然后在解码过程中将一些参数的信息保存到AVStream结构对应的成员中。之后，我们便可以通过AVStream去初始化编解码器的上下文结构，下面给出代码：

// File-scope demuxer state shared by the functions below.

// Context of the currently opened input file or stream.
static AVFormatContext *format_ctx = nullptr;

// Decoder contexts for the selected video and audio streams.
static AVCodecContext *video_dec_ctx = nullptr;
static AVCodecContext *audio_dec_ctx = nullptr;

// Indices of the selected streams inside format_ctx; -1 until a stream is selected.
static int32_t video_stream_index = -1;
static int32_t audio_stream_index = -1;

// The selected streams themselves (entries of format_ctx->streams).
static AVStream *video_stream = nullptr;
static AVStream *audio_stream = nullptr;

// Destination files for the raw decoded video frames and audio samples.
static FILE *output_video_file = nullptr;
static FILE *output_audio_file = nullptr;

// Packet and frame objects reused for every read/decode iteration.
static AVPacket *pkt = nullptr;
static AVFrame *frame = nullptr;

static int open_codec_context(int32_t *stream_idx,AVCodecContext **dec_ctx,AVFormatContext *fmt_ctx,enum AVMediaType type){

    int ret,stream_index;

    AVStream *st= nullptr;

    const AVCodec *dec= nullptr;

    ret= av_find_best_stream(fmt_ctx,type,-1,-1, nullptr,0);

    if(ret<0){

        cerr<<"Error:Could not find "<<string(av_get_media_type_string(type))<<" stream in input file."<<endl;

        return ret;

    }

    else{

        stream_index=ret;

        st=fmt_ctx->streams[stream_index];

        //find decoder for the stream

        dec= avcodec_find_decoder(st->codecpar->codec_id);

        if(!dec){

            cerr<<"Error:Failed to find codec:"<<string(av_get_media_type_string(type))<<endl;

            return -1;

        }

        *dec_ctx= avcodec_alloc_context3(dec);

        if(!*dec_ctx){

            cerr<<"Error:Failed to alloc codec context:"<<string(av_get_media_type_string(type))<<endl;

            return -1;

        }

        if((ret= avcodec_parameters_to_context(*dec_ctx,st->codecpar))<0){

            cerr<<"Error:Failed to copy codec parameters to decoder context."<<endl;

            return ret;

        }

        if((ret=avcodec_open2(*dec_ctx,dec, nullptr))<0){

            cerr<<"Error:Could not open "<<string(av_get_media_type_string(type))<<" codec."<<endl;

            return ret;

        }

        *stream_idx=stream_index;

    }

    return 0;

}

/**
 * Open the input, select its video/audio streams, open their decoders and
 * the matching output files, and allocate the shared packet and frame.
 *
 * @param input_name         Path (or URL) of the input to open.
 * @param video_output_name  Path of the file that receives raw video frames.
 * @param audio_output_name  Path of the file that receives raw audio samples.
 * @return 0 on success, -1 on failure. On failure the file-scope state may be
 *         partially initialized; the function does not release it itself.
 */
int32_t init_demuxer(const char *input_name,const char *video_output_name,const char *audio_output_name){
    // Reject both a null pointer and an empty string.
    if(!input_name||input_name[0]=='\0'){
        cerr<<"Error:empty input file name."<<endl;
        return -1;
    }

    // Report failures through the return value instead of exit(), so that the
    // caller keeps control over cleanup and the process exit status.
    int32_t result=avformat_open_input(&format_ctx,input_name,nullptr,nullptr);
    if(result<0){
        cerr<<"Error:avformat_open_input failed."<<endl;
        return -1;
    }

    result=avformat_find_stream_info(format_ctx,nullptr);
    if(result<0){
        cerr<<"Error:avformat_find_stream_info failed."<<endl;
        return -1;
    }

    // A missing video stream is not fatal on its own; see the combined check below.
    result=open_codec_context(&video_stream_index,&video_dec_ctx,format_ctx,AVMEDIA_TYPE_VIDEO);
    if(result>=0){
        video_stream=format_ctx->streams[video_stream_index];
        // A null name is treated like a file that could not be opened.
        output_video_file=video_output_name?fopen(video_output_name,"wb"):nullptr;
        if(!output_video_file){
            cerr<<"Error:failed to open video output file."<<endl;
            return -1;
        }
    }

    // Same for the audio stream.
    result=open_codec_context(&audio_stream_index,&audio_dec_ctx,format_ctx,AVMEDIA_TYPE_AUDIO);
    if(result>=0){
        audio_stream=format_ctx->streams[audio_stream_index];
        output_audio_file=audio_output_name?fopen(audio_output_name,"wb"):nullptr;
        if(!output_audio_file){
            cerr<<"Error:failed to open audio output file."<<endl;
            return -1;
        }
    }

    av_dump_format(format_ctx,0,input_name,0);

    if(!audio_stream&&!video_stream){
        cerr<<"Error:Could not find audio or video stream in the input,aborting"<<endl;
        return -1;
    }

    pkt=av_packet_alloc();
    if(!pkt){
        cerr<<"Error:could not alloc packet."<<endl;
        return -1;
    }

    frame=av_frame_alloc();
    if(!frame){
        cerr<<"Error:could not alloc frame."<<endl;
        return -1;
    }

    // A stream pointer is only set after its output file was opened, so the
    // corresponding output name is non-null here.
    if(video_stream){
        cout<<"Demuxing video from file "<<string(input_name)<<" into "<<string(video_output_name)<<endl;
    }
    if(audio_stream){
        cout<<"Demuxing audio from file "<<string(input_name)<<" into "<<string(audio_output_name)<<endl;
    }

    return 0;
}

二.循环读取码流包数据进行解码

　　在这里，我们需要调用一个非常重要的函数av_read_frame()，它可以从打开的音视频文件或流中依次读取下一个码流包结构，然后我们将码流包传入解码器进行解码即可，代码如下：

/**
 * Send one packet to a decoder and write every frame it produces to the
 * matching output file.
 *
 * @param dec       Decoder context to feed.
 * @param pkt       Packet to decode; the callers pass a null pointer to drain the decoder.
 * @param flushing  When true, "flushing" is printed for every frame received.
 * @return 0 when the decoder needs more input or is fully drained, a negative
 *         value when sending, decoding, or writing fails.
 */
static int32_t decode_packet(AVCodecContext *dec,const AVPacket *pkt,bool flushing){
    int32_t result=avcodec_send_packet(dec,pkt);
    if(result<0){
        cerr<<"Error:avcodec_send_packet failed."<<endl;
        return -1;
    }

    // One packet may yield zero, one, or several frames.
    while(result>=0){
        result=avcodec_receive_frame(dec,frame);
        if(result<0){
            // EAGAIN: more input is needed; EOF: the decoder is drained.
            if(result==AVERROR_EOF||result==AVERROR(EAGAIN)){
                return 0;
            }
            cerr<<"Error:Error during decoding,result="<<result<<endl;
            return result;
        }

        int32_t write_result=0;
        if(dec->codec->type==AVMEDIA_TYPE_VIDEO){
            write_result=write_frame_to_yuv(frame);
        }
        else{
            // Use the context that actually produced the frame rather than a global.
            write_result=write_samples_to_pcm(frame,dec);
        }

        if(flushing){
            cout<<"flushing"<<endl;
        }

        // Release the frame before any early return so its buffers are not kept.
        av_frame_unref(frame);

        if(write_result<0){
            return write_result;
        }
    }

    return result;
}

int32_t demuxing(){

    int32_t result=0;

    while(av_read_frame(format_ctx,pkt)>=0){

        cout<<"Read packet,pts:"<<pkt->pts<<",stream:"<<pkt->stream_index<<",size:"<<pkt->size<<endl;

        if(pkt->stream_index==audio_stream_index){

            result= decode_packet(audio_dec_ctx,pkt,false);

        }

        else if(pkt->stream_index==video_stream_index){

            result= decode_packet(video_dec_ctx,pkt,false);

        }

        av_packet_unref(pkt);

        if(result<0){

            break;

        }

    }

    if(video_dec_ctx){

        decode_packet(video_dec_ctx, nullptr,true);

    }

    if(audio_dec_ctx){

        decode_packet(audio_dec_ctx, nullptr,true);

    }

    cout<<"Demuxing succeeded."<<endl;

    return 0;

}

三.将解码后的图像序列以及音频采样数据写入相应的文件

　　这个步骤比较简单，直接上代码。需要说明的是：视频帧按YUV420P的Y、U、V三个平面逐行写入.yuv文件（逐行写入是为了跳过linesize中可能存在的对齐填充字节），音频采样则按“各声道交错”（packed）的顺序写入.pcm文件：

/**
 * Append one decoded video frame to output_video_file as three raw planes.
 *
 * The frame is assumed to be planar 4:2:0 (e.g. YUV420P): plane 0 is written at
 * full resolution and planes 1 and 2 at half resolution, rounded up so that
 * odd frame dimensions still produce complete chroma planes.
 *
 * @param frame  Decoded frame; its data pointers are not modified.
 * @return 0 on success, -1 if the frame/output is missing or a write fails.
 */
int32_t write_frame_to_yuv(AVFrame* frame){
    if(!frame||!output_video_file){
        cerr<<"Error:no video frame or video output file."<<endl;
        return -1;
    }

    for(int plane=0;plane<3;plane++){
        const int32_t width=(plane==0?frame->width:(frame->width+1)/2);
        const int32_t height=(plane==0?frame->height:(frame->height+1)/2);

        // Walk a local cursor instead of advancing frame->data[] in place.
        const uint8_t *row=frame->data[plane];
        if(!row){
            cerr<<"Error:video frame has no data for plane "<<plane<<"."<<endl;
            return -1;
        }

        // Rows are written one by one because linesize may exceed the visible width.
        for(int32_t y=0;y<height;y++){
            const size_t row_bytes=static_cast<size_t>(width);
            if(fwrite(row,1,row_bytes,output_video_file)!=row_bytes){
                cerr<<"Error:failed to write video frame data."<<endl;
                return -1;
            }
            row+=frame->linesize[plane];
        }
    }

    return 0;
}

/**
 * Append the samples of one decoded audio frame to output_audio_file in
 * interleaved (packed) channel order.
 *
 * Planar frames are interleaved sample by sample; packed frames are already
 * interleaved and are written as one contiguous buffer.
 *
 * @param frame      Decoded audio frame.
 * @param codec_ctx  Decoder context supplying the sample format and channel count.
 * @return 0 on success, -1 if the sample size is unknown or a write fails.
 */
int32_t write_samples_to_pcm(AVFrame* frame,AVCodecContext* codec_ctx){
    // av_get_bytes_per_sample() returns 0, not a negative value, for an unknown format.
    const int data_size=av_get_bytes_per_sample(codec_ctx->sample_fmt);
    if(data_size<=0){
        cerr<<"Error:failed to calculate data size."<<endl;
        return -1;
    }
    const size_t sample_bytes=static_cast<size_t>(data_size);

    if(!av_sample_fmt_is_planar(codec_ctx->sample_fmt)){
        // Packed layout: all channels live interleaved in the first plane, and
        // the remaining plane pointers are not valid to read.
        const size_t total=static_cast<size_t>(frame->nb_samples)*static_cast<size_t>(codec_ctx->channels);
        if(fwrite(frame->extended_data[0],sample_bytes,total,output_audio_file)!=total){
            cerr<<"Error:failed to write audio samples."<<endl;
            return -1;
        }
        return 0;
    }

    // Planar layout: one plane per channel. extended_data is used because
    // data[] only has room for a fixed number of plane pointers.
    for(int i=0;i<frame->nb_samples;i++){
        for(int ch=0;ch<codec_ctx->channels;ch++){
            const uint8_t *sample=frame->extended_data[ch]+static_cast<size_t>(i)*sample_bytes;
            if(fwrite(sample,1,sample_bytes,output_audio_file)!=sample_bytes){
                cerr<<"Error:failed to write audio samples."<<endl;
                return -1;
            }
        }
    }

    return 0;
}

四.销毁资源，释放内存

void destroy_demuxer(){

    avcodec_free_context(&video_dec_ctx);

    avcodec_free_context(&audio_dec_ctx);

    avformat_close_input(&format_ctx);

    if(output_audio_file!= nullptr){

        fclose(output_audio_file);

        output_audio_file= nullptr;

    }

    if(output_video_file!= nullptr){

        fclose(output_video_file);

        output_video_file= nullptr;

    }

}

五.main函数

/**
 * Demux and decode ../input.mp4 into ../output.yuv and ../output.pcm.
 *
 * @return 0 on success, -1 if initialization or demuxing fails.
 */
int main(){
    int32_t result=init_demuxer("../input.mp4","../output.yuv","../output.pcm");
    if(result>=0){
        result=demuxing();
    }

    // Release resources on every path, including after a failed initialization.
    destroy_demuxer();

    return result<0?-1:0;
}

　　到这里，就大功告成了，可以使用以下的命令去播放输出的音视频文件（命令中的声道数、采样率、采样格式以及分辨率需要与输入文件的实际参数保持一致）：

　　ffplay -ac 2 -ar 44100 -f f32le -i output.pcm

　　ffplay -f rawvideo -video_size 1920x1080 -i output.yuv

如何将mp4文件解复用并且解码为单独的.yuv图像序列以及.pcm音频采样数据？的更多相关文章

音视频编解码问题：javaCV如何快速进行音频预处理和解复用编解码（基于javaCV-FFMPEG）
前言: 前面我用了很多章实现了javaCV的基本操作,包括:音视频捕捉(摄像头视频捕捉和话筒音频捕捉),推流(本地音视频或者摄像头话筒混合推流到服务器),转流(rtsp->rtmp),收流(录制 ...
JavaCV的摄像头实战之六：保存为mp4文件(有声音)
欢迎访问我的GitHub https://github.com/zq2599/blog_demos 内容:所有原创文章分类汇总及配套源码,涉及Java.Docker.Kubernetes.DevOPS ...
FFmpeg(2)-avformat_open_input()函数详解并示例打开mp4文件
一. 解封装 pts 是显示的时间 dts是解码的时间, 这个时间是用来做同步. av_register_all(), 注册所有的格式.包括解封装格式和加封装格式. avformat_network_ ...
mux复用 demux解复用
保存音频包: 直接输出解复用之后的的音频数据码流.只需要在每次调用av_read_frame()之后将得到的音频的AVPacket存为本地文件即可. 但在分离AAC码流的时候,直接存储AVPacket ...
解复用-mpeg2
http://blog.csdn.net/yipie/article/details/7612226 数字高清晰度电视(High Definition Television)简称HDTV,是继黑白电视 ...
嵌入式使用mp4v2将H264+AAC合成mp4文件
录制程序要添加新功能:录制CMMB电视节目,我们的板卡发送出来的是RTP流(H264视频和AAC音频),录制程序要做的工作是: (1)接收并解析RTP包,分离出H264和AAC数据流: (2)将H26 ...
嵌入式 H264—MP4格式及在MP4文件中提取H264的SPS、PPS及码流
一.MP4格式基本概念 MP4格式对应标准MPEG-4标准(ISO/IEC14496) 二.MP4封装格式核心概念 1 MP4封装格式对应标准为 ISO/IEC 14496-12(信息技术视听对象 ...
使用mp4v2将H264+AAC合成mp4文件
录制程序要添加新功能:录制CMMB电视节目,我们的板卡发送出来的是RTP流(H264视频和AAC音频),录制程序要做的工作是: (1)接收并解析RTP包,分离出H264和AAC数据流: (2)将H26 ...
【转】使用ffmpeg转码的MP4文件需要加载完了才能播放的解决办法
1.前一段时间做了一个ffmpeg转码MP4的项目,但是转出来的MP4部署在网站上需要把整个视频加载完成才能播放,到处找资料,最后找到解决方案记录于此备忘. FFMpeg转码由此得到的mp4文件中, ...
[转载]为什么有些MP4文件在Chrome浏览器上播放不了？
http://blog.sina.com.cn/s/blog_6bb7ebcc0101c2ja.html Chrome浏览器支持HTML5,它支持原生播放部分的MP4格式(不用通过Flash等插件). ...

随机推荐

python入门教程之十函数
函数是组织好的,可重复使用的,用来实现单一,或相关联功能的代码段. 函数能提高应用的模块性,和代码的重复利用率.你已经知道Python提供了许多内建函数,比如print().但你也可以自己创建函数,这 ...
开源Apinto网关-流量策略
背景介绍 Apinto是一款高性能.可扩展.易维护的API网关. Apinto网关基于GO语言模块化开发,5分钟极速部署,配置简单.易于维护,支持集群与动态扩容,企业级开箱即用.Apinto除了提供丰 ...
【深度学习】【图像分类网络】（二）VisionTransformer
Transformer简介 ![1png](file:///D:/资料/学习笔记/深度学习/图像分类/transformer/Self-Attention以及Multi-Head Attention/ ...
msp430点灯实验
title: msp430点灯实验 date: 2023-04-15 15:31:25 description: 基于msp430f5529点灯实验一.实验内容使用开发板:msp430f5529 ...
GDOU-CTF-2023新生赛Pwn题解与反思
第一次参加CTF新生赛总结与反思因为昨天学校那边要进行天梯模拟赛,所以被拉过去了.16点30分结束,就跑回来宿舍开始写.第一题和第二题一下子getshell,不用30分钟,可能我没想那么多,对比网上 ...
微信小程序隐藏页面滚动条
开发小程序时,经常会碰到页面长度超过屏幕高度,然后下拉时会出现滚动条,对于一些有强迫症的人来说是不可忍受的. 网上看了好多,写的.都评论有起作用或者不起作用的. 我在这分享一个全局隐藏滚动条的方式. ...
33-module
const { resolve } = require('path') const HtmlWebpackPlugin = require('html-webpack-plugin') module. ...
Lambda表达式和链式编程
一.Lambda表达式 1. Lambda使用条件 Lambda表达式是 JDK8 的一个新特性,可以认为是对匿名内部类的一种简化,但不是所有的匿名内部类都可以简化为Lambda表达式. 只有函数式接 ...
2022-12-01：从不订购的客户。找出所有从不订购任何东西的客户，以下数据的答案输出是Henry和Max，sql语句如何写？ DROP TABLE IF EXISTS `customers`； C
2022-12-01:从不订购的客户.找出所有从不订购任何东西的客户,以下数据的答案输出是Henry和Max,sql语句如何写? DROP TABLE IF EXISTS `customers`; C ...
vue全家桶进阶之路44：Vue3 Element Plus el_row和el_col组件
在 Vue 3 中,Element Plus 也提供了 ElRow 和 ElCol 组件,用于实现栅格布局. ElRow 组件的常用属性: gutter:栅格间距,默认为 0. type:布局模式,可 ...

如何将mp4文件解复用并且解码为单独的.yuv图像序列以及.pcm音频采样数据？

如何将mp4文件解复用并且解码为单独的.yuv图像序列以及.pcm音频采样数据？的更多相关文章

随机推荐

热门专题