FFmpeg视频解码尾部掉帧

《音视频文章汇总》
接触ffmpeg有一段时间了，现遇到一个视频解码尾部掉帧的问题，记录一下。缓冲区已经刷新过，但尾部还是少帧。虽然尾部少一两帧对视频整体效果没什么影响(一般视频一秒播放25帧)，但学东西就学透吧

FFmpeg从MP4文件中抽取yuv纯视频文件有两种方式

1.命令行工具ffmpeg直接抽取yuv文件

ffmpeg -i in.mp4 out_commandline.yuv

in.mp4文件是一个768x432,yuv420p,23fps的视频文件，抽取出来的yuv文件的总大小为115,955,712字节。yuv420p每帧占 宽*高*1.5 字节，因此可以计算出总帧数115955712/(768*432*1.5) = 233帧

image

通过代码解码mp4文件后，看生成的yuv文件大小是否和上述一致

2.通过代码解封装demux，分别获取音频pcm和视频yuv文件,有两个版本的代码

3.1以前的音视频编解码分别用
解码API
avcodec_decode_video2()
avcodec_decode_audio4()
编码API
avcodec_encode_video2()
avcodec_encode_audio2()
3.1之后的音视频编解码分别用
解码API
avcodec_send_packet()
avcodec_receive_frame()
编码API
avcodec_send_frame()
avcodec_receive_packet()

I.3.1版本之前的解封装demux代码官方示例程序为如下，解码自己的MP4文件只需更改文件路径

将官方代码抽取为C++一个类的类方法，传入本地in.mp4路径进行解码

image

传入本地路径

图片.png

image

/* Constructor with an empty body: no work is done at construction time. */
FFmpegs::FFmpegs()
{

}
/**
 * Decode the packet currently stored in the file-scope `pkt` and append the
 * decoded data to the raw video or raw audio output file.
 *
 * The decoder is chosen by comparing pkt.stream_index with video_stream_idx
 * and audio_stream_idx; a packet of any other stream is ignored.
 *
 * @param got_frame  receives non-zero when a frame was decoded, 0 otherwise
 * @param cached     non-zero while draining the decoder; only changes the log text
 * @return a negative value when decoding or buffer allocation fails,
 *         otherwise the non-negative result of the last libav call
 *         (0 when the packet belongs to neither stream)
 */
static int decode_packet(int *got_frame, int cached)
{
    int ret = 0;

    /* Give the out-parameter a defined value on every path. Without this a
     * packet that matches neither stream leaves the caller's variable
     * untouched, and a `do { ... } while (got_frame)` flush loop can spin
     * forever on a stale non-zero value. */
    *got_frame = 0;

    if (pkt.stream_index == video_stream_idx) {
        /* decode video frame */
        ret = avcodec_decode_video2(video_dec_ctx, frame, got_frame, &pkt);
        if (ret < 0) {
            fprintf(stderr, "Error decoding video frame\n");
            return ret;
        }
        if (*got_frame) {
            printf("video_frame%s n:%d coded_n:%d pts:%s\n",
                   cached ? "(cached)" : "",
                   video_frame_count++, frame->coded_picture_number,
                   av_ts2timestr(frame->pts, &video_dec_ctx->time_base));
            /* copy decoded frame to destination buffer:
             * this is required since rawvideo expects non aligned data */
            av_image_copy(video_dst_data, video_dst_linesize,
                          (const uint8_t **)(frame->data), frame->linesize,
                          video_dec_ctx->pix_fmt, video_dec_ctx->width, video_dec_ctx->height);
            /* write to rawvideo file */
            fwrite(video_dst_data[0], 1, video_dst_bufsize, video_dst_file);
        }
    } else if (pkt.stream_index == audio_stream_idx) {
        /* decode audio frame */
        ret = avcodec_decode_audio4(audio_dec_ctx, frame, got_frame, &pkt);
        if (ret < 0) {
            fprintf(stderr, "Error decoding audio frame\n");
            return ret;
        }
        if (*got_frame) {
            printf("audio_frame%s n:%d nb_samples:%d pts:%s\n",
                   cached ? "(cached)" : "",
                   audio_frame_count++, frame->nb_samples,
                   av_ts2timestr(frame->pts, &audio_dec_ctx->time_base));
            /* a packed (align = 1) scratch buffer is allocated per frame and
             * released again right after it has been written */
            ret = av_samples_alloc(audio_dst_data, &audio_dst_linesize, av_frame_get_channels(frame),
                                   frame->nb_samples, (AVSampleFormat)frame->format, 1);
            if (ret < 0) {
                fprintf(stderr, "Could not allocate audio buffer\n");
                return AVERROR(ENOMEM);
            }
            /* TODO: extend return code of the av_samples_* functions so that this call is not needed */
            audio_dst_bufsize =
                av_samples_get_buffer_size(NULL, av_frame_get_channels(frame),
                                           frame->nb_samples, (AVSampleFormat)frame->format, 1);
            /* copy audio data to destination buffer:
             * this is required since rawaudio expects non aligned data */
            av_samples_copy(audio_dst_data, frame->data, 0, 0,
                            frame->nb_samples, av_frame_get_channels(frame), (AVSampleFormat)frame->format);
            /* write to rawaudio file (only the first plane is written) */
            fwrite(audio_dst_data[0], 1, audio_dst_bufsize, audio_dst_file);
            av_freep(&audio_dst_data[0]);
        }
    }
    return ret;
}
static int open_codec_context(int *stream_idx,
                              AVFormatContext *fmt_ctx, enum AVMediaType type)
{
    int ret;
    AVStream *st;
    AVCodecContext *dec_ctx = NULL;
    AVCodec *dec = NULL;
    ret = av_find_best_stream(fmt_ctx, type, -1, -1, NULL, 0);
    if (ret < 0) {
        fprintf(stderr, "Could not find %s stream in input file '%s'\n",
                av_get_media_type_string(type), src_filename);
        return ret;
    } else {
        *stream_idx = ret;
        st = fmt_ctx->streams[*stream_idx];
        /* find decoder for the stream */
        dec_ctx = st->codec;
        dec = avcodec_find_decoder(dec_ctx->codec_id);
        if (!dec) {
            fprintf(stderr, "Failed to find %s codec\n",
                    av_get_media_type_string(type));
            return ret;
        }
        if ((ret = avcodec_open2(dec_ctx, dec, NULL)) < 0) {
            fprintf(stderr, "Failed to open %s codec\n",
                    av_get_media_type_string(type));
            return ret;
        }
    }
    return 0;
}
/**
 * Map a packed sample format to the raw-format name used on the ffplay
 * command line (e.g. "s16le"), picking the big- or little-endian spelling
 * through AV_NE.
 *
 * @param fmt         receives the format name, or NULL when unsupported
 * @param sample_fmt  sample format to translate
 * @return 0 when a name was found, -1 otherwise (a message is printed)
 */
static int get_format_from_sample_fmt(const char **fmt,
                                      enum AVSampleFormat sample_fmt)
{
    struct sample_fmt_entry {
        enum AVSampleFormat sample_fmt;
        const char *fmt_be;
        const char *fmt_le;
    };
    const struct sample_fmt_entry known_formats[] = {
        { AV_SAMPLE_FMT_U8,  "u8",    "u8"    },
        { AV_SAMPLE_FMT_S16, "s16be", "s16le" },
        { AV_SAMPLE_FMT_S32, "s32be", "s32le" },
        { AV_SAMPLE_FMT_FLT, "f32be", "f32le" },
        { AV_SAMPLE_FMT_DBL, "f64be", "f64le" },
    };
    const struct sample_fmt_entry *const last =
        known_formats + FF_ARRAY_ELEMS(known_formats);

    *fmt = NULL;

    /* linear scan; the table only lists the packed formats */
    for (const struct sample_fmt_entry *cur = known_formats; cur != last; ++cur) {
        if (cur->sample_fmt != sample_fmt)
            continue;
        *fmt = AV_NE(cur->fmt_be, cur->fmt_le);
        return 0;
    }

    fprintf(stderr,
            "sample format %s is not supported as output format\n",
            av_get_sample_fmt_name(sample_fmt));
    return -1;
}
/**
 * Demux the hard-coded input file, decode its best video and audio streams
 * and write them to a raw .yuv file and a raw .pcm file respectively.
 *
 * All state lives in the file-scope variables (fmt_ctx, pkt, frame, ...).
 * Failure to open the input or to read stream information terminates the
 * process with exit(1); later failures jump to the common cleanup at `end`.
 */
void FFmpegs::demuxer(){
    int ret = 0;
    /* initialised so the flush loops never test an indeterminate value */
    int got_frame = 0;
    src_filename = "/Users/cloud/Documents/iOS/音视频/TestMusic/Demux/video2/in.mp4";
    video_dst_filename = "/Users/cloud/Documents/iOS/音视频/TestMusic/Demux/video2/out_video2.yuv";
    audio_dst_filename = "/Users/cloud/Documents/iOS/音视频/TestMusic/Demux/video2/out_video2.pcm";
    /* register all formats and codecs */
    av_register_all();
    /* open input file, and allocate format context */
    if (avformat_open_input(&fmt_ctx, src_filename, NULL, NULL) < 0) {
        fprintf(stderr, "Could not open source file %s\n", src_filename);
        exit(1);
    }
    /* retrieve stream information */
    if (avformat_find_stream_info(fmt_ctx, NULL) < 0) {
        fprintf(stderr, "Could not find stream information\n");
        exit(1);
    }
    if (open_codec_context(&video_stream_idx, fmt_ctx, AVMEDIA_TYPE_VIDEO) >= 0) {
        video_stream = fmt_ctx->streams[video_stream_idx];
        video_dec_ctx = video_stream->codec;
        video_dst_file = fopen(video_dst_filename, "wb");
        if (!video_dst_file) {
            fprintf(stderr, "Could not open destination file %s\n", video_dst_filename);
            ret = 1;
            goto end;
        }
        /* allocate image where the decoded image will be put */
        ret = av_image_alloc(video_dst_data, video_dst_linesize,
                             video_dec_ctx->width, video_dec_ctx->height,
                             video_dec_ctx->pix_fmt, 1);
        if (ret < 0) {
            fprintf(stderr, "Could not allocate raw video buffer\n");
            goto end;
        }
        /* av_image_alloc returns the size of the allocated buffer */
        video_dst_bufsize = ret;
    }
    if (open_codec_context(&audio_stream_idx, fmt_ctx, AVMEDIA_TYPE_AUDIO) >= 0) {
        int nb_planes;
        audio_stream = fmt_ctx->streams[audio_stream_idx];
        audio_dec_ctx = audio_stream->codec;
        audio_dst_file = fopen(audio_dst_filename, "wb");
        if (!audio_dst_file) {
            /* report the audio path, not the video one */
            fprintf(stderr, "Could not open destination file %s\n", audio_dst_filename);
            ret = 1;
            goto end;
        }
        /* one plane pointer per channel for planar formats, a single one otherwise */
        nb_planes = av_sample_fmt_is_planar(audio_dec_ctx->sample_fmt) ?
            audio_dec_ctx->channels : 1;
        audio_dst_data = (uint8_t **)av_mallocz(sizeof(uint8_t *) * nb_planes);
        if (!audio_dst_data) {
            fprintf(stderr, "Could not allocate audio data buffers\n");
            ret = AVERROR(ENOMEM);
            goto end;
        }
    }
    /* dump input information to stderr */
    av_dump_format(fmt_ctx, 0, src_filename, 0);
    if (!audio_stream && !video_stream) {
        fprintf(stderr, "Could not find audio or video stream in the input, aborting\n");
        ret = 1;
        goto end;
    }
    frame = av_frame_alloc();
    if (!frame) {
        fprintf(stderr, "Could not allocate frame\n");
        ret = AVERROR(ENOMEM);
        goto end;
    }
    /* initialize packet, set data to NULL, let the demuxer fill it */
    av_init_packet(&pkt);
    pkt.data = NULL;
    pkt.size = 0;
    if (video_stream)
        printf("Demuxing video from file '%s' into '%s'\n", src_filename, video_dst_filename);
    if (audio_stream)
        printf("Demuxing audio from file '%s' into '%s'\n", src_filename, audio_dst_filename);
    /* read frames from the file */
    while (av_read_frame(fmt_ctx, &pkt) >= 0) {
        decode_packet(&got_frame, 0);
        av_free_packet(&pkt);
    }
    /* flush cached frames: feed empty packets (data NULL, size 0).
     * decode_packet dispatches on pkt.stream_index, so each opened decoder
     * is selected explicitly instead of relying on whatever index was left
     * in pkt after the read loop. */
    pkt.data = NULL;
    pkt.size = 0;
    if (video_stream) {
        pkt.stream_index = video_stream_idx;
        do {
            if (decode_packet(&got_frame, 1) < 0)
                break;
        } while (got_frame);
    }
    if (audio_stream) {
        pkt.stream_index = audio_stream_idx;
        do {
            if (decode_packet(&got_frame, 1) < 0)
                break;
        } while (got_frame);
    }

    printf("Demuxing succeeded.\n");
    if (video_stream) {
        printf("Play the output video file with the command:\n"
               "ffplay -f rawvideo -pix_fmt %s -video_size %dx%d %s\n",
               av_get_pix_fmt_name(video_dec_ctx->pix_fmt), video_dec_ctx->width, video_dec_ctx->height,
               video_dst_filename);
    }
    if (audio_stream) {
        const char *fmt;
        if ((ret = get_format_from_sample_fmt(&fmt, audio_dec_ctx->sample_fmt)) < 0)
            goto end;
        printf("Play the output audio file with the command:\n"
               "ffplay -f %s -ac %d -ar %d %s\n",
               fmt, audio_dec_ctx->channels, audio_dec_ctx->sample_rate,
               audio_dst_filename);
    }
end:
    if (video_dec_ctx)
        avcodec_close(video_dec_ctx);
    if (audio_dec_ctx)
        avcodec_close(audio_dec_ctx);
    avformat_close_input(&fmt_ctx);
    if (video_dst_file)
        fclose(video_dst_file);
    if (audio_dst_file)
        fclose(audio_dst_file);
    /* frames from av_frame_alloc() are released with av_frame_free(), which
     * also resets the pointer to NULL */
    av_frame_free(&frame);
    av_free(video_dst_data[0]);
    av_free(audio_dst_data);
}

此时解码出来的yuv文件大小为115,458,048字节，115458048/(768*432*1.5)计算出帧数为232帧

image

通过使用YuvEye工具对比命令行生成的YUV文件和代码生成的YUV文件发现尾部少了一帧，YuvEye比对工具从第0帧开始，官方示例代码里面也已经刷新缓冲区了，为何还是少最后一帧呢

image

google搜索答案，看到这样一篇博文ffmpeg视频解码丢帧问题里面说的丢帧的原因是

读取的AVPacket都有pts和dts两个属性，往复杂了说视频帧类型有I/P/B等种类，我们就以简单的方式说，PTS是图像的展示时间，DTS是图像的解码时间，问题就来了，由于视频帧类型，很多时候，PTS基本都是按顺序的，但是DTS却不是，也就是说这个包的解码时候需要在下个包解码之后解码，所以此次就不能解码，因此获取不到视频帧，数据被缓存了，如果之后不去主动去取，那就真的丢了。

// Typical read/decode loop: every demuxed video packet is handed to the decoder.
// Nothing is fed to the decoder after this loop ends, so any frames it is
// still holding at end of file are never retrieved.
while( av_read_frame(format_ctx_, &packet) >= 0 ) {
    if( packet.stream_index == video_stream_index_ ) {
        avcodec_decode_video2(codec_ctx_, frame, &frameFinished, &packet);
        // frameFinished is non-zero only when this call produced a picture
        if( frameFinished ) {
            //...
        }
    }

    av_free_packet(&packet);
}

以上的代码基本就是常见的使用场景，基本上文件的最后几帧已经丢失了，虽然很多时候不是太重要，可以忽略，毕竟几帧数据在很大帧率下所占的时间很小。如果需要的话，那如何找回来呢，简单的办法就是继续空包读取即可

给出的解决方案：记录丢掉了多少帧次数，在正常帧读取完毕后，进行空帧读取，读取空帧的次数就是记录的丢掉的帧的次数，这样总数加起来能保持不变，代码模板如下

注意，空包解码的时候必须是packet的data为NULL,size为0。

while( av_read_frame(format_ctx_, &packet) >= 0 ) {
    if( packet.stream_index == video_stream_index_ ) {
        avcodec_decode_video2(codec_ctx_, frame.get(), &frameFinished, &packet);
        if( frameFinished ) {   
            //...
        } else {
            total_skip++;
        }
    }

    av_free_packet(&packet);
}
    
while(total_skip--) {
    avcodec_decode_video2(codec_ctx_, frame.get(), &frameFinished, &packet);
    if( frameFinished ) {
        //...
    }
}

在代码中实现丢帧的空帧读取，这个操作就包含了刷新缓冲区的概念，记录跳跃帧的次数，最后再次读取跳跃帧次数次帧

image

于是喜出望外，请身边人喝了三瓶可口可乐，以为发现了规律总帧数=正常读取帧+缓冲区帧数+跳跃次数=230+1+2=233，正好为总帧数=YUV420P,768x432文件总大小115955712字节/(768*432*1.5)=233帧

实质后面发现缓冲区中存在2帧，与前面缓冲区中存在一帧不一致

image

再次用两个mp4文件调试,一个mp4文件是568x320,YUV420P,发现如下：命令行生成的yuv文件总大小为66524160字节/(568*320*1.5) = 244帧，好像也满足上面的规律

图片.png

image

再次换一个30秒的mp4文件768x432,YUV420P,命令行生成的文件总大小为344881152字节/(768x432*1.5) = 693帧，此文件就不符合总帧数693=正常读取帧690+缓冲区帧数2+跳跃次数2的规律了，690+2+2=694帧多出1帧

image

再次换一个60秒的mp4文件768x432,YUV420P,命令行生成的宽高768x432,YUV420P文件的总大小为689264640字节/(768x432*1.5)= 1385帧，此文件就不符合规律了1380+2+6=1388就多出两帧了

image

临时解决办法:多帧要比少帧好，就是最后文件中的数据因为是正常帧+缓冲区的帧+跳跃次数帧=得到的总帧数，可能会比实际帧数多，但总比缺帧好，先暂时找到的不是办法的办法，后面理清楚H264的编码原理后再找解决办法

跳跃帧次数+正常帧+缓冲区帧数>=总帧数
230+2+2=234
116453376/(768*432*1.5)=234帧

image

代码逻辑如下

image

#include "ffmpegs.h"
#include <QDebug>
/* File-scope state shared by decode_packet(), open_codec_context() and
 * FFmpegs::demuxer(). */
static AVFormatContext *fmt_ctx = NULL;
static AVCodecContext *video_dec_ctx = NULL, *audio_dec_ctx;
static AVStream *video_stream = NULL, *audio_stream = NULL;
static const char *src_filename = NULL;
static const char *video_dst_filename = NULL;
static const char *audio_dst_filename = NULL;
static FILE *video_dst_file = NULL;
static FILE *audio_dst_file = NULL;
/* destination image buffer filled by av_image_alloc() / av_image_copy() */
static uint8_t *video_dst_data[4] = {NULL};
static int      video_dst_linesize[4];
static int video_dst_bufsize;
/* per-plane pointers for the temporary audio output buffer */
static uint8_t **audio_dst_data = NULL;
static int       audio_dst_linesize;
static int audio_dst_bufsize;
static int video_stream_idx = -1, audio_stream_idx = -1;
static AVFrame *frame = NULL;
static AVPacket pkt;
static int video_frame_count = 0;
static int audio_frame_count = 0;
static int videoFrameIdx = 0;
static int audioFrameIdx = 0;
// number of video decode calls that returned no frame ("skips") before tail flushing started
static int skipFrameIdx = 0;

// number of frames written during the tail skip-compensation phase
static int skipFrameWriteIdx = 0;
// set to 1 once tail flushing starts, so that skips at the beginning are not written out
static int isEndFrame = 0;
// number of frames obtained while flushing the decoder after normal reading finished
static int flushFrameIdx = 0;
// set to 1 while the tail skip-compensation phase is running
static int isSkipFrame = 0;
/* Constructor with an empty body: no work is done at construction time. */
FFmpegs::FFmpegs()
{

}
static int decode_packet(int *got_frame, int cached)
{
    int ret = 0;
    if (pkt.stream_index == video_stream_idx) {
        /* decode video frame */
        ret = avcodec_decode_video2(video_dec_ctx, frame, got_frame, &pkt);
        if(isEndFrame == 1) qDebug() << "尾部帧刷新后解码器返回值:" << ret << *got_frame << &pkt;
        if (ret < 0) {
            fprintf(stderr, "Error decoding video frame\n");
            return ret;
        }
        if (*got_frame) {
            qDebug() << "正常视频帧:" << ++video_frame_count << "帧宽度:" << frame->width;
            if(isEndFrame == 1){//如果是尾部刷新缓冲区记录下刷新缓冲区刷新了多少帧
                flushFrameIdx++;
                qDebug() << "缓冲区刷新了多少帧" << flushFrameIdx;
            }
            printf("视频帧-------video_frame%s n:%d coded_n:%d pts:%s\n",
                   cached ? "(cached)" : "",
                   video_frame_count, frame->coded_picture_number,
                   av_ts2timestr(frame->pts, &video_dec_ctx->time_base));
            /* copy decoded frame to destination buffer:
             * this is required since rawvideo expects non aligned data */
            av_image_copy(video_dst_data, video_dst_linesize,
                          (const uint8_t **)(frame->data), frame->linesize,
                          video_dec_ctx->pix_fmt, video_dec_ctx->width, video_dec_ctx->height);
            /* write to rawvideo file */
            fwrite(video_dst_data[0], 1, video_dst_bufsize, video_dst_file);
        }else{
            if(isEndFrame==0){//不是尾部刷新缓冲区进入才计算跳跃次数
                skipFrameIdx++;
                qDebug() << "当前pkt的值" << &pkt << "帧宽度:" << frame->width << "--跳跃次数--" << skipFrameIdx;
            }
            else{//是尾部跳跃帧数进来，将尾部帧写入文件尾部
                if(isSkipFrame == 1){
                    qDebug() << "got_frame写入帧为0，写入跳跃帧次数" << ++skipFrameWriteIdx;
                    av_image_copy(video_dst_data, video_dst_linesize,
                                  (const uint8_t **)(frame->data), frame->linesize,
                                  video_dec_ctx->pix_fmt, video_dec_ctx->width, video_dec_ctx->height);
                    fwrite(video_dst_data[0], 1, video_dst_bufsize, video_dst_file);
                }
            }
        }
    }
    else if (pkt.stream_index == audio_stream_idx) {
        /* decode audio frame */
        ret = avcodec_decode_audio4(audio_dec_ctx, frame, got_frame, &pkt);
        if (ret < 0) {
            fprintf(stderr, "Error decoding audio frame\n");
            return ret;
        }
        if (*got_frame) {
            printf("音频帧--------audio_frame%s n:%d nb_samples:%d pts:%s\n",
                   cached ? "(cached)" : "",
                   audio_frame_count++, frame->nb_samples,
                   av_ts2timestr(frame->pts, &audio_dec_ctx->time_base));
            ret = av_samples_alloc(audio_dst_data, &audio_dst_linesize, av_frame_get_channels(frame),
                                   frame->nb_samples, (AVSampleFormat)frame->format, 1);
            if (ret < 0) {
                fprintf(stderr, "Could not allocate audio buffer\n");
                return AVERROR(ENOMEM);
            }
            /* TODO: extend return code of the av_samples_* functions so that this call is not needed */
            audio_dst_bufsize =
                av_samples_get_buffer_size(NULL, av_frame_get_channels(frame),
                                           frame->nb_samples, (AVSampleFormat)frame->format, 1);
            /* copy audio data to destination buffer:
             * this is required since rawaudio expects non aligned data */
            av_samples_copy(audio_dst_data, frame->data, 0, 0,
                            frame->nb_samples, av_frame_get_channels(frame), (AVSampleFormat)frame->format);
            /* write to rawaudio file */
            printf("单次写入音频帧的大小 %d\n写了多少次 %d",audio_dst_bufsize,++audioFrameIdx);
            fwrite(audio_dst_data[0], 1, audio_dst_bufsize, audio_dst_file);
            av_freep(&audio_dst_data[0]);
        }
    }
    return ret;
}
static int open_codec_context(int *stream_idx,
                              AVFormatContext *fmt_ctx, enum AVMediaType type)
{
    int ret;
    AVStream *st;
    AVCodecContext *dec_ctx = NULL;
    AVCodec *dec = NULL;
    ret = av_find_best_stream(fmt_ctx, type, -1, -1, NULL, 0);
    if (ret < 0) {
        fprintf(stderr, "Could not find %s stream in input file '%s'\n",
                av_get_media_type_string(type), src_filename);
        return ret;
    } else {
        *stream_idx = ret;
        st = fmt_ctx->streams[*stream_idx];
        /* find decoder for the stream */
        dec_ctx = st->codec;
        dec = avcodec_find_decoder(dec_ctx->codec_id);
        if (!dec) {
            fprintf(stderr, "Failed to find %s codec\n",
                    av_get_media_type_string(type));
            return ret;
        }
        if ((ret = avcodec_open2(dec_ctx, dec, NULL)) < 0) {
            fprintf(stderr, "Failed to open %s codec\n",
                    av_get_media_type_string(type));
            return ret;
        }
    }
    return 0;
}
/**
 * Map a packed sample format to the raw-format name used on the ffplay
 * command line (e.g. "s16le"), picking the big- or little-endian spelling
 * through AV_NE.
 *
 * @param fmt         receives the format name, or NULL when unsupported
 * @param sample_fmt  sample format to translate
 * @return 0 when a name was found, -1 otherwise (a message is printed)
 */
static int get_format_from_sample_fmt(const char **fmt,
                                      enum AVSampleFormat sample_fmt)
{
    struct sample_fmt_entry {
        enum AVSampleFormat sample_fmt;
        const char *fmt_be;
        const char *fmt_le;
    };
    const struct sample_fmt_entry known_formats[] = {
        { AV_SAMPLE_FMT_U8,  "u8",    "u8"    },
        { AV_SAMPLE_FMT_S16, "s16be", "s16le" },
        { AV_SAMPLE_FMT_S32, "s32be", "s32le" },
        { AV_SAMPLE_FMT_FLT, "f32be", "f32le" },
        { AV_SAMPLE_FMT_DBL, "f64be", "f64le" },
    };
    const struct sample_fmt_entry *const last =
        known_formats + FF_ARRAY_ELEMS(known_formats);

    *fmt = NULL;

    /* linear scan; the table only lists the packed formats */
    for (const struct sample_fmt_entry *cur = known_formats; cur != last; ++cur) {
        if (cur->sample_fmt != sample_fmt)
            continue;
        *fmt = AV_NE(cur->fmt_be, cur->fmt_le);
        return 0;
    }

    fprintf(stderr,
            "sample format %s is not supported as output format\n",
            av_get_sample_fmt_name(sample_fmt));
    return -1;
}
/**
 * Demux the hard-coded input file, decode its best video and audio streams
 * and write them to a raw .yuv file and a raw .pcm file respectively.
 *
 * After normal reading the video decoder is flushed with empty packets and
 * then called once more for every "skip" counted by decode_packet() (the
 * article's tail-compensation workaround).
 *
 * All state lives in the file-scope variables (fmt_ctx, pkt, frame, ...).
 * Failure to open the input or to read stream information terminates the
 * process with exit(1); later failures jump to the common cleanup at `end`.
 */
void FFmpegs::demuxer(){
    int ret = 0;
    /* initialised so the flush loops and the log line below never read an
     * indeterminate value */
    int got_frame = 0;
    src_filename = "/Users/cloud/Documents/iOS/音视频/TestMusic/Demux/in.mp4";
    video_dst_filename = "/Users/cloud/Documents/iOS/音视频/TestMusic/Demux/out_video2_optimize.yuv";
    audio_dst_filename = "/Users/cloud/Documents/iOS/音视频/TestMusic/Demux/out_video2_optimize.pcm";
    /* register all formats and codecs */
    av_register_all();
    /* open input file, and allocate format context */
    if (avformat_open_input(&fmt_ctx, src_filename, NULL, NULL) < 0) {
        fprintf(stderr, "Could not open source file %s\n", src_filename);
        exit(1);
    }
    /* retrieve stream information */
    if (avformat_find_stream_info(fmt_ctx, NULL) < 0) {
        fprintf(stderr, "Could not find stream information\n");
        exit(1);
    }
    if (open_codec_context(&video_stream_idx, fmt_ctx, AVMEDIA_TYPE_VIDEO) >= 0) {
        video_stream = fmt_ctx->streams[video_stream_idx];
        video_dec_ctx = video_stream->codec;
        video_dst_file = fopen(video_dst_filename, "wb");
        if (!video_dst_file) {
            fprintf(stderr, "Could not open destination file %s\n", video_dst_filename);
            ret = 1;
            goto end;
        }
        /* allocate image where the decoded image will be put */
        ret = av_image_alloc(video_dst_data, video_dst_linesize,
                             video_dec_ctx->width, video_dec_ctx->height,
                             video_dec_ctx->pix_fmt, 1);
        if (ret < 0) {
            fprintf(stderr, "Could not allocate raw video buffer\n");
            goto end;
        }
        /* av_image_alloc returns the size of the allocated buffer */
        video_dst_bufsize = ret;
    }
    if (open_codec_context(&audio_stream_idx, fmt_ctx, AVMEDIA_TYPE_AUDIO) >= 0) {
        int nb_planes;
        audio_stream = fmt_ctx->streams[audio_stream_idx];
        audio_dec_ctx = audio_stream->codec;
        audio_dst_file = fopen(audio_dst_filename, "wb");
        if (!audio_dst_file) {
            /* report the audio path, not the video one */
            fprintf(stderr, "Could not open destination file %s\n", audio_dst_filename);
            ret = 1;
            goto end;
        }
        /* one plane pointer per channel for planar formats, a single one otherwise */
        nb_planes = av_sample_fmt_is_planar(audio_dec_ctx->sample_fmt) ?
            audio_dec_ctx->channels : 1;
        audio_dst_data = (uint8_t **)av_mallocz(sizeof(uint8_t *) * nb_planes);
        if (!audio_dst_data) {
            fprintf(stderr, "Could not allocate audio data buffers\n");
            ret = AVERROR(ENOMEM);
            goto end;
        }
    }
    /* dump input information to stderr */
    av_dump_format(fmt_ctx, 0, src_filename, 0);
    if (!audio_stream && !video_stream) {
        fprintf(stderr, "Could not find audio or video stream in the input, aborting\n");
        ret = 1;
        goto end;
    }
    frame = av_frame_alloc();
    if (!frame) {
        fprintf(stderr, "Could not allocate frame\n");
        ret = AVERROR(ENOMEM);
        goto end;
    }
    /* initialize packet, set data to NULL, let the demuxer fill it */
    av_init_packet(&pkt);
    pkt.data = NULL;
    pkt.size = 0;
    if (video_stream)
        printf("Demuxing video from file '%s' into '%s'\n", src_filename, video_dst_filename);
    if (audio_stream)
        printf("Demuxing audio from file '%s' into '%s'\n", src_filename, audio_dst_filename);
    /* read frames from the file */
    // working hypothesis: skip count + normally decoded frames + flushed frames >= total frames
    // phase 1: normally decoded frames
    while (av_read_frame(fmt_ctx, &pkt) >= 0) {
        decode_packet(&got_frame, 0);
        av_free_packet(&pkt);
    }
    /* flush cached frames: feed empty packets (data NULL, size 0).
     * decode_packet dispatches on pkt.stream_index, so each opened decoder
     * is selected explicitly instead of relying on whatever index was left
     * in pkt after the read loop. */
    pkt.data = NULL;
    pkt.size = 0;
    if (video_stream) {
        pkt.stream_index = video_stream_idx;
        // phase 2: frames still buffered inside the video decoder
        do {
            qDebug() << "进入刷新缓冲区空帧读取" << got_frame;
            isEndFrame = 1;
            if (decode_packet(&got_frame, 1) < 0)
                break;
        } while (got_frame);
        // phase 3: one extra call per skip counted during phase 1.
        // NOTE(review): decode_packet writes `frame` again on each of these
        // calls even when the decoder reports no new frame, so the output can
        // end up with more frames than the input contains.
        while(skipFrameIdx--){
            isSkipFrame = 1;
            qDebug() << "进入跳跃帧读取" << skipFrameIdx;
            decode_packet(&got_frame, 1);
        }
    }
    if (audio_stream) {
        pkt.stream_index = audio_stream_idx;
        do {
            if (decode_packet(&got_frame, 1) < 0)
                break;
        } while (got_frame);
    }
    printf("Demuxing succeeded.\n");
    if (video_stream) {
        printf("Play the output video file with the command:\n"
               "ffplay -f rawvideo -pix_fmt %s -video_size %dx%d %s\n",
               av_get_pix_fmt_name(video_dec_ctx->pix_fmt), video_dec_ctx->width, video_dec_ctx->height,
               video_dst_filename);
    }
    if (audio_stream) {
        const char *fmt;
        if ((ret = get_format_from_sample_fmt(&fmt, audio_dec_ctx->sample_fmt)) < 0)
            goto end;
        printf("Play the output audio file with the command:\n"
               "ffplay -f %s -ac %d -ar %d %s\n",
               fmt, audio_dec_ctx->channels, audio_dec_ctx->sample_rate,
               audio_dst_filename);
    }
end:
    if (video_dec_ctx)
        avcodec_close(video_dec_ctx);
    if (audio_dec_ctx)
        avcodec_close(audio_dec_ctx);
    avformat_close_input(&fmt_ctx);
    if (video_dst_file)
        fclose(video_dst_file);
    if (audio_dst_file)
        fclose(audio_dst_file);
    /* frames from av_frame_alloc() are released with av_frame_free(), which
     * also resets the pointer to NULL */
    av_frame_free(&frame);
    av_free(video_dst_data[0]);
    av_free(audio_dst_data);
}

II.新版本的解码代码如何优化呢

avcodec_send_packet和avcodec_receive_frame代码中没有got_frame标识是否获取到了完整一帧，不知道跳跃了多少次

H264编码的原理是：I帧P帧B帧混合组成，P帧的编解码要依赖前面的I帧或P帧，B帧的编解码要依赖前后的I帧或P帧。若文件最后的数据是B帧，那么它的解码要依赖后面的I帧或P帧，会导致最后的几帧无法解码出来

3.还有一个问题，ffprobe命令检测出来的帧数和命令行生成的实际帧数也不一致,命令行生成的yuv文件为233帧，ffprobe检测出来为232帧，ffprobe检测出来的总是少几帧

ffprobe -v error -count_frames -select_streams v:0 -show_entries stream=nb_read_frames -of default=nokey=1:noprint_wrappers=1 input.mp4

图片.png

未完待续。。。

GitHub上ffmpeg官方补丁地址patch
查阅文档《H.264编码》
I帧，P帧，B帧的本质

I帧（I Picture、I Frame、Intra Coded Picture），译为：帧内编码图像，也叫做关键帧（Keyframe）
是视频的第一帧，也是GOP的第一帧，一个GOP只有一个I帧
编码
对整帧图像数据进行编码
解码
仅用当前I帧的编码数据就可以解码出完整的图像
是一种自带全部信息的独立帧，无需参考其他图像便可独立进行解码，可以简单理解为一张静态图像

P帧（P Picture、P Frame、Predictive Coded Picture），译为：预测编码图像
编码
并不会对整帧图像数据进行编码
以前面的I帧或P帧作为参考帧，只编码当前P帧与参考帧的差异数据
解码
需要先解码出前面的参考帧，再结合差异数据解码出当前P帧完整的图像

B帧（B Picture、B Frame、Bipredictive Coded Picture），译为：前后预测编码图像
编码
并不会对整帧图像数据进行编码
同时以前面、后面的I帧或P帧作为参考帧，只编码当前B帧与前后参考帧的差异数据
因为可参考的帧变多了，所以只需要存储更少的差异数据
解码
需要先解码出前后的参考帧，再结合差异数据解码出当前B帧完整的图像

最后编辑于：2021.07.15 10:46:19

人面猴
序言：七十年代末，一起剥皮案震惊了整个滨河市，随后出现的几起案子，更是在滨河造成了极大的恐慌，老刑警刘岩，带你破解...
沈念sama阅读 158,736评论 4赞 362
死咒
序言：滨河连续发生了三起死亡事件，死亡现场离奇诡异，居然都是意外死亡，警方通过查阅死者的电脑和手机，发现死者居然都...
沈念sama阅读 67,167评论 1赞 291
救了他两次的神仙让他今天三更去死
文/潘晓璐我一进店门，熙熙楼的掌柜王于贵愁眉苦脸地迎上来，“玉大人，你说我怎么就摊上这事。” “怎么了？”我有些...
开封第一讲书人阅读 108,442评论 0赞 243
道士缉凶录：失踪的卖姜人
文/不坏的土叔我叫张陵，是天一观的道长。经常有香客问我，道长，这世上最难降的妖魔是什么？我笑而不...
开封第一讲书人阅读 43,902评论 0赞 204
港岛之恋（遗憾婚礼）
正文为了忘掉前任，我火速办了婚礼，结果婚礼上，老公的妹妹穿的比我还像新娘。我一直安慰自己，他们只是感情好，可当我...
茶点故事阅读 52,302评论 3赞 287
恶毒庶女顶嫁案：这布局不是一般人想出来的
文/花漫我一把揭开白布。她就那样静静地躺着，像睡着了一般。火红的嫁衣衬着肌肤如雪。梳的纹丝不乱的头发上，一...
开封第一讲书人阅读 40,573评论 1赞 216
城市分裂传说
那天，我揣着相机与录音，去河边找鬼。笑死，一个胖子当着我的面吹牛，可吹牛的内容都是我干的。我是一名探鬼主播，决...
沈念sama阅读 31,847评论 2赞 312
双鸳鸯连环套：你想象不到人心有多黑
文/苍兰香墨我猛地睁开眼，长吁一口气：“原来是场噩梦啊……” “哼！你这毒妇竟也来了？” 一声冷哼从身侧响起，我...
开封第一讲书人阅读 30,562评论 0赞 197
万荣杀人案实录
序言：老挝万荣一对情侣失踪，失踪者是张志新（化名）和其女友刘颖，没想到半个月后，有当地人在树林里发现了一具尸体，经...
沈念sama阅读 34,260评论 1赞 241
护林员之死
正文独居荒郊野岭守林人离奇死亡，尸身上长有42处带血的脓包…… 初始之章·张勋以下内容为张勋视角年9月15日...
茶点故事阅读 30,531评论 2赞 245
白月光启示录
正文我和宋清朗相恋三年，在试婚纱的时候发现自己被绿了。大学时的朋友给我发了我未婚夫和他白月光在一起吃饭的照片。...
茶点故事阅读 32,021评论 1赞 258
活死人
序言：一个原本活蹦乱跳的男人离奇死亡，死状恐怖，灵堂内的尸体忽然破棺而出，到底是诈尸还是另有隐情，我是刑警宁泽，带...
沈念sama阅读 28,367评论 2赞 253
日本核电站爆炸内幕
正文年R本政府宣布，位于F岛的核电站，受9级特大地震影响，放射性物质发生泄漏。R本人自食恶果不足惜，却给世界环境...
茶点故事阅读 33,016评论 3赞 235
男人毒药：我在死后第九天来索命
文/蒙蒙一、第九天我趴在偏房一处隐蔽的房顶上张望。院中可真热闹，春花似锦、人声如沸。这庄子的主人今日做“春日...
开封第一讲书人阅读 26,068评论 0赞 8
一桩弑父案，背后竟有这般阴谋
文/苍兰香墨我抬头看了看天上的太阳。三九已至，却和暖如春，着一层夹袄步出监牢的瞬间，已是汗流浃背。一阵脚步声响...
开封第一讲书人阅读 26,827评论 0赞 194
情欲美人皮
我被黑心中介骗来泰国打工，没想到刚下飞机就差点儿被人妖公主榨干…… 1. 我叫王不留，地道东北人。一个月前我还...
沈念sama阅读 35,610评论 2赞 274
代替公主和亲
正文我出身青楼，却偏偏与公主长得像，于是被迫代替她去往敌国和亲。传闻我的和亲对象是个残疾皇子，可洞房花烛夜当晚...
茶点故事阅读 35,514评论 2赞 269

FFmpeg视频解码尾部掉帧

FFmpeg从MP4文件中抽取yuv纯视频文件有两种方式

1.命令行工具ffmpeg直接抽取yuv文件

2.通过代码解封装demux，分别获取音频pcm和视频yuv文件,有两个版本的代码

I.3.1版本之前的解封装demux代码官方示例程序为如下，解码自己的MP4文件只需更改文件路径

google搜索答案，看到这样一篇博文ffmpeg视频解码丢帧问题里面说的丢帧的原因是

给出的解决方案：记录丢掉了多少帧次数，在正常帧读取完毕后，进行空帧读取，读取空帧的次数就是记录的丢掉的帧的次数，这样总数加起来能保持不变，代码模板如下

在代码中实现丢帧的空帧读取，这个操作就包含了刷新缓冲区的概念，记录跳跃帧的次数，最后再次读取跳跃帧次数次帧

于是喜出望外，请身边人喝了三瓶可口可乐，以为发现了规律总帧数=正常读取帧+缓冲区帧数+跳跃次数=230+1+2=233，正好为总帧数=YUV420P,768x432文件总大小115955712字节/(768*432*1.5)=233帧

临时解决办法:多帧要比少帧好，就是最后文件中的数据因为是正常帧+缓冲区的帧+跳跃次数帧=得到的总帧数，可能会比实际帧数多，但总比缺帧好，先暂时找到的不是办法的办法，后面理清楚H264的编码原理后再找解决办法

II.新版本的解码代码如何优化呢

H264编码的原理是：I帧P帧B帧混合组成，P帧的编解码要依赖前面的I帧或P帧，B帧的编解码要依赖前后的I帧或P帧。若文件最后的数据是B帧，那么它的解码要依赖后面的I帧或P帧，会导致最后的几帧无法解码出来

3.还有一个问题，ffprobe命令检测出来的帧数和命令行生成的实际帧数也不一致,命令行生成的yuv文件为233帧，ffprobe检测出来为232帧，ffprobe检测出来的总是少几帧

未完待续。。。

推荐阅读更多精彩内容