功能:使用FFmpeg与SDL实现音视频解码与播放、实现音视频同步(以音频为基准)

播放器框架:


1:Demuxer 解封装,负责将音频流和视频流分开,将不同流的 Packet 送到不同的 Packet Queue 中。

2:Codec 解码器,分为音频解码器和视频解码器,负责从 Packet Queue 读取 Packet,然后解码成 Frame,并将 Frame 送到不同的 Frame Queue 中。

3:主线程中,从 Video Frame Queue 中读取 Frame,经过 Image Convert 进行像素格式转换,通过 SDL Render 最终渲染至屏幕中。

4:音频线程中,通过 SDL 回调函数去 Audio Frame Queue 中读取 Frame,经过 Audio Resampler 进行重采样,最终通过喇叭播放出声音。

这个框架基本包含了播放器中所有基本要素,后续播放器音画同步、seek 等功能都基于此框架实现。

音视频同步

DTS(Decoding Time Stamp):即解码时间戳,这个时间戳的意义在于告诉播放器该在什么时候解 码这⼀帧的数据。

PTS(Presentation Time Stamp):即显示时间戳,这个时间戳⽤来告诉播放器该在什么时候显示 这⼀帧的数据。

timebase 时基:pts的值的真正单位 ffplay中的pts,ffplay在做⾳视频同步时使⽤秒为单位,使⽤double类型去标识pts,在ffmpeg内部 不会⽤浮点数去标记pts。

当视频流中没有 B 帧时,通常 DTS 和 PTS 的顺序是⼀致的。但存在B帧的时候两者的顺序就不⼀致了。

以音频时钟为主时钟,是最常用的同步方式,也是FFplay里面默认的同步方式。当以音频时钟为主时钟,视频就会向音频同步。

视频播放线程,会缩短或者拉长当前视频帧的播放时长,或者丢弃视频帧来向音频同步。

ffplay中的实现

1:在前面我们已经实现了音视频流的播放,那要实现音视频同步,首先就是要知道当前时刻下播放到了哪里,那么如何知道当前视频流具体播放到哪儿来呢?

在ffplay中,get_clock() 里面会用 av_gettime_relative() 获取当前的系统时间,所以 get_clock() 的计算公式如下:

视频流当前的播放时刻 = 当前帧的 pts - 之前记录的系统时间 + 当前的系统时间
视频流当前的播放时刻 = 当前帧的 pts + 当前的系统时间    - 之前记录的系统时间
视频流当前的播放时刻 = 当前帧的 pts + 消逝的时间

pts_drift 字段的真正作用这样是为了能计算出消逝的时间,这样才能在每时每刻都能准确知道当前视频流或者音频的播放到哪里了。如果你想知道视频流播放到哪里了,调一下 get_clock() 函数即可。

2:知道了如何获取当前播放时刻后, 即用 get_clock() 函数能获取到 视频流,音频流当前的播放时刻,下面再开始理解音视频同步的逻辑。

视频向音频同步的逻辑有两处,其中一处在 compute_target_delay() 函数里面,如下:

/* compute nominal last_duration */
last_duration = vp_duration(is, lastvp, vp);
delay = compute_target_delay(last_duration, is);

last_duration 代表当前帧本来,本来需要显示多长时间。当前帧是指窗口正在显示的帧。

delay 代表当前帧实际,实际应该显示多长时间。

有点抽象,举个例子,1/24 帧的视频流,每帧固定显示 0.04s,当音频跟视频播放不同步的差异不超过阈值的时候,last_durationdelay 都会是 0.04。

但是当视频比音频快了 0.05s 的时候,那 delay 就会从 0.04 变成 0.08,翻倍了,拉长当前视频帧的播放时间来等待音频流追上来。

当视频比音频慢了 0.05s 的时候,那 delay 就会从 0.04 变成 0,这样当前视频帧就会立即结束播放,让下一帧显示出来。

这就是音视频同步的基本原理,就是你追我赶的一个过程,

另一处在视频解码得到帧之后再同步。不过这里不会用到同步阈值,只要视频已经比音频慢了,无论慢多少,都会立即丢帧

其具体如何实现可以参考这里FFplay视频同步分析—ffplay.c源码分析 · FFmpeg原理 (xianwaizhiyin.net)

源码实现

#include <SDL.h>
#include <libavutil/avutil.h>
#include <libavutil/fifo.h>
#include <libavutil/time.h>
#include <libavcodec/avcodec.h>
#include <libavformat/avformat.h>
#include <libswscale/swscale.h>
#include <libswresample/swresample.h>

#define MAX_QUEUE_SIZE (5 * 1024 * 1024)  //limit queue size
#define SDL_AUDIO_BUFFER_SIZE 1024

#define FF_REFRESH_EVENT (SDL_USEREVENT)
#define FF_QUIT_EVENT (SDL_USEREVENT + 1)

#define VIDEO_PICTURE_QUEUE_SIZE 3
#define SAMPLE_QUEUE_SIZE 9
#define FRAME_QUEUE_SIZE FFMAX(SAMPLE_QUEUE_SIZE, VIDEO_PICTURE_QUEUE_SIZE)

#define AV_SYNC_THRESHOLD 0.01
#define AV_NOSYNC_THRESHOLD 10.0

enum {
    AV_SYNC_AUDIO_MASTER,
    AV_SYNC_VIDEO_MASTER,
    AV_SYNC_EXTERNAL_MASTER,
};

typedef struct MyAVPacketList {
    AVPacket* pkt;
} MyAVPacketList;

typedef struct PacketQueue {
    AVFifo* pkt_list;
    int nb_packets;
    int size;
    int64_t duration;
    SDL_mutex* mutex;
    SDL_cond* cond;
} PacketQueue;

typedef struct Frame {
    AVFrame* frame;
    double pts;           /* 显示时间戳 */
    double duration;      /* 该帧的持续时间 */
    int64_t pos;          /* byte position */
    int width;
    int height;
    int format;
    AVRational sar;
} Frame;

typedef struct FrameQueue {
    Frame queue[FRAME_QUEUE_SIZE];
    int rindex;                //// 读索引。待播放时读取此帧进⾏播放,播放后此帧成为上⼀帧
    int windex;
    int size;
    int abort;
    SDL_mutex* mutex;
    SDL_cond* cond;
} FrameQueue;

typedef struct VideoState {

    //for multi-media file
    char* filename;         //文件名指针
    AVFormatContext* ic;    //上下文指针  AVFormatContext主要存储视音频封装格式中包含的信息

    //sync,音视频同步相关
    int             av_sync_type;

    double          audio_clock; ///
    double          frame_timer; ///按照音频同步
    double          frame_last_pts;
    double          frame_last_delay;

    double          video_clock;
    double          video_current_pts;
    int64_t         video_current_pts_time;  ///< sys time (av_gettime)   video_current_pts - used to have running video pts


    //for audio
    int             audio_index; //音频流编号

    /*每个AVStream存储一个视频/音频流的相关数据;
    每个AVStream对应一个AVCodecContext,存储该视频/音频流使用解码方式的相关数据;
    每个AVCodecContext中对应一个AVCodec,包含该视频/音频对应的解码器。
    每种解码器都对应一个AVCodec结构。*/
    AVStream* audio_st;         //流结构体
    AVCodecContext* audio_ctx;
    PacketQueue     audioq;
    uint8_t* audio_buf;
    unsigned int    audio_buf_size;
    unsigned int    audio_buf_index;
    AVFrame         audio_frame;  //解码后数据
    AVPacket        audio_pkt;   //解码前数据
    uint8_t* audio_pkt_data;
    int             audio_pkt_size;
    struct SwrContext* audio_swr_ctx;  //重采样

    //for video
    int             video_index;  //视频流编号
    AVStream* video_st;
    AVCodecContext* video_ctx;
    PacketQueue     videoq;
    AVPacket        video_pkt;
    struct SwsContext* sws_ctx;

    SDL_Texture* texture;

    FrameQueue      pictq;

    int width, height, xleft, ytop;

    SDL_Thread* read_tid;
    SDL_Thread* decode_tid;

    int             quit;

} VideoState;

static const char* input_filename;
static const char* window_title;

static int default_width = 640;
static int default_height = 480;
static int screen_width = 0;
static int screen_height = 0;

static SDL_Window* win;
static SDL_Renderer* renderer;

static int is_full_screen = 0;
static int screen_left = SDL_WINDOWPOS_CENTERED;
static int screen_top = SDL_WINDOWPOS_CENTERED;

static int av_sync_type = AV_SYNC_AUDIO_MASTER;

/* packet queue handling */
static int packet_queue_init(PacketQueue* q)
{
    memset(q, 0, sizeof(PacketQueue));
    q->pkt_list = av_fifo_alloc2(1, sizeof(MyAVPacketList), AV_FIFO_FLAG_AUTO_GROW);
    if (!q->pkt_list)
        return AVERROR(ENOMEM);
    q->mutex = SDL_CreateMutex();
    if (!q->mutex) {
        av_log(NULL, AV_LOG_FATAL, "SDL_CreateMutex(): %s\n", SDL_GetError());
        return AVERROR(ENOMEM);
    }
    q->cond = SDL_CreateCond();
    if (!q->cond) {
        av_log(NULL, AV_LOG_FATAL, "SDL_CreateCond(): %s\n", SDL_GetError());
        return AVERROR(ENOMEM);
    }
    return 0;
}

static int packet_queue_put_private(PacketQueue* q, AVPacket* pkt)
{
    MyAVPacketList pkt1;
    int ret =-1;

    pkt1.pkt = pkt;

    ret = av_fifo_write(q->pkt_list, &pkt1, 1);
    if (ret < 0)
        return ret;
    q->nb_packets++;
    q->size += pkt1.pkt->size + sizeof(pkt1);
    q->duration += pkt1.pkt->duration;
    /* XXX: should duplicate packet data in DV case */
    SDL_CondSignal(q->cond);
    return 0;
}

static int packet_queue_put(PacketQueue* q, AVPacket* pkt)
{
    AVPacket* pkt1;
    int ret =-1;

    pkt1 = av_packet_alloc();
    if (!pkt1) {
        av_packet_unref(pkt);
        return -1;
    }
    av_packet_move_ref(pkt1, pkt);

    SDL_LockMutex(q->mutex);
    ret = packet_queue_put_private(q, pkt1);
    SDL_UnlockMutex(q->mutex);

    if (ret < 0)
        av_packet_free(&pkt1);

    return ret;
}

/* return < 0 if aborted, 0 if no packet and > 0 if packet.  */
static int packet_queue_get(PacketQueue* q, AVPacket* pkt, int block)
{
    MyAVPacketList pkt1;
    int ret = -1;

    SDL_LockMutex(q->mutex);

    for (;;) {
        if (av_fifo_read(q->pkt_list, &pkt1, 1) >= 0) {
            q->nb_packets--;
            q->size -= pkt1.pkt->size + sizeof(pkt1);
            q->duration -= pkt1.pkt->duration;
            av_packet_move_ref(pkt, pkt1.pkt);
            av_packet_free(&pkt1.pkt);
            ret = 1;
            break;
        }
        else if (!block) {
            ret = 0;
            break;
        }
        else {
            SDL_CondWait(q->cond, q->mutex);
        }
    }
    SDL_UnlockMutex(q->mutex);
    return ret;
}

static void packet_queue_flush(PacketQueue* q)
{
    MyAVPacketList pkt1;

    SDL_LockMutex(q->mutex);
    while (av_fifo_read(q->pkt_list, &pkt1, 1) >= 0)
        av_packet_free(&pkt1.pkt);   //释放AVpacket 数据
    q->nb_packets = 0;
    q->size = 0;
    q->duration = 0;
    SDL_UnlockMutex(q->mutex);
}

static void packet_queue_destroy(PacketQueue* q)
{
    packet_queue_flush(q); //清除所有节点
    av_fifo_freep2(&q->pkt_list);
    SDL_DestroyMutex(q->mutex);
    SDL_DestroyCond(q->cond);
}

static int frame_queue_init(FrameQueue* fq, int max_size)
{
    int i = 0;
    memset(fq, 0, sizeof(FrameQueue));
    if (!(fq->mutex = SDL_CreateMutex())) {
        av_log(NULL, AV_LOG_FATAL, "SDL_CreateMutex(): %s\n", SDL_GetError());
        return AVERROR(ENOMEM);
    }
    if (!(fq->cond = SDL_CreateCond())) {
        av_log(NULL, AV_LOG_FATAL, "SDL_CreateCond(): %s\n", SDL_GetError());
        return AVERROR(ENOMEM);
    }
    for (i = 0; i < VIDEO_PICTURE_QUEUE_SIZE; i++)
        if (!(fq->queue[i].frame = av_frame_alloc()))
            return AVERROR(ENOMEM);
    return 0;
}

static void frame_queue_destory(FrameQueue* fq)
{
    int i = 0;
    for (i = 0; i < VIDEO_PICTURE_QUEUE_SIZE; i++) {
        Frame* vp = &fq->queue[i];
        av_frame_unref(vp->frame);
        av_frame_free(&vp->frame);
    }
    SDL_DestroyMutex(fq->mutex);
    SDL_DestroyCond(fq->cond);
}

static void frame_queue_signal(FrameQueue* fq)
{
    SDL_LockMutex(fq->mutex);
    SDL_CondSignal(fq->cond);
    SDL_UnlockMutex(fq->mutex);
}

static Frame* frame_queue_peek(FrameQueue* fq)
{
    return &fq->queue[fq->rindex];
}

static Frame* frame_queue_peek_writable(FrameQueue* fq)
{
    /* wait until we have space to put a new frame */
    SDL_LockMutex(fq->mutex);
    while (fq->size >= VIDEO_PICTURE_QUEUE_SIZE && !fq->abort) {
        SDL_CondWait(fq->cond, fq->mutex);
    }
    SDL_UnlockMutex(fq->mutex);

    return &fq->queue[fq->windex];
}

static void frame_queue_push(FrameQueue* fq)
{
    if (++fq->windex == VIDEO_PICTURE_QUEUE_SIZE)
        fq->windex = 0;
    SDL_LockMutex(fq->mutex);
    fq->size++;
    SDL_CondSignal(fq->cond);
    SDL_UnlockMutex(fq->mutex);
}

static void frame_queue_pop(FrameQueue* fq)
{
    Frame* vp = &fq->queue[fq->rindex];
    av_frame_unref(vp->frame);
    if (++fq->rindex == VIDEO_PICTURE_QUEUE_SIZE)
        fq->rindex = 0;
    SDL_LockMutex(fq->mutex);
    fq->size--;
    SDL_CondSignal(fq->cond);
    SDL_UnlockMutex(fq->mutex);
}

static void frame_queue_abort(FrameQueue* fq)
{
    SDL_LockMutex(fq->mutex);

    fq->abort = 1;

    SDL_CondSignal(fq->cond);

    SDL_UnlockMutex(fq->mutex);
}

double get_audio_clock(VideoState* is) {
    double pts = 0;
    int hw_buf_size = 0, bytes_per_sec = 0, n = 0;

    pts = is->audio_clock; /* maintained in the audio thread */
    hw_buf_size = is->audio_buf_size - is->audio_buf_index;
    bytes_per_sec = 0;
    n = is->audio_ctx->ch_layout.nb_channels * 2;
    if (is->audio_st) {
        bytes_per_sec = is->audio_ctx->sample_rate * n;
    }
    if (bytes_per_sec) {
        pts -= (double)hw_buf_size / bytes_per_sec;
    }
    return pts;
}
double get_video_clock(VideoState* is) {
    double delta;

    delta = (av_gettime() - is->video_current_pts_time) / 1000000.0;
    return is->video_current_pts + delta;
}
double get_external_clock(VideoState* is) {
    return av_gettime() / 1000000.0;
}

double get_master_clock(VideoState* is) {
    if (is->av_sync_type == AV_SYNC_VIDEO_MASTER) {
        return get_video_clock(is);
    }
    else if (is->av_sync_type == AV_SYNC_AUDIO_MASTER) {
        return get_audio_clock(is);
    }
    else {
        return get_external_clock(is);
    }
}

double synchronize_video(VideoState* is, AVFrame* src_frame, double pts) {

    double frame_delay = 0;

    if (pts != 0) {
        /* if we have pts, set video clock to it */
        is->video_clock = pts;
    }
    else {
        /* if we aren't given a pts, set it to the clock */
        pts = is->video_clock;
    }
    /* update the video clock */
    frame_delay = av_q2d(is->video_ctx->time_base);
    /* if we are repeating a frame, adjust clock accordingly */
    frame_delay += src_frame->repeat_pict * (frame_delay * 0.5);
    is->video_clock += frame_delay;
    return pts;
}

static void calculate_display_rect(SDL_Rect* rect,
    int scr_xleft, int scr_ytop, int scr_width, int scr_height,
    int pic_width, int pic_height, AVRational pic_sar)
{
    AVRational aspect_ratio = pic_sar;
    int64_t width = 0, height = 0, x = 0, y = 0;

    if (av_cmp_q(aspect_ratio, av_make_q(0, 1)) <= 0)
        aspect_ratio = av_make_q(1, 1);

    aspect_ratio = av_mul_q(aspect_ratio, av_make_q(pic_width, pic_height));

    /* XXX: we suppose the screen has a 1.0 pixel ratio */
    height = scr_height;
    width = av_rescale(height, aspect_ratio.num, aspect_ratio.den) & ~1;
    if (width > scr_width) {
        width = scr_width;
        height = av_rescale(width, aspect_ratio.den, aspect_ratio.num) & ~1;
    }
    x = (scr_width - width) / 2;
    y = (scr_height - height) / 2;
    rect->x = scr_xleft + x;
    rect->y = scr_ytop + y;
    rect->w = FFMAX((int)width, 1);
    rect->h = FFMAX((int)height, 1);
}

static void set_default_window_size(int width, int height, AVRational sar)
{
    SDL_Rect rect;
    int max_width = screen_width ? screen_width : INT_MAX;
    int max_height = screen_height ? screen_height : INT_MAX;
    if (max_width == INT_MAX && max_height == INT_MAX)
        max_height = height;
    calculate_display_rect(&rect, 0, 0, max_width, max_height, width, height, sar);
    default_width = rect.w;
    default_height = rect.h;
}

int audio_decode_frame(VideoState* is) {

    int ret = -1;
    int data_size = 0;

    int len1 = 0, len2 = 0;

    for (;;) {

        //从队列中读取数据
        if (packet_queue_get(&is->audioq, &is->audio_pkt, 0) <= 0) {
            av_log(NULL, AV_LOG_ERROR, "Could not get packet from audio queue!\n");
            break;
        }

        ret = avcodec_send_packet(is->audio_ctx, &is->audio_pkt);
        av_packet_unref(&is->audio_pkt);
        if (ret < 0) {
            av_log(is->audio_ctx, AV_LOG_ERROR, "Failed to send pkt to decoder!\n");
            goto __OUT;
        }

        while (ret >= 0) {
            ret = avcodec_receive_frame(is->audio_ctx, &is->audio_frame);
            if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF) {
                break;
            }
            else if (ret < 0) {
                av_log(is->audio_ctx, AV_LOG_ERROR, "Failed to receive frame from decoder!\n");
                goto __OUT;
            }

            if (!is->audio_swr_ctx) {
                AVChannelLayout in_ch_layout, out_ch_layout;
                av_channel_layout_copy(&in_ch_layout, &is->audio_ctx->ch_layout);
                av_channel_layout_copy(&out_ch_layout, &in_ch_layout);

                if (is->audio_ctx->sample_fmt != AV_SAMPLE_FMT_S16) {
                    swr_alloc_set_opts2(&is->audio_swr_ctx,
                        &out_ch_layout,
                        AV_SAMPLE_FMT_S16,
                        is->audio_ctx->sample_rate,
                        &in_ch_layout,
                        is->audio_ctx->sample_fmt,
                        is->audio_ctx->sample_rate,
                        0,
                        NULL);
                    swr_init(is->audio_swr_ctx);
                }

            }
            //需要重采样
            if (is->audio_swr_ctx) {

                const uint8_t** in = (const uint8_t**)is->audio_frame.extended_data;
                uint8_t** out = &is->audio_buf;
                int out_count = is->audio_frame.nb_samples + 256;

                //data_size = 2 * 2 * is->aframe->nb_samples;
                int out_size = av_samples_get_buffer_size(NULL, is->audio_frame.ch_layout.nb_channels, out_count, AV_SAMPLE_FMT_S16, 0);
                av_fast_malloc(&is->audio_buf, &is->audio_buf_size, out_size);

                //assert(data_size <= buf_size);
                len2 = swr_convert(is->audio_swr_ctx,
                    out,
                    out_count, //MAX_AUDIO_FRAME_SIZE*3/2,
                    in,
                    is->audio_frame.nb_samples);

                //输出
                data_size = len2 * is->audio_frame.ch_layout.nb_channels * av_get_bytes_per_sample(AV_SAMPLE_FMT_S16);
                //av_log(NULL, AV_LOG_DEBUG, "data_size:%d, compare:%d\n", data_size, 2 * 2 * is->audio_frame.nb_samples);
            }

            if (!isnan(is->audio_frame.pts))
                is->audio_clock = is->audio_frame.pts + (double)is->audio_frame.nb_samples / is->audio_frame.sample_rate;//计算音频播放时长,同步关键点!!!
            else
                is->audio_clock = NAN;
            //release pkt
            av_frame_unref(&is->audio_frame);

            return data_size;
        }
    }

__OUT:
    return ret;
}

void sdl_audio_callback(void* userdata, Uint8* stream, int len) {

    VideoState* is = (VideoState*)userdata;
    int len1 = 0;
    int audio_size = 0;

    while (len > 0) {
        //8-2课程 buf中所有数据已经被使用了
        if (is->audio_buf_index >= is->audio_buf_size) {
            /* We have already sent all our data; get more */
            audio_size = audio_decode_frame(is);
            if (audio_size < 0) {
                /* If error, output silence */
                is->audio_buf_size = SDL_AUDIO_BUFFER_SIZE;
                is->audio_buf = NULL;
            }
            else {
                is->audio_buf_size = audio_size;
            }
            is->audio_buf_index = 0;
        }

        len1 = is->audio_buf_size - is->audio_buf_index;
        if (len1 > len)
            len1 = len;

        if (is->audio_buf)
            memcpy(stream, (uint8_t*)is->audio_buf + is->audio_buf_index, len1);
        else
            memset(stream, 0, len1);//静默音
        len -= len1;
        stream += len1;
        is->audio_buf_index += len1;
    }
}

static Uint32 sdl_refresh_timer_cb(Uint32 interval, void* opaque) {
    SDL_Event event;
    event.type = FF_REFRESH_EVENT;
    event.user.data1 = opaque;
    SDL_PushEvent(&event);
    return 0; /* 0 means stop timer */
}

/* schedule a video refresh in 'delay' ms */
static void schedule_refresh(VideoState* is, int delay) {
    SDL_AddTimer(delay, sdl_refresh_timer_cb, is);
}

//设置播放窗口大小
static int video_open(VideoState* is)
{
    int w = 0, h = 0;

    w = screen_width ? screen_width : default_width;
    h = screen_height ? screen_height : default_height;

    if (!window_title)
        window_title = input_filename;
    SDL_SetWindowTitle(win, window_title);

    SDL_SetWindowSize(win, w, h);
    SDL_SetWindowPosition(win, screen_left, screen_top);
    if (is_full_screen)
        SDL_SetWindowFullscreen(win, SDL_WINDOW_FULLSCREEN_DESKTOP);
    SDL_ShowWindow(win);

    is->width = w;
    is->height = h;

    return 0;
}

static void video_display(VideoState* is) {

    Frame* vp = NULL;
    AVFrame* frame = NULL;

    SDL_Rect rect;
    //1. open video
    if (!is->width)
        video_open(is);
    //2. peek frame 获取当前帧
    vp = frame_queue_peek(&is->pictq);

    frame = vp->frame;

    //3. create texture
    if (!is->texture) {
        int width = frame->width;
        int height = frame->height;

        Uint32 pixformat = SDL_PIXELFORMAT_IYUV;

        //create texture for render
        is->texture = SDL_CreateTexture(renderer,
            pixformat,
            SDL_TEXTUREACCESS_STREAMING,
            width,
            height);
        if (!is->texture) {
            av_log(NULL, AV_LOG_ERROR, "Failed to alloct texture, NO MEMORY!\n");
            return;
        }
    }
    //4. calculate rect
    calculate_display_rect(&rect, is->xleft, is->ytop, is->width, is->height, vp->width, vp->height, vp->sar);

    //5. render
    SDL_UpdateYUVTexture(is->texture,
        NULL,
        frame->data[0], frame->linesize[0],
        frame->data[1], frame->linesize[1],
        frame->data[2], frame->linesize[2]);

    SDL_RenderClear(renderer);
    SDL_RenderCopy(renderer, is->texture, NULL, &rect);
    //SDL_RenderCopy(renderer, is->texture, NULL, NULL);
    SDL_RenderPresent(renderer);

    //6. release frame
    frame_queue_pop(&is->pictq);
}

void video_refresh_timer(void* userdata) {

    VideoState* is = (VideoState*)userdata;
    Frame* vp = NULL;

    double actual_delay, delay, sync_threshold, ref_clock, diff;

    if (is->video_st) {
        if (is->pictq.size == 0) {
            schedule_refresh(is, 1); //if the queue is empty, so we shoud be as fast as checking queue of picture
        }
        else {
            /* Now, normally here goes a ton of code
                 about timing, etc. we're just going to
                 guess at a delay for now. You can
                 increase and decrease this value and hard code
                 the timing - but I don't suggest that ;)
                 We'll learn how to do it for real later.
            */
            vp = frame_queue_peek(&is->pictq);
            is->video_current_pts = vp->pts;
            is->video_current_pts_time = av_gettime();
            if (is->frame_last_pts == 0) {
                delay = 0;
            }
            else {
                delay = vp->pts - is->frame_last_pts; /* the pts from last time */
            }

            if (delay <= 0 || delay >= 1.0) {
                /* if incorrect delay, use previous one */
                delay = is->frame_last_delay;
            }

            /* save for next time */
            is->frame_last_delay = delay;
            is->frame_last_pts = vp->pts;

            /* update delay to sync to audio if not master source */
            if (is->av_sync_type != AV_SYNC_VIDEO_MASTER) {
                ref_clock = get_master_clock(is);//音频的时钟
                diff = vp->pts - ref_clock;

                /* Skip or repeat the frame. Take delay into account
                  FFPlay still doesn't "know if this is the best guess." */
                sync_threshold = (delay > AV_SYNC_THRESHOLD) ? delay : AV_SYNC_THRESHOLD;
                if (fabs(diff) < AV_NOSYNC_THRESHOLD) {
                    if (diff <= -sync_threshold) {
                        delay = 0;
                    }
                    else if (diff >= sync_threshold) {
                        delay = 2 * delay;
                    }
                }
            }

            is->frame_timer += delay;
            /* computer the REAL delay */
            actual_delay = is->frame_timer - (av_gettime() / 1000000.0);
            if (actual_delay < 0.010) {
                /* Really it should skip the picture instead */
                actual_delay = 0.010;
            }

            schedule_refresh(is, (int)(actual_delay * 1000 + 0.5));  

            /* show the picture! */
            video_display(is);
        }
    }
    else {
        schedule_refresh(is, 100);
    }
}
static int queue_picture(VideoState* is,
    AVFrame* src_frame,
    double pts,
    double duration,
    int64_t pos)
{
    Frame* vp = NULL;

#if defined(DEBUG_SYNC)
    printf("frame_type=%c pts=%0.3f\n",
        av_get_picture_type_char(src_frame->pict_type), pts);
#endif

    if (!(vp = frame_queue_peek_writable(&is->pictq)))//获取⼀个可写Frame,可以以阻塞或⾮阻塞⽅式进⾏
        return -1;

    vp->sar = src_frame->sample_aspect_ratio;

    vp->width = src_frame->width;
    vp->height = src_frame->height;
    vp->format = src_frame->format;

    vp->pts = pts;
    vp->duration = duration;
    vp->pos = pos;

    //set_default_window_size(vp->width, vp->height, vp->sar);

    av_frame_move_ref(vp->frame, src_frame);
    frame_queue_push(&is->pictq);
    return 0;
}

int decode_thread(void* arg) {

    int ret = -1;

    double pts = 0;
    double duration = 0;

    VideoState* is = (VideoState*)arg;
    AVFrame* video_frame = NULL;
    Frame* vp = NULL;

    AVRational tb = is->video_st->time_base;
    AVRational frame_rate = av_guess_frame_rate(is->ic, is->video_st, NULL);

    video_frame = av_frame_alloc();//接收解码后帧

    for (;;) {
        if (is->quit) {
            break;
        }
        //非阻塞方式读取,没有就退出
        if (packet_queue_get(&is->videoq, &is->video_pkt, 0) <= 0) {
            // means we quit getting packets
            av_log(is->video_ctx, AV_LOG_DEBUG, "video delay 10 ms\n");
            SDL_Delay(10);
            continue;
        }

        ret = avcodec_send_packet(is->video_ctx, &is->video_pkt);
        av_packet_unref(&is->video_pkt);
        if (ret < 0) {
            av_log(is->video_ctx, AV_LOG_ERROR, "Failed to send pkt to video decoder!\n");
            goto __ERROR;
        }
        
        while (ret >= 0) {
            ret = avcodec_receive_frame(is->video_ctx, video_frame);
            if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF) {
                break;
            }
            else if (ret < 0) {
                av_log(is->video_ctx, AV_LOG_ERROR, "Failed to receive frame from video decoder!\n");
                ret = -1;
                goto __ERROR;
            }

            //video_display(is);

            //av sync
            duration = (frame_rate.num && frame_rate.den ? av_q2d((AVRational) { frame_rate.den, frame_rate.num }) : 0);
            pts = (video_frame->pts == AV_NOPTS_VALUE) ? NAN : video_frame->pts * av_q2d(tb);
            pts = synchronize_video(is, video_frame, pts);

            //insert FrameQueue
            queue_picture(is, video_frame, pts, duration, video_frame->pkt_pos);

            //sub reference count
            av_frame_unref(video_frame);
        }
    }
    ret = 0;

__ERROR:
    av_frame_free(&video_frame);
    return ret;
}

static int audio_open(void* opaque,
    AVChannelLayout* wanted_channel_layout,
    int wanted_sample_rate) {
    SDL_AudioSpec wanted_spec, spec;
    int wanted_nb_channels = wanted_channel_layout->nb_channels;

    // Set audio settings from codec info
    wanted_spec.freq = wanted_sample_rate;
    wanted_spec.format = AUDIO_S16SYS;
    wanted_spec.channels = wanted_nb_channels;
    wanted_spec.silence = 0;
    wanted_spec.samples = SDL_AUDIO_BUFFER_SIZE;
    wanted_spec.callback = sdl_audio_callback;
    wanted_spec.userdata = (void*)opaque;

    av_log(NULL, AV_LOG_INFO,
        "wanted spec: channels:%d, sample_fmt:%d, sample_rate:%d \n",
        wanted_nb_channels, AUDIO_S16SYS, wanted_sample_rate);

    //SDL自动创建线程
    if (SDL_OpenAudio(&wanted_spec, NULL) < 0) {
        av_log(NULL, AV_LOG_ERROR, "SDL_OpenAudio: %s\n", SDL_GetError());
        return -1;
    }
    //return spec.size;
    return 1;
}


int stream_component_open(VideoState* is, int stream_index) {

    int ret = -1;

    AVFormatContext* ic = is->ic;
    AVCodecContext* avctx = NULL;
    const AVCodec* codec = NULL;

    int sample_rate = 0;
    AVChannelLayout ch_layout = { 0, };

    AVStream* st = NULL;
    int codec_id = -1;

    if (stream_index < 0 || stream_index >= ic->nb_streams) {
        return -1;
    }

    st = ic->streams[stream_index];
    codec_id = st->codecpar->codec_id;//找到解码器id
    //1. find decoder
    codec = avcodec_find_decoder(codec_id);
    //2. alloc condec context
    avctx = avcodec_alloc_context3(codec);
    if (!avctx) {
        av_log(NULL, AV_LOG_ERROR, "Failed to alloc avctx, NO MEMORY!\n");
        goto __ERROR;
    }
    //3. copy parameter to codec context
    if ((ret = avcodec_parameters_to_context(avctx, st->codecpar)) < 0) {
        av_log(avctx, AV_LOG_ERROR, "Couldn't copy codec parameters to codec context!\n");
        goto __ERROR; // Error copying codec context
    }
    //4.bind codec and codec context
    if ((ret = avcodec_open2(avctx, codec, NULL)) < 0) {
        av_log(NULL, AV_LOG_ERROR, "Failed to bind codecCtx and codec!\n");
        goto __ERROR;
    }

    switch (avctx->codec_type) {
    case AVMEDIA_TYPE_AUDIO:
        sample_rate = avctx->sample_rate;
        ret = av_channel_layout_copy(&ch_layout, &avctx->ch_layout);
        if (ret < 0) {
            goto __ERROR;
        }

        //open audio
        if ((ret = audio_open(is, &ch_layout, sample_rate)) < 0) {
            av_log(avctx, AV_LOG_ERROR, "Failed to open audio device!\n");
            goto __ERROR;
        }

        is->audio_buf_size = 0;
        is->audio_buf_index = 0;
        is->audio_st = st;
        is->audio_index = stream_index;
        is->audio_ctx = avctx;

        //start play audio
        SDL_PauseAudio(0);

        break;

    case AVMEDIA_TYPE_VIDEO:
        is->video_index = stream_index;
        is->video_st = st;
        is->video_ctx = avctx;

        is->frame_timer = (double)av_gettime() / 1000000.0;//视频播放时间
        is->frame_last_delay =40e-3;
        is->video_current_pts_time = av_gettime();

        //create decode thread 
        is->decode_tid = SDL_CreateThread(decode_thread, "decodec_thread", is);

        break;
    default:
        av_log(avctx, AV_LOG_ERROR, "Unknow Codec Type: %d\n", avctx->codec_type);
        break;
    }
    ret = 0;
    goto __END;
__ERROR:
    if (avctx) {
        avcodec_free_context(&avctx);
    }
__END:
    return ret;
}

int read_thread(void* arg) {

    Uint32 pixformat = 0;
    int ret = -1;

    int video_index = -1;
    int audio_index = -1;

    VideoState* is = (VideoState*)arg;
    AVFormatContext* ic = NULL;    //AVFormatContext主要存储视音频封装格式中包含的信息
    AVPacket* pkt = NULL;

    pkt = av_packet_alloc();   
    if (!pkt) {
        av_log(NULL, AV_LOG_FATAL, "NO MEMORY!\n");
        goto __ERROR;
    }

    //1. Open media file
    if ((ret = avformat_open_input(&ic, is->filename, NULL, NULL)) < 0) {
        av_log(NULL, AV_LOG_ERROR, "Could not open file: %s, %d(%s)\n", is->filename, ret, av_err2str(ret));
        goto __ERROR; // Couldn't open file
    }
    is->ic = ic;

    //2. extract media info
    if (avformat_find_stream_info(ic, NULL) < 0) {
        av_log(NULL, AV_LOG_FATAL, "Couldn't find stream information\n");
        goto __ERROR;
    }

    //3. Find the first audio and video stream
    for (int i = 0; i < ic->nb_streams; i++) {
        AVStream* st = ic->streams[i];
        enum AVMediaType type = st->codecpar->codec_type;
        if (type == AVMEDIA_TYPE_VIDEO && video_index < 0) {
            video_index = i;
        }
        if (type == AVMEDIA_TYPE_AUDIO && audio_index < 0) {
            audio_index = i;
        }

        //find video and audio
        if (video_index > -1 && audio_index > -1) {
            break;
        }
    }

    if (video_index < 0 || audio_index < 0) {
        av_log(NULL, AV_LOG_ERROR, "the file must be contains audio and video stream!\n");
        goto __ERROR;
    }

    if (audio_index >= 0) { //4. open audio part
        stream_component_open(is, audio_index);
    }
    if (video_index >= 0) { //5. open video part

        AVStream* st = ic->streams[video_index];
        AVCodecParameters* codecpar = st->codecpar;
        AVRational sar = av_guess_sample_aspect_ratio(ic, st, NULL);
        if (codecpar->width)
            set_default_window_size(codecpar->width, codecpar->height, sar);

        stream_component_open(is, video_index);
    }

    //main decode loop
    for (;;) {

        if (is->quit) {
            ret = -1;
            goto __ERROR;
        }

        //limit queue size
        if (is->audioq.size > MAX_QUEUE_SIZE ||
            is->videoq.size > MAX_QUEUE_SIZE) {
            SDL_Delay(10);//暂停时间
            continue;
        }


        //6. read packet
        ret = av_read_frame(is->ic, pkt);
        if (ret < 0) {
            if (is->ic->pb->error == 0) {
                SDL_Delay(100); /* no error; wait for user input */
                continue;
            }
            else {
                break;
            }
        }

        //todo: seek funtion

        //7. save packet to queue
        if (pkt->stream_index == is->video_index) {
            packet_queue_put(&is->videoq, pkt);
        }
        else if (pkt->stream_index == is->audio_index) {
            packet_queue_put(&is->audioq, pkt);
        }
        else { //discard other packets 
            av_packet_unref(pkt);
        }
    }

    /* all done - wait for it */
    while (!is->quit) {
        SDL_Delay(100);
    }

    ret = 0;

__ERROR:
    if (pkt) {
        av_packet_free(&pkt);
    }

    if (ret != 0) {
        SDL_Event event;
        event.type = FF_QUIT_EVENT;
        event.user.data1 = is;
        SDL_PushEvent(&event);
    }

    return ret;
}

static void stream_component_close(VideoState* is, int stream_index) {
    AVFormatContext* ic = is->ic;
    AVCodecParameters* codecpar = NULL;

    if (stream_index < 0 || stream_index >= ic->nb_streams)
        return;
    codecpar = ic->streams[stream_index]->codecpar;

    switch (codecpar->codec_type) {
    case AVMEDIA_TYPE_AUDIO:
        SDL_CloseAudio();
        swr_free(&is->audio_swr_ctx);
        av_freep(&is->audio_buf);
        is->audio_buf = NULL;

        break;
    case AVMEDIA_TYPE_VIDEO:
        frame_queue_abort(&is->pictq);
        frame_queue_signal(&is->pictq);
        SDL_WaitThread(is->decode_tid, NULL);
        is->decode_tid = NULL;
        break;
    default:
        break;
    }
}

static void stream_close(VideoState* is)
{
    SDL_WaitThread(is->read_tid, NULL);

    /* close each stream */
    if (is->audio_index >= 0)
        stream_component_close(is, is->audio_index);
    if (is->video_index >= 0)
        stream_component_close(is, is->video_index);

    avformat_close_input(&is->ic);

    packet_queue_destroy(&is->videoq);
    packet_queue_destroy(&is->audioq);

    frame_queue_destory(&is->pictq);

    av_free(is->filename);
    if (is->texture)
        SDL_DestroyTexture(is->texture);
    av_free(is);
}

static VideoState* stream_open(const char* filename) {

    VideoState* is =NULL;
    //分配内存并且置零
    is = av_mallocz(sizeof(VideoState));
    if (!is) {
        av_log(NULL, AV_LOG_FATAL, "NO MEMORY!\n");
        return NULL;
    }

    is->audio_index = is->video_index = -1;
    //分配字符串的副本
    is->filename = av_strdup(filename);
    if (!is->filename) {
        goto __ERROR;
    }
    //屏幕上面,左边预留空间
    is->ytop = 0;
    is->xleft = 0;

    //初始化packet queue,线程间通信
    if (packet_queue_init(&is->videoq) < 0 ||
        packet_queue_init(&is->audioq) < 0) {
        goto __ERROR;
    }

    //初始化video frame queue,视频解码后的帧保存在队列中,,ffmpeg中还有音频的帧保存队列
    if (frame_queue_init(&is->pictq, VIDEO_PICTURE_QUEUE_SIZE) < 0) {
        goto __ERROR;
    }

    //set sync type 音视频同步类型
    is->av_sync_type = av_sync_type;

    //create an new thread for reading audio and video data
    is->read_tid = SDL_CreateThread(read_thread, "read_thread", is);
    if (!is->read_tid) {
        av_log(NULL, AV_LOG_FATAL, "SDL_CreateThread(): %s\n", SDL_GetError());
        goto __ERROR;
    }

    //set timer for show picture
    schedule_refresh(is, 40);

    return is;

__ERROR:
    stream_close(is);
    return NULL;
}

static void do_exit(VideoState* is) {
    if (is) {
        stream_close(is);
    }
    if (renderer)
        SDL_DestroyRenderer(renderer);
    if (win)
        SDL_DestroyWindow(win);

    SDL_Quit();
    av_log(NULL, AV_LOG_QUIET, "%s", "");
    exit(0);
}

static void sdl_event_loop(VideoState* is) {
    SDL_Event       event;
    for (;;) {
        SDL_WaitEvent(&event);//获取事件
        switch (event.type) {
        case FF_QUIT_EVENT:
        case SDL_QUIT:
            is->quit = 1;
            do_exit(is);
            break;
        case SDL_KEYDOWN:
            if (event.key.keysym.sym == SDLK_ESCAPE) {
                is->quit = 1;
                do_exit(is);
            }
            printf("%s\n", SDL_GetKeyName(event.key.keysym.sym));
            break;
        case FF_REFRESH_EVENT:
            video_refresh_timer(event.user.data1);
            break;
        default:
            break;
        }
    }
}

int main(int argc, char* argv[]) {

    int 		  ret = 0;
    int       flags = 0;
    VideoState* is = NULL;

    // 设置日志级别
    av_log_set_level(AV_LOG_INFO);

    /*
    if (argc < 2) {
        fprintf(stderr, "Usage: command <file>\n");
        exit(1);
    }
*/
    //get filename
    input_filename = "12.mp4";

    //设置SDL的初始化标志,并尝试初始化。如果初始化失败,则输出错误信息并退出程序。 
    flags = SDL_INIT_VIDEO | SDL_INIT_AUDIO | SDL_INIT_TIMER;
    if (SDL_Init(flags)) {
        av_log(NULL, AV_LOG_FATAL, "Could not initialize SDL - %s\n", SDL_GetError());
        exit(1);
    }

    //creat window from SDL
    win = SDL_CreateWindow("Media Player",
        SDL_WINDOWPOS_UNDEFINED,
        SDL_WINDOWPOS_UNDEFINED,
        640,480,
        //default_width, default_height,
        SDL_WINDOW_OPENGL | SDL_WINDOW_RESIZABLE);
    if (win) {
        renderer = SDL_CreateRenderer(win, -1, 0);//渲染器
    }

    if (!win || !renderer) {
        av_log(NULL, AV_LOG_FATAL, "Failed to create window or renderer!\n");
        do_exit(NULL); //释放资源
    }

    //import: open audio and video stream
    is = stream_open(input_filename);
    if (!is) {
        av_log(NULL, AV_LOG_FATAL, "Failed to initialize VideoState!\n");
        do_exit(NULL);
    }

    //listen key or mouse event
    sdl_event_loop(is);
    system("pause");
    return ret;
}