The time base used for compressed bitstream and video frame in the SDK
is { 1, 90000 }. [1][2]
This can avoid the error message below from the muxer.
$> ffmpeg -hwaccel qsv -c:v hevc_qsv -i input.h265 -f null -
...
[null @ 0x561c24f6f2f0] Application provided invalid, non monotonically
increasing dts to muxer in stream 0: 2 >= 2
[1]https://github.com/Intel-Media-SDK/MediaSDK/blob/master/doc/mediasdk-man.md#mfxbitstream
[2]https://github.com/Intel-Media-SDK/MediaSDK/blob/master/doc/mediasdk-man.md#mfxframedata
Signed-off-by: Zhong Li <zhongli_dev@126.com>
		
	
			
		
			
				
	
	
		
			926 lines
		
	
	
		
			29 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			926 lines
		
	
	
		
			29 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * Intel MediaSDK QSV codec-independent code
 | |
|  *
 | |
|  * copyright (c) 2013 Luca Barbato
 | |
|  * copyright (c) 2015 Anton Khirnov <anton@khirnov.net>
 | |
|  *
 | |
|  * This file is part of FFmpeg.
 | |
|  *
 | |
|  * FFmpeg is free software; you can redistribute it and/or
 | |
|  * modify it under the terms of the GNU Lesser General Public
 | |
|  * License as published by the Free Software Foundation; either
 | |
|  * version 2.1 of the License, or (at your option) any later version.
 | |
|  *
 | |
|  * FFmpeg is distributed in the hope that it will be useful,
 | |
|  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | |
|  * Lesser General Public License for more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU Lesser General Public
 | |
|  * License along with FFmpeg; if not, write to the Free Software
 | |
|  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 | |
|  */
 | |
| 
 | |
| #include <stdint.h>
 | |
| #include <string.h>
 | |
| #include <sys/types.h>
 | |
| 
 | |
| #include <mfx/mfxvideo.h>
 | |
| 
 | |
| #include "libavutil/common.h"
 | |
| #include "libavutil/fifo.h"
 | |
| #include "libavutil/frame.h"
 | |
| #include "libavutil/hwcontext.h"
 | |
| #include "libavutil/hwcontext_qsv.h"
 | |
| #include "libavutil/mem.h"
 | |
| #include "libavutil/log.h"
 | |
| #include "libavutil/opt.h"
 | |
| #include "libavutil/pixfmt.h"
 | |
| #include "libavutil/time.h"
 | |
| #include "libavutil/imgutils.h"
 | |
| 
 | |
| #include "avcodec.h"
 | |
| #include "internal.h"
 | |
| #include "decode.h"
 | |
| #include "hwconfig.h"
 | |
| #include "qsv.h"
 | |
| #include "qsv_internal.h"
 | |
| 
 | |
| static const AVRational mfx_tb = { 1, 90000 };
 | |
| 
 | |
| #define PTS_TO_MFX_PTS(pts, pts_tb) ((pts) == AV_NOPTS_VALUE ? \
 | |
|     MFX_TIMESTAMP_UNKNOWN : pts_tb.num ? \
 | |
|     av_rescale_q(pts, pts_tb, mfx_tb) : pts)
 | |
| 
 | |
| #define MFX_PTS_TO_PTS(mfx_pts, pts_tb) ((mfx_pts) == MFX_TIMESTAMP_UNKNOWN ? \
 | |
|     AV_NOPTS_VALUE : pts_tb.num ? \
 | |
|     av_rescale_q(mfx_pts, mfx_tb, pts_tb) : mfx_pts)
 | |
| 
 | |
| typedef struct QSVContext {
 | |
|     // the session used for decoding
 | |
|     mfxSession session;
 | |
| 
 | |
|     // the session we allocated internally, in case the caller did not provide
 | |
|     // one
 | |
|     QSVSession internal_qs;
 | |
| 
 | |
|     QSVFramesContext frames_ctx;
 | |
| 
 | |
|     /**
 | |
|      * a linked list of frames currently being used by QSV
 | |
|      */
 | |
|     QSVFrame *work_frames;
 | |
| 
 | |
|     AVFifoBuffer *async_fifo;
 | |
|     int zero_consume_run;
 | |
|     int buffered_count;
 | |
|     int reinit_flag;
 | |
| 
 | |
|     enum AVPixelFormat orig_pix_fmt;
 | |
|     uint32_t fourcc;
 | |
|     mfxFrameInfo frame_info;
 | |
|     AVBufferPool *pool;
 | |
| 
 | |
|     int initialized;
 | |
| 
 | |
|     // options set by the caller
 | |
|     int async_depth;
 | |
|     int iopattern;
 | |
|     int gpu_copy;
 | |
| 
 | |
|     char *load_plugins;
 | |
| 
 | |
|     mfxExtBuffer **ext_buffers;
 | |
|     int         nb_ext_buffers;
 | |
| } QSVContext;
 | |
| 
 | |
| static const AVCodecHWConfigInternal *const qsv_hw_configs[] = {
 | |
|     &(const AVCodecHWConfigInternal) {
 | |
|         .public = {
 | |
|             .pix_fmt     = AV_PIX_FMT_QSV,
 | |
|             .methods     = AV_CODEC_HW_CONFIG_METHOD_HW_FRAMES_CTX |
 | |
|                            AV_CODEC_HW_CONFIG_METHOD_AD_HOC,
 | |
|             .device_type = AV_HWDEVICE_TYPE_QSV,
 | |
|         },
 | |
|         .hwaccel = NULL,
 | |
|     },
 | |
|     NULL
 | |
| };
 | |
| 
 | |
| static int qsv_get_continuous_buffer(AVCodecContext *avctx, AVFrame *frame,
 | |
|                                      AVBufferPool *pool)
 | |
| {
 | |
|     int ret = 0;
 | |
| 
 | |
|     ff_decode_frame_props(avctx, frame);
 | |
| 
 | |
|     frame->width       = avctx->width;
 | |
|     frame->height      = avctx->height;
 | |
| 
 | |
|     switch (avctx->pix_fmt) {
 | |
|     case AV_PIX_FMT_NV12:
 | |
|         frame->linesize[0] = FFALIGN(avctx->width, 128);
 | |
|         break;
 | |
|     case AV_PIX_FMT_P010:
 | |
|         frame->linesize[0] = 2 * FFALIGN(avctx->width, 128);
 | |
|         break;
 | |
|     default:
 | |
|         av_log(avctx, AV_LOG_ERROR, "Unsupported pixel format.\n");
 | |
|         return AVERROR(EINVAL);
 | |
|     }
 | |
| 
 | |
|     frame->linesize[1] = frame->linesize[0];
 | |
|     frame->buf[0]      = av_buffer_pool_get(pool);
 | |
|     if (!frame->buf[0])
 | |
|         return AVERROR(ENOMEM);
 | |
| 
 | |
|     frame->data[0] = frame->buf[0]->data;
 | |
|     frame->data[1] = frame->data[0] +
 | |
|                             frame->linesize[0] * FFALIGN(avctx->height, 64);
 | |
| 
 | |
|     ret = ff_attach_decode_data(frame);
 | |
|     if (ret < 0)
 | |
|         return ret;
 | |
| 
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| static int qsv_init_session(AVCodecContext *avctx, QSVContext *q, mfxSession session,
 | |
|                             AVBufferRef *hw_frames_ref, AVBufferRef *hw_device_ref)
 | |
| {
 | |
|     int ret;
 | |
| 
 | |
|     if (q->gpu_copy == MFX_GPUCOPY_ON &&
 | |
|         !(q->iopattern & MFX_IOPATTERN_OUT_SYSTEM_MEMORY)) {
 | |
|         av_log(avctx, AV_LOG_WARNING, "GPU-accelerated memory copy "
 | |
|                         "only works in system memory mode.\n");
 | |
|         q->gpu_copy = MFX_GPUCOPY_OFF;
 | |
|     }
 | |
|     if (session) {
 | |
|         q->session = session;
 | |
|     } else if (hw_frames_ref) {
 | |
|         if (q->internal_qs.session) {
 | |
|             MFXClose(q->internal_qs.session);
 | |
|             q->internal_qs.session = NULL;
 | |
|         }
 | |
|         av_buffer_unref(&q->frames_ctx.hw_frames_ctx);
 | |
| 
 | |
|         q->frames_ctx.hw_frames_ctx = av_buffer_ref(hw_frames_ref);
 | |
|         if (!q->frames_ctx.hw_frames_ctx)
 | |
|             return AVERROR(ENOMEM);
 | |
| 
 | |
|         ret = ff_qsv_init_session_frames(avctx, &q->internal_qs.session,
 | |
|                                          &q->frames_ctx, q->load_plugins,
 | |
|                                          q->iopattern == MFX_IOPATTERN_OUT_OPAQUE_MEMORY,
 | |
|                                          q->gpu_copy);
 | |
|         if (ret < 0) {
 | |
|             av_buffer_unref(&q->frames_ctx.hw_frames_ctx);
 | |
|             return ret;
 | |
|         }
 | |
| 
 | |
|         q->session = q->internal_qs.session;
 | |
|     } else if (hw_device_ref) {
 | |
|         if (q->internal_qs.session) {
 | |
|             MFXClose(q->internal_qs.session);
 | |
|             q->internal_qs.session = NULL;
 | |
|         }
 | |
| 
 | |
|         ret = ff_qsv_init_session_device(avctx, &q->internal_qs.session,
 | |
|                                          hw_device_ref, q->load_plugins, q->gpu_copy);
 | |
|         if (ret < 0)
 | |
|             return ret;
 | |
| 
 | |
|         q->session = q->internal_qs.session;
 | |
|     } else {
 | |
|         if (!q->internal_qs.session) {
 | |
|             ret = ff_qsv_init_internal_session(avctx, &q->internal_qs,
 | |
|                                                q->load_plugins, q->gpu_copy);
 | |
|             if (ret < 0)
 | |
|                 return ret;
 | |
|         }
 | |
| 
 | |
|         q->session = q->internal_qs.session;
 | |
|     }
 | |
| 
 | |
|     /* make sure the decoder is uninitialized */
 | |
|     MFXVideoDECODE_Close(q->session);
 | |
| 
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| static inline unsigned int qsv_fifo_item_size(void)
 | |
| {
 | |
|     return sizeof(mfxSyncPoint*) + sizeof(QSVFrame*);
 | |
| }
 | |
| 
 | |
| static inline unsigned int qsv_fifo_size(const AVFifoBuffer* fifo)
 | |
| {
 | |
|     return av_fifo_size(fifo) / qsv_fifo_item_size();
 | |
| }
 | |
| 
 | |
| static int qsv_decode_preinit(AVCodecContext *avctx, QSVContext *q, enum AVPixelFormat pix_fmt, mfxVideoParam *param)
 | |
| {
 | |
|     mfxSession session = NULL;
 | |
|     int iopattern = 0;
 | |
|     int ret;
 | |
|     enum AVPixelFormat pix_fmts[3] = {
 | |
|         AV_PIX_FMT_QSV, /* opaque format in case of video memory output */
 | |
|         pix_fmt,        /* system memory format obtained from bitstream parser */
 | |
|         AV_PIX_FMT_NONE };
 | |
| 
 | |
|     ret = ff_get_format(avctx, pix_fmts);
 | |
|     if (ret < 0) {
 | |
|         q->orig_pix_fmt = avctx->pix_fmt = AV_PIX_FMT_NONE;
 | |
|         return ret;
 | |
|     }
 | |
| 
 | |
|     if (!q->async_fifo) {
 | |
|         q->async_fifo = av_fifo_alloc(q->async_depth * qsv_fifo_item_size());
 | |
|         if (!q->async_fifo)
 | |
|             return AVERROR(ENOMEM);
 | |
|     }
 | |
| 
 | |
|     if (avctx->pix_fmt == AV_PIX_FMT_QSV && avctx->hwaccel_context) {
 | |
|         AVQSVContext *user_ctx = avctx->hwaccel_context;
 | |
|         session           = user_ctx->session;
 | |
|         iopattern         = user_ctx->iopattern;
 | |
|         q->ext_buffers    = user_ctx->ext_buffers;
 | |
|         q->nb_ext_buffers = user_ctx->nb_ext_buffers;
 | |
|     }
 | |
| 
 | |
|     if (avctx->hw_frames_ctx) {
 | |
|         AVHWFramesContext    *frames_ctx = (AVHWFramesContext*)avctx->hw_frames_ctx->data;
 | |
|         AVQSVFramesContext *frames_hwctx = frames_ctx->hwctx;
 | |
| 
 | |
|         if (!iopattern) {
 | |
|             if (frames_hwctx->frame_type & MFX_MEMTYPE_OPAQUE_FRAME)
 | |
|                 iopattern = MFX_IOPATTERN_OUT_OPAQUE_MEMORY;
 | |
|             else if (frames_hwctx->frame_type & MFX_MEMTYPE_VIDEO_MEMORY_DECODER_TARGET)
 | |
|                 iopattern = MFX_IOPATTERN_OUT_VIDEO_MEMORY;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     if (!iopattern)
 | |
|         iopattern = MFX_IOPATTERN_OUT_SYSTEM_MEMORY;
 | |
|     q->iopattern = iopattern;
 | |
| 
 | |
|     ff_qsv_print_iopattern(avctx, q->iopattern, "Decoder");
 | |
| 
 | |
|     ret = qsv_init_session(avctx, q, session, avctx->hw_frames_ctx, avctx->hw_device_ctx);
 | |
|     if (ret < 0) {
 | |
|         av_log(avctx, AV_LOG_ERROR, "Error initializing an MFX session\n");
 | |
|         return ret;
 | |
|     }
 | |
| 
 | |
|     param->IOPattern   = q->iopattern;
 | |
|     param->AsyncDepth  = q->async_depth;
 | |
|     param->ExtParam    = q->ext_buffers;
 | |
|     param->NumExtParam = q->nb_ext_buffers;
 | |
| 
 | |
|     return 0;
 | |
|  }
 | |
| 
 | |
| static int qsv_decode_init_context(AVCodecContext *avctx, QSVContext *q, mfxVideoParam *param)
 | |
| {
 | |
|     int ret;
 | |
| 
 | |
|     avctx->width        = param->mfx.FrameInfo.CropW;
 | |
|     avctx->height       = param->mfx.FrameInfo.CropH;
 | |
|     avctx->coded_width  = param->mfx.FrameInfo.Width;
 | |
|     avctx->coded_height = param->mfx.FrameInfo.Height;
 | |
|     avctx->level        = param->mfx.CodecLevel;
 | |
|     avctx->profile      = param->mfx.CodecProfile;
 | |
|     avctx->field_order  = ff_qsv_map_picstruct(param->mfx.FrameInfo.PicStruct);
 | |
|     avctx->pix_fmt      = ff_qsv_map_fourcc(param->mfx.FrameInfo.FourCC);
 | |
| 
 | |
|     ret = MFXVideoDECODE_Init(q->session, param);
 | |
|     if (ret < 0)
 | |
|         return ff_qsv_print_error(avctx, ret,
 | |
|                                   "Error initializing the MFX video decoder");
 | |
| 
 | |
|     q->frame_info = param->mfx.FrameInfo;
 | |
| 
 | |
|     if (!avctx->hw_frames_ctx)
 | |
|         q->pool = av_buffer_pool_init(av_image_get_buffer_size(avctx->pix_fmt,
 | |
|                     FFALIGN(avctx->width, 128), FFALIGN(avctx->height, 64), 1), av_buffer_allocz);
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| static int qsv_decode_header(AVCodecContext *avctx, QSVContext *q,
 | |
|                              const AVPacket *avpkt, enum AVPixelFormat pix_fmt,
 | |
|                              mfxVideoParam *param)
 | |
| {
 | |
|     int ret;
 | |
| 
 | |
|     mfxBitstream bs = { 0 };
 | |
| 
 | |
|     if (avpkt->size) {
 | |
|         bs.Data       = avpkt->data;
 | |
|         bs.DataLength = avpkt->size;
 | |
|         bs.MaxLength  = bs.DataLength;
 | |
|         bs.TimeStamp  = PTS_TO_MFX_PTS(avpkt->pts, avctx->pkt_timebase);
 | |
|         if (avctx->field_order == AV_FIELD_PROGRESSIVE)
 | |
|             bs.DataFlag   |= MFX_BITSTREAM_COMPLETE_FRAME;
 | |
|     } else
 | |
|         return AVERROR_INVALIDDATA;
 | |
| 
 | |
| 
 | |
|     if(!q->session) {
 | |
|         ret = qsv_decode_preinit(avctx, q, pix_fmt, param);
 | |
|         if (ret < 0)
 | |
|             return ret;
 | |
|     }
 | |
| 
 | |
|     ret = ff_qsv_codec_id_to_mfx(avctx->codec_id);
 | |
|     if (ret < 0)
 | |
|         return ret;
 | |
| 
 | |
|     param->mfx.CodecId = ret;
 | |
|     ret = MFXVideoDECODE_DecodeHeader(q->session, &bs, param);
 | |
|     if (MFX_ERR_MORE_DATA == ret) {
 | |
|        return AVERROR(EAGAIN);
 | |
|     }
 | |
|     if (ret < 0)
 | |
|         return ff_qsv_print_error(avctx, ret,
 | |
|                 "Error decoding stream header");
 | |
| 
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| static int alloc_frame(AVCodecContext *avctx, QSVContext *q, QSVFrame *frame)
 | |
| {
 | |
|     int ret;
 | |
| 
 | |
|     if (q->pool)
 | |
|         ret = qsv_get_continuous_buffer(avctx, frame->frame, q->pool);
 | |
|     else
 | |
|         ret = ff_get_buffer(avctx, frame->frame, AV_GET_BUFFER_FLAG_REF);
 | |
| 
 | |
|     if (ret < 0)
 | |
|         return ret;
 | |
| 
 | |
|     if (frame->frame->format == AV_PIX_FMT_QSV) {
 | |
|         frame->surface = *(mfxFrameSurface1*)frame->frame->data[3];
 | |
|     } else {
 | |
|         frame->surface.Info = q->frame_info;
 | |
| 
 | |
|         frame->surface.Data.PitchLow = frame->frame->linesize[0];
 | |
|         frame->surface.Data.Y        = frame->frame->data[0];
 | |
|         frame->surface.Data.UV       = frame->frame->data[1];
 | |
|     }
 | |
| 
 | |
|     if (q->frames_ctx.mids) {
 | |
|         ret = ff_qsv_find_surface_idx(&q->frames_ctx, frame);
 | |
|         if (ret < 0)
 | |
|             return ret;
 | |
| 
 | |
|         frame->surface.Data.MemId = &q->frames_ctx.mids[ret];
 | |
|     }
 | |
|     frame->surface.Data.ExtParam    = &frame->ext_param;
 | |
|     frame->surface.Data.NumExtParam = 1;
 | |
|     frame->ext_param                = (mfxExtBuffer*)&frame->dec_info;
 | |
|     frame->dec_info.Header.BufferId = MFX_EXTBUFF_DECODED_FRAME_INFO;
 | |
|     frame->dec_info.Header.BufferSz = sizeof(frame->dec_info);
 | |
| 
 | |
|     frame->used = 1;
 | |
| 
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| static void qsv_clear_unused_frames(QSVContext *q)
 | |
| {
 | |
|     QSVFrame *cur = q->work_frames;
 | |
|     while (cur) {
 | |
|         if (cur->used && !cur->surface.Data.Locked && !cur->queued) {
 | |
|             cur->used = 0;
 | |
|             av_frame_unref(cur->frame);
 | |
|         }
 | |
|         cur = cur->next;
 | |
|     }
 | |
| }
 | |
| 
 | |
| static int get_surface(AVCodecContext *avctx, QSVContext *q, mfxFrameSurface1 **surf)
 | |
| {
 | |
|     QSVFrame *frame, **last;
 | |
|     int ret;
 | |
| 
 | |
|     qsv_clear_unused_frames(q);
 | |
| 
 | |
|     frame = q->work_frames;
 | |
|     last  = &q->work_frames;
 | |
|     while (frame) {
 | |
|         if (!frame->used) {
 | |
|             ret = alloc_frame(avctx, q, frame);
 | |
|             if (ret < 0)
 | |
|                 return ret;
 | |
|             *surf = &frame->surface;
 | |
|             return 0;
 | |
|         }
 | |
| 
 | |
|         last  = &frame->next;
 | |
|         frame = frame->next;
 | |
|     }
 | |
| 
 | |
|     frame = av_mallocz(sizeof(*frame));
 | |
|     if (!frame)
 | |
|         return AVERROR(ENOMEM);
 | |
|     frame->frame = av_frame_alloc();
 | |
|     if (!frame->frame) {
 | |
|         av_freep(&frame);
 | |
|         return AVERROR(ENOMEM);
 | |
|     }
 | |
|     *last = frame;
 | |
| 
 | |
|     ret = alloc_frame(avctx, q, frame);
 | |
|     if (ret < 0)
 | |
|         return ret;
 | |
| 
 | |
|     *surf = &frame->surface;
 | |
| 
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| static QSVFrame *find_frame(QSVContext *q, mfxFrameSurface1 *surf)
 | |
| {
 | |
|     QSVFrame *cur = q->work_frames;
 | |
|     while (cur) {
 | |
|         if (surf == &cur->surface)
 | |
|             return cur;
 | |
|         cur = cur->next;
 | |
|     }
 | |
|     return NULL;
 | |
| }
 | |
| 
 | |
| static int qsv_decode(AVCodecContext *avctx, QSVContext *q,
 | |
|                       AVFrame *frame, int *got_frame,
 | |
|                       const AVPacket *avpkt)
 | |
| {
 | |
|     QSVFrame *out_frame;
 | |
|     mfxFrameSurface1 *insurf;
 | |
|     mfxFrameSurface1 *outsurf;
 | |
|     mfxSyncPoint *sync;
 | |
|     mfxBitstream bs = { { { 0 } } };
 | |
|     int ret;
 | |
| 
 | |
|     if (avpkt->size) {
 | |
|         bs.Data       = avpkt->data;
 | |
|         bs.DataLength = avpkt->size;
 | |
|         bs.MaxLength  = bs.DataLength;
 | |
|         bs.TimeStamp  = PTS_TO_MFX_PTS(avpkt->pts, avctx->pkt_timebase);
 | |
|         if (avctx->field_order == AV_FIELD_PROGRESSIVE)
 | |
|             bs.DataFlag   |= MFX_BITSTREAM_COMPLETE_FRAME;
 | |
|     }
 | |
| 
 | |
|     sync = av_mallocz(sizeof(*sync));
 | |
|     if (!sync) {
 | |
|         av_freep(&sync);
 | |
|         return AVERROR(ENOMEM);
 | |
|     }
 | |
| 
 | |
|     do {
 | |
|         ret = get_surface(avctx, q, &insurf);
 | |
|         if (ret < 0) {
 | |
|             av_freep(&sync);
 | |
|             return ret;
 | |
|         }
 | |
| 
 | |
|         ret = MFXVideoDECODE_DecodeFrameAsync(q->session, avpkt->size ? &bs : NULL,
 | |
|                                               insurf, &outsurf, sync);
 | |
|         if (ret == MFX_WRN_DEVICE_BUSY)
 | |
|             av_usleep(500);
 | |
| 
 | |
|     } while (ret == MFX_WRN_DEVICE_BUSY || ret == MFX_ERR_MORE_SURFACE);
 | |
| 
 | |
|     if (ret != MFX_ERR_NONE &&
 | |
|         ret != MFX_ERR_MORE_DATA &&
 | |
|         ret != MFX_WRN_VIDEO_PARAM_CHANGED &&
 | |
|         ret != MFX_ERR_MORE_SURFACE) {
 | |
|         av_freep(&sync);
 | |
|         return ff_qsv_print_error(avctx, ret,
 | |
|                                   "Error during QSV decoding.");
 | |
|     }
 | |
| 
 | |
|     /* make sure we do not enter an infinite loop if the SDK
 | |
|      * did not consume any data and did not return anything */
 | |
|     if (!*sync && !bs.DataOffset) {
 | |
|         bs.DataOffset = avpkt->size;
 | |
|         ++q->zero_consume_run;
 | |
|         if (q->zero_consume_run > 1)
 | |
|             ff_qsv_print_warning(avctx, ret, "A decode call did not consume any data");
 | |
|     } else if (!*sync && bs.DataOffset) {
 | |
|         ++q->buffered_count;
 | |
|     } else {
 | |
|         q->zero_consume_run = 0;
 | |
|     }
 | |
| 
 | |
|     if (*sync) {
 | |
|         QSVFrame *out_frame = find_frame(q, outsurf);
 | |
| 
 | |
|         if (!out_frame) {
 | |
|             av_log(avctx, AV_LOG_ERROR,
 | |
|                    "The returned surface does not correspond to any frame\n");
 | |
|             av_freep(&sync);
 | |
|             return AVERROR_BUG;
 | |
|         }
 | |
| 
 | |
|         out_frame->queued = 1;
 | |
|         av_fifo_generic_write(q->async_fifo, &out_frame, sizeof(out_frame), NULL);
 | |
|         av_fifo_generic_write(q->async_fifo, &sync,      sizeof(sync),      NULL);
 | |
|     } else {
 | |
|         av_freep(&sync);
 | |
|     }
 | |
| 
 | |
|     if ((qsv_fifo_size(q->async_fifo) >= q->async_depth) ||
 | |
|         (!avpkt->size && av_fifo_size(q->async_fifo))) {
 | |
|         AVFrame *src_frame;
 | |
| 
 | |
|         av_fifo_generic_read(q->async_fifo, &out_frame, sizeof(out_frame), NULL);
 | |
|         av_fifo_generic_read(q->async_fifo, &sync,      sizeof(sync),      NULL);
 | |
|         out_frame->queued = 0;
 | |
| 
 | |
|         if (avctx->pix_fmt != AV_PIX_FMT_QSV) {
 | |
|             do {
 | |
|                 ret = MFXVideoCORE_SyncOperation(q->session, *sync, 1000);
 | |
|             } while (ret == MFX_WRN_IN_EXECUTION);
 | |
|         }
 | |
| 
 | |
|         av_freep(&sync);
 | |
| 
 | |
|         src_frame = out_frame->frame;
 | |
| 
 | |
|         ret = av_frame_ref(frame, src_frame);
 | |
|         if (ret < 0)
 | |
|             return ret;
 | |
| 
 | |
|         outsurf = &out_frame->surface;
 | |
| 
 | |
|         frame->pts = MFX_PTS_TO_PTS(outsurf->Data.TimeStamp, avctx->pkt_timebase);
 | |
| 
 | |
|         frame->repeat_pict =
 | |
|             outsurf->Info.PicStruct & MFX_PICSTRUCT_FRAME_TRIPLING ? 4 :
 | |
|             outsurf->Info.PicStruct & MFX_PICSTRUCT_FRAME_DOUBLING ? 2 :
 | |
|             outsurf->Info.PicStruct & MFX_PICSTRUCT_FIELD_REPEATED ? 1 : 0;
 | |
|         frame->top_field_first =
 | |
|             outsurf->Info.PicStruct & MFX_PICSTRUCT_FIELD_TFF;
 | |
|         frame->interlaced_frame =
 | |
|             !(outsurf->Info.PicStruct & MFX_PICSTRUCT_PROGRESSIVE);
 | |
|         frame->pict_type = ff_qsv_map_pictype(out_frame->dec_info.FrameType);
 | |
|         //Key frame is IDR frame is only suitable for H264. For HEVC, IRAPs are key frames.
 | |
|         if (avctx->codec_id == AV_CODEC_ID_H264)
 | |
|             frame->key_frame = !!(out_frame->dec_info.FrameType & MFX_FRAMETYPE_IDR);
 | |
| 
 | |
|         /* update the surface properties */
 | |
|         if (avctx->pix_fmt == AV_PIX_FMT_QSV)
 | |
|             ((mfxFrameSurface1*)frame->data[3])->Info = outsurf->Info;
 | |
| 
 | |
|         *got_frame = 1;
 | |
|     }
 | |
| 
 | |
|     return bs.DataOffset;
 | |
| }
 | |
| 
 | |
| static void qsv_decode_close_qsvcontext(QSVContext *q)
 | |
| {
 | |
|     QSVFrame *cur = q->work_frames;
 | |
| 
 | |
|     if (q->session)
 | |
|         MFXVideoDECODE_Close(q->session);
 | |
| 
 | |
|     while (q->async_fifo && av_fifo_size(q->async_fifo)) {
 | |
|         QSVFrame *out_frame;
 | |
|         mfxSyncPoint *sync;
 | |
| 
 | |
|         av_fifo_generic_read(q->async_fifo, &out_frame, sizeof(out_frame), NULL);
 | |
|         av_fifo_generic_read(q->async_fifo, &sync,      sizeof(sync),      NULL);
 | |
| 
 | |
|         av_freep(&sync);
 | |
|     }
 | |
| 
 | |
|     while (cur) {
 | |
|         q->work_frames = cur->next;
 | |
|         av_frame_free(&cur->frame);
 | |
|         av_freep(&cur);
 | |
|         cur = q->work_frames;
 | |
|     }
 | |
| 
 | |
|     av_fifo_free(q->async_fifo);
 | |
|     q->async_fifo = NULL;
 | |
| 
 | |
|     ff_qsv_close_internal_session(&q->internal_qs);
 | |
| 
 | |
|     av_buffer_unref(&q->frames_ctx.hw_frames_ctx);
 | |
|     av_buffer_unref(&q->frames_ctx.mids_buf);
 | |
|     av_buffer_pool_uninit(&q->pool);
 | |
| }
 | |
| 
 | |
| static int qsv_process_data(AVCodecContext *avctx, QSVContext *q,
 | |
|                             AVFrame *frame, int *got_frame, const AVPacket *pkt)
 | |
| {
 | |
|     int ret;
 | |
|     mfxVideoParam param = { 0 };
 | |
|     enum AVPixelFormat pix_fmt = AV_PIX_FMT_NV12;
 | |
| 
 | |
|     if (!pkt->size)
 | |
|         return qsv_decode(avctx, q, frame, got_frame, pkt);
 | |
| 
 | |
|     /* TODO: flush delayed frames on reinit */
 | |
| 
 | |
|     // sw_pix_fmt, coded_width/height should be set for ff_get_format(),
 | |
|     // assume sw_pix_fmt is NV12 and coded_width/height to be 1280x720,
 | |
|     // the assumption may be not corret but will be updated after header decoded if not true.
 | |
|     if (q->orig_pix_fmt != AV_PIX_FMT_NONE)
 | |
|         pix_fmt = q->orig_pix_fmt;
 | |
|     if (!avctx->coded_width)
 | |
|         avctx->coded_width = 1280;
 | |
|     if (!avctx->coded_height)
 | |
|         avctx->coded_height = 720;
 | |
| 
 | |
|     ret = qsv_decode_header(avctx, q, pkt, pix_fmt, ¶m);
 | |
| 
 | |
|     if (ret >= 0 && (q->orig_pix_fmt != ff_qsv_map_fourcc(param.mfx.FrameInfo.FourCC) ||
 | |
|         avctx->coded_width  != param.mfx.FrameInfo.Width ||
 | |
|         avctx->coded_height != param.mfx.FrameInfo.Height)) {
 | |
|         AVPacket zero_pkt = {0};
 | |
| 
 | |
|         if (q->buffered_count) {
 | |
|             q->reinit_flag = 1;
 | |
|             /* decode zero-size pkt to flush the buffered pkt before reinit */
 | |
|             q->buffered_count--;
 | |
|             return qsv_decode(avctx, q, frame, got_frame, &zero_pkt);
 | |
|         }
 | |
|         q->reinit_flag = 0;
 | |
| 
 | |
|         q->orig_pix_fmt = avctx->pix_fmt = pix_fmt = ff_qsv_map_fourcc(param.mfx.FrameInfo.FourCC);
 | |
| 
 | |
|         avctx->coded_width  = param.mfx.FrameInfo.Width;
 | |
|         avctx->coded_height = param.mfx.FrameInfo.Height;
 | |
| 
 | |
|         ret = qsv_decode_preinit(avctx, q, pix_fmt, ¶m);
 | |
|         if (ret < 0)
 | |
|             goto reinit_fail;
 | |
|         q->initialized = 0;
 | |
|     }
 | |
| 
 | |
|     if (!q->initialized) {
 | |
|         ret = qsv_decode_init_context(avctx, q, ¶m);
 | |
|         if (ret < 0)
 | |
|             goto reinit_fail;
 | |
|         q->initialized = 1;
 | |
|     }
 | |
| 
 | |
|     return qsv_decode(avctx, q, frame, got_frame, pkt);
 | |
| 
 | |
| reinit_fail:
 | |
|     q->orig_pix_fmt = avctx->pix_fmt = AV_PIX_FMT_NONE;
 | |
|     return ret;
 | |
| }
 | |
| 
 | |
| enum LoadPlugin {
 | |
|     LOAD_PLUGIN_NONE,
 | |
|     LOAD_PLUGIN_HEVC_SW,
 | |
|     LOAD_PLUGIN_HEVC_HW,
 | |
| };
 | |
| 
 | |
| typedef struct QSVDecContext {
 | |
|     AVClass *class;
 | |
|     QSVContext qsv;
 | |
| 
 | |
|     int load_plugin;
 | |
| 
 | |
|     AVFifoBuffer *packet_fifo;
 | |
| 
 | |
|     AVPacket buffer_pkt;
 | |
| } QSVDecContext;
 | |
| 
 | |
| static void qsv_clear_buffers(QSVDecContext *s)
 | |
| {
 | |
|     AVPacket pkt;
 | |
|     while (av_fifo_size(s->packet_fifo) >= sizeof(pkt)) {
 | |
|         av_fifo_generic_read(s->packet_fifo, &pkt, sizeof(pkt), NULL);
 | |
|         av_packet_unref(&pkt);
 | |
|     }
 | |
| 
 | |
|     av_packet_unref(&s->buffer_pkt);
 | |
| }
 | |
| 
 | |
| static av_cold int qsv_decode_close(AVCodecContext *avctx)
 | |
| {
 | |
|     QSVDecContext *s = avctx->priv_data;
 | |
| 
 | |
|     av_freep(&s->qsv.load_plugins);
 | |
| 
 | |
|     qsv_decode_close_qsvcontext(&s->qsv);
 | |
| 
 | |
|     qsv_clear_buffers(s);
 | |
| 
 | |
|     av_fifo_free(s->packet_fifo);
 | |
| 
 | |
|     return 0;
 | |
| }
 | |
| 
 | |
| static av_cold int qsv_decode_init(AVCodecContext *avctx)
 | |
| {
 | |
|     QSVDecContext *s = avctx->priv_data;
 | |
|     int ret;
 | |
|     const char *uid = NULL;
 | |
| 
 | |
|     if (avctx->codec_id == AV_CODEC_ID_VP8) {
 | |
|         uid = "f622394d8d87452f878c51f2fc9b4131";
 | |
|     } else if (avctx->codec_id == AV_CODEC_ID_VP9) {
 | |
|         uid = "a922394d8d87452f878c51f2fc9b4131";
 | |
|     }
 | |
|     else if (avctx->codec_id == AV_CODEC_ID_HEVC && s->load_plugin != LOAD_PLUGIN_NONE) {
 | |
|         static const char * const uid_hevcdec_sw = "15dd936825ad475ea34e35f3f54217a6";
 | |
|         static const char * const uid_hevcdec_hw = "33a61c0b4c27454ca8d85dde757c6f8e";
 | |
| 
 | |
|         if (s->qsv.load_plugins[0]) {
 | |
|             av_log(avctx, AV_LOG_WARNING,
 | |
|                    "load_plugins is not empty, but load_plugin is not set to 'none'."
 | |
|                    "The load_plugin value will be ignored.\n");
 | |
|         } else {
 | |
|             if (s->load_plugin == LOAD_PLUGIN_HEVC_SW)
 | |
|                 uid = uid_hevcdec_sw;
 | |
|             else
 | |
|                 uid = uid_hevcdec_hw;
 | |
|         }
 | |
|     }
 | |
|     if (uid) {
 | |
|         av_freep(&s->qsv.load_plugins);
 | |
|         s->qsv.load_plugins = av_strdup(uid);
 | |
|         if (!s->qsv.load_plugins)
 | |
|             return AVERROR(ENOMEM);
 | |
|     }
 | |
| 
 | |
|     s->qsv.orig_pix_fmt = AV_PIX_FMT_NV12;
 | |
|     s->packet_fifo = av_fifo_alloc(sizeof(AVPacket));
 | |
|     if (!s->packet_fifo) {
 | |
|         ret = AVERROR(ENOMEM);
 | |
|         goto fail;
 | |
|     }
 | |
| 
 | |
|     if (!avctx->pkt_timebase.num)
 | |
|         av_log(avctx, AV_LOG_WARNING, "Invalid pkt_timebase, passing timestamps as-is.\n");
 | |
| 
 | |
|     return 0;
 | |
| fail:
 | |
|     qsv_decode_close(avctx);
 | |
|     return ret;
 | |
| }
 | |
| 
 | |
| static int qsv_decode_frame(AVCodecContext *avctx, void *data,
 | |
|                             int *got_frame, AVPacket *avpkt)
 | |
| {
 | |
|     QSVDecContext *s = avctx->priv_data;
 | |
|     AVFrame *frame    = data;
 | |
|     int ret;
 | |
| 
 | |
|     /* buffer the input packet */
 | |
|     if (avpkt->size) {
 | |
|         AVPacket input_ref;
 | |
| 
 | |
|         if (av_fifo_space(s->packet_fifo) < sizeof(input_ref)) {
 | |
|             ret = av_fifo_realloc2(s->packet_fifo,
 | |
|                                    av_fifo_size(s->packet_fifo) + sizeof(input_ref));
 | |
|             if (ret < 0)
 | |
|                 return ret;
 | |
|         }
 | |
| 
 | |
|         ret = av_packet_ref(&input_ref, avpkt);
 | |
|         if (ret < 0)
 | |
|             return ret;
 | |
|         av_fifo_generic_write(s->packet_fifo, &input_ref, sizeof(input_ref), NULL);
 | |
|     }
 | |
| 
 | |
|     /* process buffered data */
 | |
|     while (!*got_frame) {
 | |
|         /* prepare the input data */
 | |
|         if (s->buffer_pkt.size <= 0) {
 | |
|             /* no more data */
 | |
|             if (av_fifo_size(s->packet_fifo) < sizeof(AVPacket))
 | |
|                 return avpkt->size ? avpkt->size : qsv_process_data(avctx, &s->qsv, frame, got_frame, avpkt);
 | |
|             /* in progress of reinit, no read from fifo and keep the buffer_pkt */
 | |
|             if (!s->qsv.reinit_flag) {
 | |
|                 av_packet_unref(&s->buffer_pkt);
 | |
|                 av_fifo_generic_read(s->packet_fifo, &s->buffer_pkt, sizeof(s->buffer_pkt), NULL);
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         ret = qsv_process_data(avctx, &s->qsv, frame, got_frame, &s->buffer_pkt);
 | |
|         if (ret < 0){
 | |
|             /* Drop buffer_pkt when failed to decode the packet. Otherwise,
 | |
|                the decoder will keep decoding the failure packet. */
 | |
|             av_packet_unref(&s->buffer_pkt);
 | |
|             return ret;
 | |
|         }
 | |
|         if (s->qsv.reinit_flag)
 | |
|             continue;
 | |
| 
 | |
|         s->buffer_pkt.size -= ret;
 | |
|         s->buffer_pkt.data += ret;
 | |
|     }
 | |
| 
 | |
|     return avpkt->size;
 | |
| }
 | |
| 
 | |
| static void qsv_decode_flush(AVCodecContext *avctx)
 | |
| {
 | |
|     QSVDecContext *s = avctx->priv_data;
 | |
| 
 | |
|     qsv_clear_buffers(s);
 | |
| 
 | |
|     s->qsv.orig_pix_fmt = AV_PIX_FMT_NONE;
 | |
|     s->qsv.initialized = 0;
 | |
| }
 | |
| 
 | |
| #define OFFSET(x) offsetof(QSVDecContext, x)
 | |
| #define VD AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_DECODING_PARAM
 | |
| 
 | |
| #define DEFINE_QSV_DECODER_WITH_OPTION(x, X, bsf_name, opt) \
 | |
| static const AVClass x##_qsv_class = { \
 | |
|     .class_name = #x "_qsv", \
 | |
|     .item_name  = av_default_item_name, \
 | |
|     .option     = opt, \
 | |
|     .version    = LIBAVUTIL_VERSION_INT, \
 | |
| }; \
 | |
| const AVCodec ff_##x##_qsv_decoder = { \
 | |
|     .name           = #x "_qsv", \
 | |
|     .long_name      = NULL_IF_CONFIG_SMALL(#X " video (Intel Quick Sync Video acceleration)"), \
 | |
|     .priv_data_size = sizeof(QSVDecContext), \
 | |
|     .type           = AVMEDIA_TYPE_VIDEO, \
 | |
|     .id             = AV_CODEC_ID_##X, \
 | |
|     .init           = qsv_decode_init, \
 | |
|     .decode         = qsv_decode_frame, \
 | |
|     .flush          = qsv_decode_flush, \
 | |
|     .close          = qsv_decode_close, \
 | |
|     .bsfs           = bsf_name, \
 | |
|     .capabilities   = AV_CODEC_CAP_DELAY | AV_CODEC_CAP_DR1 | AV_CODEC_CAP_AVOID_PROBING | AV_CODEC_CAP_HYBRID, \
 | |
|     .priv_class     = &x##_qsv_class, \
 | |
|     .pix_fmts       = (const enum AVPixelFormat[]){ AV_PIX_FMT_NV12, \
 | |
|                                                     AV_PIX_FMT_P010, \
 | |
|                                                     AV_PIX_FMT_QSV, \
 | |
|                                                     AV_PIX_FMT_NONE }, \
 | |
|     .hw_configs     = qsv_hw_configs, \
 | |
|     .wrapper_name   = "qsv", \
 | |
| }; \
 | |
| 
 | |
| #define DEFINE_QSV_DECODER(x, X, bsf_name) DEFINE_QSV_DECODER_WITH_OPTION(x, X, bsf_name, options)
 | |
| 
 | |
| #if CONFIG_HEVC_QSV_DECODER
 | |
| static const AVOption hevc_options[] = {
 | |
|     { "async_depth", "Internal parallelization depth, the higher the value the higher the latency.", OFFSET(qsv.async_depth), AV_OPT_TYPE_INT, { .i64 = ASYNC_DEPTH_DEFAULT }, 1, INT_MAX, VD },
 | |
| 
 | |
|     { "load_plugin", "A user plugin to load in an internal session", OFFSET(load_plugin), AV_OPT_TYPE_INT, { .i64 = LOAD_PLUGIN_HEVC_HW }, LOAD_PLUGIN_NONE, LOAD_PLUGIN_HEVC_HW, VD, "load_plugin" },
 | |
|     { "none",     NULL, 0, AV_OPT_TYPE_CONST, { .i64 = LOAD_PLUGIN_NONE },    0, 0, VD, "load_plugin" },
 | |
|     { "hevc_sw",  NULL, 0, AV_OPT_TYPE_CONST, { .i64 = LOAD_PLUGIN_HEVC_SW }, 0, 0, VD, "load_plugin" },
 | |
|     { "hevc_hw",  NULL, 0, AV_OPT_TYPE_CONST, { .i64 = LOAD_PLUGIN_HEVC_HW }, 0, 0, VD, "load_plugin" },
 | |
| 
 | |
|     { "load_plugins", "A :-separate list of hexadecimal plugin UIDs to load in an internal session",
 | |
|         OFFSET(qsv.load_plugins), AV_OPT_TYPE_STRING, { .str = "" }, 0, 0, VD },
 | |
| 
 | |
|     { "gpu_copy", "A GPU-accelerated copy between video and system memory", OFFSET(qsv.gpu_copy), AV_OPT_TYPE_INT, { .i64 = MFX_GPUCOPY_DEFAULT }, MFX_GPUCOPY_DEFAULT, MFX_GPUCOPY_OFF, VD, "gpu_copy"},
 | |
|         { "default", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_GPUCOPY_DEFAULT }, 0, 0, VD, "gpu_copy"},
 | |
|         { "on",      NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_GPUCOPY_ON },      0, 0, VD, "gpu_copy"},
 | |
|         { "off",     NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_GPUCOPY_OFF },     0, 0, VD, "gpu_copy"},
 | |
|     { NULL },
 | |
| };
 | |
| DEFINE_QSV_DECODER_WITH_OPTION(hevc, HEVC, "hevc_mp4toannexb", hevc_options)
 | |
| #endif
 | |
| 
 | |
| static const AVOption options[] = {
 | |
|     { "async_depth", "Internal parallelization depth, the higher the value the higher the latency.", OFFSET(qsv.async_depth), AV_OPT_TYPE_INT, { .i64 = ASYNC_DEPTH_DEFAULT }, 1, INT_MAX, VD },
 | |
| 
 | |
|     { "gpu_copy", "A GPU-accelerated copy between video and system memory", OFFSET(qsv.gpu_copy), AV_OPT_TYPE_INT, { .i64 = MFX_GPUCOPY_DEFAULT }, MFX_GPUCOPY_DEFAULT, MFX_GPUCOPY_OFF, VD, "gpu_copy"},
 | |
|         { "default", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_GPUCOPY_DEFAULT }, 0, 0, VD, "gpu_copy"},
 | |
|         { "on",      NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_GPUCOPY_ON },      0, 0, VD, "gpu_copy"},
 | |
|         { "off",     NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_GPUCOPY_OFF },     0, 0, VD, "gpu_copy"},
 | |
|     { NULL },
 | |
| };
 | |
| 
 | |
| #if CONFIG_H264_QSV_DECODER
 | |
| DEFINE_QSV_DECODER(h264, H264, "h264_mp4toannexb")
 | |
| #endif
 | |
| 
 | |
| #if CONFIG_MPEG2_QSV_DECODER
 | |
| DEFINE_QSV_DECODER(mpeg2, MPEG2VIDEO, NULL)
 | |
| #endif
 | |
| 
 | |
| #if CONFIG_VC1_QSV_DECODER
 | |
| DEFINE_QSV_DECODER(vc1, VC1, NULL)
 | |
| #endif
 | |
| 
 | |
| #if CONFIG_MJPEG_QSV_DECODER
 | |
| DEFINE_QSV_DECODER(mjpeg, MJPEG, NULL)
 | |
| #endif
 | |
| 
 | |
| #if CONFIG_VP8_QSV_DECODER
 | |
| DEFINE_QSV_DECODER(vp8, VP8, NULL)
 | |
| #endif
 | |
| 
 | |
| #if CONFIG_VP9_QSV_DECODER
 | |
| DEFINE_QSV_DECODER(vp9, VP9, NULL)
 | |
| #endif
 | |
| 
 | |
| #if CONFIG_AV1_QSV_DECODER
 | |
| DEFINE_QSV_DECODER(av1, AV1, NULL)
 | |
| #endif
 |