It is a d3d12va requirement that FrameStartOffset be aligned according to the hardware limitation. However, this alignment padding can be trimmed at output to reduce the coded size. An aligned_header_size field is added to D3D12VAEncodePicture for this purpose. Signed-off-by: Tong Wu <wutong1208@outlook.com>
		
			
				
	
	
		
			338 lines
		
	
	
		
			7.9 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			338 lines
		
	
	
		
			7.9 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/*
 | 
						|
 * Direct3D 12 HW acceleration video encoder
 | 
						|
 *
 | 
						|
 * Copyright (c) 2024 Intel Corporation
 | 
						|
 *
 | 
						|
 * This file is part of FFmpeg.
 | 
						|
 *
 | 
						|
 * FFmpeg is free software; you can redistribute it and/or
 | 
						|
 * modify it under the terms of the GNU Lesser General Public
 | 
						|
 * License as published by the Free Software Foundation; either
 | 
						|
 * version 2.1 of the License, or (at your option) any later version.
 | 
						|
 *
 | 
						|
 * FFmpeg is distributed in the hope that it will be useful,
 | 
						|
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
						|
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | 
						|
 * Lesser General Public License for more details.
 | 
						|
 *
 | 
						|
 * You should have received a copy of the GNU Lesser General Public
 | 
						|
 * License along with FFmpeg; if not, write to the Free Software
 | 
						|
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 | 
						|
 */
 | 
						|
 | 
						|
#ifndef AVCODEC_D3D12VA_ENCODE_H
 | 
						|
#define AVCODEC_D3D12VA_ENCODE_H
 | 
						|
 | 
						|
#include "libavutil/fifo.h"
 | 
						|
#include "libavutil/hwcontext.h"
 | 
						|
#include "libavutil/hwcontext_d3d12va_internal.h"
 | 
						|
#include "libavutil/hwcontext_d3d12va.h"
 | 
						|
#include "avcodec.h"
 | 
						|
#include "internal.h"
 | 
						|
#include "hwconfig.h"
 | 
						|
#include "hw_base_encode.h"
 | 
						|
 | 
						|
struct D3D12VAEncodeType;
 | 
						|
 | 
						|
extern const AVCodecHWConfigInternal *const ff_d3d12va_encode_hw_configs[];
 | 
						|
 | 
						|
/*
 * Upper bound for a parameter buffer.
 * NOTE(review): presumably a size in bytes for packed header/parameter
 * data - confirm against the users of this macro.
 */
#define MAX_PARAM_BUFFER_SIZE 4096

/*
 * Asynchronous depth used by the D3D12 video encoder.
 * NOTE(review): presumably the number of operations kept in flight -
 * confirm against the implementation.
 */
#define D3D12VA_VIDEO_ENC_ASYNC_DEPTH 8
 | 
						|
 | 
						|
typedef struct D3D12VAEncodePicture {
 | 
						|
    FFHWBaseEncodePicture base;
 | 
						|
 | 
						|
    int             header_size;
 | 
						|
    int             aligned_header_size;
 | 
						|
 | 
						|
    AVD3D12VAFrame *input_surface;
 | 
						|
    AVD3D12VAFrame *recon_surface;
 | 
						|
 | 
						|
    AVBufferRef    *output_buffer_ref;
 | 
						|
    ID3D12Resource *output_buffer;
 | 
						|
 | 
						|
    ID3D12Resource *encoded_metadata;
 | 
						|
    ID3D12Resource *resolved_metadata;
 | 
						|
 | 
						|
    D3D12_VIDEO_ENCODER_PICTURE_CONTROL_CODEC_DATA pic_ctl;
 | 
						|
 | 
						|
    int             fence_value;
 | 
						|
} D3D12VAEncodePicture;
 | 
						|
 | 
						|
typedef struct D3D12VAEncodeProfile {
 | 
						|
    /**
 | 
						|
     * lavc profile value (AV_PROFILE_*).
 | 
						|
     */
 | 
						|
    int       av_profile;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Supported bit depth.
 | 
						|
     */
 | 
						|
    int       depth;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Number of components.
 | 
						|
     */
 | 
						|
    int       nb_components;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Chroma subsampling in width dimension.
 | 
						|
     */
 | 
						|
    int       log2_chroma_w;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Chroma subsampling in height dimension.
 | 
						|
     */
 | 
						|
    int       log2_chroma_h;
 | 
						|
 | 
						|
    /**
 | 
						|
     * D3D12 profile value.
 | 
						|
     */
 | 
						|
    D3D12_VIDEO_ENCODER_PROFILE_DESC d3d12_profile;
 | 
						|
} D3D12VAEncodeProfile;
 | 
						|
 | 
						|
/**
 * Rate control modes (RC_MODE_*).
 *
 * The values are contiguous starting at RC_MODE_AUTO (0); RC_MODE_MAX
 * aliases the last valid mode so it can serve as an upper bound.
 */
enum {
    RC_MODE_AUTO,
    RC_MODE_CQP,
    RC_MODE_CBR,
    RC_MODE_VBR,
    RC_MODE_QVBR,
    RC_MODE_MAX = RC_MODE_QVBR,
};
 | 
						|
 | 
						|
 | 
						|
typedef struct D3D12VAEncodeRCMode {
 | 
						|
    /**
 | 
						|
     * Mode from above enum (RC_MODE_*).
 | 
						|
     */
 | 
						|
    int mode;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Name.
 | 
						|
     *
 | 
						|
     */
 | 
						|
    const char *name;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Uses bitrate parameters.
 | 
						|
     *
 | 
						|
     */
 | 
						|
    int bitrate;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Supports maxrate distinct from bitrate.
 | 
						|
     *
 | 
						|
     */
 | 
						|
    int maxrate;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Uses quality value.
 | 
						|
     *
 | 
						|
     */
 | 
						|
    int quality;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Supports HRD/VBV parameters.
 | 
						|
     *
 | 
						|
     */
 | 
						|
    int hrd;
 | 
						|
 | 
						|
    /**
 | 
						|
     * D3D12 mode value.
 | 
						|
     */
 | 
						|
    D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE d3d12_mode;
 | 
						|
} D3D12VAEncodeRCMode;
 | 
						|
 | 
						|
typedef struct D3D12VAEncodeContext {
 | 
						|
    FFHWBaseEncodeContext base;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Codec-specific hooks.
 | 
						|
     */
 | 
						|
    const struct D3D12VAEncodeType *codec;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Explicitly set RC mode (otherwise attempt to pick from
 | 
						|
     * available modes).
 | 
						|
     */
 | 
						|
    int explicit_rc_mode;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Explicitly-set QP, for use with the "qp" options.
 | 
						|
     * (Forces CQP mode when set, overriding everything else.)
 | 
						|
     */
 | 
						|
    int explicit_qp;
 | 
						|
 | 
						|
    /**
 | 
						|
     * RC quality level - meaning depends on codec and RC mode.
 | 
						|
     * In CQP mode this sets the fixed quantiser value.
 | 
						|
     */
 | 
						|
    int rc_quality;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Chosen encoding profile details.
 | 
						|
     */
 | 
						|
    const D3D12VAEncodeProfile *profile;
 | 
						|
 | 
						|
    AVD3D12VADeviceContext *hwctx;
 | 
						|
 | 
						|
    /**
 | 
						|
     * ID3D12Device3 interface.
 | 
						|
     */
 | 
						|
    ID3D12Device3 *device3;
 | 
						|
 | 
						|
    /**
 | 
						|
     * ID3D12VideoDevice3 interface.
 | 
						|
     */
 | 
						|
    ID3D12VideoDevice3 *video_device3;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Pool of (reusable) bitstream output buffers.
 | 
						|
     */
 | 
						|
    AVBufferPool *output_buffer_pool;
 | 
						|
 | 
						|
    /**
 | 
						|
     * D3D12 video encoder.
 | 
						|
     */
 | 
						|
    AVBufferRef *encoder_ref;
 | 
						|
 | 
						|
    ID3D12VideoEncoder *encoder;
 | 
						|
 | 
						|
    /**
 | 
						|
     * D3D12 video encoder heap.
 | 
						|
     */
 | 
						|
    ID3D12VideoEncoderHeap *encoder_heap;
 | 
						|
 | 
						|
    /**
 | 
						|
     * A cached queue for reusing the D3D12 command allocators.
 | 
						|
     *
 | 
						|
     * @see https://learn.microsoft.com/en-us/windows/win32/direct3d12/recording-command-lists-and-bundles#id3d12commandallocator
 | 
						|
     */
 | 
						|
    AVFifo *allocator_queue;
 | 
						|
 | 
						|
    /**
 | 
						|
     * D3D12 command queue.
 | 
						|
     */
 | 
						|
    ID3D12CommandQueue *command_queue;
 | 
						|
 | 
						|
    /**
 | 
						|
     * D3D12 video encode command list.
 | 
						|
     */
 | 
						|
    ID3D12VideoEncodeCommandList2 *command_list;
 | 
						|
 | 
						|
    /**
 | 
						|
     * The sync context used to sync command queue.
 | 
						|
     */
 | 
						|
    AVD3D12VASyncContext sync_ctx;
 | 
						|
 | 
						|
    /**
 | 
						|
     * The bi_not_empty feature.
 | 
						|
     */
 | 
						|
    int bi_not_empty;
 | 
						|
 | 
						|
    /**
 | 
						|
     * D3D12_FEATURE structures.
 | 
						|
     */
 | 
						|
    D3D12_FEATURE_DATA_VIDEO_ENCODER_RESOURCE_REQUIREMENTS req;
 | 
						|
 | 
						|
    D3D12_FEATURE_DATA_VIDEO_ENCODER_RESOLUTION_SUPPORT_LIMITS res_limits;
 | 
						|
 | 
						|
    /**
 | 
						|
     * D3D12_VIDEO_ENCODER structures.
 | 
						|
     */
 | 
						|
    D3D12_VIDEO_ENCODER_PICTURE_RESOLUTION_DESC resolution;
 | 
						|
 | 
						|
    D3D12_VIDEO_ENCODER_CODEC_CONFIGURATION codec_conf;
 | 
						|
 | 
						|
    D3D12_VIDEO_ENCODER_RATE_CONTROL rc;
 | 
						|
 | 
						|
    D3D12_VIDEO_ENCODER_SEQUENCE_GOP_STRUCTURE gop;
 | 
						|
 | 
						|
    D3D12_VIDEO_ENCODER_LEVEL_SETTING level;
 | 
						|
} D3D12VAEncodeContext;
 | 
						|
 | 
						|
typedef struct D3D12VAEncodeType {
 | 
						|
    /**
 | 
						|
     * List of supported profiles.
 | 
						|
     */
 | 
						|
   const D3D12VAEncodeProfile *profiles;
 | 
						|
 | 
						|
    /**
 | 
						|
     * D3D12 codec name.
 | 
						|
     */
 | 
						|
    D3D12_VIDEO_ENCODER_CODEC d3d12_codec;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Codec feature flags.
 | 
						|
     */
 | 
						|
    int flags;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Default quality for this codec - used as quantiser or RC quality
 | 
						|
     * factor depending on RC mode.
 | 
						|
     */
 | 
						|
    int default_quality;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Query codec configuration and determine encode parameters like
 | 
						|
     * block sizes for surface alignment and slices. If not set, assume
 | 
						|
     * that all blocks are 16x16 and that surfaces should be aligned to match
 | 
						|
     * this.
 | 
						|
     */
 | 
						|
    int (*get_encoder_caps)(AVCodecContext *avctx);
 | 
						|
 | 
						|
    /**
 | 
						|
     * Perform any extra codec-specific configuration.
 | 
						|
     */
 | 
						|
    int (*configure)(AVCodecContext *avctx);
 | 
						|
 | 
						|
    /**
 | 
						|
     * Set codec-specific level setting.
 | 
						|
     */
 | 
						|
    int (*set_level)(AVCodecContext *avctx);
 | 
						|
 | 
						|
    /**
 | 
						|
     * The size of any private data structure associated with each
 | 
						|
     * picture (can be zero if not required).
 | 
						|
     */
 | 
						|
    size_t picture_priv_data_size;
 | 
						|
 | 
						|
    /**
 | 
						|
     * Fill the corresponding parameters.
 | 
						|
     */
 | 
						|
    int (*init_sequence_params)(AVCodecContext *avctx);
 | 
						|
 | 
						|
    int (*init_picture_params)(AVCodecContext *avctx,
 | 
						|
                               D3D12VAEncodePicture *pic);
 | 
						|
 | 
						|
    void (*free_picture_params)(D3D12VAEncodePicture *pic);
 | 
						|
 | 
						|
    /**
 | 
						|
     * Write the packed header data to the provided buffer.
 | 
						|
     */
 | 
						|
    int (*write_sequence_header)(AVCodecContext *avctx,
 | 
						|
                                 char *data, size_t *data_len);
 | 
						|
} D3D12VAEncodeType;
 | 
						|
 | 
						|
/**
 * Fetch the next encoded packet from the D3D12 encoder into pkt.
 * NOTE(review): the return convention is not visible in this header;
 * presumably 0 on success and a negative error code otherwise - confirm
 * against the implementation.
 */
int ff_d3d12va_encode_receive_packet(AVCodecContext *avctx, AVPacket *pkt);

/**
 * Common init and close entry points for the D3D12 encoders.
 * NOTE(review): presumably intended to be called from each codec's own
 * init/close callbacks - confirm against the codec files.
 */
int ff_d3d12va_encode_init(AVCodecContext *avctx);
int ff_d3d12va_encode_close(AVCodecContext *avctx);
 | 
						|
 | 
						|
/*
 * Option-table helpers for the "rc_mode" option.
 *
 * Both macros expand to brace-enclosed option entries and rely on names
 * provided by the including file: FLAGS, OFFSET() and the AV_OPT_TYPE_*
 * constants. OFFSET() is applied to common.explicit_rc_mode, so the
 * including codec's private context must expose the D3D12 encode
 * context as a member named "common".
 *
 * D3D12VA_ENCODE_RC_MODE(name, desc) builds one AV_OPT_TYPE_CONST entry
 * whose option name is the stringified mode name and whose value is
 * RC_MODE_<name>.
 */
#define D3D12VA_ENCODE_RC_MODE(name, desc) \
    { #name, desc, 0, AV_OPT_TYPE_CONST, { .i64 = RC_MODE_ ## name }, \
      0, 0, FLAGS, .unit = "rc_mode" }

/*
 * The "rc_mode" integer option (default RC_MODE_AUTO, range
 * RC_MODE_AUTO..RC_MODE_MAX) followed by its named constants. There is
 * no trailing comma, so the user supplies the separator before the next
 * option entry.
 */
#define D3D12VA_ENCODE_RC_OPTIONS \
    { "rc_mode",\
      "Set rate control mode", \
      OFFSET(common.explicit_rc_mode), AV_OPT_TYPE_INT, \
      { .i64 = RC_MODE_AUTO }, RC_MODE_AUTO, RC_MODE_MAX, FLAGS, .unit = "rc_mode" }, \
    { "auto", "Choose mode automatically based on other parameters", \
      0, AV_OPT_TYPE_CONST, { .i64 = RC_MODE_AUTO }, 0, 0, FLAGS, .unit = "rc_mode" }, \
    D3D12VA_ENCODE_RC_MODE(CQP,  "Constant-quality"), \
    D3D12VA_ENCODE_RC_MODE(CBR,  "Constant-bitrate"), \
    D3D12VA_ENCODE_RC_MODE(VBR,  "Variable-bitrate"), \
    D3D12VA_ENCODE_RC_MODE(QVBR, "Quality-defined variable-bitrate")
 | 
						|
 | 
						|
#endif /* AVCODEC_D3D12VA_ENCODE_H */
 |