summaryrefslogtreecommitdiff
path: root/libavcodec
diff options
context:
space:
mode:
authorgalinart <artem.galin@gmail.com>2022-12-05 20:18:21 +0000
committerHaihao Xiang <haihao.xiang@intel.com>2023-01-30 08:48:58 +0800
commit500282941655558e2440afe163f0268dc5ac61bf (patch)
tree2f19c8273c7fedfb629a720cfde70dbb3a3facd0 /libavcodec
parentaecfec6f80fd8be68e050a97935589beeae588fa (diff)
downloadffmpeg-500282941655558e2440afe163f0268dc5ac61bf.tar.gz
libavcodec/qsvenc: enable Hyper Encode
Hyper Encode uses Intel integrated and discrete graphics on one system to accelerate encoding of a single video stream. Depending on the selected parameters and codecs, performance gain on AlderLake iGPU + ARC Gfx up to 1.6x. More information: https://www.intel.co.uk/content/www/uk/en/architecture-and-technology/adaptix/deep-link.html Developer guide: https://github.com/oneapi-src/oneVPL-intel-gpu/blob/main/doc/HyperEncode_FeatureDeveloperGuide.md Hyper Encode is supported only on Windows and requires D3D11 and oneVPL. To enable Hyper Encode need to specify: -Hyper Encode mode (-dual_gfx on or dual_gfx adaptive) -Encoder: h264_qsv or hevc_qsv -BRC: VBR, CQP or ICQ -Lowpower mode (-low_power 1) -Closed GOP for AVC or strict GOP for HEVC -idr_interval = 0 used by default Depending on the encoding parameters, the following parameters may need to be adjusted: -g recommended >= 30 for better performance -async_depth recommended >= 30 for better performance -extra_hw_frames recommended equal to async_depth value -bf recommended = 0 for better performance In the cases with fast encoding (-preset veryfast) there may be no performance gain due to the fact that the decode is slower than the encode. Command line examples: ffmpeg.exe -init_hw_device qsv:hw,child_device_type=d3d11va,child_device=0 -v verbose -y -hwaccel qsv -extra_hw_frames 60 -async_depth 60 -c:v h264_qsv -i bbb_sunflower_2160p_60fps_normal.mp4 -async_depth 60 -c:v h264_qsv -preset medium -g 60 -low_power 1 -bf 0 -dual_gfx on output.h265 Signed-off-by: galinart <artem.galin@intel.com>
Diffstat (limited to 'libavcodec')
-rw-r--r--libavcodec/qsvenc.c91
-rw-r--r--libavcodec/qsvenc.h19
-rw-r--r--libavcodec/qsvenc_h264.c3
-rw-r--r--libavcodec/qsvenc_hevc.c3
4 files changed, 112 insertions, 4 deletions
diff --git a/libavcodec/qsvenc.c b/libavcodec/qsvenc.c
index 93f1862a4b..2f0e94a914 100644
--- a/libavcodec/qsvenc.c
+++ b/libavcodec/qsvenc.c
@@ -169,6 +169,8 @@ do { \
} \
} while (0) \
+#define MFX_IMPL_VIA_MASK(impl) (0x0f00 & (impl))
+
static const char *print_ratecontrol(mfxU16 rc_mode)
{
int i;
@@ -197,6 +199,10 @@ static void dump_video_param(AVCodecContext *avctx, QSVEncContext *q,
mfxExtCodingOption2 *co2 = NULL;
mfxExtCodingOption3 *co3 = NULL;
mfxExtHEVCTiles *exthevctiles = NULL;
+#if QSV_HAVE_HE
+ mfxExtHyperModeParam *exthypermodeparam = NULL;
+#endif
+
const char *tmp_str = NULL;
if (q->co2_idx > 0)
@@ -208,6 +214,11 @@ static void dump_video_param(AVCodecContext *avctx, QSVEncContext *q,
if (q->exthevctiles_idx > 0)
exthevctiles = (mfxExtHEVCTiles *)coding_opts[q->exthevctiles_idx];
+#if QSV_HAVE_HE
+ if (q->exthypermodeparam_idx > 0)
+ exthypermodeparam = (mfxExtHyperModeParam *)coding_opts[q->exthypermodeparam_idx];
+#endif
+
av_log(avctx, AV_LOG_VERBOSE, "profile: %s; level: %"PRIu16"\n",
print_profile(avctx->codec_id, info->CodecProfile), info->CodecLevel);
@@ -373,6 +384,21 @@ static void dump_video_param(AVCodecContext *avctx, QSVEncContext *q,
av_log(avctx, AV_LOG_VERBOSE, "NumTileColumns: %"PRIu16"; NumTileRows: %"PRIu16"\n",
exthevctiles->NumTileColumns, exthevctiles->NumTileRows);
}
+
+#if QSV_HAVE_HE
+ if (exthypermodeparam) {
+ av_log(avctx, AV_LOG_VERBOSE, "HyperEncode: ");
+
+ if (exthypermodeparam->Mode == MFX_HYPERMODE_OFF)
+ av_log(avctx, AV_LOG_VERBOSE, "OFF");
+ if (exthypermodeparam->Mode == MFX_HYPERMODE_ON)
+ av_log(avctx, AV_LOG_VERBOSE, "ON");
+ if (exthypermodeparam->Mode == MFX_HYPERMODE_ADAPTIVE)
+ av_log(avctx, AV_LOG_VERBOSE, "Adaptive");
+
+ av_log(avctx, AV_LOG_VERBOSE, "\n");
+ }
+#endif
}
static void dump_video_vp9_param(AVCodecContext *avctx, QSVEncContext *q,
@@ -1168,6 +1194,54 @@ static int init_video_param(AVCodecContext *avctx, QSVEncContext *q)
q->extparam_internal[q->nb_extparam_internal++] = (mfxExtBuffer *)&q->extvsi;
}
+#if QSV_HAVE_HE
+ if (q->dual_gfx) {
+ if (QSV_RUNTIME_VERSION_ATLEAST(q->ver, 2, 4)) {
+ mfxIMPL impl;
+ MFXQueryIMPL(q->session, &impl);
+
+ if (MFX_IMPL_VIA_MASK(impl) != MFX_IMPL_VIA_D3D11) {
+ av_log(avctx, AV_LOG_ERROR, "Dual GFX mode requires D3D11VA \n");
+ return AVERROR_UNKNOWN;
+ }
+ if (q->param.mfx.LowPower != MFX_CODINGOPTION_ON) {
+ av_log(avctx, AV_LOG_ERROR, "Dual GFX mode supports only low-power encoding mode \n");
+ return AVERROR_UNKNOWN;
+ }
+ if (q->param.mfx.CodecId != MFX_CODEC_AVC && q->param.mfx.CodecId != MFX_CODEC_HEVC) {
+ av_log(avctx, AV_LOG_ERROR, "Not supported encoder for dual GFX mode. "
+ "Supported: h264_qsv and hevc_qsv \n");
+ return AVERROR_UNKNOWN;
+ }
+ if (q->param.mfx.RateControlMethod != MFX_RATECONTROL_VBR &&
+ q->param.mfx.RateControlMethod != MFX_RATECONTROL_CQP &&
+ q->param.mfx.RateControlMethod != MFX_RATECONTROL_ICQ) {
+ av_log(avctx, AV_LOG_WARNING, "Not supported BRC for dual GFX mode. "
+ "Supported: VBR, CQP and ICQ \n");
+ }
+ if ((q->param.mfx.CodecId == MFX_CODEC_AVC && q->param.mfx.IdrInterval != 0) ||
+ (q->param.mfx.CodecId == MFX_CODEC_HEVC && q->param.mfx.IdrInterval != 1)) {
+ av_log(avctx, AV_LOG_WARNING, "Dual GFX mode requires closed GOP for AVC and strict GOP for HEVC, -idr_interval 0 \n");
+ }
+ if (q->param.mfx.GopPicSize < 30) {
+ av_log(avctx, AV_LOG_WARNING, "For better performance in dual GFX mode GopPicSize must be >= 30 \n");
+ }
+ if (q->param.AsyncDepth < 30) {
+ av_log(avctx, AV_LOG_WARNING, "For better performance in dual GFX mode AsyncDepth must be >= 30 \n");
+ }
+
+ q->exthypermodeparam.Header.BufferId = MFX_EXTBUFF_HYPER_MODE_PARAM;
+ q->exthypermodeparam.Header.BufferSz = sizeof(q->exthypermodeparam);
+ q->exthypermodeparam.Mode = q->dual_gfx;
+ q->extparam_internal[q->nb_extparam_internal++] = (mfxExtBuffer *)&q->exthypermodeparam;
+ } else {
+ av_log(avctx, AV_LOG_ERROR,
+ "This version of runtime doesn't support Hyper Encode\n");
+ return AVERROR_UNKNOWN;
+ }
+ }
+#endif
+
if (!check_enc_param(avctx,q)) {
av_log(avctx, AV_LOG_ERROR,
"some encoding parameters are not supported by the QSV "
@@ -1342,12 +1416,19 @@ static int qsv_retrieve_enc_params(AVCodecContext *avctx, QSVEncContext *q)
.Header.BufferSz = sizeof(hevc_tile_buf),
};
- mfxExtBuffer *ext_buffers[6];
+#if QSV_HAVE_HE
+ mfxExtHyperModeParam hyper_mode_param_buf = {
+ .Header.BufferId = MFX_EXTBUFF_HYPER_MODE_PARAM,
+ .Header.BufferSz = sizeof(hyper_mode_param_buf),
+ };
+#endif
+
+ mfxExtBuffer *ext_buffers[6 + QSV_HAVE_HE];
int need_pps = avctx->codec_id != AV_CODEC_ID_MPEG2VIDEO;
int ret, ext_buf_num = 0, extradata_offset = 0;
- q->co2_idx = q->co3_idx = q->exthevctiles_idx = -1;
+ q->co2_idx = q->co3_idx = q->exthevctiles_idx = q->exthypermodeparam_idx = -1;
ext_buffers[ext_buf_num++] = (mfxExtBuffer*)&extradata;
ext_buffers[ext_buf_num++] = (mfxExtBuffer*)&co;
@@ -1369,6 +1450,12 @@ static int qsv_retrieve_enc_params(AVCodecContext *avctx, QSVEncContext *q)
q->exthevctiles_idx = ext_buf_num;
ext_buffers[ext_buf_num++] = (mfxExtBuffer*)&hevc_tile_buf;
}
+#if QSV_HAVE_HE
+ if (q->dual_gfx && QSV_RUNTIME_VERSION_ATLEAST(q->ver, 2, 4)) {
+ q->exthypermodeparam_idx = ext_buf_num;
+ ext_buffers[ext_buf_num++] = (mfxExtBuffer*)&hyper_mode_param_buf;
+ }
+#endif
q->param.ExtParam = ext_buffers;
q->param.NumExtParam = ext_buf_num;
diff --git a/libavcodec/qsvenc.h b/libavcodec/qsvenc.h
index a7bbb3797e..4a6fa2caed 100644
--- a/libavcodec/qsvenc.h
+++ b/libavcodec/qsvenc.h
@@ -45,10 +45,12 @@
#define QSV_HAVE_AVBR 1
#define QSV_HAVE_VCM 1
#define QSV_HAVE_MF 0
+#define QSV_HAVE_HE QSV_VERSION_ATLEAST(2, 4)
#else
#define QSV_HAVE_AVBR 0
#define QSV_HAVE_VCM 0
#define QSV_HAVE_MF !QSV_ONEVPL
+#define QSV_HAVE_HE 0
#endif
#define QSV_COMMON_OPTS \
@@ -64,6 +66,14 @@
{ "forced_idr", "Forcing I frames as IDR frames", OFFSET(qsv.forced_idr), AV_OPT_TYPE_BOOL,{ .i64 = 0 }, 0, 1, VE }, \
{ "low_power", "enable low power mode(experimental: many limitations by mfx version, BRC modes, etc.)", OFFSET(qsv.low_power), AV_OPT_TYPE_BOOL, { .i64 = -1}, -1, 1, VE},
+#if QSV_HAVE_HE
+#define QSV_HE_OPTIONS \
+{ "dual_gfx", "Prefer processing on both iGfx and dGfx simultaneously", OFFSET(qsv.dual_gfx), AV_OPT_TYPE_INT, { .i64 = MFX_HYPERMODE_OFF }, MFX_HYPERMODE_OFF, MFX_HYPERMODE_ADAPTIVE, VE, "dual_gfx" }, \
+{ "off", "Disable HyperEncode mode", 0, AV_OPT_TYPE_CONST, { .i64 = MFX_HYPERMODE_OFF }, INT_MIN, INT_MAX, VE, "dual_gfx" }, \
+{ "on", "Enable HyperEncode mode and return error if incompatible parameters during initialization", 0, AV_OPT_TYPE_CONST, { .i64 = MFX_HYPERMODE_ON }, INT_MIN, INT_MAX, VE, "dual_gfx" }, \
+{ "adaptive", "Enable HyperEncode mode or fallback to single GPU if incompatible parameters during initialization", 0, AV_OPT_TYPE_CONST, { .i64 = MFX_HYPERMODE_ADAPTIVE }, INT_MIN, INT_MAX, VE, "dual_gfx" },
+#endif
+
#define QSV_OPTION_RDO \
{ "rdo", "Enable rate distortion optimization", OFFSET(qsv.rdo), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
@@ -171,7 +181,9 @@ typedef struct QSVEncContext {
mfxExtAV1TileParam extav1tileparam;
mfxExtAV1BitstreamParam extav1bsparam;
#endif
-
+#if QSV_HAVE_HE
+ mfxExtHyperModeParam exthypermodeparam;
+#endif
#if QSV_HAVE_OPAQUE
mfxExtOpaqueSurfaceAlloc opaque_alloc;
mfxFrameSurface1 **opaque_surfaces;
@@ -180,7 +192,7 @@ typedef struct QSVEncContext {
mfxExtVideoSignalInfo extvsi;
- mfxExtBuffer *extparam_internal[5 + (QSV_HAVE_MF * 2) + QSV_HAVE_EXT_AV1_PARAM * 2];
+ mfxExtBuffer *extparam_internal[5 + (QSV_HAVE_MF * 2) + (QSV_HAVE_EXT_AV1_PARAM * 2) + QSV_HAVE_HE];
int nb_extparam_internal;
mfxExtBuffer **extparam;
@@ -255,6 +267,7 @@ typedef struct QSVEncContext {
int co2_idx;
int co3_idx;
int exthevctiles_idx;
+ int exthypermodeparam_idx;
int vp9_idx;
int max_qp_i;
@@ -299,6 +312,8 @@ typedef struct QSVEncContext {
// This is used for SEI Timing reset
int old_pic_timing_sei;
int skip_frame;
+ // This is used for Hyper Encode
+ int dual_gfx;
} QSVEncContext;
int ff_qsv_enc_init(AVCodecContext *avctx, QSVEncContext *q);
diff --git a/libavcodec/qsvenc_h264.c b/libavcodec/qsvenc_h264.c
index bbdedc3335..071a9a79e9 100644
--- a/libavcodec/qsvenc_h264.c
+++ b/libavcodec/qsvenc_h264.c
@@ -117,6 +117,9 @@ static const AVOption options[] = {
QSV_OPTION_SCENARIO
QSV_OPTION_AVBR
QSV_OPTION_SKIP_FRAME
+#if QSV_HAVE_HE
+ QSV_HE_OPTIONS
+#endif
{ "cavlc", "Enable CAVLC", OFFSET(qsv.cavlc), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, VE },
#if QSV_HAVE_VCM
diff --git a/libavcodec/qsvenc_hevc.c b/libavcodec/qsvenc_hevc.c
index e042263bf5..5e23ca9647 100644
--- a/libavcodec/qsvenc_hevc.c
+++ b/libavcodec/qsvenc_hevc.c
@@ -318,6 +318,9 @@ static const AVOption options[] = {
QSV_OPTION_SCENARIO
QSV_OPTION_AVBR
QSV_OPTION_SKIP_FRAME
+#if QSV_HAVE_HE
+ QSV_HE_OPTIONS
+#endif
{ "idr_interval", "Distance (in I-frames) between IDR frames", OFFSET(qsv.idr_interval), AV_OPT_TYPE_INT, { .i64 = 0 }, -1, INT_MAX, VE, "idr_interval" },
{ "begin_only", "Output an IDR-frame only at the beginning of the stream", 0, AV_OPT_TYPE_CONST, { .i64 = -1 }, 0, 0, VE, "idr_interval" },