123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411 |
- /*
- * Intel MediaSDK QSV based HEVC encoder
- *
- * This file is part of FFmpeg.
- *
- * FFmpeg is free software; you can redistribute it and/or
- * modify it under the terms of the GNU Lesser General Public
- * License as published by the Free Software Foundation; either
- * version 2.1 of the License, or (at your option) any later version.
- *
- * FFmpeg is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- * Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public
- * License along with FFmpeg; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
- */
- #include <stdint.h>
- #include <sys/types.h>
- #include <mfxvideo.h>
- #include "libavutil/common.h"
- #include "libavutil/opt.h"
- #include "libavutil/mastering_display_metadata.h"
- #include "avcodec.h"
- #include "bytestream.h"
- #include "codec_internal.h"
- #include "get_bits.h"
- #include "hevc.h"
- #include "hevcdec.h"
- #include "h2645_parse.h"
- #include "qsv.h"
- #include "qsvenc.h"
/* Values accepted by the "load_plugin" option. */
enum LoadPlugin {
    LOAD_PLUGIN_NONE    = 0, /* do not select a plugin through load_plugin */
    LOAD_PLUGIN_HEVC_SW = 1, /* select the "hevc_sw" plugin UID */
    LOAD_PLUGIN_HEVC_HW = 2, /* select the "hevc_hw" plugin UID */
};
- typedef struct QSVHEVCEncContext {
- AVClass *class;
- QSVEncContext qsv;
- int load_plugin;
- } QSVHEVCEncContext;
- static int generate_fake_vps(QSVEncContext *q, AVCodecContext *avctx)
- {
- GetByteContext gbc;
- PutByteContext pbc;
- GetBitContext gb;
- H2645RBSP sps_rbsp = { NULL };
- H2645NAL sps_nal = { NULL };
- HEVCSPS sps = { 0 };
- HEVCVPS vps = { 0 };
- uint8_t vps_buf[128], vps_rbsp_buf[128];
- uint8_t *new_extradata;
- unsigned int sps_id;
- int ret, i, type, vps_size;
- if (!avctx->extradata_size) {
- av_log(avctx, AV_LOG_ERROR, "No extradata returned from libmfx\n");
- return AVERROR_UNKNOWN;
- }
- av_fast_padded_malloc(&sps_rbsp.rbsp_buffer, &sps_rbsp.rbsp_buffer_alloc_size, avctx->extradata_size);
- if (!sps_rbsp.rbsp_buffer)
- return AVERROR(ENOMEM);
- /* parse the SPS */
- ret = ff_h2645_extract_rbsp(avctx->extradata + 4, avctx->extradata_size - 4, &sps_rbsp, &sps_nal, 1);
- if (ret < 0) {
- av_log(avctx, AV_LOG_ERROR, "Error unescaping the SPS buffer\n");
- return ret;
- }
- ret = init_get_bits8(&gb, sps_nal.data, sps_nal.size);
- if (ret < 0) {
- av_freep(&sps_rbsp.rbsp_buffer);
- return ret;
- }
- get_bits(&gb, 1);
- type = get_bits(&gb, 6);
- if (type != HEVC_NAL_SPS) {
- av_log(avctx, AV_LOG_ERROR, "Unexpected NAL type in the extradata: %d\n",
- type);
- av_freep(&sps_rbsp.rbsp_buffer);
- return AVERROR_INVALIDDATA;
- }
- get_bits(&gb, 9);
- ret = ff_hevc_parse_sps(&sps, &gb, &sps_id, 0, NULL, avctx);
- av_freep(&sps_rbsp.rbsp_buffer);
- if (ret < 0) {
- av_log(avctx, AV_LOG_ERROR, "Error parsing the SPS\n");
- return ret;
- }
- /* generate the VPS */
- vps.vps_max_layers = 1;
- vps.vps_max_sub_layers = sps.max_sub_layers;
- vps.vps_temporal_id_nesting_flag = sps.temporal_id_nesting_flag;
- memcpy(&vps.ptl, &sps.ptl, sizeof(vps.ptl));
- vps.vps_sub_layer_ordering_info_present_flag = 1;
- for (i = 0; i < HEVC_MAX_SUB_LAYERS; i++) {
- vps.vps_max_dec_pic_buffering[i] = sps.temporal_layer[i].max_dec_pic_buffering;
- vps.vps_num_reorder_pics[i] = sps.temporal_layer[i].num_reorder_pics;
- vps.vps_max_latency_increase[i] = sps.temporal_layer[i].max_latency_increase;
- }
- vps.vps_num_layer_sets = 1;
- vps.vps_timing_info_present_flag = sps.vui.vui_timing_info_present_flag;
- vps.vps_num_units_in_tick = sps.vui.vui_num_units_in_tick;
- vps.vps_time_scale = sps.vui.vui_time_scale;
- vps.vps_poc_proportional_to_timing_flag = sps.vui.vui_poc_proportional_to_timing_flag;
- vps.vps_num_ticks_poc_diff_one = sps.vui.vui_num_ticks_poc_diff_one_minus1 + 1;
- vps.vps_num_hrd_parameters = 0;
- /* generate the encoded RBSP form of the VPS */
- ret = ff_hevc_encode_nal_vps(&vps, sps.vps_id, vps_rbsp_buf, sizeof(vps_rbsp_buf));
- if (ret < 0) {
- av_log(avctx, AV_LOG_ERROR, "Error writing the VPS\n");
- return ret;
- }
- /* escape and add the startcode */
- bytestream2_init(&gbc, vps_rbsp_buf, ret);
- bytestream2_init_writer(&pbc, vps_buf, sizeof(vps_buf));
- bytestream2_put_be32(&pbc, 1); // startcode
- bytestream2_put_byte(&pbc, HEVC_NAL_VPS << 1); // NAL
- bytestream2_put_byte(&pbc, 1); // header
- while (bytestream2_get_bytes_left(&gbc)) {
- if (bytestream2_get_bytes_left(&gbc) >= 3 && bytestream2_peek_be24(&gbc) <= 3) {
- bytestream2_put_be24(&pbc, 3);
- bytestream2_skip(&gbc, 2);
- } else
- bytestream2_put_byte(&pbc, bytestream2_get_byte(&gbc));
- }
- vps_size = bytestream2_tell_p(&pbc);
- new_extradata = av_mallocz(vps_size + avctx->extradata_size + AV_INPUT_BUFFER_PADDING_SIZE);
- if (!new_extradata)
- return AVERROR(ENOMEM);
- memcpy(new_extradata, vps_buf, vps_size);
- memcpy(new_extradata + vps_size, avctx->extradata, avctx->extradata_size);
- av_freep(&avctx->extradata);
- avctx->extradata = new_extradata;
- avctx->extradata_size += vps_size;
- return 0;
- }
- static int qsv_hevc_set_encode_ctrl(AVCodecContext *avctx,
- const AVFrame *frame, mfxEncodeCtrl *enc_ctrl)
- {
- QSVHEVCEncContext *q = avctx->priv_data;
- AVFrameSideData *sd;
- if (!frame || !QSV_RUNTIME_VERSION_ATLEAST(q->qsv.ver, 1, 25))
- return 0;
- sd = av_frame_get_side_data(frame, AV_FRAME_DATA_MASTERING_DISPLAY_METADATA);
- if (sd) {
- AVMasteringDisplayMetadata *mdm = (AVMasteringDisplayMetadata *)sd->data;
- // SEI is needed when both the primaries and luminance are set
- if (mdm->has_primaries && mdm->has_luminance) {
- const int mapping[3] = {1, 2, 0};
- const int chroma_den = 50000;
- const int luma_den = 10000;
- int i;
- mfxExtMasteringDisplayColourVolume *mdcv = av_mallocz(sizeof(mfxExtMasteringDisplayColourVolume));
- if (!mdcv)
- return AVERROR(ENOMEM);
- mdcv->Header.BufferId = MFX_EXTBUFF_MASTERING_DISPLAY_COLOUR_VOLUME;
- mdcv->Header.BufferSz = sizeof(*mdcv);
- for (i = 0; i < 3; i++) {
- const int j = mapping[i];
- mdcv->DisplayPrimariesX[i] =
- FFMIN(lrint(chroma_den *
- av_q2d(mdm->display_primaries[j][0])),
- chroma_den);
- mdcv->DisplayPrimariesY[i] =
- FFMIN(lrint(chroma_den *
- av_q2d(mdm->display_primaries[j][1])),
- chroma_den);
- }
- mdcv->WhitePointX =
- FFMIN(lrint(chroma_den * av_q2d(mdm->white_point[0])),
- chroma_den);
- mdcv->WhitePointY =
- FFMIN(lrint(chroma_den * av_q2d(mdm->white_point[1])),
- chroma_den);
- mdcv->MaxDisplayMasteringLuminance =
- lrint(luma_den * av_q2d(mdm->max_luminance));
- mdcv->MinDisplayMasteringLuminance =
- FFMIN(lrint(luma_den * av_q2d(mdm->min_luminance)),
- mdcv->MaxDisplayMasteringLuminance);
- enc_ctrl->ExtParam[enc_ctrl->NumExtParam++] = (mfxExtBuffer *)mdcv;
- }
- }
- sd = av_frame_get_side_data(frame, AV_FRAME_DATA_CONTENT_LIGHT_LEVEL);
- if (sd) {
- AVContentLightMetadata *clm = (AVContentLightMetadata *)sd->data;
- mfxExtContentLightLevelInfo * clli = av_mallocz(sizeof(mfxExtContentLightLevelInfo));
- if (!clli)
- return AVERROR(ENOMEM);
- clli->Header.BufferId = MFX_EXTBUFF_CONTENT_LIGHT_LEVEL_INFO;
- clli->Header.BufferSz = sizeof(*clli);
- clli->MaxContentLightLevel = FFMIN(clm->MaxCLL, 65535);
- clli->MaxPicAverageLightLevel = FFMIN(clm->MaxFALL, 65535);
- enc_ctrl->ExtParam[enc_ctrl->NumExtParam++] = (mfxExtBuffer *)clli;
- }
- return 0;
- }
- static av_cold int qsv_enc_init(AVCodecContext *avctx)
- {
- QSVHEVCEncContext *q = avctx->priv_data;
- int ret;
- if (q->load_plugin != LOAD_PLUGIN_NONE) {
- static const char * const uid_hevcenc_sw = "2fca99749fdb49aeb121a5b63ef568f7";
- static const char * const uid_hevcenc_hw = "6fadc791a0c2eb479ab6dcd5ea9da347";
- if (q->qsv.load_plugins[0]) {
- av_log(avctx, AV_LOG_WARNING,
- "load_plugins is not empty, but load_plugin is not set to 'none'."
- "The load_plugin value will be ignored.\n");
- } else {
- av_freep(&q->qsv.load_plugins);
- if (q->load_plugin == LOAD_PLUGIN_HEVC_SW)
- q->qsv.load_plugins = av_strdup(uid_hevcenc_sw);
- else
- q->qsv.load_plugins = av_strdup(uid_hevcenc_hw);
- if (!q->qsv.load_plugins)
- return AVERROR(ENOMEM);
- }
- }
- // HEVC and H264 meaning of the value is shifted by 1, make it consistent
- q->qsv.idr_interval++;
- q->qsv.set_encode_ctrl_cb = qsv_hevc_set_encode_ctrl;
- ret = ff_qsv_enc_init(avctx, &q->qsv);
- if (ret < 0)
- return ret;
- if (!q->qsv.hevc_vps) {
- ret = generate_fake_vps(&q->qsv, avctx);
- if (ret < 0) {
- ff_qsv_enc_close(avctx, &q->qsv);
- return ret;
- }
- }
- return 0;
- }
- static int qsv_enc_frame(AVCodecContext *avctx, AVPacket *pkt,
- const AVFrame *frame, int *got_packet)
- {
- QSVHEVCEncContext *q = avctx->priv_data;
- return ff_qsv_encode(avctx, &q->qsv, pkt, frame, got_packet);
- }
- static av_cold int qsv_enc_close(AVCodecContext *avctx)
- {
- QSVHEVCEncContext *q = avctx->priv_data;
- return ff_qsv_enc_close(avctx, &q->qsv);
- }
- #define OFFSET(x) offsetof(QSVHEVCEncContext, x)
- #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
- static const AVOption options[] = {
- QSV_COMMON_OPTS
- QSV_OPTION_RDO
- QSV_OPTION_MAX_FRAME_SIZE
- QSV_OPTION_MAX_SLICE_SIZE
- QSV_OPTION_MBBRC
- QSV_OPTION_EXTBRC
- QSV_OPTION_P_STRATEGY
- QSV_OPTION_B_STRATEGY
- QSV_OPTION_DBLK_IDC
- QSV_OPTION_LOW_DELAY_BRC
- QSV_OPTION_MAX_MIN_QP
- QSV_OPTION_ADAPTIVE_I
- QSV_OPTION_ADAPTIVE_B
- QSV_OPTION_SCENARIO
- QSV_OPTION_AVBR
- QSV_OPTION_SKIP_FRAME
- { "idr_interval", "Distance (in I-frames) between IDR frames", OFFSET(qsv.idr_interval), AV_OPT_TYPE_INT, { .i64 = 0 }, -1, INT_MAX, VE, "idr_interval" },
- { "begin_only", "Output an IDR-frame only at the beginning of the stream", 0, AV_OPT_TYPE_CONST, { .i64 = -1 }, 0, 0, VE, "idr_interval" },
- { "load_plugin", "A user plugin to load in an internal session", OFFSET(load_plugin), AV_OPT_TYPE_INT, { .i64 = LOAD_PLUGIN_HEVC_HW }, LOAD_PLUGIN_NONE, LOAD_PLUGIN_HEVC_HW, VE, "load_plugin" },
- { "none", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = LOAD_PLUGIN_NONE }, 0, 0, VE, "load_plugin" },
- { "hevc_sw", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = LOAD_PLUGIN_HEVC_SW }, 0, 0, VE, "load_plugin" },
- { "hevc_hw", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = LOAD_PLUGIN_HEVC_HW }, 0, 0, VE, "load_plugin" },
- { "load_plugins", "A :-separate list of hexadecimal plugin UIDs to load in an internal session",
- OFFSET(qsv.load_plugins), AV_OPT_TYPE_STRING, { .str = "" }, 0, 0, VE },
- { "look_ahead_depth", "Depth of look ahead in number frames, available when extbrc option is enabled", OFFSET(qsv.look_ahead_depth), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 100, VE },
- { "profile", NULL, OFFSET(qsv.profile), AV_OPT_TYPE_INT, { .i64 = MFX_PROFILE_UNKNOWN }, 0, INT_MAX, VE, "profile" },
- { "unknown", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_UNKNOWN }, INT_MIN, INT_MAX, VE, "profile" },
- { "main", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_HEVC_MAIN }, INT_MIN, INT_MAX, VE, "profile" },
- { "main10", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_HEVC_MAIN10 }, INT_MIN, INT_MAX, VE, "profile" },
- { "mainsp", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_HEVC_MAINSP }, INT_MIN, INT_MAX, VE, "profile" },
- { "rext", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_HEVC_REXT }, INT_MIN, INT_MAX, VE, "profile" },
- #if QSV_VERSION_ATLEAST(1, 32)
- { "scc", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_HEVC_SCC }, INT_MIN, INT_MAX, VE, "profile" },
- #endif
- { "tier", "Set the encoding tier (only level >= 4 can support high tier)", OFFSET(qsv.tier), AV_OPT_TYPE_INT, { .i64 = MFX_TIER_HEVC_HIGH }, MFX_TIER_HEVC_MAIN, MFX_TIER_HEVC_HIGH, VE, "tier" },
- { "main", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_TIER_HEVC_MAIN }, INT_MIN, INT_MAX, VE, "tier" },
- { "high", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_TIER_HEVC_HIGH }, INT_MIN, INT_MAX, VE, "tier" },
- { "gpb", "1: GPB (generalized P/B frame); 0: regular P frame", OFFSET(qsv.gpb), AV_OPT_TYPE_BOOL, { .i64 = 1 }, 0, 1, VE},
- { "tile_cols", "Number of columns for tiled encoding", OFFSET(qsv.tile_cols), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, UINT16_MAX, VE },
- { "tile_rows", "Number of rows for tiled encoding", OFFSET(qsv.tile_rows), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, UINT16_MAX, VE },
- { "recovery_point_sei", "Insert recovery point SEI messages", OFFSET(qsv.recovery_point_sei), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
- { "aud", "Insert the Access Unit Delimiter NAL", OFFSET(qsv.aud), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, VE},
- { "pic_timing_sei", "Insert picture timing SEI with pic_struct_syntax element", OFFSET(qsv.pic_timing_sei), AV_OPT_TYPE_BOOL, { .i64 = 1 }, 0, 1, VE },
- { "transform_skip", "Turn this option ON to enable transformskip", OFFSET(qsv.transform_skip), AV_OPT_TYPE_INT, { .i64 = -1}, -1, 1, VE},
- { "int_ref_type", "Intra refresh type. B frames should be set to 0", OFFSET(qsv.int_ref_type), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, UINT16_MAX, VE, "int_ref_type" },
- { "none", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 0 }, .flags = VE, "int_ref_type" },
- { "vertical", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 1 }, .flags = VE, "int_ref_type" },
- { "horizontal", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 2 }, .flags = VE, "int_ref_type" },
- { "slice" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 3 }, .flags = VE, "int_ref_type" },
- { "int_ref_cycle_size", "Number of frames in the intra refresh cycle", OFFSET(qsv.int_ref_cycle_size), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, UINT16_MAX, VE },
- { "int_ref_qp_delta", "QP difference for the refresh MBs", OFFSET(qsv.int_ref_qp_delta), AV_OPT_TYPE_INT, { .i64 = INT16_MIN }, INT16_MIN, INT16_MAX, VE },
- { "int_ref_cycle_dist", "Distance between the beginnings of the intra-refresh cycles in frames", OFFSET(qsv.int_ref_cycle_dist), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT16_MAX, VE },
- { NULL },
- };
- static const AVClass class = {
- .class_name = "hevc_qsv encoder",
- .item_name = av_default_item_name,
- .option = options,
- .version = LIBAVUTIL_VERSION_INT,
- };
- static const FFCodecDefault qsv_enc_defaults[] = {
- { "b", "1M" },
- { "refs", "0" },
- { "g", "-1" },
- { "bf", "-1" },
- { "qmin", "-1" },
- { "qmax", "-1" },
- { "trellis", "-1" },
- { NULL },
- };
- const FFCodec ff_hevc_qsv_encoder = {
- .p.name = "hevc_qsv",
- CODEC_LONG_NAME("HEVC (Intel Quick Sync Video acceleration)"),
- .priv_data_size = sizeof(QSVHEVCEncContext),
- .p.type = AVMEDIA_TYPE_VIDEO,
- .p.id = AV_CODEC_ID_HEVC,
- .init = qsv_enc_init,
- FF_CODEC_ENCODE_CB(qsv_enc_frame),
- .close = qsv_enc_close,
- .p.capabilities = AV_CODEC_CAP_DELAY | AV_CODEC_CAP_HYBRID,
- .p.pix_fmts = (const enum AVPixelFormat[]){ AV_PIX_FMT_NV12,
- AV_PIX_FMT_P010,
- AV_PIX_FMT_P012,
- AV_PIX_FMT_YUYV422,
- AV_PIX_FMT_Y210,
- AV_PIX_FMT_QSV,
- AV_PIX_FMT_BGRA,
- AV_PIX_FMT_X2RGB10,
- AV_PIX_FMT_VUYX,
- AV_PIX_FMT_XV30,
- AV_PIX_FMT_NONE },
- .p.priv_class = &class,
- .defaults = qsv_enc_defaults,
- .caps_internal = FF_CODEC_CAP_NOT_INIT_THREADSAFE |
- FF_CODEC_CAP_INIT_CLEANUP,
- .p.wrapper_name = "qsv",
- .hw_configs = ff_qsv_enc_hw_configs,
- };
|