vulkan_encode_h264.c 66 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666
  1. /*
  2. * This file is part of FFmpeg.
  3. *
  4. * FFmpeg is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU Lesser General Public
  6. * License as published by the Free Software Foundation; either
  7. * version 2.1 of the License, or (at your option) any later version.
  8. *
  9. * FFmpeg is distributed in the hope that it will be useful,
  10. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  12. * Lesser General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU Lesser General Public
  15. * License along with FFmpeg; if not, write to the Free Software
  16. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  17. */
  18. #include "libavutil/opt.h"
  19. #include "libavutil/mem.h"
  20. #include "cbs.h"
  21. #include "cbs_h264.h"
  22. #include "atsc_a53.h"
  23. #include "h264_levels.h"
  24. #include "h2645data.h"
  25. #include "codec_internal.h"
  26. #include "version.h"
  27. #include "hw_base_encode_h264.h"
  28. #include "vulkan_encode.h"
  29. enum UnitElems {
  30. UNIT_AUD = 1 << 0,
  31. UNIT_SEI_TIMING = 1 << 1,
  32. UNIT_SEI_IDENTIFIER = 1 << 2,
  33. UNIT_SEI_RECOVERY = 1 << 3,
  34. UNIT_SEI_A53_CC = 1 << 4,
  35. };
  36. const FFVulkanEncodeDescriptor ff_vk_enc_h264_desc = {
  37. .codec_id = AV_CODEC_ID_H264,
  38. .encode_extension = FF_VK_EXT_VIDEO_ENCODE_H264,
  39. .encode_op = VK_VIDEO_CODEC_OPERATION_ENCODE_H264_BIT_KHR,
  40. .ext_props = {
  41. .extensionName = VK_STD_VULKAN_VIDEO_CODEC_H264_ENCODE_EXTENSION_NAME,
  42. .specVersion = VK_STD_VULKAN_VIDEO_CODEC_H264_ENCODE_SPEC_VERSION,
  43. },
  44. };
  45. /* Random (version 4) ISO 11578 UUID. */
  46. static const uint8_t vulkan_encode_h264_sei_identifier_uuid[16] = {
  47. 0x03, 0xfd, 0xf2, 0x0a, 0x5d, 0x4c, 0x05, 0x48,
  48. 0x20, 0x98, 0xca, 0x6b, 0x0c, 0x95, 0x30, 0x1c,
  49. };
  50. typedef struct VulkanEncodeH264Picture {
  51. int frame_num;
  52. int64_t last_idr_frame;
  53. uint16_t idr_pic_id;
  54. int primary_pic_type;
  55. int slice_type;
  56. int pic_order_cnt;
  57. enum UnitElems units_needed;
  58. VkVideoEncodeH264RateControlInfoKHR vkrc_info;
  59. VkVideoEncodeH264RateControlLayerInfoKHR vkrc_layer_info;
  60. VkVideoEncodeH264GopRemainingFrameInfoKHR vkrc_remaining;
  61. StdVideoEncodeH264WeightTable slice_wt;
  62. StdVideoEncodeH264SliceHeader slice_hdr;
  63. VkVideoEncodeH264NaluSliceInfoKHR vkslice;
  64. StdVideoEncodeH264PictureInfo h264pic_info;
  65. VkVideoEncodeH264PictureInfoKHR vkh264pic_info;
  66. StdVideoEncodeH264ReferenceInfo h264dpb_info;
  67. VkVideoEncodeH264DpbSlotInfoKHR vkh264dpb_info;
  68. StdVideoEncodeH264RefListModEntry mods[MAX_REFERENCE_LIST_NUM][H264_MAX_RPLM_COUNT];
  69. StdVideoEncodeH264RefPicMarkingEntry mmco[H264_MAX_RPLM_COUNT];
  70. StdVideoEncodeH264ReferenceListsInfo ref_list_info;
  71. } VulkanEncodeH264Picture;
  72. typedef struct VulkanEncodeH264Context {
  73. FFVulkanEncodeContext common;
  74. FFHWBaseEncodeH264 units;
  75. FFHWBaseEncodeH264Opts unit_opts;
  76. enum UnitElems unit_elems;
  77. uint8_t fixed_qp_p;
  78. uint8_t fixed_qp_b;
  79. VkVideoEncodeH264ProfileInfoKHR profile;
  80. VkVideoEncodeH264CapabilitiesKHR caps;
  81. VkVideoEncodeH264QualityLevelPropertiesKHR quality_props;
  82. CodedBitstreamContext *cbs;
  83. CodedBitstreamFragment current_access_unit;
  84. H264RawAUD raw_aud;
  85. SEIRawUserDataUnregistered sei_identifier;
  86. H264RawSEIPicTiming sei_pic_timing;
  87. H264RawSEIRecoveryPoint sei_recovery_point;
  88. SEIRawUserDataRegistered sei_a53cc;
  89. void *sei_a53cc_data;
  90. char *sei_identifier_string;
  91. } VulkanEncodeH264Context;
  92. static int init_pic_rc(AVCodecContext *avctx, FFHWBaseEncodePicture *pic,
  93. VkVideoEncodeRateControlInfoKHR *rc_info,
  94. VkVideoEncodeRateControlLayerInfoKHR *rc_layer)
  95. {
  96. VulkanEncodeH264Context *enc = avctx->priv_data;
  97. FFVulkanEncodeContext *ctx = &enc->common;
  98. VulkanEncodeH264Picture *hp = pic->codec_priv;
  99. hp->vkrc_info = (VkVideoEncodeH264RateControlInfoKHR) {
  100. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_RATE_CONTROL_INFO_KHR,
  101. .flags = VK_VIDEO_ENCODE_H264_RATE_CONTROL_REFERENCE_PATTERN_FLAT_BIT_KHR |
  102. VK_VIDEO_ENCODE_H264_RATE_CONTROL_REGULAR_GOP_BIT_KHR,
  103. .idrPeriod = ctx->base.gop_size,
  104. .gopFrameCount = ctx->base.gop_size,
  105. .consecutiveBFrameCount = FFMAX(ctx->base.b_per_p - 1, 0),
  106. .temporalLayerCount = 0,
  107. };
  108. rc_info->pNext = &hp->vkrc_info;
  109. rc_info->virtualBufferSizeInMs = enc->unit_opts.hrd_buffer_size;
  110. rc_info->initialVirtualBufferSizeInMs = enc->unit_opts.initial_buffer_fullness;
  111. if (rc_info->rateControlMode > VK_VIDEO_ENCODE_RATE_CONTROL_MODE_DISABLED_BIT_KHR) {
  112. hp->vkrc_layer_info = (VkVideoEncodeH264RateControlLayerInfoKHR) {
  113. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_RATE_CONTROL_LAYER_INFO_KHR,
  114. .useMinQp = avctx->qmin > 0,
  115. .minQp.qpI = avctx->qmin > 0 ? avctx->qmin : 0,
  116. .minQp.qpP = avctx->qmin > 0 ? avctx->qmin : 0,
  117. .minQp.qpB = avctx->qmin > 0 ? avctx->qmin : 0,
  118. .useMaxQp = avctx->qmax > 0,
  119. .maxQp.qpI = avctx->qmax > 0 ? avctx->qmax : 0,
  120. .maxQp.qpP = avctx->qmax > 0 ? avctx->qmax : 0,
  121. .maxQp.qpB = avctx->qmax > 0 ? avctx->qmax : 0,
  122. .useMaxFrameSize = 0,
  123. };
  124. rc_layer->pNext = &hp->vkrc_layer_info;
  125. hp->vkrc_info.temporalLayerCount = 1;
  126. }
  127. return 0;
  128. }
  129. static int vk_enc_h264_update_pic_info(AVCodecContext *avctx,
  130. FFHWBaseEncodePicture *pic)
  131. {
  132. VulkanEncodeH264Context *enc = avctx->priv_data;
  133. FFVulkanEncodeContext *ctx = &enc->common;
  134. VulkanEncodeH264Picture *hp = pic->codec_priv;
  135. FFHWBaseEncodePicture *prev = pic->prev;
  136. VulkanEncodeH264Picture *hprev = prev ? prev->codec_priv : NULL;
  137. if (pic->type == FF_HW_PICTURE_TYPE_IDR) {
  138. av_assert0(pic->display_order == pic->encode_order);
  139. hp->frame_num = 0;
  140. hp->last_idr_frame = pic->display_order;
  141. hp->idr_pic_id = hprev ? hprev->idr_pic_id + 1 : 0;
  142. hp->primary_pic_type = 0;
  143. hp->slice_type = STD_VIDEO_H264_SLICE_TYPE_I;
  144. } else {
  145. av_assert0(prev);
  146. hp->frame_num = hprev->frame_num + prev->is_reference;
  147. hp->last_idr_frame = hprev->last_idr_frame;
  148. hp->idr_pic_id = hprev->idr_pic_id;
  149. if (pic->type == FF_HW_PICTURE_TYPE_I) {
  150. hp->slice_type = STD_VIDEO_H264_SLICE_TYPE_I;
  151. hp->primary_pic_type = 0;
  152. } else if (pic->type == FF_HW_PICTURE_TYPE_P) {
  153. hp->slice_type = STD_VIDEO_H264_SLICE_TYPE_P;
  154. hp->primary_pic_type = 1;
  155. } else {
  156. hp->slice_type = STD_VIDEO_H264_SLICE_TYPE_B;
  157. hp->primary_pic_type = 2;
  158. }
  159. }
  160. hp->pic_order_cnt = pic->display_order - hp->last_idr_frame;
  161. if (enc->units.raw_sps.pic_order_cnt_type == 2)
  162. hp->pic_order_cnt *= 2;
  163. hp->units_needed = 0;
  164. if (enc->unit_elems & UNIT_SEI_IDENTIFIER && pic->encode_order == 0)
  165. hp->units_needed |= UNIT_SEI_IDENTIFIER;
  166. if (enc->unit_elems & UNIT_SEI_TIMING) {
  167. enc->sei_pic_timing = (H264RawSEIPicTiming) {
  168. .cpb_removal_delay = 2 * (pic->encode_order - hp->last_idr_frame),
  169. .dpb_output_delay = 2 * (pic->display_order - pic->encode_order + ctx->base.max_b_depth),
  170. };
  171. hp->units_needed |= UNIT_SEI_TIMING;
  172. }
  173. if (enc->unit_elems & UNIT_SEI_RECOVERY && pic->type == FF_HW_PICTURE_TYPE_I) {
  174. enc->sei_recovery_point = (H264RawSEIRecoveryPoint) {
  175. .recovery_frame_cnt = 0,
  176. .exact_match_flag = 1,
  177. .broken_link_flag = ctx->base.b_per_p > 0,
  178. };
  179. hp->units_needed |= UNIT_SEI_RECOVERY;
  180. }
  181. if (enc->unit_elems & UNIT_SEI_A53_CC) {
  182. int err;
  183. size_t sei_a53cc_len;
  184. av_freep(&enc->sei_a53cc_data);
  185. err = ff_alloc_a53_sei(pic->input_image, 0, &enc->sei_a53cc_data, &sei_a53cc_len);
  186. if (err < 0)
  187. return err;
  188. if (enc->sei_a53cc_data != NULL) {
  189. enc->sei_a53cc.itu_t_t35_country_code = 181;
  190. enc->sei_a53cc.data = (uint8_t *)enc->sei_a53cc_data + 1;
  191. enc->sei_a53cc.data_length = sei_a53cc_len - 1;
  192. hp->units_needed |= UNIT_SEI_A53_CC;
  193. }
  194. }
  195. return 0;
  196. }
  197. static void setup_slices(AVCodecContext *avctx,
  198. FFHWBaseEncodePicture *pic)
  199. {
  200. VulkanEncodeH264Context *enc = avctx->priv_data;
  201. VulkanEncodeH264Picture *hp = pic->codec_priv;
  202. hp->slice_wt = (StdVideoEncodeH264WeightTable) {
  203. .flags = (StdVideoEncodeH264WeightTableFlags) {
  204. .luma_weight_l0_flag = 0,
  205. .chroma_weight_l0_flag = 0,
  206. .luma_weight_l1_flag = 0,
  207. .chroma_weight_l1_flag = 0,
  208. },
  209. .luma_log2_weight_denom = 0,
  210. .chroma_log2_weight_denom = 0,
  211. .luma_weight_l0 = { 0 },
  212. .luma_offset_l0 = { 0 },
  213. .chroma_weight_l0 = { { 0 } },
  214. .chroma_offset_l0 = { { 0 } },
  215. .luma_weight_l1 = { 0 },
  216. .luma_offset_l1 = { 0 },
  217. .chroma_weight_l1 = { { 0 } },
  218. .chroma_offset_l1 = { { 0 } },
  219. };
  220. hp->slice_hdr = (StdVideoEncodeH264SliceHeader) {
  221. .flags = (StdVideoEncodeH264SliceHeaderFlags) {
  222. .direct_spatial_mv_pred_flag = 1,
  223. /* The vk_samples code does this */
  224. .num_ref_idx_active_override_flag =
  225. ((enc->units.raw_pps.num_ref_idx_l0_default_active_minus1) &&
  226. (pic->type == FF_HW_PICTURE_TYPE_B)) ? 1 : 0,
  227. },
  228. .first_mb_in_slice = 1,
  229. .slice_type = hp->slice_type,
  230. .slice_alpha_c0_offset_div2 = 0,
  231. .slice_beta_offset_div2 = 0,
  232. .slice_qp_delta = 0, /* Filled in below */
  233. /* Reserved */
  234. .cabac_init_idc = 0,
  235. .disable_deblocking_filter_idc = 0,
  236. .pWeightTable = NULL, // &hp->slice_wt,
  237. };
  238. hp->vkslice = (VkVideoEncodeH264NaluSliceInfoKHR) {
  239. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_NALU_SLICE_INFO_KHR,
  240. .pNext = NULL,
  241. .constantQp = pic->type == FF_HW_PICTURE_TYPE_B ? enc->fixed_qp_b :
  242. pic->type == FF_HW_PICTURE_TYPE_P ? enc->fixed_qp_p :
  243. enc->unit_opts.fixed_qp_idr,
  244. .pStdSliceHeader = &hp->slice_hdr,
  245. };
  246. if (enc->common.opts.rc_mode != VK_VIDEO_ENCODE_RATE_CONTROL_MODE_DISABLED_BIT_KHR)
  247. hp->vkslice.constantQp = 0;
  248. hp->slice_hdr.slice_qp_delta = hp->vkslice.constantQp -
  249. (enc->units.raw_pps.pic_init_qp_minus26 + 26);
  250. hp->vkh264pic_info.pNaluSliceEntries = &hp->vkslice;
  251. hp->vkh264pic_info.naluSliceEntryCount = 1;
  252. }
  253. static void vk_enc_h264_default_ref_pic_list(AVCodecContext *avctx,
  254. FFHWBaseEncodePicture *pic,
  255. FFHWBaseEncodePicture **rpl0,
  256. FFHWBaseEncodePicture **rpl1,
  257. int *rpl_size)
  258. {
  259. FFHWBaseEncodePicture *prev;
  260. VulkanEncodeH264Picture *hp, *hn, *hc;
  261. int i, j, n = 0;
  262. prev = pic->prev;
  263. av_assert0(prev);
  264. hp = pic->codec_priv;
  265. for (i = 0; i < pic->prev->nb_dpb_pics; i++) {
  266. hn = prev->dpb[i]->codec_priv;
  267. av_assert0(hn->frame_num < hp->frame_num);
  268. if (pic->type == FF_HW_PICTURE_TYPE_P) {
  269. for (j = n; j > 0; j--) {
  270. hc = rpl0[j - 1]->codec_priv;
  271. av_assert0(hc->frame_num != hn->frame_num);
  272. if (hc->frame_num > hn->frame_num)
  273. break;
  274. rpl0[j] = rpl0[j - 1];
  275. }
  276. rpl0[j] = prev->dpb[i];
  277. } else if (pic->type == FF_HW_PICTURE_TYPE_B) {
  278. for (j = n; j > 0; j--) {
  279. hc = rpl0[j - 1]->codec_priv;
  280. av_assert0(hc->pic_order_cnt != hp->pic_order_cnt);
  281. if (hc->pic_order_cnt < hp->pic_order_cnt) {
  282. if (hn->pic_order_cnt > hp->pic_order_cnt ||
  283. hn->pic_order_cnt < hc->pic_order_cnt)
  284. break;
  285. } else {
  286. if (hn->pic_order_cnt > hc->pic_order_cnt)
  287. break;
  288. }
  289. rpl0[j] = rpl0[j - 1];
  290. }
  291. rpl0[j] = prev->dpb[i];
  292. for (j = n; j > 0; j--) {
  293. hc = rpl1[j - 1]->codec_priv;
  294. av_assert0(hc->pic_order_cnt != hp->pic_order_cnt);
  295. if (hc->pic_order_cnt > hp->pic_order_cnt) {
  296. if (hn->pic_order_cnt < hp->pic_order_cnt ||
  297. hn->pic_order_cnt > hc->pic_order_cnt)
  298. break;
  299. } else {
  300. if (hn->pic_order_cnt < hc->pic_order_cnt)
  301. break;
  302. }
  303. rpl1[j] = rpl1[j - 1];
  304. }
  305. rpl1[j] = prev->dpb[i];
  306. }
  307. ++n;
  308. }
  309. if (pic->type == FF_HW_PICTURE_TYPE_B) {
  310. for (i = 0; i < n; i++) {
  311. if (rpl0[i] != rpl1[i])
  312. break;
  313. }
  314. if (i == n)
  315. FFSWAP(FFHWBaseEncodePicture *, rpl1[0], rpl1[1]);
  316. }
  317. if (pic->type == FF_HW_PICTURE_TYPE_P ||
  318. pic->type == FF_HW_PICTURE_TYPE_B) {
  319. av_log(avctx, AV_LOG_DEBUG, "Default RefPicList0 for fn=%d/poc=%d:",
  320. hp->frame_num, hp->pic_order_cnt);
  321. for (i = 0; i < n; i++) {
  322. hn = rpl0[i]->codec_priv;
  323. av_log(avctx, AV_LOG_DEBUG, " fn=%d/poc=%d",
  324. hn->frame_num, hn->pic_order_cnt);
  325. }
  326. av_log(avctx, AV_LOG_DEBUG, "\n");
  327. }
  328. if (pic->type == FF_HW_PICTURE_TYPE_B) {
  329. av_log(avctx, AV_LOG_DEBUG, "Default RefPicList1 for fn=%d/poc=%d:",
  330. hp->frame_num, hp->pic_order_cnt);
  331. for (i = 0; i < n; i++) {
  332. hn = rpl1[i]->codec_priv;
  333. av_log(avctx, AV_LOG_DEBUG, " fn=%d/poc=%d",
  334. hn->frame_num, hn->pic_order_cnt);
  335. }
  336. av_log(avctx, AV_LOG_DEBUG, "\n");
  337. }
  338. *rpl_size = n;
  339. }
  340. static void setup_refs(AVCodecContext *avctx,
  341. FFHWBaseEncodePicture *pic,
  342. VkVideoEncodeInfoKHR *encode_info)
  343. {
  344. int n, i, j;
  345. VulkanEncodeH264Context *enc = avctx->priv_data;
  346. VulkanEncodeH264Picture *hp = pic->codec_priv;
  347. FFHWBaseEncodePicture *prev = pic->prev;
  348. FFHWBaseEncodePicture *def_l0[MAX_DPB_SIZE], *def_l1[MAX_DPB_SIZE];
  349. VulkanEncodeH264Picture *href;
  350. hp->ref_list_info = (StdVideoEncodeH264ReferenceListsInfo) {
  351. .flags = (StdVideoEncodeH264ReferenceListsInfoFlags) {
  352. .ref_pic_list_modification_flag_l0 = 0,
  353. .ref_pic_list_modification_flag_l1 = 0,
  354. /* Reserved */
  355. },
  356. /* May be overridden during setup_slices() */
  357. .num_ref_idx_l0_active_minus1 = pic->nb_refs[0] - 1,
  358. .num_ref_idx_l1_active_minus1 = pic->nb_refs[1] - 1,
  359. /* .RefPicList0 is set in vk_enc_h264_default_ref_pic_list() */
  360. /* .RefPicList1 is set in vk_enc_h264_default_ref_pic_list() */
  361. /* Reserved */
  362. .pRefList0ModOperations = NULL, /* All set below */
  363. .refList0ModOpCount = 0,
  364. .pRefList1ModOperations = NULL,
  365. .refList1ModOpCount = 0,
  366. .pRefPicMarkingOperations = NULL,
  367. .refPicMarkingOpCount = 0,
  368. };
  369. for (i = 0; i < STD_VIDEO_H264_MAX_NUM_LIST_REF; i++)
  370. hp->ref_list_info.RefPicList0[i] = hp->ref_list_info.RefPicList1[i] = -1;
  371. /* Note: really not sure */
  372. for (int i = 0; i < pic->nb_refs[0]; i++) {
  373. VkVideoReferenceSlotInfoKHR *slot_info;
  374. slot_info = (VkVideoReferenceSlotInfoKHR *)&encode_info->pReferenceSlots[i];
  375. hp->ref_list_info.RefPicList0[i] = slot_info->slotIndex;
  376. }
  377. /* Note: really not sure */
  378. for (int i = 0; i < pic->nb_refs[1]; i++) {
  379. VkVideoReferenceSlotInfoKHR *slot_info;
  380. slot_info = (VkVideoReferenceSlotInfoKHR *)&encode_info->pReferenceSlots[pic->nb_refs[0] + i];
  381. hp->ref_list_info.RefPicList1[i] = slot_info->slotIndex;
  382. }
  383. hp->h264pic_info.pRefLists = &hp->ref_list_info;
  384. if (pic->is_reference && pic->type != FF_HW_PICTURE_TYPE_IDR) {
  385. FFHWBaseEncodePicture *discard_list[MAX_DPB_SIZE];
  386. int discard = 0, keep = 0;
  387. // Discard everything which is in the DPB of the previous frame but
  388. // not in the DPB of this one.
  389. for (i = 0; i < prev->nb_dpb_pics; i++) {
  390. for (j = 0; j < pic->nb_dpb_pics; j++) {
  391. if (prev->dpb[i] == pic->dpb[j])
  392. break;
  393. }
  394. if (j == pic->nb_dpb_pics) {
  395. discard_list[discard] = prev->dpb[i];
  396. ++discard;
  397. } else {
  398. ++keep;
  399. }
  400. }
  401. av_assert0(keep <= enc->units.dpb_frames);
  402. if (discard == 0) {
  403. hp->h264pic_info.flags.adaptive_ref_pic_marking_mode_flag = 0;
  404. } else {
  405. hp->h264pic_info.flags.adaptive_ref_pic_marking_mode_flag = 1;
  406. for (i = 0; i < discard; i++) {
  407. VulkanEncodeH264Picture *old = discard_list[i]->codec_priv;
  408. av_assert0(old->frame_num < hp->frame_num);
  409. hp->mmco[i] = (StdVideoEncodeH264RefPicMarkingEntry) {
  410. .memory_management_control_operation = 1,
  411. .difference_of_pic_nums_minus1 = hp->frame_num - old->frame_num - 1,
  412. };
  413. }
  414. hp->mmco[i] = (StdVideoEncodeH264RefPicMarkingEntry) {
  415. .memory_management_control_operation = 0,
  416. };
  417. hp->ref_list_info.pRefPicMarkingOperations = hp->mmco;
  418. hp->ref_list_info.refPicMarkingOpCount = i + 1;
  419. }
  420. }
  421. if (pic->type == FF_HW_PICTURE_TYPE_I || pic->type == FF_HW_PICTURE_TYPE_IDR)
  422. return;
  423. // If the intended references are not the first entries of RefPicListN
  424. // by default, use ref-pic-list-modification to move them there.
  425. vk_enc_h264_default_ref_pic_list(avctx, pic,
  426. def_l0, def_l1, &n);
  427. if (pic->type == FF_HW_PICTURE_TYPE_P) {
  428. int need_rplm = 0;
  429. for (i = 0; i < pic->nb_refs[0]; i++) {
  430. av_assert0(pic->refs[0][i]);
  431. if (pic->refs[0][i] != (FFHWBaseEncodePicture *)def_l0[i])
  432. need_rplm = 1;
  433. }
  434. hp->ref_list_info.flags.ref_pic_list_modification_flag_l0 = need_rplm;
  435. if (need_rplm) {
  436. int pic_num = hp->frame_num;
  437. for (i = 0; i < pic->nb_refs[0]; i++) {
  438. href = pic->refs[0][i]->codec_priv;
  439. av_assert0(href->frame_num != pic_num);
  440. if (href->frame_num < pic_num) {
  441. hp->mods[0][i] = (StdVideoEncodeH264RefListModEntry) {
  442. .modification_of_pic_nums_idc = 0,
  443. .abs_diff_pic_num_minus1 = pic_num - href->frame_num - 1,
  444. };
  445. } else {
  446. hp->mods[0][i] = (StdVideoEncodeH264RefListModEntry) {
  447. .modification_of_pic_nums_idc = 1,
  448. .abs_diff_pic_num_minus1 = href->frame_num - pic_num - 1,
  449. };
  450. }
  451. pic_num = href->frame_num;
  452. }
  453. hp->ref_list_info.pRefList0ModOperations = hp->mods[0];
  454. hp->ref_list_info.refList0ModOpCount = i - 1;
  455. }
  456. } else {
  457. int need_rplm_l0 = 0, need_rplm_l1 = 0;
  458. int n0 = 0, n1 = 0;
  459. for (i = 0; i < pic->nb_refs[0]; i++) {
  460. av_assert0(pic->refs[0][i]);
  461. href = pic->refs[0][i]->codec_priv;
  462. av_assert0(href->pic_order_cnt < hp->pic_order_cnt);
  463. if (pic->refs[0][i] != (FFHWBaseEncodePicture *)def_l0[n0])
  464. need_rplm_l0 = 1;
  465. ++n0;
  466. }
  467. for (int i = 0; i < pic->nb_refs[1]; i++) {
  468. av_assert0(pic->refs[1][i]);
  469. href = pic->refs[1][i]->codec_priv;
  470. av_assert0(href->pic_order_cnt > hp->pic_order_cnt);
  471. if (pic->refs[1][i] != (FFHWBaseEncodePicture *)def_l1[n1])
  472. need_rplm_l1 = 1;
  473. ++n1;
  474. }
  475. hp->ref_list_info.flags.ref_pic_list_modification_flag_l0 = need_rplm_l0;
  476. if (need_rplm_l0) {
  477. int pic_num = hp->frame_num;
  478. for (i = j = 0; i < pic->nb_refs[0]; i++) {
  479. href = pic->refs[0][i]->codec_priv;
  480. av_assert0(href->frame_num != pic_num);
  481. if (href->frame_num < pic_num) {
  482. hp->mods[0][j] = (StdVideoEncodeH264RefListModEntry) {
  483. .modification_of_pic_nums_idc = 0,
  484. .abs_diff_pic_num_minus1 = pic_num - href->frame_num - 1,
  485. };
  486. } else {
  487. hp->mods[0][j] = (StdVideoEncodeH264RefListModEntry) {
  488. .modification_of_pic_nums_idc = 1,
  489. .abs_diff_pic_num_minus1 = href->frame_num - pic_num - 1,
  490. };
  491. }
  492. pic_num = href->frame_num;
  493. ++j;
  494. }
  495. hp->ref_list_info.pRefList0ModOperations = hp->mods[0];
  496. hp->ref_list_info.refList0ModOpCount = j - 1;
  497. }
  498. hp->ref_list_info.flags.ref_pic_list_modification_flag_l1 = need_rplm_l1;
  499. if (need_rplm_l1) {
  500. int pic_num = hp->frame_num;
  501. for (i = j = 0; i < pic->nb_refs[1]; i++) {
  502. href = pic->refs[1][i]->codec_priv;
  503. av_assert0(href->frame_num != pic_num);
  504. if (href->frame_num < pic_num) {
  505. hp->mods[1][j] = (StdVideoEncodeH264RefListModEntry) {
  506. .modification_of_pic_nums_idc = 0,
  507. .abs_diff_pic_num_minus1 = pic_num - href->frame_num - 1,
  508. };
  509. } else {
  510. hp->mods[1][j] = (StdVideoEncodeH264RefListModEntry) {
  511. .modification_of_pic_nums_idc = 1,
  512. .abs_diff_pic_num_minus1 = href->frame_num - pic_num - 1,
  513. };
  514. }
  515. pic_num = href->frame_num;
  516. ++j;
  517. }
  518. hp->ref_list_info.pRefList1ModOperations = hp->mods[1];
  519. hp->ref_list_info.refList1ModOpCount = j - 1;
  520. }
  521. }
  522. }
  523. static int init_pic_params(AVCodecContext *avctx, FFHWBaseEncodePicture *pic,
  524. VkVideoEncodeInfoKHR *encode_info)
  525. {
  526. int err;
  527. FFVulkanEncodePicture *vp = pic->priv;
  528. VulkanEncodeH264Picture *hp = pic->codec_priv;
  529. VkVideoReferenceSlotInfoKHR *ref_slot;
  530. err = vk_enc_h264_update_pic_info(avctx, pic);
  531. if (err < 0)
  532. return err;
  533. hp->vkh264pic_info = (VkVideoEncodeH264PictureInfoKHR) {
  534. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_PICTURE_INFO_KHR,
  535. .pNext = NULL,
  536. .pNaluSliceEntries = NULL, // Filled in during setup_slices()
  537. .naluSliceEntryCount = 0, // Filled in during setup_slices()
  538. .pStdPictureInfo = &hp->h264pic_info,
  539. };
  540. hp->h264pic_info = (StdVideoEncodeH264PictureInfo) {
  541. .flags = (StdVideoEncodeH264PictureInfoFlags) {
  542. .IdrPicFlag = pic->type == FF_HW_PICTURE_TYPE_IDR,
  543. .is_reference = pic->is_reference,
  544. .no_output_of_prior_pics_flag = 0,
  545. .long_term_reference_flag = 0,
  546. .adaptive_ref_pic_marking_mode_flag = 0, // Filled in during setup_refs()
  547. /* Reserved */
  548. },
  549. .seq_parameter_set_id = 0,
  550. .pic_parameter_set_id = 0,
  551. .idr_pic_id = hp->idr_pic_id,
  552. .primary_pic_type = pic->type == FF_HW_PICTURE_TYPE_P ? STD_VIDEO_H264_PICTURE_TYPE_P :
  553. pic->type == FF_HW_PICTURE_TYPE_B ? STD_VIDEO_H264_PICTURE_TYPE_B :
  554. pic->type == FF_HW_PICTURE_TYPE_I ? STD_VIDEO_H264_PICTURE_TYPE_I :
  555. STD_VIDEO_H264_PICTURE_TYPE_IDR,
  556. .frame_num = hp->frame_num,
  557. .PicOrderCnt = hp->pic_order_cnt,
  558. .temporal_id = 0, /* ? */
  559. /* Reserved */
  560. .pRefLists = NULL, // Filled in during setup_refs
  561. };
  562. encode_info->pNext = &hp->vkh264pic_info;
  563. hp->h264dpb_info = (StdVideoEncodeH264ReferenceInfo) {
  564. .flags = (StdVideoEncodeH264ReferenceInfoFlags) {
  565. .used_for_long_term_reference = 0,
  566. /* Reserved */
  567. },
  568. .primary_pic_type = hp->h264pic_info.primary_pic_type,
  569. .FrameNum = hp->h264pic_info.frame_num,
  570. .PicOrderCnt = hp->h264pic_info.PicOrderCnt,
  571. .long_term_pic_num = 0,
  572. .long_term_frame_idx = 0,
  573. .temporal_id = hp->h264pic_info.temporal_id,
  574. };
  575. hp->vkh264dpb_info = (VkVideoEncodeH264DpbSlotInfoKHR) {
  576. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_DPB_SLOT_INFO_KHR,
  577. .pStdReferenceInfo = &hp->h264dpb_info,
  578. };
  579. vp->dpb_slot.pNext = &hp->vkh264dpb_info;
  580. ref_slot = (VkVideoReferenceSlotInfoKHR *)encode_info->pSetupReferenceSlot;
  581. ref_slot->pNext = &hp->vkh264dpb_info;
  582. setup_refs(avctx, pic, encode_info);
  583. setup_slices(avctx, pic);
  584. return 0;
  585. }
  586. static int init_profile(AVCodecContext *avctx,
  587. VkVideoProfileInfoKHR *profile, void *pnext)
  588. {
  589. VkResult ret;
  590. VulkanEncodeH264Context *enc = avctx->priv_data;
  591. FFVulkanEncodeContext *ctx = &enc->common;
  592. FFVulkanContext *s = &ctx->s;
  593. FFVulkanFunctions *vk = &ctx->s.vkfn;
  594. VkVideoEncodeH264CapabilitiesKHR h264_caps = {
  595. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_CAPABILITIES_KHR,
  596. };
  597. VkVideoEncodeCapabilitiesKHR enc_caps = {
  598. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_CAPABILITIES_KHR,
  599. .pNext = &h264_caps,
  600. };
  601. VkVideoCapabilitiesKHR caps = {
  602. .sType = VK_STRUCTURE_TYPE_VIDEO_CAPABILITIES_KHR,
  603. .pNext = &enc_caps,
  604. };
  605. /* In order of preference */
  606. int last_supported = AV_PROFILE_UNKNOWN;
  607. static const int known_profiles[] = {
  608. AV_PROFILE_H264_CONSTRAINED_BASELINE,
  609. AV_PROFILE_H264_MAIN,
  610. AV_PROFILE_H264_HIGH,
  611. AV_PROFILE_H264_HIGH_10,
  612. };
  613. int nb_profiles = FF_ARRAY_ELEMS(known_profiles);
  614. const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(s->frames->sw_format);
  615. if (!desc)
  616. return AVERROR(EINVAL);
  617. if (desc->comp[0].depth == 8)
  618. nb_profiles = 3;
  619. enc->profile = (VkVideoEncodeH264ProfileInfoKHR) {
  620. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_PROFILE_INFO_KHR,
  621. .pNext = pnext,
  622. .stdProfileIdc = ff_vk_h264_profile_to_vk(avctx->profile),
  623. };
  624. profile->pNext = &enc->profile;
  625. /* Set level */
  626. if (avctx->level == AV_LEVEL_UNKNOWN)
  627. avctx->level = enc->common.opts.level;
  628. /* User has explicitly specified a profile. */
  629. if (avctx->profile != AV_PROFILE_UNKNOWN)
  630. return 0;
  631. av_log(avctx, AV_LOG_DEBUG, "Supported profiles:\n");
  632. for (int i = 0; i < nb_profiles; i++) {
  633. enc->profile.stdProfileIdc = ff_vk_h264_profile_to_vk(known_profiles[i]);
  634. ret = vk->GetPhysicalDeviceVideoCapabilitiesKHR(s->hwctx->phys_dev,
  635. profile,
  636. &caps);
  637. if (ret == VK_SUCCESS) {
  638. av_log(avctx, AV_LOG_DEBUG, " %s\n",
  639. avcodec_profile_name(avctx->codec_id, known_profiles[i]));
  640. last_supported = known_profiles[i];
  641. }
  642. }
  643. if (last_supported == AV_PROFILE_UNKNOWN) {
  644. av_log(avctx, AV_LOG_ERROR, "No supported profiles for given format\n");
  645. return AVERROR(ENOTSUP);
  646. }
  647. enc->profile.stdProfileIdc = ff_vk_h264_profile_to_vk(last_supported);
  648. av_log(avctx, AV_LOG_VERBOSE, "Using profile %s\n",
  649. avcodec_profile_name(avctx->codec_id, last_supported));
  650. avctx->profile = last_supported;
  651. return 0;
  652. }
  653. static int init_enc_options(AVCodecContext *avctx)
  654. {
  655. VulkanEncodeH264Context *enc = avctx->priv_data;
  656. FFHWBaseEncodeH264Opts *unit_opts = &enc->unit_opts;
  657. if (avctx->rc_buffer_size)
  658. unit_opts->hrd_buffer_size = avctx->rc_buffer_size;
  659. else if (avctx->rc_max_rate > 0)
  660. unit_opts->hrd_buffer_size = avctx->rc_max_rate;
  661. else
  662. unit_opts->hrd_buffer_size = avctx->bit_rate;
  663. if (avctx->rc_initial_buffer_occupancy) {
  664. if (avctx->rc_initial_buffer_occupancy > unit_opts->hrd_buffer_size) {
  665. av_log(avctx, AV_LOG_ERROR, "Invalid RC buffer settings: "
  666. "must have initial buffer size (%d) <= "
  667. "buffer size (%"PRId64").\n",
  668. avctx->rc_initial_buffer_occupancy, unit_opts->hrd_buffer_size);
  669. return AVERROR(EINVAL);
  670. }
  671. unit_opts->initial_buffer_fullness = avctx->rc_initial_buffer_occupancy;
  672. } else {
  673. unit_opts->initial_buffer_fullness = unit_opts->hrd_buffer_size * 3 / 4;
  674. }
  675. if (enc->common.opts.rc_mode == VK_VIDEO_ENCODE_RATE_CONTROL_MODE_DISABLED_BIT_KHR) {
  676. /* HRD info is required for timing */
  677. enc->unit_elems &= ~UNIT_SEI_TIMING;
  678. enc->fixed_qp_p = av_clip(enc->common.explicit_qp,
  679. enc->caps.minQp, enc->caps.maxQp);
  680. if (avctx->i_quant_factor > 0.0)
  681. unit_opts->fixed_qp_idr = av_clip((avctx->i_quant_factor * enc->fixed_qp_p +
  682. avctx->i_quant_offset) + 0.5,
  683. enc->caps.minQp, enc->caps.maxQp);
  684. else
  685. unit_opts->fixed_qp_idr = enc->fixed_qp_p;
  686. if (avctx->b_quant_factor > 0.0)
  687. enc->fixed_qp_b = av_clip((avctx->b_quant_factor * enc->fixed_qp_p +
  688. avctx->b_quant_offset) + 0.5,
  689. enc->caps.minQp, enc->caps.maxQp);
  690. else
  691. enc->fixed_qp_b = enc->fixed_qp_p;
  692. av_log(avctx, AV_LOG_DEBUG, "Using fixed QP = "
  693. "%d / %d / %d for IDR- / P- / B-frames.\n",
  694. unit_opts->fixed_qp_idr, enc->fixed_qp_p, enc->fixed_qp_b);
  695. } else {
  696. unit_opts->fixed_qp_idr = 26;
  697. enc->fixed_qp_p = 26;
  698. enc->fixed_qp_b = 26;
  699. }
  700. return 0;
  701. }
  702. static av_cold int init_sequence_headers(AVCodecContext *avctx)
  703. {
  704. int err;
  705. VulkanEncodeH264Context *enc = avctx->priv_data;
  706. FFHWBaseEncodeH264 *units = &enc->units;
  707. FFHWBaseEncodeH264Opts *unit_opts = &enc->unit_opts;
  708. unit_opts->bit_rate = avctx->bit_rate;
  709. unit_opts->mb_width = FFALIGN(avctx->width, 16) / 16;
  710. unit_opts->mb_height = FFALIGN(avctx->height, 16) / 16;
  711. unit_opts->flags = enc->unit_elems & UNIT_SEI_TIMING ? FF_HW_H264_SEI_TIMING : 0;
  712. /* cabac already set via an option */
  713. /* fixed_qp_idr initialized in init_enc_options() */
  714. /* hrd_buffer_size initialized in init_enc_options() */
  715. /* initial_buffer_fullness initialized in init_enc_options() */
  716. err = ff_hw_base_encode_init_params_h264(&enc->common.base, avctx,
  717. units, unit_opts);
  718. if (err < 0)
  719. return err;
  720. units->raw_sps.seq_scaling_matrix_present_flag =
  721. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_SCALING_MATRIX_PRESENT_FLAG_SET_BIT_KHR);
  722. units->raw_pps.pic_scaling_matrix_present_flag =
  723. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_SCALING_MATRIX_PRESENT_FLAG_SET_BIT_KHR);
  724. units->raw_pps.transform_8x8_mode_flag =
  725. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_TRANSFORM_8X8_MODE_FLAG_SET_BIT_KHR);
  726. return 0;
  727. }
  728. typedef struct VulkanH264Units {
  729. StdVideoH264SequenceParameterSet vksps;
  730. StdVideoH264ScalingLists vksps_scaling;
  731. StdVideoH264HrdParameters vksps_vui_header;
  732. StdVideoH264SequenceParameterSetVui vksps_vui;
  733. StdVideoH264PictureParameterSet vkpps;
  734. StdVideoH264ScalingLists vkpps_scaling;
  735. } VulkanH264Units;
  736. static av_cold int base_unit_to_vk(AVCodecContext *avctx,
  737. VulkanH264Units *vk_units)
  738. {
  739. VulkanEncodeH264Context *enc = avctx->priv_data;
  740. FFHWBaseEncodeH264 *units = &enc->units;
  741. H264RawSPS *sps = &units->raw_sps;
  742. H264RawHRD *hrd = &sps->vui.nal_hrd_parameters;
  743. StdVideoH264ScalingLists *vksps_scaling = &vk_units->vksps_scaling;
  744. StdVideoH264HrdParameters *vksps_vui_header = &vk_units->vksps_vui_header;
  745. StdVideoH264SequenceParameterSetVui *vksps_vui = &vk_units->vksps_vui;
  746. StdVideoH264SequenceParameterSet *vksps = &vk_units->vksps;
  747. H264RawPPS *pps = &units->raw_pps;
  748. StdVideoH264ScalingLists *vkpps_scaling = &vk_units->vkpps_scaling;
  749. StdVideoH264PictureParameterSet *vkpps = &vk_units->vkpps;
  750. *vksps_scaling = (StdVideoH264ScalingLists) {
  751. .scaling_list_present_mask = 0x0, // mask
  752. .use_default_scaling_matrix_mask = 1,
  753. };
  754. *vksps_vui_header = (StdVideoH264HrdParameters) {
  755. .cpb_cnt_minus1 = hrd->cpb_cnt_minus1,
  756. .bit_rate_scale = hrd->bit_rate_scale,
  757. .cpb_size_scale = hrd->cpb_size_scale,
  758. /* Reserved */
  759. /* bit_rate/cpb_size/cbr_flag set below */
  760. .initial_cpb_removal_delay_length_minus1 = hrd->initial_cpb_removal_delay_length_minus1,
  761. .cpb_removal_delay_length_minus1 = hrd->cpb_removal_delay_length_minus1,
  762. .dpb_output_delay_length_minus1 = hrd->dpb_output_delay_length_minus1,
  763. .time_offset_length = hrd->time_offset_length,
  764. };
  765. for (int i = 0; i < H264_MAX_CPB_CNT; i++) {
  766. vksps_vui_header->bit_rate_value_minus1[i] = hrd->bit_rate_value_minus1[i];
  767. vksps_vui_header->cpb_size_value_minus1[i] = hrd->cpb_size_value_minus1[i];
  768. vksps_vui_header->cbr_flag[i] = hrd->cbr_flag[i];
  769. }
  770. *vksps_vui = (StdVideoH264SequenceParameterSetVui) {
  771. .flags = (StdVideoH264SpsVuiFlags) {
  772. .aspect_ratio_info_present_flag = sps->vui.aspect_ratio_info_present_flag,
  773. .overscan_info_present_flag = sps->vui.overscan_info_present_flag,
  774. .overscan_appropriate_flag = sps->vui.overscan_appropriate_flag,
  775. .video_signal_type_present_flag = sps->vui.video_signal_type_present_flag,
  776. .video_full_range_flag = sps->vui.video_full_range_flag,
  777. .color_description_present_flag = sps->vui.colour_description_present_flag,
  778. .chroma_loc_info_present_flag = sps->vui.chroma_loc_info_present_flag,
  779. .timing_info_present_flag = sps->vui.timing_info_present_flag,
  780. .fixed_frame_rate_flag = sps->vui.fixed_frame_rate_flag,
  781. .bitstream_restriction_flag = sps->vui.bitstream_restriction_flag,
  782. .nal_hrd_parameters_present_flag = sps->vui.nal_hrd_parameters_present_flag,
  783. .vcl_hrd_parameters_present_flag = sps->vui.vcl_hrd_parameters_present_flag,
  784. },
  785. .aspect_ratio_idc = sps->vui.aspect_ratio_idc,
  786. .sar_width = sps->vui.sar_width,
  787. .sar_height = sps->vui.sar_height,
  788. .video_format = sps->vui.video_format,
  789. .colour_primaries = sps->vui.colour_primaries,
  790. .transfer_characteristics = sps->vui.transfer_characteristics,
  791. .matrix_coefficients = sps->vui.matrix_coefficients,
  792. .num_units_in_tick = sps->vui.num_units_in_tick,
  793. .time_scale = sps->vui.time_scale,
  794. .max_num_reorder_frames = sps->vui.max_num_reorder_frames,
  795. .max_dec_frame_buffering = sps->vui.max_dec_frame_buffering,
  796. .chroma_sample_loc_type_top_field = sps->vui.chroma_sample_loc_type_top_field,
  797. .chroma_sample_loc_type_bottom_field = sps->vui.chroma_sample_loc_type_bottom_field,
  798. /* Reserved */
  799. .pHrdParameters = vksps_vui_header,
  800. };
  801. *vksps = (StdVideoH264SequenceParameterSet) {
  802. .flags = (StdVideoH264SpsFlags) {
  803. .constraint_set0_flag = sps->constraint_set0_flag,
  804. .constraint_set1_flag = sps->constraint_set1_flag,
  805. .constraint_set2_flag = sps->constraint_set2_flag,
  806. .constraint_set3_flag = sps->constraint_set3_flag,
  807. .constraint_set4_flag = sps->constraint_set4_flag,
  808. .constraint_set5_flag = sps->constraint_set5_flag,
  809. .direct_8x8_inference_flag = sps->direct_8x8_inference_flag,
  810. .mb_adaptive_frame_field_flag = sps->mb_adaptive_frame_field_flag,
  811. .frame_mbs_only_flag = sps->frame_mbs_only_flag,
  812. .delta_pic_order_always_zero_flag = sps->delta_pic_order_always_zero_flag,
  813. .separate_colour_plane_flag = sps->separate_colour_plane_flag,
  814. .gaps_in_frame_num_value_allowed_flag = sps->gaps_in_frame_num_allowed_flag,
  815. .qpprime_y_zero_transform_bypass_flag = sps->qpprime_y_zero_transform_bypass_flag,
  816. .frame_cropping_flag = sps->frame_cropping_flag,
  817. .seq_scaling_matrix_present_flag = sps->seq_scaling_matrix_present_flag,
  818. .vui_parameters_present_flag = sps->vui_parameters_present_flag,
  819. },
  820. .profile_idc = ff_vk_h264_profile_to_vk(sps->profile_idc),
  821. .level_idc = ff_vk_h264_level_to_vk(sps->level_idc),
  822. .chroma_format_idc = sps->chroma_format_idc,
  823. .seq_parameter_set_id = sps->seq_parameter_set_id,
  824. .bit_depth_luma_minus8 = sps->bit_depth_luma_minus8,
  825. .bit_depth_chroma_minus8 = sps->bit_depth_chroma_minus8,
  826. .log2_max_frame_num_minus4 = sps->log2_max_frame_num_minus4,
  827. .pic_order_cnt_type = sps->pic_order_cnt_type,
  828. .offset_for_non_ref_pic = sps->offset_for_non_ref_pic,
  829. .offset_for_top_to_bottom_field = sps->offset_for_top_to_bottom_field,
  830. .log2_max_pic_order_cnt_lsb_minus4 = sps->log2_max_pic_order_cnt_lsb_minus4,
  831. .num_ref_frames_in_pic_order_cnt_cycle = sps->num_ref_frames_in_pic_order_cnt_cycle,
  832. .max_num_ref_frames = sps->max_num_ref_frames,
  833. /* Reserved */
  834. .pic_width_in_mbs_minus1 = sps->pic_width_in_mbs_minus1,
  835. .pic_height_in_map_units_minus1 = sps->pic_height_in_map_units_minus1,
  836. .frame_crop_left_offset = sps->frame_crop_left_offset,
  837. .frame_crop_right_offset = sps->frame_crop_right_offset,
  838. .frame_crop_top_offset = sps->frame_crop_top_offset,
  839. .frame_crop_bottom_offset = sps->frame_crop_bottom_offset,
  840. /* Reserved */
  841. .pOffsetForRefFrame = sps->offset_for_ref_frame,
  842. .pScalingLists = vksps_scaling,
  843. .pSequenceParameterSetVui = vksps_vui,
  844. };
  845. *vkpps_scaling = (StdVideoH264ScalingLists) {
  846. .scaling_list_present_mask = 0x0, // mask
  847. .use_default_scaling_matrix_mask = 1,
  848. };
  849. *vkpps = (StdVideoH264PictureParameterSet) {
  850. .flags = (StdVideoH264PpsFlags) {
  851. .transform_8x8_mode_flag = pps->transform_8x8_mode_flag,
  852. .redundant_pic_cnt_present_flag = pps->redundant_pic_cnt_present_flag,
  853. .constrained_intra_pred_flag = pps->constrained_intra_pred_flag,
  854. .deblocking_filter_control_present_flag = pps->deblocking_filter_control_present_flag,
  855. .weighted_pred_flag = pps->weighted_pred_flag,
  856. .bottom_field_pic_order_in_frame_present_flag = pps->bottom_field_pic_order_in_frame_present_flag,
  857. .entropy_coding_mode_flag = pps->entropy_coding_mode_flag,
  858. .pic_scaling_matrix_present_flag = pps->pic_scaling_matrix_present_flag,
  859. },
  860. .seq_parameter_set_id = pps->seq_parameter_set_id,
  861. .pic_parameter_set_id = pps->pic_parameter_set_id,
  862. .num_ref_idx_l0_default_active_minus1 = pps->num_ref_idx_l0_default_active_minus1,
  863. .num_ref_idx_l1_default_active_minus1 = pps->num_ref_idx_l1_default_active_minus1,
  864. .weighted_bipred_idc = pps->weighted_bipred_idc,
  865. .pic_init_qp_minus26 = pps->pic_init_qp_minus26,
  866. .pic_init_qs_minus26 = pps->pic_init_qs_minus26,
  867. .chroma_qp_index_offset = pps->chroma_qp_index_offset,
  868. .second_chroma_qp_index_offset = pps->second_chroma_qp_index_offset,
  869. .pScalingLists = vkpps_scaling,
  870. };
  871. return 0;
  872. }
  873. static int create_session_params(AVCodecContext *avctx)
  874. {
  875. int err;
  876. VulkanEncodeH264Context *enc = avctx->priv_data;
  877. FFVulkanEncodeContext *ctx = &enc->common;
  878. FFVulkanContext *s = &ctx->s;
  879. FFVulkanFunctions *vk = &ctx->s.vkfn;
  880. VulkanH264Units vk_units = { 0 };
  881. VkVideoEncodeH264SessionParametersAddInfoKHR h264_params_info;
  882. VkVideoEncodeH264SessionParametersCreateInfoKHR h264_params;
  883. /* Convert it to Vulkan */
  884. err = base_unit_to_vk(avctx, &vk_units);
  885. if (err < 0) {
  886. av_log(avctx, AV_LOG_ERROR, "Unable to convert SPS/PPS units to Vulkan: %s\n",
  887. av_err2str(err));
  888. return err;
  889. }
  890. /* Destroy the session params */
  891. if (ctx->session_params)
  892. vk->DestroyVideoSessionParametersKHR(s->hwctx->act_dev,
  893. ctx->session_params,
  894. s->hwctx->alloc);
  895. h264_params_info = (VkVideoEncodeH264SessionParametersAddInfoKHR) {
  896. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_SESSION_PARAMETERS_ADD_INFO_KHR,
  897. .pStdSPSs = &vk_units.vksps,
  898. .stdSPSCount = 1,
  899. .pStdPPSs = &vk_units.vkpps,
  900. .stdPPSCount = 1,
  901. };
  902. h264_params = (VkVideoEncodeH264SessionParametersCreateInfoKHR) {
  903. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_SESSION_PARAMETERS_CREATE_INFO_KHR,
  904. .maxStdSPSCount = 1,
  905. .maxStdPPSCount = 1,
  906. .pParametersAddInfo = &h264_params_info,
  907. };
  908. return ff_vulkan_encode_create_session_params(avctx, ctx, &h264_params);
  909. }
  910. static int parse_feedback_units(AVCodecContext *avctx,
  911. const uint8_t *data, size_t size,
  912. int sps_override, int pps_override)
  913. {
  914. int err;
  915. VulkanEncodeH264Context *enc = avctx->priv_data;
  916. CodedBitstreamContext *cbs;
  917. CodedBitstreamFragment au = { 0 };
  918. err = ff_cbs_init(&cbs, AV_CODEC_ID_H264, avctx);
  919. if (err < 0)
  920. return err;
  921. err = ff_cbs_read(cbs, &au, data, size);
  922. if (err < 0) {
  923. av_log(avctx, AV_LOG_ERROR, "Unable to parse feedback units, bad drivers: %s\n",
  924. av_err2str(err));
  925. return err;
  926. }
  927. /* If PPS has an override, just copy it entirely. */
  928. if (pps_override) {
  929. for (int i = 0; i < au.nb_units; i++) {
  930. if (au.units[i].type == H264_NAL_PPS) {
  931. H264RawPPS *pps = au.units[i].content;
  932. memcpy(&enc->units.raw_pps, pps, sizeof(*pps));
  933. break;
  934. }
  935. }
  936. }
  937. ff_cbs_fragment_free(&au);
  938. ff_cbs_close(&cbs);
  939. return 0;
  940. }
  941. static int init_base_units(AVCodecContext *avctx)
  942. {
  943. int err;
  944. VkResult ret;
  945. VulkanEncodeH264Context *enc = avctx->priv_data;
  946. FFVulkanEncodeContext *ctx = &enc->common;
  947. FFVulkanContext *s = &ctx->s;
  948. FFVulkanFunctions *vk = &ctx->s.vkfn;
  949. VkVideoEncodeH264SessionParametersGetInfoKHR h264_params_info;
  950. VkVideoEncodeSessionParametersGetInfoKHR params_info;
  951. VkVideoEncodeH264SessionParametersFeedbackInfoKHR h264_params_feedback;
  952. VkVideoEncodeSessionParametersFeedbackInfoKHR params_feedback;
  953. void *data = NULL;
  954. size_t data_size = 0;
  955. /* Generate SPS/PPS unit info */
  956. err = init_sequence_headers(avctx);
  957. if (err < 0) {
  958. av_log(avctx, AV_LOG_ERROR, "Unable to initialize SPS/PPS units: %s\n",
  959. av_err2str(err));
  960. return err;
  961. }
  962. /* Create session parameters from them */
  963. err = create_session_params(avctx);
  964. if (err < 0)
  965. return err;
  966. h264_params_info = (VkVideoEncodeH264SessionParametersGetInfoKHR) {
  967. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_SESSION_PARAMETERS_GET_INFO_KHR,
  968. .writeStdSPS = 1,
  969. .writeStdPPS = 1,
  970. .stdSPSId = enc->units.raw_sps.seq_parameter_set_id,
  971. .stdPPSId = enc->units.raw_pps.pic_parameter_set_id,
  972. };
  973. params_info = (VkVideoEncodeSessionParametersGetInfoKHR) {
  974. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_SESSION_PARAMETERS_GET_INFO_KHR,
  975. .pNext = &h264_params_info,
  976. .videoSessionParameters = ctx->session_params,
  977. };
  978. h264_params_feedback = (VkVideoEncodeH264SessionParametersFeedbackInfoKHR) {
  979. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_SESSION_PARAMETERS_FEEDBACK_INFO_KHR,
  980. };
  981. params_feedback = (VkVideoEncodeSessionParametersFeedbackInfoKHR) {
  982. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_SESSION_PARAMETERS_FEEDBACK_INFO_KHR,
  983. .pNext = &h264_params_feedback,
  984. };
  985. ret = vk->GetEncodedVideoSessionParametersKHR(s->hwctx->act_dev, &params_info,
  986. &params_feedback,
  987. &data_size, data);
  988. if (ret == VK_INCOMPLETE ||
  989. (ret == VK_SUCCESS) && (data_size > 0)) {
  990. data = av_mallocz(data_size);
  991. if (!data)
  992. return AVERROR(ENOMEM);
  993. } else {
  994. av_log(avctx, AV_LOG_ERROR, "Unable to get feedback for H.264 units = %lu\n", data_size);
  995. return err;
  996. }
  997. ret = vk->GetEncodedVideoSessionParametersKHR(s->hwctx->act_dev, &params_info,
  998. &params_feedback,
  999. &data_size, data);
  1000. if (ret != VK_SUCCESS) {
  1001. av_log(avctx, AV_LOG_ERROR, "Error writing feedback units\n");
  1002. return err;
  1003. }
  1004. av_log(avctx, AV_LOG_VERBOSE, "Feedback units written, overrides: %i (SPS: %i PPS: %i)\n",
  1005. params_feedback.hasOverrides,
  1006. h264_params_feedback.hasStdSPSOverrides,
  1007. h264_params_feedback.hasStdPPSOverrides);
  1008. params_feedback.hasOverrides = 1;
  1009. h264_params_feedback.hasStdPPSOverrides = 1;
  1010. /* No need to sync any overrides */
  1011. if (!params_feedback.hasOverrides)
  1012. return 0;
  1013. /* Parse back tne units and override */
  1014. err = parse_feedback_units(avctx, data, data_size,
  1015. h264_params_feedback.hasStdSPSOverrides,
  1016. h264_params_feedback.hasStdPPSOverrides);
  1017. if (err < 0)
  1018. return err;
  1019. /* Create final session parameters */
  1020. err = create_session_params(avctx);
  1021. if (err < 0)
  1022. return err;
  1023. return 0;
  1024. }
  1025. static int vulkan_encode_h264_add_nal(AVCodecContext *avctx,
  1026. CodedBitstreamFragment *au,
  1027. void *nal_unit)
  1028. {
  1029. H264RawNALUnitHeader *header = nal_unit;
  1030. int err = ff_cbs_insert_unit_content(au, -1,
  1031. header->nal_unit_type, nal_unit, NULL);
  1032. if (err < 0)
  1033. av_log(avctx, AV_LOG_ERROR, "Failed to add NAL unit: "
  1034. "type = %d.\n", header->nal_unit_type);
  1035. return err;
  1036. }
  1037. static int write_access_unit(AVCodecContext *avctx,
  1038. uint8_t *data, size_t *data_len,
  1039. CodedBitstreamFragment *au)
  1040. {
  1041. VulkanEncodeH264Context *enc = avctx->priv_data;
  1042. int err = ff_cbs_write_fragment_data(enc->cbs, au);
  1043. if (err < 0) {
  1044. av_log(avctx, AV_LOG_ERROR, "Failed to write packed header.\n");
  1045. return err;
  1046. }
  1047. if (*data_len < au->data_size) {
  1048. av_log(avctx, AV_LOG_ERROR, "Access unit too large: %zu < %zu.\n",
  1049. *data_len, au->data_size);
  1050. return AVERROR(ENOSPC);
  1051. }
  1052. memcpy(data, au->data, au->data_size);
  1053. *data_len = au->data_size;
  1054. return 0;
  1055. }
  1056. static int write_sequence_headers(AVCodecContext *avctx,
  1057. FFHWBaseEncodePicture *base_pic,
  1058. uint8_t *data, size_t *data_len)
  1059. {
  1060. int err;
  1061. VulkanEncodeH264Context *enc = avctx->priv_data;
  1062. VulkanEncodeH264Picture *hp = base_pic ? base_pic->codec_priv : NULL;
  1063. CodedBitstreamFragment *au = &enc->current_access_unit;
  1064. if (hp && hp->units_needed & UNIT_AUD) {
  1065. err = vulkan_encode_h264_add_nal(avctx, au, &enc->raw_aud);
  1066. if (err < 0)
  1067. goto fail;
  1068. }
  1069. err = vulkan_encode_h264_add_nal(avctx, au, &enc->units.raw_sps);
  1070. if (err < 0)
  1071. goto fail;
  1072. err = vulkan_encode_h264_add_nal(avctx, au, &enc->units.raw_pps);
  1073. if (err < 0)
  1074. goto fail;
  1075. err = write_access_unit(avctx, data, data_len, au);
  1076. fail:
  1077. ff_cbs_fragment_reset(au);
  1078. return err;
  1079. }
  1080. static int write_extra_headers(AVCodecContext *avctx,
  1081. FFHWBaseEncodePicture *base_pic,
  1082. uint8_t *data, size_t *data_len)
  1083. {
  1084. int err;
  1085. VulkanEncodeH264Context *enc = avctx->priv_data;
  1086. VulkanEncodeH264Picture *hp = base_pic->codec_priv;
  1087. CodedBitstreamFragment *au = &enc->current_access_unit;
  1088. if (hp->units_needed & UNIT_AUD) {
  1089. err = vulkan_encode_h264_add_nal(avctx, au, &enc->raw_aud);
  1090. if (err < 0)
  1091. goto fail;
  1092. }
  1093. if (hp->units_needed & UNIT_SEI_IDENTIFIER) {
  1094. err = ff_cbs_sei_add_message(enc->cbs, au, 1,
  1095. SEI_TYPE_USER_DATA_UNREGISTERED,
  1096. &enc->sei_identifier, NULL);
  1097. if (err < 0)
  1098. goto fail;
  1099. }
  1100. if (hp->units_needed & UNIT_SEI_TIMING) {
  1101. if (base_pic->type == FF_HW_PICTURE_TYPE_IDR) {
  1102. err = ff_cbs_sei_add_message(enc->cbs, au, 1,
  1103. SEI_TYPE_BUFFERING_PERIOD,
  1104. &enc->units.sei_buffering_period, NULL);
  1105. if (err < 0)
  1106. goto fail;
  1107. }
  1108. err = ff_cbs_sei_add_message(enc->cbs, au, 1,
  1109. SEI_TYPE_PIC_TIMING,
  1110. &enc->sei_pic_timing, NULL);
  1111. if (err < 0)
  1112. goto fail;
  1113. }
  1114. if (hp->units_needed & UNIT_SEI_RECOVERY) {
  1115. err = ff_cbs_sei_add_message(enc->cbs, au, 1,
  1116. SEI_TYPE_RECOVERY_POINT,
  1117. &enc->sei_recovery_point, NULL);
  1118. if (err < 0)
  1119. goto fail;
  1120. }
  1121. if (hp->units_needed & UNIT_SEI_A53_CC) {
  1122. err = ff_cbs_sei_add_message(enc->cbs, au, 1,
  1123. SEI_TYPE_USER_DATA_REGISTERED_ITU_T_T35,
  1124. &enc->sei_a53cc, NULL);
  1125. if (err < 0)
  1126. goto fail;
  1127. }
  1128. if (hp->units_needed) {
  1129. err = write_access_unit(avctx, data, data_len, au);
  1130. if (err < 0)
  1131. goto fail;
  1132. } else {
  1133. *data_len = 0;
  1134. }
  1135. fail:
  1136. ff_cbs_fragment_reset(au);
  1137. return err;
  1138. }
  1139. static int write_filler(AVCodecContext *avctx, uint32_t filler,
  1140. uint8_t *data, size_t *data_len)
  1141. {
  1142. int err;
  1143. VulkanEncodeH264Context *enc = avctx->priv_data;
  1144. CodedBitstreamFragment *au = &enc->current_access_unit;
  1145. H264RawFiller raw_filler = {
  1146. .nal_unit_header = {
  1147. .nal_unit_type = H264_NAL_FILLER_DATA,
  1148. },
  1149. .filler_size = filler,
  1150. };
  1151. err = vulkan_encode_h264_add_nal(avctx, au, &raw_filler);
  1152. if (err < 0)
  1153. goto fail;
  1154. err = write_access_unit(avctx, data, data_len, au);
  1155. fail:
  1156. ff_cbs_fragment_reset(au);
  1157. return err;
  1158. }
  1159. static const FFVulkanCodec enc_cb = {
  1160. .flags = FF_HW_FLAG_B_PICTURES |
  1161. FF_HW_FLAG_B_PICTURE_REFERENCES |
  1162. FF_HW_FLAG_NON_IDR_KEY_PICTURES,
  1163. .picture_priv_data_size = sizeof(VulkanEncodeH264Picture),
  1164. .filler_header_size = 6,
  1165. .init_profile = init_profile,
  1166. .init_pic_rc = init_pic_rc,
  1167. .init_pic_params = init_pic_params,
  1168. .write_sequence_headers = write_sequence_headers,
  1169. .write_extra_headers = write_extra_headers,
  1170. .write_filler = write_filler,
  1171. };
  1172. static av_cold int vulkan_encode_h264_init(AVCodecContext *avctx)
  1173. {
  1174. int err, ref_l0, ref_l1;
  1175. VulkanEncodeH264Context *enc = avctx->priv_data;
  1176. FFVulkanEncodeContext *ctx = &enc->common;
  1177. FFVulkanContext *s = &ctx->s;
  1178. FFHWBaseEncodeContext *base_ctx = &ctx->base;
  1179. int flags;
  1180. if (avctx->profile == AV_PROFILE_UNKNOWN)
  1181. avctx->profile = enc->common.opts.profile;
  1182. enc->caps = (VkVideoEncodeH264CapabilitiesKHR) {
  1183. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_CAPABILITIES_KHR,
  1184. };
  1185. enc->quality_props = (VkVideoEncodeH264QualityLevelPropertiesKHR) {
  1186. .sType = VK_STRUCTURE_TYPE_VIDEO_ENCODE_H264_QUALITY_LEVEL_PROPERTIES_KHR,
  1187. };
  1188. err = ff_vulkan_encode_init(avctx, &enc->common,
  1189. &ff_vk_enc_h264_desc, &enc_cb,
  1190. &enc->caps, &enc->quality_props);
  1191. if (err < 0)
  1192. return err;
  1193. av_log(avctx, AV_LOG_VERBOSE, "H264 encoder capabilities:\n");
  1194. av_log(avctx, AV_LOG_VERBOSE, " Standard capability flags:\n");
  1195. av_log(avctx, AV_LOG_VERBOSE, " separate_color_plane: %i\n",
  1196. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_SEPARATE_COLOR_PLANE_FLAG_SET_BIT_KHR));
  1197. av_log(avctx, AV_LOG_VERBOSE, " qprime_y_zero_transform_bypass: %i\n",
  1198. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_QPPRIME_Y_ZERO_TRANSFORM_BYPASS_FLAG_SET_BIT_KHR));
  1199. av_log(avctx, AV_LOG_VERBOSE, " scaling_lists: %i\n",
  1200. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_SCALING_MATRIX_PRESENT_FLAG_SET_BIT_KHR));
  1201. av_log(avctx, AV_LOG_VERBOSE, " chroma_qp_index_offset: %i\n",
  1202. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_CHROMA_QP_INDEX_OFFSET_BIT_KHR));
  1203. av_log(avctx, AV_LOG_VERBOSE, " second_chroma_qp_index_offset: %i\n",
  1204. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_SECOND_CHROMA_QP_INDEX_OFFSET_BIT_KHR));
  1205. av_log(avctx, AV_LOG_VERBOSE, " pic_init_qp: %i\n",
  1206. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_PIC_INIT_QP_MINUS26_BIT_KHR));
  1207. av_log(avctx, AV_LOG_VERBOSE, " weighted:%s%s%s\n",
  1208. enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_WEIGHTED_PRED_FLAG_SET_BIT_KHR ?
  1209. " pred" : "",
  1210. enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_WEIGHTED_BIPRED_IDC_EXPLICIT_BIT_KHR ?
  1211. " bipred_explicit" : "",
  1212. enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_WEIGHTED_BIPRED_IDC_IMPLICIT_BIT_KHR ?
  1213. " bipred_implicit" : "");
  1214. av_log(avctx, AV_LOG_VERBOSE, " 8x8_transforms: %i\n",
  1215. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_TRANSFORM_8X8_MODE_FLAG_SET_BIT_KHR));
  1216. av_log(avctx, AV_LOG_VERBOSE, " disable_direct_spatial_mv_pred: %i\n",
  1217. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_DIRECT_SPATIAL_MV_PRED_FLAG_UNSET_BIT_KHR));
  1218. av_log(avctx, AV_LOG_VERBOSE, " coder:%s%s\n",
  1219. enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_ENTROPY_CODING_MODE_FLAG_UNSET_BIT_KHR ?
  1220. " cabac" : "",
  1221. enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_ENTROPY_CODING_MODE_FLAG_SET_BIT_KHR ?
  1222. " cavlc" : "");
  1223. av_log(avctx, AV_LOG_VERBOSE, " direct_8x8_inference: %i\n",
  1224. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_DIRECT_8X8_INFERENCE_FLAG_UNSET_BIT_KHR));
  1225. av_log(avctx, AV_LOG_VERBOSE, " constrained_intra_pred: %i\n",
  1226. !!(enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_CONSTRAINED_INTRA_PRED_FLAG_SET_BIT_KHR));
  1227. av_log(avctx, AV_LOG_VERBOSE, " deblock:%s%s%s\n",
  1228. enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_DEBLOCKING_FILTER_DISABLED_BIT_KHR ?
  1229. " filter_disabling" : "",
  1230. enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_DEBLOCKING_FILTER_ENABLED_BIT_KHR ?
  1231. " filter_enabling" : "",
  1232. enc->caps.stdSyntaxFlags & VK_VIDEO_ENCODE_H264_STD_DEBLOCKING_FILTER_PARTIAL_BIT_KHR ?
  1233. " filter_partial" : "");
  1234. av_log(avctx, AV_LOG_VERBOSE, " Capability flags:\n");
  1235. av_log(avctx, AV_LOG_VERBOSE, " hdr_compliance: %i\n",
  1236. !!(enc->caps.flags & VK_VIDEO_ENCODE_H264_CAPABILITY_HRD_COMPLIANCE_BIT_KHR));
  1237. av_log(avctx, AV_LOG_VERBOSE, " pred_weight_table_generated: %i\n",
  1238. !!(enc->caps.flags & VK_VIDEO_ENCODE_H264_CAPABILITY_PREDICTION_WEIGHT_TABLE_GENERATED_BIT_KHR));
  1239. av_log(avctx, AV_LOG_VERBOSE, " row_unaligned_slice: %i\n",
  1240. !!(enc->caps.flags & VK_VIDEO_ENCODE_H264_CAPABILITY_ROW_UNALIGNED_SLICE_BIT_KHR));
  1241. av_log(avctx, AV_LOG_VERBOSE, " different_slice_type: %i\n",
  1242. !!(enc->caps.flags & VK_VIDEO_ENCODE_H264_CAPABILITY_DIFFERENT_SLICE_TYPE_BIT_KHR));
  1243. av_log(avctx, AV_LOG_VERBOSE, " b_frame_in_l0_list: %i\n",
  1244. !!(enc->caps.flags & VK_VIDEO_ENCODE_H264_CAPABILITY_B_FRAME_IN_L0_LIST_BIT_KHR));
  1245. av_log(avctx, AV_LOG_VERBOSE, " b_frame_in_l1_list: %i\n",
  1246. !!(enc->caps.flags & VK_VIDEO_ENCODE_H264_CAPABILITY_B_FRAME_IN_L1_LIST_BIT_KHR));
  1247. av_log(avctx, AV_LOG_VERBOSE, " per_pict_type_min_max_qp: %i\n",
  1248. !!(enc->caps.flags & VK_VIDEO_ENCODE_H264_CAPABILITY_PER_PICTURE_TYPE_MIN_MAX_QP_BIT_KHR));
  1249. av_log(avctx, AV_LOG_VERBOSE, " per_slice_constant_qp: %i\n",
  1250. !!(enc->caps.flags & VK_VIDEO_ENCODE_H264_CAPABILITY_PER_SLICE_CONSTANT_QP_BIT_KHR));
  1251. av_log(avctx, AV_LOG_VERBOSE, " generate_prefix_nalu: %i\n",
  1252. !!(enc->caps.flags & VK_VIDEO_ENCODE_H264_CAPABILITY_GENERATE_PREFIX_NALU_BIT_KHR));
  1253. av_log(avctx, AV_LOG_VERBOSE, " Capabilities:\n");
  1254. av_log(avctx, AV_LOG_VERBOSE, " maxLevelIdc: %i\n",
  1255. enc->caps.maxLevelIdc);
  1256. av_log(avctx, AV_LOG_VERBOSE, " maxSliceCount: %i\n",
  1257. enc->caps.maxSliceCount);
  1258. av_log(avctx, AV_LOG_VERBOSE, " max(P/B)PictureL0ReferenceCount: %i P's; %i B's\n",
  1259. enc->caps.maxPPictureL0ReferenceCount,
  1260. enc->caps.maxBPictureL0ReferenceCount);
  1261. av_log(avctx, AV_LOG_VERBOSE, " maxL1ReferenceCount: %i\n",
  1262. enc->caps.maxL1ReferenceCount);
  1263. av_log(avctx, AV_LOG_VERBOSE, " maxTemporalLayerCount: %i\n",
  1264. enc->caps.maxTemporalLayerCount);
  1265. av_log(avctx, AV_LOG_VERBOSE, " expectDyadicTemporalLayerPattern: %i\n",
  1266. enc->caps.expectDyadicTemporalLayerPattern);
  1267. av_log(avctx, AV_LOG_VERBOSE, " min/max Qp: [%i, %i]\n",
  1268. enc->caps.minQp, enc->caps.maxQp);
  1269. av_log(avctx, AV_LOG_VERBOSE, " prefersGopRemainingFrames: %i\n",
  1270. enc->caps.prefersGopRemainingFrames);
  1271. av_log(avctx, AV_LOG_VERBOSE, " requiresGopRemainingFrames: %i\n",
  1272. enc->caps.requiresGopRemainingFrames);
  1273. err = init_enc_options(avctx);
  1274. if (err < 0)
  1275. return err;
  1276. flags = ctx->codec->flags;
  1277. if (!enc->caps.maxPPictureL0ReferenceCount &&
  1278. !enc->caps.maxBPictureL0ReferenceCount &&
  1279. !enc->caps.maxL1ReferenceCount) {
  1280. /* Intra-only */
  1281. flags |= FF_HW_FLAG_INTRA_ONLY;
  1282. ref_l0 = ref_l1 = 0;
  1283. } else if (!enc->caps.maxPPictureL0ReferenceCount) {
  1284. /* No P-frames? How. */
  1285. base_ctx->p_to_gpb = 1;
  1286. ref_l0 = enc->caps.maxBPictureL0ReferenceCount;
  1287. ref_l1 = enc->caps.maxL1ReferenceCount;
  1288. } else if (!enc->caps.maxBPictureL0ReferenceCount &&
  1289. !enc->caps.maxL1ReferenceCount) {
  1290. /* No B-frames */
  1291. flags &= ~(FF_HW_FLAG_B_PICTURES | FF_HW_FLAG_B_PICTURE_REFERENCES);
  1292. ref_l0 = enc->caps.maxPPictureL0ReferenceCount;
  1293. ref_l1 = 0;
  1294. } else {
  1295. /* P and B frames */
  1296. ref_l0 = FFMIN(enc->caps.maxPPictureL0ReferenceCount,
  1297. enc->caps.maxBPictureL0ReferenceCount);
  1298. ref_l1 = enc->caps.maxL1ReferenceCount;
  1299. }
  1300. err = ff_hw_base_init_gop_structure(base_ctx, avctx, ref_l0, ref_l1,
  1301. flags, 0);
  1302. if (err < 0)
  1303. return err;
  1304. base_ctx->output_delay = base_ctx->b_per_p;
  1305. base_ctx->decode_delay = base_ctx->max_b_depth;
  1306. /* Prepare SEI */
  1307. if (enc->unit_elems & UNIT_SEI_IDENTIFIER) {
  1308. int len;
  1309. memcpy(enc->sei_identifier.uuid_iso_iec_11578,
  1310. vulkan_encode_h264_sei_identifier_uuid,
  1311. sizeof(enc->sei_identifier.uuid_iso_iec_11578));
  1312. len = snprintf(NULL, 0,
  1313. "%s / Vulkan video %i.%i.%i / %s %i.%i.%i / %s",
  1314. LIBAVCODEC_IDENT,
  1315. CODEC_VER(ff_vk_enc_h264_desc.ext_props.specVersion),
  1316. s->driver_props.driverName,
  1317. CODEC_VER(s->props.properties.driverVersion),
  1318. s->props.properties.deviceName);
  1319. if (len >= 0) {
  1320. enc->sei_identifier_string = av_malloc(len + 1);
  1321. if (!enc->sei_identifier_string)
  1322. return AVERROR(ENOMEM);
  1323. len = snprintf(enc->sei_identifier_string, len + 1,
  1324. "%s / Vulkan video %i.%i.%i / %s %i.%i.%i / %s",
  1325. LIBAVCODEC_IDENT,
  1326. CODEC_VER(ff_vk_enc_h264_desc.ext_props.specVersion),
  1327. s->driver_props.driverName,
  1328. CODEC_VER(s->props.properties.driverVersion),
  1329. s->props.properties.deviceName);
  1330. enc->sei_identifier.data = enc->sei_identifier_string;
  1331. enc->sei_identifier.data_length = len + 1;
  1332. }
  1333. }
  1334. /* Init CBS */
  1335. err = ff_cbs_init(&enc->cbs, AV_CODEC_ID_H264, avctx);
  1336. if (err < 0)
  1337. return err;
  1338. /* Create units and session parameters */
  1339. err = init_base_units(avctx);
  1340. if (err < 0)
  1341. return err;
  1342. /* Write out extradata */
  1343. err = ff_vulkan_write_global_header(avctx, &enc->common);
  1344. if (err < 0)
  1345. return err;
  1346. return 0;
  1347. }
  1348. static av_cold int vulkan_encode_h264_close(AVCodecContext *avctx)
  1349. {
  1350. VulkanEncodeH264Context *enc = avctx->priv_data;
  1351. ff_vulkan_encode_uninit(&enc->common);
  1352. return 0;
  1353. }
  1354. #define OFFSET(x) offsetof(VulkanEncodeH264Context, x)
  1355. #define FLAGS (AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM)
  1356. static const AVOption vulkan_encode_h264_options[] = {
  1357. HW_BASE_ENCODE_COMMON_OPTIONS,
  1358. VULKAN_ENCODE_COMMON_OPTIONS,
  1359. { "profile", "Set profile (profile_idc and constraint_set*_flag)",
  1360. OFFSET(common.opts.profile), AV_OPT_TYPE_INT,
  1361. { .i64 = AV_PROFILE_UNKNOWN }, AV_PROFILE_UNKNOWN, 0xffff, FLAGS, .unit = "profile" },
  1362. #define PROFILE(name, value) name, NULL, 0, AV_OPT_TYPE_CONST, \
  1363. { .i64 = value }, 0, 0, FLAGS, .unit = "profile"
  1364. { PROFILE("constrained_baseline", AV_PROFILE_H264_CONSTRAINED_BASELINE) },
  1365. { PROFILE("main", AV_PROFILE_H264_MAIN) },
  1366. { PROFILE("high", AV_PROFILE_H264_HIGH) },
  1367. { PROFILE("high444p", AV_PROFILE_H264_HIGH_10) },
  1368. #undef PROFILE
  1369. { "level", "Set level (level_idc)",
  1370. OFFSET(common.opts.level), AV_OPT_TYPE_INT,
  1371. { .i64 = AV_LEVEL_UNKNOWN }, AV_LEVEL_UNKNOWN, 0xff, FLAGS, .unit = "level" },
  1372. #define LEVEL(name, value) name, NULL, 0, AV_OPT_TYPE_CONST, \
  1373. { .i64 = value }, 0, 0, FLAGS, .unit = "level"
  1374. { LEVEL("1", 10) },
  1375. { LEVEL("1.1", 11) },
  1376. { LEVEL("1.2", 12) },
  1377. { LEVEL("1.3", 13) },
  1378. { LEVEL("2", 20) },
  1379. { LEVEL("2.1", 21) },
  1380. { LEVEL("2.2", 22) },
  1381. { LEVEL("3", 30) },
  1382. { LEVEL("3.1", 31) },
  1383. { LEVEL("3.2", 32) },
  1384. { LEVEL("4", 40) },
  1385. { LEVEL("4.1", 41) },
  1386. { LEVEL("4.2", 42) },
  1387. { LEVEL("5", 50) },
  1388. { LEVEL("5.1", 51) },
  1389. { LEVEL("5.2", 52) },
  1390. { LEVEL("6", 60) },
  1391. { LEVEL("6.1", 61) },
  1392. { LEVEL("6.2", 62) },
  1393. #undef LEVEL
  1394. { "coder", "Entropy coder type", OFFSET(unit_opts.cabac), AV_OPT_TYPE_INT, { .i64 = 1 }, 0, 1, FLAGS, "coder" },
  1395. { "cabac", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 1 }, INT_MIN, INT_MAX, FLAGS, "coder" },
  1396. { "vlc", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 0 }, INT_MIN, INT_MAX, FLAGS, "coder" },
  1397. { "units", "Set units to include", OFFSET(unit_elems), AV_OPT_TYPE_FLAGS, { .i64 = UNIT_AUD | UNIT_SEI_IDENTIFIER | UNIT_SEI_RECOVERY | UNIT_SEI_TIMING | UNIT_SEI_A53_CC }, 0, INT_MAX, FLAGS, "units" },
  1398. { "aud", "Include AUD units", 0, AV_OPT_TYPE_CONST, { .i64 = UNIT_AUD }, INT_MIN, INT_MAX, FLAGS, "units" },
  1399. { "identifier", "Include encoder version identifier", 0, AV_OPT_TYPE_CONST, { .i64 = UNIT_SEI_IDENTIFIER }, INT_MIN, INT_MAX, FLAGS, "units" },
  1400. { "timing", "Include timing parameters (buffering_period and pic_timing)", 0, AV_OPT_TYPE_CONST, { .i64 = UNIT_SEI_TIMING }, INT_MIN, INT_MAX, FLAGS, "units" },
  1401. { "recovery", "Include recovery points where appropriate", 0, AV_OPT_TYPE_CONST, { .i64 = UNIT_SEI_RECOVERY }, INT_MIN, INT_MAX, FLAGS, "units" },
  1402. { "a53_cc", "Include A/53 caption data", 0, AV_OPT_TYPE_CONST, { .i64 = UNIT_SEI_A53_CC }, INT_MIN, INT_MAX, FLAGS, "units" },
  1403. { NULL },
  1404. };
  1405. static const FFCodecDefault vulkan_encode_h264_defaults[] = {
  1406. { "b", "0" },
  1407. { "bf", "2" },
  1408. { "g", "300" },
  1409. { "i_qfactor", "1" },
  1410. { "i_qoffset", "0" },
  1411. { "b_qfactor", "1" },
  1412. { "b_qoffset", "0" },
  1413. { "qmin", "-1" },
  1414. { "qmax", "-1" },
  1415. { NULL },
  1416. };
  1417. static const AVClass vulkan_encode_h264_class = {
  1418. .class_name = "h264_vulkan",
  1419. .item_name = av_default_item_name,
  1420. .option = vulkan_encode_h264_options,
  1421. .version = LIBAVUTIL_VERSION_INT,
  1422. };
  1423. const FFCodec ff_h264_vulkan_encoder = {
  1424. .p.name = "h264_vulkan",
  1425. CODEC_LONG_NAME("H.264/AVC (Vulkan)"),
  1426. .p.type = AVMEDIA_TYPE_VIDEO,
  1427. .p.id = AV_CODEC_ID_H264,
  1428. .priv_data_size = sizeof(VulkanEncodeH264Context),
  1429. .init = &vulkan_encode_h264_init,
  1430. FF_CODEC_RECEIVE_PACKET_CB(&ff_vulkan_encode_receive_packet),
  1431. .close = &vulkan_encode_h264_close,
  1432. .p.priv_class = &vulkan_encode_h264_class,
  1433. .p.capabilities = AV_CODEC_CAP_DELAY |
  1434. AV_CODEC_CAP_HARDWARE |
  1435. AV_CODEC_CAP_DR1 |
  1436. AV_CODEC_CAP_ENCODER_FLUSH |
  1437. AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE,
  1438. .caps_internal = FF_CODEC_CAP_INIT_CLEANUP,
  1439. .defaults = vulkan_encode_h264_defaults,
  1440. .p.pix_fmts = (const enum AVPixelFormat[]) {
  1441. AV_PIX_FMT_VULKAN,
  1442. AV_PIX_FMT_NONE,
  1443. },
  1444. .hw_configs = ff_vulkan_encode_hw_configs,
  1445. .p.wrapper_name = "vulkan",
  1446. };