1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990 |
- /*
- * Copyright (c) Lynne
- *
- * This file is part of FFmpeg.
- *
- * FFmpeg is free software; you can redistribute it and/or
- * modify it under the terms of the GNU Lesser General Public
- * License as published by the Free Software Foundation; either
- * version 2.1 of the License, or (at your option) any later version.
- *
- * FFmpeg is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- * Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public
- * License along with FFmpeg; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
- */
- #include "avassert.h"
- #include "mem.h"
- #include "vulkan.h"
- #include "libavutil/vulkan_loader.h"
- const VkComponentMapping ff_comp_identity_map = {
- .r = VK_COMPONENT_SWIZZLE_IDENTITY,
- .g = VK_COMPONENT_SWIZZLE_IDENTITY,
- .b = VK_COMPONENT_SWIZZLE_IDENTITY,
- .a = VK_COMPONENT_SWIZZLE_IDENTITY,
- };
- /* Converts return values to strings */
- const char *ff_vk_ret2str(VkResult res)
- {
- #define CASE(VAL) case VAL: return #VAL
- switch (res) {
- CASE(VK_SUCCESS);
- CASE(VK_NOT_READY);
- CASE(VK_TIMEOUT);
- CASE(VK_EVENT_SET);
- CASE(VK_EVENT_RESET);
- CASE(VK_INCOMPLETE);
- CASE(VK_ERROR_OUT_OF_HOST_MEMORY);
- CASE(VK_ERROR_OUT_OF_DEVICE_MEMORY);
- CASE(VK_ERROR_INITIALIZATION_FAILED);
- CASE(VK_ERROR_DEVICE_LOST);
- CASE(VK_ERROR_MEMORY_MAP_FAILED);
- CASE(VK_ERROR_LAYER_NOT_PRESENT);
- CASE(VK_ERROR_EXTENSION_NOT_PRESENT);
- CASE(VK_ERROR_FEATURE_NOT_PRESENT);
- CASE(VK_ERROR_INCOMPATIBLE_DRIVER);
- CASE(VK_ERROR_TOO_MANY_OBJECTS);
- CASE(VK_ERROR_FORMAT_NOT_SUPPORTED);
- CASE(VK_ERROR_FRAGMENTED_POOL);
- CASE(VK_ERROR_UNKNOWN);
- CASE(VK_ERROR_OUT_OF_POOL_MEMORY);
- CASE(VK_ERROR_INVALID_EXTERNAL_HANDLE);
- CASE(VK_ERROR_FRAGMENTATION);
- CASE(VK_ERROR_INVALID_OPAQUE_CAPTURE_ADDRESS);
- CASE(VK_PIPELINE_COMPILE_REQUIRED);
- CASE(VK_ERROR_SURFACE_LOST_KHR);
- CASE(VK_ERROR_NATIVE_WINDOW_IN_USE_KHR);
- CASE(VK_SUBOPTIMAL_KHR);
- CASE(VK_ERROR_OUT_OF_DATE_KHR);
- CASE(VK_ERROR_INCOMPATIBLE_DISPLAY_KHR);
- CASE(VK_ERROR_VALIDATION_FAILED_EXT);
- CASE(VK_ERROR_INVALID_SHADER_NV);
- CASE(VK_ERROR_VIDEO_PICTURE_LAYOUT_NOT_SUPPORTED_KHR);
- CASE(VK_ERROR_VIDEO_PROFILE_OPERATION_NOT_SUPPORTED_KHR);
- CASE(VK_ERROR_VIDEO_PROFILE_FORMAT_NOT_SUPPORTED_KHR);
- CASE(VK_ERROR_VIDEO_PROFILE_CODEC_NOT_SUPPORTED_KHR);
- CASE(VK_ERROR_VIDEO_STD_VERSION_NOT_SUPPORTED_KHR);
- CASE(VK_ERROR_INVALID_DRM_FORMAT_MODIFIER_PLANE_LAYOUT_EXT);
- CASE(VK_ERROR_NOT_PERMITTED_KHR);
- CASE(VK_ERROR_FULL_SCREEN_EXCLUSIVE_MODE_LOST_EXT);
- CASE(VK_THREAD_IDLE_KHR);
- CASE(VK_THREAD_DONE_KHR);
- CASE(VK_OPERATION_DEFERRED_KHR);
- CASE(VK_OPERATION_NOT_DEFERRED_KHR);
- default: return "Unknown error";
- }
- #undef CASE
- }
- static void load_enabled_qfs(FFVulkanContext *s)
- {
- s->nb_qfs = 0;
- for (int i = 0; i < s->hwctx->nb_qf; i++) {
- /* Skip duplicates */
- int skip = 0;
- for (int j = 0; j < s->nb_qfs; j++) {
- if (s->qfs[j] == s->hwctx->qf[i].idx) {
- skip = 1;
- break;
- }
- }
- if (skip)
- continue;
- s->qfs[s->nb_qfs++] = s->hwctx->qf[i].idx;
- }
- }
- int ff_vk_load_props(FFVulkanContext *s)
- {
- FFVulkanFunctions *vk = &s->vkfn;
- s->hprops = (VkPhysicalDeviceExternalMemoryHostPropertiesEXT) {
- .sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_EXTERNAL_MEMORY_HOST_PROPERTIES_EXT,
- };
- s->optical_flow_props = (VkPhysicalDeviceOpticalFlowPropertiesNV) {
- .sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_OPTICAL_FLOW_PROPERTIES_NV,
- .pNext = &s->hprops,
- };
- s->coop_matrix_props = (VkPhysicalDeviceCooperativeMatrixPropertiesKHR) {
- .sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_COOPERATIVE_MATRIX_PROPERTIES_KHR,
- .pNext = &s->optical_flow_props,
- };
- s->subgroup_props = (VkPhysicalDeviceSubgroupSizeControlProperties) {
- .sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_SUBGROUP_SIZE_CONTROL_PROPERTIES,
- .pNext = &s->coop_matrix_props,
- };
- s->desc_buf_props = (VkPhysicalDeviceDescriptorBufferPropertiesEXT) {
- .sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_DESCRIPTOR_BUFFER_PROPERTIES_EXT,
- .pNext = &s->subgroup_props,
- };
- s->driver_props = (VkPhysicalDeviceDriverProperties) {
- .sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_DRIVER_PROPERTIES,
- .pNext = &s->desc_buf_props,
- };
- s->props = (VkPhysicalDeviceProperties2) {
- .sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_PROPERTIES_2,
- .pNext = &s->driver_props,
- };
- s->atomic_float_feats = (VkPhysicalDeviceShaderAtomicFloatFeaturesEXT) {
- .sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_SHADER_ATOMIC_FLOAT_FEATURES_EXT,
- };
- s->feats_12 = (VkPhysicalDeviceVulkan12Features) {
- .sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VULKAN_1_2_FEATURES,
- .pNext = &s->atomic_float_feats,
- };
- s->feats = (VkPhysicalDeviceFeatures2) {
- .sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_FEATURES_2,
- .pNext = &s->feats_12,
- };
- vk->GetPhysicalDeviceProperties2(s->hwctx->phys_dev, &s->props);
- vk->GetPhysicalDeviceMemoryProperties(s->hwctx->phys_dev, &s->mprops);
- vk->GetPhysicalDeviceFeatures2(s->hwctx->phys_dev, &s->feats);
- load_enabled_qfs(s);
- if (s->qf_props)
- return 0;
- vk->GetPhysicalDeviceQueueFamilyProperties2(s->hwctx->phys_dev, &s->tot_nb_qfs, NULL);
- s->qf_props = av_calloc(s->tot_nb_qfs, sizeof(*s->qf_props));
- if (!s->qf_props)
- return AVERROR(ENOMEM);
- s->query_props = av_calloc(s->tot_nb_qfs, sizeof(*s->query_props));
- if (!s->qf_props) {
- av_freep(&s->qf_props);
- return AVERROR(ENOMEM);
- }
- s->video_props = av_calloc(s->tot_nb_qfs, sizeof(*s->video_props));
- if (!s->video_props) {
- av_freep(&s->qf_props);
- av_freep(&s->query_props);
- return AVERROR(ENOMEM);
- }
- for (uint32_t i = 0; i < s->tot_nb_qfs; i++) {
- s->query_props[i] = (VkQueueFamilyQueryResultStatusPropertiesKHR) {
- .sType = VK_STRUCTURE_TYPE_QUEUE_FAMILY_QUERY_RESULT_STATUS_PROPERTIES_KHR,
- };
- s->video_props[i] = (VkQueueFamilyVideoPropertiesKHR) {
- .sType = VK_STRUCTURE_TYPE_QUEUE_FAMILY_VIDEO_PROPERTIES_KHR,
- .pNext = &s->query_props[i],
- };
- s->qf_props[i] = (VkQueueFamilyProperties2) {
- .sType = VK_STRUCTURE_TYPE_QUEUE_FAMILY_PROPERTIES_2,
- .pNext = &s->video_props[i],
- };
- }
- vk->GetPhysicalDeviceQueueFamilyProperties2(s->hwctx->phys_dev, &s->tot_nb_qfs, s->qf_props);
- if (s->extensions & FF_VK_EXT_COOP_MATRIX) {
- vk->GetPhysicalDeviceCooperativeMatrixPropertiesKHR(s->hwctx->phys_dev,
- &s->coop_mat_props_nb, NULL);
- if (s->coop_mat_props_nb) {
- s->coop_mat_props = av_malloc_array(s->coop_mat_props_nb,
- sizeof(VkCooperativeMatrixPropertiesKHR));
- for (int i = 0; i < s->coop_mat_props_nb; i++) {
- s->coop_mat_props[i] = (VkCooperativeMatrixPropertiesKHR) {
- .sType = VK_STRUCTURE_TYPE_COOPERATIVE_MATRIX_PROPERTIES_KHR,
- };
- }
- vk->GetPhysicalDeviceCooperativeMatrixPropertiesKHR(s->hwctx->phys_dev,
- &s->coop_mat_props_nb,
- s->coop_mat_props);
- }
- }
- return 0;
- }
- static int vk_qf_get_index(FFVulkanContext *s, VkQueueFlagBits dev_family, int *nb)
- {
- for (int i = 0; i < s->hwctx->nb_qf; i++) {
- if (s->hwctx->qf[i].flags & dev_family) {
- *nb = s->hwctx->qf[i].num;
- return s->hwctx->qf[i].idx;
- }
- }
- av_assert0(0); /* Should never happen */
- }
- int ff_vk_qf_init(FFVulkanContext *s, FFVkQueueFamilyCtx *qf,
- VkQueueFlagBits dev_family)
- {
- /* Fill in queue families from context if not done yet */
- if (!s->nb_qfs)
- load_enabled_qfs(s);
- return (qf->queue_family = vk_qf_get_index(s, dev_family, &qf->nb_queues));
- }
- void ff_vk_exec_pool_free(FFVulkanContext *s, FFVkExecPool *pool)
- {
- FFVulkanFunctions *vk = &s->vkfn;
- for (int i = 0; i < pool->pool_size; i++) {
- FFVkExecContext *e = &pool->contexts[i];
- if (e->fence) {
- vk->WaitForFences(s->hwctx->act_dev, 1, &e->fence, VK_TRUE, UINT64_MAX);
- vk->DestroyFence(s->hwctx->act_dev, e->fence, s->hwctx->alloc);
- }
- pthread_mutex_destroy(&e->lock);
- ff_vk_exec_discard_deps(s, e);
- av_free(e->frame_deps);
- av_free(e->buf_deps);
- av_free(e->queue_family_dst);
- av_free(e->layout_dst);
- av_free(e->access_dst);
- av_free(e->frame_update);
- av_free(e->frame_locked);
- av_free(e->sem_sig);
- av_free(e->sem_sig_val_dst);
- av_free(e->sem_wait);
- }
- if (pool->cmd_bufs)
- vk->FreeCommandBuffers(s->hwctx->act_dev, pool->cmd_buf_pool,
- pool->pool_size, pool->cmd_bufs);
- if (pool->cmd_buf_pool)
- vk->DestroyCommandPool(s->hwctx->act_dev, pool->cmd_buf_pool, s->hwctx->alloc);
- if (pool->query_pool)
- vk->DestroyQueryPool(s->hwctx->act_dev, pool->query_pool, s->hwctx->alloc);
- av_free(pool->query_data);
- av_free(pool->cmd_bufs);
- av_free(pool->contexts);
- }
- int ff_vk_exec_pool_init(FFVulkanContext *s, FFVkQueueFamilyCtx *qf,
- FFVkExecPool *pool, int nb_contexts,
- int nb_queries, VkQueryType query_type, int query_64bit,
- const void *query_create_pnext)
- {
- int err;
- VkResult ret;
- FFVulkanFunctions *vk = &s->vkfn;
- VkCommandPoolCreateInfo cqueue_create;
- VkCommandBufferAllocateInfo cbuf_create;
- const VkQueryPoolVideoEncodeFeedbackCreateInfoKHR *ef = NULL;
- if (query_type == VK_QUERY_TYPE_VIDEO_ENCODE_FEEDBACK_KHR) {
- ef = ff_vk_find_struct(query_create_pnext,
- VK_STRUCTURE_TYPE_QUERY_POOL_VIDEO_ENCODE_FEEDBACK_CREATE_INFO_KHR);
- if (!ef)
- return AVERROR(EINVAL);
- }
- /* Create command pool */
- cqueue_create = (VkCommandPoolCreateInfo) {
- .sType = VK_STRUCTURE_TYPE_COMMAND_POOL_CREATE_INFO,
- .flags = VK_COMMAND_POOL_CREATE_TRANSIENT_BIT |
- VK_COMMAND_POOL_CREATE_RESET_COMMAND_BUFFER_BIT,
- .queueFamilyIndex = qf->queue_family,
- };
- ret = vk->CreateCommandPool(s->hwctx->act_dev, &cqueue_create,
- s->hwctx->alloc, &pool->cmd_buf_pool);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Command pool creation failure: %s\n",
- ff_vk_ret2str(ret));
- err = AVERROR_EXTERNAL;
- goto fail;
- }
- /* Allocate space for command buffers */
- pool->cmd_bufs = av_malloc(nb_contexts*sizeof(*pool->cmd_bufs));
- if (!pool->cmd_bufs) {
- err = AVERROR(ENOMEM);
- goto fail;
- }
- /* Allocate command buffer */
- cbuf_create = (VkCommandBufferAllocateInfo) {
- .sType = VK_STRUCTURE_TYPE_COMMAND_BUFFER_ALLOCATE_INFO,
- .level = VK_COMMAND_BUFFER_LEVEL_PRIMARY,
- .commandPool = pool->cmd_buf_pool,
- .commandBufferCount = nb_contexts,
- };
- ret = vk->AllocateCommandBuffers(s->hwctx->act_dev, &cbuf_create,
- pool->cmd_bufs);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Command buffer alloc failure: %s\n",
- ff_vk_ret2str(ret));
- err = AVERROR_EXTERNAL;
- goto fail;
- }
- /* Query pool */
- if (nb_queries) {
- VkQueryPoolCreateInfo query_pool_info = {
- .sType = VK_STRUCTURE_TYPE_QUERY_POOL_CREATE_INFO,
- .pNext = query_create_pnext,
- .queryType = query_type,
- .queryCount = nb_queries*nb_contexts,
- };
- ret = vk->CreateQueryPool(s->hwctx->act_dev, &query_pool_info,
- s->hwctx->alloc, &pool->query_pool);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Query pool alloc failure: %s\n",
- ff_vk_ret2str(ret));
- err = AVERROR_EXTERNAL;
- goto fail;
- }
- pool->nb_queries = nb_queries;
- pool->query_status_stride = 1 + 1; /* One result, one status by default */
- pool->query_results = nb_queries;
- pool->query_statuses = nb_queries;
- /* Video encode quieries produce two results per query */
- if (query_type == VK_QUERY_TYPE_VIDEO_ENCODE_FEEDBACK_KHR) {
- int nb_results = av_popcount(ef->encodeFeedbackFlags);
- pool->query_status_stride = nb_results + 1;
- pool->query_results *= nb_results;
- } else if (query_type == VK_QUERY_TYPE_RESULT_STATUS_ONLY_KHR) {
- pool->query_status_stride = 1;
- pool->query_results = 0;
- }
- pool->qd_size = (pool->query_results + pool->query_statuses)*(query_64bit ? 8 : 4);
- /* Allocate space for the query data */
- pool->query_data = av_calloc(nb_contexts, pool->qd_size);
- if (!pool->query_data) {
- err = AVERROR(ENOMEM);
- goto fail;
- }
- }
- /* Allocate space for the contexts */
- pool->contexts = av_calloc(nb_contexts, sizeof(*pool->contexts));
- if (!pool->contexts) {
- err = AVERROR(ENOMEM);
- goto fail;
- }
- pool->pool_size = nb_contexts;
- /* Init contexts */
- for (int i = 0; i < pool->pool_size; i++) {
- FFVkExecContext *e = &pool->contexts[i];
- VkFenceCreateInfo fence_create = {
- .sType = VK_STRUCTURE_TYPE_FENCE_CREATE_INFO,
- .flags = VK_FENCE_CREATE_SIGNALED_BIT,
- };
- /* Mutex */
- err = pthread_mutex_init(&e->lock, NULL);
- if (err != 0)
- return AVERROR(err);
- /* Fence */
- ret = vk->CreateFence(s->hwctx->act_dev, &fence_create, s->hwctx->alloc,
- &e->fence);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Failed to create submission fence: %s\n",
- ff_vk_ret2str(ret));
- return AVERROR_EXTERNAL;
- }
- e->idx = i;
- e->parent = pool;
- /* Query data */
- e->query_data = ((uint8_t *)pool->query_data) + pool->qd_size*i;
- e->query_idx = nb_queries*i;
- /* Command buffer */
- e->buf = pool->cmd_bufs[i];
- /* Queue index distribution */
- e->qi = i % qf->nb_queues;
- e->qf = qf->queue_family;
- vk->GetDeviceQueue(s->hwctx->act_dev, qf->queue_family,
- e->qi, &e->queue);
- }
- return 0;
- fail:
- ff_vk_exec_pool_free(s, pool);
- return err;
- }
- VkResult ff_vk_exec_get_query(FFVulkanContext *s, FFVkExecContext *e,
- void **data, VkQueryResultFlagBits flags)
- {
- FFVulkanFunctions *vk = &s->vkfn;
- const FFVkExecPool *pool = e->parent;
- VkQueryResultFlags qf = flags & ~(VK_QUERY_RESULT_64_BIT |
- VK_QUERY_RESULT_WITH_STATUS_BIT_KHR);
- if (!e->query_data) {
- av_log(s, AV_LOG_ERROR, "Requested a query with a NULL query_data pointer!\n");
- return VK_INCOMPLETE;
- }
- qf |= pool->query_64bit ?
- VK_QUERY_RESULT_64_BIT : 0x0;
- qf |= pool->query_statuses ?
- VK_QUERY_RESULT_WITH_STATUS_BIT_KHR : 0x0;
- if (data)
- *data = e->query_data;
- return vk->GetQueryPoolResults(s->hwctx->act_dev, pool->query_pool,
- e->query_idx,
- pool->nb_queries,
- pool->qd_size, e->query_data,
- pool->qd_size, qf);
- }
- FFVkExecContext *ff_vk_exec_get(FFVkExecPool *pool)
- {
- uint32_t idx = pool->idx++;
- idx %= pool->pool_size;
- return &pool->contexts[idx];
- }
- void ff_vk_exec_wait(FFVulkanContext *s, FFVkExecContext *e)
- {
- FFVulkanFunctions *vk = &s->vkfn;
- pthread_mutex_lock(&e->lock);
- vk->WaitForFences(s->hwctx->act_dev, 1, &e->fence, VK_TRUE, UINT64_MAX);
- ff_vk_exec_discard_deps(s, e);
- pthread_mutex_unlock(&e->lock);
- }
- int ff_vk_exec_start(FFVulkanContext *s, FFVkExecContext *e)
- {
- VkResult ret;
- FFVulkanFunctions *vk = &s->vkfn;
- const FFVkExecPool *pool = e->parent;
- VkCommandBufferBeginInfo cmd_start = {
- .sType = VK_STRUCTURE_TYPE_COMMAND_BUFFER_BEGIN_INFO,
- .flags = VK_COMMAND_BUFFER_USAGE_ONE_TIME_SUBMIT_BIT,
- };
- /* Wait for the fence to be signalled */
- vk->WaitForFences(s->hwctx->act_dev, 1, &e->fence, VK_TRUE, UINT64_MAX);
- /* vkResetFences is defined as being host-synchronized */
- pthread_mutex_lock(&e->lock);
- vk->ResetFences(s->hwctx->act_dev, 1, &e->fence);
- pthread_mutex_unlock(&e->lock);
- /* Discard queue dependencies */
- ff_vk_exec_discard_deps(s, e);
- ret = vk->BeginCommandBuffer(e->buf, &cmd_start);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Failed to start command recoding: %s\n",
- ff_vk_ret2str(ret));
- return AVERROR_EXTERNAL;
- }
- if (pool->nb_queries)
- vk->CmdResetQueryPool(e->buf, pool->query_pool,
- e->query_idx, pool->nb_queries);
- return 0;
- }
- void ff_vk_exec_discard_deps(FFVulkanContext *s, FFVkExecContext *e)
- {
- for (int j = 0; j < e->nb_buf_deps; j++)
- av_buffer_unref(&e->buf_deps[j]);
- e->nb_buf_deps = 0;
- for (int j = 0; j < e->nb_frame_deps; j++) {
- AVFrame *f = e->frame_deps[j];
- if (e->frame_locked[j]) {
- AVHWFramesContext *hwfc = (AVHWFramesContext *)f->hw_frames_ctx->data;
- AVVulkanFramesContext *vkfc = hwfc->hwctx;
- AVVkFrame *vkf = (AVVkFrame *)f->data[0];
- vkfc->unlock_frame(hwfc, vkf);
- e->frame_locked[j] = 0;
- }
- e->frame_update[j] = 0;
- if (f->buf[0])
- av_frame_free(&e->frame_deps[j]);
- }
- e->nb_frame_deps = 0;
- e->sem_wait_cnt = 0;
- e->sem_sig_cnt = 0;
- e->sem_sig_val_dst_cnt = 0;
- }
- int ff_vk_exec_add_dep_buf(FFVulkanContext *s, FFVkExecContext *e,
- AVBufferRef **deps, int nb_deps, int ref)
- {
- AVBufferRef **dst = av_fast_realloc(e->buf_deps, &e->buf_deps_alloc_size,
- (e->nb_buf_deps + nb_deps) * sizeof(*dst));
- if (!dst) {
- ff_vk_exec_discard_deps(s, e);
- return AVERROR(ENOMEM);
- }
- e->buf_deps = dst;
- for (int i = 0; i < nb_deps; i++) {
- e->buf_deps[e->nb_buf_deps] = ref ? av_buffer_ref(deps[i]) : deps[i];
- if (!e->buf_deps[e->nb_buf_deps]) {
- ff_vk_exec_discard_deps(s, e);
- return AVERROR(ENOMEM);
- }
- e->nb_buf_deps++;
- }
- return 0;
- }
- #define ARR_REALLOC(str, arr, alloc_s, cnt) \
- do { \
- arr = av_fast_realloc(str->arr, alloc_s, (cnt + 1)*sizeof(*arr)); \
- if (!arr) { \
- ff_vk_exec_discard_deps(s, e); \
- return AVERROR(ENOMEM); \
- } \
- str->arr = arr; \
- } while (0)
- typedef struct TempSyncCtx {
- int nb_sem;
- VkSemaphore sem[];
- } TempSyncCtx;
- static void destroy_tmp_semaphores(void *opaque, uint8_t *data)
- {
- FFVulkanContext *s = opaque;
- FFVulkanFunctions *vk = &s->vkfn;
- TempSyncCtx *ts = (TempSyncCtx *)data;
- for (int i = 0; i < ts->nb_sem; i++)
- vk->DestroySemaphore(s->hwctx->act_dev, ts->sem[i], s->hwctx->alloc);
- av_free(ts);
- }
- int ff_vk_exec_add_dep_bool_sem(FFVulkanContext *s, FFVkExecContext *e,
- VkSemaphore *sem, int nb,
- VkPipelineStageFlagBits2 stage,
- int wait)
- {
- int err;
- size_t buf_size;
- AVBufferRef *buf;
- TempSyncCtx *ts;
- FFVulkanFunctions *vk = &s->vkfn;
- /* Do not transfer ownership if we're signalling a binary semaphore,
- * since we're probably exporting it. */
- if (!wait) {
- for (int i = 0; i < nb; i++) {
- VkSemaphoreSubmitInfo *sem_sig;
- ARR_REALLOC(e, sem_sig, &e->sem_sig_alloc, e->sem_sig_cnt);
- e->sem_sig[e->sem_sig_cnt++] = (VkSemaphoreSubmitInfo) {
- .sType = VK_STRUCTURE_TYPE_SEMAPHORE_SUBMIT_INFO,
- .semaphore = sem[i],
- .stageMask = stage,
- };
- }
- return 0;
- }
- buf_size = sizeof(int) + sizeof(VkSemaphore)*nb;
- ts = av_mallocz(buf_size);
- if (!ts) {
- err = AVERROR(ENOMEM);
- goto fail;
- }
- memcpy(ts->sem, sem, nb*sizeof(*sem));
- ts->nb_sem = nb;
- buf = av_buffer_create((uint8_t *)ts, buf_size, destroy_tmp_semaphores, s, 0);
- if (!buf) {
- av_free(ts);
- err = AVERROR(ENOMEM);
- goto fail;
- }
- err = ff_vk_exec_add_dep_buf(s, e, &buf, 1, 0);
- if (err < 0) {
- av_buffer_unref(&buf);
- return err;
- }
- for (int i = 0; i < nb; i++) {
- VkSemaphoreSubmitInfo *sem_wait;
- ARR_REALLOC(e, sem_wait, &e->sem_wait_alloc, e->sem_wait_cnt);
- e->sem_wait[e->sem_wait_cnt++] = (VkSemaphoreSubmitInfo) {
- .sType = VK_STRUCTURE_TYPE_SEMAPHORE_SUBMIT_INFO,
- .semaphore = sem[i],
- .stageMask = stage,
- };
- }
- return 0;
- fail:
- for (int i = 0; i < nb; i++)
- vk->DestroySemaphore(s->hwctx->act_dev, sem[i], s->hwctx->alloc);
- return err;
- }
- int ff_vk_exec_add_dep_frame(FFVulkanContext *s, FFVkExecContext *e, AVFrame *f,
- VkPipelineStageFlagBits2 wait_stage,
- VkPipelineStageFlagBits2 signal_stage)
- {
- uint8_t *frame_locked;
- uint8_t *frame_update;
- AVFrame **frame_deps;
- VkImageLayout *layout_dst;
- uint32_t *queue_family_dst;
- VkAccessFlagBits *access_dst;
- AVHWFramesContext *hwfc = (AVHWFramesContext *)f->hw_frames_ctx->data;
- AVVulkanFramesContext *vkfc = hwfc->hwctx;
- AVVkFrame *vkf = (AVVkFrame *)f->data[0];
- int nb_images = ff_vk_count_images(vkf);
- /* Don't add duplicates */
- for (int i = 0; i < e->nb_frame_deps; i++)
- if (e->frame_deps[i]->data[0] == f->data[0])
- return 1;
- ARR_REALLOC(e, layout_dst, &e->layout_dst_alloc, e->nb_frame_deps);
- ARR_REALLOC(e, queue_family_dst, &e->queue_family_dst_alloc, e->nb_frame_deps);
- ARR_REALLOC(e, access_dst, &e->access_dst_alloc, e->nb_frame_deps);
- ARR_REALLOC(e, frame_locked, &e->frame_locked_alloc_size, e->nb_frame_deps);
- ARR_REALLOC(e, frame_update, &e->frame_update_alloc_size, e->nb_frame_deps);
- ARR_REALLOC(e, frame_deps, &e->frame_deps_alloc_size, e->nb_frame_deps);
- e->frame_deps[e->nb_frame_deps] = f->buf[0] ? av_frame_clone(f) : f;
- if (!e->frame_deps[e->nb_frame_deps]) {
- ff_vk_exec_discard_deps(s, e);
- return AVERROR(ENOMEM);
- }
- vkfc->lock_frame(hwfc, vkf);
- e->frame_locked[e->nb_frame_deps] = 1;
- e->frame_update[e->nb_frame_deps] = 0;
- e->nb_frame_deps++;
- for (int i = 0; i < nb_images; i++) {
- VkSemaphoreSubmitInfo *sem_wait;
- VkSemaphoreSubmitInfo *sem_sig;
- uint64_t **sem_sig_val_dst;
- ARR_REALLOC(e, sem_wait, &e->sem_wait_alloc, e->sem_wait_cnt);
- ARR_REALLOC(e, sem_sig, &e->sem_sig_alloc, e->sem_sig_cnt);
- ARR_REALLOC(e, sem_sig_val_dst, &e->sem_sig_val_dst_alloc, e->sem_sig_val_dst_cnt);
- e->sem_wait[e->sem_wait_cnt++] = (VkSemaphoreSubmitInfo) {
- .sType = VK_STRUCTURE_TYPE_SEMAPHORE_SUBMIT_INFO,
- .semaphore = vkf->sem[i],
- .value = vkf->sem_value[i],
- .stageMask = wait_stage,
- };
- e->sem_sig[e->sem_sig_cnt++] = (VkSemaphoreSubmitInfo) {
- .sType = VK_STRUCTURE_TYPE_SEMAPHORE_SUBMIT_INFO,
- .semaphore = vkf->sem[i],
- .value = vkf->sem_value[i] + 1,
- .stageMask = signal_stage,
- };
- e->sem_sig_val_dst[e->sem_sig_val_dst_cnt] = &vkf->sem_value[i];
- e->sem_sig_val_dst_cnt++;
- }
- return 0;
- }
- void ff_vk_exec_update_frame(FFVulkanContext *s, FFVkExecContext *e, AVFrame *f,
- VkImageMemoryBarrier2 *bar, uint32_t *nb_img_bar)
- {
- int i;
- for (i = 0; i < e->nb_frame_deps; i++)
- if (e->frame_deps[i]->data[0] == f->data[0])
- break;
- av_assert0(i < e->nb_frame_deps);
- /* Don't update duplicates */
- if (nb_img_bar && !e->frame_update[i])
- (*nb_img_bar)++;
- e->queue_family_dst[i] = bar->dstQueueFamilyIndex;
- e->access_dst[i] = bar->dstAccessMask;
- e->layout_dst[i] = bar->newLayout;
- e->frame_update[i] = 1;
- }
- int ff_vk_exec_mirror_sem_value(FFVulkanContext *s, FFVkExecContext *e,
- VkSemaphore *dst, uint64_t *dst_val,
- AVFrame *f)
- {
- uint64_t **sem_sig_val_dst;
- AVVkFrame *vkf = (AVVkFrame *)f->data[0];
- /* Reject unknown frames */
- int i;
- for (i = 0; i < e->nb_frame_deps; i++)
- if (e->frame_deps[i]->data[0] == f->data[0])
- break;
- if (i == e->nb_frame_deps)
- return AVERROR(EINVAL);
- ARR_REALLOC(e, sem_sig_val_dst, &e->sem_sig_val_dst_alloc, e->sem_sig_val_dst_cnt);
- *dst = vkf->sem[0];
- *dst_val = vkf->sem_value[0];
- e->sem_sig_val_dst[e->sem_sig_val_dst_cnt] = dst_val;
- e->sem_sig_val_dst_cnt++;
- return 0;
- }
- int ff_vk_exec_submit(FFVulkanContext *s, FFVkExecContext *e)
- {
- VkResult ret;
- FFVulkanFunctions *vk = &s->vkfn;
- VkCommandBufferSubmitInfo cmd_buf_info = (VkCommandBufferSubmitInfo) {
- .sType = VK_STRUCTURE_TYPE_COMMAND_BUFFER_SUBMIT_INFO,
- .commandBuffer = e->buf,
- };
- VkSubmitInfo2 submit_info = (VkSubmitInfo2) {
- .sType = VK_STRUCTURE_TYPE_SUBMIT_INFO_2,
- .pCommandBufferInfos = &cmd_buf_info,
- .commandBufferInfoCount = 1,
- .pWaitSemaphoreInfos = e->sem_wait,
- .waitSemaphoreInfoCount = e->sem_wait_cnt,
- .pSignalSemaphoreInfos = e->sem_sig,
- .signalSemaphoreInfoCount = e->sem_sig_cnt,
- };
- ret = vk->EndCommandBuffer(e->buf);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Unable to finish command buffer: %s\n",
- ff_vk_ret2str(ret));
- ff_vk_exec_discard_deps(s, e);
- return AVERROR_EXTERNAL;
- }
- s->hwctx->lock_queue(s->device, e->qf, e->qi);
- ret = vk->QueueSubmit2(e->queue, 1, &submit_info, e->fence);
- s->hwctx->unlock_queue(s->device, e->qf, e->qi);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Unable to submit command buffer: %s\n",
- ff_vk_ret2str(ret));
- ff_vk_exec_discard_deps(s, e);
- return AVERROR_EXTERNAL;
- }
- for (int i = 0; i < e->sem_sig_val_dst_cnt; i++)
- *e->sem_sig_val_dst[i] += 1;
- /* Unlock all frames */
- for (int j = 0; j < e->nb_frame_deps; j++) {
- if (e->frame_locked[j]) {
- AVFrame *f = e->frame_deps[j];
- AVHWFramesContext *hwfc = (AVHWFramesContext *)f->hw_frames_ctx->data;
- AVVulkanFramesContext *vkfc = hwfc->hwctx;
- AVVkFrame *vkf = (AVVkFrame *)f->data[0];
- if (e->frame_update[j]) {
- int nb_images = ff_vk_count_images(vkf);
- for (int i = 0; i < nb_images; i++) {
- vkf->layout[i] = e->layout_dst[j];
- vkf->access[i] = e->access_dst[j];
- vkf->queue_family[i] = e->queue_family_dst[j];
- }
- }
- vkfc->unlock_frame(hwfc, vkf);
- e->frame_locked[j] = 0;
- }
- }
- e->had_submission = 1;
- return 0;
- }
- int ff_vk_alloc_mem(FFVulkanContext *s, VkMemoryRequirements *req,
- VkMemoryPropertyFlagBits req_flags, void *alloc_extension,
- VkMemoryPropertyFlagBits *mem_flags, VkDeviceMemory *mem)
- {
- VkResult ret;
- int index = -1;
- FFVulkanFunctions *vk = &s->vkfn;
- VkMemoryAllocateInfo alloc_info = {
- .sType = VK_STRUCTURE_TYPE_MEMORY_ALLOCATE_INFO,
- .pNext = alloc_extension,
- };
- /* Align if we need to */
- if ((req_flags != UINT32_MAX) && req_flags & VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT)
- req->size = FFALIGN(req->size, s->props.properties.limits.minMemoryMapAlignment);
- alloc_info.allocationSize = req->size;
- /* The vulkan spec requires memory types to be sorted in the "optimal"
- * order, so the first matching type we find will be the best/fastest one */
- for (int i = 0; i < s->mprops.memoryTypeCount; i++) {
- /* The memory type must be supported by the requirements (bitfield) */
- if (!(req->memoryTypeBits & (1 << i)))
- continue;
- /* The memory type flags must include our properties */
- if ((req_flags != UINT32_MAX) &&
- ((s->mprops.memoryTypes[i].propertyFlags & req_flags) != req_flags))
- continue;
- /* Found a suitable memory type */
- index = i;
- break;
- }
- if (index < 0) {
- av_log(s, AV_LOG_ERROR, "No memory type found for flags 0x%x\n",
- req_flags);
- return AVERROR(EINVAL);
- }
- alloc_info.memoryTypeIndex = index;
- ret = vk->AllocateMemory(s->hwctx->act_dev, &alloc_info,
- s->hwctx->alloc, mem);
- if (ret != VK_SUCCESS)
- return AVERROR(ENOMEM);
- if (mem_flags)
- *mem_flags |= s->mprops.memoryTypes[index].propertyFlags;
- return 0;
- }
- int ff_vk_create_buf(FFVulkanContext *s, FFVkBuffer *buf, size_t size,
- void *pNext, void *alloc_pNext,
- VkBufferUsageFlags usage, VkMemoryPropertyFlagBits flags)
- {
- int err;
- VkResult ret;
- int use_ded_mem;
- FFVulkanFunctions *vk = &s->vkfn;
- VkBufferCreateInfo buf_spawn = {
- .sType = VK_STRUCTURE_TYPE_BUFFER_CREATE_INFO,
- .pNext = pNext,
- .usage = usage,
- .sharingMode = VK_SHARING_MODE_EXCLUSIVE,
- .size = size, /* Gets FFALIGNED during alloc if host visible
- but should be ok */
- };
- VkMemoryAllocateFlagsInfo alloc_flags = {
- .sType = VK_STRUCTURE_TYPE_MEMORY_ALLOCATE_FLAGS_INFO,
- .flags = VK_MEMORY_ALLOCATE_DEVICE_ADDRESS_BIT,
- };
- VkBufferMemoryRequirementsInfo2 req_desc = {
- .sType = VK_STRUCTURE_TYPE_BUFFER_MEMORY_REQUIREMENTS_INFO_2,
- };
- VkMemoryDedicatedAllocateInfo ded_alloc = {
- .sType = VK_STRUCTURE_TYPE_MEMORY_DEDICATED_ALLOCATE_INFO,
- .pNext = alloc_pNext,
- };
- VkMemoryDedicatedRequirements ded_req = {
- .sType = VK_STRUCTURE_TYPE_MEMORY_DEDICATED_REQUIREMENTS,
- };
- VkMemoryRequirements2 req = {
- .sType = VK_STRUCTURE_TYPE_MEMORY_REQUIREMENTS_2,
- .pNext = &ded_req,
- };
- ret = vk->CreateBuffer(s->hwctx->act_dev, &buf_spawn, s->hwctx->alloc, &buf->buf);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Failed to create buffer: %s\n",
- ff_vk_ret2str(ret));
- return AVERROR_EXTERNAL;
- }
- req_desc.buffer = buf->buf;
- vk->GetBufferMemoryRequirements2(s->hwctx->act_dev, &req_desc, &req);
- /* In case the implementation prefers/requires dedicated allocation */
- use_ded_mem = ded_req.prefersDedicatedAllocation |
- ded_req.requiresDedicatedAllocation;
- if (use_ded_mem) {
- ded_alloc.buffer = buf->buf;
- ded_alloc.pNext = alloc_pNext;
- alloc_pNext = &ded_alloc;
- }
- if (usage & VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT) {
- alloc_flags.pNext = alloc_pNext;
- alloc_pNext = &alloc_flags;
- }
- err = ff_vk_alloc_mem(s, &req.memoryRequirements, flags, alloc_pNext,
- &buf->flags, &buf->mem);
- if (err)
- return err;
- ret = vk->BindBufferMemory(s->hwctx->act_dev, buf->buf, buf->mem, 0);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Failed to bind memory to buffer: %s\n",
- ff_vk_ret2str(ret));
- return AVERROR_EXTERNAL;
- }
- if (usage & VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT) {
- VkBufferDeviceAddressInfo address_info = {
- .sType = VK_STRUCTURE_TYPE_BUFFER_DEVICE_ADDRESS_INFO,
- .buffer = buf->buf,
- };
- buf->address = vk->GetBufferDeviceAddress(s->hwctx->act_dev, &address_info);
- }
- buf->size = size;
- return 0;
- }
- static void destroy_avvkbuf(void *opaque, uint8_t *data)
- {
- FFVulkanContext *s = opaque;
- FFVkBuffer *buf = (FFVkBuffer *)data;
- ff_vk_free_buf(s, buf);
- av_free(buf);
- }
- int ff_vk_create_avbuf(FFVulkanContext *s, AVBufferRef **ref, size_t size,
- void *pNext, void *alloc_pNext,
- VkBufferUsageFlags usage, VkMemoryPropertyFlagBits flags)
- {
- int err;
- AVBufferRef *buf;
- FFVkBuffer *vkb = av_mallocz(sizeof(*vkb));
- if (!vkb)
- return AVERROR(ENOMEM);
- err = ff_vk_create_buf(s, vkb, size, pNext, alloc_pNext, usage, flags);
- if (err < 0) {
- av_free(vkb);
- return err;
- }
- buf = av_buffer_create((uint8_t *)vkb, sizeof(*vkb), destroy_avvkbuf, s, 0);
- if (!buf) {
- destroy_avvkbuf(s, (uint8_t *)vkb);
- return AVERROR(ENOMEM);
- }
- *ref = buf;
- return 0;
- }
- int ff_vk_map_buffers(FFVulkanContext *s, FFVkBuffer **buf, uint8_t *mem[],
- int nb_buffers, int invalidate)
- {
- VkResult ret;
- FFVulkanFunctions *vk = &s->vkfn;
- VkMappedMemoryRange inval_list[64];
- int inval_count = 0;
- for (int i = 0; i < nb_buffers; i++) {
- void *dst;
- ret = vk->MapMemory(s->hwctx->act_dev, buf[i]->mem, 0,
- VK_WHOLE_SIZE, 0, &dst);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Failed to map buffer memory: %s\n",
- ff_vk_ret2str(ret));
- return AVERROR_EXTERNAL;
- }
- mem[i] = dst;
- }
- if (!invalidate)
- return 0;
- for (int i = 0; i < nb_buffers; i++) {
- const VkMappedMemoryRange ival_buf = {
- .sType = VK_STRUCTURE_TYPE_MAPPED_MEMORY_RANGE,
- .memory = buf[i]->mem,
- .size = VK_WHOLE_SIZE,
- };
- if (buf[i]->flags & VK_MEMORY_PROPERTY_HOST_COHERENT_BIT)
- continue;
- inval_list[inval_count++] = ival_buf;
- }
- if (inval_count) {
- ret = vk->InvalidateMappedMemoryRanges(s->hwctx->act_dev, inval_count,
- inval_list);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Failed to invalidate memory: %s\n",
- ff_vk_ret2str(ret));
- return AVERROR_EXTERNAL;
- }
- }
- return 0;
- }
- int ff_vk_unmap_buffers(FFVulkanContext *s, FFVkBuffer **buf, int nb_buffers,
- int flush)
- {
- int err = 0;
- VkResult ret;
- FFVulkanFunctions *vk = &s->vkfn;
- VkMappedMemoryRange flush_list[64];
- int flush_count = 0;
- if (flush) {
- for (int i = 0; i < nb_buffers; i++) {
- const VkMappedMemoryRange flush_buf = {
- .sType = VK_STRUCTURE_TYPE_MAPPED_MEMORY_RANGE,
- .memory = buf[i]->mem,
- .size = VK_WHOLE_SIZE,
- };
- if (buf[i]->flags & VK_MEMORY_PROPERTY_HOST_COHERENT_BIT)
- continue;
- flush_list[flush_count++] = flush_buf;
- }
- }
- if (flush_count) {
- ret = vk->FlushMappedMemoryRanges(s->hwctx->act_dev, flush_count,
- flush_list);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Failed to flush memory: %s\n",
- ff_vk_ret2str(ret));
- err = AVERROR_EXTERNAL; /* We still want to try to unmap them */
- }
- }
- for (int i = 0; i < nb_buffers; i++)
- vk->UnmapMemory(s->hwctx->act_dev, buf[i]->mem);
- return err;
- }
- void ff_vk_free_buf(FFVulkanContext *s, FFVkBuffer *buf)
- {
- FFVulkanFunctions *vk = &s->vkfn;
- if (!buf || !s->hwctx)
- return;
- if (buf->mapped_mem)
- ff_vk_unmap_buffer(s, buf, 0);
- if (buf->buf != VK_NULL_HANDLE)
- vk->DestroyBuffer(s->hwctx->act_dev, buf->buf, s->hwctx->alloc);
- if (buf->mem != VK_NULL_HANDLE)
- vk->FreeMemory(s->hwctx->act_dev, buf->mem, s->hwctx->alloc);
- }
- static void free_data_buf(void *opaque, uint8_t *data)
- {
- FFVulkanContext *ctx = opaque;
- FFVkBuffer *buf = (FFVkBuffer *)data;
- ff_vk_free_buf(ctx, buf);
- av_free(data);
- }
- static AVBufferRef *alloc_data_buf(void *opaque, size_t size)
- {
- AVBufferRef *ref;
- uint8_t *buf = av_mallocz(size);
- if (!buf)
- return NULL;
- ref = av_buffer_create(buf, size, free_data_buf, opaque, 0);
- if (!ref)
- av_free(buf);
- return ref;
- }
- int ff_vk_get_pooled_buffer(FFVulkanContext *ctx, AVBufferPool **buf_pool,
- AVBufferRef **buf, VkBufferUsageFlags usage,
- void *create_pNext, size_t size,
- VkMemoryPropertyFlagBits mem_props)
- {
- int err;
- AVBufferRef *ref;
- FFVkBuffer *data;
- if (!(*buf_pool)) {
- *buf_pool = av_buffer_pool_init2(sizeof(FFVkBuffer), ctx,
- alloc_data_buf, NULL);
- if (!(*buf_pool))
- return AVERROR(ENOMEM);
- }
- *buf = ref = av_buffer_pool_get(*buf_pool);
- if (!ref)
- return AVERROR(ENOMEM);
- data = (FFVkBuffer *)ref->data;
- data->stage = VK_PIPELINE_STAGE_2_ALL_COMMANDS_BIT;
- data->access = VK_ACCESS_2_NONE;
- if (data->size >= size)
- return 0;
- ff_vk_free_buf(ctx, data);
- memset(data, 0, sizeof(*data));
- av_log(ctx, AV_LOG_DEBUG, "Allocating buffer of %"SIZE_SPECIFIER" bytes for pool %p\n",
- size, *buf_pool);
- err = ff_vk_create_buf(ctx, data, size,
- create_pNext, NULL, usage,
- mem_props);
- if (err < 0) {
- av_buffer_unref(&ref);
- return err;
- }
- if (mem_props & VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT) {
- err = ff_vk_map_buffer(ctx, data, &data->mapped_mem, 0);
- if (err < 0) {
- av_buffer_unref(&ref);
- return err;
- }
- }
- return 0;
- }
- int ff_vk_add_push_constant(FFVulkanPipeline *pl, int offset, int size,
- VkShaderStageFlagBits stage)
- {
- VkPushConstantRange *pc;
- pl->push_consts = av_realloc_array(pl->push_consts, sizeof(*pl->push_consts),
- pl->push_consts_num + 1);
- if (!pl->push_consts)
- return AVERROR(ENOMEM);
- pc = &pl->push_consts[pl->push_consts_num++];
- memset(pc, 0, sizeof(*pc));
- pc->stageFlags = stage;
- pc->offset = offset;
- pc->size = size;
- return 0;
- }
- int ff_vk_init_sampler(FFVulkanContext *s, VkSampler *sampler,
- int unnorm_coords, VkFilter filt)
- {
- VkResult ret;
- FFVulkanFunctions *vk = &s->vkfn;
- VkSamplerCreateInfo sampler_info = {
- .sType = VK_STRUCTURE_TYPE_SAMPLER_CREATE_INFO,
- .magFilter = filt,
- .minFilter = sampler_info.magFilter,
- .mipmapMode = unnorm_coords ? VK_SAMPLER_MIPMAP_MODE_NEAREST :
- VK_SAMPLER_MIPMAP_MODE_LINEAR,
- .addressModeU = VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE,
- .addressModeV = sampler_info.addressModeU,
- .addressModeW = sampler_info.addressModeU,
- .anisotropyEnable = VK_FALSE,
- .compareOp = VK_COMPARE_OP_NEVER,
- .borderColor = VK_BORDER_COLOR_FLOAT_TRANSPARENT_BLACK,
- .unnormalizedCoordinates = unnorm_coords,
- };
- ret = vk->CreateSampler(s->hwctx->act_dev, &sampler_info,
- s->hwctx->alloc, sampler);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Unable to init sampler: %s\n",
- ff_vk_ret2str(ret));
- return AVERROR_EXTERNAL;
- }
- return 0;
- }
- int ff_vk_mt_is_np_rgb(enum AVPixelFormat pix_fmt)
- {
- if (pix_fmt == AV_PIX_FMT_ABGR || pix_fmt == AV_PIX_FMT_BGRA ||
- pix_fmt == AV_PIX_FMT_RGBA || pix_fmt == AV_PIX_FMT_RGB24 ||
- pix_fmt == AV_PIX_FMT_BGR24 || pix_fmt == AV_PIX_FMT_RGB48 ||
- pix_fmt == AV_PIX_FMT_RGBA64 || pix_fmt == AV_PIX_FMT_RGB565 ||
- pix_fmt == AV_PIX_FMT_BGR565 || pix_fmt == AV_PIX_FMT_BGR0 ||
- pix_fmt == AV_PIX_FMT_0BGR || pix_fmt == AV_PIX_FMT_RGB0 ||
- pix_fmt == AV_PIX_FMT_X2RGB10 || pix_fmt == AV_PIX_FMT_X2BGR10)
- return 1;
- return 0;
- }
- const char *ff_vk_shader_rep_fmt(enum AVPixelFormat pixfmt)
- {
- const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pixfmt);
- const int high = desc->comp[0].depth > 8;
- return high ? "rgba16f" : "rgba8";
- }
- typedef struct ImageViewCtx {
- int nb_views;
- VkImageView views[];
- } ImageViewCtx;
- static void destroy_imageviews(void *opaque, uint8_t *data)
- {
- FFVulkanContext *s = opaque;
- FFVulkanFunctions *vk = &s->vkfn;
- ImageViewCtx *iv = (ImageViewCtx *)data;
- for (int i = 0; i < iv->nb_views; i++)
- vk->DestroyImageView(s->hwctx->act_dev, iv->views[i], s->hwctx->alloc);
- av_free(iv);
- }
- int ff_vk_create_imageviews(FFVulkanContext *s, FFVkExecContext *e,
- VkImageView views[AV_NUM_DATA_POINTERS],
- AVFrame *f)
- {
- int err;
- VkResult ret;
- AVBufferRef *buf;
- FFVulkanFunctions *vk = &s->vkfn;
- AVHWFramesContext *hwfc = (AVHWFramesContext *)f->hw_frames_ctx->data;
- const VkFormat *rep_fmts = av_vkfmt_from_pixfmt(hwfc->sw_format);
- AVVkFrame *vkf = (AVVkFrame *)f->data[0];
- const int nb_images = ff_vk_count_images(vkf);
- const int nb_planes = av_pix_fmt_count_planes(hwfc->sw_format);
- const size_t buf_size = sizeof(int) + nb_planes*sizeof(VkImageView);
- ImageViewCtx *iv = av_mallocz(buf_size);
- if (!iv)
- return AVERROR(ENOMEM);
- for (int i = 0; i < nb_planes; i++) {
- VkImageAspectFlags plane_aspect[] = { VK_IMAGE_ASPECT_COLOR_BIT,
- VK_IMAGE_ASPECT_PLANE_0_BIT,
- VK_IMAGE_ASPECT_PLANE_1_BIT,
- VK_IMAGE_ASPECT_PLANE_2_BIT, };
- VkImageViewCreateInfo view_create_info = {
- .sType = VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,
- .pNext = NULL,
- .image = vkf->img[FFMIN(i, nb_images - 1)],
- .viewType = VK_IMAGE_VIEW_TYPE_2D,
- .format = rep_fmts[i],
- .components = ff_comp_identity_map,
- .subresourceRange = {
- .aspectMask = plane_aspect[(nb_planes != nb_images) +
- i*(nb_planes != nb_images)],
- .levelCount = 1,
- .layerCount = 1,
- },
- };
- ret = vk->CreateImageView(s->hwctx->act_dev, &view_create_info,
- s->hwctx->alloc, &iv->views[i]);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Failed to create imageview: %s\n",
- ff_vk_ret2str(ret));
- err = AVERROR_EXTERNAL;
- goto fail;
- }
- iv->nb_views++;
- }
- buf = av_buffer_create((uint8_t *)iv, buf_size, destroy_imageviews, s, 0);
- if (!buf) {
- err = AVERROR(ENOMEM);
- goto fail;
- }
- /* Add to queue dependencies */
- err = ff_vk_exec_add_dep_buf(s, e, &buf, 1, 0);
- if (err < 0)
- av_buffer_unref(&buf);
- memcpy(views, iv->views, nb_planes*sizeof(*views));
- return err;
- fail:
- for (int i = 0; i < iv->nb_views; i++)
- vk->DestroyImageView(s->hwctx->act_dev, iv->views[i], s->hwctx->alloc);
- av_free(iv);
- return err;
- }
- void ff_vk_frame_barrier(FFVulkanContext *s, FFVkExecContext *e,
- AVFrame *pic, VkImageMemoryBarrier2 *bar, int *nb_bar,
- VkPipelineStageFlags src_stage,
- VkPipelineStageFlags dst_stage,
- VkAccessFlagBits new_access,
- VkImageLayout new_layout,
- uint32_t new_qf)
- {
- int found = -1;
- AVVkFrame *vkf = (AVVkFrame *)pic->data[0];
- const int nb_images = ff_vk_count_images(vkf);
- for (int i = 0; i < e->nb_frame_deps; i++)
- if (e->frame_deps[i]->data[0] == pic->data[0]) {
- if (e->frame_update[i])
- found = i;
- break;
- }
- for (int i = 0; i < nb_images; i++) {
- bar[*nb_bar] = (VkImageMemoryBarrier2) {
- .sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER_2,
- .pNext = NULL,
- .srcStageMask = src_stage,
- .dstStageMask = dst_stage,
- .srcAccessMask = found >= 0 ? e->access_dst[found] : vkf->access[i],
- .dstAccessMask = new_access,
- .oldLayout = found >= 0 ? e->layout_dst[found] : vkf->layout[0],
- .newLayout = new_layout,
- .srcQueueFamilyIndex = found >= 0 ? e->queue_family_dst[found] : vkf->queue_family[0],
- .dstQueueFamilyIndex = new_qf,
- .image = vkf->img[i],
- .subresourceRange = (VkImageSubresourceRange) {
- .aspectMask = VK_IMAGE_ASPECT_COLOR_BIT,
- .layerCount = 1,
- .levelCount = 1,
- },
- };
- *nb_bar += 1;
- }
- ff_vk_exec_update_frame(s, e, pic, &bar[*nb_bar - nb_images], NULL);
- }
- int ff_vk_shader_init(FFVulkanPipeline *pl, FFVkSPIRVShader *shd, const char *name,
- VkShaderStageFlags stage, uint32_t required_subgroup_size)
- {
- av_bprint_init(&shd->src, 0, AV_BPRINT_SIZE_UNLIMITED);
- shd->shader.sType = VK_STRUCTURE_TYPE_PIPELINE_SHADER_STAGE_CREATE_INFO;
- shd->shader.stage = stage;
- if (required_subgroup_size) {
- shd->shader.flags |= VK_PIPELINE_SHADER_STAGE_CREATE_REQUIRE_FULL_SUBGROUPS_BIT;
- shd->shader.pNext = &shd->subgroup_info;
- shd->subgroup_info.sType = VK_STRUCTURE_TYPE_PIPELINE_SHADER_STAGE_REQUIRED_SUBGROUP_SIZE_CREATE_INFO;
- shd->subgroup_info.requiredSubgroupSize = required_subgroup_size;
- }
- shd->name = name;
- GLSLF(0, #version %i ,460);
- GLSLC(0, #define IS_WITHIN(v1, v2) ((v1.x < v2.x) && (v1.y < v2.y)) );
- GLSLC(0, );
- GLSLC(0, #extension GL_EXT_buffer_reference : require );
- GLSLC(0, #extension GL_EXT_buffer_reference2 : require );
- return 0;
- }
- void ff_vk_shader_set_compute_sizes(FFVkSPIRVShader *shd, int x, int y, int z)
- {
- shd->local_size[0] = x;
- shd->local_size[1] = y;
- shd->local_size[2] = z;
- av_bprintf(&shd->src, "layout (local_size_x = %i, "
- "local_size_y = %i, local_size_z = %i) in;\n\n",
- shd->local_size[0], shd->local_size[1], shd->local_size[2]);
- }
- void ff_vk_shader_print(void *ctx, FFVkSPIRVShader *shd, int prio)
- {
- int line = 0;
- const char *p = shd->src.str;
- const char *start = p;
- const size_t len = strlen(p);
- AVBPrint buf;
- av_bprint_init(&buf, 0, AV_BPRINT_SIZE_UNLIMITED);
- for (int i = 0; i < len; i++) {
- if (p[i] == '\n') {
- av_bprintf(&buf, "%i\t", ++line);
- av_bprint_append_data(&buf, start, &p[i] - start + 1);
- start = &p[i + 1];
- }
- }
- av_log(ctx, prio, "Shader %s: \n%s", shd->name, buf.str);
- av_bprint_finalize(&buf, NULL);
- }
- void ff_vk_shader_free(FFVulkanContext *s, FFVkSPIRVShader *shd)
- {
- FFVulkanFunctions *vk = &s->vkfn;
- av_bprint_finalize(&shd->src, NULL);
- if (shd->shader.module)
- vk->DestroyShaderModule(s->hwctx->act_dev, shd->shader.module, s->hwctx->alloc);
- }
- int ff_vk_shader_create(FFVulkanContext *s, FFVkSPIRVShader *shd,
- uint8_t *spirv, size_t spirv_size, const char *entrypoint)
- {
- VkResult ret;
- FFVulkanFunctions *vk = &s->vkfn;
- VkShaderModuleCreateInfo shader_create;
- shd->shader.pName = entrypoint;
- av_log(s, AV_LOG_VERBOSE, "Shader %s compiled! Size: %zu bytes\n",
- shd->name, spirv_size);
- shader_create.sType = VK_STRUCTURE_TYPE_SHADER_MODULE_CREATE_INFO;
- shader_create.pNext = NULL;
- shader_create.codeSize = spirv_size;
- shader_create.flags = 0;
- shader_create.pCode = (void *)spirv;
- ret = vk->CreateShaderModule(s->hwctx->act_dev, &shader_create, NULL,
- &shd->shader.module);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_VERBOSE, "Error creating shader module: %s\n",
- ff_vk_ret2str(ret));
- return AVERROR_EXTERNAL;
- }
- return 0;
- }
- static const struct descriptor_props {
- size_t struct_size; /* Size of the opaque which updates the descriptor */
- const char *type;
- int is_uniform;
- int mem_quali; /* Can use a memory qualifier */
- int dim_needed; /* Must indicate dimension */
- int buf_content; /* Must indicate buffer contents */
- } descriptor_props[] = {
- [VK_DESCRIPTOR_TYPE_SAMPLER] = { sizeof(VkDescriptorImageInfo), "sampler", 1, 0, 0, 0, },
- [VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE] = { sizeof(VkDescriptorImageInfo), "texture", 1, 0, 1, 0, },
- [VK_DESCRIPTOR_TYPE_STORAGE_IMAGE] = { sizeof(VkDescriptorImageInfo), "image", 1, 1, 1, 0, },
- [VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT] = { sizeof(VkDescriptorImageInfo), "subpassInput", 1, 0, 0, 0, },
- [VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER] = { sizeof(VkDescriptorImageInfo), "sampler", 1, 0, 1, 0, },
- [VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER] = { sizeof(VkDescriptorBufferInfo), NULL, 1, 0, 0, 1, },
- [VK_DESCRIPTOR_TYPE_STORAGE_BUFFER] = { sizeof(VkDescriptorBufferInfo), "buffer", 0, 1, 0, 1, },
- [VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC] = { sizeof(VkDescriptorBufferInfo), NULL, 1, 0, 0, 1, },
- [VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC] = { sizeof(VkDescriptorBufferInfo), "buffer", 0, 1, 0, 1, },
- [VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER] = { sizeof(VkBufferView), "samplerBuffer", 1, 0, 0, 0, },
- [VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER] = { sizeof(VkBufferView), "imageBuffer", 1, 0, 0, 0, },
- };
- int ff_vk_pipeline_descriptor_set_add(FFVulkanContext *s, FFVulkanPipeline *pl,
- FFVkSPIRVShader *shd,
- FFVulkanDescriptorSetBinding *desc, int nb,
- int singular, int print_to_shader_only)
- {
- VkResult ret;
- int has_sampler = 0;
- FFVulkanFunctions *vk = &s->vkfn;
- FFVulkanDescriptorSet *set;
- VkDescriptorSetLayoutCreateInfo desc_create_layout;
- if (print_to_shader_only)
- goto print;
- /* Actual layout allocated for the pipeline */
- set = av_realloc_array(pl->desc_set, sizeof(*pl->desc_set),
- pl->nb_descriptor_sets + 1);
- if (!set)
- return AVERROR(ENOMEM);
- pl->desc_set = set;
- set = &set[pl->nb_descriptor_sets];
- memset(set, 0, sizeof(*set));
- set->binding = av_calloc(nb, sizeof(*set->binding));
- if (!set->binding)
- return AVERROR(ENOMEM);
- set->binding_offset = av_calloc(nb, sizeof(*set->binding_offset));
- if (!set->binding_offset) {
- av_freep(&set->binding);
- return AVERROR(ENOMEM);
- }
- desc_create_layout = (VkDescriptorSetLayoutCreateInfo) {
- .sType = VK_STRUCTURE_TYPE_DESCRIPTOR_SET_LAYOUT_CREATE_INFO,
- .bindingCount = nb,
- .pBindings = set->binding,
- .flags = VK_DESCRIPTOR_SET_LAYOUT_CREATE_DESCRIPTOR_BUFFER_BIT_EXT,
- };
- for (int i = 0; i < nb; i++) {
- set->binding[i].binding = i;
- set->binding[i].descriptorType = desc[i].type;
- set->binding[i].descriptorCount = FFMAX(desc[i].elems, 1);
- set->binding[i].stageFlags = desc[i].stages;
- set->binding[i].pImmutableSamplers = desc[i].samplers;
- if (desc[i].type == VK_DESCRIPTOR_TYPE_SAMPLER ||
- desc[i].type == VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER)
- has_sampler |= 1;
- }
- set->usage = VK_BUFFER_USAGE_RESOURCE_DESCRIPTOR_BUFFER_BIT_EXT |
- VK_BUFFER_USAGE_SHADER_DEVICE_ADDRESS_BIT;
- if (has_sampler)
- set->usage |= VK_BUFFER_USAGE_SAMPLER_DESCRIPTOR_BUFFER_BIT_EXT;
- ret = vk->CreateDescriptorSetLayout(s->hwctx->act_dev, &desc_create_layout,
- s->hwctx->alloc, &set->layout);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Unable to init descriptor set layout: %s",
- ff_vk_ret2str(ret));
- return AVERROR_EXTERNAL;
- }
- vk->GetDescriptorSetLayoutSizeEXT(s->hwctx->act_dev, set->layout, &set->layout_size);
- set->aligned_size = FFALIGN(set->layout_size, s->desc_buf_props.descriptorBufferOffsetAlignment);
- for (int i = 0; i < nb; i++)
- vk->GetDescriptorSetLayoutBindingOffsetEXT(s->hwctx->act_dev, set->layout,
- i, &set->binding_offset[i]);
- set->singular = singular;
- set->nb_bindings = nb;
- pl->nb_descriptor_sets++;
- print:
- /* Write shader info */
- for (int i = 0; i < nb; i++) {
- const struct descriptor_props *prop = &descriptor_props[desc[i].type];
- GLSLA("layout (set = %i, binding = %i", pl->nb_descriptor_sets - 1, i);
- if (desc[i].mem_layout)
- GLSLA(", %s", desc[i].mem_layout);
- GLSLA(")");
- if (prop->is_uniform)
- GLSLA(" uniform");
- if (prop->mem_quali && desc[i].mem_quali)
- GLSLA(" %s", desc[i].mem_quali);
- if (prop->type)
- GLSLA(" %s", prop->type);
- if (prop->dim_needed)
- GLSLA("%iD", desc[i].dimensions);
- GLSLA(" %s", desc[i].name);
- if (prop->buf_content)
- GLSLA(" {\n %s\n}", desc[i].buf_content);
- else if (desc[i].elems > 0)
- GLSLA("[%i]", desc[i].elems);
- GLSLA(";");
- GLSLA("\n");
- }
- GLSLA("\n");
- return 0;
- }
- int ff_vk_exec_pipeline_register(FFVulkanContext *s, FFVkExecPool *pool,
- FFVulkanPipeline *pl)
- {
- int err;
- pl->desc_bind = av_calloc(pl->nb_descriptor_sets, sizeof(*pl->desc_bind));
- if (!pl->desc_bind)
- return AVERROR(ENOMEM);
- pl->bound_buffer_indices = av_calloc(pl->nb_descriptor_sets,
- sizeof(*pl->bound_buffer_indices));
- if (!pl->bound_buffer_indices)
- return AVERROR(ENOMEM);
- for (int i = 0; i < pl->nb_descriptor_sets; i++) {
- FFVulkanDescriptorSet *set = &pl->desc_set[i];
- int nb = set->singular ? 1 : pool->pool_size;
- err = ff_vk_create_buf(s, &set->buf, set->aligned_size*nb,
- NULL, NULL, set->usage,
- VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT |
- VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT |
- VK_MEMORY_PROPERTY_HOST_COHERENT_BIT);
- if (err < 0)
- return err;
- err = ff_vk_map_buffer(s, &set->buf, &set->desc_mem, 0);
- if (err < 0)
- return err;
- pl->desc_bind[i] = (VkDescriptorBufferBindingInfoEXT) {
- .sType = VK_STRUCTURE_TYPE_DESCRIPTOR_BUFFER_BINDING_INFO_EXT,
- .usage = set->usage,
- .address = set->buf.address,
- };
- pl->bound_buffer_indices[i] = i;
- }
- return 0;
- }
- static inline void update_set_descriptor(FFVulkanContext *s, FFVkExecContext *e,
- FFVulkanDescriptorSet *set,
- int bind_idx, int array_idx,
- VkDescriptorGetInfoEXT *desc_get_info,
- size_t desc_size)
- {
- FFVulkanFunctions *vk = &s->vkfn;
- const size_t exec_offset = set->singular ? 0 : set->aligned_size*e->idx;
- void *desc = set->desc_mem + /* Base */
- exec_offset + /* Execution context */
- set->binding_offset[bind_idx] + /* Descriptor binding */
- array_idx*desc_size; /* Array position */
- vk->GetDescriptorEXT(s->hwctx->act_dev, desc_get_info, desc_size, desc);
- }
- static int vk_set_descriptor_image(FFVulkanContext *s, FFVulkanPipeline *pl,
- FFVkExecContext *e, int set, int bind, int offs,
- VkImageView view, VkImageLayout layout,
- VkSampler sampler)
- {
- FFVulkanDescriptorSet *desc_set = &pl->desc_set[set];
- VkDescriptorGetInfoEXT desc_get_info = {
- .sType = VK_STRUCTURE_TYPE_DESCRIPTOR_GET_INFO_EXT,
- .type = desc_set->binding[bind].descriptorType,
- };
- VkDescriptorImageInfo desc_img_info = {
- .imageView = view,
- .sampler = sampler,
- .imageLayout = layout,
- };
- size_t desc_size;
- switch (desc_get_info.type) {
- case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
- desc_get_info.data.pSampledImage = &desc_img_info;
- desc_size = s->desc_buf_props.sampledImageDescriptorSize;
- break;
- case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
- desc_get_info.data.pStorageImage = &desc_img_info;
- desc_size = s->desc_buf_props.storageImageDescriptorSize;
- break;
- case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
- desc_get_info.data.pInputAttachmentImage = &desc_img_info;
- desc_size = s->desc_buf_props.inputAttachmentDescriptorSize;
- break;
- case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
- desc_get_info.data.pCombinedImageSampler = &desc_img_info;
- desc_size = s->desc_buf_props.combinedImageSamplerDescriptorSize;
- break;
- default:
- av_log(s, AV_LOG_ERROR, "Invalid descriptor type at set %i binding %i: %i!\n",
- set, bind, desc_get_info.type);
- return AVERROR(EINVAL);
- break;
- };
- update_set_descriptor(s, e, desc_set, bind, offs, &desc_get_info, desc_size);
- return 0;
- }
- int ff_vk_set_descriptor_buffer(FFVulkanContext *s, FFVulkanPipeline *pl,
- FFVkExecContext *e, int set, int bind, int offs,
- VkDeviceAddress addr, VkDeviceSize len, VkFormat fmt)
- {
- FFVulkanDescriptorSet *desc_set = &pl->desc_set[set];
- VkDescriptorGetInfoEXT desc_get_info = {
- .sType = VK_STRUCTURE_TYPE_DESCRIPTOR_GET_INFO_EXT,
- .type = desc_set->binding[bind].descriptorType,
- };
- VkDescriptorAddressInfoEXT desc_buf_info = {
- .sType = VK_STRUCTURE_TYPE_DESCRIPTOR_ADDRESS_INFO_EXT,
- .address = addr,
- .range = len,
- .format = fmt,
- };
- size_t desc_size;
- switch (desc_get_info.type) {
- case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
- desc_get_info.data.pUniformBuffer = &desc_buf_info;
- desc_size = s->desc_buf_props.uniformBufferDescriptorSize;
- break;
- case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
- desc_get_info.data.pStorageBuffer = &desc_buf_info;
- desc_size = s->desc_buf_props.storageBufferDescriptorSize;
- break;
- case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
- desc_get_info.data.pUniformTexelBuffer = &desc_buf_info;
- desc_size = s->desc_buf_props.uniformTexelBufferDescriptorSize;
- break;
- case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
- desc_get_info.data.pStorageTexelBuffer = &desc_buf_info;
- desc_size = s->desc_buf_props.storageTexelBufferDescriptorSize;
- break;
- default:
- av_log(s, AV_LOG_ERROR, "Invalid descriptor type at set %i binding %i: %i!\n",
- set, bind, desc_get_info.type);
- return AVERROR(EINVAL);
- break;
- };
- update_set_descriptor(s, e, desc_set, bind, offs, &desc_get_info, desc_size);
- return 0;
- }
- void ff_vk_update_descriptor_img_array(FFVulkanContext *s, FFVulkanPipeline *pl,
- FFVkExecContext *e, AVFrame *f,
- VkImageView *views, int set, int binding,
- VkImageLayout layout, VkSampler sampler)
- {
- AVHWFramesContext *hwfc = (AVHWFramesContext *)f->hw_frames_ctx->data;
- const int nb_planes = av_pix_fmt_count_planes(hwfc->sw_format);
- for (int i = 0; i < nb_planes; i++)
- vk_set_descriptor_image(s, pl, e, set, binding, i,
- views[i], layout, sampler);
- }
- void ff_vk_update_push_exec(FFVulkanContext *s, FFVkExecContext *e,
- FFVulkanPipeline *pl,
- VkShaderStageFlagBits stage,
- int offset, size_t size, void *src)
- {
- FFVulkanFunctions *vk = &s->vkfn;
- vk->CmdPushConstants(e->buf, pl->pipeline_layout,
- stage, offset, size, src);
- }
- static int init_pipeline_layout(FFVulkanContext *s, FFVulkanPipeline *pl)
- {
- VkResult ret;
- FFVulkanFunctions *vk = &s->vkfn;
- VkPipelineLayoutCreateInfo pipeline_layout_info;
- VkDescriptorSetLayout *desc_layouts = av_malloc(pl->nb_descriptor_sets*
- sizeof(desc_layouts));
- if (!desc_layouts)
- return AVERROR(ENOMEM);
- for (int i = 0; i < pl->nb_descriptor_sets; i++)
- desc_layouts[i] = pl->desc_set[i].layout;
- /* Finally create the pipeline layout */
- pipeline_layout_info = (VkPipelineLayoutCreateInfo) {
- .sType = VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO,
- .pSetLayouts = desc_layouts,
- .setLayoutCount = pl->nb_descriptor_sets,
- .pushConstantRangeCount = pl->push_consts_num,
- .pPushConstantRanges = pl->push_consts,
- };
- ret = vk->CreatePipelineLayout(s->hwctx->act_dev, &pipeline_layout_info,
- s->hwctx->alloc, &pl->pipeline_layout);
- av_free(desc_layouts);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Unable to init pipeline layout: %s\n",
- ff_vk_ret2str(ret));
- return AVERROR_EXTERNAL;
- }
- return 0;
- }
- int ff_vk_init_compute_pipeline(FFVulkanContext *s, FFVulkanPipeline *pl,
- FFVkSPIRVShader *shd)
- {
- int err;
- VkResult ret;
- FFVulkanFunctions *vk = &s->vkfn;
- VkComputePipelineCreateInfo pipeline_create_info;
- err = init_pipeline_layout(s, pl);
- if (err < 0)
- return err;
- pipeline_create_info = (VkComputePipelineCreateInfo) {
- .sType = VK_STRUCTURE_TYPE_COMPUTE_PIPELINE_CREATE_INFO,
- .flags = VK_PIPELINE_CREATE_DESCRIPTOR_BUFFER_BIT_EXT,
- .layout = pl->pipeline_layout,
- .stage = shd->shader,
- };
- ret = vk->CreateComputePipelines(s->hwctx->act_dev, VK_NULL_HANDLE, 1,
- &pipeline_create_info,
- s->hwctx->alloc, &pl->pipeline);
- if (ret != VK_SUCCESS) {
- av_log(s, AV_LOG_ERROR, "Unable to init compute pipeline: %s\n",
- ff_vk_ret2str(ret));
- return AVERROR_EXTERNAL;
- }
- pl->bind_point = VK_PIPELINE_BIND_POINT_COMPUTE;
- pl->wg_size[0] = shd->local_size[0];
- pl->wg_size[1] = shd->local_size[1];
- pl->wg_size[2] = shd->local_size[2];
- return 0;
- }
- void ff_vk_exec_bind_pipeline(FFVulkanContext *s, FFVkExecContext *e,
- FFVulkanPipeline *pl)
- {
- FFVulkanFunctions *vk = &s->vkfn;
- VkDeviceSize offsets[1024];
- /* Bind pipeline */
- vk->CmdBindPipeline(e->buf, pl->bind_point, pl->pipeline);
- if (pl->nb_descriptor_sets) {
- for (int i = 0; i < pl->nb_descriptor_sets; i++)
- offsets[i] = pl->desc_set[i].singular ? 0 : pl->desc_set[i].aligned_size*e->idx;
- /* Bind descriptor buffers */
- vk->CmdBindDescriptorBuffersEXT(e->buf, pl->nb_descriptor_sets, pl->desc_bind);
- /* Binding offsets */
- vk->CmdSetDescriptorBufferOffsetsEXT(e->buf, pl->bind_point, pl->pipeline_layout,
- 0, pl->nb_descriptor_sets,
- pl->bound_buffer_indices, offsets);
- }
- }
- void ff_vk_pipeline_free(FFVulkanContext *s, FFVulkanPipeline *pl)
- {
- FFVulkanFunctions *vk = &s->vkfn;
- if (pl->pipeline)
- vk->DestroyPipeline(s->hwctx->act_dev, pl->pipeline, s->hwctx->alloc);
- if (pl->pipeline_layout)
- vk->DestroyPipelineLayout(s->hwctx->act_dev, pl->pipeline_layout,
- s->hwctx->alloc);
- for (int i = 0; i < pl->nb_descriptor_sets; i++) {
- FFVulkanDescriptorSet *set = &pl->desc_set[i];
- if (set->buf.mem)
- ff_vk_unmap_buffer(s, &set->buf, 0);
- ff_vk_free_buf(s, &set->buf);
- if (set->layout)
- vk->DestroyDescriptorSetLayout(s->hwctx->act_dev, set->layout,
- s->hwctx->alloc);
- av_free(set->binding);
- av_free(set->binding_offset);
- }
- av_freep(&pl->desc_set);
- av_freep(&pl->desc_bind);
- av_freep(&pl->bound_buffer_indices);
- av_freep(&pl->push_consts);
- pl->push_consts_num = 0;
- }
- void ff_vk_uninit(FFVulkanContext *s)
- {
- av_freep(&s->query_props);
- av_freep(&s->qf_props);
- av_freep(&s->video_props);
- av_freep(&s->coop_mat_props);
- av_buffer_unref(&s->device_ref);
- av_buffer_unref(&s->frames_ref);
- }
- int ff_vk_init(FFVulkanContext *s, void *log_parent,
- AVBufferRef *device_ref, AVBufferRef *frames_ref)
- {
- int err;
- static const AVClass vulkan_context_class = {
- .class_name = "vk",
- .version = LIBAVUTIL_VERSION_INT,
- .parent_log_context_offset = offsetof(FFVulkanContext, log_parent),
- };
- memset(s, 0, sizeof(*s));
- s->log_parent = log_parent;
- s->class = &vulkan_context_class;
- if (frames_ref) {
- s->frames_ref = av_buffer_ref(frames_ref);
- if (!s->frames_ref)
- return AVERROR(ENOMEM);
- s->frames = (AVHWFramesContext *)s->frames_ref->data;
- s->hwfc = s->frames->hwctx;
- device_ref = s->frames->device_ref;
- }
- s->device_ref = av_buffer_ref(device_ref);
- if (!s->device_ref) {
- ff_vk_uninit(s);
- return AVERROR(ENOMEM);
- }
- s->device = (AVHWDeviceContext *)s->device_ref->data;
- s->hwctx = s->device->hwctx;
- s->extensions = ff_vk_extensions_to_mask(s->hwctx->enabled_dev_extensions,
- s->hwctx->nb_enabled_dev_extensions);
- err = ff_vk_load_functions(s->device, &s->vkfn, s->extensions, 1, 1);
- if (err < 0) {
- ff_vk_uninit(s);
- return err;
- }
- err = ff_vk_load_props(s);
- if (err < 0) {
- ff_vk_uninit(s);
- return err;
- }
- return 0;
- }
|