testffmpeg_vulkan.c 43 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968
  1. /*
  2. Copyright (C) 1997-2024 Sam Lantinga <slouken@libsdl.org>
  3. This software is provided 'as-is', without any express or implied
  4. warranty. In no event will the authors be held liable for any damages
  5. arising from the use of this software.
  6. Permission is granted to anyone to use this software for any purpose,
  7. including commercial applications, and to alter it and redistribute it
  8. freely.
  9. */
  10. #include <SDL3/SDL.h>
  11. #include <SDL3/SDL_vulkan.h>
  12. #include <libavutil/hwcontext.h>
  13. #include <libavutil/hwcontext_vulkan.h>
  14. #include "testffmpeg_vulkan.h"
  15. #define VULKAN_FUNCTIONS() \
  16. VULKAN_GLOBAL_FUNCTION(vkCreateInstance) \
  17. VULKAN_GLOBAL_FUNCTION(vkEnumerateInstanceExtensionProperties) \
  18. VULKAN_GLOBAL_FUNCTION(vkEnumerateInstanceLayerProperties) \
  19. VULKAN_INSTANCE_FUNCTION(vkCreateDevice) \
  20. VULKAN_INSTANCE_FUNCTION(vkDestroyInstance) \
  21. VULKAN_INSTANCE_FUNCTION(vkDestroySurfaceKHR) \
  22. VULKAN_INSTANCE_FUNCTION(vkEnumerateDeviceExtensionProperties) \
  23. VULKAN_INSTANCE_FUNCTION(vkEnumeratePhysicalDevices) \
  24. VULKAN_INSTANCE_FUNCTION(vkGetDeviceProcAddr) \
  25. VULKAN_INSTANCE_FUNCTION(vkGetPhysicalDeviceFeatures2) \
  26. VULKAN_INSTANCE_FUNCTION(vkGetPhysicalDeviceQueueFamilyProperties) \
  27. VULKAN_INSTANCE_FUNCTION(vkGetPhysicalDeviceSurfaceSupportKHR) \
  28. VULKAN_INSTANCE_FUNCTION(vkQueueWaitIdle) \
  29. VULKAN_DEVICE_FUNCTION(vkAllocateCommandBuffers) \
  30. VULKAN_DEVICE_FUNCTION(vkBeginCommandBuffer) \
  31. VULKAN_DEVICE_FUNCTION(vkCmdPipelineBarrier2) \
  32. VULKAN_DEVICE_FUNCTION(vkCreateCommandPool) \
  33. VULKAN_DEVICE_FUNCTION(vkCreateSemaphore) \
  34. VULKAN_DEVICE_FUNCTION(vkDestroyCommandPool) \
  35. VULKAN_DEVICE_FUNCTION(vkDestroyDevice) \
  36. VULKAN_DEVICE_FUNCTION(vkDestroySemaphore) \
  37. VULKAN_DEVICE_FUNCTION(vkDeviceWaitIdle) \
  38. VULKAN_DEVICE_FUNCTION(vkEndCommandBuffer) \
  39. VULKAN_DEVICE_FUNCTION(vkFreeCommandBuffers) \
  40. VULKAN_DEVICE_FUNCTION(vkGetDeviceQueue) \
  41. VULKAN_DEVICE_FUNCTION(vkQueueSubmit) \
  42. \
  43. VULKAN_INSTANCE_FUNCTION(vkGetPhysicalDeviceVideoFormatPropertiesKHR) \
  44. typedef struct
  45. {
  46. VkPhysicalDeviceFeatures2 device_features;
  47. VkPhysicalDeviceVulkan11Features device_features_1_1;
  48. VkPhysicalDeviceVulkan12Features device_features_1_2;
  49. VkPhysicalDeviceVulkan13Features device_features_1_3;
  50. VkPhysicalDeviceDescriptorBufferFeaturesEXT desc_buf_features;
  51. VkPhysicalDeviceShaderAtomicFloatFeaturesEXT atomic_float_features;
  52. VkPhysicalDeviceCooperativeMatrixFeaturesKHR coop_matrix_features;
  53. } VulkanDeviceFeatures;
  54. struct VulkanVideoContext
  55. {
  56. VkInstance instance;
  57. VkSurfaceKHR surface;
  58. VkPhysicalDevice physicalDevice;
  59. int presentQueueFamilyIndex;
  60. int presentQueueCount;
  61. int graphicsQueueFamilyIndex;
  62. int graphicsQueueCount;
  63. int transferQueueFamilyIndex;
  64. int transferQueueCount;
  65. int computeQueueFamilyIndex;
  66. int computeQueueCount;
  67. int decodeQueueFamilyIndex;
  68. int decodeQueueCount;
  69. VkDevice device;
  70. VkQueue graphicsQueue;
  71. VkCommandPool commandPool;
  72. VkCommandBuffer *commandBuffers;
  73. uint32_t commandBufferCount;
  74. uint32_t commandBufferIndex;
  75. VkSemaphore *waitSemaphores;
  76. uint32_t waitSemaphoreCount;
  77. VkSemaphore *signalSemaphores;
  78. uint32_t signalSemaphoreCount;
  79. const char **instanceExtensions;
  80. int instanceExtensionsCount;
  81. const char **deviceExtensions;
  82. int deviceExtensionsCount;
  83. VulkanDeviceFeatures features;
  84. PFN_vkGetInstanceProcAddr vkGetInstanceProcAddr;
  85. #define VULKAN_GLOBAL_FUNCTION(name) PFN_##name name;
  86. #define VULKAN_INSTANCE_FUNCTION(name) PFN_##name name;
  87. #define VULKAN_DEVICE_FUNCTION(name) PFN_##name name;
  88. VULKAN_FUNCTIONS()
  89. #undef VULKAN_GLOBAL_FUNCTION
  90. #undef VULKAN_INSTANCE_FUNCTION
  91. #undef VULKAN_DEVICE_FUNCTION
  92. };
  93. static int loadGlobalFunctions(VulkanVideoContext *context)
  94. {
  95. context->vkGetInstanceProcAddr = (PFN_vkGetInstanceProcAddr)SDL_Vulkan_GetVkGetInstanceProcAddr();
  96. if (!context->vkGetInstanceProcAddr) {
  97. return -1;
  98. }
  99. #define VULKAN_GLOBAL_FUNCTION(name) \
  100. context->name = (PFN_##name)context->vkGetInstanceProcAddr(VK_NULL_HANDLE, #name); \
  101. if (!context->name) { \
  102. return SDL_SetError("vkGetInstanceProcAddr(VK_NULL_HANDLE, \"" #name "\") failed"); \
  103. }
  104. #define VULKAN_INSTANCE_FUNCTION(name)
  105. #define VULKAN_DEVICE_FUNCTION(name)
  106. VULKAN_FUNCTIONS()
  107. #undef VULKAN_GLOBAL_FUNCTION
  108. #undef VULKAN_INSTANCE_FUNCTION
  109. #undef VULKAN_DEVICE_FUNCTION
  110. return 0;
  111. }
  112. static int loadInstanceFunctions(VulkanVideoContext *context)
  113. {
  114. #define VULKAN_GLOBAL_FUNCTION(name)
  115. #define VULKAN_INSTANCE_FUNCTION(name) \
  116. context->name = (PFN_##name)context->vkGetInstanceProcAddr(context->instance, #name); \
  117. if (!context->name) { \
  118. return SDL_SetError("vkGetInstanceProcAddr(instance, \"" #name "\") failed"); \
  119. }
  120. #define VULKAN_DEVICE_FUNCTION(name)
  121. VULKAN_FUNCTIONS()
  122. #undef VULKAN_GLOBAL_FUNCTION
  123. #undef VULKAN_INSTANCE_FUNCTION
  124. #undef VULKAN_DEVICE_FUNCTION
  125. return 0;
  126. }
  127. static int loadDeviceFunctions(VulkanVideoContext *context)
  128. {
  129. #define VULKAN_GLOBAL_FUNCTION(name)
  130. #define VULKAN_INSTANCE_FUNCTION(name)
  131. #define VULKAN_DEVICE_FUNCTION(name) \
  132. context->name = (PFN_##name)context->vkGetDeviceProcAddr(context->device, #name); \
  133. if (!context->name) { \
  134. return SDL_SetError("vkGetDeviceProcAddr(device, \"" #name "\") failed\n"); \
  135. }
  136. VULKAN_FUNCTIONS()
  137. #undef VULKAN_GLOBAL_FUNCTION
  138. #undef VULKAN_INSTANCE_FUNCTION
  139. #undef VULKAN_DEVICE_FUNCTION
  140. return 0;
  141. }
  142. #undef VULKAN_FUNCTIONS
  143. static const char *getVulkanResultString(VkResult result)
  144. {
  145. switch ((int)result) {
  146. #define RESULT_CASE(x) \
  147. case x: \
  148. return #x
  149. RESULT_CASE(VK_SUCCESS);
  150. RESULT_CASE(VK_NOT_READY);
  151. RESULT_CASE(VK_TIMEOUT);
  152. RESULT_CASE(VK_EVENT_SET);
  153. RESULT_CASE(VK_EVENT_RESET);
  154. RESULT_CASE(VK_INCOMPLETE);
  155. RESULT_CASE(VK_ERROR_OUT_OF_HOST_MEMORY);
  156. RESULT_CASE(VK_ERROR_OUT_OF_DEVICE_MEMORY);
  157. RESULT_CASE(VK_ERROR_INITIALIZATION_FAILED);
  158. RESULT_CASE(VK_ERROR_DEVICE_LOST);
  159. RESULT_CASE(VK_ERROR_MEMORY_MAP_FAILED);
  160. RESULT_CASE(VK_ERROR_LAYER_NOT_PRESENT);
  161. RESULT_CASE(VK_ERROR_EXTENSION_NOT_PRESENT);
  162. RESULT_CASE(VK_ERROR_FEATURE_NOT_PRESENT);
  163. RESULT_CASE(VK_ERROR_INCOMPATIBLE_DRIVER);
  164. RESULT_CASE(VK_ERROR_TOO_MANY_OBJECTS);
  165. RESULT_CASE(VK_ERROR_FORMAT_NOT_SUPPORTED);
  166. RESULT_CASE(VK_ERROR_FRAGMENTED_POOL);
  167. RESULT_CASE(VK_ERROR_SURFACE_LOST_KHR);
  168. RESULT_CASE(VK_ERROR_NATIVE_WINDOW_IN_USE_KHR);
  169. RESULT_CASE(VK_SUBOPTIMAL_KHR);
  170. RESULT_CASE(VK_ERROR_OUT_OF_DATE_KHR);
  171. RESULT_CASE(VK_ERROR_INCOMPATIBLE_DISPLAY_KHR);
  172. RESULT_CASE(VK_ERROR_VALIDATION_FAILED_EXT);
  173. RESULT_CASE(VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
  174. RESULT_CASE(VK_ERROR_INVALID_SHADER_NV);
  175. #undef RESULT_CASE
  176. default:
  177. break;
  178. }
  179. return (result < 0) ? "VK_ERROR_<Unknown>" : "VK_<Unknown>";
  180. }
  181. static int createInstance(VulkanVideoContext *context)
  182. {
  183. static const char *optional_extensions[] = {
  184. VK_EXT_SWAPCHAIN_COLOR_SPACE_EXTENSION_NAME,
  185. VK_KHR_GET_PHYSICAL_DEVICE_PROPERTIES_2_EXTENSION_NAME
  186. };
  187. VkApplicationInfo appInfo = { 0 };
  188. VkInstanceCreateInfo instanceCreateInfo = { 0 };
  189. VkResult result;
  190. char const *const *instanceExtensions = SDL_Vulkan_GetInstanceExtensions(&instanceCreateInfo.enabledExtensionCount);
  191. appInfo.sType = VK_STRUCTURE_TYPE_APPLICATION_INFO;
  192. appInfo.apiVersion = VK_API_VERSION_1_3;
  193. instanceCreateInfo.sType = VK_STRUCTURE_TYPE_INSTANCE_CREATE_INFO;
  194. instanceCreateInfo.pApplicationInfo = &appInfo;
  195. const char **instanceExtensionsCopy = SDL_calloc(instanceCreateInfo.enabledExtensionCount + SDL_arraysize(optional_extensions), sizeof(const char *));
  196. for (uint32_t i = 0; i < instanceCreateInfo.enabledExtensionCount; i++) {
  197. instanceExtensionsCopy[i] = instanceExtensions[i];
  198. }
  199. // Get the rest of the optional extensions
  200. {
  201. uint32_t extensionCount;
  202. if (context->vkEnumerateInstanceExtensionProperties(NULL, &extensionCount, NULL) == VK_SUCCESS && extensionCount > 0) {
  203. VkExtensionProperties *extensionProperties = SDL_calloc(sizeof(VkExtensionProperties), extensionCount);
  204. if (context->vkEnumerateInstanceExtensionProperties(NULL, &extensionCount, extensionProperties) == VK_SUCCESS) {
  205. for (uint32_t i = 0; i < SDL_arraysize(optional_extensions); ++i) {
  206. for (uint32_t j = 0; j < extensionCount; ++j) {
  207. if (SDL_strcmp(extensionProperties[j].extensionName, optional_extensions[i]) == 0) {
  208. instanceExtensionsCopy[instanceCreateInfo.enabledExtensionCount++] = optional_extensions[i];
  209. break;
  210. }
  211. }
  212. }
  213. }
  214. SDL_free(extensionProperties);
  215. }
  216. }
  217. instanceCreateInfo.ppEnabledExtensionNames = instanceExtensionsCopy;
  218. context->instanceExtensions = instanceExtensionsCopy;
  219. context->instanceExtensionsCount = instanceCreateInfo.enabledExtensionCount;
  220. result = context->vkCreateInstance(&instanceCreateInfo, NULL, &context->instance);
  221. if (result != VK_SUCCESS) {
  222. context->instance = VK_NULL_HANDLE;
  223. return SDL_SetError("vkCreateInstance(): %s\n", getVulkanResultString(result));
  224. }
  225. if (loadInstanceFunctions(context) < 0) {
  226. return -1;
  227. }
  228. return 0;
  229. }
  230. static int createSurface(VulkanVideoContext *context, SDL_Window *window)
  231. {
  232. if (!SDL_Vulkan_CreateSurface(window,
  233. context->instance,
  234. NULL,
  235. &context->surface)) {
  236. context->surface = VK_NULL_HANDLE;
  237. return -1;
  238. }
  239. return 0;
  240. }
  241. // Use the same queue scoring algorithm as ffmpeg to make sure we get the same device configuration
  242. static int selectQueueFamily(VkQueueFamilyProperties *queueFamiliesProperties, uint32_t queueFamiliesCount, VkQueueFlagBits flags, int *queueCount)
  243. {
  244. uint32_t queueFamilyIndex;
  245. uint32_t selectedQueueFamilyIndex = queueFamiliesCount;
  246. uint32_t min_score = ~0u;
  247. for (queueFamilyIndex = 0; queueFamilyIndex < queueFamiliesCount; ++queueFamilyIndex) {
  248. VkQueueFlagBits current_flags = queueFamiliesProperties[queueFamilyIndex].queueFlags;
  249. if (current_flags & flags) {
  250. uint32_t score = av_popcount(current_flags) + queueFamiliesProperties[queueFamilyIndex].timestampValidBits;
  251. if (score < min_score) {
  252. selectedQueueFamilyIndex = queueFamilyIndex;
  253. min_score = score;
  254. }
  255. }
  256. }
  257. if (selectedQueueFamilyIndex != queueFamiliesCount) {
  258. VkQueueFamilyProperties *selectedQueueFamily = &queueFamiliesProperties[selectedQueueFamilyIndex];
  259. *queueCount = (int)selectedQueueFamily->queueCount;
  260. ++selectedQueueFamily->timestampValidBits;
  261. return (int)selectedQueueFamilyIndex;
  262. } else {
  263. *queueCount = 0;
  264. return -1;
  265. }
  266. }
  267. static int findPhysicalDevice(VulkanVideoContext *context)
  268. {
  269. uint32_t physicalDeviceCount = 0;
  270. VkPhysicalDevice *physicalDevices;
  271. VkQueueFamilyProperties *queueFamiliesProperties = NULL;
  272. uint32_t queueFamiliesPropertiesAllocatedSize = 0;
  273. VkExtensionProperties *deviceExtensions = NULL;
  274. uint32_t deviceExtensionsAllocatedSize = 0;
  275. uint32_t physicalDeviceIndex;
  276. VkResult result;
  277. result = context->vkEnumeratePhysicalDevices(context->instance, &physicalDeviceCount, NULL);
  278. if (result != VK_SUCCESS) {
  279. return SDL_SetError("vkEnumeratePhysicalDevices(): %s", getVulkanResultString(result));
  280. }
  281. if (physicalDeviceCount == 0) {
  282. return SDL_SetError("vkEnumeratePhysicalDevices(): no physical devices");
  283. }
  284. physicalDevices = (VkPhysicalDevice *)SDL_malloc(sizeof(VkPhysicalDevice) * physicalDeviceCount);
  285. if (!physicalDevices) {
  286. return -1;
  287. }
  288. result = context->vkEnumeratePhysicalDevices(context->instance, &physicalDeviceCount, physicalDevices);
  289. if (result != VK_SUCCESS) {
  290. SDL_free(physicalDevices);
  291. return SDL_SetError("vkEnumeratePhysicalDevices(): %s", getVulkanResultString(result));
  292. }
  293. context->physicalDevice = NULL;
  294. for (physicalDeviceIndex = 0; physicalDeviceIndex < physicalDeviceCount; physicalDeviceIndex++) {
  295. uint32_t queueFamiliesCount = 0;
  296. uint32_t queueFamilyIndex;
  297. uint32_t deviceExtensionCount = 0;
  298. SDL_bool hasSwapchainExtension = SDL_FALSE;
  299. uint32_t i;
  300. VkPhysicalDevice physicalDevice = physicalDevices[physicalDeviceIndex];
  301. context->vkGetPhysicalDeviceQueueFamilyProperties(physicalDevice, &queueFamiliesCount, NULL);
  302. if (queueFamiliesCount == 0) {
  303. continue;
  304. }
  305. if (queueFamiliesPropertiesAllocatedSize < queueFamiliesCount) {
  306. SDL_free(queueFamiliesProperties);
  307. queueFamiliesPropertiesAllocatedSize = queueFamiliesCount;
  308. queueFamiliesProperties = (VkQueueFamilyProperties *)SDL_malloc(sizeof(VkQueueFamilyProperties) * queueFamiliesPropertiesAllocatedSize);
  309. if (!queueFamiliesProperties) {
  310. SDL_free(physicalDevices);
  311. SDL_free(deviceExtensions);
  312. return -1;
  313. }
  314. }
  315. context->vkGetPhysicalDeviceQueueFamilyProperties(physicalDevice, &queueFamiliesCount, queueFamiliesProperties);
  316. // Initialize timestampValidBits for scoring in selectQueueFamily
  317. for (queueFamilyIndex = 0; queueFamilyIndex < queueFamiliesCount; queueFamilyIndex++) {
  318. queueFamiliesProperties[queueFamilyIndex].timestampValidBits = 0;
  319. }
  320. context->presentQueueFamilyIndex = -1;
  321. context->graphicsQueueFamilyIndex = -1;
  322. for (queueFamilyIndex = 0; queueFamilyIndex < queueFamiliesCount; queueFamilyIndex++) {
  323. VkBool32 supported = 0;
  324. if (queueFamiliesProperties[queueFamilyIndex].queueCount == 0) {
  325. continue;
  326. }
  327. if (queueFamiliesProperties[queueFamilyIndex].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
  328. context->graphicsQueueFamilyIndex = queueFamilyIndex;
  329. }
  330. result = context->vkGetPhysicalDeviceSurfaceSupportKHR(physicalDevice, queueFamilyIndex, context->surface, &supported);
  331. if (result == VK_SUCCESS) {
  332. if (supported) {
  333. context->presentQueueFamilyIndex = queueFamilyIndex;
  334. if (queueFamiliesProperties[queueFamilyIndex].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
  335. break; // use this queue because it can present and do graphics
  336. }
  337. }
  338. }
  339. }
  340. if (context->presentQueueFamilyIndex < 0 || context->graphicsQueueFamilyIndex < 0) {
  341. // We can't render and present on this device
  342. continue;
  343. }
  344. context->presentQueueCount = queueFamiliesProperties[context->presentQueueFamilyIndex].queueCount;
  345. ++queueFamiliesProperties[context->presentQueueFamilyIndex].timestampValidBits;
  346. context->graphicsQueueCount = queueFamiliesProperties[context->graphicsQueueFamilyIndex].queueCount;
  347. ++queueFamiliesProperties[context->graphicsQueueFamilyIndex].timestampValidBits;
  348. context->transferQueueFamilyIndex = selectQueueFamily(queueFamiliesProperties, queueFamiliesCount, VK_QUEUE_TRANSFER_BIT, &context->transferQueueCount);
  349. context->computeQueueFamilyIndex = selectQueueFamily(queueFamiliesProperties, queueFamiliesCount, VK_QUEUE_COMPUTE_BIT, &context->computeQueueCount);
  350. context->decodeQueueFamilyIndex = selectQueueFamily(queueFamiliesProperties, queueFamiliesCount, VK_QUEUE_VIDEO_DECODE_BIT_KHR, &context->decodeQueueCount);
  351. if (context->transferQueueFamilyIndex < 0) {
  352. // ffmpeg can fall back to the compute or graphics queues for this
  353. context->transferQueueFamilyIndex = selectQueueFamily(queueFamiliesProperties, queueFamiliesCount, VK_QUEUE_COMPUTE_BIT, &context->transferQueueCount);
  354. if (context->transferQueueFamilyIndex < 0) {
  355. context->transferQueueFamilyIndex = selectQueueFamily(queueFamiliesProperties, queueFamiliesCount, VK_QUEUE_GRAPHICS_BIT, &context->transferQueueCount);
  356. }
  357. }
  358. if (context->transferQueueFamilyIndex < 0 ||
  359. context->computeQueueFamilyIndex < 0) {
  360. // This device doesn't have the queues we need for video decoding
  361. continue;
  362. }
  363. result = context->vkEnumerateDeviceExtensionProperties(physicalDevice, NULL, &deviceExtensionCount, NULL);
  364. if (result != VK_SUCCESS) {
  365. SDL_free(physicalDevices);
  366. SDL_free(queueFamiliesProperties);
  367. SDL_free(deviceExtensions);
  368. return SDL_SetError("vkEnumerateDeviceExtensionProperties(): %s", getVulkanResultString(result));
  369. }
  370. if (deviceExtensionCount == 0) {
  371. continue;
  372. }
  373. if (deviceExtensionsAllocatedSize < deviceExtensionCount) {
  374. SDL_free(deviceExtensions);
  375. deviceExtensionsAllocatedSize = deviceExtensionCount;
  376. deviceExtensions = SDL_malloc(sizeof(VkExtensionProperties) * deviceExtensionsAllocatedSize);
  377. if (!deviceExtensions) {
  378. SDL_free(physicalDevices);
  379. SDL_free(queueFamiliesProperties);
  380. return -1;
  381. }
  382. }
  383. result = context->vkEnumerateDeviceExtensionProperties(physicalDevice, NULL, &deviceExtensionCount, deviceExtensions);
  384. if (result != VK_SUCCESS) {
  385. SDL_free(physicalDevices);
  386. SDL_free(queueFamiliesProperties);
  387. SDL_free(deviceExtensions);
  388. return SDL_SetError("vkEnumerateDeviceExtensionProperties(): %s", getVulkanResultString(result));
  389. }
  390. for (i = 0; i < deviceExtensionCount; i++) {
  391. if (SDL_strcmp(deviceExtensions[i].extensionName, VK_KHR_SWAPCHAIN_EXTENSION_NAME) == 0) {
  392. hasSwapchainExtension = SDL_TRUE;
  393. break;
  394. }
  395. }
  396. if (!hasSwapchainExtension) {
  397. continue;
  398. }
  399. context->physicalDevice = physicalDevice;
  400. break;
  401. }
  402. SDL_free(physicalDevices);
  403. SDL_free(queueFamiliesProperties);
  404. SDL_free(deviceExtensions);
  405. if (!context->physicalDevice) {
  406. return SDL_SetError("Vulkan: no viable physical devices found");
  407. }
  408. return 0;
  409. }
  410. static void initDeviceFeatures(VulkanDeviceFeatures *features)
  411. {
  412. features->device_features.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_FEATURES_2;
  413. features->device_features.pNext = &features->device_features_1_1;
  414. features->device_features_1_1.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VULKAN_1_1_FEATURES;
  415. features->device_features_1_1.pNext = &features->device_features_1_2;
  416. features->device_features_1_2.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VULKAN_1_2_FEATURES;
  417. features->device_features_1_2.pNext = &features->device_features_1_3;
  418. features->device_features_1_3.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VULKAN_1_3_FEATURES;
  419. features->device_features_1_3.pNext = &features->desc_buf_features;
  420. features->desc_buf_features.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_DESCRIPTOR_BUFFER_FEATURES_EXT;
  421. features->desc_buf_features.pNext = &features->atomic_float_features;
  422. features->atomic_float_features.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_SHADER_ATOMIC_FLOAT_FEATURES_EXT;
  423. features->atomic_float_features.pNext = &features->coop_matrix_features;
  424. features->coop_matrix_features.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_COOPERATIVE_MATRIX_FEATURES_KHR;
  425. features->coop_matrix_features.pNext = NULL;
  426. }
  427. static void copyDeviceFeatures(VulkanDeviceFeatures *supported_features, VulkanDeviceFeatures *requested_features)
  428. {
  429. #define COPY_OPTIONAL_FEATURE(X) requested_features->X = supported_features->X
  430. COPY_OPTIONAL_FEATURE(device_features.features.shaderImageGatherExtended);
  431. COPY_OPTIONAL_FEATURE(device_features.features.shaderStorageImageReadWithoutFormat);
  432. COPY_OPTIONAL_FEATURE(device_features.features.shaderStorageImageWriteWithoutFormat);
  433. COPY_OPTIONAL_FEATURE(device_features.features.fragmentStoresAndAtomics);
  434. COPY_OPTIONAL_FEATURE(device_features.features.vertexPipelineStoresAndAtomics);
  435. COPY_OPTIONAL_FEATURE(device_features.features.shaderInt64);
  436. COPY_OPTIONAL_FEATURE(device_features.features.shaderInt16);
  437. COPY_OPTIONAL_FEATURE(device_features.features.shaderFloat64);
  438. COPY_OPTIONAL_FEATURE(device_features_1_1.samplerYcbcrConversion);
  439. COPY_OPTIONAL_FEATURE(device_features_1_1.storagePushConstant16);
  440. COPY_OPTIONAL_FEATURE(device_features_1_2.bufferDeviceAddress);
  441. COPY_OPTIONAL_FEATURE(device_features_1_2.hostQueryReset);
  442. COPY_OPTIONAL_FEATURE(device_features_1_2.storagePushConstant8);
  443. COPY_OPTIONAL_FEATURE(device_features_1_2.shaderInt8);
  444. COPY_OPTIONAL_FEATURE(device_features_1_2.storageBuffer8BitAccess);
  445. COPY_OPTIONAL_FEATURE(device_features_1_2.uniformAndStorageBuffer8BitAccess);
  446. COPY_OPTIONAL_FEATURE(device_features_1_2.shaderFloat16);
  447. COPY_OPTIONAL_FEATURE(device_features_1_2.shaderSharedInt64Atomics);
  448. COPY_OPTIONAL_FEATURE(device_features_1_2.vulkanMemoryModel);
  449. COPY_OPTIONAL_FEATURE(device_features_1_2.vulkanMemoryModelDeviceScope);
  450. COPY_OPTIONAL_FEATURE(device_features_1_2.hostQueryReset);
  451. COPY_OPTIONAL_FEATURE(device_features_1_3.dynamicRendering);
  452. COPY_OPTIONAL_FEATURE(device_features_1_3.maintenance4);
  453. COPY_OPTIONAL_FEATURE(device_features_1_3.synchronization2);
  454. COPY_OPTIONAL_FEATURE(device_features_1_3.computeFullSubgroups);
  455. COPY_OPTIONAL_FEATURE(device_features_1_3.shaderZeroInitializeWorkgroupMemory);
  456. COPY_OPTIONAL_FEATURE(desc_buf_features.descriptorBuffer);
  457. COPY_OPTIONAL_FEATURE(desc_buf_features.descriptorBufferPushDescriptors);
  458. COPY_OPTIONAL_FEATURE(atomic_float_features.shaderBufferFloat32Atomics);
  459. COPY_OPTIONAL_FEATURE(atomic_float_features.shaderBufferFloat32AtomicAdd);
  460. COPY_OPTIONAL_FEATURE(coop_matrix_features.cooperativeMatrix);
  461. #undef COPY_OPTIONAL_FEATURE
  462. // timeline semaphores is required by ffmpeg
  463. requested_features->device_features_1_2.timelineSemaphore = 1;
  464. }
  465. static int addQueueFamily(VkDeviceQueueCreateInfo **pQueueCreateInfos, uint32_t *pQueueCreateInfoCount, uint32_t queueFamilyIndex, uint32_t queueCount)
  466. {
  467. VkDeviceQueueCreateInfo *queueCreateInfo;
  468. VkDeviceQueueCreateInfo *queueCreateInfos = *pQueueCreateInfos;
  469. uint32_t queueCreateInfoCount = *pQueueCreateInfoCount;
  470. float *queuePriorities;
  471. if (queueCount == 0) {
  472. return 0;
  473. }
  474. for (uint32_t i = 0; i < queueCreateInfoCount; ++i) {
  475. if (queueCreateInfos[i].queueFamilyIndex == queueFamilyIndex) {
  476. return 0;
  477. }
  478. }
  479. queueCreateInfos = (VkDeviceQueueCreateInfo *)SDL_realloc(queueCreateInfos, (queueCreateInfoCount + 1) * sizeof(*queueCreateInfos));
  480. if (!queueCreateInfos) {
  481. return -1;
  482. }
  483. queuePriorities = (float *)SDL_malloc(queueCount * sizeof(*queuePriorities));
  484. if (!queuePriorities) {
  485. return -1;
  486. }
  487. for (uint32_t i = 0; i < queueCount; ++i) {
  488. queuePriorities[i] = 1.0f / queueCount;
  489. }
  490. queueCreateInfo = &queueCreateInfos[queueCreateInfoCount++];
  491. SDL_zerop(queueCreateInfo);
  492. queueCreateInfo->sType = VK_STRUCTURE_TYPE_DEVICE_QUEUE_CREATE_INFO;
  493. queueCreateInfo->queueFamilyIndex = queueFamilyIndex;
  494. queueCreateInfo->queueCount = queueCount;
  495. queueCreateInfo->pQueuePriorities = queuePriorities;
  496. *pQueueCreateInfos = queueCreateInfos;
  497. *pQueueCreateInfoCount = queueCreateInfoCount;
  498. return 0;
  499. }
  500. static int createDevice(VulkanVideoContext *context)
  501. {
  502. static const char *const deviceExtensionNames[] = {
  503. VK_KHR_SWAPCHAIN_EXTENSION_NAME,
  504. VK_KHR_SAMPLER_YCBCR_CONVERSION_EXTENSION_NAME,
  505. VK_KHR_MAINTENANCE1_EXTENSION_NAME,
  506. VK_KHR_BIND_MEMORY_2_EXTENSION_NAME,
  507. VK_KHR_GET_MEMORY_REQUIREMENTS_2_EXTENSION_NAME,
  508. };
  509. static const char *optional_extensions[] = {
  510. VK_KHR_VIDEO_QUEUE_EXTENSION_NAME,
  511. VK_KHR_VIDEO_DECODE_QUEUE_EXTENSION_NAME,
  512. VK_KHR_VIDEO_DECODE_H264_EXTENSION_NAME,
  513. VK_KHR_VIDEO_DECODE_H265_EXTENSION_NAME,
  514. "VK_MESA_video_decode_av1"
  515. };
  516. VkDeviceCreateInfo deviceCreateInfo = { 0 };
  517. VkDeviceQueueCreateInfo *queueCreateInfos = NULL;
  518. uint32_t queueCreateInfoCount = 0;
  519. VulkanDeviceFeatures supported_features;
  520. VkResult result = VK_ERROR_UNKNOWN;
  521. if (addQueueFamily(&queueCreateInfos, &queueCreateInfoCount, context->presentQueueFamilyIndex, context->presentQueueCount) < 0 ||
  522. addQueueFamily(&queueCreateInfos, &queueCreateInfoCount, context->graphicsQueueFamilyIndex, context->graphicsQueueCount) < 0 ||
  523. addQueueFamily(&queueCreateInfos, &queueCreateInfoCount, context->transferQueueFamilyIndex, context->transferQueueCount) < 0 ||
  524. addQueueFamily(&queueCreateInfos, &queueCreateInfoCount, context->computeQueueFamilyIndex, context->computeQueueCount) < 0 ||
  525. addQueueFamily(&queueCreateInfos, &queueCreateInfoCount, context->decodeQueueFamilyIndex, context->decodeQueueCount) < 0) {
  526. goto done;
  527. }
  528. initDeviceFeatures(&supported_features);
  529. initDeviceFeatures(&context->features);
  530. context->vkGetPhysicalDeviceFeatures2(context->physicalDevice, &supported_features.device_features);
  531. copyDeviceFeatures(&supported_features, &context->features);
  532. deviceCreateInfo.sType = VK_STRUCTURE_TYPE_DEVICE_CREATE_INFO;
  533. deviceCreateInfo.queueCreateInfoCount = queueCreateInfoCount;
  534. deviceCreateInfo.pQueueCreateInfos = queueCreateInfos;
  535. deviceCreateInfo.pEnabledFeatures = NULL;
  536. deviceCreateInfo.enabledExtensionCount = SDL_arraysize(deviceExtensionNames);
  537. deviceCreateInfo.pNext = &context->features.device_features;
  538. const char **deviceExtensionsCopy = SDL_calloc(deviceCreateInfo.enabledExtensionCount + SDL_arraysize(optional_extensions), sizeof(const char *));
  539. for (uint32_t i = 0; i < deviceCreateInfo.enabledExtensionCount; i++) {
  540. deviceExtensionsCopy[i] = deviceExtensionNames[i];
  541. }
  542. // Get the rest of the optional extensions
  543. {
  544. uint32_t extensionCount;
  545. if (context->vkEnumerateDeviceExtensionProperties(context->physicalDevice, NULL, &extensionCount, NULL) == VK_SUCCESS && extensionCount > 0) {
  546. VkExtensionProperties *extensionProperties = SDL_calloc(sizeof(VkExtensionProperties), extensionCount);
  547. if (context->vkEnumerateDeviceExtensionProperties(context->physicalDevice, NULL, &extensionCount, extensionProperties) == VK_SUCCESS) {
  548. for (uint32_t i = 0; i < SDL_arraysize(optional_extensions); ++i) {
  549. for (uint32_t j = 0; j < extensionCount; ++j) {
  550. if (SDL_strcmp(extensionProperties[j].extensionName, optional_extensions[i]) == 0) {
  551. deviceExtensionsCopy[deviceCreateInfo.enabledExtensionCount++] = optional_extensions[i];
  552. break;
  553. }
  554. }
  555. }
  556. }
  557. SDL_free(extensionProperties);
  558. }
  559. }
  560. deviceCreateInfo.ppEnabledExtensionNames = deviceExtensionsCopy;
  561. context->deviceExtensions = deviceExtensionsCopy;
  562. context->deviceExtensionsCount = deviceCreateInfo.enabledExtensionCount;
  563. result = context->vkCreateDevice(context->physicalDevice, &deviceCreateInfo, NULL, &context->device);
  564. if (result != VK_SUCCESS) {
  565. SDL_SetError("vkCreateDevice(): %s", getVulkanResultString(result));
  566. goto done;
  567. }
  568. if (loadDeviceFunctions(context) < 0) {
  569. result = VK_ERROR_UNKNOWN;
  570. context->device = VK_NULL_HANDLE;
  571. goto done;
  572. }
  573. // Get the graphics queue that SDL will use
  574. context->vkGetDeviceQueue(context->device, context->graphicsQueueFamilyIndex, 0, &context->graphicsQueue);
  575. // Create a command pool
  576. VkCommandPoolCreateInfo commandPoolCreateInfo = { 0 };
  577. commandPoolCreateInfo.sType = VK_STRUCTURE_TYPE_COMMAND_POOL_CREATE_INFO;
  578. commandPoolCreateInfo.flags = VK_COMMAND_POOL_CREATE_RESET_COMMAND_BUFFER_BIT;
  579. commandPoolCreateInfo.queueFamilyIndex = context->graphicsQueueFamilyIndex;
  580. result = context->vkCreateCommandPool(context->device, &commandPoolCreateInfo, NULL, &context->commandPool);
  581. if (result != VK_SUCCESS) {
  582. SDL_SetError("vkCreateCommandPool(): %s", getVulkanResultString(result));
  583. goto done;
  584. }
  585. done:
  586. for (uint32_t i = 0; i < queueCreateInfoCount; ++i) {
  587. SDL_free((void *)queueCreateInfos[i].pQueuePriorities);
  588. }
  589. SDL_free(queueCreateInfos);
  590. if (result != VK_SUCCESS) {
  591. return -1;
  592. }
  593. return 0;
  594. }
  595. VulkanVideoContext *CreateVulkanVideoContext(SDL_Window *window)
  596. {
  597. VulkanVideoContext *context = SDL_calloc(1, sizeof(*context));
  598. if (!context) {
  599. return NULL;
  600. }
  601. if (loadGlobalFunctions(context) < 0 ||
  602. createInstance(context) < 0 ||
  603. createSurface(context, window) < 0 ||
  604. findPhysicalDevice(context) < 0 ||
  605. createDevice(context) < 0) {
  606. DestroyVulkanVideoContext(context);
  607. return NULL;
  608. }
  609. return context;
  610. }
  611. void SetupVulkanRenderProperties(VulkanVideoContext *context, SDL_PropertiesID props)
  612. {
  613. SDL_SetProperty(props, SDL_PROP_RENDERER_CREATE_VULKAN_INSTANCE_POINTER, context->instance);
  614. SDL_SetNumberProperty(props, SDL_PROP_RENDERER_CREATE_VULKAN_SURFACE_NUMBER, (Sint64)context->surface);
  615. SDL_SetProperty(props, SDL_PROP_RENDERER_CREATE_VULKAN_PHYSICAL_DEVICE_POINTER, context->physicalDevice);
  616. SDL_SetProperty(props, SDL_PROP_RENDERER_CREATE_VULKAN_DEVICE_POINTER, context->device);
  617. SDL_SetNumberProperty(props, SDL_PROP_RENDERER_CREATE_VULKAN_PRESENT_QUEUE_FAMILY_INDEX_NUMBER, context->presentQueueFamilyIndex);
  618. SDL_SetNumberProperty(props, SDL_PROP_RENDERER_CREATE_VULKAN_GRAPHICS_QUEUE_FAMILY_INDEX_NUMBER, context->graphicsQueueFamilyIndex);
  619. }
  620. void SetupVulkanDeviceContextData(VulkanVideoContext *context, AVVulkanDeviceContext *ctx)
  621. {
  622. ctx->get_proc_addr = context->vkGetInstanceProcAddr;
  623. ctx->inst = context->instance;
  624. ctx->phys_dev = context->physicalDevice;
  625. ctx->act_dev = context->device;
  626. ctx->device_features = context->features.device_features;
  627. ctx->enabled_inst_extensions = context->instanceExtensions;
  628. ctx->nb_enabled_inst_extensions = context->instanceExtensionsCount;
  629. ctx->enabled_dev_extensions = context->deviceExtensions;
  630. ctx->nb_enabled_dev_extensions = context->deviceExtensionsCount;
  631. ctx->queue_family_index = context->graphicsQueueFamilyIndex;
  632. ctx->nb_graphics_queues = context->graphicsQueueCount;
  633. ctx->queue_family_tx_index = context->transferQueueFamilyIndex;
  634. ctx->nb_tx_queues = context->transferQueueCount;
  635. ctx->queue_family_comp_index = context->computeQueueFamilyIndex;
  636. ctx->nb_comp_queues = context->computeQueueCount;
  637. ctx->queue_family_encode_index = -1;
  638. ctx->nb_encode_queues = 0;
  639. ctx->queue_family_decode_index = context->decodeQueueFamilyIndex;
  640. ctx->nb_decode_queues = context->decodeQueueCount;
  641. }
  642. static int CreateCommandBuffers(VulkanVideoContext *context, SDL_Renderer *renderer)
  643. {
  644. uint32_t commandBufferCount = (uint32_t)SDL_GetNumberProperty(SDL_GetRendererProperties(renderer), SDL_PROP_RENDERER_VULKAN_SWAPCHAIN_IMAGE_COUNT_NUMBER, 1);
  645. if (commandBufferCount > context->waitSemaphoreCount) {
  646. VkSemaphore *semaphores = (VkSemaphore *)SDL_realloc(context->waitSemaphores, commandBufferCount * sizeof(*semaphores));
  647. if (!semaphores) {
  648. return -1;
  649. }
  650. context->waitSemaphores = semaphores;
  651. VkSemaphoreCreateInfo semaphoreCreateInfo = { 0 };
  652. semaphoreCreateInfo.sType = VK_STRUCTURE_TYPE_SEMAPHORE_CREATE_INFO;
  653. while (context->waitSemaphoreCount < commandBufferCount) {
  654. VkResult result = context->vkCreateSemaphore(context->device, &semaphoreCreateInfo, NULL, &context->waitSemaphores[context->waitSemaphoreCount]);
  655. if (result != VK_SUCCESS) {
  656. SDL_SetError("vkCreateSemaphore(): %s", getVulkanResultString(result));
  657. return -1;
  658. }
  659. ++context->waitSemaphoreCount;
  660. }
  661. }
  662. if (commandBufferCount > context->signalSemaphoreCount) {
  663. VkSemaphore *semaphores = (VkSemaphore *)SDL_realloc(context->signalSemaphores, commandBufferCount * sizeof(*semaphores));
  664. if (!semaphores) {
  665. return -1;
  666. }
  667. context->signalSemaphores = semaphores;
  668. VkSemaphoreCreateInfo semaphoreCreateInfo = { 0 };
  669. semaphoreCreateInfo.sType = VK_STRUCTURE_TYPE_SEMAPHORE_CREATE_INFO;
  670. while (context->signalSemaphoreCount < commandBufferCount) {
  671. VkResult result = context->vkCreateSemaphore(context->device, &semaphoreCreateInfo, NULL, &context->signalSemaphores[context->signalSemaphoreCount]);
  672. if (result != VK_SUCCESS) {
  673. SDL_SetError("vkCreateSemaphore(): %s", getVulkanResultString(result));
  674. return -1;
  675. }
  676. ++context->signalSemaphoreCount;
  677. }
  678. }
  679. if (commandBufferCount > context->commandBufferCount) {
  680. uint32_t needed = (commandBufferCount - context->commandBufferCount);
  681. VkCommandBuffer *commandBuffers = (VkCommandBuffer *)SDL_realloc(context->commandBuffers, commandBufferCount * sizeof(*commandBuffers));
  682. if (!commandBuffers) {
  683. return -1;
  684. }
  685. context->commandBuffers = commandBuffers;
  686. VkCommandBufferAllocateInfo commandBufferAllocateInfo = { 0 };
  687. commandBufferAllocateInfo.sType = VK_STRUCTURE_TYPE_COMMAND_BUFFER_ALLOCATE_INFO;
  688. commandBufferAllocateInfo.commandPool = context->commandPool;
  689. commandBufferAllocateInfo.level = VK_COMMAND_BUFFER_LEVEL_PRIMARY;
  690. commandBufferAllocateInfo.commandBufferCount = needed;
  691. VkResult result = context->vkAllocateCommandBuffers(context->device, &commandBufferAllocateInfo, &context->commandBuffers[context->commandBufferCount]);
  692. if (result != VK_SUCCESS) {
  693. SDL_SetError("vkAllocateCommandBuffers(): %s", getVulkanResultString(result));
  694. return -1;
  695. }
  696. context->commandBufferCount = commandBufferCount;
  697. }
  698. return 0;
  699. }
  700. int BeginVulkanFrameRendering(VulkanVideoContext *context, AVFrame *frame, SDL_Renderer *renderer)
  701. {
  702. AVHWFramesContext *frames = (AVHWFramesContext *)(frame->hw_frames_ctx->data);
  703. AVVulkanFramesContext *vk = (AVVulkanFramesContext *)(frames->hwctx);
  704. AVVkFrame *pVkFrame = (AVVkFrame *)frame->data[0];
  705. if (CreateCommandBuffers(context, renderer) < 0) {
  706. return -1;
  707. }
  708. vk->lock_frame(frames, pVkFrame);
  709. VkTimelineSemaphoreSubmitInfo timeline = { 0 };
  710. timeline.sType = VK_STRUCTURE_TYPE_TIMELINE_SEMAPHORE_SUBMIT_INFO;
  711. timeline.waitSemaphoreValueCount = 1;
  712. timeline.pWaitSemaphoreValues = pVkFrame->sem_value;
  713. VkPipelineStageFlags pipelineStageMask = VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
  714. VkSubmitInfo submitInfo = { 0 };
  715. submitInfo.sType = VK_STRUCTURE_TYPE_SUBMIT_INFO;
  716. submitInfo.waitSemaphoreCount = 1;
  717. submitInfo.pWaitSemaphores = pVkFrame->sem;
  718. submitInfo.pWaitDstStageMask = &pipelineStageMask;
  719. submitInfo.signalSemaphoreCount = 1;
  720. submitInfo.pSignalSemaphores = &context->waitSemaphores[context->commandBufferIndex];
  721. submitInfo.pNext = &timeline;
  722. if (pVkFrame->layout[0] != VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL) {
  723. VkCommandBuffer commandBuffer = context->commandBuffers[context->commandBufferIndex];
  724. VkCommandBufferBeginInfo beginInfo = { 0 };
  725. beginInfo.sType = VK_STRUCTURE_TYPE_COMMAND_BUFFER_BEGIN_INFO;
  726. beginInfo.flags = 0;
  727. context->vkBeginCommandBuffer(commandBuffer, &beginInfo);
  728. VkImageMemoryBarrier2 barrier = { 0 };
  729. barrier.sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER_2;
  730. barrier.srcAccessMask = VK_ACCESS_2_NONE;
  731. barrier.dstAccessMask = VK_ACCESS_2_SHADER_SAMPLED_READ_BIT;
  732. barrier.oldLayout = pVkFrame->layout[0];
  733. barrier.newLayout = VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL;
  734. barrier.image = pVkFrame->img[0];
  735. barrier.subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT;
  736. barrier.subresourceRange.levelCount = 1;
  737. barrier.subresourceRange.layerCount = 1;
  738. barrier.srcQueueFamilyIndex = pVkFrame->queue_family[0];
  739. barrier.dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
  740. barrier.srcStageMask = VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
  741. barrier.dstStageMask = VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
  742. VkDependencyInfo dep = { 0 };
  743. dep.sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO;
  744. dep.dependencyFlags = VK_DEPENDENCY_BY_REGION_BIT;
  745. dep.imageMemoryBarrierCount = 1;
  746. dep.pImageMemoryBarriers = &barrier;
  747. context->vkCmdPipelineBarrier2(commandBuffer, &dep);
  748. context->vkEndCommandBuffer(commandBuffer);
  749. // Add the image barrier to the submit info
  750. submitInfo.commandBufferCount = 1;
  751. submitInfo.pCommandBuffers = &context->commandBuffers[context->commandBufferIndex];
  752. pVkFrame->layout[0] = VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL;
  753. pVkFrame->queue_family[0] = VK_QUEUE_FAMILY_IGNORED;
  754. }
  755. VkResult result = context->vkQueueSubmit(context->graphicsQueue, 1, &submitInfo, 0);
  756. if (result != VK_SUCCESS) {
  757. // Don't return an error here, we need to complete the frame operation
  758. SDL_LogError(SDL_LOG_CATEGORY_APPLICATION , "vkQueueSubmit(): %s", getVulkanResultString(result));
  759. }
  760. SDL_AddVulkanRenderSemaphores(renderer, VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT, (Sint64)context->waitSemaphores[context->commandBufferIndex], (Sint64)context->signalSemaphores[context->commandBufferIndex]);
  761. return 0;
  762. }
  763. int FinishVulkanFrameRendering(VulkanVideoContext *context, AVFrame *frame, SDL_Renderer *renderer)
  764. {
  765. AVHWFramesContext *frames = (AVHWFramesContext *)(frame->hw_frames_ctx->data);
  766. AVVulkanFramesContext *vk = (AVVulkanFramesContext *)(frames->hwctx);
  767. AVVkFrame *pVkFrame = (AVVkFrame *)frame->data[0];
  768. // Transition the frame back to ffmpeg
  769. ++pVkFrame->sem_value[0];
  770. VkTimelineSemaphoreSubmitInfo timeline = { 0 };
  771. timeline.sType = VK_STRUCTURE_TYPE_TIMELINE_SEMAPHORE_SUBMIT_INFO;
  772. timeline.signalSemaphoreValueCount = 1;
  773. timeline.pSignalSemaphoreValues = pVkFrame->sem_value;
  774. VkPipelineStageFlags pipelineStageMask = VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
  775. VkSubmitInfo submitInfo = { 0 };
  776. submitInfo.sType = VK_STRUCTURE_TYPE_SUBMIT_INFO;
  777. submitInfo.waitSemaphoreCount = 1;
  778. submitInfo.pWaitSemaphores = &context->signalSemaphores[context->commandBufferIndex];
  779. submitInfo.pWaitDstStageMask = &pipelineStageMask;
  780. submitInfo.signalSemaphoreCount = 1;
  781. submitInfo.pSignalSemaphores = pVkFrame->sem;
  782. submitInfo.pNext = &timeline;
  783. VkResult result = context->vkQueueSubmit(context->graphicsQueue, 1, &submitInfo, 0);
  784. if (result != VK_SUCCESS) {
  785. // Don't return an error here, we need to complete the frame operation
  786. SDL_LogError(SDL_LOG_CATEGORY_APPLICATION, "vkQueueSubmit(): %s", getVulkanResultString(result));
  787. }
  788. vk->unlock_frame(frames, pVkFrame);
  789. context->commandBufferIndex = (context->commandBufferIndex + 1) % context->commandBufferCount;
  790. return 0;
  791. }
  792. SDL_Texture *CreateVulkanVideoTexture(VulkanVideoContext *context, AVFrame *frame, SDL_Renderer *renderer, SDL_PropertiesID props)
  793. {
  794. AVHWFramesContext *frames = (AVHWFramesContext *)(frame->hw_frames_ctx->data);
  795. AVVulkanFramesContext *vk = (AVVulkanFramesContext *)(frames->hwctx);
  796. AVVkFrame *pVkFrame = (AVVkFrame *)frame->data[0];
  797. Uint32 format;
  798. switch (vk->format[0]) {
  799. case VK_FORMAT_G8B8G8R8_422_UNORM:
  800. format = SDL_PIXELFORMAT_YUY2;
  801. break;
  802. case VK_FORMAT_B8G8R8G8_422_UNORM:
  803. format = SDL_PIXELFORMAT_UYVY;
  804. break;
  805. case VK_FORMAT_G8_B8_R8_3PLANE_420_UNORM:
  806. format = SDL_PIXELFORMAT_IYUV;
  807. break;
  808. case VK_FORMAT_G8_B8R8_2PLANE_420_UNORM:
  809. format = SDL_PIXELFORMAT_NV12;
  810. break;
  811. case VK_FORMAT_G10X6_B10X6R10X6_2PLANE_420_UNORM_3PACK16:
  812. format = SDL_PIXELFORMAT_P010;
  813. break;
  814. default:
  815. format = SDL_PIXELFORMAT_UNKNOWN;
  816. break;
  817. }
  818. SDL_SetNumberProperty(props, SDL_PROP_TEXTURE_CREATE_FORMAT_NUMBER, format);
  819. SDL_SetNumberProperty(props, SDL_PROP_TEXTURE_CREATE_VULKAN_TEXTURE_NUMBER, (Sint64)pVkFrame->img[0]);
  820. return SDL_CreateTextureWithProperties(renderer, props);
  821. }
  822. void DestroyVulkanVideoContext(VulkanVideoContext *context)
  823. {
  824. if (context) {
  825. if (context->device) {
  826. context->vkDeviceWaitIdle(context->device);
  827. }
  828. if (context->instanceExtensions) {
  829. SDL_free(context->instanceExtensions);
  830. }
  831. if (context->deviceExtensions) {
  832. SDL_free(context->deviceExtensions);
  833. }
  834. if (context->waitSemaphores) {
  835. for (uint32_t i = 0; i < context->waitSemaphoreCount; ++i) {
  836. context->vkDestroySemaphore(context->device, context->waitSemaphores[i], NULL);
  837. }
  838. SDL_free(context->waitSemaphores);
  839. context->waitSemaphores = NULL;
  840. }
  841. if (context->signalSemaphores) {
  842. for (uint32_t i = 0; i < context->signalSemaphoreCount; ++i) {
  843. context->vkDestroySemaphore(context->device, context->signalSemaphores[i], NULL);
  844. }
  845. SDL_free(context->signalSemaphores);
  846. context->signalSemaphores = NULL;
  847. }
  848. if (context->commandBuffers) {
  849. context->vkFreeCommandBuffers(context->device, context->commandPool, context->commandBufferCount, context->commandBuffers);
  850. SDL_free(context->commandBuffers);
  851. context->commandBuffers = NULL;
  852. }
  853. if (context->commandPool) {
  854. context->vkDestroyCommandPool(context->device, context->commandPool, NULL);
  855. context->commandPool = VK_NULL_HANDLE;
  856. }
  857. if (context->device) {
  858. context->vkDestroyDevice(context->device, NULL);
  859. }
  860. if (context->surface) {
  861. context->vkDestroySurfaceKHR(context->instance, context->surface, NULL);
  862. }
  863. if (context->instance) {
  864. context->vkDestroyInstance(context->instance, NULL);
  865. }
  866. SDL_free(context);
  867. }
  868. }