testffmpeg_vulkan.c 44 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004
  1. /*
  2. Copyright (C) 1997-2024 Sam Lantinga <[email protected]>
  3. This software is provided 'as-is', without any express or implied
  4. warranty. In no event will the authors be held liable for any damages
  5. arising from the use of this software.
  6. Permission is granted to anyone to use this software for any purpose,
  7. including commercial applications, and to alter it and redistribute it
  8. freely.
  9. */
  10. #include <SDL3/SDL.h>
  11. #include <SDL3/SDL_vulkan.h>
  12. #include "testffmpeg_vulkan.h"
  13. #ifdef FFMPEG_VULKAN_SUPPORT
  14. #define VULKAN_FUNCTIONS() \
  15. VULKAN_GLOBAL_FUNCTION(vkCreateInstance) \
  16. VULKAN_GLOBAL_FUNCTION(vkEnumerateInstanceExtensionProperties) \
  17. VULKAN_GLOBAL_FUNCTION(vkEnumerateInstanceLayerProperties) \
  18. VULKAN_INSTANCE_FUNCTION(vkCreateDevice) \
  19. VULKAN_INSTANCE_FUNCTION(vkDestroyInstance) \
  20. VULKAN_INSTANCE_FUNCTION(vkDestroySurfaceKHR) \
  21. VULKAN_INSTANCE_FUNCTION(vkEnumerateDeviceExtensionProperties) \
  22. VULKAN_INSTANCE_FUNCTION(vkEnumeratePhysicalDevices) \
  23. VULKAN_INSTANCE_FUNCTION(vkGetDeviceProcAddr) \
  24. VULKAN_INSTANCE_FUNCTION(vkGetPhysicalDeviceFeatures2) \
  25. VULKAN_INSTANCE_FUNCTION(vkGetPhysicalDeviceQueueFamilyProperties) \
  26. VULKAN_INSTANCE_FUNCTION(vkGetPhysicalDeviceSurfaceSupportKHR) \
  27. VULKAN_INSTANCE_FUNCTION(vkQueueWaitIdle) \
  28. VULKAN_DEVICE_FUNCTION(vkAllocateCommandBuffers) \
  29. VULKAN_DEVICE_FUNCTION(vkBeginCommandBuffer) \
  30. VULKAN_DEVICE_FUNCTION(vkCmdPipelineBarrier2) \
  31. VULKAN_DEVICE_FUNCTION(vkCreateCommandPool) \
  32. VULKAN_DEVICE_FUNCTION(vkCreateSemaphore) \
  33. VULKAN_DEVICE_FUNCTION(vkDestroyCommandPool) \
  34. VULKAN_DEVICE_FUNCTION(vkDestroyDevice) \
  35. VULKAN_DEVICE_FUNCTION(vkDestroySemaphore) \
  36. VULKAN_DEVICE_FUNCTION(vkDeviceWaitIdle) \
  37. VULKAN_DEVICE_FUNCTION(vkEndCommandBuffer) \
  38. VULKAN_DEVICE_FUNCTION(vkFreeCommandBuffers) \
  39. VULKAN_DEVICE_FUNCTION(vkGetDeviceQueue) \
  40. VULKAN_DEVICE_FUNCTION(vkQueueSubmit) \
  41. \
  42. VULKAN_INSTANCE_FUNCTION(vkGetPhysicalDeviceVideoFormatPropertiesKHR) \
  43. typedef struct
  44. {
  45. VkPhysicalDeviceFeatures2 device_features;
  46. VkPhysicalDeviceVulkan11Features device_features_1_1;
  47. VkPhysicalDeviceVulkan12Features device_features_1_2;
  48. VkPhysicalDeviceVulkan13Features device_features_1_3;
  49. VkPhysicalDeviceDescriptorBufferFeaturesEXT desc_buf_features;
  50. VkPhysicalDeviceShaderAtomicFloatFeaturesEXT atomic_float_features;
  51. VkPhysicalDeviceCooperativeMatrixFeaturesKHR coop_matrix_features;
  52. } VulkanDeviceFeatures;
  53. struct VulkanVideoContext
  54. {
  55. VkInstance instance;
  56. VkSurfaceKHR surface;
  57. VkPhysicalDevice physicalDevice;
  58. int presentQueueFamilyIndex;
  59. int presentQueueCount;
  60. int graphicsQueueFamilyIndex;
  61. int graphicsQueueCount;
  62. int transferQueueFamilyIndex;
  63. int transferQueueCount;
  64. int computeQueueFamilyIndex;
  65. int computeQueueCount;
  66. int decodeQueueFamilyIndex;
  67. int decodeQueueCount;
  68. VkDevice device;
  69. VkQueue graphicsQueue;
  70. VkCommandPool commandPool;
  71. VkCommandBuffer *commandBuffers;
  72. uint32_t commandBufferCount;
  73. uint32_t commandBufferIndex;
  74. VkSemaphore *waitSemaphores;
  75. uint32_t waitSemaphoreCount;
  76. VkSemaphore *signalSemaphores;
  77. uint32_t signalSemaphoreCount;
  78. const char **instanceExtensions;
  79. int instanceExtensionsCount;
  80. const char **deviceExtensions;
  81. int deviceExtensionsCount;
  82. VulkanDeviceFeatures features;
  83. PFN_vkGetInstanceProcAddr vkGetInstanceProcAddr;
  84. #define VULKAN_GLOBAL_FUNCTION(name) PFN_##name name;
  85. #define VULKAN_INSTANCE_FUNCTION(name) PFN_##name name;
  86. #define VULKAN_DEVICE_FUNCTION(name) PFN_##name name;
  87. VULKAN_FUNCTIONS()
  88. #undef VULKAN_GLOBAL_FUNCTION
  89. #undef VULKAN_INSTANCE_FUNCTION
  90. #undef VULKAN_DEVICE_FUNCTION
  91. };
  92. static int loadGlobalFunctions(VulkanVideoContext *context)
  93. {
  94. context->vkGetInstanceProcAddr = (PFN_vkGetInstanceProcAddr)SDL_Vulkan_GetVkGetInstanceProcAddr();
  95. if (!context->vkGetInstanceProcAddr) {
  96. return -1;
  97. }
  98. #define VULKAN_GLOBAL_FUNCTION(name) \
  99. context->name = (PFN_##name)context->vkGetInstanceProcAddr(VK_NULL_HANDLE, #name); \
  100. if (!context->name) { \
  101. return SDL_SetError("vkGetInstanceProcAddr(VK_NULL_HANDLE, \"" #name "\") failed"); \
  102. }
  103. #define VULKAN_INSTANCE_FUNCTION(name)
  104. #define VULKAN_DEVICE_FUNCTION(name)
  105. VULKAN_FUNCTIONS()
  106. #undef VULKAN_GLOBAL_FUNCTION
  107. #undef VULKAN_INSTANCE_FUNCTION
  108. #undef VULKAN_DEVICE_FUNCTION
  109. return 0;
  110. }
  111. static int loadInstanceFunctions(VulkanVideoContext *context)
  112. {
  113. #define VULKAN_GLOBAL_FUNCTION(name)
  114. #define VULKAN_INSTANCE_FUNCTION(name) \
  115. context->name = (PFN_##name)context->vkGetInstanceProcAddr(context->instance, #name); \
  116. if (!context->name) { \
  117. return SDL_SetError("vkGetInstanceProcAddr(instance, \"" #name "\") failed"); \
  118. }
  119. #define VULKAN_DEVICE_FUNCTION(name)
  120. VULKAN_FUNCTIONS()
  121. #undef VULKAN_GLOBAL_FUNCTION
  122. #undef VULKAN_INSTANCE_FUNCTION
  123. #undef VULKAN_DEVICE_FUNCTION
  124. return 0;
  125. }
  126. static int loadDeviceFunctions(VulkanVideoContext *context)
  127. {
  128. #define VULKAN_GLOBAL_FUNCTION(name)
  129. #define VULKAN_INSTANCE_FUNCTION(name)
  130. #define VULKAN_DEVICE_FUNCTION(name) \
  131. context->name = (PFN_##name)context->vkGetDeviceProcAddr(context->device, #name); \
  132. if (!context->name) { \
  133. return SDL_SetError("vkGetDeviceProcAddr(device, \"" #name "\") failed\n"); \
  134. }
  135. VULKAN_FUNCTIONS()
  136. #undef VULKAN_GLOBAL_FUNCTION
  137. #undef VULKAN_INSTANCE_FUNCTION
  138. #undef VULKAN_DEVICE_FUNCTION
  139. return 0;
  140. }
  141. #undef VULKAN_FUNCTIONS
  142. static const char *getVulkanResultString(VkResult result)
  143. {
  144. switch ((int)result) {
  145. #define RESULT_CASE(x) \
  146. case x: \
  147. return #x
  148. RESULT_CASE(VK_SUCCESS);
  149. RESULT_CASE(VK_NOT_READY);
  150. RESULT_CASE(VK_TIMEOUT);
  151. RESULT_CASE(VK_EVENT_SET);
  152. RESULT_CASE(VK_EVENT_RESET);
  153. RESULT_CASE(VK_INCOMPLETE);
  154. RESULT_CASE(VK_ERROR_OUT_OF_HOST_MEMORY);
  155. RESULT_CASE(VK_ERROR_OUT_OF_DEVICE_MEMORY);
  156. RESULT_CASE(VK_ERROR_INITIALIZATION_FAILED);
  157. RESULT_CASE(VK_ERROR_DEVICE_LOST);
  158. RESULT_CASE(VK_ERROR_MEMORY_MAP_FAILED);
  159. RESULT_CASE(VK_ERROR_LAYER_NOT_PRESENT);
  160. RESULT_CASE(VK_ERROR_EXTENSION_NOT_PRESENT);
  161. RESULT_CASE(VK_ERROR_FEATURE_NOT_PRESENT);
  162. RESULT_CASE(VK_ERROR_INCOMPATIBLE_DRIVER);
  163. RESULT_CASE(VK_ERROR_TOO_MANY_OBJECTS);
  164. RESULT_CASE(VK_ERROR_FORMAT_NOT_SUPPORTED);
  165. RESULT_CASE(VK_ERROR_FRAGMENTED_POOL);
  166. RESULT_CASE(VK_ERROR_SURFACE_LOST_KHR);
  167. RESULT_CASE(VK_ERROR_NATIVE_WINDOW_IN_USE_KHR);
  168. RESULT_CASE(VK_SUBOPTIMAL_KHR);
  169. RESULT_CASE(VK_ERROR_OUT_OF_DATE_KHR);
  170. RESULT_CASE(VK_ERROR_INCOMPATIBLE_DISPLAY_KHR);
  171. RESULT_CASE(VK_ERROR_VALIDATION_FAILED_EXT);
  172. RESULT_CASE(VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
  173. RESULT_CASE(VK_ERROR_INVALID_SHADER_NV);
  174. #undef RESULT_CASE
  175. default:
  176. break;
  177. }
  178. return (result < 0) ? "VK_ERROR_<Unknown>" : "VK_<Unknown>";
  179. }
  180. static int createInstance(VulkanVideoContext *context)
  181. {
  182. static const char *optional_extensions[] = {
  183. VK_EXT_SWAPCHAIN_COLOR_SPACE_EXTENSION_NAME,
  184. VK_KHR_GET_PHYSICAL_DEVICE_PROPERTIES_2_EXTENSION_NAME
  185. };
  186. VkApplicationInfo appInfo = { 0 };
  187. VkInstanceCreateInfo instanceCreateInfo = { 0 };
  188. VkResult result;
  189. char const *const *instanceExtensions = SDL_Vulkan_GetInstanceExtensions(&instanceCreateInfo.enabledExtensionCount);
  190. appInfo.sType = VK_STRUCTURE_TYPE_APPLICATION_INFO;
  191. appInfo.apiVersion = VK_API_VERSION_1_3;
  192. instanceCreateInfo.sType = VK_STRUCTURE_TYPE_INSTANCE_CREATE_INFO;
  193. instanceCreateInfo.pApplicationInfo = &appInfo;
  194. const char **instanceExtensionsCopy = SDL_calloc(instanceCreateInfo.enabledExtensionCount + SDL_arraysize(optional_extensions), sizeof(const char *));
  195. for (uint32_t i = 0; i < instanceCreateInfo.enabledExtensionCount; i++) {
  196. instanceExtensionsCopy[i] = instanceExtensions[i];
  197. }
  198. // Get the rest of the optional extensions
  199. {
  200. uint32_t extensionCount;
  201. if (context->vkEnumerateInstanceExtensionProperties(NULL, &extensionCount, NULL) == VK_SUCCESS && extensionCount > 0) {
  202. VkExtensionProperties *extensionProperties = SDL_calloc(sizeof(VkExtensionProperties), extensionCount);
  203. if (context->vkEnumerateInstanceExtensionProperties(NULL, &extensionCount, extensionProperties) == VK_SUCCESS) {
  204. for (uint32_t i = 0; i < SDL_arraysize(optional_extensions); ++i) {
  205. for (uint32_t j = 0; j < extensionCount; ++j) {
  206. if (SDL_strcmp(extensionProperties[j].extensionName, optional_extensions[i]) == 0) {
  207. instanceExtensionsCopy[instanceCreateInfo.enabledExtensionCount++] = optional_extensions[i];
  208. break;
  209. }
  210. }
  211. }
  212. }
  213. SDL_free(extensionProperties);
  214. }
  215. }
  216. instanceCreateInfo.ppEnabledExtensionNames = instanceExtensionsCopy;
  217. context->instanceExtensions = instanceExtensionsCopy;
  218. context->instanceExtensionsCount = instanceCreateInfo.enabledExtensionCount;
  219. result = context->vkCreateInstance(&instanceCreateInfo, NULL, &context->instance);
  220. if (result != VK_SUCCESS) {
  221. context->instance = VK_NULL_HANDLE;
  222. return SDL_SetError("vkCreateInstance(): %s\n", getVulkanResultString(result));
  223. }
  224. if (loadInstanceFunctions(context) < 0) {
  225. return -1;
  226. }
  227. return 0;
  228. }
  229. static int createSurface(VulkanVideoContext *context, SDL_Window *window)
  230. {
  231. if (!SDL_Vulkan_CreateSurface(window,
  232. context->instance,
  233. NULL,
  234. &context->surface)) {
  235. context->surface = VK_NULL_HANDLE;
  236. return -1;
  237. }
  238. return 0;
  239. }
  240. // Use the same queue scoring algorithm as ffmpeg to make sure we get the same device configuration
  241. static int selectQueueFamily(VkQueueFamilyProperties *queueFamiliesProperties, uint32_t queueFamiliesCount, VkQueueFlagBits flags, int *queueCount)
  242. {
  243. uint32_t queueFamilyIndex;
  244. uint32_t selectedQueueFamilyIndex = queueFamiliesCount;
  245. uint32_t min_score = ~0u;
  246. for (queueFamilyIndex = 0; queueFamilyIndex < queueFamiliesCount; ++queueFamilyIndex) {
  247. VkQueueFlagBits current_flags = queueFamiliesProperties[queueFamilyIndex].queueFlags;
  248. if (current_flags & flags) {
  249. uint32_t score = av_popcount(current_flags) + queueFamiliesProperties[queueFamilyIndex].timestampValidBits;
  250. if (score < min_score) {
  251. selectedQueueFamilyIndex = queueFamilyIndex;
  252. min_score = score;
  253. }
  254. }
  255. }
  256. if (selectedQueueFamilyIndex != queueFamiliesCount) {
  257. VkQueueFamilyProperties *selectedQueueFamily = &queueFamiliesProperties[selectedQueueFamilyIndex];
  258. *queueCount = (int)selectedQueueFamily->queueCount;
  259. ++selectedQueueFamily->timestampValidBits;
  260. return (int)selectedQueueFamilyIndex;
  261. } else {
  262. *queueCount = 0;
  263. return -1;
  264. }
  265. }
  266. static int findPhysicalDevice(VulkanVideoContext *context)
  267. {
  268. uint32_t physicalDeviceCount = 0;
  269. VkPhysicalDevice *physicalDevices;
  270. VkQueueFamilyProperties *queueFamiliesProperties = NULL;
  271. uint32_t queueFamiliesPropertiesAllocatedSize = 0;
  272. VkExtensionProperties *deviceExtensions = NULL;
  273. uint32_t deviceExtensionsAllocatedSize = 0;
  274. uint32_t physicalDeviceIndex;
  275. VkResult result;
  276. result = context->vkEnumeratePhysicalDevices(context->instance, &physicalDeviceCount, NULL);
  277. if (result != VK_SUCCESS) {
  278. return SDL_SetError("vkEnumeratePhysicalDevices(): %s", getVulkanResultString(result));
  279. }
  280. if (physicalDeviceCount == 0) {
  281. return SDL_SetError("vkEnumeratePhysicalDevices(): no physical devices");
  282. }
  283. physicalDevices = (VkPhysicalDevice *)SDL_malloc(sizeof(VkPhysicalDevice) * physicalDeviceCount);
  284. if (!physicalDevices) {
  285. return -1;
  286. }
  287. result = context->vkEnumeratePhysicalDevices(context->instance, &physicalDeviceCount, physicalDevices);
  288. if (result != VK_SUCCESS) {
  289. SDL_free(physicalDevices);
  290. return SDL_SetError("vkEnumeratePhysicalDevices(): %s", getVulkanResultString(result));
  291. }
  292. context->physicalDevice = NULL;
  293. for (physicalDeviceIndex = 0; physicalDeviceIndex < physicalDeviceCount; physicalDeviceIndex++) {
  294. uint32_t queueFamiliesCount = 0;
  295. uint32_t queueFamilyIndex;
  296. uint32_t deviceExtensionCount = 0;
  297. SDL_bool hasSwapchainExtension = SDL_FALSE;
  298. uint32_t i;
  299. VkPhysicalDevice physicalDevice = physicalDevices[physicalDeviceIndex];
  300. context->vkGetPhysicalDeviceQueueFamilyProperties(physicalDevice, &queueFamiliesCount, NULL);
  301. if (queueFamiliesCount == 0) {
  302. continue;
  303. }
  304. if (queueFamiliesPropertiesAllocatedSize < queueFamiliesCount) {
  305. SDL_free(queueFamiliesProperties);
  306. queueFamiliesPropertiesAllocatedSize = queueFamiliesCount;
  307. queueFamiliesProperties = (VkQueueFamilyProperties *)SDL_malloc(sizeof(VkQueueFamilyProperties) * queueFamiliesPropertiesAllocatedSize);
  308. if (!queueFamiliesProperties) {
  309. SDL_free(physicalDevices);
  310. SDL_free(deviceExtensions);
  311. return -1;
  312. }
  313. }
  314. context->vkGetPhysicalDeviceQueueFamilyProperties(physicalDevice, &queueFamiliesCount, queueFamiliesProperties);
  315. // Initialize timestampValidBits for scoring in selectQueueFamily
  316. for (queueFamilyIndex = 0; queueFamilyIndex < queueFamiliesCount; queueFamilyIndex++) {
  317. queueFamiliesProperties[queueFamilyIndex].timestampValidBits = 0;
  318. }
  319. context->presentQueueFamilyIndex = -1;
  320. context->graphicsQueueFamilyIndex = -1;
  321. for (queueFamilyIndex = 0; queueFamilyIndex < queueFamiliesCount; queueFamilyIndex++) {
  322. VkBool32 supported = 0;
  323. if (queueFamiliesProperties[queueFamilyIndex].queueCount == 0) {
  324. continue;
  325. }
  326. if (queueFamiliesProperties[queueFamilyIndex].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
  327. context->graphicsQueueFamilyIndex = queueFamilyIndex;
  328. }
  329. result = context->vkGetPhysicalDeviceSurfaceSupportKHR(physicalDevice, queueFamilyIndex, context->surface, &supported);
  330. if (result == VK_SUCCESS) {
  331. if (supported) {
  332. context->presentQueueFamilyIndex = queueFamilyIndex;
  333. if (queueFamiliesProperties[queueFamilyIndex].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
  334. break; // use this queue because it can present and do graphics
  335. }
  336. }
  337. }
  338. }
  339. if (context->presentQueueFamilyIndex < 0 || context->graphicsQueueFamilyIndex < 0) {
  340. // We can't render and present on this device
  341. continue;
  342. }
  343. context->presentQueueCount = queueFamiliesProperties[context->presentQueueFamilyIndex].queueCount;
  344. ++queueFamiliesProperties[context->presentQueueFamilyIndex].timestampValidBits;
  345. context->graphicsQueueCount = queueFamiliesProperties[context->graphicsQueueFamilyIndex].queueCount;
  346. ++queueFamiliesProperties[context->graphicsQueueFamilyIndex].timestampValidBits;
  347. context->transferQueueFamilyIndex = selectQueueFamily(queueFamiliesProperties, queueFamiliesCount, VK_QUEUE_TRANSFER_BIT, &context->transferQueueCount);
  348. context->computeQueueFamilyIndex = selectQueueFamily(queueFamiliesProperties, queueFamiliesCount, VK_QUEUE_COMPUTE_BIT, &context->computeQueueCount);
  349. context->decodeQueueFamilyIndex = selectQueueFamily(queueFamiliesProperties, queueFamiliesCount, VK_QUEUE_VIDEO_DECODE_BIT_KHR, &context->decodeQueueCount);
  350. if (context->transferQueueFamilyIndex < 0) {
  351. // ffmpeg can fall back to the compute or graphics queues for this
  352. context->transferQueueFamilyIndex = selectQueueFamily(queueFamiliesProperties, queueFamiliesCount, VK_QUEUE_COMPUTE_BIT, &context->transferQueueCount);
  353. if (context->transferQueueFamilyIndex < 0) {
  354. context->transferQueueFamilyIndex = selectQueueFamily(queueFamiliesProperties, queueFamiliesCount, VK_QUEUE_GRAPHICS_BIT, &context->transferQueueCount);
  355. }
  356. }
  357. if (context->transferQueueFamilyIndex < 0 ||
  358. context->computeQueueFamilyIndex < 0) {
  359. // This device doesn't have the queues we need for video decoding
  360. continue;
  361. }
  362. result = context->vkEnumerateDeviceExtensionProperties(physicalDevice, NULL, &deviceExtensionCount, NULL);
  363. if (result != VK_SUCCESS) {
  364. SDL_free(physicalDevices);
  365. SDL_free(queueFamiliesProperties);
  366. SDL_free(deviceExtensions);
  367. return SDL_SetError("vkEnumerateDeviceExtensionProperties(): %s", getVulkanResultString(result));
  368. }
  369. if (deviceExtensionCount == 0) {
  370. continue;
  371. }
  372. if (deviceExtensionsAllocatedSize < deviceExtensionCount) {
  373. SDL_free(deviceExtensions);
  374. deviceExtensionsAllocatedSize = deviceExtensionCount;
  375. deviceExtensions = SDL_malloc(sizeof(VkExtensionProperties) * deviceExtensionsAllocatedSize);
  376. if (!deviceExtensions) {
  377. SDL_free(physicalDevices);
  378. SDL_free(queueFamiliesProperties);
  379. return -1;
  380. }
  381. }
  382. result = context->vkEnumerateDeviceExtensionProperties(physicalDevice, NULL, &deviceExtensionCount, deviceExtensions);
  383. if (result != VK_SUCCESS) {
  384. SDL_free(physicalDevices);
  385. SDL_free(queueFamiliesProperties);
  386. SDL_free(deviceExtensions);
  387. return SDL_SetError("vkEnumerateDeviceExtensionProperties(): %s", getVulkanResultString(result));
  388. }
  389. for (i = 0; i < deviceExtensionCount; i++) {
  390. if (SDL_strcmp(deviceExtensions[i].extensionName, VK_KHR_SWAPCHAIN_EXTENSION_NAME) == 0) {
  391. hasSwapchainExtension = SDL_TRUE;
  392. break;
  393. }
  394. }
  395. if (!hasSwapchainExtension) {
  396. continue;
  397. }
  398. context->physicalDevice = physicalDevice;
  399. break;
  400. }
  401. SDL_free(physicalDevices);
  402. SDL_free(queueFamiliesProperties);
  403. SDL_free(deviceExtensions);
  404. if (!context->physicalDevice) {
  405. return SDL_SetError("Vulkan: no viable physical devices found");
  406. }
  407. return 0;
  408. }
  409. static void initDeviceFeatures(VulkanDeviceFeatures *features)
  410. {
  411. features->device_features.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_FEATURES_2;
  412. features->device_features.pNext = &features->device_features_1_1;
  413. features->device_features_1_1.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VULKAN_1_1_FEATURES;
  414. features->device_features_1_1.pNext = &features->device_features_1_2;
  415. features->device_features_1_2.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VULKAN_1_2_FEATURES;
  416. features->device_features_1_2.pNext = &features->device_features_1_3;
  417. features->device_features_1_3.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VULKAN_1_3_FEATURES;
  418. features->device_features_1_3.pNext = &features->desc_buf_features;
  419. features->desc_buf_features.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_DESCRIPTOR_BUFFER_FEATURES_EXT;
  420. features->desc_buf_features.pNext = &features->atomic_float_features;
  421. features->atomic_float_features.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_SHADER_ATOMIC_FLOAT_FEATURES_EXT;
  422. features->atomic_float_features.pNext = &features->coop_matrix_features;
  423. features->coop_matrix_features.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_COOPERATIVE_MATRIX_FEATURES_KHR;
  424. features->coop_matrix_features.pNext = NULL;
  425. }
  426. static void copyDeviceFeatures(VulkanDeviceFeatures *supported_features, VulkanDeviceFeatures *requested_features)
  427. {
  428. #define COPY_OPTIONAL_FEATURE(X) requested_features->X = supported_features->X
  429. COPY_OPTIONAL_FEATURE(device_features.features.shaderImageGatherExtended);
  430. COPY_OPTIONAL_FEATURE(device_features.features.shaderStorageImageReadWithoutFormat);
  431. COPY_OPTIONAL_FEATURE(device_features.features.shaderStorageImageWriteWithoutFormat);
  432. COPY_OPTIONAL_FEATURE(device_features.features.fragmentStoresAndAtomics);
  433. COPY_OPTIONAL_FEATURE(device_features.features.vertexPipelineStoresAndAtomics);
  434. COPY_OPTIONAL_FEATURE(device_features.features.shaderInt64);
  435. COPY_OPTIONAL_FEATURE(device_features.features.shaderInt16);
  436. COPY_OPTIONAL_FEATURE(device_features.features.shaderFloat64);
  437. COPY_OPTIONAL_FEATURE(device_features_1_1.samplerYcbcrConversion);
  438. COPY_OPTIONAL_FEATURE(device_features_1_1.storagePushConstant16);
  439. COPY_OPTIONAL_FEATURE(device_features_1_2.bufferDeviceAddress);
  440. COPY_OPTIONAL_FEATURE(device_features_1_2.hostQueryReset);
  441. COPY_OPTIONAL_FEATURE(device_features_1_2.storagePushConstant8);
  442. COPY_OPTIONAL_FEATURE(device_features_1_2.shaderInt8);
  443. COPY_OPTIONAL_FEATURE(device_features_1_2.storageBuffer8BitAccess);
  444. COPY_OPTIONAL_FEATURE(device_features_1_2.uniformAndStorageBuffer8BitAccess);
  445. COPY_OPTIONAL_FEATURE(device_features_1_2.shaderFloat16);
  446. COPY_OPTIONAL_FEATURE(device_features_1_2.shaderSharedInt64Atomics);
  447. COPY_OPTIONAL_FEATURE(device_features_1_2.vulkanMemoryModel);
  448. COPY_OPTIONAL_FEATURE(device_features_1_2.vulkanMemoryModelDeviceScope);
  449. COPY_OPTIONAL_FEATURE(device_features_1_2.hostQueryReset);
  450. COPY_OPTIONAL_FEATURE(device_features_1_3.dynamicRendering);
  451. COPY_OPTIONAL_FEATURE(device_features_1_3.maintenance4);
  452. COPY_OPTIONAL_FEATURE(device_features_1_3.synchronization2);
  453. COPY_OPTIONAL_FEATURE(device_features_1_3.computeFullSubgroups);
  454. COPY_OPTIONAL_FEATURE(device_features_1_3.shaderZeroInitializeWorkgroupMemory);
  455. COPY_OPTIONAL_FEATURE(desc_buf_features.descriptorBuffer);
  456. COPY_OPTIONAL_FEATURE(desc_buf_features.descriptorBufferPushDescriptors);
  457. COPY_OPTIONAL_FEATURE(atomic_float_features.shaderBufferFloat32Atomics);
  458. COPY_OPTIONAL_FEATURE(atomic_float_features.shaderBufferFloat32AtomicAdd);
  459. COPY_OPTIONAL_FEATURE(coop_matrix_features.cooperativeMatrix);
  460. #undef COPY_OPTIONAL_FEATURE
  461. // timeline semaphores is required by ffmpeg
  462. requested_features->device_features_1_2.timelineSemaphore = 1;
  463. }
  464. static int addQueueFamily(VkDeviceQueueCreateInfo **pQueueCreateInfos, uint32_t *pQueueCreateInfoCount, uint32_t queueFamilyIndex, uint32_t queueCount)
  465. {
  466. VkDeviceQueueCreateInfo *queueCreateInfo;
  467. VkDeviceQueueCreateInfo *queueCreateInfos = *pQueueCreateInfos;
  468. uint32_t queueCreateInfoCount = *pQueueCreateInfoCount;
  469. float *queuePriorities;
  470. if (queueCount == 0) {
  471. return 0;
  472. }
  473. for (uint32_t i = 0; i < queueCreateInfoCount; ++i) {
  474. if (queueCreateInfos[i].queueFamilyIndex == queueFamilyIndex) {
  475. return 0;
  476. }
  477. }
  478. queueCreateInfos = (VkDeviceQueueCreateInfo *)SDL_realloc(queueCreateInfos, (queueCreateInfoCount + 1) * sizeof(*queueCreateInfos));
  479. if (!queueCreateInfos) {
  480. return -1;
  481. }
  482. queuePriorities = (float *)SDL_malloc(queueCount * sizeof(*queuePriorities));
  483. if (!queuePriorities) {
  484. return -1;
  485. }
  486. for (uint32_t i = 0; i < queueCount; ++i) {
  487. queuePriorities[i] = 1.0f / queueCount;
  488. }
  489. queueCreateInfo = &queueCreateInfos[queueCreateInfoCount++];
  490. SDL_zerop(queueCreateInfo);
  491. queueCreateInfo->sType = VK_STRUCTURE_TYPE_DEVICE_QUEUE_CREATE_INFO;
  492. queueCreateInfo->queueFamilyIndex = queueFamilyIndex;
  493. queueCreateInfo->queueCount = queueCount;
  494. queueCreateInfo->pQueuePriorities = queuePriorities;
  495. *pQueueCreateInfos = queueCreateInfos;
  496. *pQueueCreateInfoCount = queueCreateInfoCount;
  497. return 0;
  498. }
  499. static int createDevice(VulkanVideoContext *context)
  500. {
  501. static const char *const deviceExtensionNames[] = {
  502. VK_KHR_SWAPCHAIN_EXTENSION_NAME,
  503. VK_KHR_SAMPLER_YCBCR_CONVERSION_EXTENSION_NAME,
  504. VK_KHR_MAINTENANCE1_EXTENSION_NAME,
  505. VK_KHR_BIND_MEMORY_2_EXTENSION_NAME,
  506. VK_KHR_GET_MEMORY_REQUIREMENTS_2_EXTENSION_NAME,
  507. };
  508. static const char *optional_extensions[] = {
  509. VK_KHR_VIDEO_QUEUE_EXTENSION_NAME,
  510. VK_KHR_VIDEO_DECODE_QUEUE_EXTENSION_NAME,
  511. VK_KHR_VIDEO_DECODE_H264_EXTENSION_NAME,
  512. VK_KHR_VIDEO_DECODE_H265_EXTENSION_NAME,
  513. VK_KHR_VIDEO_DECODE_AV1_EXTENSION_NAME
  514. };
  515. VkDeviceCreateInfo deviceCreateInfo = { 0 };
  516. VkDeviceQueueCreateInfo *queueCreateInfos = NULL;
  517. uint32_t queueCreateInfoCount = 0;
  518. VulkanDeviceFeatures supported_features;
  519. VkResult result = VK_ERROR_UNKNOWN;
  520. if (addQueueFamily(&queueCreateInfos, &queueCreateInfoCount, context->presentQueueFamilyIndex, context->presentQueueCount) < 0 ||
  521. addQueueFamily(&queueCreateInfos, &queueCreateInfoCount, context->graphicsQueueFamilyIndex, context->graphicsQueueCount) < 0 ||
  522. addQueueFamily(&queueCreateInfos, &queueCreateInfoCount, context->transferQueueFamilyIndex, context->transferQueueCount) < 0 ||
  523. addQueueFamily(&queueCreateInfos, &queueCreateInfoCount, context->computeQueueFamilyIndex, context->computeQueueCount) < 0 ||
  524. addQueueFamily(&queueCreateInfos, &queueCreateInfoCount, context->decodeQueueFamilyIndex, context->decodeQueueCount) < 0) {
  525. goto done;
  526. }
  527. initDeviceFeatures(&supported_features);
  528. initDeviceFeatures(&context->features);
  529. context->vkGetPhysicalDeviceFeatures2(context->physicalDevice, &supported_features.device_features);
  530. copyDeviceFeatures(&supported_features, &context->features);
  531. deviceCreateInfo.sType = VK_STRUCTURE_TYPE_DEVICE_CREATE_INFO;
  532. deviceCreateInfo.queueCreateInfoCount = queueCreateInfoCount;
  533. deviceCreateInfo.pQueueCreateInfos = queueCreateInfos;
  534. deviceCreateInfo.pEnabledFeatures = NULL;
  535. deviceCreateInfo.enabledExtensionCount = SDL_arraysize(deviceExtensionNames);
  536. deviceCreateInfo.pNext = &context->features.device_features;
  537. const char **deviceExtensionsCopy = SDL_calloc(deviceCreateInfo.enabledExtensionCount + SDL_arraysize(optional_extensions), sizeof(const char *));
  538. for (uint32_t i = 0; i < deviceCreateInfo.enabledExtensionCount; i++) {
  539. deviceExtensionsCopy[i] = deviceExtensionNames[i];
  540. }
  541. // Get the rest of the optional extensions
  542. {
  543. uint32_t extensionCount;
  544. if (context->vkEnumerateDeviceExtensionProperties(context->physicalDevice, NULL, &extensionCount, NULL) == VK_SUCCESS && extensionCount > 0) {
  545. VkExtensionProperties *extensionProperties = SDL_calloc(sizeof(VkExtensionProperties), extensionCount);
  546. if (context->vkEnumerateDeviceExtensionProperties(context->physicalDevice, NULL, &extensionCount, extensionProperties) == VK_SUCCESS) {
  547. for (uint32_t i = 0; i < SDL_arraysize(optional_extensions); ++i) {
  548. for (uint32_t j = 0; j < extensionCount; ++j) {
  549. if (SDL_strcmp(extensionProperties[j].extensionName, optional_extensions[i]) == 0) {
  550. deviceExtensionsCopy[deviceCreateInfo.enabledExtensionCount++] = optional_extensions[i];
  551. break;
  552. }
  553. }
  554. }
  555. }
  556. SDL_free(extensionProperties);
  557. }
  558. }
  559. deviceCreateInfo.ppEnabledExtensionNames = deviceExtensionsCopy;
  560. context->deviceExtensions = deviceExtensionsCopy;
  561. context->deviceExtensionsCount = deviceCreateInfo.enabledExtensionCount;
  562. result = context->vkCreateDevice(context->physicalDevice, &deviceCreateInfo, NULL, &context->device);
  563. if (result != VK_SUCCESS) {
  564. SDL_SetError("vkCreateDevice(): %s", getVulkanResultString(result));
  565. goto done;
  566. }
  567. if (loadDeviceFunctions(context) < 0) {
  568. result = VK_ERROR_UNKNOWN;
  569. context->device = VK_NULL_HANDLE;
  570. goto done;
  571. }
  572. // Get the graphics queue that SDL will use
  573. context->vkGetDeviceQueue(context->device, context->graphicsQueueFamilyIndex, 0, &context->graphicsQueue);
  574. // Create a command pool
  575. VkCommandPoolCreateInfo commandPoolCreateInfo = { 0 };
  576. commandPoolCreateInfo.sType = VK_STRUCTURE_TYPE_COMMAND_POOL_CREATE_INFO;
  577. commandPoolCreateInfo.flags = VK_COMMAND_POOL_CREATE_RESET_COMMAND_BUFFER_BIT;
  578. commandPoolCreateInfo.queueFamilyIndex = context->graphicsQueueFamilyIndex;
  579. result = context->vkCreateCommandPool(context->device, &commandPoolCreateInfo, NULL, &context->commandPool);
  580. if (result != VK_SUCCESS) {
  581. SDL_SetError("vkCreateCommandPool(): %s", getVulkanResultString(result));
  582. goto done;
  583. }
  584. done:
  585. for (uint32_t i = 0; i < queueCreateInfoCount; ++i) {
  586. SDL_free((void *)queueCreateInfos[i].pQueuePriorities);
  587. }
  588. SDL_free(queueCreateInfos);
  589. if (result != VK_SUCCESS) {
  590. return -1;
  591. }
  592. return 0;
  593. }
  594. VulkanVideoContext *CreateVulkanVideoContext(SDL_Window *window)
  595. {
  596. VulkanVideoContext *context = SDL_calloc(1, sizeof(*context));
  597. if (!context) {
  598. return NULL;
  599. }
  600. if (loadGlobalFunctions(context) < 0 ||
  601. createInstance(context) < 0 ||
  602. createSurface(context, window) < 0 ||
  603. findPhysicalDevice(context) < 0 ||
  604. createDevice(context) < 0) {
  605. DestroyVulkanVideoContext(context);
  606. return NULL;
  607. }
  608. return context;
  609. }
  610. void SetupVulkanRenderProperties(VulkanVideoContext *context, SDL_PropertiesID props)
  611. {
  612. SDL_SetProperty(props, SDL_PROP_RENDERER_CREATE_VULKAN_INSTANCE_POINTER, context->instance);
  613. SDL_SetNumberProperty(props, SDL_PROP_RENDERER_CREATE_VULKAN_SURFACE_NUMBER, (Sint64)context->surface);
  614. SDL_SetProperty(props, SDL_PROP_RENDERER_CREATE_VULKAN_PHYSICAL_DEVICE_POINTER, context->physicalDevice);
  615. SDL_SetProperty(props, SDL_PROP_RENDERER_CREATE_VULKAN_DEVICE_POINTER, context->device);
  616. SDL_SetNumberProperty(props, SDL_PROP_RENDERER_CREATE_VULKAN_PRESENT_QUEUE_FAMILY_INDEX_NUMBER, context->presentQueueFamilyIndex);
  617. SDL_SetNumberProperty(props, SDL_PROP_RENDERER_CREATE_VULKAN_GRAPHICS_QUEUE_FAMILY_INDEX_NUMBER, context->graphicsQueueFamilyIndex);
  618. }
  619. void SetupVulkanDeviceContextData(VulkanVideoContext *context, AVVulkanDeviceContext *ctx)
  620. {
  621. ctx->get_proc_addr = context->vkGetInstanceProcAddr;
  622. ctx->inst = context->instance;
  623. ctx->phys_dev = context->physicalDevice;
  624. ctx->act_dev = context->device;
  625. ctx->device_features = context->features.device_features;
  626. ctx->enabled_inst_extensions = context->instanceExtensions;
  627. ctx->nb_enabled_inst_extensions = context->instanceExtensionsCount;
  628. ctx->enabled_dev_extensions = context->deviceExtensions;
  629. ctx->nb_enabled_dev_extensions = context->deviceExtensionsCount;
  630. ctx->queue_family_index = context->graphicsQueueFamilyIndex;
  631. ctx->nb_graphics_queues = context->graphicsQueueCount;
  632. ctx->queue_family_tx_index = context->transferQueueFamilyIndex;
  633. ctx->nb_tx_queues = context->transferQueueCount;
  634. ctx->queue_family_comp_index = context->computeQueueFamilyIndex;
  635. ctx->nb_comp_queues = context->computeQueueCount;
  636. ctx->queue_family_encode_index = -1;
  637. ctx->nb_encode_queues = 0;
  638. ctx->queue_family_decode_index = context->decodeQueueFamilyIndex;
  639. ctx->nb_decode_queues = context->decodeQueueCount;
  640. }
  641. static int CreateCommandBuffers(VulkanVideoContext *context, SDL_Renderer *renderer)
  642. {
  643. uint32_t commandBufferCount = (uint32_t)SDL_GetNumberProperty(SDL_GetRendererProperties(renderer), SDL_PROP_RENDERER_VULKAN_SWAPCHAIN_IMAGE_COUNT_NUMBER, 1);
  644. if (commandBufferCount > context->waitSemaphoreCount) {
  645. VkSemaphore *semaphores = (VkSemaphore *)SDL_realloc(context->waitSemaphores, commandBufferCount * sizeof(*semaphores));
  646. if (!semaphores) {
  647. return -1;
  648. }
  649. context->waitSemaphores = semaphores;
  650. VkSemaphoreCreateInfo semaphoreCreateInfo = { 0 };
  651. semaphoreCreateInfo.sType = VK_STRUCTURE_TYPE_SEMAPHORE_CREATE_INFO;
  652. while (context->waitSemaphoreCount < commandBufferCount) {
  653. VkResult result = context->vkCreateSemaphore(context->device, &semaphoreCreateInfo, NULL, &context->waitSemaphores[context->waitSemaphoreCount]);
  654. if (result != VK_SUCCESS) {
  655. SDL_SetError("vkCreateSemaphore(): %s", getVulkanResultString(result));
  656. return -1;
  657. }
  658. ++context->waitSemaphoreCount;
  659. }
  660. }
  661. if (commandBufferCount > context->signalSemaphoreCount) {
  662. VkSemaphore *semaphores = (VkSemaphore *)SDL_realloc(context->signalSemaphores, commandBufferCount * sizeof(*semaphores));
  663. if (!semaphores) {
  664. return -1;
  665. }
  666. context->signalSemaphores = semaphores;
  667. VkSemaphoreCreateInfo semaphoreCreateInfo = { 0 };
  668. semaphoreCreateInfo.sType = VK_STRUCTURE_TYPE_SEMAPHORE_CREATE_INFO;
  669. while (context->signalSemaphoreCount < commandBufferCount) {
  670. VkResult result = context->vkCreateSemaphore(context->device, &semaphoreCreateInfo, NULL, &context->signalSemaphores[context->signalSemaphoreCount]);
  671. if (result != VK_SUCCESS) {
  672. SDL_SetError("vkCreateSemaphore(): %s", getVulkanResultString(result));
  673. return -1;
  674. }
  675. ++context->signalSemaphoreCount;
  676. }
  677. }
  678. if (commandBufferCount > context->commandBufferCount) {
  679. uint32_t needed = (commandBufferCount - context->commandBufferCount);
  680. VkCommandBuffer *commandBuffers = (VkCommandBuffer *)SDL_realloc(context->commandBuffers, commandBufferCount * sizeof(*commandBuffers));
  681. if (!commandBuffers) {
  682. return -1;
  683. }
  684. context->commandBuffers = commandBuffers;
  685. VkCommandBufferAllocateInfo commandBufferAllocateInfo = { 0 };
  686. commandBufferAllocateInfo.sType = VK_STRUCTURE_TYPE_COMMAND_BUFFER_ALLOCATE_INFO;
  687. commandBufferAllocateInfo.commandPool = context->commandPool;
  688. commandBufferAllocateInfo.level = VK_COMMAND_BUFFER_LEVEL_PRIMARY;
  689. commandBufferAllocateInfo.commandBufferCount = needed;
  690. VkResult result = context->vkAllocateCommandBuffers(context->device, &commandBufferAllocateInfo, &context->commandBuffers[context->commandBufferCount]);
  691. if (result != VK_SUCCESS) {
  692. SDL_SetError("vkAllocateCommandBuffers(): %s", getVulkanResultString(result));
  693. return -1;
  694. }
  695. context->commandBufferCount = commandBufferCount;
  696. }
  697. return 0;
  698. }
  699. int BeginVulkanFrameRendering(VulkanVideoContext *context, AVFrame *frame, SDL_Renderer *renderer)
  700. {
  701. AVHWFramesContext *frames = (AVHWFramesContext *)(frame->hw_frames_ctx->data);
  702. AVVulkanFramesContext *vk = (AVVulkanFramesContext *)(frames->hwctx);
  703. AVVkFrame *pVkFrame = (AVVkFrame *)frame->data[0];
  704. if (CreateCommandBuffers(context, renderer) < 0) {
  705. return -1;
  706. }
  707. vk->lock_frame(frames, pVkFrame);
  708. VkTimelineSemaphoreSubmitInfo timeline = { 0 };
  709. timeline.sType = VK_STRUCTURE_TYPE_TIMELINE_SEMAPHORE_SUBMIT_INFO;
  710. timeline.waitSemaphoreValueCount = 1;
  711. timeline.pWaitSemaphoreValues = pVkFrame->sem_value;
  712. VkPipelineStageFlags pipelineStageMask = VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
  713. VkSubmitInfo submitInfo = { 0 };
  714. submitInfo.sType = VK_STRUCTURE_TYPE_SUBMIT_INFO;
  715. submitInfo.waitSemaphoreCount = 1;
  716. submitInfo.pWaitSemaphores = pVkFrame->sem;
  717. submitInfo.pWaitDstStageMask = &pipelineStageMask;
  718. submitInfo.signalSemaphoreCount = 1;
  719. submitInfo.pSignalSemaphores = &context->waitSemaphores[context->commandBufferIndex];
  720. submitInfo.pNext = &timeline;
  721. if (pVkFrame->layout[0] != VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL) {
  722. VkCommandBuffer commandBuffer = context->commandBuffers[context->commandBufferIndex];
  723. VkCommandBufferBeginInfo beginInfo = { 0 };
  724. beginInfo.sType = VK_STRUCTURE_TYPE_COMMAND_BUFFER_BEGIN_INFO;
  725. beginInfo.flags = 0;
  726. context->vkBeginCommandBuffer(commandBuffer, &beginInfo);
  727. VkImageMemoryBarrier2 barrier = { 0 };
  728. barrier.sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER_2;
  729. barrier.srcAccessMask = VK_ACCESS_2_NONE;
  730. barrier.dstAccessMask = VK_ACCESS_2_SHADER_SAMPLED_READ_BIT;
  731. barrier.oldLayout = pVkFrame->layout[0];
  732. barrier.newLayout = VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL;
  733. barrier.image = pVkFrame->img[0];
  734. barrier.subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT;
  735. barrier.subresourceRange.levelCount = 1;
  736. barrier.subresourceRange.layerCount = 1;
  737. barrier.srcQueueFamilyIndex = pVkFrame->queue_family[0];
  738. barrier.dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
  739. barrier.srcStageMask = VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
  740. barrier.dstStageMask = VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
  741. VkDependencyInfo dep = { 0 };
  742. dep.sType = VK_STRUCTURE_TYPE_DEPENDENCY_INFO;
  743. dep.dependencyFlags = VK_DEPENDENCY_BY_REGION_BIT;
  744. dep.imageMemoryBarrierCount = 1;
  745. dep.pImageMemoryBarriers = &barrier;
  746. context->vkCmdPipelineBarrier2(commandBuffer, &dep);
  747. context->vkEndCommandBuffer(commandBuffer);
  748. // Add the image barrier to the submit info
  749. submitInfo.commandBufferCount = 1;
  750. submitInfo.pCommandBuffers = &context->commandBuffers[context->commandBufferIndex];
  751. pVkFrame->layout[0] = VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL;
  752. pVkFrame->queue_family[0] = VK_QUEUE_FAMILY_IGNORED;
  753. }
  754. VkResult result = context->vkQueueSubmit(context->graphicsQueue, 1, &submitInfo, 0);
  755. if (result != VK_SUCCESS) {
  756. // Don't return an error here, we need to complete the frame operation
  757. SDL_LogError(SDL_LOG_CATEGORY_APPLICATION , "vkQueueSubmit(): %s", getVulkanResultString(result));
  758. }
  759. SDL_AddVulkanRenderSemaphores(renderer, VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT, (Sint64)context->waitSemaphores[context->commandBufferIndex], (Sint64)context->signalSemaphores[context->commandBufferIndex]);
  760. return 0;
  761. }
  762. int FinishVulkanFrameRendering(VulkanVideoContext *context, AVFrame *frame, SDL_Renderer *renderer)
  763. {
  764. AVHWFramesContext *frames = (AVHWFramesContext *)(frame->hw_frames_ctx->data);
  765. AVVulkanFramesContext *vk = (AVVulkanFramesContext *)(frames->hwctx);
  766. AVVkFrame *pVkFrame = (AVVkFrame *)frame->data[0];
  767. // Transition the frame back to ffmpeg
  768. ++pVkFrame->sem_value[0];
  769. VkTimelineSemaphoreSubmitInfo timeline = { 0 };
  770. timeline.sType = VK_STRUCTURE_TYPE_TIMELINE_SEMAPHORE_SUBMIT_INFO;
  771. timeline.signalSemaphoreValueCount = 1;
  772. timeline.pSignalSemaphoreValues = pVkFrame->sem_value;
  773. VkPipelineStageFlags pipelineStageMask = VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT;
  774. VkSubmitInfo submitInfo = { 0 };
  775. submitInfo.sType = VK_STRUCTURE_TYPE_SUBMIT_INFO;
  776. submitInfo.waitSemaphoreCount = 1;
  777. submitInfo.pWaitSemaphores = &context->signalSemaphores[context->commandBufferIndex];
  778. submitInfo.pWaitDstStageMask = &pipelineStageMask;
  779. submitInfo.signalSemaphoreCount = 1;
  780. submitInfo.pSignalSemaphores = pVkFrame->sem;
  781. submitInfo.pNext = &timeline;
  782. VkResult result = context->vkQueueSubmit(context->graphicsQueue, 1, &submitInfo, 0);
  783. if (result != VK_SUCCESS) {
  784. // Don't return an error here, we need to complete the frame operation
  785. SDL_LogError(SDL_LOG_CATEGORY_APPLICATION, "vkQueueSubmit(): %s", getVulkanResultString(result));
  786. }
  787. vk->unlock_frame(frames, pVkFrame);
  788. context->commandBufferIndex = (context->commandBufferIndex + 1) % context->commandBufferCount;
  789. return 0;
  790. }
  791. SDL_Texture *CreateVulkanVideoTexture(VulkanVideoContext *context, AVFrame *frame, SDL_Renderer *renderer, SDL_PropertiesID props)
  792. {
  793. AVHWFramesContext *frames = (AVHWFramesContext *)(frame->hw_frames_ctx->data);
  794. AVVulkanFramesContext *vk = (AVVulkanFramesContext *)(frames->hwctx);
  795. AVVkFrame *pVkFrame = (AVVkFrame *)frame->data[0];
  796. Uint32 format;
  797. switch (vk->format[0]) {
  798. case VK_FORMAT_G8B8G8R8_422_UNORM:
  799. format = SDL_PIXELFORMAT_YUY2;
  800. break;
  801. case VK_FORMAT_B8G8R8G8_422_UNORM:
  802. format = SDL_PIXELFORMAT_UYVY;
  803. break;
  804. case VK_FORMAT_G8_B8_R8_3PLANE_420_UNORM:
  805. format = SDL_PIXELFORMAT_IYUV;
  806. break;
  807. case VK_FORMAT_G8_B8R8_2PLANE_420_UNORM:
  808. format = SDL_PIXELFORMAT_NV12;
  809. break;
  810. case VK_FORMAT_G10X6_B10X6R10X6_2PLANE_420_UNORM_3PACK16:
  811. format = SDL_PIXELFORMAT_P010;
  812. break;
  813. default:
  814. format = SDL_PIXELFORMAT_UNKNOWN;
  815. break;
  816. }
  817. SDL_SetNumberProperty(props, SDL_PROP_TEXTURE_CREATE_FORMAT_NUMBER, format);
  818. SDL_SetNumberProperty(props, SDL_PROP_TEXTURE_CREATE_VULKAN_TEXTURE_NUMBER, (Sint64)pVkFrame->img[0]);
  819. return SDL_CreateTextureWithProperties(renderer, props);
  820. }
  821. void DestroyVulkanVideoContext(VulkanVideoContext *context)
  822. {
  823. if (context) {
  824. if (context->device) {
  825. context->vkDeviceWaitIdle(context->device);
  826. }
  827. if (context->instanceExtensions) {
  828. SDL_free(context->instanceExtensions);
  829. }
  830. if (context->deviceExtensions) {
  831. SDL_free(context->deviceExtensions);
  832. }
  833. if (context->waitSemaphores) {
  834. for (uint32_t i = 0; i < context->waitSemaphoreCount; ++i) {
  835. context->vkDestroySemaphore(context->device, context->waitSemaphores[i], NULL);
  836. }
  837. SDL_free(context->waitSemaphores);
  838. context->waitSemaphores = NULL;
  839. }
  840. if (context->signalSemaphores) {
  841. for (uint32_t i = 0; i < context->signalSemaphoreCount; ++i) {
  842. context->vkDestroySemaphore(context->device, context->signalSemaphores[i], NULL);
  843. }
  844. SDL_free(context->signalSemaphores);
  845. context->signalSemaphores = NULL;
  846. }
  847. if (context->commandBuffers) {
  848. context->vkFreeCommandBuffers(context->device, context->commandPool, context->commandBufferCount, context->commandBuffers);
  849. SDL_free(context->commandBuffers);
  850. context->commandBuffers = NULL;
  851. }
  852. if (context->commandPool) {
  853. context->vkDestroyCommandPool(context->device, context->commandPool, NULL);
  854. context->commandPool = VK_NULL_HANDLE;
  855. }
  856. if (context->device) {
  857. context->vkDestroyDevice(context->device, NULL);
  858. }
  859. if (context->surface) {
  860. context->vkDestroySurfaceKHR(context->instance, context->surface, NULL);
  861. }
  862. if (context->instance) {
  863. context->vkDestroyInstance(context->instance, NULL);
  864. }
  865. SDL_free(context);
  866. }
  867. }
  868. #else
  869. VulkanVideoContext *CreateVulkanVideoContext(SDL_Window *window)
  870. {
  871. SDL_SetError("testffmpeg not built with Vulkan support");
  872. return NULL;
  873. }
  874. void SetupVulkanRenderProperties(VulkanVideoContext *context, SDL_PropertiesID props)
  875. {
  876. }
  877. void SetupVulkanDeviceContextData(VulkanVideoContext *context, AVVulkanDeviceContext *ctx)
  878. {
  879. }
  880. SDL_Texture *CreateVulkanVideoTexture(VulkanVideoContext *context, AVFrame *frame, SDL_Renderer *renderer, SDL_PropertiesID props)
  881. {
  882. return NULL;
  883. }
  884. int BeginVulkanFrameRendering(VulkanVideoContext *context, AVFrame *frame, SDL_Renderer *renderer)
  885. {
  886. return -1;
  887. }
  888. int FinishVulkanFrameRendering(VulkanVideoContext *context, AVFrame *frame, SDL_Renderer *renderer)
  889. {
  890. return -1;
  891. }
  892. void DestroyVulkanVideoContext(VulkanVideoContext *context)
  893. {
  894. }
  895. #endif // FFMPEG_VULKAN_SUPPORT