vulkan-capture.c 45 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654
  1. #include <windows.h>
  2. #include "graphics-hook.h"
  3. #define VK_USE_PLATFORM_WIN32_KHR
  4. #include <malloc.h>
  5. #include <vulkan/vulkan.h>
  6. #include <vulkan/vk_layer.h>
  7. #undef VK_LAYER_EXPORT
  8. #if defined(WIN32)
  9. #define VK_LAYER_EXPORT __declspec(dllexport)
  10. #else
  11. #define VK_LAYER_EXPORT
  12. #endif
  13. #include <vulkan/vulkan_win32.h>
  14. #define COBJMACROS
  15. #include <dxgi.h>
  16. #include <d3d11.h>
  17. #include "vulkan-capture.h"
  18. /* ======================================================================== */
  19. /* defs/statics */
  20. /* shorten stuff because dear GOD is vulkan unclean. */
  /* Local shorthands for the verbose Vulkan calling-convention, function
   * pointer and export macros. */
  #define VKAPI VKAPI_CALL
  #define VkFunc PFN_vkVoidFunction
  #define EXPORT VK_LAYER_EXPORT
  /* use the loader's dispatch table pointer as a key for internal data maps.
   * The argument is parenthesized so that expression arguments such as
   * GET_LDT(base + offset) are cast as a whole before being dereferenced.
   * The expansion is an lvalue, so it can also be assigned to. */
  #define GET_LDT(x) (*(void **)(x))
  static bool vulkan_seen = false;
  27. /* ======================================================================== */
  28. /* hook data */
  /* Intrusive singly-linked list node. Structures that live in a vk_obj_list
   * embed this as their first member so a node pointer can be cast back to
   * the containing structure. */
  struct vk_obj_node {
      uint64_t obj;             /* lookup key for this entry */
      struct vk_obj_node *next; /* next entry, or NULL at the tail */
  };
  33. struct vk_obj_list {
  34. struct vk_obj_node *root;
  35. SRWLOCK mutex;
  36. };
  37. struct vk_swap_data {
  38. struct vk_obj_node node;
  39. VkSwapchainKHR sc;
  40. VkExtent2D image_extent;
  41. VkFormat format;
  42. HWND hwnd;
  43. VkImage export_image;
  44. bool layout_initialized;
  45. VkDeviceMemory export_mem;
  46. VkImage *swap_images;
  47. uint32_t image_count;
  48. HANDLE handle;
  49. struct shtex_data *shtex_info;
  50. ID3D11Texture2D *d3d11_tex;
  51. bool captured;
  52. };
  53. struct vk_queue_data {
  54. VkQueue queue;
  55. uint32_t fam_idx;
  56. };
  57. struct vk_frame_data {
  58. VkCommandPool cmd_pool;
  59. VkCommandBuffer cmd_buffer;
  60. VkFence fence;
  61. bool cmd_buffer_busy;
  62. };
  /* Ring of vk_frame_data entries belonging to one queue family. */
  struct vk_family_data {
      struct vk_frame_data *frames; /* array of frame_count entries */
      uint32_t frame_index;         /* next entry to use; wraps at frame_count */
      uint32_t frame_count;
  };
  68. struct vk_surf_data {
  69. struct vk_obj_node node;
  70. HWND hwnd;
  71. };
  72. struct vk_inst_data {
  73. struct vk_obj_node node;
  74. bool valid;
  75. struct vk_inst_funcs funcs;
  76. struct vk_obj_list surfaces;
  77. };
  78. struct vk_data {
  79. struct vk_obj_node node;
  80. bool valid;
  81. struct vk_device_funcs funcs;
  82. VkPhysicalDevice phy_device;
  83. VkDevice device;
  84. struct vk_obj_list swaps;
  85. struct vk_swap_data *cur_swap;
  86. struct vk_queue_data *queues;
  87. uint32_t queue_count;
  88. struct vk_family_data *families;
  89. uint32_t family_capacity;
  90. VkExternalMemoryProperties external_mem_props;
  91. struct vk_inst_data *inst_data;
  92. VkAllocationCallbacks ac_storage;
  93. const VkAllocationCallbacks *ac;
  94. ID3D11Device *d3d11_device;
  95. ID3D11DeviceContext *d3d11_context;
  96. };
  97. /* ------------------------------------------------------------------------- */
  98. static void *vk_alloc(const VkAllocationCallbacks *ac, size_t size,
  99. size_t alignment, enum VkSystemAllocationScope scope)
  100. {
  101. return ac ? ac->pfnAllocation(ac->pUserData, size, alignment, scope)
  102. : _aligned_malloc(size, alignment);
  103. }
  104. static void vk_free(const VkAllocationCallbacks *ac, void *memory)
  105. {
  106. if (ac)
  107. ac->pfnFree(ac->pUserData, memory);
  108. else
  109. _aligned_free(memory);
  110. }
  111. static void add_obj_data(struct vk_obj_list *list, uint64_t obj, void *data)
  112. {
  113. AcquireSRWLockExclusive(&list->mutex);
  114. struct vk_obj_node *const node = data;
  115. node->obj = obj;
  116. node->next = list->root;
  117. list->root = node;
  118. ReleaseSRWLockExclusive(&list->mutex);
  119. }
  120. static struct vk_obj_node *get_obj_data(struct vk_obj_list *list, uint64_t obj)
  121. {
  122. struct vk_obj_node *data = NULL;
  123. AcquireSRWLockExclusive(&list->mutex);
  124. struct vk_obj_node *node = list->root;
  125. while (node) {
  126. if (node->obj == obj) {
  127. data = node;
  128. break;
  129. }
  130. node = node->next;
  131. }
  132. ReleaseSRWLockExclusive(&list->mutex);
  133. return data;
  134. }
  135. static struct vk_obj_node *remove_obj_data(struct vk_obj_list *list,
  136. uint64_t obj)
  137. {
  138. struct vk_obj_node *data = NULL;
  139. AcquireSRWLockExclusive(&list->mutex);
  140. struct vk_obj_node *prev = NULL;
  141. struct vk_obj_node *node = list->root;
  142. while (node) {
  143. if (node->obj == obj) {
  144. data = node;
  145. if (prev)
  146. prev->next = node->next;
  147. else
  148. list->root = node->next;
  149. break;
  150. }
  151. prev = node;
  152. node = node->next;
  153. }
  154. ReleaseSRWLockExclusive(&list->mutex);
  155. return data;
  156. }
  157. static void init_obj_list(struct vk_obj_list *list)
  158. {
  159. list->root = NULL;
  160. InitializeSRWLock(&list->mutex);
  161. }
  162. /* ------------------------------------------------------------------------- */
  163. static struct vk_obj_list devices;
  164. static struct vk_data *add_device_data(VkDevice device,
  165. const VkAllocationCallbacks *ac)
  166. {
  167. struct vk_data *data = vk_alloc(ac, sizeof(struct vk_data),
  168. _Alignof(struct vk_data),
  169. VK_SYSTEM_ALLOCATION_SCOPE_DEVICE);
  170. add_obj_data(&devices, (uint64_t)GET_LDT(device), data);
  171. return data;
  172. }
  173. static struct vk_data *get_device_data(void *obj)
  174. {
  175. return (struct vk_data *)get_obj_data(&devices, (uint64_t)GET_LDT(obj));
  176. }
  177. /* ------------------------------------------------------------------------- */
  178. static struct vk_swap_data *add_swap_data(struct vk_data *data,
  179. VkSwapchainKHR sc)
  180. {
  181. struct vk_swap_data *swap = vk_alloc(data->ac,
  182. sizeof(struct vk_swap_data),
  183. _Alignof(struct vk_swap_data),
  184. VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
  185. add_obj_data(&data->swaps, (uint64_t)sc, swap);
  186. return swap;
  187. }
  188. static struct vk_swap_data *get_swap_data(struct vk_data *data,
  189. VkSwapchainKHR sc)
  190. {
  191. return (struct vk_swap_data *)get_obj_data(&data->swaps, (uint64_t)sc);
  192. }
  193. /* ------------------------------------------------------------------------- */
  194. static void vk_shtex_clear_fence(const struct vk_data *data,
  195. struct vk_frame_data *frame_data)
  196. {
  197. const VkFence fence = frame_data->fence;
  198. if (frame_data->cmd_buffer_busy) {
  199. VkDevice device = data->device;
  200. const struct vk_device_funcs *funcs = &data->funcs;
  201. funcs->WaitForFences(device, 1, &fence, VK_TRUE, ~0ull);
  202. funcs->ResetFences(device, 1, &fence);
  203. frame_data->cmd_buffer_busy = false;
  204. }
  205. }
  206. static void vk_shtex_wait_until_pool_idle(struct vk_data *data,
  207. struct vk_family_data *family_data)
  208. {
  209. for (uint32_t frame_idx = 0; frame_idx < family_data->frame_count;
  210. frame_idx++) {
  211. struct vk_frame_data *frame_data =
  212. &family_data->frames[frame_idx];
  213. if (frame_data->cmd_pool != VK_NULL_HANDLE)
  214. vk_shtex_clear_fence(data, frame_data);
  215. }
  216. }
  217. static void vk_shtex_wait_until_idle(struct vk_data *data)
  218. {
  219. for (uint32_t fam_idx = 0; fam_idx < data->family_capacity; fam_idx++) {
  220. struct vk_family_data *family_data = &data->families[fam_idx];
  221. vk_shtex_wait_until_pool_idle(data, family_data);
  222. }
  223. }
  224. static void vk_shtex_free(struct vk_data *data)
  225. {
  226. capture_free();
  227. vk_shtex_wait_until_idle(data);
  228. struct vk_swap_data *swap = (struct vk_swap_data *)data->swaps.root;
  229. while (swap) {
  230. if (swap->export_image)
  231. data->funcs.DestroyImage(data->device,
  232. swap->export_image, data->ac);
  233. if (swap->export_mem)
  234. data->funcs.FreeMemory(data->device, swap->export_mem,
  235. NULL);
  236. if (swap->d3d11_tex) {
  237. ID3D11Texture2D_Release(swap->d3d11_tex);
  238. }
  239. swap->handle = INVALID_HANDLE_VALUE;
  240. swap->d3d11_tex = NULL;
  241. swap->export_mem = VK_NULL_HANDLE;
  242. swap->export_image = VK_NULL_HANDLE;
  243. swap->captured = false;
  244. swap = (struct vk_swap_data *)swap->node.next;
  245. }
  246. if (data->d3d11_context) {
  247. ID3D11DeviceContext_Release(data->d3d11_context);
  248. data->d3d11_context = NULL;
  249. }
  250. if (data->d3d11_device) {
  251. ID3D11Device_Release(data->d3d11_device);
  252. data->d3d11_device = NULL;
  253. }
  254. data->cur_swap = NULL;
  255. hlog("------------------ vulkan capture freed ------------------");
  256. }
  257. /* ------------------------------------------------------------------------- */
  258. static void insert_surf_data(struct vk_inst_data *data, VkSurfaceKHR surf,
  259. HWND hwnd, const VkAllocationCallbacks *ac)
  260. {
  261. struct vk_surf_data *surf_data = vk_alloc(
  262. ac, sizeof(struct vk_surf_data), _Alignof(struct vk_surf_data),
  263. VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
  264. if (surf_data) {
  265. surf_data->hwnd = hwnd;
  266. add_obj_data(&data->surfaces, (uint64_t)surf, surf_data);
  267. }
  268. }
  269. static HWND find_surf_hwnd(struct vk_inst_data *data, VkSurfaceKHR surf)
  270. {
  271. struct vk_surf_data *surf_data = (struct vk_surf_data *)get_obj_data(
  272. &data->surfaces, (uint64_t)surf);
  273. return surf_data->hwnd;
  274. }
  275. /* ------------------------------------------------------------------------- */
  276. static struct vk_obj_list instances;
  277. static struct vk_inst_data *add_inst_data(void *inst,
  278. const VkAllocationCallbacks *ac)
  279. {
  280. struct vk_inst_data *data = vk_alloc(
  281. ac, sizeof(struct vk_inst_data), _Alignof(struct vk_inst_data),
  282. VK_SYSTEM_ALLOCATION_SCOPE_INSTANCE);
  283. add_obj_data(&instances, (uint64_t)GET_LDT(inst), data);
  284. return data;
  285. }
  286. static struct vk_inst_data *get_inst_data(void *inst)
  287. {
  288. return (struct vk_inst_data *)get_obj_data(&instances,
  289. (uint64_t)GET_LDT(inst));
  290. }
  291. static inline struct vk_inst_funcs *get_inst_funcs(void *inst)
  292. {
  293. struct vk_inst_data *data = (struct vk_inst_data *)get_inst_data(inst);
  294. return &data->funcs;
  295. }
  296. /* ======================================================================== */
  297. /* capture */
  298. static inline bool vk_shtex_init_d3d11(struct vk_data *data)
  299. {
  300. D3D_FEATURE_LEVEL level_used;
  301. IDXGIFactory1 *factory;
  302. IDXGIAdapter1 *adapter;
  303. HRESULT hr;
  304. HMODULE d3d11 = load_system_library("d3d11.dll");
  305. if (!d3d11) {
  306. flog("failed to load d3d11: %d", GetLastError());
  307. return false;
  308. }
  309. HMODULE dxgi = load_system_library("dxgi.dll");
  310. if (!dxgi) {
  311. flog("failed to load dxgi: %d", GetLastError());
  312. return false;
  313. }
  314. HRESULT(WINAPI * create_factory)
  315. (REFIID, void **) = (void *)GetProcAddress(dxgi, "CreateDXGIFactory1");
  316. if (!create_factory) {
  317. flog("failed to get CreateDXGIFactory1 address: %d",
  318. GetLastError());
  319. return false;
  320. }
  321. PFN_D3D11_CREATE_DEVICE create =
  322. (void *)GetProcAddress(d3d11, "D3D11CreateDevice");
  323. if (!create) {
  324. flog("failed to get D3D11CreateDevice address: %d",
  325. GetLastError());
  326. return false;
  327. }
  328. hr = create_factory(&IID_IDXGIFactory1, &factory);
  329. if (FAILED(hr)) {
  330. flog_hr("failed to create factory", hr);
  331. return false;
  332. }
  333. hr = IDXGIFactory1_EnumAdapters1(factory, 0, &adapter);
  334. IDXGIFactory1_Release(factory);
  335. if (FAILED(hr)) {
  336. flog_hr("failed to create adapter", hr);
  337. return false;
  338. }
  339. static const D3D_FEATURE_LEVEL feature_levels[] = {
  340. D3D_FEATURE_LEVEL_11_0,
  341. D3D_FEATURE_LEVEL_10_1,
  342. D3D_FEATURE_LEVEL_10_0,
  343. D3D_FEATURE_LEVEL_9_3,
  344. };
  345. hr = create((IDXGIAdapter *)adapter, D3D_DRIVER_TYPE_UNKNOWN, NULL, 0,
  346. feature_levels,
  347. sizeof(feature_levels) / sizeof(D3D_FEATURE_LEVEL),
  348. D3D11_SDK_VERSION, &data->d3d11_device, &level_used,
  349. &data->d3d11_context);
  350. IDXGIAdapter1_Release(adapter);
  351. if (FAILED(hr)) {
  352. flog_hr("failed to create device", hr);
  353. return false;
  354. }
  355. return true;
  356. }
  357. static inline bool vk_shtex_init_d3d11_tex(struct vk_data *data,
  358. struct vk_swap_data *swap)
  359. {
  360. IDXGIResource *dxgi_res;
  361. HRESULT hr;
  362. const UINT width = swap->image_extent.width;
  363. const UINT height = swap->image_extent.height;
  364. flog("OBS requesting %s texture format. capture dimensions: %ux%u",
  365. vk_format_to_str(swap->format), width, height);
  366. const DXGI_FORMAT format = vk_format_to_dxgi(swap->format);
  367. if (format == DXGI_FORMAT_UNKNOWN) {
  368. flog("cannot convert to DXGI format");
  369. return false;
  370. }
  371. D3D11_TEXTURE2D_DESC desc = {0};
  372. desc.Width = width;
  373. desc.Height = height;
  374. desc.MipLevels = 1;
  375. desc.ArraySize = 1;
  376. desc.Format = format;
  377. desc.SampleDesc.Count = 1;
  378. desc.SampleDesc.Quality = 0;
  379. desc.Usage = D3D11_USAGE_DEFAULT;
  380. desc.MiscFlags = D3D11_RESOURCE_MISC_SHARED;
  381. desc.BindFlags = D3D11_BIND_RENDER_TARGET | D3D11_BIND_SHADER_RESOURCE;
  382. hr = ID3D11Device_CreateTexture2D(data->d3d11_device, &desc, NULL,
  383. &swap->d3d11_tex);
  384. if (FAILED(hr)) {
  385. flog_hr("failed to create texture", hr);
  386. return false;
  387. }
  388. hr = ID3D11Texture2D_QueryInterface(swap->d3d11_tex, &IID_IDXGIResource,
  389. &dxgi_res);
  390. if (FAILED(hr)) {
  391. flog_hr("failed to get IDXGIResource", hr);
  392. return false;
  393. }
  394. hr = IDXGIResource_GetSharedHandle(dxgi_res, &swap->handle);
  395. IDXGIResource_Release(dxgi_res);
  396. if (FAILED(hr)) {
  397. flog_hr("failed to get shared handle", hr);
  398. return false;
  399. }
  400. return true;
  401. }
  402. static inline bool vk_shtex_init_vulkan_tex(struct vk_data *data,
  403. struct vk_swap_data *swap)
  404. {
  405. struct vk_device_funcs *funcs = &data->funcs;
  406. VkExternalMemoryFeatureFlags f =
  407. data->external_mem_props.externalMemoryFeatures;
  408. /* -------------------------------------------------------- */
  409. /* create texture */
  410. VkExternalMemoryImageCreateInfo emici;
  411. emici.sType = VK_STRUCTURE_TYPE_EXTERNAL_MEMORY_IMAGE_CREATE_INFO;
  412. emici.pNext = NULL;
  413. emici.handleTypes =
  414. VK_EXTERNAL_MEMORY_HANDLE_TYPE_D3D11_TEXTURE_KMT_BIT;
  415. VkImageCreateInfo ici;
  416. ici.sType = VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO;
  417. ici.pNext = &emici;
  418. ici.flags = 0;
  419. ici.imageType = VK_IMAGE_TYPE_2D;
  420. ici.format = swap->format;
  421. ici.extent.width = swap->image_extent.width;
  422. ici.extent.height = swap->image_extent.height;
  423. ici.extent.depth = 1;
  424. ici.mipLevels = 1;
  425. ici.arrayLayers = 1;
  426. ici.samples = VK_SAMPLE_COUNT_1_BIT;
  427. ici.tiling = VK_IMAGE_TILING_OPTIMAL;
  428. ici.usage = VK_IMAGE_USAGE_TRANSFER_DST_BIT |
  429. VK_IMAGE_USAGE_SAMPLED_BIT;
  430. ici.sharingMode = VK_SHARING_MODE_EXCLUSIVE;
  431. ici.queueFamilyIndexCount = 0;
  432. ici.pQueueFamilyIndices = 0;
  433. ici.initialLayout = VK_IMAGE_LAYOUT_UNDEFINED;
  434. VkResult res;
  435. res = funcs->CreateImage(data->device, &ici, data->ac,
  436. &swap->export_image);
  437. if (VK_SUCCESS != res) {
  438. flog("failed to CreateImage: %s", result_to_str(res));
  439. swap->export_image = VK_NULL_HANDLE;
  440. return false;
  441. }
  442. swap->layout_initialized = false;
  443. /* -------------------------------------------------------- */
  444. /* get image memory requirements */
  445. VkMemoryRequirements mr;
  446. bool use_gimr2 = f & VK_EXTERNAL_MEMORY_FEATURE_DEDICATED_ONLY_BIT;
  447. if (use_gimr2) {
  448. VkMemoryDedicatedRequirements mdr = {0};
  449. mdr.sType = VK_STRUCTURE_TYPE_MEMORY_DEDICATED_REQUIREMENTS;
  450. mdr.pNext = NULL;
  451. VkMemoryRequirements2 mr2 = {0};
  452. mr2.sType = VK_STRUCTURE_TYPE_MEMORY_REQUIREMENTS_2;
  453. mr2.pNext = &mdr;
  454. VkImageMemoryRequirementsInfo2 imri2 = {0};
  455. imri2.sType =
  456. VK_STRUCTURE_TYPE_IMAGE_MEMORY_REQUIREMENTS_INFO_2;
  457. imri2.pNext = NULL;
  458. imri2.image = swap->export_image;
  459. funcs->GetImageMemoryRequirements2(data->device, &imri2, &mr2);
  460. mr = mr2.memoryRequirements;
  461. } else {
  462. funcs->GetImageMemoryRequirements(data->device,
  463. swap->export_image, &mr);
  464. }
  465. /* -------------------------------------------------------- */
  466. /* get memory type index */
  467. struct vk_inst_funcs *ifuncs = get_inst_funcs(data->phy_device);
  468. VkPhysicalDeviceMemoryProperties pdmp;
  469. ifuncs->GetPhysicalDeviceMemoryProperties(data->phy_device, &pdmp);
  470. uint32_t mem_type_idx = 0;
  471. for (; mem_type_idx < pdmp.memoryTypeCount; mem_type_idx++) {
  472. if ((mr.memoryTypeBits & (1 << mem_type_idx)) &&
  473. (pdmp.memoryTypes[mem_type_idx].propertyFlags &
  474. VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT) ==
  475. VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT) {
  476. break;
  477. }
  478. }
  479. if (mem_type_idx == pdmp.memoryTypeCount) {
  480. flog("failed to get memory type index");
  481. funcs->DestroyImage(data->device, swap->export_image, data->ac);
  482. swap->export_image = VK_NULL_HANDLE;
  483. return false;
  484. }
  485. /* -------------------------------------------------------- */
  486. /* allocate memory */
  487. VkImportMemoryWin32HandleInfoKHR imw32hi;
  488. imw32hi.sType = VK_STRUCTURE_TYPE_IMPORT_MEMORY_WIN32_HANDLE_INFO_KHR;
  489. imw32hi.pNext = NULL;
  490. imw32hi.name = NULL;
  491. imw32hi.handleType =
  492. VK_EXTERNAL_MEMORY_HANDLE_TYPE_D3D11_TEXTURE_KMT_BIT;
  493. imw32hi.handle = swap->handle;
  494. VkMemoryAllocateInfo mai;
  495. mai.sType = VK_STRUCTURE_TYPE_MEMORY_ALLOCATE_INFO;
  496. mai.pNext = &imw32hi;
  497. mai.allocationSize = mr.size;
  498. mai.memoryTypeIndex = mem_type_idx;
  499. VkMemoryDedicatedAllocateInfo mdai;
  500. mdai.sType = VK_STRUCTURE_TYPE_MEMORY_DEDICATED_ALLOCATE_INFO;
  501. mdai.pNext = NULL;
  502. mdai.buffer = VK_NULL_HANDLE;
  503. if (data->external_mem_props.externalMemoryFeatures &
  504. VK_EXTERNAL_MEMORY_FEATURE_DEDICATED_ONLY_BIT) {
  505. mdai.image = swap->export_image;
  506. imw32hi.pNext = &mdai;
  507. }
  508. res = funcs->AllocateMemory(data->device, &mai, NULL,
  509. &swap->export_mem);
  510. if (VK_SUCCESS != res) {
  511. flog("failed to AllocateMemory: %s", result_to_str(res));
  512. funcs->DestroyImage(data->device, swap->export_image, data->ac);
  513. swap->export_image = VK_NULL_HANDLE;
  514. return false;
  515. }
  516. /* -------------------------------------------------------- */
  517. /* bind image memory */
  518. bool use_bi2 = f & VK_EXTERNAL_MEMORY_FEATURE_DEDICATED_ONLY_BIT;
  519. if (use_bi2) {
  520. VkBindImageMemoryInfo bimi = {0};
  521. bimi.sType = VK_STRUCTURE_TYPE_BIND_IMAGE_MEMORY_INFO;
  522. bimi.image = swap->export_image;
  523. bimi.memory = swap->export_mem;
  524. bimi.memoryOffset = 0;
  525. res = funcs->BindImageMemory2(data->device, 1, &bimi);
  526. } else {
  527. res = funcs->BindImageMemory(data->device, swap->export_image,
  528. swap->export_mem, 0);
  529. }
  530. if (VK_SUCCESS != res) {
  531. flog("%s failed: %s",
  532. use_bi2 ? "BindImageMemory2" : "BindImageMemory",
  533. result_to_str(res));
  534. funcs->DestroyImage(data->device, swap->export_image, data->ac);
  535. swap->export_image = VK_NULL_HANDLE;
  536. return false;
  537. }
  538. return true;
  539. }
  540. static bool vk_shtex_init(struct vk_data *data, HWND window,
  541. struct vk_swap_data *swap)
  542. {
  543. if (!vk_shtex_init_d3d11(data)) {
  544. return false;
  545. }
  546. if (!vk_shtex_init_d3d11_tex(data, swap)) {
  547. return false;
  548. }
  549. if (!vk_shtex_init_vulkan_tex(data, swap)) {
  550. return false;
  551. }
  552. data->cur_swap = swap;
  553. swap->captured = capture_init_shtex(&swap->shtex_info, window,
  554. swap->image_extent.width,
  555. swap->image_extent.height,
  556. (uint32_t)swap->format, false,
  557. (uintptr_t)swap->handle);
  558. if (!swap->captured)
  559. return false;
  560. if (global_hook_info->force_shmem) {
  561. flog("shared memory capture currently "
  562. "unsupported; ignoring");
  563. }
  564. hlog("vulkan shared texture capture successful");
  565. return true;
  566. }
  567. static void vk_shtex_create_family_objects(struct vk_data *data,
  568. uint32_t fam_idx,
  569. uint32_t image_count)
  570. {
  571. struct vk_family_data *family_data = &data->families[fam_idx];
  572. family_data->frames =
  573. vk_alloc(data->ac, image_count * sizeof(struct vk_frame_data),
  574. _Alignof(struct vk_frame_data),
  575. VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
  576. memset(family_data->frames, 0,
  577. image_count * sizeof(struct vk_frame_data));
  578. family_data->frame_index = 0;
  579. family_data->frame_count = image_count;
  580. for (uint32_t image_index = 0; image_index < image_count;
  581. image_index++) {
  582. struct vk_frame_data *frame_data =
  583. &family_data->frames[image_index];
  584. VkCommandPoolCreateInfo cpci;
  585. cpci.sType = VK_STRUCTURE_TYPE_COMMAND_POOL_CREATE_INFO;
  586. cpci.pNext = NULL;
  587. cpci.flags = 0;
  588. cpci.queueFamilyIndex = fam_idx;
  589. VkResult res = data->funcs.CreateCommandPool(
  590. data->device, &cpci, data->ac, &frame_data->cmd_pool);
  591. debug_res("CreateCommandPool", res);
  592. VkCommandBufferAllocateInfo cbai;
  593. cbai.sType = VK_STRUCTURE_TYPE_COMMAND_BUFFER_ALLOCATE_INFO;
  594. cbai.pNext = NULL;
  595. cbai.commandPool = frame_data->cmd_pool;
  596. cbai.level = VK_COMMAND_BUFFER_LEVEL_PRIMARY;
  597. cbai.commandBufferCount = 1;
  598. res = data->funcs.AllocateCommandBuffers(
  599. data->device, &cbai, &frame_data->cmd_buffer);
  600. debug_res("AllocateCommandBuffers", res);
  601. *(void **)frame_data->cmd_buffer = *(void **)(data->device);
  602. VkFenceCreateInfo fci = {0};
  603. fci.sType = VK_STRUCTURE_TYPE_FENCE_CREATE_INFO;
  604. fci.pNext = NULL;
  605. fci.flags = 0;
  606. res = data->funcs.CreateFence(data->device, &fci, data->ac,
  607. &frame_data->fence);
  608. debug_res("CreateFence", res);
  609. }
  610. }
  611. static void vk_shtex_destroy_fence(struct vk_data *data, bool *cmd_buffer_busy,
  612. VkFence *fence)
  613. {
  614. VkDevice device = data->device;
  615. if (*cmd_buffer_busy) {
  616. data->funcs.WaitForFences(device, 1, fence, VK_TRUE, ~0ull);
  617. *cmd_buffer_busy = false;
  618. }
  619. data->funcs.DestroyFence(device, *fence, data->ac);
  620. *fence = VK_NULL_HANDLE;
  621. }
  622. static void vk_shtex_destroy_family_objects(struct vk_data *data,
  623. struct vk_family_data *family_data)
  624. {
  625. for (uint32_t frame_idx = 0; frame_idx < family_data->frame_count;
  626. frame_idx++) {
  627. struct vk_frame_data *frame_data =
  628. &family_data->frames[frame_idx];
  629. bool *cmd_buffer_busy = &frame_data->cmd_buffer_busy;
  630. VkFence *fence = &frame_data->fence;
  631. vk_shtex_destroy_fence(data, cmd_buffer_busy, fence);
  632. data->funcs.DestroyCommandPool(data->device,
  633. frame_data->cmd_pool, data->ac);
  634. frame_data->cmd_pool = VK_NULL_HANDLE;
  635. }
  636. vk_free(data->ac, family_data->frames);
  637. family_data->frames = NULL;
  638. family_data->frame_count = 0;
  639. }
  640. static void vk_shtex_capture(struct vk_data *data,
  641. struct vk_device_funcs *funcs,
  642. struct vk_swap_data *swap, uint32_t idx,
  643. VkQueue queue, const VkPresentInfoKHR *info)
  644. {
  645. VkResult res = VK_SUCCESS;
  646. VkCommandBufferBeginInfo begin_info;
  647. begin_info.sType = VK_STRUCTURE_TYPE_COMMAND_BUFFER_BEGIN_INFO;
  648. begin_info.pNext = NULL;
  649. begin_info.flags = VK_COMMAND_BUFFER_USAGE_ONE_TIME_SUBMIT_BIT;
  650. begin_info.pInheritanceInfo = NULL;
  651. VkImageMemoryBarrier mb[2];
  652. VkImageMemoryBarrier *src_mb = &mb[0];
  653. VkImageMemoryBarrier *dst_mb = &mb[1];
  654. /* ------------------------------------------------------ */
  655. /* do image copy */
  656. const uint32_t image_index = info->pImageIndices[idx];
  657. VkImage cur_backbuffer = swap->swap_images[image_index];
  658. uint32_t fam_idx = 0;
  659. for (uint32_t i = 0; i < data->queue_count; i++) {
  660. if (data->queues[i].queue == queue)
  661. fam_idx = data->queues[i].fam_idx;
  662. }
  663. struct vk_family_data *family_data = &data->families[fam_idx];
  664. const uint32_t image_count = swap->image_count;
  665. if (family_data->frame_count < image_count) {
  666. if (family_data->frame_count > 0)
  667. vk_shtex_destroy_family_objects(data, family_data);
  668. vk_shtex_create_family_objects(data, fam_idx, image_count);
  669. }
  670. const uint32_t frame_index = family_data->frame_index;
  671. struct vk_frame_data *frame_data = &family_data->frames[frame_index];
  672. family_data->frame_index = (frame_index + 1) % family_data->frame_count;
  673. vk_shtex_clear_fence(data, frame_data);
  674. res = funcs->ResetCommandPool(data->device, frame_data->cmd_pool, 0);
  675. #ifdef MORE_DEBUGGING
  676. debug_res("ResetCommandPool", res);
  677. #endif
  678. const VkCommandBuffer cmd_buffer = frame_data->cmd_buffer;
  679. res = funcs->BeginCommandBuffer(cmd_buffer, &begin_info);
  680. #ifdef MORE_DEBUGGING
  681. debug_res("BeginCommandBuffer", res);
  682. #endif
  683. /* ------------------------------------------------------ */
  684. /* transition shared texture if necessary */
  685. if (!swap->layout_initialized) {
  686. VkImageMemoryBarrier imb;
  687. imb.sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER;
  688. imb.pNext = NULL;
  689. imb.srcAccessMask = 0;
  690. imb.dstAccessMask = 0;
  691. imb.oldLayout = VK_IMAGE_LAYOUT_UNDEFINED;
  692. imb.newLayout = VK_IMAGE_LAYOUT_GENERAL;
  693. imb.srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
  694. imb.dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
  695. imb.image = swap->export_image;
  696. imb.subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT;
  697. imb.subresourceRange.baseMipLevel = 0;
  698. imb.subresourceRange.levelCount = 1;
  699. imb.subresourceRange.baseArrayLayer = 0;
  700. imb.subresourceRange.layerCount = 1;
  701. funcs->CmdPipelineBarrier(cmd_buffer,
  702. VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT,
  703. VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT, 0,
  704. 0, NULL, 0, NULL, 1, &imb);
  705. swap->layout_initialized = true;
  706. }
  707. /* ------------------------------------------------------ */
  708. /* transition cur_backbuffer to transfer source state */
  709. src_mb->sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER;
  710. src_mb->pNext = NULL;
  711. src_mb->srcAccessMask = VK_ACCESS_MEMORY_READ_BIT;
  712. src_mb->dstAccessMask = VK_ACCESS_TRANSFER_READ_BIT;
  713. src_mb->oldLayout = VK_IMAGE_LAYOUT_PRESENT_SRC_KHR;
  714. src_mb->newLayout = VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL;
  715. src_mb->srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
  716. src_mb->dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
  717. src_mb->image = cur_backbuffer;
  718. src_mb->subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT;
  719. src_mb->subresourceRange.baseMipLevel = 0;
  720. src_mb->subresourceRange.levelCount = 1;
  721. src_mb->subresourceRange.baseArrayLayer = 0;
  722. src_mb->subresourceRange.layerCount = 1;
  723. /* ------------------------------------------------------ */
  724. /* transition exportedTexture to transfer dest state */
  725. dst_mb->sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER;
  726. dst_mb->pNext = NULL;
  727. dst_mb->srcAccessMask = 0;
  728. dst_mb->dstAccessMask = VK_ACCESS_TRANSFER_WRITE_BIT;
  729. dst_mb->oldLayout = VK_IMAGE_LAYOUT_GENERAL;
  730. dst_mb->newLayout = VK_IMAGE_LAYOUT_TRANSFER_DST_OPTIMAL;
  731. dst_mb->srcQueueFamilyIndex = VK_QUEUE_FAMILY_EXTERNAL;
  732. dst_mb->dstQueueFamilyIndex = fam_idx;
  733. dst_mb->image = swap->export_image;
  734. dst_mb->subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT;
  735. dst_mb->subresourceRange.baseMipLevel = 0;
  736. dst_mb->subresourceRange.levelCount = 1;
  737. dst_mb->subresourceRange.baseArrayLayer = 0;
  738. dst_mb->subresourceRange.layerCount = 1;
  739. funcs->CmdPipelineBarrier(cmd_buffer,
  740. VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT,
  741. VK_PIPELINE_STAGE_TRANSFER_BIT, 0, 0, NULL, 0,
  742. NULL, 2, mb);
  743. /* ------------------------------------------------------ */
  744. /* copy cur_backbuffer's content to our interop image */
  745. VkImageCopy cpy;
  746. cpy.srcSubresource.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT;
  747. cpy.srcSubresource.mipLevel = 0;
  748. cpy.srcSubresource.baseArrayLayer = 0;
  749. cpy.srcSubresource.layerCount = 1;
  750. cpy.srcOffset.x = 0;
  751. cpy.srcOffset.y = 0;
  752. cpy.srcOffset.z = 0;
  753. cpy.dstSubresource.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT;
  754. cpy.dstSubresource.mipLevel = 0;
  755. cpy.dstSubresource.baseArrayLayer = 0;
  756. cpy.dstSubresource.layerCount = 1;
  757. cpy.dstOffset.x = 0;
  758. cpy.dstOffset.y = 0;
  759. cpy.dstOffset.z = 0;
  760. cpy.extent.width = swap->image_extent.width;
  761. cpy.extent.height = swap->image_extent.height;
  762. cpy.extent.depth = 1;
  763. funcs->CmdCopyImage(cmd_buffer, cur_backbuffer,
  764. VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL,
  765. swap->export_image,
  766. VK_IMAGE_LAYOUT_TRANSFER_DST_OPTIMAL, 1, &cpy);
  767. /* ------------------------------------------------------ */
  768. /* Restore the swap chain image layout to what it was
  769. * before. This may not be strictly needed, but it is
  770. * generally good to restore things to their original
  771. * state. */
  772. src_mb->srcAccessMask = VK_ACCESS_TRANSFER_READ_BIT;
  773. src_mb->dstAccessMask = VK_ACCESS_MEMORY_READ_BIT;
  774. src_mb->oldLayout = VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL;
  775. src_mb->newLayout = VK_IMAGE_LAYOUT_PRESENT_SRC_KHR;
  776. dst_mb->srcAccessMask = VK_ACCESS_TRANSFER_WRITE_BIT;
  777. dst_mb->dstAccessMask = 0;
  778. dst_mb->oldLayout = VK_IMAGE_LAYOUT_TRANSFER_DST_OPTIMAL;
  779. dst_mb->newLayout = VK_IMAGE_LAYOUT_GENERAL;
  780. dst_mb->srcQueueFamilyIndex = fam_idx;
  781. dst_mb->dstQueueFamilyIndex = VK_QUEUE_FAMILY_EXTERNAL;
  782. funcs->CmdPipelineBarrier(cmd_buffer, VK_PIPELINE_STAGE_TRANSFER_BIT,
  783. VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT |
  784. VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT,
  785. 0, 0, NULL, 0, NULL, 2, mb);
  786. funcs->EndCommandBuffer(cmd_buffer);
  787. /* ------------------------------------------------------ */
  788. VkSubmitInfo submit_info;
  789. submit_info.sType = VK_STRUCTURE_TYPE_SUBMIT_INFO;
  790. submit_info.pNext = NULL;
  791. submit_info.waitSemaphoreCount = 0;
  792. submit_info.pWaitSemaphores = NULL;
  793. submit_info.pWaitDstStageMask = NULL;
  794. submit_info.commandBufferCount = 1;
  795. submit_info.pCommandBuffers = &cmd_buffer;
  796. submit_info.signalSemaphoreCount = 0;
  797. submit_info.pSignalSemaphores = NULL;
  798. const VkFence fence = frame_data->fence;
  799. res = funcs->QueueSubmit(queue, 1, &submit_info, fence);
  800. #ifdef MORE_DEBUGGING
  801. debug_res("QueueSubmit", res);
  802. #endif
  803. if (res == VK_SUCCESS)
  804. frame_data->cmd_buffer_busy = true;
  805. }
  806. static inline bool valid_rect(struct vk_swap_data *swap)
  807. {
  808. return !!swap->image_extent.width && !!swap->image_extent.height;
  809. }
  810. static void vk_capture(struct vk_data *data, VkQueue queue,
  811. const VkPresentInfoKHR *info)
  812. {
  813. struct vk_swap_data *swap = NULL;
  814. HWND window = NULL;
  815. uint32_t idx = 0;
  816. #ifdef MORE_DEBUGGING
  817. debug("QueuePresentKHR called on "
  818. "devicekey %p, swapchain count %d",
  819. &data->funcs, info->swapchainCount);
  820. #endif
  821. /* use first swap chain associated with a window */
  822. for (; idx < info->swapchainCount; idx++) {
  823. struct vk_swap_data *cur_swap =
  824. get_swap_data(data, info->pSwapchains[idx]);
  825. window = cur_swap->hwnd;
  826. if (!!window) {
  827. swap = cur_swap;
  828. break;
  829. }
  830. }
  831. if (!window) {
  832. return;
  833. }
  834. if (capture_should_stop()) {
  835. vk_shtex_free(data);
  836. }
  837. if (capture_should_init()) {
  838. if (valid_rect(swap) && !vk_shtex_init(data, window, swap)) {
  839. vk_shtex_free(data);
  840. data->valid = false;
  841. flog("vk_shtex_init failed");
  842. }
  843. }
  844. if (capture_ready()) {
  845. if (swap != data->cur_swap) {
  846. vk_shtex_free(data);
  847. return;
  848. }
  849. vk_shtex_capture(data, &data->funcs, swap, idx, queue, info);
  850. }
  851. }
  852. static VkResult VKAPI OBS_QueuePresentKHR(VkQueue queue,
  853. const VkPresentInfoKHR *info)
  854. {
  855. struct vk_data *data = get_device_data(queue);
  856. struct vk_device_funcs *funcs = &data->funcs;
  857. if (data->valid) {
  858. vk_capture(data, queue, info);
  859. }
  860. return funcs->QueuePresentKHR(queue, info);
  861. }
  862. /* ======================================================================== */
  863. /* setup hooks */
  864. static inline bool is_inst_link_info(VkLayerInstanceCreateInfo *lici)
  865. {
  866. return lici->sType == VK_STRUCTURE_TYPE_LOADER_INSTANCE_CREATE_INFO &&
  867. lici->function == VK_LAYER_LINK_INFO;
  868. }
  869. static VkResult VKAPI OBS_CreateInstance(const VkInstanceCreateInfo *cinfo,
  870. const VkAllocationCallbacks *ac,
  871. VkInstance *p_inst)
  872. {
  873. VkInstanceCreateInfo info = *cinfo;
  874. bool funcs_not_found = false;
  875. /* -------------------------------------------------------- */
  876. /* step through chain until we get to the link info */
  877. VkLayerInstanceCreateInfo *lici = (void *)info.pNext;
  878. while (lici && !is_inst_link_info(lici)) {
  879. lici = (VkLayerInstanceCreateInfo *)lici->pNext;
  880. }
  881. if (lici == NULL) {
  882. return VK_ERROR_INITIALIZATION_FAILED;
  883. }
  884. PFN_vkGetInstanceProcAddr gpa =
  885. lici->u.pLayerInfo->pfnNextGetInstanceProcAddr;
  886. /* -------------------------------------------------------- */
  887. /* move chain on for next layer */
  888. lici->u.pLayerInfo = lici->u.pLayerInfo->pNext;
  889. /* -------------------------------------------------------- */
  890. /* (HACK) Set api version to 1.1 if set to 1.0 */
  891. /* We do this to get our extensions working properly */
  892. VkApplicationInfo ai;
  893. if (info.pApplicationInfo) {
  894. ai = *info.pApplicationInfo;
  895. if (ai.apiVersion < VK_API_VERSION_1_1)
  896. ai.apiVersion = VK_API_VERSION_1_1;
  897. } else {
  898. ai.sType = VK_STRUCTURE_TYPE_APPLICATION_INFO;
  899. ai.pNext = NULL;
  900. ai.pApplicationName = NULL;
  901. ai.applicationVersion = 0;
  902. ai.pEngineName = NULL;
  903. ai.engineVersion = 0;
  904. ai.apiVersion = VK_API_VERSION_1_1;
  905. }
  906. info.pApplicationInfo = &ai;
  907. /* -------------------------------------------------------- */
  908. /* create instance */
  909. PFN_vkCreateInstance create = (void *)gpa(NULL, "vkCreateInstance");
  910. VkResult res = create(&info, ac, p_inst);
  911. VkInstance inst = *p_inst;
  912. /* -------------------------------------------------------- */
  913. /* fetch the functions we need */
  914. struct vk_inst_data *data = add_inst_data(inst, ac);
  915. struct vk_inst_funcs *funcs = &data->funcs;
  916. #define GETADDR(x) \
  917. do { \
  918. funcs->x = (void *)gpa(inst, "vk" #x); \
  919. if (!funcs->x) { \
  920. flog("could not get instance " \
  921. "address for %s", \
  922. #x); \
  923. funcs_not_found = true; \
  924. } \
  925. } while (false)
  926. GETADDR(GetInstanceProcAddr);
  927. GETADDR(DestroyInstance);
  928. GETADDR(CreateWin32SurfaceKHR);
  929. GETADDR(DestroySurfaceKHR);
  930. GETADDR(GetPhysicalDeviceMemoryProperties);
  931. GETADDR(GetPhysicalDeviceImageFormatProperties2);
  932. GETADDR(EnumerateDeviceExtensionProperties);
  933. #undef GETADDR
  934. init_obj_list(&data->surfaces);
  935. data->valid = !funcs_not_found;
  936. return res;
  937. }
  938. static VkResult VKAPI OBS_DestroyInstance(VkInstance instance,
  939. const VkAllocationCallbacks *ac)
  940. {
  941. struct vk_inst_funcs *funcs = get_inst_funcs(instance);
  942. const uint64_t obj = (uint64_t)GET_LDT(instance);
  943. struct vk_inst_data *data =
  944. (struct vk_inst_data *)remove_obj_data(&instances, obj);
  945. funcs->DestroyInstance(instance, ac);
  946. vk_free(ac, data);
  947. return VK_SUCCESS;
  948. }
  949. static bool
  950. vk_shared_tex_supported(struct vk_inst_funcs *funcs,
  951. VkPhysicalDevice phy_device, VkFormat format,
  952. VkImageUsageFlags usage,
  953. VkExternalMemoryProperties *external_mem_props)
  954. {
  955. VkPhysicalDeviceImageFormatInfo2 info;
  956. VkPhysicalDeviceExternalImageFormatInfo external_info;
  957. external_info.sType =
  958. VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_EXTERNAL_IMAGE_FORMAT_INFO;
  959. external_info.pNext = NULL;
  960. external_info.handleType =
  961. VK_EXTERNAL_MEMORY_HANDLE_TYPE_D3D11_TEXTURE_KMT_BIT;
  962. info.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_IMAGE_FORMAT_INFO_2;
  963. info.pNext = &external_info;
  964. info.format = format;
  965. info.type = VK_IMAGE_TYPE_2D;
  966. info.tiling = VK_IMAGE_TILING_OPTIMAL;
  967. info.flags = 0;
  968. info.usage = usage;
  969. VkExternalImageFormatProperties external_props = {0};
  970. external_props.sType =
  971. VK_STRUCTURE_TYPE_EXTERNAL_IMAGE_FORMAT_PROPERTIES;
  972. external_props.pNext = NULL;
  973. VkImageFormatProperties2 props = {0};
  974. props.sType = VK_STRUCTURE_TYPE_IMAGE_FORMAT_PROPERTIES_2;
  975. props.pNext = &external_props;
  976. VkResult result = funcs->GetPhysicalDeviceImageFormatProperties2(
  977. phy_device, &info, &props);
  978. *external_mem_props = external_props.externalMemoryProperties;
  979. const VkExternalMemoryFeatureFlags features =
  980. external_mem_props->externalMemoryFeatures;
  981. return ((VK_SUCCESS == result) &&
  982. (features & VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT));
  983. }
  984. static inline bool is_device_link_info(VkLayerDeviceCreateInfo *lici)
  985. {
  986. return lici->sType == VK_STRUCTURE_TYPE_LOADER_DEVICE_CREATE_INFO &&
  987. lici->function == VK_LAYER_LINK_INFO;
  988. }
  989. static VkResult VKAPI OBS_CreateDevice(VkPhysicalDevice phy_device,
  990. const VkDeviceCreateInfo *info,
  991. const VkAllocationCallbacks *ac,
  992. VkDevice *p_device)
  993. {
  994. struct vk_inst_data *idata = get_inst_data(phy_device);
  995. struct vk_inst_funcs *ifuncs = &idata->funcs;
  996. struct vk_data *data = NULL;
  997. VkResult ret = VK_ERROR_INITIALIZATION_FAILED;
  998. VkLayerDeviceCreateInfo *ldci = (void *)info->pNext;
  999. /* -------------------------------------------------------- */
  1000. /* step through chain until we get to the link info */
  1001. while (ldci && !is_device_link_info(ldci)) {
  1002. ldci = (VkLayerDeviceCreateInfo *)ldci->pNext;
  1003. }
  1004. if (!ldci) {
  1005. goto fail;
  1006. }
  1007. PFN_vkGetInstanceProcAddr gipa;
  1008. PFN_vkGetDeviceProcAddr gdpa;
  1009. gipa = ldci->u.pLayerInfo->pfnNextGetInstanceProcAddr;
  1010. gdpa = ldci->u.pLayerInfo->pfnNextGetDeviceProcAddr;
  1011. /* -------------------------------------------------------- */
  1012. /* move chain on for next layer */
  1013. ldci->u.pLayerInfo = ldci->u.pLayerInfo->pNext;
  1014. /* -------------------------------------------------------- */
  1015. /* create device and initialize hook data */
  1016. PFN_vkCreateDevice createFunc =
  1017. (PFN_vkCreateDevice)gipa(VK_NULL_HANDLE, "vkCreateDevice");
  1018. ret = createFunc(phy_device, info, ac, p_device);
  1019. if (ret != VK_SUCCESS) {
  1020. goto fail;
  1021. }
  1022. VkDevice device = *p_device;
  1023. data = add_device_data(*p_device, ac);
  1024. struct vk_device_funcs *dfuncs = &data->funcs;
  1025. data->valid = false; /* set true below if it doesn't go to fail */
  1026. data->phy_device = phy_device;
  1027. data->device = device;
  1028. /* -------------------------------------------------------- */
  1029. /* fetch the functions we need */
  1030. bool funcs_not_found = false;
  1031. #define GETADDR(x) \
  1032. do { \
  1033. dfuncs->x = (void *)gdpa(device, "vk" #x); \
  1034. if (!dfuncs->x) { \
  1035. flog("could not get device " \
  1036. "address for %s", \
  1037. #x); \
  1038. funcs_not_found = true; \
  1039. } \
  1040. } while (false)
  1041. #define GETADDR_OPTIONAL(x) \
  1042. do { \
  1043. dfuncs->x = (void *)gdpa(device, "vk" #x); \
  1044. } while (false)
  1045. GETADDR(GetDeviceProcAddr);
  1046. GETADDR(DestroyDevice);
  1047. GETADDR(CreateSwapchainKHR);
  1048. GETADDR(DestroySwapchainKHR);
  1049. GETADDR(QueuePresentKHR);
  1050. GETADDR(AllocateMemory);
  1051. GETADDR(FreeMemory);
  1052. GETADDR(BindImageMemory);
  1053. GETADDR(BindImageMemory2);
  1054. GETADDR(GetSwapchainImagesKHR);
  1055. GETADDR(CreateImage);
  1056. GETADDR(DestroyImage);
  1057. GETADDR(GetImageMemoryRequirements);
  1058. GETADDR(GetImageMemoryRequirements2);
  1059. GETADDR(ResetCommandPool);
  1060. GETADDR(BeginCommandBuffer);
  1061. GETADDR(EndCommandBuffer);
  1062. GETADDR(CmdCopyImage);
  1063. GETADDR(CmdPipelineBarrier);
  1064. GETADDR(GetDeviceQueue);
  1065. GETADDR(QueueSubmit);
  1066. GETADDR(CreateCommandPool);
  1067. GETADDR(DestroyCommandPool);
  1068. GETADDR(AllocateCommandBuffers);
  1069. GETADDR(CreateFence);
  1070. GETADDR(DestroyFence);
  1071. GETADDR(WaitForFences);
  1072. GETADDR(ResetFences);
  1073. #undef GETADDR_OPTIONAL
  1074. #undef GETADDR
  1075. if (funcs_not_found) {
  1076. goto fail;
  1077. }
  1078. if (!idata->valid) {
  1079. flog("instance not valid");
  1080. goto fail;
  1081. }
  1082. const char *required_device_extensions[] = {
  1083. VK_KHR_EXTERNAL_MEMORY_WIN32_EXTENSION_NAME};
  1084. uint32_t device_extension_count = 0;
  1085. ret = ifuncs->EnumerateDeviceExtensionProperties(
  1086. phy_device, NULL, &device_extension_count, NULL);
  1087. if (ret != VK_SUCCESS)
  1088. goto fail;
  1089. VkExtensionProperties *device_extensions = _malloca(
  1090. sizeof(VkExtensionProperties) * device_extension_count);
  1091. ret = ifuncs->EnumerateDeviceExtensionProperties(
  1092. phy_device, NULL, &device_extension_count, device_extensions);
  1093. if (ret != VK_SUCCESS)
  1094. goto fail;
  1095. bool extensions_found = true;
  1096. for (uint32_t i = 0; i < _countof(required_device_extensions); i++) {
  1097. const char *const required_extension =
  1098. required_device_extensions[i];
  1099. bool found = false;
  1100. for (uint32_t j = 0; j < device_extension_count; j++) {
  1101. if (!strcmp(required_extension,
  1102. device_extensions[j].extensionName)) {
  1103. found = true;
  1104. break;
  1105. }
  1106. }
  1107. if (!found) {
  1108. flog("missing device extension: %s",
  1109. required_extension);
  1110. extensions_found = false;
  1111. }
  1112. }
  1113. if (!extensions_found)
  1114. goto fail;
  1115. VkFormat format = VK_FORMAT_R8G8B8A8_UNORM;
  1116. VkImageUsageFlags usage = VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT |
  1117. VK_IMAGE_USAGE_TRANSFER_DST_BIT;
  1118. if (!vk_shared_tex_supported(ifuncs, phy_device, format, usage,
  1119. &data->external_mem_props)) {
  1120. flog("texture sharing is not supported");
  1121. goto fail;
  1122. }
  1123. data->inst_data = idata;
  1124. data->ac = NULL;
  1125. if (ac) {
  1126. data->ac_storage = *ac;
  1127. data->ac = &data->ac_storage;
  1128. }
  1129. uint32_t queue_capacity = 0;
  1130. uint32_t family_capacity = 1;
  1131. for (uint32_t i = 0, count = info->queueCreateInfoCount; i < count;
  1132. ++i) {
  1133. const VkDeviceQueueCreateInfo *queue_info =
  1134. &info->pQueueCreateInfos[i];
  1135. queue_capacity += queue_info->queueCount;
  1136. family_capacity =
  1137. max(family_capacity, queue_info->queueFamilyIndex + 1);
  1138. }
  1139. data->queues = vk_alloc(ac,
  1140. queue_capacity * sizeof(struct vk_queue_data),
  1141. _Alignof(struct vk_queue_data),
  1142. VK_SYSTEM_ALLOCATION_SCOPE_DEVICE);
  1143. data->queue_count = 0;
  1144. data->families =
  1145. vk_alloc(ac, family_capacity * sizeof(struct vk_family_data),
  1146. _Alignof(struct vk_family_data),
  1147. VK_SYSTEM_ALLOCATION_SCOPE_DEVICE);
  1148. memset(data->families, 0,
  1149. family_capacity * sizeof(struct vk_family_data));
  1150. data->family_capacity = family_capacity;
  1151. init_obj_list(&data->swaps);
  1152. data->valid = true;
  1153. fail:
  1154. return ret;
  1155. }
  1156. static void VKAPI OBS_DestroyDevice(VkDevice device,
  1157. const VkAllocationCallbacks *ac)
  1158. {
  1159. struct vk_data *data = get_device_data(device);
  1160. if (!data)
  1161. return;
  1162. if (data->valid) {
  1163. for (uint32_t fam_idx = 0; fam_idx < data->family_capacity;
  1164. fam_idx++) {
  1165. struct vk_family_data *family_data =
  1166. &data->families[fam_idx];
  1167. vk_shtex_destroy_family_objects(data, family_data);
  1168. }
  1169. vk_free(ac, data->queues);
  1170. data->queues = NULL;
  1171. data->queue_count = 0;
  1172. vk_free(ac, data->families);
  1173. data->families = NULL;
  1174. data->family_capacity = 0;
  1175. }
  1176. const uint64_t obj = (uint64_t)GET_LDT(device);
  1177. remove_obj_data(&devices, obj);
  1178. data->funcs.DestroyDevice(device, ac);
  1179. vk_free(ac, data);
  1180. }
  1181. static VkResult VKAPI
  1182. OBS_CreateSwapchainKHR(VkDevice device, const VkSwapchainCreateInfoKHR *cinfo,
  1183. const VkAllocationCallbacks *ac, VkSwapchainKHR *p_sc)
  1184. {
  1185. struct vk_data *data = get_device_data(device);
  1186. VkSwapchainCreateInfoKHR info = *cinfo;
  1187. if (data->valid)
  1188. info.imageUsage |= VK_IMAGE_USAGE_TRANSFER_SRC_BIT;
  1189. struct vk_device_funcs *funcs = &data->funcs;
  1190. VkResult res = funcs->CreateSwapchainKHR(device, &info, ac, p_sc);
  1191. debug_res("CreateSwapchainKHR", res);
  1192. if ((res != VK_SUCCESS) || !data->valid)
  1193. return res;
  1194. VkSwapchainKHR sc = *p_sc;
  1195. uint32_t count = 0;
  1196. res = funcs->GetSwapchainImagesKHR(data->device, sc, &count, NULL);
  1197. debug_res("GetSwapchainImagesKHR", res);
  1198. struct vk_swap_data *swap = add_swap_data(data, sc);
  1199. if (count > 0) {
  1200. swap->swap_images = vk_alloc(ac, count * sizeof(VkImage),
  1201. _Alignof(VkImage),
  1202. VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
  1203. res = funcs->GetSwapchainImagesKHR(data->device, sc, &count,
  1204. swap->swap_images);
  1205. debug_res("GetSwapchainImagesKHR", res);
  1206. }
  1207. swap->sc = sc;
  1208. swap->image_extent = cinfo->imageExtent;
  1209. swap->format = cinfo->imageFormat;
  1210. swap->hwnd = find_surf_hwnd(data->inst_data, cinfo->surface);
  1211. swap->image_count = count;
  1212. swap->d3d11_tex = NULL;
  1213. return VK_SUCCESS;
  1214. }
  1215. static void VKAPI OBS_DestroySwapchainKHR(VkDevice device, VkSwapchainKHR sc,
  1216. const VkAllocationCallbacks *ac)
  1217. {
  1218. struct vk_data *data = get_device_data(device);
  1219. struct vk_device_funcs *funcs = &data->funcs;
  1220. if (data->valid) {
  1221. struct vk_swap_data *swap = get_swap_data(data, sc);
  1222. if (swap) {
  1223. if (data->cur_swap == swap) {
  1224. vk_shtex_free(data);
  1225. }
  1226. swap->sc = VK_NULL_HANDLE;
  1227. swap->hwnd = NULL;
  1228. vk_free(ac, swap->swap_images);
  1229. swap->swap_images = NULL;
  1230. swap->image_count = 0;
  1231. }
  1232. const uint64_t obj = swap->node.obj;
  1233. remove_obj_data(&data->swaps, obj);
  1234. funcs->DestroySwapchainKHR(device, sc, ac);
  1235. vk_free(data->ac, swap);
  1236. }
  1237. }
  1238. static void VKAPI OBS_GetDeviceQueue(VkDevice device, uint32_t queueFamilyIndex,
  1239. uint32_t queueIndex, VkQueue *pQueue)
  1240. {
  1241. struct vk_data *data = get_device_data(device);
  1242. struct vk_device_funcs *funcs = &data->funcs;
  1243. funcs->GetDeviceQueue(device, queueFamilyIndex, queueIndex, pQueue);
  1244. for (uint32_t i = 0; i < data->queue_count; ++i) {
  1245. if (data->queues[i].queue == *pQueue)
  1246. return;
  1247. }
  1248. if (data->queue_count < _countof(data->queues)) {
  1249. data->queues[data->queue_count].queue = *pQueue;
  1250. data->queues[data->queue_count].fam_idx = queueFamilyIndex;
  1251. ++data->queue_count;
  1252. }
  1253. }
  1254. static VkResult VKAPI OBS_CreateWin32SurfaceKHR(
  1255. VkInstance inst, const VkWin32SurfaceCreateInfoKHR *info,
  1256. const VkAllocationCallbacks *ac, VkSurfaceKHR *surf)
  1257. {
  1258. struct vk_inst_data *data = get_inst_data(inst);
  1259. struct vk_inst_funcs *funcs = &data->funcs;
  1260. VkResult res = funcs->CreateWin32SurfaceKHR(inst, info, ac, surf);
  1261. if (res == VK_SUCCESS)
  1262. insert_surf_data(data, *surf, info->hwnd, ac);
  1263. return res;
  1264. }
  1265. static void VKAPI OBS_DestroySurfaceKHR(VkInstance inst, VkSurfaceKHR surf,
  1266. const VkAllocationCallbacks *ac)
  1267. {
  1268. struct vk_inst_data *data = get_inst_data(inst);
  1269. struct vk_inst_funcs *funcs = &data->funcs;
  1270. const uint64_t obj = (uint64_t)surf;
  1271. struct vk_surf_data *surf_data =
  1272. (struct vk_surf_data *)remove_obj_data(&data->surfaces, obj);
  1273. funcs->DestroySurfaceKHR(inst, surf, ac);
  1274. vk_free(ac, surf_data);
  1275. }
  1276. #define GETPROCADDR(func) \
  1277. if (!strcmp(name, "vk" #func)) \
  1278. return (VkFunc)&OBS_##func;
  1279. static VkFunc VKAPI OBS_GetDeviceProcAddr(VkDevice dev, const char *name)
  1280. {
  1281. struct vk_data *data = get_device_data(dev);
  1282. struct vk_device_funcs *funcs = &data->funcs;
  1283. debug_procaddr("vkGetDeviceProcAddr(%p, \"%s\")", dev, name);
  1284. GETPROCADDR(GetDeviceProcAddr);
  1285. GETPROCADDR(CreateDevice);
  1286. GETPROCADDR(DestroyDevice);
  1287. GETPROCADDR(CreateSwapchainKHR);
  1288. GETPROCADDR(DestroySwapchainKHR);
  1289. GETPROCADDR(QueuePresentKHR);
  1290. GETPROCADDR(GetDeviceQueue);
  1291. if (funcs->GetDeviceProcAddr == NULL)
  1292. return NULL;
  1293. return funcs->GetDeviceProcAddr(dev, name);
  1294. }
  1295. static VkFunc VKAPI OBS_GetInstanceProcAddr(VkInstance inst, const char *name)
  1296. {
  1297. debug_procaddr("vkGetInstanceProcAddr(%p, \"%s\")", inst, name);
  1298. /* instance chain functions we intercept */
  1299. GETPROCADDR(GetInstanceProcAddr);
  1300. GETPROCADDR(CreateInstance);
  1301. GETPROCADDR(DestroyInstance);
  1302. GETPROCADDR(CreateWin32SurfaceKHR);
  1303. GETPROCADDR(DestroySurfaceKHR);
  1304. /* device chain functions we intercept */
  1305. GETPROCADDR(GetDeviceProcAddr);
  1306. GETPROCADDR(CreateDevice);
  1307. GETPROCADDR(DestroyDevice);
  1308. struct vk_inst_funcs *funcs = get_inst_funcs(inst);
  1309. if (funcs->GetInstanceProcAddr == NULL)
  1310. return NULL;
  1311. return funcs->GetInstanceProcAddr(inst, name);
  1312. }
  1313. #undef GETPROCADDR
  1314. #ifndef _WIN64
  1315. #pragma comment(linker, "/EXPORT:OBS_Negotiate=_OBS_Negotiate@4")
  1316. #endif
  1317. EXPORT VkResult VKAPI OBS_Negotiate(VkNegotiateLayerInterface *nli)
  1318. {
  1319. if (nli->loaderLayerInterfaceVersion >= 2) {
  1320. nli->sType = LAYER_NEGOTIATE_INTERFACE_STRUCT;
  1321. nli->pNext = NULL;
  1322. nli->pfnGetInstanceProcAddr = OBS_GetInstanceProcAddr;
  1323. nli->pfnGetDeviceProcAddr = OBS_GetDeviceProcAddr;
  1324. nli->pfnGetPhysicalDeviceProcAddr = NULL;
  1325. }
  1326. const uint32_t cur_ver = CURRENT_LOADER_LAYER_INTERFACE_VERSION;
  1327. if (nli->loaderLayerInterfaceVersion > cur_ver) {
  1328. nli->loaderLayerInterfaceVersion = cur_ver;
  1329. }
  1330. if (!vulkan_seen) {
  1331. init_obj_list(&instances);
  1332. init_obj_list(&devices);
  1333. vulkan_seen = true;
  1334. }
  1335. return VK_SUCCESS;
  1336. }
  1337. bool hook_vulkan(void)
  1338. {
  1339. static bool hooked = false;
  1340. if (!hooked && vulkan_seen) {
  1341. hlog("Hooked Vulkan");
  1342. hooked = true;
  1343. }
  1344. return hooked;
  1345. }