/* vulkan-capture.c */
  1. #include <windows.h>
  2. #include "graphics-hook.h"
  3. #define VK_USE_PLATFORM_WIN32_KHR
  4. #include <malloc.h>
  5. #include <vulkan/vulkan.h>
  6. #include <vulkan/vk_layer.h>
  7. #undef VK_LAYER_EXPORT
  8. #if defined(WIN32)
  9. #define VK_LAYER_EXPORT __declspec(dllexport)
  10. #else
  11. #define VK_LAYER_EXPORT
  12. #endif
  13. #include <vulkan/vulkan_win32.h>
  14. #define COBJMACROS
  15. #include <dxgi.h>
  16. #include <d3d11.h>
  17. #include "vulkan-capture.h"
  18. /* ======================================================================== */
  19. /* defs/statics */
  20. /* shorten stuff because dear GOD is vulkan unclean. */
  21. #define VKAPI VKAPI_CALL
  22. #define VkFunc PFN_vkVoidFunction
  23. #define EXPORT VK_LAYER_EXPORT
  24. #define OBJ_MAX 16
  /* Use the loader's dispatch table pointer as a key for internal data maps:
   * the first pointer-sized word of the object `x` points at is read.
   * The argument is parenthesized so that expression arguments such as
   * `handles + 1` are cast as a whole rather than only their first operand. */
  #define GET_LDT(x) (*(void **)(x))
  27. static bool vulkan_seen = false;
  28. static SRWLOCK mutex = SRWLOCK_INIT; // Faster CRITICAL_SECTION
  29. /* ======================================================================== */
  30. /* hook data */
  /* Per-swapchain capture state, stored in the `swaps` array of struct vk_data. */
  struct vk_swap_data {
      /* Swapchain this slot belongs to; VK_NULL_HANDLE marks a free slot. */
      VkSwapchainKHR sc;
      /* Size used for both the D3D11 shared texture and the Vulkan image. */
      VkExtent2D image_extent;
      /* Swapchain format; converted to a DXGI format for the shared texture. */
      VkFormat format;
      /* NOTE(review): presumably the window of the swapchain's surface --
       * not read in the visible part of the file, confirm against callers. */
      HWND hwnd;
      /* Vulkan image created with D3D11-texture external memory info. */
      VkImage export_image;
      /* Cleared when export_image is created; set once the image has been
       * transitioned out of VK_IMAGE_LAYOUT_UNDEFINED. */
      bool layout_initialized;
      /* Memory imported from `handle` and bound to export_image. */
      VkDeviceMemory export_mem;
      /* Swapchain images, indexed by the presented image index. */
      VkImage swap_images[OBJ_MAX];
      /* Number of images in the swapchain. */
      uint32_t image_count;
      /* Shared handle obtained from the D3D11 texture's IDXGIResource. */
      HANDLE handle;
      /* Filled in by capture_init_shtex(). */
      struct shtex_data *shtex_info;
      /* D3D11 texture created with D3D11_RESOURCE_MISC_SHARED. */
      ID3D11Texture2D *d3d11_tex;
      /* Result of capture_init_shtex(); reset to false by vk_shtex_free(). */
      bool captured;
  };
  /* Associates a queue handle with the queue family it was obtained from. */
  struct vk_queue_data {
      /* Queue handle; compared against the presenting queue during capture. */
      VkQueue queue;
      /* Queue family index; used to select an entry of vk_data.cmd_pools. */
      uint32_t fam_idx;
  };
  /* Command pool plus the per-image command buffers and fences allocated
   * from it.  The arrays are indexed by swapchain image index. */
  struct vk_cmd_pool_data {
      /* VK_NULL_HANDLE while no pool has been created for this slot. */
      VkCommandPool cmd_pool;
      VkCommandBuffer cmd_buffers[OBJ_MAX];
      VkFence fences[OBJ_MAX];
      /* When true, the matching fence is waited on and reset before the
       * command buffer is reused (see vk_shtex_clear_fence). */
      bool cmd_buffer_busy[OBJ_MAX];
      /* Number of command buffers / fences currently created. */
      uint32_t image_count;
  };
  /* Per-device hook state; one entry of the file-level device_data array. */
  struct vk_data {
      /* NOTE(review): not read in the visible part of the file; presumably
       * marks whether capture is usable for this device -- confirm. */
      bool valid;
      /* Device-level Vulkan entry points used by the capture code. */
      struct vk_device_funcs funcs;
      /* Physical device; used to query memory properties. */
      VkPhysicalDevice phy_device;
      VkDevice device;
      /* Swapchain slots; a slot is free while its `sc` is VK_NULL_HANDLE. */
      struct vk_swap_data swaps[OBJ_MAX];
      /* Set by vk_shtex_init(), cleared by vk_shtex_free(). */
      struct vk_swap_data *cur_swap;
      /* NOTE(review): usage not visible here -- confirm meaning. */
      uint32_t swap_idx;
      /* Known queues; the first queue_count entries are searched on capture. */
      struct vk_queue_data queues[OBJ_MAX];
      uint32_t queue_count;
      /* Command pools, indexed by queue family index. */
      struct vk_cmd_pool_data cmd_pools[OBJ_MAX];
      /* externalMemoryFeatures is checked for the DEDICATED_ONLY bit when
       * allocating and binding the export image. */
      VkExternalMemoryProperties external_mem_props;
      /* NOTE(review): presumably the owning instance's data -- confirm. */
      struct vk_inst_data *inst_data;
      /* NOTE(review): presumably backing storage for `ac` -- confirm. */
      VkAllocationCallbacks ac_storage;
      /* Allocation callbacks passed to the Vulkan create/destroy calls. */
      const VkAllocationCallbacks *ac;
      /* Created by vk_shtex_init_d3d11(), released by vk_shtex_free(). */
      ID3D11Device *d3d11_device;
      ID3D11DeviceContext *d3d11_context;
  };
  75. static struct vk_swap_data *get_swap_data(struct vk_data *data,
  76. VkSwapchainKHR sc)
  77. {
  78. for (int i = 0; i < OBJ_MAX; i++) {
  79. if (data->swaps[i].sc == sc) {
  80. return &data->swaps[i];
  81. }
  82. }
  83. debug("get_swap_data failed, swapchain not found");
  84. return NULL;
  85. }
  86. static struct vk_swap_data *get_new_swap_data(struct vk_data *data)
  87. {
  88. for (int i = 0; i < OBJ_MAX; i++) {
  89. if (data->swaps[i].sc == VK_NULL_HANDLE) {
  90. return &data->swaps[i];
  91. }
  92. }
  93. debug("get_new_swap_data failed, no more free slot");
  94. return NULL;
  95. }
  96. /* ------------------------------------------------------------------------- */
  97. static inline size_t find_obj_idx(void *objs[], void *obj)
  98. {
  99. size_t idx = SIZE_MAX;
  100. AcquireSRWLockExclusive(&mutex);
  101. for (size_t i = 0; i < OBJ_MAX; i++) {
  102. if (objs[i] == obj) {
  103. idx = i;
  104. break;
  105. }
  106. }
  107. ReleaseSRWLockExclusive(&mutex);
  108. return idx;
  109. }
  110. static size_t get_obj_idx(void *objs[], void *obj)
  111. {
  112. size_t idx = SIZE_MAX;
  113. AcquireSRWLockExclusive(&mutex);
  114. for (size_t i = 0; i < OBJ_MAX; i++) {
  115. if (objs[i] == obj) {
  116. idx = i;
  117. break;
  118. }
  119. if (!objs[i] && idx == SIZE_MAX) {
  120. idx = i;
  121. }
  122. }
  123. ReleaseSRWLockExclusive(&mutex);
  124. return idx;
  125. }
  126. /* ------------------------------------------------------------------------- */
  127. static struct vk_data device_data[OBJ_MAX] = {0};
  128. static void *devices[OBJ_MAX] = {0};
  129. static inline struct vk_data *get_device_data(void *dev)
  130. {
  131. size_t idx = get_obj_idx(devices, GET_LDT(dev));
  132. if (idx == SIZE_MAX) {
  133. debug("out of device slots");
  134. return NULL;
  135. }
  136. return &device_data[idx];
  137. }
  138. static void vk_shtex_clear_fence(struct vk_data *data,
  139. struct vk_cmd_pool_data *pool_data,
  140. uint32_t image_idx)
  141. {
  142. VkFence fence = pool_data->fences[image_idx];
  143. if (pool_data->cmd_buffer_busy[image_idx]) {
  144. VkDevice device = data->device;
  145. struct vk_device_funcs *funcs = &data->funcs;
  146. funcs->WaitForFences(device, 1, &fence, VK_TRUE, ~0ull);
  147. funcs->ResetFences(device, 1, &fence);
  148. pool_data->cmd_buffer_busy[image_idx] = false;
  149. }
  150. }
  151. static void vk_shtex_wait_until_pool_idle(struct vk_data *data,
  152. struct vk_cmd_pool_data *pool_data)
  153. {
  154. for (uint32_t image_idx = 0; image_idx < pool_data->image_count;
  155. image_idx++) {
  156. vk_shtex_clear_fence(data, pool_data, image_idx);
  157. }
  158. }
  159. static void vk_shtex_wait_until_idle(struct vk_data *data)
  160. {
  161. for (uint32_t fam_idx = 0; fam_idx < _countof(data->cmd_pools);
  162. fam_idx++) {
  163. struct vk_cmd_pool_data *pool_data = &data->cmd_pools[fam_idx];
  164. if (pool_data->cmd_pool != VK_NULL_HANDLE)
  165. vk_shtex_wait_until_pool_idle(data, pool_data);
  166. }
  167. }
  168. static void vk_shtex_free(struct vk_data *data)
  169. {
  170. capture_free();
  171. vk_shtex_wait_until_idle(data);
  172. for (int swap_idx = 0; swap_idx < OBJ_MAX; swap_idx++) {
  173. struct vk_swap_data *swap = &data->swaps[swap_idx];
  174. if (swap->export_image)
  175. data->funcs.DestroyImage(data->device,
  176. swap->export_image, data->ac);
  177. if (swap->export_mem)
  178. data->funcs.FreeMemory(data->device, swap->export_mem,
  179. NULL);
  180. if (swap->d3d11_tex) {
  181. ID3D11Texture2D_Release(swap->d3d11_tex);
  182. }
  183. swap->handle = INVALID_HANDLE_VALUE;
  184. swap->d3d11_tex = NULL;
  185. swap->export_mem = VK_NULL_HANDLE;
  186. swap->export_image = VK_NULL_HANDLE;
  187. swap->captured = false;
  188. }
  189. if (data->d3d11_context) {
  190. ID3D11DeviceContext_Release(data->d3d11_context);
  191. data->d3d11_context = NULL;
  192. }
  193. if (data->d3d11_device) {
  194. ID3D11Device_Release(data->d3d11_device);
  195. data->d3d11_device = NULL;
  196. }
  197. data->cur_swap = NULL;
  198. hlog("------------------ vulkan capture freed ------------------");
  199. }
  200. static void vk_remove_device(void *dev)
  201. {
  202. size_t idx = find_obj_idx(devices, GET_LDT(dev));
  203. if (idx == SIZE_MAX) {
  204. return;
  205. }
  206. struct vk_data *data = &device_data[idx];
  207. memset(data, 0, sizeof(*data));
  208. AcquireSRWLockExclusive(&mutex);
  209. devices[idx] = NULL;
  210. ReleaseSRWLockExclusive(&mutex);
  211. }
  212. /* ------------------------------------------------------------------------- */
  /* Node of an instance's singly linked list mapping a surface to a window. */
  struct vk_surf_data {
      /* Surface handle used as the lookup key. */
      VkSurfaceKHR surf;
      /* Window recorded for the surface when the node was inserted. */
      HWND hwnd;
      /* Next node, or NULL at the end of the list. */
      struct vk_surf_data *next;
  };
  /* Per-instance hook state; one entry of the file-level inst_data array. */
  struct vk_inst_data {
      /* NOTE(review): not read in the visible part of the file -- confirm. */
      bool valid;
      /* Instance-level Vulkan entry points. */
      struct vk_inst_funcs funcs;
      /* Head of the surface list; new nodes are pushed at the front. */
      struct vk_surf_data *surfaces;
  };
  223. static void *object_malloc(const VkAllocationCallbacks *ac, size_t size,
  224. size_t alignment)
  225. {
  226. return ac ? ac->pfnAllocation(ac->pUserData, size, alignment,
  227. VK_SYSTEM_ALLOCATION_SCOPE_OBJECT)
  228. : _aligned_malloc(size, alignment);
  229. }
  230. static void object_free(const VkAllocationCallbacks *ac, void *memory)
  231. {
  232. if (ac)
  233. ac->pfnFree(ac->pUserData, memory);
  234. else
  235. _aligned_free(memory);
  236. }
  237. static void insert_surf_data(struct vk_inst_data *data, VkSurfaceKHR surf,
  238. HWND hwnd, const VkAllocationCallbacks *ac)
  239. {
  240. struct vk_surf_data *surf_data = object_malloc(
  241. ac, sizeof(struct vk_surf_data), _Alignof(struct vk_surf_data));
  242. if (surf_data) {
  243. surf_data->surf = surf;
  244. surf_data->hwnd = hwnd;
  245. AcquireSRWLockExclusive(&mutex);
  246. struct vk_surf_data *next = data->surfaces;
  247. surf_data->next = next;
  248. data->surfaces = surf_data;
  249. ReleaseSRWLockExclusive(&mutex);
  250. }
  251. }
  252. static HWND find_surf_hwnd(struct vk_inst_data *data, VkSurfaceKHR surf)
  253. {
  254. HWND hwnd = NULL;
  255. AcquireSRWLockExclusive(&mutex);
  256. struct vk_surf_data *surf_data = data->surfaces;
  257. while (surf_data) {
  258. if (surf_data->surf == surf) {
  259. hwnd = surf_data->hwnd;
  260. break;
  261. }
  262. surf_data = surf_data->next;
  263. }
  264. ReleaseSRWLockExclusive(&mutex);
  265. return hwnd;
  266. }
  267. static void erase_surf_data(struct vk_inst_data *data, VkSurfaceKHR surf,
  268. const VkAllocationCallbacks *ac)
  269. {
  270. AcquireSRWLockExclusive(&mutex);
  271. struct vk_surf_data *current = data->surfaces;
  272. if (current->surf == surf) {
  273. data->surfaces = current->next;
  274. } else {
  275. struct vk_surf_data *previous;
  276. do {
  277. previous = current;
  278. current = current->next;
  279. } while (current && current->surf != surf);
  280. if (current)
  281. previous->next = current->next;
  282. }
  283. ReleaseSRWLockExclusive(&mutex);
  284. object_free(ac, current);
  285. }
  286. /* ------------------------------------------------------------------------- */
  287. static struct vk_inst_data inst_data[OBJ_MAX] = {0};
  288. static void *instances[OBJ_MAX] = {0};
  289. static struct vk_inst_data *get_inst_data(void *inst)
  290. {
  291. size_t idx = get_obj_idx(instances, GET_LDT(inst));
  292. if (idx == SIZE_MAX) {
  293. debug("out of instance slots");
  294. return NULL;
  295. }
  296. vulkan_seen = true;
  297. return &inst_data[idx];
  298. }
  299. static inline struct vk_inst_funcs *get_inst_funcs(void *inst)
  300. {
  301. struct vk_inst_data *data = get_inst_data(inst);
  302. return &data->funcs;
  303. }
  304. static void remove_instance(void *inst)
  305. {
  306. size_t idx = find_obj_idx(instances, inst);
  307. if (idx == SIZE_MAX) {
  308. return;
  309. }
  310. struct vk_inst_data *data = &inst_data[idx];
  311. memset(data, 0, sizeof(*data));
  312. AcquireSRWLockExclusive(&mutex);
  313. instances[idx] = NULL;
  314. ReleaseSRWLockExclusive(&mutex);
  315. }
  316. /* ======================================================================== */
  317. /* capture */
  318. static inline bool vk_shtex_init_d3d11(struct vk_data *data)
  319. {
  320. D3D_FEATURE_LEVEL level_used;
  321. IDXGIFactory1 *factory;
  322. IDXGIAdapter1 *adapter;
  323. HRESULT hr;
  324. HMODULE d3d11 = load_system_library("d3d11.dll");
  325. if (!d3d11) {
  326. flog("failed to load d3d11: %d", GetLastError());
  327. return false;
  328. }
  329. HMODULE dxgi = load_system_library("dxgi.dll");
  330. if (!dxgi) {
  331. flog("failed to load dxgi: %d", GetLastError());
  332. return false;
  333. }
  334. HRESULT(WINAPI * create_factory)
  335. (REFIID, void **) = (void *)GetProcAddress(dxgi, "CreateDXGIFactory1");
  336. if (!create_factory) {
  337. flog("failed to get CreateDXGIFactory1 address: %d",
  338. GetLastError());
  339. return false;
  340. }
  341. PFN_D3D11_CREATE_DEVICE create =
  342. (void *)GetProcAddress(d3d11, "D3D11CreateDevice");
  343. if (!create) {
  344. flog("failed to get D3D11CreateDevice address: %d",
  345. GetLastError());
  346. return false;
  347. }
  348. hr = create_factory(&IID_IDXGIFactory1, &factory);
  349. if (FAILED(hr)) {
  350. flog_hr("failed to create factory", hr);
  351. return false;
  352. }
  353. hr = IDXGIFactory1_EnumAdapters1(factory, 0, &adapter);
  354. IDXGIFactory1_Release(factory);
  355. if (FAILED(hr)) {
  356. flog_hr("failed to create adapter", hr);
  357. return false;
  358. }
  359. static const D3D_FEATURE_LEVEL feature_levels[] = {
  360. D3D_FEATURE_LEVEL_11_0,
  361. D3D_FEATURE_LEVEL_10_1,
  362. D3D_FEATURE_LEVEL_10_0,
  363. D3D_FEATURE_LEVEL_9_3,
  364. };
  365. hr = create((IDXGIAdapter *)adapter, D3D_DRIVER_TYPE_UNKNOWN, NULL, 0,
  366. feature_levels,
  367. sizeof(feature_levels) / sizeof(D3D_FEATURE_LEVEL),
  368. D3D11_SDK_VERSION, &data->d3d11_device, &level_used,
  369. &data->d3d11_context);
  370. IDXGIAdapter1_Release(adapter);
  371. if (FAILED(hr)) {
  372. flog_hr("failed to create device", hr);
  373. return false;
  374. }
  375. return true;
  376. }
  377. static inline bool vk_shtex_init_d3d11_tex(struct vk_data *data,
  378. struct vk_swap_data *swap)
  379. {
  380. IDXGIResource *dxgi_res;
  381. HRESULT hr;
  382. const UINT width = swap->image_extent.width;
  383. const UINT height = swap->image_extent.height;
  384. flog("OBS requesting %s texture format. capture dimensions: %ux%u",
  385. vk_format_to_str(swap->format), width, height);
  386. const DXGI_FORMAT format = vk_format_to_dxgi(swap->format);
  387. if (format == DXGI_FORMAT_UNKNOWN) {
  388. flog("cannot convert to DXGI format");
  389. return false;
  390. }
  391. D3D11_TEXTURE2D_DESC desc = {0};
  392. desc.Width = width;
  393. desc.Height = height;
  394. desc.MipLevels = 1;
  395. desc.ArraySize = 1;
  396. desc.Format = format;
  397. desc.SampleDesc.Count = 1;
  398. desc.SampleDesc.Quality = 0;
  399. desc.Usage = D3D11_USAGE_DEFAULT;
  400. desc.MiscFlags = D3D11_RESOURCE_MISC_SHARED;
  401. desc.BindFlags = D3D11_BIND_RENDER_TARGET | D3D11_BIND_SHADER_RESOURCE;
  402. hr = ID3D11Device_CreateTexture2D(data->d3d11_device, &desc, NULL,
  403. &swap->d3d11_tex);
  404. if (FAILED(hr)) {
  405. flog_hr("failed to create texture", hr);
  406. return false;
  407. }
  408. hr = ID3D11Texture2D_QueryInterface(swap->d3d11_tex, &IID_IDXGIResource,
  409. &dxgi_res);
  410. if (FAILED(hr)) {
  411. flog_hr("failed to get IDXGIResource", hr);
  412. return false;
  413. }
  414. hr = IDXGIResource_GetSharedHandle(dxgi_res, &swap->handle);
  415. IDXGIResource_Release(dxgi_res);
  416. if (FAILED(hr)) {
  417. flog_hr("failed to get shared handle", hr);
  418. return false;
  419. }
  420. return true;
  421. }
  422. static inline bool vk_shtex_init_vulkan_tex(struct vk_data *data,
  423. struct vk_swap_data *swap)
  424. {
  425. struct vk_device_funcs *funcs = &data->funcs;
  426. VkExternalMemoryFeatureFlags f =
  427. data->external_mem_props.externalMemoryFeatures;
  428. /* -------------------------------------------------------- */
  429. /* create texture */
  430. VkExternalMemoryImageCreateInfo emici;
  431. emici.sType = VK_STRUCTURE_TYPE_EXTERNAL_MEMORY_IMAGE_CREATE_INFO;
  432. emici.pNext = NULL;
  433. emici.handleTypes =
  434. VK_EXTERNAL_MEMORY_HANDLE_TYPE_D3D11_TEXTURE_KMT_BIT;
  435. VkImageCreateInfo ici;
  436. ici.sType = VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO;
  437. ici.pNext = &emici;
  438. ici.flags = 0;
  439. ici.imageType = VK_IMAGE_TYPE_2D;
  440. ici.format = swap->format;
  441. ici.extent.width = swap->image_extent.width;
  442. ici.extent.height = swap->image_extent.height;
  443. ici.extent.depth = 1;
  444. ici.mipLevels = 1;
  445. ici.arrayLayers = 1;
  446. ici.samples = VK_SAMPLE_COUNT_1_BIT;
  447. ici.tiling = VK_IMAGE_TILING_OPTIMAL;
  448. ici.usage = VK_IMAGE_USAGE_TRANSFER_DST_BIT |
  449. VK_IMAGE_USAGE_SAMPLED_BIT;
  450. ici.sharingMode = VK_SHARING_MODE_EXCLUSIVE;
  451. ici.queueFamilyIndexCount = 0;
  452. ici.pQueueFamilyIndices = 0;
  453. ici.initialLayout = VK_IMAGE_LAYOUT_UNDEFINED;
  454. VkResult res;
  455. res = funcs->CreateImage(data->device, &ici, data->ac,
  456. &swap->export_image);
  457. if (VK_SUCCESS != res) {
  458. flog("failed to CreateImage: %s", result_to_str(res));
  459. swap->export_image = VK_NULL_HANDLE;
  460. return false;
  461. }
  462. swap->layout_initialized = false;
  463. /* -------------------------------------------------------- */
  464. /* get image memory requirements */
  465. VkMemoryRequirements mr;
  466. bool use_gimr2 = f & VK_EXTERNAL_MEMORY_FEATURE_DEDICATED_ONLY_BIT;
  467. if (use_gimr2) {
  468. VkMemoryDedicatedRequirements mdr = {0};
  469. mdr.sType = VK_STRUCTURE_TYPE_MEMORY_DEDICATED_REQUIREMENTS;
  470. mdr.pNext = NULL;
  471. VkMemoryRequirements2 mr2 = {0};
  472. mr2.sType = VK_STRUCTURE_TYPE_MEMORY_REQUIREMENTS_2;
  473. mr2.pNext = &mdr;
  474. VkImageMemoryRequirementsInfo2 imri2 = {0};
  475. imri2.sType =
  476. VK_STRUCTURE_TYPE_IMAGE_MEMORY_REQUIREMENTS_INFO_2;
  477. imri2.pNext = NULL;
  478. imri2.image = swap->export_image;
  479. funcs->GetImageMemoryRequirements2(data->device, &imri2, &mr2);
  480. mr = mr2.memoryRequirements;
  481. } else {
  482. funcs->GetImageMemoryRequirements(data->device,
  483. swap->export_image, &mr);
  484. }
  485. /* -------------------------------------------------------- */
  486. /* get memory type index */
  487. struct vk_inst_funcs *ifuncs = get_inst_funcs(data->phy_device);
  488. VkPhysicalDeviceMemoryProperties pdmp;
  489. ifuncs->GetPhysicalDeviceMemoryProperties(data->phy_device, &pdmp);
  490. uint32_t mem_type_idx = 0;
  491. for (; mem_type_idx < pdmp.memoryTypeCount; mem_type_idx++) {
  492. if ((mr.memoryTypeBits & (1 << mem_type_idx)) &&
  493. (pdmp.memoryTypes[mem_type_idx].propertyFlags &
  494. VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT) ==
  495. VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT) {
  496. break;
  497. }
  498. }
  499. if (mem_type_idx == pdmp.memoryTypeCount) {
  500. flog("failed to get memory type index");
  501. funcs->DestroyImage(data->device, swap->export_image, data->ac);
  502. swap->export_image = VK_NULL_HANDLE;
  503. return false;
  504. }
  505. /* -------------------------------------------------------- */
  506. /* allocate memory */
  507. VkImportMemoryWin32HandleInfoKHR imw32hi;
  508. imw32hi.sType = VK_STRUCTURE_TYPE_IMPORT_MEMORY_WIN32_HANDLE_INFO_KHR;
  509. imw32hi.pNext = NULL;
  510. imw32hi.name = NULL;
  511. imw32hi.handleType =
  512. VK_EXTERNAL_MEMORY_HANDLE_TYPE_D3D11_TEXTURE_KMT_BIT;
  513. imw32hi.handle = swap->handle;
  514. VkMemoryAllocateInfo mai;
  515. mai.sType = VK_STRUCTURE_TYPE_MEMORY_ALLOCATE_INFO;
  516. mai.pNext = &imw32hi;
  517. mai.allocationSize = mr.size;
  518. mai.memoryTypeIndex = mem_type_idx;
  519. VkMemoryDedicatedAllocateInfo mdai;
  520. mdai.sType = VK_STRUCTURE_TYPE_MEMORY_DEDICATED_ALLOCATE_INFO;
  521. mdai.pNext = NULL;
  522. mdai.buffer = VK_NULL_HANDLE;
  523. if (data->external_mem_props.externalMemoryFeatures &
  524. VK_EXTERNAL_MEMORY_FEATURE_DEDICATED_ONLY_BIT) {
  525. mdai.image = swap->export_image;
  526. imw32hi.pNext = &mdai;
  527. }
  528. res = funcs->AllocateMemory(data->device, &mai, NULL,
  529. &swap->export_mem);
  530. if (VK_SUCCESS != res) {
  531. flog("failed to AllocateMemory: %s", result_to_str(res));
  532. funcs->DestroyImage(data->device, swap->export_image, data->ac);
  533. swap->export_image = VK_NULL_HANDLE;
  534. return false;
  535. }
  536. /* -------------------------------------------------------- */
  537. /* bind image memory */
  538. bool use_bi2 = f & VK_EXTERNAL_MEMORY_FEATURE_DEDICATED_ONLY_BIT;
  539. if (use_bi2) {
  540. VkBindImageMemoryInfo bimi = {0};
  541. bimi.sType = VK_STRUCTURE_TYPE_BIND_IMAGE_MEMORY_INFO;
  542. bimi.image = swap->export_image;
  543. bimi.memory = swap->export_mem;
  544. bimi.memoryOffset = 0;
  545. res = funcs->BindImageMemory2(data->device, 1, &bimi);
  546. } else {
  547. res = funcs->BindImageMemory(data->device, swap->export_image,
  548. swap->export_mem, 0);
  549. }
  550. if (VK_SUCCESS != res) {
  551. flog("%s failed: %s",
  552. use_bi2 ? "BindImageMemory2" : "BindImageMemory",
  553. result_to_str(res));
  554. funcs->DestroyImage(data->device, swap->export_image, data->ac);
  555. swap->export_image = VK_NULL_HANDLE;
  556. return false;
  557. }
  558. return true;
  559. }
  560. static bool vk_shtex_init(struct vk_data *data, HWND window,
  561. struct vk_swap_data *swap)
  562. {
  563. if (!vk_shtex_init_d3d11(data)) {
  564. return false;
  565. }
  566. if (!vk_shtex_init_d3d11_tex(data, swap)) {
  567. return false;
  568. }
  569. if (!vk_shtex_init_vulkan_tex(data, swap)) {
  570. return false;
  571. }
  572. data->cur_swap = swap;
  573. swap->captured = capture_init_shtex(
  574. &swap->shtex_info, window, swap->image_extent.width,
  575. swap->image_extent.height, swap->image_extent.width,
  576. swap->image_extent.height, (uint32_t)swap->format, false,
  577. (uintptr_t)swap->handle);
  578. if (swap->captured) {
  579. if (global_hook_info->force_shmem) {
  580. flog("shared memory capture currently "
  581. "unsupported; ignoring");
  582. }
  583. hlog("vulkan shared texture capture successful");
  584. return true;
  585. }
  586. return false;
  587. }
  588. static void vk_shtex_create_cmd_pool_objects(struct vk_data *data,
  589. uint32_t fam_idx,
  590. uint32_t image_count)
  591. {
  592. struct vk_cmd_pool_data *pool_data = &data->cmd_pools[fam_idx];
  593. VkCommandPoolCreateInfo cpci;
  594. cpci.sType = VK_STRUCTURE_TYPE_COMMAND_POOL_CREATE_INFO;
  595. cpci.pNext = NULL;
  596. cpci.flags = VK_COMMAND_POOL_CREATE_RESET_COMMAND_BUFFER_BIT;
  597. cpci.queueFamilyIndex = fam_idx;
  598. VkResult res = data->funcs.CreateCommandPool(
  599. data->device, &cpci, data->ac, &pool_data->cmd_pool);
  600. debug_res("CreateCommandPool", res);
  601. VkCommandBufferAllocateInfo cbai;
  602. cbai.sType = VK_STRUCTURE_TYPE_COMMAND_BUFFER_ALLOCATE_INFO;
  603. cbai.pNext = NULL;
  604. cbai.commandPool = pool_data->cmd_pool;
  605. cbai.level = VK_COMMAND_BUFFER_LEVEL_PRIMARY;
  606. cbai.commandBufferCount = image_count;
  607. res = data->funcs.AllocateCommandBuffers(data->device, &cbai,
  608. pool_data->cmd_buffers);
  609. debug_res("AllocateCommandBuffers", res);
  610. for (uint32_t image_index = 0; image_index < image_count;
  611. image_index++) {
  612. /* Dispatch table something or other. Well-designed API. */
  613. VkCommandBuffer cmd_buffer =
  614. pool_data->cmd_buffers[image_index];
  615. *(void **)cmd_buffer = *(void **)(data->device);
  616. VkFence *fence = &pool_data->fences[image_index];
  617. VkFenceCreateInfo fci = {0};
  618. fci.sType = VK_STRUCTURE_TYPE_FENCE_CREATE_INFO;
  619. fci.pNext = NULL;
  620. fci.flags = 0;
  621. res = data->funcs.CreateFence(data->device, &fci, data->ac,
  622. fence);
  623. debug_res("CreateFence", res);
  624. }
  625. pool_data->image_count = image_count;
  626. }
  627. static void vk_shtex_destroy_fence(struct vk_data *data, bool *cmd_buffer_busy,
  628. VkFence *fence)
  629. {
  630. VkDevice device = data->device;
  631. if (*cmd_buffer_busy) {
  632. data->funcs.WaitForFences(device, 1, fence, VK_TRUE, ~0ull);
  633. *cmd_buffer_busy = false;
  634. }
  635. data->funcs.DestroyFence(device, *fence, data->ac);
  636. *fence = VK_NULL_HANDLE;
  637. }
  638. static void
  639. vk_shtex_destroy_cmd_pool_objects(struct vk_data *data,
  640. struct vk_cmd_pool_data *pool_data)
  641. {
  642. for (uint32_t image_idx = 0; image_idx < pool_data->image_count;
  643. image_idx++) {
  644. bool *cmd_buffer_busy = &pool_data->cmd_buffer_busy[image_idx];
  645. VkFence *fence = &pool_data->fences[image_idx];
  646. vk_shtex_destroy_fence(data, cmd_buffer_busy, fence);
  647. }
  648. data->funcs.DestroyCommandPool(data->device, pool_data->cmd_pool,
  649. data->ac);
  650. pool_data->cmd_pool = VK_NULL_HANDLE;
  651. pool_data->image_count = 0;
  652. }
  653. static void vk_shtex_capture(struct vk_data *data,
  654. struct vk_device_funcs *funcs,
  655. struct vk_swap_data *swap, uint32_t idx,
  656. VkQueue queue, const VkPresentInfoKHR *info)
  657. {
  658. VkResult res = VK_SUCCESS;
  659. VkCommandBufferBeginInfo begin_info;
  660. begin_info.sType = VK_STRUCTURE_TYPE_COMMAND_BUFFER_BEGIN_INFO;
  661. begin_info.pNext = NULL;
  662. begin_info.flags = VK_COMMAND_BUFFER_USAGE_ONE_TIME_SUBMIT_BIT;
  663. begin_info.pInheritanceInfo = NULL;
  664. VkImageMemoryBarrier mb[2];
  665. VkImageMemoryBarrier *src_mb = &mb[0];
  666. VkImageMemoryBarrier *dst_mb = &mb[1];
  667. /* ------------------------------------------------------ */
  668. /* do image copy */
  669. const uint32_t image_index = info->pImageIndices[idx];
  670. VkImage cur_backbuffer = swap->swap_images[image_index];
  671. uint32_t fam_idx = 0;
  672. for (uint32_t i = 0; i < data->queue_count; i++) {
  673. if (data->queues[i].queue == queue)
  674. fam_idx = data->queues[i].fam_idx;
  675. }
  676. if (fam_idx >= _countof(data->cmd_pools))
  677. return;
  678. struct vk_cmd_pool_data *pool_data = &data->cmd_pools[fam_idx];
  679. VkCommandPool *pool = &pool_data->cmd_pool;
  680. const uint32_t image_count = swap->image_count;
  681. if (pool_data->image_count < image_count) {
  682. if (*pool != VK_NULL_HANDLE)
  683. vk_shtex_destroy_cmd_pool_objects(data, pool_data);
  684. vk_shtex_create_cmd_pool_objects(data, fam_idx, image_count);
  685. }
  686. vk_shtex_clear_fence(data, pool_data, image_index);
  687. VkCommandBuffer cmd_buffer = pool_data->cmd_buffers[image_index];
  688. res = funcs->BeginCommandBuffer(cmd_buffer, &begin_info);
  689. #ifdef MORE_DEBUGGING
  690. debug_res("BeginCommandBuffer", res);
  691. #endif
  692. /* ------------------------------------------------------ */
  693. /* transition shared texture if necessary */
  694. if (!swap->layout_initialized) {
  695. VkImageMemoryBarrier imb;
  696. imb.sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER;
  697. imb.pNext = NULL;
  698. imb.srcAccessMask = 0;
  699. imb.dstAccessMask = 0;
  700. imb.oldLayout = VK_IMAGE_LAYOUT_UNDEFINED;
  701. imb.newLayout = VK_IMAGE_LAYOUT_GENERAL;
  702. imb.srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
  703. imb.dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
  704. imb.image = swap->export_image;
  705. imb.subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT;
  706. imb.subresourceRange.baseMipLevel = 0;
  707. imb.subresourceRange.levelCount = 1;
  708. imb.subresourceRange.baseArrayLayer = 0;
  709. imb.subresourceRange.layerCount = 1;
  710. funcs->CmdPipelineBarrier(cmd_buffer,
  711. VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT,
  712. VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT, 0,
  713. 0, NULL, 0, NULL, 1, &imb);
  714. swap->layout_initialized = true;
  715. }
  716. /* ------------------------------------------------------ */
  717. /* transition cur_backbuffer to transfer source state */
  718. src_mb->sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER;
  719. src_mb->pNext = NULL;
  720. src_mb->srcAccessMask = VK_ACCESS_MEMORY_READ_BIT;
  721. src_mb->dstAccessMask = VK_ACCESS_TRANSFER_READ_BIT;
  722. src_mb->oldLayout = VK_IMAGE_LAYOUT_PRESENT_SRC_KHR;
  723. src_mb->newLayout = VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL;
  724. src_mb->srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
  725. src_mb->dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED;
  726. src_mb->image = cur_backbuffer;
  727. src_mb->subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT;
  728. src_mb->subresourceRange.baseMipLevel = 0;
  729. src_mb->subresourceRange.levelCount = 1;
  730. src_mb->subresourceRange.baseArrayLayer = 0;
  731. src_mb->subresourceRange.layerCount = 1;
  732. /* ------------------------------------------------------ */
  733. /* transition exportedTexture to transfer dest state */
  734. dst_mb->sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER;
  735. dst_mb->pNext = NULL;
  736. dst_mb->srcAccessMask = 0;
  737. dst_mb->dstAccessMask = VK_ACCESS_TRANSFER_WRITE_BIT;
  738. dst_mb->oldLayout = VK_IMAGE_LAYOUT_GENERAL;
  739. dst_mb->newLayout = VK_IMAGE_LAYOUT_TRANSFER_DST_OPTIMAL;
  740. dst_mb->srcQueueFamilyIndex = VK_QUEUE_FAMILY_EXTERNAL;
  741. dst_mb->dstQueueFamilyIndex = fam_idx;
  742. dst_mb->image = swap->export_image;
  743. dst_mb->subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT;
  744. dst_mb->subresourceRange.baseMipLevel = 0;
  745. dst_mb->subresourceRange.levelCount = 1;
  746. dst_mb->subresourceRange.baseArrayLayer = 0;
  747. dst_mb->subresourceRange.layerCount = 1;
  748. funcs->CmdPipelineBarrier(cmd_buffer,
  749. VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT,
  750. VK_PIPELINE_STAGE_TRANSFER_BIT, 0, 0, NULL, 0,
  751. NULL, 2, mb);
  752. /* ------------------------------------------------------ */
  753. /* copy cur_backbuffer's content to our interop image */
  754. VkImageCopy cpy;
  755. cpy.srcSubresource.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT;
  756. cpy.srcSubresource.mipLevel = 0;
  757. cpy.srcSubresource.baseArrayLayer = 0;
  758. cpy.srcSubresource.layerCount = 1;
  759. cpy.srcOffset.x = 0;
  760. cpy.srcOffset.y = 0;
  761. cpy.srcOffset.z = 0;
  762. cpy.dstSubresource.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT;
  763. cpy.dstSubresource.mipLevel = 0;
  764. cpy.dstSubresource.baseArrayLayer = 0;
  765. cpy.dstSubresource.layerCount = 1;
  766. cpy.dstOffset.x = 0;
  767. cpy.dstOffset.y = 0;
  768. cpy.dstOffset.z = 0;
  769. cpy.extent.width = swap->image_extent.width;
  770. cpy.extent.height = swap->image_extent.height;
  771. cpy.extent.depth = 1;
  772. funcs->CmdCopyImage(cmd_buffer, cur_backbuffer,
  773. VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL,
  774. swap->export_image,
  775. VK_IMAGE_LAYOUT_TRANSFER_DST_OPTIMAL, 1, &cpy);
  776. /* ------------------------------------------------------ */
  777. /* Restore the swap chain image layout to what it was
  778. * before. This may not be strictly needed, but it is
  779. * generally good to restore things to their original
  780. * state. */
  781. src_mb->srcAccessMask = VK_ACCESS_TRANSFER_READ_BIT;
  782. src_mb->dstAccessMask = VK_ACCESS_MEMORY_READ_BIT;
  783. src_mb->oldLayout = VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL;
  784. src_mb->newLayout = VK_IMAGE_LAYOUT_PRESENT_SRC_KHR;
  785. dst_mb->srcAccessMask = VK_ACCESS_TRANSFER_WRITE_BIT;
  786. dst_mb->dstAccessMask = 0;
  787. dst_mb->oldLayout = VK_IMAGE_LAYOUT_TRANSFER_DST_OPTIMAL;
  788. dst_mb->newLayout = VK_IMAGE_LAYOUT_GENERAL;
  789. dst_mb->srcQueueFamilyIndex = fam_idx;
  790. dst_mb->dstQueueFamilyIndex = VK_QUEUE_FAMILY_EXTERNAL;
  791. funcs->CmdPipelineBarrier(cmd_buffer, VK_PIPELINE_STAGE_TRANSFER_BIT,
  792. VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT |
  793. VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT,
  794. 0, 0, NULL, 0, NULL, 2, mb);
  795. funcs->EndCommandBuffer(cmd_buffer);
  796. /* ------------------------------------------------------ */
  797. VkSubmitInfo submit_info;
  798. submit_info.sType = VK_STRUCTURE_TYPE_SUBMIT_INFO;
  799. submit_info.pNext = NULL;
  800. submit_info.waitSemaphoreCount = 0;
  801. submit_info.pWaitSemaphores = NULL;
  802. submit_info.pWaitDstStageMask = NULL;
  803. submit_info.commandBufferCount = 1;
  804. submit_info.pCommandBuffers = &cmd_buffer;
  805. submit_info.signalSemaphoreCount = 0;
  806. submit_info.pSignalSemaphores = NULL;
  807. VkFence fence = pool_data->fences[image_index];
  808. res = funcs->QueueSubmit(queue, 1, &submit_info, fence);
  809. #ifdef MORE_DEBUGGING
  810. debug_res("QueueSubmit", res);
  811. #endif
  812. if (res == VK_SUCCESS)
  813. pool_data->cmd_buffer_busy[image_index] = true;
  814. }
  815. static inline bool valid_rect(struct vk_swap_data *swap)
  816. {
  817. return !!swap->image_extent.width && !!swap->image_extent.height;
  818. }
  819. static void vk_capture(struct vk_data *data, VkQueue queue,
  820. const VkPresentInfoKHR *info)
  821. {
  822. struct vk_swap_data *swap = NULL;
  823. HWND window = NULL;
  824. uint32_t idx = 0;
  825. #ifdef MORE_DEBUGGING
  826. debug("QueuePresentKHR called on "
  827. "devicekey %p, swapchain count %d",
  828. &data->funcs, info->swapchainCount);
  829. #endif
  830. /* use first swap chain associated with a window */
  831. for (; idx < info->swapchainCount; idx++) {
  832. struct vk_swap_data *cur_swap =
  833. get_swap_data(data, info->pSwapchains[idx]);
  834. window = cur_swap->hwnd;
  835. if (!!window) {
  836. swap = cur_swap;
  837. break;
  838. }
  839. }
  840. if (!window) {
  841. return;
  842. }
  843. if (capture_should_stop()) {
  844. vk_shtex_free(data);
  845. }
  846. if (capture_should_init()) {
  847. if (valid_rect(swap) && !vk_shtex_init(data, window, swap)) {
  848. vk_shtex_free(data);
  849. data->valid = false;
  850. flog("vk_shtex_init failed");
  851. }
  852. }
  853. if (capture_ready()) {
  854. if (swap != data->cur_swap) {
  855. vk_shtex_free(data);
  856. return;
  857. }
  858. vk_shtex_capture(data, &data->funcs, swap, idx, queue, info);
  859. }
  860. }
  861. static VkResult VKAPI OBS_QueuePresentKHR(VkQueue queue,
  862. const VkPresentInfoKHR *info)
  863. {
  864. struct vk_data *data = get_device_data(queue);
  865. struct vk_device_funcs *funcs = &data->funcs;
  866. if (data->valid) {
  867. vk_capture(data, queue, info);
  868. }
  869. return funcs->QueuePresentKHR(queue, info);
  870. }
  871. /* ======================================================================== */
  872. /* setup hooks */
  873. static inline bool is_inst_link_info(VkLayerInstanceCreateInfo *lici)
  874. {
  875. return lici->sType == VK_STRUCTURE_TYPE_LOADER_INSTANCE_CREATE_INFO &&
  876. lici->function == VK_LAYER_LINK_INFO;
  877. }
  878. static VkResult VKAPI OBS_CreateInstance(const VkInstanceCreateInfo *cinfo,
  879. const VkAllocationCallbacks *ac,
  880. VkInstance *p_inst)
  881. {
  882. VkInstanceCreateInfo info = *cinfo;
  883. bool funcs_not_found = false;
  884. /* -------------------------------------------------------- */
  885. /* step through chain until we get to the link info */
  886. VkLayerInstanceCreateInfo *lici = (void *)info.pNext;
  887. while (lici && !is_inst_link_info(lici)) {
  888. lici = (VkLayerInstanceCreateInfo *)lici->pNext;
  889. }
  890. if (lici == NULL) {
  891. return VK_ERROR_INITIALIZATION_FAILED;
  892. }
  893. PFN_vkGetInstanceProcAddr gpa =
  894. lici->u.pLayerInfo->pfnNextGetInstanceProcAddr;
  895. /* -------------------------------------------------------- */
  896. /* move chain on for next layer */
  897. lici->u.pLayerInfo = lici->u.pLayerInfo->pNext;
  898. /* -------------------------------------------------------- */
  899. /* (HACK) Set api version to 1.1 if set to 1.0 */
  900. /* We do this to get our extensions working properly */
  901. VkApplicationInfo ai;
  902. if (info.pApplicationInfo) {
  903. ai = *info.pApplicationInfo;
  904. if (ai.apiVersion < VK_API_VERSION_1_1)
  905. ai.apiVersion = VK_API_VERSION_1_1;
  906. } else {
  907. ai.sType = VK_STRUCTURE_TYPE_APPLICATION_INFO;
  908. ai.pNext = NULL;
  909. ai.pApplicationName = NULL;
  910. ai.applicationVersion = 0;
  911. ai.pEngineName = NULL;
  912. ai.engineVersion = 0;
  913. ai.apiVersion = VK_API_VERSION_1_1;
  914. }
  915. info.pApplicationInfo = &ai;
  916. /* -------------------------------------------------------- */
  917. /* create instance */
  918. PFN_vkCreateInstance create = (void *)gpa(NULL, "vkCreateInstance");
  919. VkResult res = create(&info, ac, p_inst);
  920. VkInstance inst = *p_inst;
  921. /* -------------------------------------------------------- */
  922. /* fetch the functions we need */
  923. struct vk_inst_data *data = get_inst_data(inst);
  924. struct vk_inst_funcs *funcs = &data->funcs;
  925. #define GETADDR(x) \
  926. do { \
  927. funcs->x = (void *)gpa(inst, "vk" #x); \
  928. if (!funcs->x) { \
  929. flog("could not get instance " \
  930. "address for %s", \
  931. #x); \
  932. funcs_not_found = true; \
  933. } \
  934. } while (false)
  935. GETADDR(GetInstanceProcAddr);
  936. GETADDR(DestroyInstance);
  937. GETADDR(CreateWin32SurfaceKHR);
  938. GETADDR(DestroySurfaceKHR);
  939. GETADDR(GetPhysicalDeviceMemoryProperties);
  940. GETADDR(GetPhysicalDeviceImageFormatProperties2);
  941. GETADDR(EnumerateDeviceExtensionProperties);
  942. #undef GETADDR
  943. data->valid = !funcs_not_found;
  944. return res;
  945. }
  946. static VkResult VKAPI OBS_DestroyInstance(VkInstance instance,
  947. const VkAllocationCallbacks *ac)
  948. {
  949. struct vk_inst_funcs *funcs = get_inst_funcs(instance);
  950. funcs->DestroyInstance(instance, ac);
  951. remove_instance(instance);
  952. return VK_SUCCESS;
  953. }
  954. static bool
  955. vk_shared_tex_supported(struct vk_inst_funcs *funcs,
  956. VkPhysicalDevice phy_device, VkFormat format,
  957. VkImageUsageFlags usage,
  958. VkExternalMemoryProperties *external_mem_props)
  959. {
  960. VkPhysicalDeviceImageFormatInfo2 info;
  961. VkPhysicalDeviceExternalImageFormatInfo external_info;
  962. external_info.sType =
  963. VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_EXTERNAL_IMAGE_FORMAT_INFO;
  964. external_info.pNext = NULL;
  965. external_info.handleType =
  966. VK_EXTERNAL_MEMORY_HANDLE_TYPE_D3D11_TEXTURE_KMT_BIT;
  967. info.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_IMAGE_FORMAT_INFO_2;
  968. info.pNext = &external_info;
  969. info.format = format;
  970. info.type = VK_IMAGE_TYPE_2D;
  971. info.tiling = VK_IMAGE_TILING_OPTIMAL;
  972. info.flags = 0;
  973. info.usage = usage;
  974. VkExternalImageFormatProperties external_props = {0};
  975. external_props.sType =
  976. VK_STRUCTURE_TYPE_EXTERNAL_IMAGE_FORMAT_PROPERTIES;
  977. external_props.pNext = NULL;
  978. VkImageFormatProperties2 props = {0};
  979. props.sType = VK_STRUCTURE_TYPE_IMAGE_FORMAT_PROPERTIES_2;
  980. props.pNext = &external_props;
  981. VkResult result = funcs->GetPhysicalDeviceImageFormatProperties2(
  982. phy_device, &info, &props);
  983. *external_mem_props = external_props.externalMemoryProperties;
  984. const VkExternalMemoryFeatureFlags features =
  985. external_mem_props->externalMemoryFeatures;
  986. return ((VK_SUCCESS == result) &&
  987. (features & VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT));
  988. }
  989. static inline bool is_device_link_info(VkLayerDeviceCreateInfo *lici)
  990. {
  991. return lici->sType == VK_STRUCTURE_TYPE_LOADER_DEVICE_CREATE_INFO &&
  992. lici->function == VK_LAYER_LINK_INFO;
  993. }
  994. static VkResult VKAPI OBS_CreateDevice(VkPhysicalDevice phy_device,
  995. const VkDeviceCreateInfo *info,
  996. const VkAllocationCallbacks *ac,
  997. VkDevice *p_device)
  998. {
  999. struct vk_inst_data *idata = get_inst_data(phy_device);
  1000. struct vk_inst_funcs *ifuncs = &idata->funcs;
  1001. struct vk_data *data = NULL;
  1002. VkResult ret = VK_ERROR_INITIALIZATION_FAILED;
  1003. VkLayerDeviceCreateInfo *ldci = (void *)info->pNext;
  1004. /* -------------------------------------------------------- */
  1005. /* step through chain until we get to the link info */
  1006. while (ldci && !is_device_link_info(ldci)) {
  1007. ldci = (VkLayerDeviceCreateInfo *)ldci->pNext;
  1008. }
  1009. if (!ldci) {
  1010. goto fail;
  1011. }
  1012. PFN_vkGetInstanceProcAddr gipa;
  1013. PFN_vkGetDeviceProcAddr gdpa;
  1014. gipa = ldci->u.pLayerInfo->pfnNextGetInstanceProcAddr;
  1015. gdpa = ldci->u.pLayerInfo->pfnNextGetDeviceProcAddr;
  1016. /* -------------------------------------------------------- */
  1017. /* move chain on for next layer */
  1018. ldci->u.pLayerInfo = ldci->u.pLayerInfo->pNext;
  1019. /* -------------------------------------------------------- */
  1020. /* create device and initialize hook data */
  1021. PFN_vkCreateDevice createFunc =
  1022. (PFN_vkCreateDevice)gipa(VK_NULL_HANDLE, "vkCreateDevice");
  1023. ret = createFunc(phy_device, info, ac, p_device);
  1024. if (ret != VK_SUCCESS) {
  1025. goto fail;
  1026. }
  1027. VkDevice device = *p_device;
  1028. data = get_device_data(*p_device);
  1029. struct vk_device_funcs *dfuncs = &data->funcs;
  1030. data->valid = false; /* set true below if it doesn't go to fail */
  1031. data->phy_device = phy_device;
  1032. data->device = device;
  1033. /* -------------------------------------------------------- */
  1034. /* fetch the functions we need */
  1035. bool funcs_not_found = false;
  1036. #define GETADDR(x) \
  1037. do { \
  1038. dfuncs->x = (void *)gdpa(device, "vk" #x); \
  1039. if (!dfuncs->x) { \
  1040. flog("could not get device " \
  1041. "address for %s", \
  1042. #x); \
  1043. funcs_not_found = true; \
  1044. } \
  1045. } while (false)
  1046. #define GETADDR_OPTIONAL(x) \
  1047. do { \
  1048. dfuncs->x = (void *)gdpa(device, "vk" #x); \
  1049. } while (false)
  1050. GETADDR(GetDeviceProcAddr);
  1051. GETADDR(DestroyDevice);
  1052. GETADDR(CreateSwapchainKHR);
  1053. GETADDR(DestroySwapchainKHR);
  1054. GETADDR(QueuePresentKHR);
  1055. GETADDR(AllocateMemory);
  1056. GETADDR(FreeMemory);
  1057. GETADDR(BindImageMemory);
  1058. GETADDR(BindImageMemory2);
  1059. GETADDR(GetSwapchainImagesKHR);
  1060. GETADDR(CreateImage);
  1061. GETADDR(DestroyImage);
  1062. GETADDR(GetImageMemoryRequirements);
  1063. GETADDR(GetImageMemoryRequirements2);
  1064. GETADDR(BeginCommandBuffer);
  1065. GETADDR(EndCommandBuffer);
  1066. GETADDR(CmdCopyImage);
  1067. GETADDR(CmdPipelineBarrier);
  1068. GETADDR(GetDeviceQueue);
  1069. GETADDR(QueueSubmit);
  1070. GETADDR(CreateCommandPool);
  1071. GETADDR(DestroyCommandPool);
  1072. GETADDR(AllocateCommandBuffers);
  1073. GETADDR(CreateFence);
  1074. GETADDR(DestroyFence);
  1075. GETADDR(WaitForFences);
  1076. GETADDR(ResetFences);
  1077. #undef GETADDR_OPTIONAL
  1078. #undef GETADDR
  1079. if (funcs_not_found) {
  1080. goto fail;
  1081. }
  1082. if (!idata->valid) {
  1083. flog("instance not valid");
  1084. goto fail;
  1085. }
  1086. const char *required_device_extensions[] = {
  1087. VK_KHR_EXTERNAL_MEMORY_WIN32_EXTENSION_NAME};
  1088. uint32_t device_extension_count = 0;
  1089. ret = ifuncs->EnumerateDeviceExtensionProperties(
  1090. phy_device, NULL, &device_extension_count, NULL);
  1091. if (ret != VK_SUCCESS)
  1092. goto fail;
  1093. VkExtensionProperties *device_extensions = _malloca(
  1094. sizeof(VkExtensionProperties) * device_extension_count);
  1095. ret = ifuncs->EnumerateDeviceExtensionProperties(
  1096. phy_device, NULL, &device_extension_count, device_extensions);
  1097. if (ret != VK_SUCCESS)
  1098. goto fail;
  1099. bool extensions_found = true;
  1100. for (uint32_t i = 0; i < _countof(required_device_extensions); i++) {
  1101. const char *const required_extension =
  1102. required_device_extensions[i];
  1103. bool found = false;
  1104. for (uint32_t j = 0; j < device_extension_count; j++) {
  1105. if (!strcmp(required_extension,
  1106. device_extensions[j].extensionName)) {
  1107. found = true;
  1108. break;
  1109. }
  1110. }
  1111. if (!found) {
  1112. flog("missing device extension: %s",
  1113. required_extension);
  1114. extensions_found = false;
  1115. }
  1116. }
  1117. if (!extensions_found)
  1118. goto fail;
  1119. VkFormat format = VK_FORMAT_R8G8B8A8_UNORM;
  1120. VkImageUsageFlags usage = VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT |
  1121. VK_IMAGE_USAGE_TRANSFER_DST_BIT;
  1122. if (!vk_shared_tex_supported(ifuncs, phy_device, format, usage,
  1123. &data->external_mem_props)) {
  1124. flog("texture sharing is not supported");
  1125. goto fail;
  1126. }
  1127. data->inst_data = idata;
  1128. data->ac = NULL;
  1129. if (ac) {
  1130. data->ac_storage = *ac;
  1131. data->ac = &data->ac_storage;
  1132. }
  1133. data->valid = true;
  1134. fail:
  1135. return ret;
  1136. }
  1137. static void VKAPI OBS_DestroyDevice(VkDevice device,
  1138. const VkAllocationCallbacks *ac)
  1139. {
  1140. struct vk_data *data = get_device_data(device);
  1141. if (!data)
  1142. return;
  1143. if (data->valid) {
  1144. for (uint32_t fam_idx = 0; fam_idx < _countof(data->cmd_pools);
  1145. fam_idx++) {
  1146. struct vk_cmd_pool_data *pool_data =
  1147. &data->cmd_pools[fam_idx];
  1148. if (pool_data->cmd_pool != VK_NULL_HANDLE) {
  1149. vk_shtex_destroy_cmd_pool_objects(data,
  1150. pool_data);
  1151. }
  1152. }
  1153. }
  1154. data->queue_count = 0;
  1155. vk_remove_device(device);
  1156. data->funcs.DestroyDevice(device, ac);
  1157. }
  1158. static VkResult VKAPI
  1159. OBS_CreateSwapchainKHR(VkDevice device, const VkSwapchainCreateInfoKHR *cinfo,
  1160. const VkAllocationCallbacks *ac, VkSwapchainKHR *p_sc)
  1161. {
  1162. struct vk_data *data = get_device_data(device);
  1163. VkSwapchainCreateInfoKHR info = *cinfo;
  1164. if (data->valid)
  1165. info.imageUsage |= VK_IMAGE_USAGE_TRANSFER_SRC_BIT;
  1166. struct vk_device_funcs *funcs = &data->funcs;
  1167. VkResult res = funcs->CreateSwapchainKHR(device, &info, ac, p_sc);
  1168. debug_res("CreateSwapchainKHR", res);
  1169. if ((res != VK_SUCCESS) || !data->valid)
  1170. return res;
  1171. VkSwapchainKHR sc = *p_sc;
  1172. uint32_t count = 0;
  1173. res = funcs->GetSwapchainImagesKHR(data->device, sc, &count, NULL);
  1174. debug_res("GetSwapchainImagesKHR", res);
  1175. struct vk_swap_data *swap = get_new_swap_data(data);
  1176. if (count > 0) {
  1177. if (count > OBJ_MAX)
  1178. count = OBJ_MAX;
  1179. res = funcs->GetSwapchainImagesKHR(data->device, sc, &count,
  1180. swap->swap_images);
  1181. debug_res("GetSwapchainImagesKHR", res);
  1182. }
  1183. swap->sc = sc;
  1184. swap->image_extent = cinfo->imageExtent;
  1185. swap->format = cinfo->imageFormat;
  1186. swap->hwnd = find_surf_hwnd(data->inst_data, cinfo->surface);
  1187. swap->image_count = count;
  1188. swap->d3d11_tex = NULL;
  1189. return VK_SUCCESS;
  1190. }
  1191. static void VKAPI OBS_DestroySwapchainKHR(VkDevice device, VkSwapchainKHR sc,
  1192. const VkAllocationCallbacks *ac)
  1193. {
  1194. struct vk_data *data = get_device_data(device);
  1195. struct vk_device_funcs *funcs = &data->funcs;
  1196. if (data->valid) {
  1197. struct vk_swap_data *swap = get_swap_data(data, sc);
  1198. if (swap) {
  1199. if (data->cur_swap == swap) {
  1200. vk_shtex_free(data);
  1201. }
  1202. swap->sc = VK_NULL_HANDLE;
  1203. swap->hwnd = NULL;
  1204. }
  1205. }
  1206. funcs->DestroySwapchainKHR(device, sc, ac);
  1207. }
  1208. static void VKAPI OBS_GetDeviceQueue(VkDevice device, uint32_t queueFamilyIndex,
  1209. uint32_t queueIndex, VkQueue *pQueue)
  1210. {
  1211. struct vk_data *data = get_device_data(device);
  1212. struct vk_device_funcs *funcs = &data->funcs;
  1213. funcs->GetDeviceQueue(device, queueFamilyIndex, queueIndex, pQueue);
  1214. for (uint32_t i = 0; i < data->queue_count; ++i) {
  1215. if (data->queues[i].queue == *pQueue)
  1216. return;
  1217. }
  1218. if (data->queue_count < _countof(data->queues)) {
  1219. data->queues[data->queue_count].queue = *pQueue;
  1220. data->queues[data->queue_count].fam_idx = queueFamilyIndex;
  1221. ++data->queue_count;
  1222. }
  1223. }
  1224. static VkResult VKAPI OBS_CreateWin32SurfaceKHR(
  1225. VkInstance inst, const VkWin32SurfaceCreateInfoKHR *info,
  1226. const VkAllocationCallbacks *ac, VkSurfaceKHR *surf)
  1227. {
  1228. struct vk_inst_data *data = get_inst_data(inst);
  1229. struct vk_inst_funcs *funcs = &data->funcs;
  1230. VkResult res = funcs->CreateWin32SurfaceKHR(inst, info, ac, surf);
  1231. if (res == VK_SUCCESS)
  1232. insert_surf_data(data, *surf, info->hwnd, ac);
  1233. return res;
  1234. }
  1235. static void VKAPI OBS_DestroySurfaceKHR(VkInstance inst, VkSurfaceKHR surf,
  1236. const VkAllocationCallbacks *ac)
  1237. {
  1238. struct vk_inst_data *data = get_inst_data(inst);
  1239. struct vk_inst_funcs *funcs = &data->funcs;
  1240. erase_surf_data(data, surf, ac);
  1241. funcs->DestroySurfaceKHR(inst, surf, ac);
  1242. }
  1243. #define GETPROCADDR(func) \
  1244. if (!strcmp(name, "vk" #func)) \
  1245. return (VkFunc)&OBS_##func;
  1246. static VkFunc VKAPI OBS_GetDeviceProcAddr(VkDevice dev, const char *name)
  1247. {
  1248. struct vk_data *data = get_device_data(dev);
  1249. struct vk_device_funcs *funcs = &data->funcs;
  1250. debug_procaddr("vkGetDeviceProcAddr(%p, \"%s\")", dev, name);
  1251. GETPROCADDR(GetDeviceProcAddr);
  1252. GETPROCADDR(CreateDevice);
  1253. GETPROCADDR(DestroyDevice);
  1254. GETPROCADDR(CreateSwapchainKHR);
  1255. GETPROCADDR(DestroySwapchainKHR);
  1256. GETPROCADDR(QueuePresentKHR);
  1257. GETPROCADDR(GetDeviceQueue);
  1258. if (funcs->GetDeviceProcAddr == NULL)
  1259. return NULL;
  1260. return funcs->GetDeviceProcAddr(dev, name);
  1261. }
  1262. static VkFunc VKAPI OBS_GetInstanceProcAddr(VkInstance inst, const char *name)
  1263. {
  1264. debug_procaddr("vkGetInstanceProcAddr(%p, \"%s\")", inst, name);
  1265. /* instance chain functions we intercept */
  1266. GETPROCADDR(GetInstanceProcAddr);
  1267. GETPROCADDR(CreateInstance);
  1268. GETPROCADDR(DestroyInstance);
  1269. GETPROCADDR(CreateWin32SurfaceKHR);
  1270. GETPROCADDR(DestroySurfaceKHR);
  1271. /* device chain functions we intercept */
  1272. GETPROCADDR(GetDeviceProcAddr);
  1273. GETPROCADDR(CreateDevice);
  1274. GETPROCADDR(DestroyDevice);
  1275. struct vk_inst_funcs *funcs = get_inst_funcs(inst);
  1276. if (funcs->GetInstanceProcAddr == NULL)
  1277. return NULL;
  1278. return funcs->GetInstanceProcAddr(inst, name);
  1279. }
  1280. #undef GETPROCADDR
  1281. EXPORT VkResult VKAPI OBS_Negotiate(VkNegotiateLayerInterface *nli)
  1282. {
  1283. if (nli->loaderLayerInterfaceVersion >= 2) {
  1284. nli->sType = LAYER_NEGOTIATE_INTERFACE_STRUCT;
  1285. nli->pNext = NULL;
  1286. nli->pfnGetInstanceProcAddr = OBS_GetInstanceProcAddr;
  1287. nli->pfnGetDeviceProcAddr = OBS_GetDeviceProcAddr;
  1288. nli->pfnGetPhysicalDeviceProcAddr = NULL;
  1289. }
  1290. const uint32_t cur_ver = CURRENT_LOADER_LAYER_INTERFACE_VERSION;
  1291. if (nli->loaderLayerInterfaceVersion > cur_ver) {
  1292. nli->loaderLayerInterfaceVersion = cur_ver;
  1293. }
  1294. return VK_SUCCESS;
  1295. }
  1296. bool hook_vulkan(void)
  1297. {
  1298. static bool hooked = false;
  1299. if (!hooked && vulkan_seen) {
  1300. hlog("Hooked Vulkan");
  1301. hooked = true;
  1302. }
  1303. return hooked;
  1304. }