jim-nvenc.c 26 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036
  1. #include "jim-nvenc.h"
  2. #include <util/circlebuf.h>
  3. #include <util/darray.h>
  4. #include <util/dstr.h>
  5. #include <obs-avc.h>
  6. #include <libavutil/rational.h>
  7. #define INITGUID
  8. #include <dxgi.h>
  9. #include <d3d11.h>
  10. #include <d3d11_1.h>
  11. /* ========================================================================= */
  /* Added to frameIntervalP + lookahead depth when sizing the buffer pool for
   * lookahead encoding (see init_encoder). */
  #define EXTRA_BUFFERS 5

  /*
   * Logging helpers. Every macro below expects a `struct nvenc_data *enc` to be
   * in scope at the call site; the message is prefixed with the encoder's name.
   */
  #define do_log(level, format, ...)                    \
      blog(level, "[jim-nvenc: '%s'] " format,          \
           obs_encoder_get_name(enc->encoder), ##__VA_ARGS__)

  #define error(format, ...) do_log(LOG_ERROR, format, ##__VA_ARGS__)
  #define warn(format, ...) do_log(LOG_WARNING, format, ##__VA_ARGS__)
  #define info(format, ...) do_log(LOG_INFO, format, ##__VA_ARGS__)
  #define debug(format, ...) do_log(LOG_DEBUG, format, ##__VA_ARGS__)

  /*
   * Logs a failed HRESULT together with the calling function's name. Expects a
   * local variable named `hr` at the call site.
   *
   * The value is cast to unsigned long so the argument type matches the %lX
   * conversion, and the macro carries no trailing semicolon so that
   * `error_hr("...");` expands to exactly one statement.
   */
  #define error_hr(msg) \
      error("%s: %s: 0x%08lX", __FUNCTION__, msg, (unsigned long)hr)
  21. struct nv_bitstream;
  22. struct nv_texture;
  23. struct handle_tex {
  24. uint32_t handle;
  25. ID3D11Texture2D *tex;
  26. IDXGIKeyedMutex *km;
  27. };
  28. /* ------------------------------------------------------------------------- */
  29. /* Main Implementation Structure */
  30. struct nvenc_data {
  31. obs_encoder_t *encoder;
  32. void *session;
  33. NV_ENC_INITIALIZE_PARAMS params;
  34. NV_ENC_CONFIG config;
  35. int rc_lookahead;
  36. int buf_count;
  37. int output_delay;
  38. int buffers_queued;
  39. size_t next_bitstream;
  40. size_t cur_bitstream;
  41. bool encode_started;
  42. bool first_packet;
  43. bool can_change_bitrate;
  44. int32_t bframes;
  45. DARRAY(struct nv_bitstream) bitstreams;
  46. DARRAY(struct nv_texture) textures;
  47. DARRAY(struct handle_tex) input_textures;
  48. struct circlebuf dts_list;
  49. DARRAY(uint8_t) packet_data;
  50. int64_t packet_pts;
  51. bool packet_keyframe;
  52. ID3D11Device *device;
  53. ID3D11DeviceContext *context;
  54. uint32_t cx;
  55. uint32_t cy;
  56. uint8_t *header;
  57. size_t header_size;
  58. uint8_t *sei;
  59. size_t sei_size;
  60. };
  61. /* ------------------------------------------------------------------------- */
  62. /* Bitstream Buffer */
  63. struct nv_bitstream {
  64. void *ptr;
  65. HANDLE event;
  66. };
  67. #define NV_FAILED(x) nv_failed(enc->encoder, x, __FUNCTION__, #x)
  68. static bool nv_bitstream_init(struct nvenc_data *enc, struct nv_bitstream *bs)
  69. {
  70. NV_ENC_CREATE_BITSTREAM_BUFFER buf = {
  71. NV_ENC_CREATE_BITSTREAM_BUFFER_VER};
  72. NV_ENC_EVENT_PARAMS params = {NV_ENC_EVENT_PARAMS_VER};
  73. HANDLE event = NULL;
  74. if (NV_FAILED(nv.nvEncCreateBitstreamBuffer(enc->session, &buf))) {
  75. return false;
  76. }
  77. event = CreateEvent(NULL, true, true, NULL);
  78. if (!event) {
  79. error("%s: %s", __FUNCTION__, "Failed to create event");
  80. goto fail;
  81. }
  82. params.completionEvent = event;
  83. if (NV_FAILED(nv.nvEncRegisterAsyncEvent(enc->session, &params))) {
  84. goto fail;
  85. }
  86. bs->ptr = buf.bitstreamBuffer;
  87. bs->event = event;
  88. return true;
  89. fail:
  90. if (event) {
  91. CloseHandle(event);
  92. }
  93. if (buf.bitstreamBuffer) {
  94. nv.nvEncDestroyBitstreamBuffer(enc->session,
  95. buf.bitstreamBuffer);
  96. }
  97. return false;
  98. }
  99. static void nv_bitstream_free(struct nvenc_data *enc, struct nv_bitstream *bs)
  100. {
  101. if (bs->ptr) {
  102. nv.nvEncDestroyBitstreamBuffer(enc->session, bs->ptr);
  103. NV_ENC_EVENT_PARAMS params = {NV_ENC_EVENT_PARAMS_VER};
  104. params.completionEvent = bs->event;
  105. nv.nvEncUnregisterAsyncEvent(enc->session, &params);
  106. CloseHandle(bs->event);
  107. }
  108. }
  109. /* ------------------------------------------------------------------------- */
  110. /* Texture Resource */
  111. struct nv_texture {
  112. void *res;
  113. ID3D11Texture2D *tex;
  114. void *mapped_res;
  115. };
  116. static bool nv_texture_init(struct nvenc_data *enc, struct nv_texture *nvtex)
  117. {
  118. ID3D11Device *device = enc->device;
  119. ID3D11Texture2D *tex;
  120. HRESULT hr;
  121. D3D11_TEXTURE2D_DESC desc = {0};
  122. desc.Width = enc->cx;
  123. desc.Height = enc->cy;
  124. desc.MipLevels = 1;
  125. desc.ArraySize = 1;
  126. desc.Format = DXGI_FORMAT_NV12;
  127. desc.SampleDesc.Count = 1;
  128. desc.BindFlags = D3D11_BIND_RENDER_TARGET;
  129. hr = device->lpVtbl->CreateTexture2D(device, &desc, NULL, &tex);
  130. if (FAILED(hr)) {
  131. error_hr("Failed to create texture");
  132. return false;
  133. }
  134. tex->lpVtbl->SetEvictionPriority(tex, DXGI_RESOURCE_PRIORITY_MAXIMUM);
  135. NV_ENC_REGISTER_RESOURCE res = {NV_ENC_REGISTER_RESOURCE_VER};
  136. res.resourceType = NV_ENC_INPUT_RESOURCE_TYPE_DIRECTX;
  137. res.resourceToRegister = tex;
  138. res.width = enc->cx;
  139. res.height = enc->cy;
  140. res.bufferFormat = NV_ENC_BUFFER_FORMAT_NV12;
  141. if (NV_FAILED(nv.nvEncRegisterResource(enc->session, &res))) {
  142. tex->lpVtbl->Release(tex);
  143. return false;
  144. }
  145. nvtex->res = res.registeredResource;
  146. nvtex->tex = tex;
  147. return true;
  148. }
  149. static void nv_texture_free(struct nvenc_data *enc, struct nv_texture *nvtex)
  150. {
  151. if (nvtex->res) {
  152. if (nvtex->mapped_res) {
  153. nv.nvEncUnmapInputResource(enc->session,
  154. nvtex->mapped_res);
  155. }
  156. nv.nvEncUnregisterResource(enc->session, nvtex->res);
  157. nvtex->tex->lpVtbl->Release(nvtex->tex);
  158. }
  159. }
  160. /* ------------------------------------------------------------------------- */
  161. /* Implementation */
  /* Returns the fixed display name of this encoder; `type_data` is ignored. */
  static const char *nvenc_get_name(void *type_data)
  {
      const char *display_name = "NVIDIA NVENC H.264 (new)";

      UNUSED_PARAMETER(type_data);
      return display_name;
  }
  167. static inline int nv_get_cap(struct nvenc_data *enc, NV_ENC_CAPS cap)
  168. {
  169. if (!enc->session)
  170. return 0;
  171. NV_ENC_CAPS_PARAM param = {NV_ENC_CAPS_PARAM_VER};
  172. int v;
  173. param.capsToQuery = cap;
  174. nv.nvEncGetEncodeCaps(enc->session, NV_ENC_CODEC_H264_GUID, &param, &v);
  175. return v;
  176. }
  177. static bool nvenc_update(void *data, obs_data_t *settings)
  178. {
  179. struct nvenc_data *enc = data;
  180. /* Only support reconfiguration of CBR bitrate */
  181. if (enc->can_change_bitrate) {
  182. int bitrate = (int)obs_data_get_int(settings, "bitrate");
  183. enc->config.rcParams.averageBitRate = bitrate * 1000;
  184. enc->config.rcParams.maxBitRate = bitrate * 1000;
  185. NV_ENC_RECONFIGURE_PARAMS params = {0};
  186. params.version = NV_ENC_RECONFIGURE_PARAMS_VER;
  187. params.reInitEncodeParams = enc->params;
  188. params.resetEncoder = 1;
  189. params.forceIDR = 1;
  190. if (NV_FAILED(nv.nvEncReconfigureEncoder(enc->session,
  191. &params))) {
  192. return false;
  193. }
  194. }
  195. return true;
  196. }
  197. static HANDLE get_lib(struct nvenc_data *enc, const char *lib)
  198. {
  199. HMODULE mod = GetModuleHandleA(lib);
  200. if (mod)
  201. return mod;
  202. mod = LoadLibraryA(lib);
  203. if (!mod)
  204. error("Failed to load %s", lib);
  205. return mod;
  206. }
  207. typedef HRESULT(WINAPI *CREATEDXGIFACTORY1PROC)(REFIID, void **);
  208. static bool init_d3d11(struct nvenc_data *enc, obs_data_t *settings)
  209. {
  210. HMODULE dxgi = get_lib(enc, "DXGI.dll");
  211. HMODULE d3d11 = get_lib(enc, "D3D11.dll");
  212. CREATEDXGIFACTORY1PROC create_dxgi;
  213. PFN_D3D11_CREATE_DEVICE create_device;
  214. IDXGIFactory1 *factory;
  215. IDXGIAdapter *adapter;
  216. ID3D11Device *device;
  217. ID3D11DeviceContext *context;
  218. HRESULT hr;
  219. if (!dxgi || !d3d11) {
  220. return false;
  221. }
  222. create_dxgi = (CREATEDXGIFACTORY1PROC)GetProcAddress(
  223. dxgi, "CreateDXGIFactory1");
  224. create_device = (PFN_D3D11_CREATE_DEVICE)GetProcAddress(
  225. d3d11, "D3D11CreateDevice");
  226. if (!create_dxgi || !create_device) {
  227. error("Failed to load D3D11/DXGI procedures");
  228. return false;
  229. }
  230. hr = create_dxgi(&IID_IDXGIFactory1, &factory);
  231. if (FAILED(hr)) {
  232. error_hr("CreateDXGIFactory1 failed");
  233. return false;
  234. }
  235. hr = factory->lpVtbl->EnumAdapters(factory, 0, &adapter);
  236. factory->lpVtbl->Release(factory);
  237. if (FAILED(hr)) {
  238. error_hr("EnumAdapters failed");
  239. return false;
  240. }
  241. hr = create_device(adapter, D3D_DRIVER_TYPE_UNKNOWN, NULL, 0, NULL, 0,
  242. D3D11_SDK_VERSION, &device, NULL, &context);
  243. adapter->lpVtbl->Release(adapter);
  244. if (FAILED(hr)) {
  245. error_hr("D3D11CreateDevice failed");
  246. return false;
  247. }
  248. enc->device = device;
  249. enc->context = context;
  250. return true;
  251. }
  252. static bool init_session(struct nvenc_data *enc)
  253. {
  254. NV_ENC_OPEN_ENCODE_SESSION_EX_PARAMS params = {
  255. NV_ENC_OPEN_ENCODE_SESSION_EX_PARAMS_VER};
  256. params.device = enc->device;
  257. params.deviceType = NV_ENC_DEVICE_TYPE_DIRECTX;
  258. params.apiVersion = NVENCAPI_VERSION;
  259. if (NV_FAILED(nv.nvEncOpenEncodeSessionEx(&params, &enc->session))) {
  260. return false;
  261. }
  262. return true;
  263. }
  264. static bool init_encoder(struct nvenc_data *enc, obs_data_t *settings,
  265. bool psycho_aq)
  266. {
  267. const char *rc = obs_data_get_string(settings, "rate_control");
  268. int bitrate = (int)obs_data_get_int(settings, "bitrate");
  269. int max_bitrate = (int)obs_data_get_int(settings, "max_bitrate");
  270. int cqp = (int)obs_data_get_int(settings, "cqp");
  271. int keyint_sec = (int)obs_data_get_int(settings, "keyint_sec");
  272. const char *preset = obs_data_get_string(settings, "preset");
  273. const char *profile = obs_data_get_string(settings, "profile");
  274. bool lookahead = obs_data_get_bool(settings, "lookahead");
  275. int bf = (int)obs_data_get_int(settings, "bf");
  276. bool vbr = astrcmpi(rc, "VBR") == 0;
  277. NVENCSTATUS err;
  278. video_t *video = obs_encoder_video(enc->encoder);
  279. const struct video_output_info *voi = video_output_get_info(video);
  280. enc->cx = voi->width;
  281. enc->cy = voi->height;
  282. /* -------------------------- */
  283. /* get preset */
  284. GUID nv_preset = NV_ENC_PRESET_DEFAULT_GUID;
  285. bool twopass = false;
  286. bool hp = false;
  287. bool ll = false;
  288. if (astrcmpi(preset, "hq") == 0) {
  289. nv_preset = NV_ENC_PRESET_HQ_GUID;
  290. } else if (astrcmpi(preset, "mq") == 0) {
  291. nv_preset = NV_ENC_PRESET_HQ_GUID;
  292. twopass = true;
  293. } else if (astrcmpi(preset, "hp") == 0) {
  294. nv_preset = NV_ENC_PRESET_HP_GUID;
  295. hp = true;
  296. } else if (astrcmpi(preset, "ll") == 0) {
  297. nv_preset = NV_ENC_PRESET_LOW_LATENCY_DEFAULT_GUID;
  298. ll = true;
  299. } else if (astrcmpi(preset, "llhq") == 0) {
  300. nv_preset = NV_ENC_PRESET_LOW_LATENCY_HQ_GUID;
  301. ll = true;
  302. } else if (astrcmpi(preset, "llhp") == 0) {
  303. nv_preset = NV_ENC_PRESET_LOW_LATENCY_HP_GUID;
  304. hp = true;
  305. ll = true;
  306. }
  307. const bool rc_lossless = astrcmpi(rc, "lossless") == 0;
  308. bool lossless = rc_lossless;
  309. if (rc_lossless) {
  310. lossless = nv_get_cap(enc, NV_ENC_CAPS_SUPPORT_LOSSLESS_ENCODE);
  311. if (lossless) {
  312. nv_preset = hp ? NV_ENC_PRESET_LOSSLESS_HP_GUID
  313. : NV_ENC_PRESET_LOSSLESS_DEFAULT_GUID;
  314. } else {
  315. warn("lossless encode is not supported, ignoring");
  316. }
  317. }
  318. /* -------------------------- */
  319. /* get preset default config */
  320. NV_ENC_PRESET_CONFIG preset_config = {NV_ENC_PRESET_CONFIG_VER,
  321. {NV_ENC_CONFIG_VER}};
  322. err = nv.nvEncGetEncodePresetConfig(enc->session,
  323. NV_ENC_CODEC_H264_GUID, nv_preset,
  324. &preset_config);
  325. if (nv_failed(enc->encoder, err, __FUNCTION__,
  326. "nvEncGetEncodePresetConfig")) {
  327. return false;
  328. }
  329. /* -------------------------- */
  330. /* main configuration */
  331. enc->config = preset_config.presetCfg;
  332. uint32_t gop_size =
  333. (keyint_sec) ? keyint_sec * voi->fps_num / voi->fps_den : 250;
  334. NV_ENC_INITIALIZE_PARAMS *params = &enc->params;
  335. NV_ENC_CONFIG *config = &enc->config;
  336. NV_ENC_CONFIG_H264 *h264_config = &config->encodeCodecConfig.h264Config;
  337. NV_ENC_CONFIG_H264_VUI_PARAMETERS *vui_params =
  338. &h264_config->h264VUIParameters;
  339. int darWidth, darHeight;
  340. av_reduce(&darWidth, &darHeight, voi->width, voi->height, 1024 * 1024);
  341. memset(params, 0, sizeof(*params));
  342. params->version = NV_ENC_INITIALIZE_PARAMS_VER;
  343. params->encodeGUID = NV_ENC_CODEC_H264_GUID;
  344. params->presetGUID = nv_preset;
  345. params->encodeWidth = voi->width;
  346. params->encodeHeight = voi->height;
  347. params->darWidth = darWidth;
  348. params->darHeight = darHeight;
  349. params->frameRateNum = voi->fps_num;
  350. params->frameRateDen = voi->fps_den;
  351. params->enableEncodeAsync = 1;
  352. params->enablePTD = 1;
  353. params->encodeConfig = &enc->config;
  354. config->gopLength = gop_size;
  355. config->frameIntervalP = 1 + bf;
  356. h264_config->idrPeriod = gop_size;
  357. bool repeat_headers = obs_data_get_bool(settings, "repeat_headers");
  358. if (repeat_headers) {
  359. h264_config->repeatSPSPPS = 1;
  360. h264_config->disableSPSPPS = 0;
  361. h264_config->outputAUD = 1;
  362. }
  363. h264_config->sliceMode = 3;
  364. h264_config->sliceModeData = 1;
  365. h264_config->useBFramesAsRef = NV_ENC_BFRAME_REF_MODE_DISABLED;
  366. vui_params->videoSignalTypePresentFlag = 1;
  367. vui_params->videoFullRangeFlag = (voi->range == VIDEO_RANGE_FULL);
  368. vui_params->colourDescriptionPresentFlag = 1;
  369. switch (voi->colorspace) {
  370. case VIDEO_CS_601:
  371. vui_params->colourPrimaries = 6;
  372. vui_params->transferCharacteristics = 6;
  373. vui_params->colourMatrix = 6;
  374. break;
  375. case VIDEO_CS_DEFAULT:
  376. case VIDEO_CS_709:
  377. vui_params->colourPrimaries = 1;
  378. vui_params->transferCharacteristics = 1;
  379. vui_params->colourMatrix = 1;
  380. break;
  381. case VIDEO_CS_SRGB:
  382. vui_params->colourPrimaries = 1;
  383. vui_params->transferCharacteristics = 13;
  384. vui_params->colourMatrix = 1;
  385. break;
  386. }
  387. enc->bframes = bf;
  388. /* lookahead */
  389. const bool use_profile_lookahead = config->rcParams.enableLookahead;
  390. lookahead = nv_get_cap(enc, NV_ENC_CAPS_SUPPORT_LOOKAHEAD) &&
  391. (lookahead || use_profile_lookahead);
  392. if (lookahead) {
  393. enc->rc_lookahead = use_profile_lookahead
  394. ? config->rcParams.lookaheadDepth
  395. : 8;
  396. }
  397. int buf_count = max(4, config->frameIntervalP * 2 * 2);
  398. if (lookahead) {
  399. buf_count = max(buf_count, config->frameIntervalP +
  400. enc->rc_lookahead +
  401. EXTRA_BUFFERS);
  402. }
  403. buf_count = min(64, buf_count);
  404. enc->buf_count = buf_count;
  405. const int output_delay = buf_count - 1;
  406. enc->output_delay = output_delay;
  407. if (lookahead) {
  408. const int lkd_bound = output_delay - config->frameIntervalP - 4;
  409. if (lkd_bound >= 0) {
  410. config->rcParams.enableLookahead = 1;
  411. config->rcParams.lookaheadDepth =
  412. max(enc->rc_lookahead, lkd_bound);
  413. config->rcParams.disableIadapt = 0;
  414. config->rcParams.disableBadapt = 0;
  415. } else {
  416. lookahead = false;
  417. }
  418. }
  419. /* psycho aq */
  420. if (nv_get_cap(enc, NV_ENC_CAPS_SUPPORT_TEMPORAL_AQ)) {
  421. config->rcParams.enableAQ = psycho_aq;
  422. config->rcParams.aqStrength = 8;
  423. config->rcParams.enableTemporalAQ = psycho_aq;
  424. } else if (psycho_aq) {
  425. warn("Ignoring Psycho Visual Tuning request since GPU is not capable");
  426. }
  427. /* -------------------------- */
  428. /* rate control */
  429. enc->can_change_bitrate =
  430. nv_get_cap(enc, NV_ENC_CAPS_SUPPORT_DYN_BITRATE_CHANGE) &&
  431. !lookahead;
  432. config->rcParams.rateControlMode = twopass ? NV_ENC_PARAMS_RC_VBR_HQ
  433. : NV_ENC_PARAMS_RC_VBR;
  434. if (astrcmpi(rc, "cqp") == 0 || rc_lossless) {
  435. if (lossless) {
  436. h264_config->qpPrimeYZeroTransformBypassFlag = 1;
  437. cqp = 0;
  438. }
  439. config->rcParams.rateControlMode = NV_ENC_PARAMS_RC_CONSTQP;
  440. config->rcParams.constQP.qpInterP = cqp;
  441. config->rcParams.constQP.qpInterB = cqp;
  442. config->rcParams.constQP.qpIntra = cqp;
  443. enc->can_change_bitrate = false;
  444. bitrate = 0;
  445. max_bitrate = 0;
  446. } else if (astrcmpi(rc, "vbr") != 0) { /* CBR by default */
  447. h264_config->outputBufferingPeriodSEI = 1;
  448. config->rcParams.rateControlMode =
  449. twopass ? NV_ENC_PARAMS_RC_2_PASS_QUALITY
  450. : NV_ENC_PARAMS_RC_CBR;
  451. }
  452. h264_config->outputPictureTimingSEI = 1;
  453. config->rcParams.averageBitRate = bitrate * 1000;
  454. config->rcParams.maxBitRate = vbr ? max_bitrate * 1000 : bitrate * 1000;
  455. config->rcParams.vbvBufferSize = bitrate * 1000;
  456. /* -------------------------- */
  457. /* profile */
  458. if (astrcmpi(profile, "main") == 0) {
  459. config->profileGUID = NV_ENC_H264_PROFILE_MAIN_GUID;
  460. } else if (astrcmpi(profile, "baseline") == 0) {
  461. config->profileGUID = NV_ENC_H264_PROFILE_BASELINE_GUID;
  462. } else if (!lossless) {
  463. config->profileGUID = NV_ENC_H264_PROFILE_HIGH_GUID;
  464. }
  465. /* -------------------------- */
  466. /* initialize */
  467. if (NV_FAILED(nv.nvEncInitializeEncoder(enc->session, params))) {
  468. return false;
  469. }
  470. info("settings:\n"
  471. "\trate_control: %s\n"
  472. "\tbitrate: %d\n"
  473. "\tcqp: %d\n"
  474. "\tkeyint: %d\n"
  475. "\tpreset: %s\n"
  476. "\tprofile: %s\n"
  477. "\twidth: %d\n"
  478. "\theight: %d\n"
  479. "\t2-pass: %s\n"
  480. "\tb-frames: %d\n"
  481. "\tlookahead: %s\n"
  482. "\tpsycho_aq: %s\n",
  483. rc, bitrate, cqp, gop_size, preset, profile, enc->cx, enc->cy,
  484. twopass ? "true" : "false", bf, lookahead ? "true" : "false",
  485. psycho_aq ? "true" : "false");
  486. return true;
  487. }
  488. static bool init_bitstreams(struct nvenc_data *enc)
  489. {
  490. da_reserve(enc->bitstreams, enc->buf_count);
  491. for (int i = 0; i < enc->buf_count; i++) {
  492. struct nv_bitstream bitstream;
  493. if (!nv_bitstream_init(enc, &bitstream)) {
  494. return false;
  495. }
  496. da_push_back(enc->bitstreams, &bitstream);
  497. }
  498. return true;
  499. }
  500. static bool init_textures(struct nvenc_data *enc)
  501. {
  502. da_reserve(enc->bitstreams, enc->buf_count);
  503. for (int i = 0; i < enc->buf_count; i++) {
  504. struct nv_texture texture;
  505. if (!nv_texture_init(enc, &texture)) {
  506. return false;
  507. }
  508. da_push_back(enc->textures, &texture);
  509. }
  510. return true;
  511. }
  512. static void nvenc_destroy(void *data);
  513. static void *nvenc_create_internal(obs_data_t *settings, obs_encoder_t *encoder,
  514. bool psycho_aq)
  515. {
  516. NV_ENCODE_API_FUNCTION_LIST init = {NV_ENCODE_API_FUNCTION_LIST_VER};
  517. struct nvenc_data *enc = bzalloc(sizeof(*enc));
  518. enc->encoder = encoder;
  519. enc->first_packet = true;
  520. if (!init_nvenc(encoder)) {
  521. goto fail;
  522. }
  523. if (NV_FAILED(nv_create_instance(&init))) {
  524. goto fail;
  525. }
  526. if (!init_d3d11(enc, settings)) {
  527. goto fail;
  528. }
  529. if (!init_session(enc)) {
  530. goto fail;
  531. }
  532. if (!init_encoder(enc, settings, psycho_aq)) {
  533. goto fail;
  534. }
  535. if (!init_bitstreams(enc)) {
  536. goto fail;
  537. }
  538. if (!init_textures(enc)) {
  539. goto fail;
  540. }
  541. return enc;
  542. fail:
  543. nvenc_destroy(enc);
  544. return NULL;
  545. }
  546. static void *nvenc_create(obs_data_t *settings, obs_encoder_t *encoder)
  547. {
  548. /* this encoder requires shared textures, this cannot be used on a
  549. * gpu other than the one OBS is currently running on. */
  550. const int gpu = (int)obs_data_get_int(settings, "gpu");
  551. if (gpu != 0) {
  552. blog(LOG_INFO,
  553. "[jim-nvenc] different GPU selected by user, falling back to ffmpeg");
  554. goto reroute;
  555. }
  556. if (obs_encoder_scaling_enabled(encoder)) {
  557. blog(LOG_INFO,
  558. "[jim-nvenc] scaling enabled, falling back to ffmpeg");
  559. goto reroute;
  560. }
  561. if (!obs_nv12_tex_active()) {
  562. blog(LOG_INFO,
  563. "[jim-nvenc] nv12 not active, falling back to ffmpeg");
  564. goto reroute;
  565. }
  566. const bool psycho_aq = obs_data_get_bool(settings, "psycho_aq");
  567. struct nvenc_data *enc =
  568. nvenc_create_internal(settings, encoder, psycho_aq);
  569. if ((enc == NULL) && psycho_aq) {
  570. blog(LOG_WARNING, "[jim-nvenc] nvenc_create_internal failed, "
  571. "trying again without Psycho Visual Tuning");
  572. enc = nvenc_create_internal(settings, encoder, false);
  573. }
  574. if (enc) {
  575. return enc;
  576. }
  577. reroute:
  578. return obs_encoder_create_rerouted(encoder, "ffmpeg_nvenc");
  579. }
  580. static bool get_encoded_packet(struct nvenc_data *enc, bool finalize);
  581. static void nvenc_destroy(void *data)
  582. {
  583. struct nvenc_data *enc = data;
  584. if (enc->encode_started) {
  585. size_t next_bitstream = enc->next_bitstream;
  586. HANDLE next_event = enc->bitstreams.array[next_bitstream].event;
  587. NV_ENC_PIC_PARAMS params = {NV_ENC_PIC_PARAMS_VER};
  588. params.encodePicFlags = NV_ENC_PIC_FLAG_EOS;
  589. params.completionEvent = next_event;
  590. nv.nvEncEncodePicture(enc->session, &params);
  591. get_encoded_packet(enc, true);
  592. }
  593. for (size_t i = 0; i < enc->textures.num; i++) {
  594. nv_texture_free(enc, &enc->textures.array[i]);
  595. }
  596. for (size_t i = 0; i < enc->bitstreams.num; i++) {
  597. nv_bitstream_free(enc, &enc->bitstreams.array[i]);
  598. }
  599. if (enc->session) {
  600. nv.nvEncDestroyEncoder(enc->session);
  601. }
  602. for (size_t i = 0; i < enc->input_textures.num; i++) {
  603. ID3D11Texture2D *tex = enc->input_textures.array[i].tex;
  604. IDXGIKeyedMutex *km = enc->input_textures.array[i].km;
  605. tex->lpVtbl->Release(tex);
  606. km->lpVtbl->Release(km);
  607. }
  608. if (enc->context) {
  609. enc->context->lpVtbl->Release(enc->context);
  610. }
  611. if (enc->device) {
  612. enc->device->lpVtbl->Release(enc->device);
  613. }
  614. bfree(enc->header);
  615. bfree(enc->sei);
  616. circlebuf_free(&enc->dts_list);
  617. da_free(enc->textures);
  618. da_free(enc->bitstreams);
  619. da_free(enc->input_textures);
  620. da_free(enc->packet_data);
  621. bfree(enc);
  622. }
  623. static ID3D11Texture2D *get_tex_from_handle(struct nvenc_data *enc,
  624. uint32_t handle,
  625. IDXGIKeyedMutex **km_out)
  626. {
  627. ID3D11Device *device = enc->device;
  628. IDXGIKeyedMutex *km;
  629. ID3D11Texture2D *input_tex;
  630. HRESULT hr;
  631. for (size_t i = 0; i < enc->input_textures.num; i++) {
  632. struct handle_tex *ht = &enc->input_textures.array[i];
  633. if (ht->handle == handle) {
  634. *km_out = ht->km;
  635. return ht->tex;
  636. }
  637. }
  638. hr = device->lpVtbl->OpenSharedResource(device,
  639. (HANDLE)(uintptr_t)handle,
  640. &IID_ID3D11Texture2D,
  641. &input_tex);
  642. if (FAILED(hr)) {
  643. error_hr("OpenSharedResource failed");
  644. return NULL;
  645. }
  646. hr = input_tex->lpVtbl->QueryInterface(input_tex, &IID_IDXGIKeyedMutex,
  647. &km);
  648. if (FAILED(hr)) {
  649. error_hr("QueryInterface(IDXGIKeyedMutex) failed");
  650. input_tex->lpVtbl->Release(input_tex);
  651. return NULL;
  652. }
  653. input_tex->lpVtbl->SetEvictionPriority(input_tex,
  654. DXGI_RESOURCE_PRIORITY_MAXIMUM);
  655. *km_out = km;
  656. struct handle_tex new_ht = {handle, input_tex, km};
  657. da_push_back(enc->input_textures, &new_ht);
  658. return input_tex;
  659. }
  660. static bool get_encoded_packet(struct nvenc_data *enc, bool finalize)
  661. {
  662. void *s = enc->session;
  663. da_resize(enc->packet_data, 0);
  664. if (!enc->buffers_queued)
  665. return true;
  666. if (!finalize && enc->buffers_queued < enc->output_delay)
  667. return true;
  668. size_t count = finalize ? enc->buffers_queued : 1;
  669. for (size_t i = 0; i < count; i++) {
  670. size_t cur_bs_idx = enc->cur_bitstream;
  671. struct nv_bitstream *bs = &enc->bitstreams.array[cur_bs_idx];
  672. struct nv_texture *nvtex = &enc->textures.array[cur_bs_idx];
  673. /* ---------------- */
  674. NV_ENC_LOCK_BITSTREAM lock = {NV_ENC_LOCK_BITSTREAM_VER};
  675. lock.outputBitstream = bs->ptr;
  676. lock.doNotWait = false;
  677. if (NV_FAILED(nv.nvEncLockBitstream(s, &lock))) {
  678. return false;
  679. }
  680. if (enc->first_packet) {
  681. uint8_t *new_packet;
  682. size_t size;
  683. enc->first_packet = false;
  684. obs_extract_avc_headers(lock.bitstreamBufferPtr,
  685. lock.bitstreamSizeInBytes,
  686. &new_packet, &size,
  687. &enc->header, &enc->header_size,
  688. &enc->sei, &enc->sei_size);
  689. da_copy_array(enc->packet_data, new_packet, size);
  690. bfree(new_packet);
  691. } else {
  692. da_copy_array(enc->packet_data, lock.bitstreamBufferPtr,
  693. lock.bitstreamSizeInBytes);
  694. }
  695. enc->packet_pts = (int64_t)lock.outputTimeStamp;
  696. enc->packet_keyframe = lock.pictureType == NV_ENC_PIC_TYPE_IDR;
  697. if (NV_FAILED(nv.nvEncUnlockBitstream(s, bs->ptr))) {
  698. return false;
  699. }
  700. /* ---------------- */
  701. if (nvtex->mapped_res) {
  702. NVENCSTATUS err;
  703. err = nv.nvEncUnmapInputResource(s, nvtex->mapped_res);
  704. if (nv_failed(enc->encoder, err, __FUNCTION__,
  705. "unmap")) {
  706. return false;
  707. }
  708. nvtex->mapped_res = NULL;
  709. }
  710. /* ---------------- */
  711. if (++enc->cur_bitstream == enc->buf_count)
  712. enc->cur_bitstream = 0;
  713. enc->buffers_queued--;
  714. }
  715. return true;
  716. }
  717. static bool nvenc_encode_tex(void *data, uint32_t handle, int64_t pts,
  718. uint64_t lock_key, uint64_t *next_key,
  719. struct encoder_packet *packet,
  720. bool *received_packet)
  721. {
  722. struct nvenc_data *enc = data;
  723. ID3D11Device *device = enc->device;
  724. ID3D11DeviceContext *context = enc->context;
  725. ID3D11Texture2D *input_tex;
  726. ID3D11Texture2D *output_tex;
  727. IDXGIKeyedMutex *km;
  728. struct nv_texture *nvtex;
  729. struct nv_bitstream *bs;
  730. NVENCSTATUS err;
  731. if (handle == GS_INVALID_HANDLE) {
  732. error("Encode failed: bad texture handle");
  733. *next_key = lock_key;
  734. return false;
  735. }
  736. bs = &enc->bitstreams.array[enc->next_bitstream];
  737. nvtex = &enc->textures.array[enc->next_bitstream];
  738. input_tex = get_tex_from_handle(enc, handle, &km);
  739. output_tex = nvtex->tex;
  740. if (!input_tex) {
  741. *next_key = lock_key;
  742. return false;
  743. }
  744. circlebuf_push_back(&enc->dts_list, &pts, sizeof(pts));
  745. /* ------------------------------------ */
  746. /* wait for output bitstream/tex */
  747. WaitForSingleObject(bs->event, INFINITE);
  748. /* ------------------------------------ */
  749. /* copy to output tex */
  750. km->lpVtbl->AcquireSync(km, lock_key, INFINITE);
  751. context->lpVtbl->CopyResource(context, (ID3D11Resource *)output_tex,
  752. (ID3D11Resource *)input_tex);
  753. km->lpVtbl->ReleaseSync(km, *next_key);
  754. /* ------------------------------------ */
  755. /* map output tex so nvenc can use it */
  756. NV_ENC_MAP_INPUT_RESOURCE map = {NV_ENC_MAP_INPUT_RESOURCE_VER};
  757. map.registeredResource = nvtex->res;
  758. if (NV_FAILED(nv.nvEncMapInputResource(enc->session, &map))) {
  759. return false;
  760. }
  761. nvtex->mapped_res = map.mappedResource;
  762. /* ------------------------------------ */
  763. /* do actual encode call */
  764. NV_ENC_PIC_PARAMS params = {0};
  765. params.version = NV_ENC_PIC_PARAMS_VER;
  766. params.pictureStruct = NV_ENC_PIC_STRUCT_FRAME;
  767. params.inputBuffer = nvtex->mapped_res;
  768. params.bufferFmt = NV_ENC_BUFFER_FORMAT_NV12;
  769. params.inputTimeStamp = (uint64_t)pts;
  770. params.inputWidth = enc->cx;
  771. params.inputHeight = enc->cy;
  772. params.outputBitstream = bs->ptr;
  773. params.completionEvent = bs->event;
  774. err = nv.nvEncEncodePicture(enc->session, &params);
  775. if (err != NV_ENC_SUCCESS && err != NV_ENC_ERR_NEED_MORE_INPUT) {
  776. nv_failed(enc->encoder, err, __FUNCTION__,
  777. "nvEncEncodePicture");
  778. return false;
  779. }
  780. enc->encode_started = true;
  781. enc->buffers_queued++;
  782. if (++enc->next_bitstream == enc->buf_count) {
  783. enc->next_bitstream = 0;
  784. }
  785. /* ------------------------------------ */
  786. /* check for encoded packet and parse */
  787. if (!get_encoded_packet(enc, false)) {
  788. return false;
  789. }
  790. /* ------------------------------------ */
  791. /* output encoded packet */
  792. if (enc->packet_data.num) {
  793. int64_t dts;
  794. circlebuf_pop_front(&enc->dts_list, &dts, sizeof(dts));
  795. /* subtract bframe delay from dts */
  796. dts -= (int64_t)enc->bframes * packet->timebase_num;
  797. *received_packet = true;
  798. packet->data = enc->packet_data.array;
  799. packet->size = enc->packet_data.num;
  800. packet->type = OBS_ENCODER_VIDEO;
  801. packet->pts = enc->packet_pts;
  802. packet->dts = dts;
  803. packet->keyframe = enc->packet_keyframe;
  804. } else {
  805. *received_packet = false;
  806. }
  807. return true;
  808. }
  809. extern void nvenc_defaults(obs_data_t *settings);
  810. extern obs_properties_t *nvenc_properties(void *unused);
  811. static bool nvenc_extra_data(void *data, uint8_t **header, size_t *size)
  812. {
  813. struct nvenc_data *enc = data;
  814. if (!enc->header) {
  815. return false;
  816. }
  817. *header = enc->header;
  818. *size = enc->header_size;
  819. return true;
  820. }
  821. static bool nvenc_sei_data(void *data, uint8_t **sei, size_t *size)
  822. {
  823. struct nvenc_data *enc = data;
  824. if (!enc->sei) {
  825. return false;
  826. }
  827. *sei = enc->sei;
  828. *size = enc->sei_size;
  829. return true;
  830. }
  831. struct obs_encoder_info nvenc_info = {
  832. .id = "jim_nvenc",
  833. .codec = "h264",
  834. .type = OBS_ENCODER_VIDEO,
  835. .caps = OBS_ENCODER_CAP_PASS_TEXTURE | OBS_ENCODER_CAP_DYN_BITRATE,
  836. .get_name = nvenc_get_name,
  837. .create = nvenc_create,
  838. .destroy = nvenc_destroy,
  839. .update = nvenc_update,
  840. .encode_texture = nvenc_encode_tex,
  841. .get_defaults = nvenc_defaults,
  842. .get_properties = nvenc_properties,
  843. .get_extra_data = nvenc_extra_data,
  844. .get_sei_data = nvenc_sei_data,
  845. };