| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
70370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761
27712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761
77717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762
277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388238923902391239223932394239523962397239823992400240124022403240424052406240724082409241024112412241324142415241624172418241924202421242224232424242524262427242824292430243124322433243424352436243724382439244024412442244324442445244624472448244924502451245224532454245524562457245824592460246124622463246424652466 |
- #include "obs-nvenc.h"
- #include <util/deque.h>
- #include <util/darray.h>
- #include <util/dstr.h>
- #include <obs-avc.h>
- #include <obs-hevc.h>
- #include <libavutil/rational.h>
- #ifdef _WIN32
- #define INITGUID
- #include <dxgi.h>
- #include <d3d11.h>
- #include <d3d11_1.h>
- #else
- #include <glad/glad.h>
- #endif
- /* ========================================================================= */
- /* a hack of the ages: nvenc backward compatibility */
- #define CONFIGURED_NVENC_MAJOR 12
- #define CONFIGURED_NVENC_MINOR 1
- /* we cannot guarantee structures haven't changed, so purposely break on
- * version change to force the programmer to update or remove backward
- * compatibility NVENC code. */
- #if CONFIGURED_NVENC_MAJOR != NVENCAPI_MAJOR_VERSION || \
- CONFIGURED_NVENC_MINOR < NVENCAPI_MINOR_VERSION
- #error NVENC version changed, update or remove NVENC compatibility code
- #endif
- #undef NVENCAPI_STRUCT_VERSION
- #define NVENCAPI_STRUCT_VERSION(ver) \
- ((uint32_t)(enc->needs_compat_ver ? NVENC_COMPAT_VER \
- : NVENCAPI_VERSION) | \
- ((ver) << 16) | (0x7 << 28))
- #define NV_ENC_CONFIG_COMPAT_VER (NVENCAPI_STRUCT_VERSION(7) | (1 << 31))
- #define NV_ENC_INITIALIZE_PARAMS_COMPAT_VER \
- (NVENCAPI_STRUCT_VERSION(5) | (1 << 31))
- #define NV_ENC_PIC_PARAMS_COMPAT_VER (NVENCAPI_STRUCT_VERSION(4) | (1 << 31))
- #define NV_ENC_LOCK_BITSTREAM_COMPAT_VER NVENCAPI_STRUCT_VERSION(1)
- #define NV_ENC_REGISTER_RESOURCE_COMPAT_VER NVENCAPI_STRUCT_VERSION(3)
- #define COMPATIBILITY_VERSION \
- (NVENC_COMPAT_MAJOR_VER << 4 | NVENC_COMPAT_MINOR_VER)
- /* ========================================================================= */
/* Extra buffers added on top of frameIntervalP + lookahead depth when sizing
 * the buffer pool (see init_encoder_base). */
#define EXTRA_BUFFERS 5

/* Logging helpers. Each message is prefixed with the encoder's name, so a
 * variable named `enc` must be in scope wherever these are used. */
#define do_log(level, format, ...)               \
	blog(level, "[obs-nvenc: '%s'] " format, \
	     obs_encoder_get_name(enc->encoder), ##__VA_ARGS__)

#define error(format, ...) do_log(LOG_ERROR, format, ##__VA_ARGS__)
#define warn(format, ...) do_log(LOG_WARNING, format, ##__VA_ARGS__)
#define info(format, ...) do_log(LOG_INFO, format, ##__VA_ARGS__)
#define debug(format, ...) do_log(LOG_DEBUG, format, ##__VA_ARGS__)

/* Logs `msg` together with the calling function and the local `hr` value.
 * The value is truncated to 32 bits and then widened to unsigned long so the
 * argument type matches the %lX conversion. The trailing semicolon is kept
 * on purpose so existing call sites expand exactly as before. */
#define error_hr(msg)                                 \
	error("%s: %s: 0x%08lX", __FUNCTION__, msg, \
	      (unsigned long)(uint32_t)hr);

#ifndef _WIN32
/* NOTE: both macros evaluate their arguments more than once. */
#define min(a, b) (((a) < (b)) ? (a) : (b))
#define max(a, b) (((a) > (b)) ? (a) : (b))
#endif
- struct nv_bitstream;
- struct nv_texture;
- struct handle_tex {
- #ifdef _WIN32
- uint32_t handle;
- ID3D11Texture2D *tex;
- IDXGIKeyedMutex *km;
- #else
- GLuint tex_id;
- CUgraphicsResource res_y;
- CUgraphicsResource res_uv;
- #endif
- };
- /* ------------------------------------------------------------------------- */
- /* Main Implementation Structure */
/* Codecs this encoder implementation can be configured for. */
enum codec_type {
	CODEC_H264,
	CODEC_HEVC,
	CODEC_AV1,
};

/* Returns a short printable name for `type`, or "Unknown" when the value is
 * not one of the enumerators above. */
static const char *get_codec_name(enum codec_type type)
{
	static const char *const codec_names[] = {
		[CODEC_H264] = "H264",
		[CODEC_HEVC] = "HEVC",
		[CODEC_AV1] = "AV1",
	};
	const size_t count = sizeof(codec_names) / sizeof(codec_names[0]);
	/* A negative value wraps to a huge index and falls through below. */
	const size_t idx = (size_t)type;

	if (idx < count)
		return codec_names[idx];

	return "Unknown";
}
- struct nvenc_data {
- obs_encoder_t *encoder;
- enum codec_type codec;
- GUID codec_guid;
- void *session;
- NV_ENC_INITIALIZE_PARAMS params;
- NV_ENC_CONFIG config;
- int rc_lookahead;
- uint32_t buf_count;
- int output_delay;
- int buffers_queued;
- size_t next_bitstream;
- size_t cur_bitstream;
- bool encode_started;
- bool first_packet;
- bool can_change_bitrate;
- bool needs_compat_ver;
- bool fallback;
- int32_t bframes;
- DARRAY(struct handle_tex) input_textures;
- DARRAY(struct nv_bitstream) bitstreams;
- DARRAY(struct nv_cuda_surface) surfaces;
- NV_ENC_BUFFER_FORMAT surface_format;
- struct deque dts_list;
- DARRAY(uint8_t) packet_data;
- int64_t packet_pts;
- bool packet_keyframe;
- #ifdef _WIN32
- DARRAY(struct nv_texture) textures;
- ID3D11Device *device;
- ID3D11DeviceContext *context;
- #endif
- uint32_t cx;
- uint32_t cy;
- enum video_format in_format;
- uint8_t *header;
- size_t header_size;
- uint8_t *sei;
- size_t sei_size;
- int8_t *roi_map;
- size_t roi_map_size;
- uint32_t roi_increment;
- CUcontext cu_ctx;
- };
- /* ------------------------------------------------------------------------- */
- /* Bitstream Buffer */
/* Wraps one NVENC bitstream (output) buffer handle. */
struct nv_bitstream {
	void *ptr;
};

/* Shorthands around nv_fail()/nv_failed(); both need `enc` in scope.
 * NV_FAILED also passes the calling function's name and the stringified
 * call expression, so the expression text ends up in what nv_failed sees. */
#define NV_FAIL(format, ...) nv_fail(enc->encoder, format, ##__VA_ARGS__)
#define NV_FAILED(x) nv_failed(enc->encoder, x, __FUNCTION__, #x)
- static bool nv_bitstream_init(struct nvenc_data *enc, struct nv_bitstream *bs)
- {
- NV_ENC_CREATE_BITSTREAM_BUFFER buf = {
- NV_ENC_CREATE_BITSTREAM_BUFFER_VER};
- if (NV_FAILED(nv.nvEncCreateBitstreamBuffer(enc->session, &buf))) {
- return false;
- }
- bs->ptr = buf.bitstreamBuffer;
- return true;
- }
- static void nv_bitstream_free(struct nvenc_data *enc, struct nv_bitstream *bs)
- {
- if (bs->ptr) {
- nv.nvEncDestroyBitstreamBuffer(enc->session, bs->ptr);
- }
- }
- /* ------------------------------------------------------------------------- */
- /* Texture Resource */
- #ifdef _WIN32
- struct nv_texture {
- void *res;
- ID3D11Texture2D *tex;
- void *mapped_res;
- };
- static bool nv_texture_init(struct nvenc_data *enc, struct nv_texture *nvtex)
- {
- const bool p010 = obs_p010_tex_active();
- D3D11_TEXTURE2D_DESC desc = {0};
- desc.Width = enc->cx;
- desc.Height = enc->cy;
- desc.MipLevels = 1;
- desc.ArraySize = 1;
- desc.Format = p010 ? DXGI_FORMAT_P010 : DXGI_FORMAT_NV12;
- desc.SampleDesc.Count = 1;
- desc.BindFlags = D3D11_BIND_RENDER_TARGET;
- ID3D11Device *const device = enc->device;
- ID3D11Texture2D *tex;
- HRESULT hr = device->lpVtbl->CreateTexture2D(device, &desc, NULL, &tex);
- if (FAILED(hr)) {
- error_hr("Failed to create texture");
- return false;
- }
- tex->lpVtbl->SetEvictionPriority(tex, DXGI_RESOURCE_PRIORITY_MAXIMUM);
- uint32_t struct_ver = enc->needs_compat_ver
- ? NV_ENC_REGISTER_RESOURCE_COMPAT_VER
- : NV_ENC_REGISTER_RESOURCE_VER;
- NV_ENC_REGISTER_RESOURCE res = {struct_ver};
- res.resourceType = NV_ENC_INPUT_RESOURCE_TYPE_DIRECTX;
- res.resourceToRegister = tex;
- res.width = enc->cx;
- res.height = enc->cy;
- res.bufferFormat = p010 ? NV_ENC_BUFFER_FORMAT_YUV420_10BIT
- : NV_ENC_BUFFER_FORMAT_NV12;
- if (NV_FAILED(nv.nvEncRegisterResource(enc->session, &res))) {
- tex->lpVtbl->Release(tex);
- return false;
- }
- nvtex->res = res.registeredResource;
- nvtex->tex = tex;
- nvtex->mapped_res = NULL;
- return true;
- }
- static void nv_texture_free(struct nvenc_data *enc, struct nv_texture *nvtex)
- {
- if (nvtex->res) {
- if (nvtex->mapped_res) {
- nv.nvEncUnmapInputResource(enc->session,
- nvtex->mapped_res);
- }
- nv.nvEncUnregisterResource(enc->session, nvtex->res);
- nvtex->tex->lpVtbl->Release(nvtex->tex);
- }
- }
- #endif
- /* ------------------------------------------------------------------------- */
- /* CUDA Stuff */
- /* CUDA error handling */
- static inline bool cuda_error_check(struct nvenc_data *enc, CUresult res,
- const char *func, const char *call)
- {
- if (res == CUDA_SUCCESS)
- return true;
- const char *name, *desc;
- if (cuda_get_error_desc(res, &name, &desc)) {
- error("%s: CUDA call \"%s\" failed with %s (%d): %s", func,
- call, name, res, desc);
- } else {
- error("%s: CUDA call \"%s\" failed with %d", func, call, res);
- }
- return false;
- }
- #define CU_FAILED(call) \
- if (!cuda_error_check(enc, call, __FUNCTION__, #call)) \
- return false;
- #define CU_CHECK(call) \
- if (!cuda_error_check(enc, call, __FUNCTION__, #call)) { \
- success = false; \
- goto unmap; \
- }
- /* CUDA Surfaces */
- struct nv_cuda_surface {
- CUarray tex;
- NV_ENC_REGISTERED_PTR res;
- NV_ENC_INPUT_PTR *mapped_res;
- };
- /* Missing from ffmpeg nvcodec headers, required for CUDA arrays to be usable in NVENC */
- static const int CUDA_ARRAY3D_SURFACE_LDST = 0x02;
- static bool nv_cuda_surface_init(struct nvenc_data *enc,
- struct nv_cuda_surface *nvsurf)
- {
- const bool p010 = obs_p010_tex_active();
- CUDA_ARRAY3D_DESCRIPTOR desc;
- desc.Width = enc->cx;
- desc.Height = enc->cy;
- desc.Depth = 0;
- desc.Flags = CUDA_ARRAY3D_SURFACE_LDST;
- desc.NumChannels = 1;
- if (!enc->fallback) {
- desc.Format = p010 ? CU_AD_FORMAT_UNSIGNED_INT16
- : CU_AD_FORMAT_UNSIGNED_INT8;
- desc.Height = enc->cy + enc->cy / 2;
- } else {
- switch (enc->surface_format) {
- case NV_ENC_BUFFER_FORMAT_NV12:
- desc.Format = CU_AD_FORMAT_UNSIGNED_INT8;
- // Additional half-height plane for UV data
- desc.Height += enc->cy / 2;
- break;
- case NV_ENC_BUFFER_FORMAT_YUV420_10BIT:
- desc.Format = CU_AD_FORMAT_UNSIGNED_INT16;
- desc.Height += enc->cy / 2;
- desc.NumChannels = 2; // number of bytes per element
- break;
- case NV_ENC_BUFFER_FORMAT_YUV444:
- desc.Format = CU_AD_FORMAT_UNSIGNED_INT8;
- desc.Height *= 3; // 3 full-size planes
- break;
- default:
- error("Unknown input format: %d", enc->surface_format);
- return false;
- }
- }
- CU_FAILED(cu->cuArray3DCreate(&nvsurf->tex, &desc))
- NV_ENC_REGISTER_RESOURCE res = {0};
- res.version = enc->needs_compat_ver
- ? NV_ENC_REGISTER_RESOURCE_COMPAT_VER
- : NV_ENC_REGISTER_RESOURCE_VER;
- res.resourceType = NV_ENC_INPUT_RESOURCE_TYPE_CUDAARRAY;
- res.resourceToRegister = (void *)nvsurf->tex;
- res.width = enc->cx;
- res.height = enc->cy;
- res.pitch = (uint32_t)(desc.Width * desc.NumChannels);
- if (!enc->fallback) {
- res.bufferFormat = p010 ? NV_ENC_BUFFER_FORMAT_YUV420_10BIT
- : NV_ENC_BUFFER_FORMAT_NV12;
- } else {
- res.bufferFormat = enc->surface_format;
- }
- if (NV_FAILED(nv.nvEncRegisterResource(enc->session, &res))) {
- return false;
- }
- nvsurf->res = res.registeredResource;
- nvsurf->mapped_res = NULL;
- return true;
- }
- static void nv_cuda_surface_free(struct nvenc_data *enc,
- struct nv_cuda_surface *nvsurf)
- {
- if (nvsurf->res) {
- if (nvsurf->mapped_res) {
- nv.nvEncUnmapInputResource(enc->session,
- nvsurf->mapped_res);
- }
- nv.nvEncUnregisterResource(enc->session, nvsurf->res);
- cu->cuArrayDestroy(nvsurf->tex);
- }
- }
- /* ------------------------------------------------------------------------- */
- /* Implementation */
/* Name string for the H.264 encoder; `type_data` is not used. */
static const char *h264_nvenc_get_name(void *type_data)
{
	UNUSED_PARAMETER(type_data);

	return "NVIDIA NVENC H.264";
}
/* Name string for the H.264 fallback encoder; `type_data` is not used. */
static const char *h264_nvenc_soft_get_name(void *type_data)
{
	UNUSED_PARAMETER(type_data);

	return "NVIDIA NVENC H.264 (Fallback)";
}
- #ifdef ENABLE_HEVC
/* Name string for the HEVC encoder; `type_data` is not used. */
static const char *hevc_nvenc_get_name(void *type_data)
{
	UNUSED_PARAMETER(type_data);

	return "NVIDIA NVENC HEVC";
}
/* Name string for the HEVC fallback encoder; `type_data` is not used. */
static const char *hevc_nvenc_soft_get_name(void *type_data)
{
	UNUSED_PARAMETER(type_data);

	return "NVIDIA NVENC HEVC (Fallback)";
}
- #endif
/* Name string for the AV1 encoder; `type_data` is not used. */
static const char *av1_nvenc_get_name(void *type_data)
{
	UNUSED_PARAMETER(type_data);

	return "NVIDIA NVENC AV1";
}
/* Name string for the AV1 fallback encoder; `type_data` is not used. */
static const char *av1_nvenc_soft_get_name(void *type_data)
{
	UNUSED_PARAMETER(type_data);

	return "NVIDIA NVENC AV1 (Fallback)";
}
- static inline int nv_get_cap(struct nvenc_data *enc, NV_ENC_CAPS cap)
- {
- if (!enc->session)
- return 0;
- NV_ENC_CAPS_PARAM param = {NV_ENC_CAPS_PARAM_VER};
- int v;
- param.capsToQuery = cap;
- nv.nvEncGetEncodeCaps(enc->session, enc->codec_guid, ¶m, &v);
- return v;
- }
- static bool nvenc_update(void *data, obs_data_t *settings)
- {
- struct nvenc_data *enc = data;
- /* Only support reconfiguration of CBR bitrate */
- if (enc->can_change_bitrate) {
- int bitrate = (int)obs_data_get_int(settings, "bitrate");
- int max_bitrate =
- (int)obs_data_get_int(settings, "max_bitrate");
- bool vbr = (enc->config.rcParams.rateControlMode ==
- NV_ENC_PARAMS_RC_VBR);
- enc->config.rcParams.averageBitRate = bitrate * 1000;
- enc->config.rcParams.maxBitRate = vbr ? max_bitrate * 1000
- : bitrate * 1000;
- NV_ENC_RECONFIGURE_PARAMS params = {0};
- params.version = NV_ENC_RECONFIGURE_PARAMS_VER;
- params.reInitEncodeParams = enc->params;
- params.resetEncoder = 1;
- params.forceIDR = 1;
- if (NV_FAILED(nv.nvEncReconfigureEncoder(enc->session,
- ¶ms))) {
- return false;
- }
- }
- return true;
- }
- #ifdef _WIN32
- static HANDLE get_lib(struct nvenc_data *enc, const char *lib)
- {
- HMODULE mod = GetModuleHandleA(lib);
- if (mod)
- return mod;
- mod = LoadLibraryA(lib);
- if (!mod)
- error("Failed to load %s", lib);
- return mod;
- }
- typedef HRESULT(WINAPI *CREATEDXGIFACTORY1PROC)(REFIID, void **);
- static bool init_d3d11(struct nvenc_data *enc, obs_data_t *settings)
- {
- HMODULE dxgi = get_lib(enc, "DXGI.dll");
- HMODULE d3d11 = get_lib(enc, "D3D11.dll");
- CREATEDXGIFACTORY1PROC create_dxgi;
- PFN_D3D11_CREATE_DEVICE create_device;
- IDXGIFactory1 *factory;
- IDXGIAdapter *adapter;
- ID3D11Device *device;
- ID3D11DeviceContext *context;
- HRESULT hr;
- if (!dxgi || !d3d11) {
- return false;
- }
- create_dxgi = (CREATEDXGIFACTORY1PROC)GetProcAddress(
- dxgi, "CreateDXGIFactory1");
- create_device = (PFN_D3D11_CREATE_DEVICE)GetProcAddress(
- d3d11, "D3D11CreateDevice");
- if (!create_dxgi || !create_device) {
- error("Failed to load D3D11/DXGI procedures");
- return false;
- }
- hr = create_dxgi(&IID_IDXGIFactory1, &factory);
- if (FAILED(hr)) {
- error_hr("CreateDXGIFactory1 failed");
- return false;
- }
- hr = factory->lpVtbl->EnumAdapters(factory, 0, &adapter);
- factory->lpVtbl->Release(factory);
- if (FAILED(hr)) {
- error_hr("EnumAdapters failed");
- return false;
- }
- hr = create_device(adapter, D3D_DRIVER_TYPE_UNKNOWN, NULL, 0, NULL, 0,
- D3D11_SDK_VERSION, &device, NULL, &context);
- adapter->lpVtbl->Release(adapter);
- if (FAILED(hr)) {
- error_hr("D3D11CreateDevice failed");
- return false;
- }
- enc->device = device;
- enc->context = context;
- return true;
- }
- #endif
- static bool init_session(struct nvenc_data *enc)
- {
- NV_ENC_OPEN_ENCODE_SESSION_EX_PARAMS params = {
- NV_ENC_OPEN_ENCODE_SESSION_EX_PARAMS_VER};
- params.apiVersion = enc->needs_compat_ver ? NVENC_COMPAT_VER
- : NVENCAPI_VERSION;
- #ifdef _WIN32
- if (enc->fallback) {
- params.device = enc->cu_ctx;
- params.deviceType = NV_ENC_DEVICE_TYPE_CUDA;
- } else {
- params.device = enc->device;
- params.deviceType = NV_ENC_DEVICE_TYPE_DIRECTX;
- }
- #else
- params.device = enc->cu_ctx;
- params.deviceType = NV_ENC_DEVICE_TYPE_CUDA;
- #endif
- if (NV_FAILED(nv.nvEncOpenEncodeSessionEx(¶ms, &enc->session))) {
- return false;
- }
- return true;
- }
- static void initialize_params(struct nvenc_data *enc, const GUID *nv_preset,
- NV_ENC_TUNING_INFO nv_tuning, uint32_t width,
- uint32_t height, uint32_t fps_num,
- uint32_t fps_den)
- {
- int darWidth, darHeight;
- av_reduce(&darWidth, &darHeight, width, height, 1024 * 1024);
- NV_ENC_INITIALIZE_PARAMS *params = &enc->params;
- memset(params, 0, sizeof(*params));
- params->version = enc->needs_compat_ver
- ? NV_ENC_INITIALIZE_PARAMS_COMPAT_VER
- : NV_ENC_INITIALIZE_PARAMS_VER;
- params->encodeGUID = enc->codec_guid;
- params->presetGUID = *nv_preset;
- params->encodeWidth = width;
- params->encodeHeight = height;
- params->darWidth = enc->codec == CODEC_AV1 ? width : (uint32_t)darWidth;
- params->darHeight = enc->codec == CODEC_AV1 ? height
- : (uint32_t)darHeight;
- params->frameRateNum = fps_num;
- params->frameRateDen = fps_den;
- params->enableEncodeAsync = 0;
- params->enablePTD = 1;
- params->encodeConfig = &enc->config;
- params->tuningInfo = nv_tuning;
- }
- static inline GUID get_nv_preset2(const char *preset2)
- {
- if (astrcmpi(preset2, "p1") == 0) {
- return NV_ENC_PRESET_P1_GUID;
- } else if (astrcmpi(preset2, "p2") == 0) {
- return NV_ENC_PRESET_P2_GUID;
- } else if (astrcmpi(preset2, "p3") == 0) {
- return NV_ENC_PRESET_P3_GUID;
- } else if (astrcmpi(preset2, "p4") == 0) {
- return NV_ENC_PRESET_P4_GUID;
- } else if (astrcmpi(preset2, "p6") == 0) {
- return NV_ENC_PRESET_P6_GUID;
- } else if (astrcmpi(preset2, "p7") == 0) {
- return NV_ENC_PRESET_P7_GUID;
- } else {
- return NV_ENC_PRESET_P5_GUID;
- }
- }
- static inline NV_ENC_TUNING_INFO get_nv_tuning(const char *tuning)
- {
- if (astrcmpi(tuning, "ll") == 0) {
- return NV_ENC_TUNING_INFO_LOW_LATENCY;
- } else if (astrcmpi(tuning, "ull") == 0) {
- return NV_ENC_TUNING_INFO_ULTRA_LOW_LATENCY;
- } else {
- return NV_ENC_TUNING_INFO_HIGH_QUALITY;
- }
- }
- static inline NV_ENC_MULTI_PASS get_nv_multipass(const char *multipass)
- {
- if (astrcmpi(multipass, "qres") == 0) {
- return NV_ENC_TWO_PASS_QUARTER_RESOLUTION;
- } else if (astrcmpi(multipass, "fullres") == 0) {
- return NV_ENC_TWO_PASS_FULL_RESOLUTION;
- } else {
- return NV_ENC_MULTI_PASS_DISABLED;
- }
- }
- static bool is_10_bit(const struct nvenc_data *enc)
- {
- return enc->fallback ? enc->in_format == VIDEO_FORMAT_P010
- : obs_p010_tex_active();
- }
- static bool init_encoder_base(struct nvenc_data *enc, obs_data_t *settings,
- int bf, bool compatibility, bool *lossless)
- {
- const char *rc = obs_data_get_string(settings, "rate_control");
- int bitrate = (int)obs_data_get_int(settings, "bitrate");
- int max_bitrate = (int)obs_data_get_int(settings, "max_bitrate");
- int cqp = (int)obs_data_get_int(settings, "cqp");
- int keyint_sec = (int)obs_data_get_int(settings, "keyint_sec");
- const char *preset = obs_data_get_string(settings, "preset");
- const char *preset2 = obs_data_get_string(settings, "preset2");
- const char *tuning = obs_data_get_string(settings, "tune");
- const char *multipass = obs_data_get_string(settings, "multipass");
- const char *profile = obs_data_get_string(settings, "profile");
- bool lookahead = obs_data_get_bool(settings, "lookahead");
- bool vbr = astrcmpi(rc, "VBR") == 0;
- bool psycho_aq = !compatibility &&
- obs_data_get_bool(settings, "psycho_aq");
- bool disable_scenecut = obs_data_get_bool(settings, "disable_scenecut");
- NVENCSTATUS err;
- video_t *video = obs_encoder_video(enc->encoder);
- const struct video_output_info *voi = video_output_get_info(video);
- enc->cx = obs_encoder_get_width(enc->encoder);
- enc->cy = obs_encoder_get_height(enc->encoder);
- /* -------------------------- */
- /* get preset */
- GUID nv_preset = get_nv_preset2(preset2);
- NV_ENC_TUNING_INFO nv_tuning = get_nv_tuning(tuning);
- NV_ENC_MULTI_PASS nv_multipass = compatibility
- ? NV_ENC_MULTI_PASS_DISABLED
- : get_nv_multipass(multipass);
- if (obs_data_has_user_value(settings, "preset") &&
- !obs_data_has_user_value(settings, "preset2") &&
- enc->codec == CODEC_H264) {
- if (astrcmpi(preset, "mq") == 0) {
- nv_preset = NV_ENC_PRESET_P5_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_HIGH_QUALITY;
- nv_multipass = NV_ENC_TWO_PASS_QUARTER_RESOLUTION;
- } else if (astrcmpi(preset, "hq") == 0) {
- nv_preset = NV_ENC_PRESET_P5_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_HIGH_QUALITY;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- } else if (astrcmpi(preset, "default") == 0) {
- nv_preset = NV_ENC_PRESET_P3_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_HIGH_QUALITY;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- } else if (astrcmpi(preset, "hp") == 0) {
- nv_preset = NV_ENC_PRESET_P1_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_HIGH_QUALITY;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- } else if (astrcmpi(preset, "ll") == 0) {
- nv_preset = NV_ENC_PRESET_P3_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_LOW_LATENCY;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- } else if (astrcmpi(preset, "llhq") == 0) {
- nv_preset = NV_ENC_PRESET_P4_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_LOW_LATENCY;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- } else if (astrcmpi(preset, "llhp") == 0) {
- nv_preset = NV_ENC_PRESET_P2_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_LOW_LATENCY;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- }
- } else if (obs_data_has_user_value(settings, "preset") &&
- !obs_data_has_user_value(settings, "preset2") &&
- enc->codec == CODEC_HEVC) {
- if (astrcmpi(preset, "mq") == 0) {
- nv_preset = NV_ENC_PRESET_P6_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_HIGH_QUALITY;
- nv_multipass = NV_ENC_TWO_PASS_QUARTER_RESOLUTION;
- } else if (astrcmpi(preset, "hq") == 0) {
- nv_preset = NV_ENC_PRESET_P6_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_HIGH_QUALITY;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- } else if (astrcmpi(preset, "default") == 0) {
- nv_preset = NV_ENC_PRESET_P5_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_HIGH_QUALITY;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- } else if (astrcmpi(preset, "hp") == 0) {
- nv_preset = NV_ENC_PRESET_P1_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_HIGH_QUALITY;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- } else if (astrcmpi(preset, "ll") == 0) {
- nv_preset = NV_ENC_PRESET_P3_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_LOW_LATENCY;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- } else if (astrcmpi(preset, "llhq") == 0) {
- nv_preset = NV_ENC_PRESET_P4_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_LOW_LATENCY;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- } else if (astrcmpi(preset, "llhp") == 0) {
- nv_preset = NV_ENC_PRESET_P2_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_LOW_LATENCY;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- }
- }
- const bool rc_lossless = astrcmpi(rc, "lossless") == 0;
- *lossless = rc_lossless;
- if (rc_lossless) {
- *lossless =
- nv_get_cap(enc, NV_ENC_CAPS_SUPPORT_LOSSLESS_ENCODE);
- if (*lossless) {
- nv_tuning = NV_ENC_TUNING_INFO_LOSSLESS;
- nv_multipass = NV_ENC_MULTI_PASS_DISABLED;
- } else {
- warn("lossless encode is not supported, ignoring");
- nv_preset = NV_ENC_PRESET_P5_GUID;
- nv_tuning = NV_ENC_TUNING_INFO_HIGH_QUALITY;
- nv_multipass = NV_ENC_TWO_PASS_QUARTER_RESOLUTION;
- }
- }
- /* -------------------------- */
- /* get preset default config */
- uint32_t config_ver = enc->needs_compat_ver ? NV_ENC_CONFIG_COMPAT_VER
- : NV_ENC_CONFIG_VER;
- NV_ENC_PRESET_CONFIG preset_config = {NV_ENC_PRESET_CONFIG_VER,
- {config_ver}};
- err = nv.nvEncGetEncodePresetConfigEx(enc->session, enc->codec_guid,
- nv_preset, nv_tuning,
- &preset_config);
- if (nv_failed(enc->encoder, err, __FUNCTION__,
- "nvEncGetEncodePresetConfig")) {
- return false;
- }
- /* -------------------------- */
- /* main configuration */
- enc->config = preset_config.presetCfg;
- uint32_t gop_size =
- (keyint_sec) ? keyint_sec * voi->fps_num / voi->fps_den : 250;
- NV_ENC_CONFIG *config = &enc->config;
- initialize_params(enc, &nv_preset, nv_tuning, voi->width, voi->height,
- voi->fps_num, voi->fps_den);
- config->gopLength = gop_size;
- config->frameIntervalP = 1 + bf;
- enc->bframes = bf;
- /* lookahead */
- const bool use_profile_lookahead = config->rcParams.enableLookahead;
- lookahead = nv_get_cap(enc, NV_ENC_CAPS_SUPPORT_LOOKAHEAD) &&
- (lookahead || use_profile_lookahead);
- if (lookahead) {
- enc->rc_lookahead = use_profile_lookahead
- ? config->rcParams.lookaheadDepth
- : 8;
- }
- int buf_count = max(4, config->frameIntervalP * 2 * 2);
- if (lookahead) {
- buf_count = max(buf_count, config->frameIntervalP +
- enc->rc_lookahead +
- EXTRA_BUFFERS);
- }
- buf_count = min(64, buf_count);
- enc->buf_count = buf_count;
- const int output_delay = buf_count - 1;
- enc->output_delay = output_delay;
- if (lookahead) {
- const int lkd_bound = output_delay - config->frameIntervalP - 4;
- if (lkd_bound >= 0) {
- config->rcParams.enableLookahead = 1;
- config->rcParams.lookaheadDepth =
- max(enc->rc_lookahead, lkd_bound);
- config->rcParams.disableIadapt = 0;
- config->rcParams.disableBadapt = 0;
- } else {
- lookahead = false;
- }
- }
- enc->config.rcParams.disableIadapt = disable_scenecut;
- /* psycho aq */
- if (!compatibility) {
- if (nv_get_cap(enc, NV_ENC_CAPS_SUPPORT_TEMPORAL_AQ)) {
- config->rcParams.enableAQ = psycho_aq;
- config->rcParams.aqStrength = 8;
- config->rcParams.enableTemporalAQ = psycho_aq;
- } else {
- warn("Ignoring Psycho Visual Tuning request since GPU is not capable");
- }
- }
- /* -------------------------- */
- /* rate control */
- enc->can_change_bitrate =
- nv_get_cap(enc, NV_ENC_CAPS_SUPPORT_DYN_BITRATE_CHANGE);
- config->rcParams.rateControlMode = NV_ENC_PARAMS_RC_VBR;
- if (astrcmpi(rc, "cqp") == 0 || rc_lossless) {
- if (*lossless)
- cqp = 0;
- int cqp_val = enc->codec == CODEC_AV1 ? cqp * 4 : cqp;
- config->rcParams.rateControlMode = NV_ENC_PARAMS_RC_CONSTQP;
- config->rcParams.constQP.qpInterP = cqp_val;
- config->rcParams.constQP.qpInterB = cqp_val;
- config->rcParams.constQP.qpIntra = cqp_val;
- enc->can_change_bitrate = false;
- bitrate = 0;
- max_bitrate = 0;
- } else if (astrcmpi(rc, "vbr") != 0) { /* CBR by default */
- config->rcParams.rateControlMode = NV_ENC_PARAMS_RC_CBR;
- }
- config->rcParams.averageBitRate = bitrate * 1000;
- config->rcParams.maxBitRate = vbr ? max_bitrate * 1000 : bitrate * 1000;
- config->rcParams.vbvBufferSize = bitrate * 1000;
- config->rcParams.multiPass = nv_multipass;
- config->rcParams.qpMapMode = NV_ENC_QP_MAP_DELTA;
- /* -------------------------- */
- /* initialize */
- info("settings:\n"
- "\tcodec: %s\n"
- "\trate_control: %s\n"
- "\tbitrate: %d\n"
- "\tcqp: %d\n"
- "\tkeyint: %d\n"
- "\tpreset: %s\n"
- "\ttuning: %s\n"
- "\tmultipass: %s\n"
- "\tprofile: %s\n"
- "\twidth: %d\n"
- "\theight: %d\n"
- "\tb-frames: %d\n"
- "\tlookahead: %s\n"
- "\tpsycho_aq: %s\n",
- get_codec_name(enc->codec), rc, bitrate, cqp, gop_size, preset2,
- tuning, multipass, profile, enc->cx, enc->cy, bf,
- lookahead ? "true" : "false", psycho_aq ? "true" : "false");
- return true;
- }
- static bool init_encoder_h264(struct nvenc_data *enc, obs_data_t *settings,
- int bf, bool compatibility)
- {
- const char *rc = obs_data_get_string(settings, "rate_control");
- int keyint_sec = (int)obs_data_get_int(settings, "keyint_sec");
- const char *profile = obs_data_get_string(settings, "profile");
- bool lossless;
- if (!init_encoder_base(enc, settings, bf, compatibility, &lossless)) {
- return false;
- }
- NV_ENC_CONFIG *config = &enc->config;
- NV_ENC_CONFIG_H264 *h264_config = &config->encodeCodecConfig.h264Config;
- NV_ENC_CONFIG_H264_VUI_PARAMETERS *vui_params =
- &h264_config->h264VUIParameters;
- video_t *video = obs_encoder_video(enc->encoder);
- const struct video_output_info *voi = video_output_get_info(video);
- uint32_t gop_size =
- (keyint_sec) ? keyint_sec * voi->fps_num / voi->fps_den : 250;
- h264_config->idrPeriod = gop_size;
- bool repeat_headers = obs_data_get_bool(settings, "repeat_headers");
- if (repeat_headers) {
- h264_config->repeatSPSPPS = 1;
- h264_config->disableSPSPPS = 0;
- h264_config->outputAUD = 1;
- }
- h264_config->sliceMode = 3;
- h264_config->sliceModeData = 1;
- h264_config->useBFramesAsRef = NV_ENC_BFRAME_REF_MODE_DISABLED;
- /* Enable CBR padding */
- if (config->rcParams.rateControlMode == NV_ENC_PARAMS_RC_CBR)
- h264_config->enableFillerDataInsertion = 1;
- vui_params->videoSignalTypePresentFlag = 1;
- vui_params->videoFullRangeFlag = (voi->range == VIDEO_RANGE_FULL);
- vui_params->colourDescriptionPresentFlag = 1;
- switch (voi->colorspace) {
- case VIDEO_CS_601:
- vui_params->colourPrimaries = 6;
- vui_params->transferCharacteristics = 6;
- vui_params->colourMatrix = 6;
- break;
- case VIDEO_CS_DEFAULT:
- case VIDEO_CS_709:
- vui_params->colourPrimaries = 1;
- vui_params->transferCharacteristics = 1;
- vui_params->colourMatrix = 1;
- break;
- case VIDEO_CS_SRGB:
- vui_params->colourPrimaries = 1;
- vui_params->transferCharacteristics = 13;
- vui_params->colourMatrix = 1;
- break;
- default:
- break;
- }
- if (astrcmpi(rc, "lossless") == 0) {
- h264_config->qpPrimeYZeroTransformBypassFlag = 1;
- } else if (astrcmpi(rc, "vbr") != 0) { /* CBR */
- h264_config->outputBufferingPeriodSEI = 1;
- }
- h264_config->outputPictureTimingSEI = 1;
- /* -------------------------- */
- /* profile */
- if (enc->in_format == VIDEO_FORMAT_I444) {
- config->profileGUID = NV_ENC_H264_PROFILE_HIGH_444_GUID;
- h264_config->chromaFormatIDC = 3;
- } else if (astrcmpi(profile, "main") == 0) {
- config->profileGUID = NV_ENC_H264_PROFILE_MAIN_GUID;
- } else if (astrcmpi(profile, "baseline") == 0) {
- config->profileGUID = NV_ENC_H264_PROFILE_BASELINE_GUID;
- } else if (!lossless) {
- config->profileGUID = NV_ENC_H264_PROFILE_HIGH_GUID;
- }
- if (NV_FAILED(nv.nvEncInitializeEncoder(enc->session, &enc->params))) {
- return false;
- }
- return true;
- }
- static bool init_encoder_hevc(struct nvenc_data *enc, obs_data_t *settings,
- int bf, bool compatibility)
- {
- const char *rc = obs_data_get_string(settings, "rate_control");
- int keyint_sec = (int)obs_data_get_int(settings, "keyint_sec");
- const char *profile = obs_data_get_string(settings, "profile");
- bool lossless;
- if (!init_encoder_base(enc, settings, bf, compatibility, &lossless)) {
- return false;
- }
- NV_ENC_CONFIG *config = &enc->config;
- NV_ENC_CONFIG_HEVC *hevc_config = &config->encodeCodecConfig.hevcConfig;
- NV_ENC_CONFIG_HEVC_VUI_PARAMETERS *vui_params =
- &hevc_config->hevcVUIParameters;
- video_t *video = obs_encoder_video(enc->encoder);
- const struct video_output_info *voi = video_output_get_info(video);
- uint32_t gop_size =
- (keyint_sec) ? keyint_sec * voi->fps_num / voi->fps_den : 250;
- hevc_config->idrPeriod = gop_size;
- bool repeat_headers = obs_data_get_bool(settings, "repeat_headers");
- if (repeat_headers) {
- hevc_config->repeatSPSPPS = 1;
- hevc_config->disableSPSPPS = 0;
- hevc_config->outputAUD = 1;
- }
- hevc_config->sliceMode = 3;
- hevc_config->sliceModeData = 1;
- hevc_config->useBFramesAsRef = NV_ENC_BFRAME_REF_MODE_DISABLED;
- /* Enable CBR padding */
- if (config->rcParams.rateControlMode == NV_ENC_PARAMS_RC_CBR)
- hevc_config->enableFillerDataInsertion = 1;
- vui_params->videoSignalTypePresentFlag = 1;
- vui_params->videoFullRangeFlag = (voi->range == VIDEO_RANGE_FULL);
- vui_params->colourDescriptionPresentFlag = 1;
- switch (voi->colorspace) {
- case VIDEO_CS_601:
- vui_params->colourPrimaries = 6;
- vui_params->transferCharacteristics = 6;
- vui_params->colourMatrix = 6;
- break;
- case VIDEO_CS_DEFAULT:
- case VIDEO_CS_709:
- vui_params->colourPrimaries = 1;
- vui_params->transferCharacteristics = 1;
- vui_params->colourMatrix = 1;
- break;
- case VIDEO_CS_SRGB:
- vui_params->colourPrimaries = 1;
- vui_params->transferCharacteristics = 13;
- vui_params->colourMatrix = 1;
- break;
- case VIDEO_CS_2100_PQ:
- vui_params->colourPrimaries = 9;
- vui_params->transferCharacteristics = 16;
- vui_params->colourMatrix = 9;
- vui_params->chromaSampleLocationFlag = 1;
- vui_params->chromaSampleLocationTop = 2;
- vui_params->chromaSampleLocationBot = 2;
- break;
- case VIDEO_CS_2100_HLG:
- vui_params->colourPrimaries = 9;
- vui_params->transferCharacteristics = 18;
- vui_params->colourMatrix = 9;
- vui_params->chromaSampleLocationFlag = 1;
- vui_params->chromaSampleLocationTop = 2;
- vui_params->chromaSampleLocationBot = 2;
- }
- hevc_config->pixelBitDepthMinus8 = is_10_bit(enc) ? 2 : 0;
- if (astrcmpi(rc, "cbr") == 0) {
- hevc_config->outputBufferingPeriodSEI = 1;
- }
- hevc_config->outputPictureTimingSEI = 1;
- /* -------------------------- */
- /* profile */
- if (enc->in_format == VIDEO_FORMAT_I444) {
- config->profileGUID = NV_ENC_HEVC_PROFILE_FREXT_GUID;
- hevc_config->chromaFormatIDC = 3;
- } else if (astrcmpi(profile, "main10") == 0) {
- config->profileGUID = NV_ENC_HEVC_PROFILE_MAIN10_GUID;
- } else if (is_10_bit(enc)) {
- blog(LOG_WARNING, "[obs-nvenc] Forcing main10 for P010");
- config->profileGUID = NV_ENC_HEVC_PROFILE_MAIN10_GUID;
- } else {
- config->profileGUID = NV_ENC_HEVC_PROFILE_MAIN_GUID;
- }
- if (NV_FAILED(nv.nvEncInitializeEncoder(enc->session, &enc->params))) {
- return false;
- }
- return true;
- }
- static bool init_encoder_av1(struct nvenc_data *enc, obs_data_t *settings,
- int bf, bool compatibility)
- {
- const char *rc = obs_data_get_string(settings, "rate_control");
- int keyint_sec = (int)obs_data_get_int(settings, "keyint_sec");
- bool lossless;
- if (!init_encoder_base(enc, settings, bf, compatibility, &lossless)) {
- return false;
- }
- NV_ENC_INITIALIZE_PARAMS *params = &enc->params;
- NV_ENC_CONFIG *config = &enc->config;
- NV_ENC_CONFIG_AV1 *av1_config = &config->encodeCodecConfig.av1Config;
- video_t *video = obs_encoder_video(enc->encoder);
- const struct video_output_info *voi = video_output_get_info(video);
- uint32_t gop_size =
- (keyint_sec) ? keyint_sec * voi->fps_num / voi->fps_den : 250;
- av1_config->idrPeriod = gop_size;
- av1_config->useBFramesAsRef = NV_ENC_BFRAME_REF_MODE_DISABLED;
- av1_config->colorRange = (voi->range == VIDEO_RANGE_FULL);
- /* Enable CBR padding */
- if (config->rcParams.rateControlMode == NV_ENC_PARAMS_RC_CBR)
- av1_config->enableBitstreamPadding = 1;
- #define PIXELCOUNT_4K (3840 * 2160)
- /* If size is 4K+, set tiles to 2 uniform columns. */
- if ((voi->width * voi->height) >= PIXELCOUNT_4K) {
- av1_config->enableCustomTileConfig = 0;
- av1_config->numTileColumns = 2;
- }
- switch (voi->colorspace) {
- case VIDEO_CS_601:
- av1_config->colorPrimaries = 6;
- av1_config->transferCharacteristics = 6;
- av1_config->matrixCoefficients = 6;
- break;
- case VIDEO_CS_DEFAULT:
- case VIDEO_CS_709:
- av1_config->colorPrimaries = 1;
- av1_config->transferCharacteristics = 1;
- av1_config->matrixCoefficients = 1;
- break;
- case VIDEO_CS_SRGB:
- av1_config->colorPrimaries = 1;
- av1_config->transferCharacteristics = 13;
- av1_config->matrixCoefficients = 1;
- break;
- case VIDEO_CS_2100_PQ:
- av1_config->colorPrimaries = 9;
- av1_config->transferCharacteristics = 16;
- av1_config->matrixCoefficients = 9;
- break;
- case VIDEO_CS_2100_HLG:
- av1_config->colorPrimaries = 9;
- av1_config->transferCharacteristics = 18;
- av1_config->matrixCoefficients = 9;
- }
- /* -------------------------- */
- /* profile */
- config->profileGUID = NV_ENC_AV1_PROFILE_MAIN_GUID;
- av1_config->tier = NV_ENC_TIER_AV1_0;
- av1_config->level = NV_ENC_LEVEL_AV1_AUTOSELECT;
- av1_config->chromaFormatIDC = 1;
- av1_config->pixelBitDepthMinus8 = is_10_bit(enc) ? 2 : 0;
- av1_config->inputPixelBitDepthMinus8 = av1_config->pixelBitDepthMinus8;
- av1_config->numFwdRefs = 1;
- av1_config->numBwdRefs = 1;
- av1_config->repeatSeqHdr = 1;
- if (NV_FAILED(nv.nvEncInitializeEncoder(enc->session, &enc->params))) {
- return false;
- }
- return true;
- }
- static bool init_bitstreams(struct nvenc_data *enc)
- {
- da_reserve(enc->bitstreams, enc->buf_count);
- for (uint32_t i = 0; i < enc->buf_count; i++) {
- struct nv_bitstream bitstream;
- if (!nv_bitstream_init(enc, &bitstream)) {
- return false;
- }
- da_push_back(enc->bitstreams, &bitstream);
- }
- return true;
- }
#ifdef _WIN32
/*
 * Creates enc->buf_count encoder textures and appends them to enc->textures
 * (Windows only).
 *
 * Returns false as soon as one texture fails to initialize; textures created
 * before the failure stay in the array.
 */
static bool init_textures(struct nvenc_data *enc)
{
	da_reserve(enc->textures, enc->buf_count);

	uint32_t created = 0;
	while (created < enc->buf_count) {
		struct nv_texture tex;

		if (!nv_texture_init(enc, &tex))
			return false;

		da_push_back(enc->textures, &tex);
		created++;
	}

	return true;
}
#endif
- static bool init_cuda_surfaces(struct nvenc_data *enc)
- {
- switch (enc->in_format) {
- case VIDEO_FORMAT_P010:
- enc->surface_format = NV_ENC_BUFFER_FORMAT_YUV420_10BIT;
- break;
- case VIDEO_FORMAT_I444:
- enc->surface_format = NV_ENC_BUFFER_FORMAT_YUV444;
- break;
- default:
- enc->surface_format = NV_ENC_BUFFER_FORMAT_NV12;
- }
- da_reserve(enc->surfaces, enc->buf_count);
- CU_FAILED(cu->cuCtxPushCurrent(enc->cu_ctx))
- for (uint32_t i = 0; i < enc->buf_count; i++) {
- struct nv_cuda_surface buf;
- if (!nv_cuda_surface_init(enc, &buf)) {
- return false;
- }
- da_push_back(enc->surfaces, &buf);
- }
- CU_FAILED(cu->cuCtxPopCurrent(NULL))
- return true;
- }
- static bool init_cuda_ctx(struct nvenc_data *enc, obs_data_t *settings,
- const bool texture)
- {
- int count, gpu;
- CUdevice device;
- bool cuda_override;
- /* Allow CUDA device override for texture encoders (experimental) */
- if (obs_data_has_user_value(settings, "cuda_device")) {
- gpu = (int)obs_data_get_int(settings, "cuda_device");
- cuda_override = true;
- } else {
- gpu = (int)obs_data_get_int(settings, "gpu");
- cuda_override = false;
- }
- CU_FAILED(cu->cuInit(0))
- CU_FAILED(cu->cuDeviceGetCount(&count))
- if (!count) {
- NV_FAIL("No CUDA devices found");
- return false;
- }
- #ifdef _WIN32
- CU_FAILED(cu->cuDeviceGet(&device, gpu))
- #else
- if (!texture || cuda_override) {
- CU_FAILED(cu->cuDeviceGet(&device, gpu))
- } else {
- unsigned int ctx_count = 0;
- CUdevice devices[2];
- obs_enter_graphics();
- CUresult res = cu->cuGLGetDevices(&ctx_count, devices, 2,
- CU_GL_DEVICE_LIST_ALL);
- obs_leave_graphics();
- if (res != CUDA_SUCCESS || !ctx_count) {
- /* CUDA_ERROR_INVALID_GRAPHICS_CONTEXT should be treated
- * as non-fatal fallback (probably running on iGPU). */
- if (res == 219) {
- info("Not running on NVIDIA GPU, falling back to non-texture encoder");
- } else {
- const char *name, *desc;
- if (cuda_get_error_desc(res, &name, &desc)) {
- error("Failed to get a CUDA device for the current OpenGL context: %s: %s",
- name, desc);
- } else {
- error("Failed to get a CUDA device for the current OpenGL context: %d",
- res);
- }
- }
- return false;
- }
- /* Documentation indicates this should only ever happen with SLI, i.e. never for OBS. */
- if (ctx_count > 1) {
- warn("Got more than one CUDA devices for OpenGL context, this is untested.");
- }
- device = devices[0];
- debug("Loading up CUDA on device %u", device);
- }
- #endif
- CU_FAILED(cu->cuCtxCreate(&enc->cu_ctx, 0, device))
- CU_FAILED(cu->cuCtxPopCurrent(NULL))
- return true;
- }
- static enum video_format get_preferred_format(enum video_format format)
- {
- switch (format) {
- case VIDEO_FORMAT_I010:
- case VIDEO_FORMAT_P010:
- return VIDEO_FORMAT_P010;
- case VIDEO_FORMAT_RGBA:
- case VIDEO_FORMAT_BGRA:
- case VIDEO_FORMAT_BGRX:
- case VIDEO_FORMAT_I444:
- return VIDEO_FORMAT_I444;
- default:
- return VIDEO_FORMAT_NV12;
- }
- }
- static void nvenc_destroy(void *data);
- static bool init_specific_encoder(struct nvenc_data *enc, obs_data_t *settings,
- int bf, bool compatibility)
- {
- switch (enc->codec) {
- case CODEC_HEVC:
- return init_encoder_hevc(enc, settings, bf, compatibility);
- case CODEC_H264:
- return init_encoder_h264(enc, settings, bf, compatibility);
- case CODEC_AV1:
- return init_encoder_av1(enc, settings, bf, compatibility);
- }
- return false;
- }
- static bool init_encoder(struct nvenc_data *enc, enum codec_type codec,
- obs_data_t *settings, obs_encoder_t *encoder)
- {
- UNUSED_PARAMETER(codec);
- UNUSED_PARAMETER(encoder);
- int bf = (int)obs_data_get_int(settings, "bf");
- const bool support_10bit =
- nv_get_cap(enc, NV_ENC_CAPS_SUPPORT_10BIT_ENCODE);
- const int bf_max = nv_get_cap(enc, NV_ENC_CAPS_NUM_MAX_BFRAMES);
- video_t *video = obs_encoder_video(enc->encoder);
- const struct video_output_info *voi = video_output_get_info(video);
- enc->in_format = get_preferred_format(voi->format);
- if (is_10_bit(enc) && !support_10bit) {
- NV_FAIL(obs_module_text("NVENC.10bitUnsupported"));
- return false;
- }
- switch (voi->format) {
- case VIDEO_FORMAT_I010:
- case VIDEO_FORMAT_P010:
- break;
- default:
- switch (voi->colorspace) {
- case VIDEO_CS_2100_PQ:
- case VIDEO_CS_2100_HLG:
- NV_FAIL(obs_module_text("NVENC.8bitUnsupportedHdr"));
- return false;
- default:
- break;
- }
- }
- if (bf > bf_max) {
- blog(LOG_WARNING,
- "[obs-nvenc] Max B-frames setting (%d) is more than encoder supports (%d).\n"
- "Setting B-frames to %d",
- bf, bf_max, bf_max);
- bf = bf_max;
- }
- if (!init_specific_encoder(enc, settings, bf, false)) {
- blog(LOG_WARNING, "[obs-nvenc] init_specific_encoder failed, "
- "trying again with compatibility options");
- nv.nvEncDestroyEncoder(enc->session);
- enc->session = NULL;
- if (!init_session(enc)) {
- return false;
- }
- /* try without multipass and psycho aq */
- if (!init_specific_encoder(enc, settings, bf, true)) {
- return false;
- }
- }
- return true;
- }
- static void *nvenc_create_internal(enum codec_type codec, obs_data_t *settings,
- obs_encoder_t *encoder, bool texture)
- {
- struct nvenc_data *enc = bzalloc(sizeof(*enc));
- enc->encoder = encoder;
- enc->codec = codec;
- enc->first_packet = true;
- enc->fallback = !texture;
- if (get_nvenc_ver() == COMPATIBILITY_VERSION) {
- enc->needs_compat_ver = true;
- }
- NV_ENCODE_API_FUNCTION_LIST init = {NV_ENCODE_API_FUNCTION_LIST_VER};
- switch (enc->codec) {
- case CODEC_H264:
- enc->codec_guid = NV_ENC_CODEC_H264_GUID;
- break;
- case CODEC_HEVC:
- enc->codec_guid = NV_ENC_CODEC_HEVC_GUID;
- break;
- case CODEC_AV1:
- enc->codec_guid = NV_ENC_CODEC_AV1_GUID;
- break;
- }
- if (!init_nvenc(encoder)) {
- goto fail;
- }
- if (
- #ifdef _WIN32
- !texture &&
- #endif
- !init_cuda(encoder)) {
- goto fail;
- }
- if (NV_FAILED(nv_create_instance(&init))) {
- goto fail;
- }
- #ifdef _WIN32
- if (texture && !init_d3d11(enc, settings)) {
- goto fail;
- }
- #endif
- if (
- #ifdef _WIN32
- !texture &&
- #endif
- !init_cuda_ctx(enc, settings, texture)) {
- goto fail;
- }
- if (!init_session(enc)) {
- goto fail;
- }
- if (!init_encoder(enc, codec, settings, encoder)) {
- goto fail;
- }
- if (!init_bitstreams(enc)) {
- goto fail;
- }
- #ifdef _WIN32
- if (texture && !init_textures(enc)) {
- goto fail;
- }
- #endif
- if (
- #ifdef _WIN32
- !texture &&
- #endif
- !init_cuda_surfaces(enc)) {
- goto fail;
- }
- enc->codec = codec;
- if (enc->cu_ctx)
- cu->cuCtxPopCurrent(NULL);
- return enc;
- fail:
- nvenc_destroy(enc);
- return NULL;
- }
- static void *nvenc_create_base(enum codec_type codec, obs_data_t *settings,
- obs_encoder_t *encoder, bool texture)
- {
- /* this encoder requires shared textures, this cannot be used on a
- * gpu other than the one OBS is currently running on. */
- const int gpu = (int)obs_data_get_int(settings, "gpu");
- if (gpu != 0 && texture) {
- blog(LOG_INFO,
- "[obs-nvenc] different GPU selected by user, falling back "
- "to non-texture encoder");
- goto reroute;
- }
- if (obs_encoder_scaling_enabled(encoder)) {
- if (obs_encoder_gpu_scaling_enabled(encoder)) {
- blog(LOG_INFO, "[obs-nvenc] GPU scaling enabled");
- } else if (texture) {
- blog(LOG_INFO,
- "[obs-nvenc] CPU scaling enabled, falling back to"
- " non-texture encoder");
- goto reroute;
- }
- }
- if (texture && !obs_p010_tex_active() && !obs_nv12_tex_active()) {
- blog(LOG_INFO,
- "[obs-nvenc] nv12/p010 not active, falling back to "
- "non-texture encoder");
- goto reroute;
- }
- struct nvenc_data *enc =
- nvenc_create_internal(codec, settings, encoder, texture);
- if (enc) {
- return enc;
- }
- reroute:
- if (!texture) {
- blog(LOG_ERROR,
- "Already in fallback encoder, can't fall back further!");
- return NULL;
- }
- switch (codec) {
- case CODEC_H264:
- return obs_encoder_create_rerouted(encoder,
- "obs_nvenc_h264_cuda");
- case CODEC_HEVC:
- return obs_encoder_create_rerouted(encoder,
- "obs_nvenc_hevc_cuda");
- case CODEC_AV1:
- return obs_encoder_create_rerouted(encoder,
- "obs_nvenc_av1_cuda");
- }
- return NULL;
- }
- static void *h264_nvenc_create(obs_data_t *settings, obs_encoder_t *encoder)
- {
- return nvenc_create_base(CODEC_H264, settings, encoder, true);
- }
- #ifdef ENABLE_HEVC
- static void *hevc_nvenc_create(obs_data_t *settings, obs_encoder_t *encoder)
- {
- return nvenc_create_base(CODEC_HEVC, settings, encoder, true);
- }
- #endif
- static void *av1_nvenc_create(obs_data_t *settings, obs_encoder_t *encoder)
- {
- return nvenc_create_base(CODEC_AV1, settings, encoder, true);
- }
- static void *h264_nvenc_soft_create(obs_data_t *settings,
- obs_encoder_t *encoder)
- {
- return nvenc_create_base(CODEC_H264, settings, encoder, false);
- }
- #ifdef ENABLE_HEVC
- static void *hevc_nvenc_soft_create(obs_data_t *settings,
- obs_encoder_t *encoder)
- {
- return nvenc_create_base(CODEC_HEVC, settings, encoder, false);
- }
- #endif
- static void *av1_nvenc_soft_create(obs_data_t *settings, obs_encoder_t *encoder)
- {
- return nvenc_create_base(CODEC_AV1, settings, encoder, false);
- }
- static bool get_encoded_packet(struct nvenc_data *enc, bool finalize);
- static void nvenc_destroy(void *data)
- {
- struct nvenc_data *enc = data;
- if (enc->cu_ctx)
- cu->cuCtxPushCurrent(enc->cu_ctx);
- if (enc->encode_started) {
- uint32_t struct_ver = enc->needs_compat_ver
- ? NV_ENC_PIC_PARAMS_COMPAT_VER
- : NV_ENC_PIC_PARAMS_VER;
- NV_ENC_PIC_PARAMS params = {struct_ver};
- params.encodePicFlags = NV_ENC_PIC_FLAG_EOS;
- nv.nvEncEncodePicture(enc->session, ¶ms);
- get_encoded_packet(enc, true);
- }
- #ifdef _WIN32
- for (size_t i = 0; i < enc->textures.num; i++) {
- nv_texture_free(enc, &enc->textures.array[i]);
- }
- #endif
- for (size_t i = 0; i < enc->surfaces.num; i++) {
- nv_cuda_surface_free(enc, &enc->surfaces.array[i]);
- }
- for (size_t i = 0; i < enc->bitstreams.num; i++) {
- nv_bitstream_free(enc, &enc->bitstreams.array[i]);
- }
- if (enc->session) {
- nv.nvEncDestroyEncoder(enc->session);
- }
- #ifdef _WIN32
- for (size_t i = 0; i < enc->input_textures.num; i++) {
- ID3D11Texture2D *tex = enc->input_textures.array[i].tex;
- IDXGIKeyedMutex *km = enc->input_textures.array[i].km;
- tex->lpVtbl->Release(tex);
- km->lpVtbl->Release(km);
- }
- if (enc->context) {
- enc->context->lpVtbl->Release(enc->context);
- }
- if (enc->device) {
- enc->device->lpVtbl->Release(enc->device);
- }
- #else
- for (size_t i = 0; i < enc->input_textures.num; i++) {
- CUgraphicsResource res_y = enc->input_textures.array[i].res_y;
- CUgraphicsResource res_uv = enc->input_textures.array[i].res_uv;
- cu->cuGraphicsUnregisterResource(res_y);
- cu->cuGraphicsUnregisterResource(res_uv);
- }
- #endif
- if (enc->cu_ctx) {
- cu->cuCtxPopCurrent(NULL);
- cu->cuCtxDestroy(enc->cu_ctx);
- }
- bfree(enc->header);
- bfree(enc->sei);
- deque_free(&enc->dts_list);
- da_free(enc->surfaces);
- da_free(enc->input_textures);
- da_free(enc->bitstreams);
- #ifdef _WIN32
- da_free(enc->textures);
- #endif
- da_free(enc->packet_data);
- bfree(enc->roi_map);
- bfree(enc);
- }
#ifdef _WIN32
/*
 * Returns the D3D11 texture for a shared texture handle, together with its
 * keyed mutex in *km_out.
 *
 * Handles seen before are served from enc->input_textures. A new handle is
 * opened on the encoder's device, queried for IDXGIKeyedMutex, given maximum
 * eviction priority and added to the cache.
 *
 * Returns NULL (leaving *km_out untouched) if the handle cannot be opened or
 * the texture has no keyed mutex.
 */
static ID3D11Texture2D *get_tex_from_handle(struct nvenc_data *enc,
					    uint32_t handle,
					    IDXGIKeyedMutex **km_out)
{
	HRESULT hr;

	/* fast path: handle already opened earlier */
	struct handle_tex *cached = enc->input_textures.array;
	for (size_t n = enc->input_textures.num; n > 0; n--, cached++) {
		if (cached->handle != handle)
			continue;

		*km_out = cached->km;
		return cached->tex;
	}

	ID3D11Device *device = enc->device;
	ID3D11Texture2D *input_tex;
	hr = device->lpVtbl->OpenSharedResource(device,
						(HANDLE)(uintptr_t)handle,
						&IID_ID3D11Texture2D,
						&input_tex);
	if (FAILED(hr)) {
		error_hr("OpenSharedResource failed");
		return NULL;
	}

	IDXGIKeyedMutex *km;
	hr = input_tex->lpVtbl->QueryInterface(input_tex, &IID_IDXGIKeyedMutex,
					       &km);
	if (FAILED(hr)) {
		error_hr("QueryInterface(IDXGIKeyedMutex) failed");
		/* do not leak the texture opened above */
		input_tex->lpVtbl->Release(input_tex);
		return NULL;
	}

	input_tex->lpVtbl->SetEvictionPriority(input_tex,
					       DXGI_RESOURCE_PRIORITY_MAXIMUM);

	/* remember the texture so the next frame with this handle is a hit */
	struct handle_tex entry = {handle, input_tex, km};
	da_push_back(enc->input_textures, &entry);

	*km_out = km;
	return input_tex;
}
#endif
- static bool get_encoded_packet(struct nvenc_data *enc, bool finalize)
- {
- void *s = enc->session;
- da_resize(enc->packet_data, 0);
- if (!enc->buffers_queued)
- return true;
- if (!finalize && enc->buffers_queued < enc->output_delay)
- return true;
- size_t count = finalize ? enc->buffers_queued : 1;
- for (size_t i = 0; i < count; i++) {
- size_t cur_bs_idx = enc->cur_bitstream;
- struct nv_bitstream *bs = &enc->bitstreams.array[cur_bs_idx];
- #ifdef _WIN32
- struct nv_texture *nvtex =
- enc->fallback ? NULL : &enc->textures.array[cur_bs_idx];
- struct nv_cuda_surface *surf =
- enc->fallback ? &enc->surfaces.array[cur_bs_idx] : NULL;
- #else
- struct nv_cuda_surface *surf = &enc->surfaces.array[cur_bs_idx];
- #endif
- /* ---------------- */
- uint32_t struct_ver = enc->needs_compat_ver
- ? NV_ENC_LOCK_BITSTREAM_COMPAT_VER
- : NV_ENC_LOCK_BITSTREAM_VER;
- NV_ENC_LOCK_BITSTREAM lock = {struct_ver};
- lock.outputBitstream = bs->ptr;
- lock.doNotWait = false;
- if (NV_FAILED(nv.nvEncLockBitstream(s, &lock))) {
- return false;
- }
- if (enc->first_packet) {
- NV_ENC_SEQUENCE_PARAM_PAYLOAD payload = {0};
- uint8_t buf[256];
- uint32_t size = 0;
- payload.version = NV_ENC_SEQUENCE_PARAM_PAYLOAD_VER;
- payload.spsppsBuffer = buf;
- payload.inBufferSize = sizeof(buf);
- payload.outSPSPPSPayloadSize = &size;
- nv.nvEncGetSequenceParams(s, &payload);
- enc->header = bmemdup(buf, size);
- enc->header_size = size;
- enc->first_packet = false;
- }
- da_copy_array(enc->packet_data, lock.bitstreamBufferPtr,
- lock.bitstreamSizeInBytes);
- enc->packet_pts = (int64_t)lock.outputTimeStamp;
- enc->packet_keyframe = lock.pictureType == NV_ENC_PIC_TYPE_IDR;
- if (NV_FAILED(nv.nvEncUnlockBitstream(s, bs->ptr))) {
- return false;
- }
- /* ---------------- */
- #ifdef _WIN32
- if (nvtex && nvtex->mapped_res) {
- NVENCSTATUS err;
- err = nv.nvEncUnmapInputResource(s, nvtex->mapped_res);
- if (nv_failed(enc->encoder, err, __FUNCTION__,
- "unmap")) {
- return false;
- }
- nvtex->mapped_res = NULL;
- }
- #endif
- /* ---------------- */
- if (surf && surf->mapped_res) {
- NVENCSTATUS err;
- err = nv.nvEncUnmapInputResource(s, surf->mapped_res);
- if (nv_failed(enc->encoder, err, __FUNCTION__,
- "unmap")) {
- return false;
- }
- surf->mapped_res = NULL;
- }
- /* ---------------- */
- if (++enc->cur_bitstream == enc->buf_count)
- enc->cur_bitstream = 0;
- enc->buffers_queued--;
- }
- return true;
- }
/* Context handed to roi_cb() while a QP delta map is being built. */
struct roi_params {
	/* map dimensions, in blocks; mb_width is also the row stride */
	uint32_t mb_width;
	uint32_t mb_height;
	/* edge length of one block, in pixels */
	uint32_t mb_size;
	/* true for AV1, which uses a larger QP delta scale */
	bool av1;
	/* row-major map with one QP delta per block */
	int8_t *map;
};
- static void roi_cb(void *param, struct obs_encoder_roi *roi)
- {
- const struct roi_params *rp = param;
- int8_t qp_val;
- /* AV1 has a larger QP range than HEVC/H.264 */
- if (rp->av1) {
- qp_val = (int8_t)(-128.0f * roi->priority);
- } else {
- qp_val = (int8_t)(-51.0f * roi->priority);
- }
- const uint32_t roi_left = roi->left / rp->mb_size;
- const uint32_t roi_top = roi->top / rp->mb_size;
- const uint32_t roi_right = (roi->right - 1) / rp->mb_size;
- const uint32_t roi_bottom = (roi->bottom - 1) / rp->mb_size;
- for (uint32_t mb_y = 0; mb_y < rp->mb_height; mb_y++) {
- if (mb_y < roi_top || mb_y > roi_bottom)
- continue;
- for (uint32_t mb_x = 0; mb_x < rp->mb_width; mb_x++) {
- if (mb_x < roi_left || mb_x > roi_right)
- continue;
- rp->map[mb_y * rp->mb_width + mb_x] = qp_val;
- }
- }
- }
- static void add_roi(struct nvenc_data *enc, NV_ENC_PIC_PARAMS *params)
- {
- const uint32_t increment = obs_encoder_get_roi_increment(enc->encoder);
- if (enc->roi_map && enc->roi_increment == increment) {
- params->qpDeltaMap = enc->roi_map;
- params->qpDeltaMapSize = (uint32_t)enc->roi_map_size;
- return;
- }
- uint32_t mb_size = 0;
- switch (enc->codec) {
- case CODEC_H264:
- /* H.264 is always 16x16 */
- mb_size = 16;
- break;
- case CODEC_HEVC:
- /* HEVC can be 16x16, 32x32, or 64x64, but NVENC is always 32x32 */
- mb_size = 32;
- break;
- case CODEC_AV1:
- /* AV1 can be 64x64 or 128x128, but NVENC is always 64x64 */
- mb_size = 64;
- break;
- }
- const uint32_t mb_width = (enc->cx + mb_size - 1) / mb_size;
- const uint32_t mb_height = (enc->cy + mb_size - 1) / mb_size;
- const size_t map_size = mb_width * mb_height * sizeof(int8_t);
- if (map_size != enc->roi_map_size) {
- enc->roi_map = brealloc(enc->roi_map, map_size);
- enc->roi_map_size = map_size;
- }
- memset(enc->roi_map, 0, enc->roi_map_size);
- struct roi_params par = {
- .mb_width = mb_width,
- .mb_height = mb_height,
- .mb_size = mb_size,
- .av1 = enc->codec == CODEC_AV1,
- .map = enc->roi_map,
- };
- obs_encoder_enum_roi(enc->encoder, roi_cb, &par);
- enc->roi_increment = increment;
- params->qpDeltaMap = enc->roi_map;
- params->qpDeltaMapSize = (uint32_t)map_size;
- }
- static bool nvenc_encode_shared(struct nvenc_data *enc, struct nv_bitstream *bs,
- void *pic, int64_t pts,
- struct encoder_packet *packet,
- bool *received_packet)
- {
- NV_ENC_PIC_PARAMS params = {0};
- params.version = enc->needs_compat_ver ? NV_ENC_PIC_PARAMS_COMPAT_VER
- : NV_ENC_PIC_PARAMS_VER;
- params.pictureStruct = NV_ENC_PIC_STRUCT_FRAME;
- params.inputBuffer = pic;
- params.inputTimeStamp = (uint64_t)pts;
- params.inputWidth = enc->cx;
- params.inputHeight = enc->cy;
- params.inputPitch = enc->cx;
- params.outputBitstream = bs->ptr;
- if (enc->fallback) {
- params.bufferFmt = enc->surface_format;
- } else {
- params.bufferFmt = obs_p010_tex_active()
- ? NV_ENC_BUFFER_FORMAT_YUV420_10BIT
- : NV_ENC_BUFFER_FORMAT_NV12;
- }
- /* Add ROI map if enabled */
- if (obs_encoder_has_roi(enc->encoder))
- add_roi(enc, ¶ms);
- NVENCSTATUS err = nv.nvEncEncodePicture(enc->session, ¶ms);
- if (err != NV_ENC_SUCCESS && err != NV_ENC_ERR_NEED_MORE_INPUT) {
- nv_failed(enc->encoder, err, __FUNCTION__,
- "nvEncEncodePicture");
- return false;
- }
- enc->encode_started = true;
- enc->buffers_queued++;
- if (++enc->next_bitstream == enc->buf_count) {
- enc->next_bitstream = 0;
- }
- /* ------------------------------------ */
- /* check for encoded packet and parse */
- if (!get_encoded_packet(enc, false)) {
- return false;
- }
- /* ------------------------------------ */
- /* output encoded packet */
- if (enc->packet_data.num) {
- int64_t dts;
- deque_pop_front(&enc->dts_list, &dts, sizeof(dts));
- /* subtract bframe delay from dts */
- dts -= (int64_t)enc->bframes * packet->timebase_num;
- *received_packet = true;
- packet->data = enc->packet_data.array;
- packet->size = enc->packet_data.num;
- packet->type = OBS_ENCODER_VIDEO;
- packet->pts = enc->packet_pts;
- packet->dts = dts;
- packet->keyframe = enc->packet_keyframe;
- } else {
- *received_packet = false;
- }
- return true;
- }
- #ifdef _WIN32
- static bool nvenc_encode_tex(void *data, uint32_t handle, int64_t pts,
- uint64_t lock_key, uint64_t *next_key,
- struct encoder_packet *packet,
- bool *received_packet)
- {
- struct nvenc_data *enc = data;
- ID3D11DeviceContext *context = enc->context;
- ID3D11Texture2D *input_tex;
- ID3D11Texture2D *output_tex;
- IDXGIKeyedMutex *km;
- struct nv_texture *nvtex;
- struct nv_bitstream *bs;
- if (handle == GS_INVALID_HANDLE) {
- error("Encode failed: bad texture handle");
- *next_key = lock_key;
- return false;
- }
- bs = &enc->bitstreams.array[enc->next_bitstream];
- nvtex = &enc->textures.array[enc->next_bitstream];
- input_tex = get_tex_from_handle(enc, handle, &km);
- output_tex = nvtex->tex;
- if (!input_tex) {
- *next_key = lock_key;
- return false;
- }
- deque_push_back(&enc->dts_list, &pts, sizeof(pts));
- /* ------------------------------------ */
- /* copy to output tex */
- km->lpVtbl->AcquireSync(km, lock_key, INFINITE);
- context->lpVtbl->CopyResource(context, (ID3D11Resource *)output_tex,
- (ID3D11Resource *)input_tex);
- km->lpVtbl->ReleaseSync(km, *next_key);
- /* ------------------------------------ */
- /* map output tex so nvenc can use it */
- NV_ENC_MAP_INPUT_RESOURCE map = {NV_ENC_MAP_INPUT_RESOURCE_VER};
- map.registeredResource = nvtex->res;
- if (NV_FAILED(nv.nvEncMapInputResource(enc->session, &map))) {
- return false;
- }
- nvtex->mapped_res = map.mappedResource;
- /* ------------------------------------ */
- /* do actual encode call */
- return nvenc_encode_shared(enc, bs, nvtex->mapped_res, pts, packet,
- received_packet);
- }
- #else
- /* Resolves the CUDA graphics resources for a pair of GL textures (Y and UV
-  * planes), registering them with CUDA the first time the pair is seen.
-  *
-  * enc        encoder state; enc->input_textures caches earlier registrations
-  * tex_id_y   GL texture name of the Y plane, also used as the cache key
-  * tex_id_uv  GL texture name of the UV plane
-  * tex_y      out: CUDA resource for the Y plane
-  * tex_uv     out: CUDA resource for the UV plane
-  *
-  * Returns true when both outputs are valid. On failure nothing is added to
-  * the cache, any registration made by this call has been undone, and the
-  * outputs must not be used.
-  *
-  * NOTE(review): CU_CHECK is defined outside this block; from its use here it
-  * is assumed to set `success = false` and `goto unmap` when the call fails. */
- static inline bool get_res_for_tex_ids(struct nvenc_data *enc, GLuint tex_id_y,
-                                        GLuint tex_id_uv,
-                                        CUgraphicsResource *tex_y,
-                                        CUgraphicsResource *tex_uv)
- {
-     bool success = true;
-     /* Set once the Y registration succeeded, so cleanup knows what to undo. */
-     bool y_registered = false;
-     /* Reuse an existing registration when this Y texture was seen before. */
-     for (size_t idx = 0; idx < enc->input_textures.num; idx++) {
-         struct handle_tex *ht = &enc->input_textures.array[idx];
-         if (ht->tex_id != tex_id_y)
-             continue;
-         *tex_y = ht->res_y;
-         *tex_uv = ht->res_uv;
-         return success;
-     }
-     CU_CHECK(cu->cuGraphicsGLRegisterImage(
-         tex_y, tex_id_y, GL_TEXTURE_2D,
-         CU_GRAPHICS_REGISTER_FLAGS_READ_ONLY))
-     y_registered = true;
-     CU_CHECK(cu->cuGraphicsGLRegisterImage(
-         tex_uv, tex_id_uv, GL_TEXTURE_2D,
-         CU_GRAPHICS_REGISTER_FLAGS_READ_ONLY))
-     /* Remember the pair so later frames take the cached path above. */
-     struct handle_tex ht = {tex_id_y, *tex_y, *tex_uv};
-     da_push_back(enc->input_textures, &ht);
- unmap:
-     /* The UV registration is the last step that can fail, so a failed call
-      * never owns a UV resource; only the Y resource may need releasing. */
-     if (!success && y_registered)
-         cu->cuGraphicsUnregisterResource(*tex_y);
-     return success;
- }
- /* Copies the Y and UV planes of a GL texture pair into a CUDA surface.
-  *
-  * enc   encoder state; enc->cx / enc->cy give the copy dimensions
-  * p010  when true, each row is copied as enc->cx * 2 bytes
-  * tex   GL texture names: tex[0] is the Y plane, tex[1] the UV plane
-  * surf  destination; surf->tex receives Y at row 0 and UV at row enc->cy
-  *
-  * Returns false if the resources cannot be resolved or a CUDA call fails. */
- static inline bool copy_tex_cuda(struct nvenc_data *enc, const bool p010,
-                                  GLuint tex[2], struct nv_cuda_surface *surf)
- {
-     bool success = true;
-     CUgraphicsResource mapped_tex[2] = {0};
-     CUarray mapped_cuda;
-     CUDA_MEMCPY2D m = {0};
-     /* Describe the parts of the copy that are the same for both planes. */
-     m.srcMemoryType = CU_MEMORYTYPE_ARRAY;
-     m.dstMemoryType = CU_MEMORYTYPE_ARRAY;
-     m.dstArray = surf->tex;
-     m.Height = enc->cy;
-     if (p010)
-         m.WidthInBytes = enc->cx * 2;
-     else
-         m.WidthInBytes = enc->cx;
-     if (!get_res_for_tex_ids(enc, tex[0], tex[1], &mapped_tex[0],
-                              &mapped_tex[1])) {
-         return false;
-     }
-     CU_CHECK(cu->cuGraphicsMapResources(2, mapped_tex, 0))
-     /* Y plane: full height, written at the top of the surface. */
-     CU_CHECK(cu->cuGraphicsSubResourceGetMappedArray(&mapped_cuda,
-                                                      mapped_tex[0], 0, 0))
-     m.srcArray = mapped_cuda;
-     CU_CHECK(cu->cuMemcpy2D(&m))
-     /* UV plane: half height, written directly below the Y plane. */
-     CU_CHECK(cu->cuGraphicsSubResourceGetMappedArray(&mapped_cuda,
-                                                      mapped_tex[1], 0, 0))
-     m.srcArray = mapped_cuda;
-     m.Height = enc->cy / 2;
-     m.dstY += enc->cy;
-     CU_CHECK(cu->cuMemcpy2D(&m))
- unmap:
-     cu->cuGraphicsUnmapResources(2, mapped_tex, 0);
-     return success;
- }
- /* Texture encode callback (non-Windows build): copies the GL texture planes
-  * into a CUDA surface, maps that surface for NVENC and submits the frame.
-  *
-  * data             struct nvenc_data * for this encoder
-  * tex              input texture; tex->tex[0] and tex->tex[1] are both read
-  * pts              timestamp, queued on enc->dts_list and passed to the encode
-  * lock_key         written back to *next_key when the texture is rejected
-  * next_key         out: only written on the bad-texture path
-  * packet           forwarded to nvenc_encode_shared
-  * received_packet  forwarded to nvenc_encode_shared
-  *
-  * Returns false on a bad texture, a failed CUDA copy or a failed NVENC map;
-  * otherwise returns the result of nvenc_encode_shared. */
- static bool nvenc_encode_tex2(void *data, struct encoder_texture *tex,
-                               int64_t pts, uint64_t lock_key,
-                               uint64_t *next_key, struct encoder_packet *packet,
-                               bool *received_packet)
- {
-     struct nvenc_data *enc = data;
-     struct nv_cuda_surface *surf;
-     struct nv_bitstream *bs;
-     const bool p010 = obs_p010_tex_active();
-     GLuint input_tex[2];
-     /* Both planes are dereferenced below, so reject the frame when either
-      * one is missing instead of reading through a NULL object pointer. */
-     if (tex == NULL || tex->tex[0] == NULL || tex->tex[1] == NULL) {
-         error("Encode failed: bad texture handle");
-         *next_key = lock_key;
-         return false;
-     }
-     bs = &enc->bitstreams.array[enc->next_bitstream];
-     surf = &enc->surfaces.array[enc->next_bitstream];
-     deque_push_back(&enc->dts_list, &pts, sizeof(pts));
-     /* ------------------------------------ */
-     /* copy to CUDA data */
-     CU_FAILED(cu->cuCtxPushCurrent(enc->cu_ctx))
-     obs_enter_graphics();
-     input_tex[0] = *(GLuint *)gs_texture_get_obj(tex->tex[0]);
-     input_tex[1] = *(GLuint *)gs_texture_get_obj(tex->tex[1]);
-     bool success = copy_tex_cuda(enc, p010, input_tex, surf);
-     obs_leave_graphics();
-     /* Pop the context before looking at the copy result so that a failed
-      * copy does not leave it pushed. */
-     CU_FAILED(cu->cuCtxPopCurrent(NULL))
-     if (!success)
-         return false;
-     /* ------------------------------------ */
-     /* map output tex so nvenc can use it */
-     NV_ENC_MAP_INPUT_RESOURCE map = {NV_ENC_MAP_INPUT_RESOURCE_VER};
-     map.registeredResource = surf->res;
-     map.mappedBufferFmt = p010 ? NV_ENC_BUFFER_FORMAT_YUV420_10BIT
-                                : NV_ENC_BUFFER_FORMAT_NV12;
-     if (NV_FAILED(nv.nvEncMapInputResource(enc->session, &map)))
-         return false;
-     surf->mapped_res = map.mappedResource;
-     /* ------------------------------------ */
-     /* do actual encode call */
-     return nvenc_encode_shared(enc, bs, surf->mapped_res, pts, packet,
-                                received_packet);
- }
- #endif
- /* Uploads a system-memory frame into a CUDA surface, plane by plane.
-  *
-  * enc    encoder state; enc->cx / enc->cy give the frame size and
-  *        enc->surface_format selects the plane layout
-  * frame  source planes (frame->data[]) and their strides (frame->linesize[])
-  * surf   destination; planes are stacked vertically in surf->tex
-  *
-  * Layout by surface format:
-  *   NV12               2 planes, second plane half height
-  *   YUV420_10BIT       2 planes, second plane half height, rows are
-  *                      twice as wide in bytes (16 bit per sample)
-  *   anything else      handled as I444: 3 full-height planes
-  *
-  * Returns true when every plane was copied. All failures after the context
-  * push go through the `unmap` cleanup, so host registrations made here are
-  * released and the CUDA context is popped on every path.
-  *
-  * NOTE(review): CU_CHECK / CU_FAILED are defined outside this block. From
-  * their use, CU_CHECK is assumed to set `success = false` and `goto unmap`,
-  * and CU_FAILED to return early; the copies therefore use CU_CHECK so a
-  * failed cuMemcpy2D cannot skip the cleanup. */
- static inline bool nvenc_copy_frame(struct nvenc_data *enc,
-                                     struct encoder_frame *frame,
-                                     struct nv_cuda_surface *surf)
- {
-     bool success = true;
-     const size_t height = enc->cy;
-     const size_t width = enc->cx;
-     const bool p010 =
-         enc->surface_format == NV_ENC_BUFFER_FORMAT_YUV420_10BIT;
-     const bool subsampled =
-         p010 || enc->surface_format == NV_ENC_BUFFER_FORMAT_NV12;
-     const size_t num_planes = subsampled ? 2 : 3;
-     /* Planes page-locked by this call; only these are unregistered. */
-     bool registered[3] = {false, false, false};
-     CUDA_MEMCPY2D m = {0};
-     m.srcMemoryType = CU_MEMORYTYPE_HOST;
-     m.dstMemoryType = CU_MEMORYTYPE_ARRAY;
-     m.dstArray = surf->tex;
-     // P010 lines are double the size (16 bit per pixel)
-     m.WidthInBytes = p010 ? width * 2 : width;
-     CU_FAILED(cu->cuCtxPushCurrent(enc->cu_ctx))
-     /* Page-locks the host memory so that it can be DMAd directly
-      * rather than CUDA doing an internal copy to page-locked
-      * memory before actually DMA-ing to the GPU. */
-     for (size_t plane = 0; plane < num_planes; plane++) {
-         size_t plane_bytes = frame->linesize[plane] * height;
-         if (subsampled && plane == 1)
-             plane_bytes /= 2;
-         CU_CHECK(cu->cuMemHostRegister(frame->data[plane], plane_bytes,
-                                        0))
-         registered[plane] = true;
-     }
-     /* Copy each plane below the previous one in the destination array. */
-     for (size_t plane = 0; plane < num_planes; plane++) {
-         m.srcPitch = frame->linesize[plane];
-         m.srcHost = frame->data[plane];
-         m.dstY = plane * height;
-         m.Height = (subsampled && plane == 1) ? height / 2 : height;
-         CU_CHECK(cu->cuMemcpy2D(&m))
-     }
- unmap:
-     for (size_t plane = 0; plane < 3; plane++) {
-         if (registered[plane])
-             cu->cuMemHostUnregister(frame->data[plane]);
-     }
-     CU_FAILED(cu->cuCtxPopCurrent(NULL))
-     return success;
- }
- /* Frame encode callback for the system-memory ("soft") encoders.
-  *
-  * Queues frame->pts on enc->dts_list, uploads the frame into the CUDA surface
-  * selected by enc->next_bitstream, maps that surface for NVENC and hands it
-  * to nvenc_encode_shared.
-  *
-  * Returns false when the upload or the NVENC map fails; otherwise the result
-  * of nvenc_encode_shared. */
- static bool nvenc_encode_soft(void *data, struct encoder_frame *frame,
-                               struct encoder_packet *packet,
-                               bool *received_packet)
- {
-     struct nvenc_data *enc = data;
-     struct nv_bitstream *bs = &enc->bitstreams.array[enc->next_bitstream];
-     struct nv_cuda_surface *surf =
-         &enc->surfaces.array[enc->next_bitstream];
-     NV_ENC_MAP_INPUT_RESOURCE map = {NV_ENC_MAP_INPUT_RESOURCE_VER};
-     deque_push_back(&enc->dts_list, &frame->pts, sizeof(frame->pts));
-     /* Step 1: copy the frame into the CUDA surface. */
-     const bool uploaded = nvenc_copy_frame(enc, frame, surf);
-     if (!uploaded) {
-         return false;
-     }
-     /* Step 2: map the surface so NVENC can read from it. */
-     map.mappedBufferFmt = enc->surface_format;
-     map.registeredResource = surf->res;
-     if (NV_FAILED(nv.nvEncMapInputResource(enc->session, &map))) {
-         return false;
-     }
-     surf->mapped_res = map.mappedResource;
-     /* Step 3: submit the mapped surface for encoding. */
-     return nvenc_encode_shared(enc, bs, surf->mapped_res, frame->pts,
-                                packet, received_packet);
- }
- /* Writes the encoder's input format (enc->in_format) into info->format. */
- static void nvenc_soft_video_info(void *data, struct video_scale_info *info)
- {
-     const struct nvenc_data *enc = data;
-     info->format = enc->in_format;
- }
- extern void h264_nvenc_defaults(obs_data_t *settings); /* .get_defaults of the H.264 encoder infos below */
- extern obs_properties_t *h264_nvenc_properties(void *unused); /* .get_properties of the H.264 encoder infos below */
- #ifdef ENABLE_HEVC
- extern void hevc_nvenc_defaults(obs_data_t *settings); /* .get_defaults of the HEVC encoder infos below */
- extern obs_properties_t *hevc_nvenc_properties(void *unused); /* .get_properties of the HEVC encoder infos below */
- #endif
- extern obs_properties_t *av1_nvenc_properties(void *unused); /* .get_properties of the AV1 encoder infos below */
- extern void av1_nvenc_defaults(obs_data_t *settings); /* .get_defaults of the AV1 encoder infos below */
- /* Hands out the encoder's stored header blob.
-  *
-  * On success *header and *size are set from enc->header / enc->header_size
-  * and true is returned. When no header is stored the outputs are left
-  * untouched and false is returned. */
- static bool nvenc_extra_data(void *data, uint8_t **header, size_t *size)
- {
-     struct nvenc_data *enc = data;
-     if (enc->header) {
-         *header = enc->header;
-         *size = enc->header_size;
-         return true;
-     }
-     return false;
- }
- /* Hands out the encoder's stored SEI blob.
-  *
-  * On success *sei and *size are set from enc->sei / enc->sei_size and true
-  * is returned. When no SEI data is stored the outputs are left untouched
-  * and false is returned. */
- static bool nvenc_sei_data(void *data, uint8_t **sei, size_t *size)
- {
-     struct nvenc_data *enc = data;
-     if (enc->sei) {
-         *sei = enc->sei;
-         *size = enc->sei_size;
-         return true;
-     }
-     return false;
- }
- /* Encoder description for the texture-input H.264 NVENC encoder. */
- struct obs_encoder_info h264_nvenc_info = {
-     /* identity and capabilities */
-     .id = "jim_nvenc",
-     .type = OBS_ENCODER_VIDEO,
-     .codec = "h264",
-     .caps = OBS_ENCODER_CAP_PASS_TEXTURE | OBS_ENCODER_CAP_DYN_BITRATE |
-             OBS_ENCODER_CAP_ROI,
-     /* lifecycle */
-     .get_name = h264_nvenc_get_name,
-     .create = h264_nvenc_create,
-     .update = nvenc_update,
-     .destroy = nvenc_destroy,
-     /* settings */
-     .get_defaults = h264_nvenc_defaults,
-     .get_properties = h264_nvenc_properties,
-     /* encode entry point: differs per platform */
- #ifdef _WIN32
-     .encode_texture = nvenc_encode_tex,
- #else
-     .encode_texture2 = nvenc_encode_tex2,
- #endif
-     /* out-of-band stream data */
-     .get_extra_data = nvenc_extra_data,
-     .get_sei_data = nvenc_sei_data,
- };
- #ifdef ENABLE_HEVC
- /* Encoder description for the texture-input HEVC NVENC encoder; only built
-  * when ENABLE_HEVC is defined. */
- struct obs_encoder_info hevc_nvenc_info = {
-     /* identity and capabilities */
-     .id = "jim_hevc_nvenc",
-     .type = OBS_ENCODER_VIDEO,
-     .codec = "hevc",
-     .caps = OBS_ENCODER_CAP_PASS_TEXTURE | OBS_ENCODER_CAP_DYN_BITRATE |
-             OBS_ENCODER_CAP_ROI,
-     /* lifecycle */
-     .get_name = hevc_nvenc_get_name,
-     .create = hevc_nvenc_create,
-     .update = nvenc_update,
-     .destroy = nvenc_destroy,
-     /* settings */
-     .get_defaults = hevc_nvenc_defaults,
-     .get_properties = hevc_nvenc_properties,
-     /* encode entry point: differs per platform */
- #ifdef _WIN32
-     .encode_texture = nvenc_encode_tex,
- #else
-     .encode_texture2 = nvenc_encode_tex2,
- #endif
-     /* out-of-band stream data */
-     .get_extra_data = nvenc_extra_data,
-     .get_sei_data = nvenc_sei_data,
- };
- #endif
- /* Encoder description for the texture-input AV1 NVENC encoder. Unlike the
-  * H.264 / HEVC descriptions it sets no .get_sei_data callback. */
- struct obs_encoder_info av1_nvenc_info = {
-     /* identity and capabilities */
-     .id = "jim_av1_nvenc",
-     .type = OBS_ENCODER_VIDEO,
-     .codec = "av1",
-     .caps = OBS_ENCODER_CAP_PASS_TEXTURE | OBS_ENCODER_CAP_DYN_BITRATE |
-             OBS_ENCODER_CAP_ROI,
-     /* lifecycle */
-     .get_name = av1_nvenc_get_name,
-     .create = av1_nvenc_create,
-     .update = nvenc_update,
-     .destroy = nvenc_destroy,
-     /* settings */
-     .get_defaults = av1_nvenc_defaults,
-     .get_properties = av1_nvenc_properties,
-     /* encode entry point: differs per platform */
- #ifdef _WIN32
-     .encode_texture = nvenc_encode_tex,
- #else
-     .encode_texture2 = nvenc_encode_tex2,
- #endif
-     /* out-of-band stream data */
-     .get_extra_data = nvenc_extra_data,
- };
- /* Encoder description for the system-memory (CUDA upload) H.264 NVENC
-  * encoder; flagged OBS_ENCODER_CAP_INTERNAL. */
- struct obs_encoder_info h264_nvenc_soft_info = {
-     /* identity and capabilities */
-     .id = "obs_nvenc_h264_cuda",
-     .type = OBS_ENCODER_VIDEO,
-     .codec = "h264",
-     .caps = OBS_ENCODER_CAP_DYN_BITRATE | OBS_ENCODER_CAP_ROI |
-             OBS_ENCODER_CAP_INTERNAL,
-     /* lifecycle */
-     .get_name = h264_nvenc_soft_get_name,
-     .create = h264_nvenc_soft_create,
-     .update = nvenc_update,
-     .destroy = nvenc_destroy,
-     /* settings */
-     .get_defaults = h264_nvenc_defaults,
-     .get_properties = h264_nvenc_properties,
-     /* encode entry point and input format query */
-     .encode = nvenc_encode_soft,
-     .get_video_info = nvenc_soft_video_info,
-     /* out-of-band stream data */
-     .get_extra_data = nvenc_extra_data,
-     .get_sei_data = nvenc_sei_data,
- };
- #ifdef ENABLE_HEVC
- /* Encoder description for the system-memory (CUDA upload) HEVC NVENC
-  * encoder; only built when ENABLE_HEVC is defined. */
- struct obs_encoder_info hevc_nvenc_soft_info = {
-     /* identity and capabilities */
-     .id = "obs_nvenc_hevc_cuda",
-     .type = OBS_ENCODER_VIDEO,
-     .codec = "hevc",
-     .caps = OBS_ENCODER_CAP_DYN_BITRATE | OBS_ENCODER_CAP_ROI |
-             OBS_ENCODER_CAP_INTERNAL,
-     /* lifecycle */
-     .get_name = hevc_nvenc_soft_get_name,
-     .create = hevc_nvenc_soft_create,
-     .update = nvenc_update,
-     .destroy = nvenc_destroy,
-     /* settings */
-     .get_defaults = hevc_nvenc_defaults,
-     .get_properties = hevc_nvenc_properties,
-     /* encode entry point and input format query */
-     .encode = nvenc_encode_soft,
-     .get_video_info = nvenc_soft_video_info,
-     /* out-of-band stream data */
-     .get_extra_data = nvenc_extra_data,
-     .get_sei_data = nvenc_sei_data,
- };
- #endif
- /* Encoder description for the system-memory (CUDA upload) AV1 NVENC
-  * encoder. Unlike the H.264 / HEVC descriptions it sets no .get_sei_data
-  * callback. */
- struct obs_encoder_info av1_nvenc_soft_info = {
-     /* identity and capabilities */
-     .id = "obs_nvenc_av1_cuda",
-     .type = OBS_ENCODER_VIDEO,
-     .codec = "av1",
-     .caps = OBS_ENCODER_CAP_DYN_BITRATE | OBS_ENCODER_CAP_ROI |
-             OBS_ENCODER_CAP_INTERNAL,
-     /* lifecycle */
-     .get_name = av1_nvenc_soft_get_name,
-     .create = av1_nvenc_soft_create,
-     .update = nvenc_update,
-     .destroy = nvenc_destroy,
-     /* settings */
-     .get_defaults = av1_nvenc_defaults,
-     .get_properties = av1_nvenc_properties,
-     /* encode entry point and input format query */
-     .encode = nvenc_encode_soft,
-     .get_video_info = nvenc_soft_video_info,
-     /* out-of-band stream data */
-     .get_extra_data = nvenc_extra_data,
- };
|