ffmpeg-decode.c 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432
  1. /******************************************************************************
  2. Copyright (C) 2023 by Lain Bailey <[email protected]>
  3. This program is free software: you can redistribute it and/or modify
  4. it under the terms of the GNU General Public License as published by
  5. the Free Software Foundation, either version 2 of the License, or
  6. (at your option) any later version.
  7. This program is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU General Public License for more details.
  11. You should have received a copy of the GNU General Public License
  12. along with this program. If not, see <http://www.gnu.org/licenses/>.
  13. ******************************************************************************/
  14. #include "ffmpeg-decode.h"
  15. #include "obs-ffmpeg-compat.h"
  16. #include <obs-avc.h>
  17. #ifdef ENABLE_HEVC
  18. #include <obs-hevc.h>
  19. #endif
  20. enum AVHWDeviceType hw_priority[] = {
  21. AV_HWDEVICE_TYPE_D3D11VA,
  22. AV_HWDEVICE_TYPE_DXVA2,
  23. AV_HWDEVICE_TYPE_QSV,
  24. AV_HWDEVICE_TYPE_NONE,
  25. };
  26. static bool has_hw_type(const AVCodec *c, enum AVHWDeviceType type)
  27. {
  28. for (int i = 0;; i++) {
  29. const AVCodecHWConfig *config = avcodec_get_hw_config(c, i);
  30. if (!config) {
  31. break;
  32. }
  33. if (config->methods & AV_CODEC_HW_CONFIG_METHOD_HW_DEVICE_CTX &&
  34. config->device_type == type)
  35. return true;
  36. }
  37. return false;
  38. }
  39. static void init_hw_decoder(struct ffmpeg_decode *d)
  40. {
  41. enum AVHWDeviceType *priority = hw_priority;
  42. AVBufferRef *hw_ctx = NULL;
  43. while (*priority != AV_HWDEVICE_TYPE_NONE) {
  44. if (has_hw_type(d->codec, *priority)) {
  45. int ret = av_hwdevice_ctx_create(&hw_ctx, *priority,
  46. NULL, NULL, 0);
  47. if (ret == 0)
  48. break;
  49. }
  50. priority++;
  51. }
  52. if (hw_ctx) {
  53. d->hw_device_ctx = hw_ctx;
  54. d->decoder->hw_device_ctx = av_buffer_ref(hw_ctx);
  55. d->hw = true;
  56. }
  57. }
  58. int ffmpeg_decode_init(struct ffmpeg_decode *decode, enum AVCodecID id,
  59. bool use_hw)
  60. {
  61. int ret;
  62. memset(decode, 0, sizeof(*decode));
  63. decode->codec = avcodec_find_decoder(id);
  64. if (!decode->codec)
  65. return -1;
  66. decode->decoder = avcodec_alloc_context3(decode->codec);
  67. decode->decoder->thread_count = 0;
  68. if (use_hw)
  69. init_hw_decoder(decode);
  70. ret = avcodec_open2(decode->decoder, decode->codec, NULL);
  71. if (ret < 0) {
  72. ffmpeg_decode_free(decode);
  73. return ret;
  74. }
  75. return 0;
  76. }
  77. void ffmpeg_decode_free(struct ffmpeg_decode *decode)
  78. {
  79. if (decode->hw_frame)
  80. av_frame_free(&decode->hw_frame);
  81. if (decode->decoder)
  82. avcodec_free_context(&decode->decoder);
  83. if (decode->frame)
  84. av_frame_free(&decode->frame);
  85. if (decode->hw_device_ctx)
  86. av_buffer_unref(&decode->hw_device_ctx);
  87. if (decode->packet_buffer)
  88. bfree(decode->packet_buffer);
  89. memset(decode, 0, sizeof(*decode));
  90. }
  91. static inline enum video_format convert_pixel_format(int f)
  92. {
  93. switch (f) {
  94. case AV_PIX_FMT_NONE:
  95. return VIDEO_FORMAT_NONE;
  96. case AV_PIX_FMT_GRAY8:
  97. return VIDEO_FORMAT_Y800;
  98. case AV_PIX_FMT_YUV420P:
  99. case AV_PIX_FMT_YUVJ420P:
  100. return VIDEO_FORMAT_I420;
  101. case AV_PIX_FMT_NV12:
  102. return VIDEO_FORMAT_NV12;
  103. case AV_PIX_FMT_YUYV422:
  104. return VIDEO_FORMAT_YUY2;
  105. case AV_PIX_FMT_YVYU422:
  106. return VIDEO_FORMAT_YVYU;
  107. case AV_PIX_FMT_UYVY422:
  108. return VIDEO_FORMAT_UYVY;
  109. case AV_PIX_FMT_YUV422P:
  110. case AV_PIX_FMT_YUVJ422P:
  111. return VIDEO_FORMAT_I422;
  112. case AV_PIX_FMT_RGBA:
  113. return VIDEO_FORMAT_RGBA;
  114. case AV_PIX_FMT_BGRA:
  115. return VIDEO_FORMAT_BGRA;
  116. case AV_PIX_FMT_YUV420P10LE:
  117. return VIDEO_FORMAT_I010;
  118. case AV_PIX_FMT_BGR0:
  119. return VIDEO_FORMAT_BGRX;
  120. case AV_PIX_FMT_P010LE:
  121. return VIDEO_FORMAT_P010;
  122. default:;
  123. }
  124. return VIDEO_FORMAT_NONE;
  125. }
  126. static inline enum audio_format convert_sample_format(int f)
  127. {
  128. switch (f) {
  129. case AV_SAMPLE_FMT_U8:
  130. return AUDIO_FORMAT_U8BIT;
  131. case AV_SAMPLE_FMT_S16:
  132. return AUDIO_FORMAT_16BIT;
  133. case AV_SAMPLE_FMT_S32:
  134. return AUDIO_FORMAT_32BIT;
  135. case AV_SAMPLE_FMT_FLT:
  136. return AUDIO_FORMAT_FLOAT;
  137. case AV_SAMPLE_FMT_U8P:
  138. return AUDIO_FORMAT_U8BIT_PLANAR;
  139. case AV_SAMPLE_FMT_S16P:
  140. return AUDIO_FORMAT_16BIT_PLANAR;
  141. case AV_SAMPLE_FMT_S32P:
  142. return AUDIO_FORMAT_32BIT_PLANAR;
  143. case AV_SAMPLE_FMT_FLTP:
  144. return AUDIO_FORMAT_FLOAT_PLANAR;
  145. default:;
  146. }
  147. return AUDIO_FORMAT_UNKNOWN;
  148. }
  149. static inline enum speaker_layout convert_speaker_layout(uint8_t channels)
  150. {
  151. switch (channels) {
  152. case 0:
  153. return SPEAKERS_UNKNOWN;
  154. case 1:
  155. return SPEAKERS_MONO;
  156. case 2:
  157. return SPEAKERS_STEREO;
  158. case 3:
  159. return SPEAKERS_2POINT1;
  160. case 4:
  161. return SPEAKERS_4POINT0;
  162. case 5:
  163. return SPEAKERS_4POINT1;
  164. case 6:
  165. return SPEAKERS_5POINT1;
  166. case 8:
  167. return SPEAKERS_7POINT1;
  168. default:
  169. return SPEAKERS_UNKNOWN;
  170. }
  171. }
  172. static inline void copy_data(struct ffmpeg_decode *decode, uint8_t *data,
  173. size_t size)
  174. {
  175. size_t new_size = size + INPUT_BUFFER_PADDING_SIZE;
  176. if (decode->packet_size < new_size) {
  177. decode->packet_buffer =
  178. brealloc(decode->packet_buffer, new_size);
  179. decode->packet_size = new_size;
  180. }
  181. memset(decode->packet_buffer + size, 0, INPUT_BUFFER_PADDING_SIZE);
  182. memcpy(decode->packet_buffer, data, size);
  183. }
  184. bool ffmpeg_decode_audio(struct ffmpeg_decode *decode, uint8_t *data,
  185. size_t size, struct obs_source_audio *audio,
  186. bool *got_output)
  187. {
  188. int got_frame = false;
  189. int ret = 0;
  190. *got_output = false;
  191. copy_data(decode, data, size);
  192. if (!decode->frame) {
  193. decode->frame = av_frame_alloc();
  194. if (!decode->frame)
  195. return false;
  196. }
  197. if (data && size) {
  198. AVPacket *packet = av_packet_alloc();
  199. packet->data = decode->packet_buffer;
  200. packet->size = (int)size;
  201. ret = avcodec_send_packet(decode->decoder, packet);
  202. av_packet_free(&packet);
  203. }
  204. if (ret == 0)
  205. ret = avcodec_receive_frame(decode->decoder, decode->frame);
  206. got_frame = (ret == 0);
  207. if (ret == AVERROR_EOF || ret == AVERROR(EAGAIN))
  208. ret = 0;
  209. if (ret < 0)
  210. return false;
  211. else if (!got_frame)
  212. return true;
  213. for (size_t i = 0; i < MAX_AV_PLANES; i++)
  214. audio->data[i] = decode->frame->data[i];
  215. audio->samples_per_sec = decode->frame->sample_rate;
  216. audio->format = convert_sample_format(decode->frame->format);
  217. audio->speakers = convert_speaker_layout(
  218. (uint8_t)decode->decoder->ch_layout.nb_channels);
  219. audio->frames = decode->frame->nb_samples;
  220. if (audio->format == AUDIO_FORMAT_UNKNOWN)
  221. return false;
  222. *got_output = true;
  223. return true;
  224. }
  225. static enum video_colorspace
  226. convert_color_space(enum AVColorSpace s, enum AVColorTransferCharacteristic trc,
  227. enum AVColorPrimaries color_primaries)
  228. {
  229. switch (s) {
  230. case AVCOL_SPC_BT709:
  231. return (trc == AVCOL_TRC_IEC61966_2_1) ? VIDEO_CS_SRGB
  232. : VIDEO_CS_709;
  233. case AVCOL_SPC_FCC:
  234. case AVCOL_SPC_BT470BG:
  235. case AVCOL_SPC_SMPTE170M:
  236. case AVCOL_SPC_SMPTE240M:
  237. return VIDEO_CS_601;
  238. case AVCOL_SPC_BT2020_NCL:
  239. return (trc == AVCOL_TRC_ARIB_STD_B67) ? VIDEO_CS_2100_HLG
  240. : VIDEO_CS_2100_PQ;
  241. default:
  242. return (color_primaries == AVCOL_PRI_BT2020)
  243. ? ((trc == AVCOL_TRC_ARIB_STD_B67)
  244. ? VIDEO_CS_2100_HLG
  245. : VIDEO_CS_2100_PQ)
  246. : VIDEO_CS_DEFAULT;
  247. }
  248. }
  249. bool ffmpeg_decode_video(struct ffmpeg_decode *decode, uint8_t *data,
  250. size_t size, long long *ts, enum video_colorspace cs,
  251. enum video_range_type range,
  252. struct obs_source_frame2 *frame, bool *got_output)
  253. {
  254. int got_frame = false;
  255. AVFrame *out_frame;
  256. int ret;
  257. *got_output = false;
  258. copy_data(decode, data, size);
  259. if (!decode->frame) {
  260. decode->frame = av_frame_alloc();
  261. if (!decode->frame)
  262. return false;
  263. if (decode->hw && !decode->hw_frame) {
  264. decode->hw_frame = av_frame_alloc();
  265. if (!decode->hw_frame)
  266. return false;
  267. }
  268. }
  269. out_frame = decode->hw ? decode->hw_frame : decode->frame;
  270. AVPacket *packet = av_packet_alloc();
  271. packet->data = decode->packet_buffer;
  272. packet->size = (int)size;
  273. packet->pts = *ts;
  274. switch (decode->codec->id) {
  275. case AV_CODEC_ID_H264:
  276. if (obs_avc_keyframe(data, size))
  277. packet->flags |= AV_PKT_FLAG_KEY;
  278. #ifdef ENABLE_HEVC
  279. break;
  280. case AV_CODEC_ID_HEVC:
  281. if (obs_hevc_keyframe(data, size))
  282. packet->flags |= AV_PKT_FLAG_KEY;
  283. #endif
  284. }
  285. ret = avcodec_send_packet(decode->decoder, packet);
  286. if (ret == 0) {
  287. ret = avcodec_receive_frame(decode->decoder, out_frame);
  288. }
  289. av_packet_free(&packet);
  290. got_frame = (ret == 0);
  291. if (ret == AVERROR_EOF || ret == AVERROR(EAGAIN))
  292. ret = 0;
  293. if (ret < 0)
  294. return false;
  295. else if (!got_frame)
  296. return true;
  297. if (got_frame && decode->hw) {
  298. ret = av_hwframe_transfer_data(decode->frame, out_frame, 0);
  299. if (ret < 0) {
  300. return false;
  301. }
  302. }
  303. for (size_t i = 0; i < MAX_AV_PLANES; i++) {
  304. frame->data[i] = decode->frame->data[i];
  305. frame->linesize[i] = decode->frame->linesize[i];
  306. }
  307. const enum video_format format =
  308. convert_pixel_format(decode->frame->format);
  309. frame->format = format;
  310. if (range == VIDEO_RANGE_DEFAULT) {
  311. range = (decode->frame->color_range == AVCOL_RANGE_JPEG)
  312. ? VIDEO_RANGE_FULL
  313. : VIDEO_RANGE_PARTIAL;
  314. }
  315. if (cs == VIDEO_CS_DEFAULT) {
  316. cs = convert_color_space(decode->frame->colorspace,
  317. decode->frame->color_trc,
  318. decode->frame->color_primaries);
  319. }
  320. const bool success = video_format_get_parameters_for_format(
  321. cs, range, format, frame->color_matrix, frame->color_range_min,
  322. frame->color_range_max);
  323. if (!success) {
  324. blog(LOG_ERROR,
  325. "Failed to get video format "
  326. "parameters for video format %u",
  327. cs);
  328. return false;
  329. }
  330. frame->range = range;
  331. *ts = decode->frame->pts;
  332. frame->width = decode->frame->width;
  333. frame->height = decode->frame->height;
  334. frame->flip = false;
  335. switch (decode->frame->color_trc) {
  336. case AVCOL_TRC_BT709:
  337. case AVCOL_TRC_GAMMA22:
  338. case AVCOL_TRC_GAMMA28:
  339. case AVCOL_TRC_SMPTE170M:
  340. case AVCOL_TRC_SMPTE240M:
  341. case AVCOL_TRC_IEC61966_2_1:
  342. frame->trc = VIDEO_TRC_SRGB;
  343. break;
  344. case AVCOL_TRC_SMPTE2084:
  345. frame->trc = VIDEO_TRC_PQ;
  346. break;
  347. case AVCOL_TRC_ARIB_STD_B67:
  348. frame->trc = VIDEO_TRC_HLG;
  349. break;
  350. default:
  351. frame->trc = VIDEO_TRC_DEFAULT;
  352. }
  353. if (frame->format == VIDEO_FORMAT_NONE)
  354. return false;
  355. *got_output = true;
  356. return true;
  357. }