obs-ffmpeg-audio-encoders.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549
  1. /******************************************************************************
  2. Copyright (C) 2023 by Lain Bailey <lain@obsproject.com>
  3. This program is free software: you can redistribute it and/or modify
  4. it under the terms of the GNU General Public License as published by
  5. the Free Software Foundation, either version 2 of the License, or
  6. (at your option) any later version.
  7. This program is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU General Public License for more details.
  11. You should have received a copy of the GNU General Public License
  12. along with this program. If not, see <http://www.gnu.org/licenses/>.
  13. ******************************************************************************/
  14. #include <util/base.h>
  15. #include <util/deque.h>
  16. #include <util/darray.h>
  17. #include <util/dstr.h>
  18. #include <obs-module.h>
  19. #include <libavutil/channel_layout.h>
  20. #include <libavformat/avformat.h>
  21. #include "obs-ffmpeg-formats.h"
  22. #include "obs-ffmpeg-compat.h"
  /*
   * Logging helpers.
   *
   * do_log() forwards to blog() and prepends "[FFmpeg <type> encoder: '<name>']"
   * to the message, reading both values from a variable named `enc`. Every
   * call site must therefore have a `struct enc_encoder *enc` in scope.
   * warn(), info() and debug() fix the log level.
   */
  #define do_log(level, format, ...)                                  \
      blog(level, "[FFmpeg %s encoder: '%s'] " format, enc->type, \
           obs_encoder_get_name(enc->encoder), ##__VA_ARGS__)

  #define warn(format, ...) do_log(LOG_WARNING, format, ##__VA_ARGS__)
  #define info(format, ...) do_log(LOG_INFO, format, ##__VA_ARGS__)
  #define debug(format, ...) do_log(LOG_DEBUG, format, ##__VA_ARGS__)
  28. struct enc_encoder {
  29. obs_encoder_t *encoder;
  30. const char *type;
  31. const AVCodec *codec;
  32. AVCodecContext *context;
  33. uint8_t *samples[MAX_AV_PLANES];
  34. AVFrame *aframe;
  35. int64_t total_samples;
  36. DARRAY(uint8_t) packet_buffer;
  37. size_t audio_planes;
  38. size_t audio_size;
  39. int frame_size; /* pretty much always 1024 for AAC */
  40. int frame_size_bytes;
  41. };
  /* .get_name callback for the AAC encoder: returns the module text stored
   * under the "FFmpegAAC" key. The argument is ignored. */
  static const char *aac_getname(void *unused)
  {
      const char *label = obs_module_text("FFmpegAAC");

      UNUSED_PARAMETER(unused);
      return label;
  }
  /* .get_name callback for the Opus encoder: returns the module text stored
   * under the "FFmpegOpus" key. The argument is ignored. */
  static const char *opus_getname(void *unused)
  {
      const char *label = obs_module_text("FFmpegOpus");

      UNUSED_PARAMETER(unused);
      return label;
  }
  /* .get_name callback for the 16-bit PCM encoder: returns the module text
   * stored under the "FFmpegPCM16Bit" key. The argument is ignored. */
  static const char *pcm_getname(void *unused)
  {
      const char *label = obs_module_text("FFmpegPCM16Bit");

      UNUSED_PARAMETER(unused);
      return label;
  }
  /* .get_name callback for the 24-bit PCM encoder: returns the module text
   * stored under the "FFmpegPCM24Bit" key. The argument is ignored. */
  static const char *pcm24_getname(void *unused)
  {
      const char *label = obs_module_text("FFmpegPCM24Bit");

      UNUSED_PARAMETER(unused);
      return label;
  }
  /* .get_name callback for the 32-bit float PCM encoder: returns the module
   * text stored under the "FFmpegPCM32BitFloat" key. The argument is ignored. */
  static const char *pcm32_getname(void *unused)
  {
      const char *label = obs_module_text("FFmpegPCM32BitFloat");

      UNUSED_PARAMETER(unused);
      return label;
  }
  /* .get_name callback for the ALAC encoder: returns the module text stored
   * under the "FFmpegALAC" key. The argument is ignored. */
  static const char *alac_getname(void *unused)
  {
      const char *label = obs_module_text("FFmpegALAC");

      UNUSED_PARAMETER(unused);
      return label;
  }
  /* .get_name callback for the FLAC encoder: returns the module text stored
   * under the "FFmpegFLAC" key. The argument is ignored. */
  static const char *flac_getname(void *unused)
  {
      const char *label = obs_module_text("FFmpegFLAC");

      UNUSED_PARAMETER(unused);
      return label;
  }
  77. static void enc_destroy(void *data)
  78. {
  79. struct enc_encoder *enc = data;
  80. if (enc->samples[0])
  81. av_freep(&enc->samples[0]);
  82. if (enc->context)
  83. avcodec_free_context(&enc->context);
  84. if (enc->aframe)
  85. av_frame_free(&enc->aframe);
  86. da_free(enc->packet_buffer);
  87. bfree(enc);
  88. }
  89. static bool initialize_codec(struct enc_encoder *enc)
  90. {
  91. int ret;
  92. int channels;
  93. enc->aframe = av_frame_alloc();
  94. if (!enc->aframe) {
  95. warn("Failed to allocate audio frame");
  96. return false;
  97. }
  98. ret = avcodec_open2(enc->context, enc->codec, NULL);
  99. if (ret < 0) {
  100. struct dstr error_message = {0};
  101. dstr_printf(&error_message, "Failed to open AAC codec: %s", av_err2str(ret));
  102. obs_encoder_set_last_error(enc->encoder, error_message.array);
  103. dstr_free(&error_message);
  104. warn("Failed to open AAC codec: %s", av_err2str(ret));
  105. return false;
  106. }
  107. enc->aframe->format = enc->context->sample_fmt;
  108. channels = enc->context->ch_layout.nb_channels;
  109. enc->aframe->ch_layout = enc->context->ch_layout;
  110. enc->aframe->sample_rate = enc->context->sample_rate;
  111. enc->frame_size = enc->context->frame_size;
  112. if (!enc->frame_size)
  113. enc->frame_size = 1024;
  114. enc->frame_size_bytes = enc->frame_size * (int)enc->audio_size;
  115. ret = av_samples_alloc(enc->samples, NULL, channels, enc->frame_size, enc->context->sample_fmt, 0);
  116. if (ret < 0) {
  117. warn("Failed to create audio buffer: %s", av_err2str(ret));
  118. return false;
  119. }
  120. return true;
  121. }
  122. static void init_sizes(struct enc_encoder *enc, audio_t *audio)
  123. {
  124. const struct audio_output_info *aoi;
  125. enum audio_format format;
  126. aoi = audio_output_get_info(audio);
  127. format = convert_ffmpeg_sample_format(enc->context->sample_fmt);
  128. enc->audio_planes = get_audio_planes(format, aoi->speakers);
  129. enc->audio_size = get_audio_size(format, aoi->speakers, 1);
  130. }
  /* Smaller of two values. Arguments may be evaluated more than once, so avoid
   * side effects. Defined only if no earlier header already provides MIN. */
  #if !defined(MIN)
  #define MIN(a, b) (((a) < (b)) ? (a) : (b))
  #endif
  134. static void *enc_create(obs_data_t *settings, obs_encoder_t *encoder, const char *type, const char *alt,
  135. enum AVSampleFormat sample_format)
  136. {
  137. struct enc_encoder *enc;
  138. int bitrate = (int)obs_data_get_int(settings, "bitrate");
  139. audio_t *audio = obs_encoder_audio(encoder);
  140. enc = bzalloc(sizeof(struct enc_encoder));
  141. enc->encoder = encoder;
  142. enc->codec = avcodec_find_encoder_by_name(type);
  143. enc->type = type;
  144. if (!enc->codec && alt) {
  145. enc->codec = avcodec_find_encoder_by_name(alt);
  146. enc->type = alt;
  147. }
  148. blog(LOG_INFO, "---------------------------------");
  149. if (!enc->codec) {
  150. warn("Couldn't find encoder");
  151. goto fail;
  152. }
  153. const AVCodecDescriptor *codec_desc = avcodec_descriptor_get(enc->codec->id);
  154. if (!codec_desc) {
  155. warn("Failed to get codec descriptor");
  156. goto fail;
  157. }
  158. if (!bitrate && !(codec_desc->props & AV_CODEC_PROP_LOSSLESS)) {
  159. warn("Invalid bitrate specified");
  160. goto fail;
  161. }
  162. enc->context = avcodec_alloc_context3(enc->codec);
  163. if (!enc->context) {
  164. warn("Failed to create codec context");
  165. goto fail;
  166. }
  167. if (codec_desc->props & AV_CODEC_PROP_LOSSLESS)
  168. // Set by encoder on init, not known at this time
  169. enc->context->bit_rate = 0;
  170. else
  171. enc->context->bit_rate = bitrate * 1000;
  172. const struct audio_output_info *aoi;
  173. aoi = audio_output_get_info(audio);
  174. av_channel_layout_default(&enc->context->ch_layout, (int)audio_output_get_channels(audio));
  175. /* The avutil default channel layout for 5 channels is 5.0, which OBS
  176. * does not support. Manually set 5 channels to 4.1. */
  177. if (aoi->speakers == SPEAKERS_4POINT1)
  178. enc->context->ch_layout = (AVChannelLayout)AV_CHANNEL_LAYOUT_4POINT1;
  179. /* AAC, ALAC, & FLAC default to 3.0 for 3 channels instead of 2.1.
  180. * Tell the encoder to deal with 2.1 as if it were 3.0. */
  181. if (aoi->speakers == SPEAKERS_2POINT1)
  182. enc->context->ch_layout = (AVChannelLayout)AV_CHANNEL_LAYOUT_SURROUND;
  183. // ALAC supports 7.1 wide instead of regular 7.1.
  184. if (aoi->speakers == SPEAKERS_7POINT1 && astrcmpi(enc->type, "alac") == 0)
  185. enc->context->ch_layout = (AVChannelLayout)AV_CHANNEL_LAYOUT_7POINT1_WIDE_BACK;
  186. enc->context->sample_rate = audio_output_get_sample_rate(audio);
  187. if (enc->codec->sample_fmts) {
  188. /* Check if the requested format is actually available for the specified
  189. * encoder. This may not always be the case due to FFmpeg changes or a
  190. * fallback being used (for example, when libopus is unavailable). */
  191. const enum AVSampleFormat *fmt = enc->codec->sample_fmts;
  192. while (*fmt != AV_SAMPLE_FMT_NONE) {
  193. if (*fmt == sample_format) {
  194. enc->context->sample_fmt = *fmt;
  195. break;
  196. }
  197. fmt++;
  198. }
  199. /* Fall back to default if requested format was not found. */
  200. if (enc->context->sample_fmt == AV_SAMPLE_FMT_NONE)
  201. enc->context->sample_fmt = enc->codec->sample_fmts[0];
  202. } else {
  203. /* Fall back to planar float if codec does not specify formats. */
  204. enc->context->sample_fmt = AV_SAMPLE_FMT_FLTP;
  205. }
  206. /* check to make sure sample rate is supported */
  207. if (enc->codec->supported_samplerates) {
  208. const int *rate = enc->codec->supported_samplerates;
  209. int cur_rate = enc->context->sample_rate;
  210. int closest = 0;
  211. while (*rate) {
  212. int dist = abs(cur_rate - *rate);
  213. int closest_dist = abs(cur_rate - closest);
  214. if (dist < closest_dist)
  215. closest = *rate;
  216. rate++;
  217. }
  218. if (closest)
  219. enc->context->sample_rate = closest;
  220. }
  221. char buf[256];
  222. av_channel_layout_describe(&enc->context->ch_layout, buf, 256);
  223. info("bitrate: %" PRId64 ", channels: %d, channel_layout: %s, track: %d\n",
  224. (int64_t)enc->context->bit_rate / 1000, (int)enc->context->ch_layout.nb_channels, buf,
  225. (int)obs_encoder_get_mixer_index(enc->encoder) + 1);
  226. init_sizes(enc, audio);
  227. /* enable experimental FFmpeg encoder if the only one available */
  228. enc->context->strict_std_compliance = -2;
  229. enc->context->flags = AV_CODEC_FLAG_GLOBAL_HEADER;
  230. if (initialize_codec(enc))
  231. return enc;
  232. fail:
  233. enc_destroy(enc);
  234. return NULL;
  235. }
  236. static void *aac_create(obs_data_t *settings, obs_encoder_t *encoder)
  237. {
  238. return enc_create(settings, encoder, "aac", NULL, AV_SAMPLE_FMT_NONE);
  239. }
  240. static void *opus_create(obs_data_t *settings, obs_encoder_t *encoder)
  241. {
  242. return enc_create(settings, encoder, "libopus", "opus", AV_SAMPLE_FMT_FLT);
  243. }
  244. static void *pcm_create(obs_data_t *settings, obs_encoder_t *encoder)
  245. {
  246. return enc_create(settings, encoder, "pcm_s16le", NULL, AV_SAMPLE_FMT_NONE);
  247. }
  248. static void *pcm24_create(obs_data_t *settings, obs_encoder_t *encoder)
  249. {
  250. return enc_create(settings, encoder, "pcm_s24le", NULL, AV_SAMPLE_FMT_NONE);
  251. }
  252. static void *pcm32_create(obs_data_t *settings, obs_encoder_t *encoder)
  253. {
  254. return enc_create(settings, encoder, "pcm_f32le", NULL, AV_SAMPLE_FMT_NONE);
  255. }
  256. static void *alac_create(obs_data_t *settings, obs_encoder_t *encoder)
  257. {
  258. return enc_create(settings, encoder, "alac", NULL, AV_SAMPLE_FMT_S32P);
  259. }
  260. static void *flac_create(obs_data_t *settings, obs_encoder_t *encoder)
  261. {
  262. return enc_create(settings, encoder, "flac", NULL, AV_SAMPLE_FMT_S16);
  263. }
  264. static bool do_encode(struct enc_encoder *enc, struct encoder_packet *packet, bool *received_packet)
  265. {
  266. AVRational time_base = {1, enc->context->sample_rate};
  267. AVPacket avpacket = {0};
  268. int got_packet;
  269. int ret;
  270. int channels;
  271. enc->aframe->nb_samples = enc->frame_size;
  272. enc->aframe->pts =
  273. av_rescale_q(enc->total_samples, (AVRational){1, enc->context->sample_rate}, enc->context->time_base);
  274. enc->aframe->ch_layout = enc->context->ch_layout;
  275. channels = enc->context->ch_layout.nb_channels;
  276. ret = avcodec_fill_audio_frame(enc->aframe, channels, enc->context->sample_fmt, enc->samples[0],
  277. enc->frame_size_bytes * channels, 1);
  278. if (ret < 0) {
  279. warn("avcodec_fill_audio_frame failed: %s", av_err2str(ret));
  280. return false;
  281. }
  282. enc->total_samples += enc->frame_size;
  283. ret = avcodec_send_frame(enc->context, enc->aframe);
  284. if (ret == 0)
  285. ret = avcodec_receive_packet(enc->context, &avpacket);
  286. got_packet = (ret == 0);
  287. if (ret == AVERROR_EOF || ret == AVERROR(EAGAIN))
  288. ret = 0;
  289. if (ret < 0) {
  290. warn("avcodec_encode_audio2 failed: %s", av_err2str(ret));
  291. return false;
  292. }
  293. *received_packet = !!got_packet;
  294. if (!got_packet)
  295. return true;
  296. da_resize(enc->packet_buffer, 0);
  297. da_push_back_array(enc->packet_buffer, avpacket.data, avpacket.size);
  298. packet->pts = rescale_ts(avpacket.pts, enc->context, time_base);
  299. packet->dts = rescale_ts(avpacket.dts, enc->context, time_base);
  300. packet->data = enc->packet_buffer.array;
  301. packet->size = avpacket.size;
  302. packet->type = OBS_ENCODER_AUDIO;
  303. packet->keyframe = true;
  304. packet->timebase_num = 1;
  305. packet->timebase_den = (int32_t)enc->context->sample_rate;
  306. av_packet_unref(&avpacket);
  307. return true;
  308. }
  309. static bool enc_encode(void *data, struct encoder_frame *frame, struct encoder_packet *packet, bool *received_packet)
  310. {
  311. struct enc_encoder *enc = data;
  312. for (size_t i = 0; i < enc->audio_planes; i++)
  313. memcpy(enc->samples[i], frame->data[i], enc->frame_size_bytes);
  314. return do_encode(enc, packet, received_packet);
  315. }
  316. static void enc_defaults(obs_data_t *settings)
  317. {
  318. obs_data_set_default_int(settings, "bitrate", 128);
  319. }
  320. static obs_properties_t *enc_properties(void *unused)
  321. {
  322. UNUSED_PARAMETER(unused);
  323. obs_properties_t *props = obs_properties_create();
  324. obs_properties_add_int(props, "bitrate", obs_module_text("Bitrate"), 64, 1024, 32);
  325. return props;
  326. }
  327. static bool enc_extra_data(void *data, uint8_t **extra_data, size_t *size)
  328. {
  329. struct enc_encoder *enc = data;
  330. *extra_data = enc->context->extradata;
  331. *size = enc->context->extradata_size;
  332. return true;
  333. }
  334. static void enc_audio_info(void *data, struct audio_convert_info *info)
  335. {
  336. struct enc_encoder *enc = data;
  337. int channels;
  338. channels = enc->context->ch_layout.nb_channels;
  339. info->format = convert_ffmpeg_sample_format(enc->context->sample_fmt);
  340. info->samples_per_sec = (uint32_t)enc->context->sample_rate;
  341. if (channels != 7 && channels <= 8)
  342. info->speakers = (enum speaker_layout)(channels);
  343. else
  344. info->speakers = SPEAKERS_UNKNOWN;
  345. }
  346. static void enc_audio_info_float(void *data, struct audio_convert_info *info)
  347. {
  348. enc_audio_info(data, info);
  349. info->allow_clipping = true;
  350. }
  351. static size_t enc_frame_size(void *data)
  352. {
  353. struct enc_encoder *enc = data;
  354. return enc->frame_size;
  355. }
  356. struct obs_encoder_info aac_encoder_info = {
  357. .id = "ffmpeg_aac",
  358. .type = OBS_ENCODER_AUDIO,
  359. .codec = "aac",
  360. .get_name = aac_getname,
  361. .create = aac_create,
  362. .destroy = enc_destroy,
  363. .encode = enc_encode,
  364. .get_frame_size = enc_frame_size,
  365. .get_defaults = enc_defaults,
  366. .get_properties = enc_properties,
  367. .get_extra_data = enc_extra_data,
  368. .get_audio_info = enc_audio_info,
  369. };
  370. struct obs_encoder_info opus_encoder_info = {
  371. .id = "ffmpeg_opus",
  372. .type = OBS_ENCODER_AUDIO,
  373. .codec = "opus",
  374. .get_name = opus_getname,
  375. .create = opus_create,
  376. .destroy = enc_destroy,
  377. .encode = enc_encode,
  378. .get_frame_size = enc_frame_size,
  379. .get_defaults = enc_defaults,
  380. .get_properties = enc_properties,
  381. .get_extra_data = enc_extra_data,
  382. .get_audio_info = enc_audio_info,
  383. };
  384. struct obs_encoder_info pcm_encoder_info = {
  385. .id = "ffmpeg_pcm_s16le",
  386. .type = OBS_ENCODER_AUDIO,
  387. .codec = "pcm_s16le",
  388. .get_name = pcm_getname,
  389. .create = pcm_create,
  390. .destroy = enc_destroy,
  391. .encode = enc_encode,
  392. .get_frame_size = enc_frame_size,
  393. .get_defaults = enc_defaults,
  394. .get_properties = enc_properties,
  395. .get_extra_data = enc_extra_data,
  396. .get_audio_info = enc_audio_info,
  397. };
  398. struct obs_encoder_info pcm24_encoder_info = {
  399. .id = "ffmpeg_pcm_s24le",
  400. .type = OBS_ENCODER_AUDIO,
  401. .codec = "pcm_s24le",
  402. .get_name = pcm24_getname,
  403. .create = pcm24_create,
  404. .destroy = enc_destroy,
  405. .encode = enc_encode,
  406. .get_frame_size = enc_frame_size,
  407. .get_defaults = enc_defaults,
  408. .get_properties = enc_properties,
  409. .get_extra_data = enc_extra_data,
  410. .get_audio_info = enc_audio_info,
  411. };
  412. struct obs_encoder_info pcm32_encoder_info = {
  413. .id = "ffmpeg_pcm_f32le",
  414. .type = OBS_ENCODER_AUDIO,
  415. .codec = "pcm_f32le",
  416. .get_name = pcm32_getname,
  417. .create = pcm32_create,
  418. .destroy = enc_destroy,
  419. .encode = enc_encode,
  420. .get_frame_size = enc_frame_size,
  421. .get_defaults = enc_defaults,
  422. .get_properties = enc_properties,
  423. .get_extra_data = enc_extra_data,
  424. .get_audio_info = enc_audio_info_float,
  425. };
  426. struct obs_encoder_info alac_encoder_info = {
  427. .id = "ffmpeg_alac",
  428. .type = OBS_ENCODER_AUDIO,
  429. .codec = "alac",
  430. .get_name = alac_getname,
  431. .create = alac_create,
  432. .destroy = enc_destroy,
  433. .encode = enc_encode,
  434. .get_frame_size = enc_frame_size,
  435. .get_defaults = enc_defaults,
  436. .get_properties = enc_properties,
  437. .get_extra_data = enc_extra_data,
  438. .get_audio_info = enc_audio_info,
  439. };
  440. struct obs_encoder_info flac_encoder_info = {
  441. .id = "ffmpeg_flac",
  442. .type = OBS_ENCODER_AUDIO,
  443. .codec = "flac",
  444. .get_name = flac_getname,
  445. .create = flac_create,
  446. .destroy = enc_destroy,
  447. .encode = enc_encode,
  448. .get_frame_size = enc_frame_size,
  449. .get_defaults = enc_defaults,
  450. .get_properties = enc_properties,
  451. .get_extra_data = enc_extra_data,
  452. .get_audio_info = enc_audio_info,
  453. };