1
0

audio-io.c 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455
  1. /******************************************************************************
  2. Copyright (C) 2023 by Lain Bailey <[email protected]>
  3. This program is free software: you can redistribute it and/or modify
  4. it under the terms of the GNU General Public License as published by
  5. the Free Software Foundation, either version 2 of the License, or
  6. (at your option) any later version.
  7. This program is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU General Public License for more details.
  11. You should have received a copy of the GNU General Public License
  12. along with this program. If not, see <http://www.gnu.org/licenses/>.
  13. ******************************************************************************/
  14. #include <math.h>
  15. #include <inttypes.h>
  16. #include "../util/threading.h"
  17. #include "../util/darray.h"
  18. #include "../util/deque.h"
  19. #include "../util/platform.h"
  20. #include "../util/profiler.h"
  21. #include "../util/util_uint64.h"
  22. #include "audio-io.h"
  23. #include "audio-resampler.h"
  24. #ifdef _WIN32
  25. #define WIN32_LEAN_AND_MEAN
  26. #include <Windows.h>
  27. #include <avrt.h>
  28. #endif
  29. extern profiler_name_store_t *obs_get_profiler_name_store(void);
  30. /* #define DEBUG_AUDIO */
  31. #define nop() \
  32. do { \
  33. int invalid = 0; \
  34. } while (0)
  35. struct audio_input {
  36. struct audio_convert_info conversion;
  37. audio_resampler_t *resampler;
  38. audio_output_callback_t callback;
  39. void *param;
  40. };
  41. static inline void audio_input_free(struct audio_input *input)
  42. {
  43. audio_resampler_destroy(input->resampler);
  44. }
  45. struct audio_mix {
  46. DARRAY(struct audio_input) inputs;
  47. float buffer[MAX_AUDIO_CHANNELS][AUDIO_OUTPUT_FRAMES];
  48. float buffer_unclamped[MAX_AUDIO_CHANNELS][AUDIO_OUTPUT_FRAMES];
  49. };
  50. struct audio_output {
  51. struct audio_output_info info;
  52. size_t block_size;
  53. size_t channels;
  54. size_t planes;
  55. pthread_t thread;
  56. os_event_t *stop_event;
  57. bool initialized;
  58. audio_input_callback_t input_cb;
  59. void *input_param;
  60. pthread_mutex_t input_mutex;
  61. struct audio_mix mixes[MAX_AUDIO_MIXES];
  62. };
  63. /* ------------------------------------------------------------------------- */
  64. static bool resample_audio_output(struct audio_input *input, struct audio_data *data)
  65. {
  66. bool success = true;
  67. if (input->resampler) {
  68. uint8_t *output[MAX_AV_PLANES];
  69. uint32_t frames;
  70. uint64_t offset;
  71. memset(output, 0, sizeof(output));
  72. success = audio_resampler_resample(input->resampler, output, &frames, &offset,
  73. (const uint8_t *const *)data->data, data->frames);
  74. for (size_t i = 0; i < MAX_AV_PLANES; i++)
  75. data->data[i] = output[i];
  76. data->frames = frames;
  77. data->timestamp -= offset;
  78. }
  79. return success;
  80. }
  81. static inline void do_audio_output(struct audio_output *audio, size_t mix_idx, uint64_t timestamp, uint32_t frames)
  82. {
  83. struct audio_mix *mix = &audio->mixes[mix_idx];
  84. struct audio_data data;
  85. pthread_mutex_lock(&audio->input_mutex);
  86. for (size_t i = mix->inputs.num; i > 0; i--) {
  87. struct audio_input *input = mix->inputs.array + (i - 1);
  88. float(*buf)[AUDIO_OUTPUT_FRAMES] = input->conversion.allow_clipping ? mix->buffer_unclamped
  89. : mix->buffer;
  90. for (size_t i = 0; i < audio->planes; i++)
  91. data.data[i] = (uint8_t *)buf[i];
  92. data.frames = frames;
  93. data.timestamp = timestamp;
  94. if (resample_audio_output(input, &data))
  95. input->callback(input->param, mix_idx, &data);
  96. }
  97. pthread_mutex_unlock(&audio->input_mutex);
  98. }
  99. static inline void clamp_audio_output(struct audio_output *audio, size_t bytes)
  100. {
  101. size_t float_size = bytes / sizeof(float);
  102. for (size_t mix_idx = 0; mix_idx < MAX_AUDIO_MIXES; mix_idx++) {
  103. struct audio_mix *mix = &audio->mixes[mix_idx];
  104. /* do not process mixing if a specific mix is inactive */
  105. if (!mix->inputs.num)
  106. continue;
  107. for (size_t plane = 0; plane < audio->planes; plane++) {
  108. float *mix_data = mix->buffer[plane];
  109. float *mix_end = &mix_data[float_size];
  110. /* Unclamped mix is copied directly. */
  111. memcpy(mix->buffer_unclamped[plane], mix_data, bytes);
  112. while (mix_data < mix_end) {
  113. float val = *mix_data;
  114. val = (val == val) ? val : 0.0f;
  115. val = (val > 1.0f) ? 1.0f : val;
  116. val = (val < -1.0f) ? -1.0f : val;
  117. *(mix_data++) = val;
  118. }
  119. }
  120. }
  121. }
  122. static void input_and_output(struct audio_output *audio, uint64_t audio_time, uint64_t prev_time)
  123. {
  124. size_t bytes = AUDIO_OUTPUT_FRAMES * audio->block_size;
  125. struct audio_output_data data[MAX_AUDIO_MIXES];
  126. uint32_t active_mixes = 0;
  127. uint64_t new_ts = 0;
  128. bool success;
  129. memset(data, 0, sizeof(data));
  130. #ifdef DEBUG_AUDIO
  131. blog(LOG_DEBUG, "audio_time: %llu, prev_time: %llu, bytes: %lu", audio_time, prev_time, bytes);
  132. #endif
  133. /* get mixers */
  134. pthread_mutex_lock(&audio->input_mutex);
  135. for (size_t i = 0; i < MAX_AUDIO_MIXES; i++) {
  136. if (audio->mixes[i].inputs.num)
  137. active_mixes |= (1 << i);
  138. }
  139. pthread_mutex_unlock(&audio->input_mutex);
  140. /* clear mix buffers */
  141. for (size_t mix_idx = 0; mix_idx < MAX_AUDIO_MIXES; mix_idx++) {
  142. struct audio_mix *mix = &audio->mixes[mix_idx];
  143. memset(mix->buffer, 0, sizeof(mix->buffer));
  144. for (size_t i = 0; i < audio->planes; i++)
  145. data[mix_idx].data[i] = mix->buffer[i];
  146. }
  147. /* get new audio data */
  148. success = audio->input_cb(audio->input_param, prev_time, audio_time, &new_ts, active_mixes, data);
  149. if (!success)
  150. return;
  151. /* clamps audio data to -1.0..1.0 */
  152. clamp_audio_output(audio, bytes);
  153. /* output */
  154. for (size_t i = 0; i < MAX_AUDIO_MIXES; i++)
  155. do_audio_output(audio, i, new_ts, AUDIO_OUTPUT_FRAMES);
  156. }
  157. static void *audio_thread(void *param)
  158. {
  159. #ifdef _WIN32
  160. DWORD unused = 0;
  161. const HANDLE handle = AvSetMmThreadCharacteristics(L"Audio", &unused);
  162. #endif
  163. struct audio_output *audio = param;
  164. size_t rate = audio->info.samples_per_sec;
  165. uint64_t samples = 0;
  166. uint64_t start_time = os_gettime_ns();
  167. uint64_t prev_time = start_time;
  168. os_set_thread_name("audio-io: audio thread");
  169. const char *audio_thread_name =
  170. profile_store_name(obs_get_profiler_name_store(), "audio_thread(%s)", audio->info.name);
  171. while (os_event_try(audio->stop_event) == EAGAIN) {
  172. samples += AUDIO_OUTPUT_FRAMES;
  173. uint64_t audio_time = start_time + audio_frames_to_ns(rate, samples);
  174. os_sleepto_ns_fast(audio_time);
  175. profile_start(audio_thread_name);
  176. input_and_output(audio, audio_time, prev_time);
  177. prev_time = audio_time;
  178. profile_end(audio_thread_name);
  179. profile_reenable_thread();
  180. }
  181. #ifdef _WIN32
  182. if (handle)
  183. AvRevertMmThreadCharacteristics(handle);
  184. #endif
  185. return NULL;
  186. }
  187. /* ------------------------------------------------------------------------- */
  188. static size_t audio_get_input_idx(const audio_t *audio, size_t mix_idx, audio_output_callback_t callback, void *param)
  189. {
  190. const struct audio_mix *mix = &audio->mixes[mix_idx];
  191. for (size_t i = 0; i < mix->inputs.num; i++) {
  192. struct audio_input *input = mix->inputs.array + i;
  193. if (input->callback == callback && input->param == param)
  194. return i;
  195. }
  196. return DARRAY_INVALID;
  197. }
  198. static inline bool audio_input_init(struct audio_input *input, struct audio_output *audio)
  199. {
  200. if (input->conversion.format != audio->info.format ||
  201. input->conversion.samples_per_sec != audio->info.samples_per_sec ||
  202. input->conversion.speakers != audio->info.speakers) {
  203. struct resample_info from = {.format = audio->info.format,
  204. .samples_per_sec = audio->info.samples_per_sec,
  205. .speakers = audio->info.speakers};
  206. struct resample_info to = {.format = input->conversion.format,
  207. .samples_per_sec = input->conversion.samples_per_sec,
  208. .speakers = input->conversion.speakers};
  209. input->resampler = audio_resampler_create(&to, &from);
  210. if (!input->resampler) {
  211. blog(LOG_ERROR, "audio_input_init: Failed to "
  212. "create resampler");
  213. return false;
  214. }
  215. } else {
  216. input->resampler = NULL;
  217. }
  218. return true;
  219. }
  220. bool audio_output_connect(audio_t *audio, size_t mi, const struct audio_convert_info *conversion,
  221. audio_output_callback_t callback, void *param)
  222. {
  223. bool success = false;
  224. if (!audio || mi >= MAX_AUDIO_MIXES)
  225. return false;
  226. pthread_mutex_lock(&audio->input_mutex);
  227. if (audio_get_input_idx(audio, mi, callback, param) == DARRAY_INVALID) {
  228. struct audio_mix *mix = &audio->mixes[mi];
  229. struct audio_input input = {
  230. .callback = callback,
  231. .param = param,
  232. };
  233. if (conversion) {
  234. input.conversion = *conversion;
  235. } else {
  236. input.conversion.format = audio->info.format;
  237. input.conversion.speakers = audio->info.speakers;
  238. input.conversion.samples_per_sec = audio->info.samples_per_sec;
  239. }
  240. if (input.conversion.format == AUDIO_FORMAT_UNKNOWN)
  241. input.conversion.format = audio->info.format;
  242. if (input.conversion.speakers == SPEAKERS_UNKNOWN)
  243. input.conversion.speakers = audio->info.speakers;
  244. if (input.conversion.samples_per_sec == 0)
  245. input.conversion.samples_per_sec = audio->info.samples_per_sec;
  246. success = audio_input_init(&input, audio);
  247. if (success)
  248. da_push_back(mix->inputs, &input);
  249. }
  250. pthread_mutex_unlock(&audio->input_mutex);
  251. return success;
  252. }
  253. void audio_output_disconnect(audio_t *audio, size_t mix_idx, audio_output_callback_t callback, void *param)
  254. {
  255. if (!audio || mix_idx >= MAX_AUDIO_MIXES)
  256. return;
  257. pthread_mutex_lock(&audio->input_mutex);
  258. size_t idx = audio_get_input_idx(audio, mix_idx, callback, param);
  259. if (idx != DARRAY_INVALID) {
  260. struct audio_mix *mix = &audio->mixes[mix_idx];
  261. audio_input_free(mix->inputs.array + idx);
  262. da_erase(mix->inputs, idx);
  263. }
  264. pthread_mutex_unlock(&audio->input_mutex);
  265. }
  266. static inline bool valid_audio_params(const struct audio_output_info *info)
  267. {
  268. return info->format && info->name && info->samples_per_sec > 0 && info->speakers > 0;
  269. }
  270. int audio_output_open(audio_t **audio, struct audio_output_info *info)
  271. {
  272. struct audio_output *out;
  273. bool planar = is_audio_planar(info->format);
  274. if (!valid_audio_params(info))
  275. return AUDIO_OUTPUT_INVALIDPARAM;
  276. out = bzalloc(sizeof(struct audio_output));
  277. if (!out)
  278. goto fail0;
  279. memcpy(&out->info, info, sizeof(struct audio_output_info));
  280. out->channels = get_audio_channels(info->speakers);
  281. out->planes = planar ? out->channels : 1;
  282. out->input_cb = info->input_callback;
  283. out->input_param = info->input_param;
  284. out->block_size = (planar ? 1 : out->channels) * get_audio_bytes_per_channel(info->format);
  285. if (pthread_mutex_init_recursive(&out->input_mutex) != 0)
  286. goto fail0;
  287. if (os_event_init(&out->stop_event, OS_EVENT_TYPE_MANUAL) != 0)
  288. goto fail1;
  289. if (pthread_create(&out->thread, NULL, audio_thread, out) != 0)
  290. goto fail2;
  291. out->initialized = true;
  292. *audio = out;
  293. return AUDIO_OUTPUT_SUCCESS;
  294. fail2:
  295. os_event_destroy(out->stop_event);
  296. fail1:
  297. pthread_mutex_destroy(&out->input_mutex);
  298. fail0:
  299. audio_output_close(out);
  300. return AUDIO_OUTPUT_FAIL;
  301. }
  302. void audio_output_close(audio_t *audio)
  303. {
  304. void *thread_ret;
  305. if (!audio)
  306. return;
  307. if (audio->initialized) {
  308. os_event_signal(audio->stop_event);
  309. pthread_join(audio->thread, &thread_ret);
  310. os_event_destroy(audio->stop_event);
  311. pthread_mutex_destroy(&audio->input_mutex);
  312. }
  313. for (size_t mix_idx = 0; mix_idx < MAX_AUDIO_MIXES; mix_idx++) {
  314. struct audio_mix *mix = &audio->mixes[mix_idx];
  315. for (size_t i = 0; i < mix->inputs.num; i++)
  316. audio_input_free(mix->inputs.array + i);
  317. da_free(mix->inputs);
  318. }
  319. bfree(audio);
  320. }
  321. const struct audio_output_info *audio_output_get_info(const audio_t *audio)
  322. {
  323. return audio ? &audio->info : NULL;
  324. }
  325. bool audio_output_active(const audio_t *audio)
  326. {
  327. if (!audio)
  328. return false;
  329. for (size_t mix_idx = 0; mix_idx < MAX_AUDIO_MIXES; mix_idx++) {
  330. const struct audio_mix *mix = &audio->mixes[mix_idx];
  331. if (mix->inputs.num != 0)
  332. return true;
  333. }
  334. return false;
  335. }
  336. size_t audio_output_get_block_size(const audio_t *audio)
  337. {
  338. return audio->block_size;
  339. }
  340. size_t audio_output_get_planes(const audio_t *audio)
  341. {
  342. return audio->planes;
  343. }
  344. size_t audio_output_get_channels(const audio_t *audio)
  345. {
  346. return audio->channels;
  347. }
  348. uint32_t audio_output_get_sample_rate(const audio_t *audio)
  349. {
  350. return audio->info.samples_per_sec;
  351. }