wasapi-output.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500
  1. #include "../../media-io/audio-resampler.h"
  2. #include "../../util/circlebuf.h"
  3. #include "../../util/platform.h"
  4. #include "../../util/darray.h"
  5. #include "../../util/util_uint64.h"
  6. #include "../../obs-internal.h"
  7. #include "wasapi-output.h"
  8. #define ACTUALLY_DEFINE_GUID(name, l, w1, w2, b1, b2, b3, b4, b5, b6, b7, b8) \
  9. EXTERN_C const GUID DECLSPEC_SELECTANY \
  10. name = {l, w1, w2, {b1, b2, b3, b4, b5, b6, b7, b8}}
  11. #define do_log(level, format, ...) \
  12. blog(level, "[audio monitoring: '%s'] " format, \
  13. obs_source_get_name(monitor->source), ##__VA_ARGS__)
  14. #define warn(format, ...) do_log(LOG_WARNING, format, ##__VA_ARGS__)
  15. #define info(format, ...) do_log(LOG_INFO, format, ##__VA_ARGS__)
  16. #define debug(format, ...) do_log(LOG_DEBUG, format, ##__VA_ARGS__)
  17. ACTUALLY_DEFINE_GUID(CLSID_MMDeviceEnumerator, 0xBCDE0395, 0xE52F, 0x467C, 0x8E,
  18. 0x3D, 0xC4, 0x57, 0x92, 0x91, 0x69, 0x2E);
  19. ACTUALLY_DEFINE_GUID(IID_IMMDeviceEnumerator, 0xA95664D2, 0x9614, 0x4F35, 0xA7,
  20. 0x46, 0xDE, 0x8D, 0xB6, 0x36, 0x17, 0xE6);
  21. ACTUALLY_DEFINE_GUID(IID_IAudioClient, 0x1CB9AD4C, 0xDBFA, 0x4C32, 0xB1, 0x78,
  22. 0xC2, 0xF5, 0x68, 0xA7, 0x03, 0xB2);
  23. ACTUALLY_DEFINE_GUID(IID_IAudioRenderClient, 0xF294ACFC, 0x3146, 0x4483, 0xA7,
  24. 0xBF, 0xAD, 0xDC, 0xA7, 0xC2, 0x60, 0xE2);
  25. struct audio_monitor {
  26. obs_source_t *source;
  27. IAudioClient *client;
  28. IAudioRenderClient *render;
  29. uint64_t last_recv_time;
  30. uint64_t prev_video_ts;
  31. uint64_t time_since_prev;
  32. audio_resampler_t *resampler;
  33. uint32_t sample_rate;
  34. uint32_t channels;
  35. bool source_has_video;
  36. bool ignore;
  37. int64_t lowest_audio_offset;
  38. struct circlebuf delay_buffer;
  39. uint32_t delay_size;
  40. DARRAY(float) buf;
  41. SRWLOCK playback_mutex;
  42. };
  43. /* #define DEBUG_AUDIO */
  44. static bool process_audio_delay(struct audio_monitor *monitor, float **data,
  45. uint32_t *frames, uint64_t ts, uint32_t pad)
  46. {
  47. obs_source_t *s = monitor->source;
  48. uint64_t last_frame_ts = s->last_frame_ts;
  49. uint64_t cur_time = os_gettime_ns();
  50. uint64_t front_ts;
  51. uint64_t cur_ts;
  52. int64_t diff;
  53. uint32_t blocksize = monitor->channels * sizeof(float);
  54. /* cut off audio if long-since leftover audio in delay buffer */
  55. if (cur_time - monitor->last_recv_time > 1000000000)
  56. circlebuf_free(&monitor->delay_buffer);
  57. monitor->last_recv_time = cur_time;
  58. ts += monitor->source->sync_offset;
  59. circlebuf_push_back(&monitor->delay_buffer, &ts, sizeof(ts));
  60. circlebuf_push_back(&monitor->delay_buffer, frames, sizeof(*frames));
  61. circlebuf_push_back(&monitor->delay_buffer, *data, *frames * blocksize);
  62. if (!monitor->prev_video_ts) {
  63. monitor->prev_video_ts = last_frame_ts;
  64. } else if (monitor->prev_video_ts == last_frame_ts) {
  65. monitor->time_since_prev += util_mul_div64(
  66. *frames, 1000000000ULL, monitor->sample_rate);
  67. } else {
  68. monitor->time_since_prev = 0;
  69. }
  70. while (monitor->delay_buffer.size != 0) {
  71. size_t size;
  72. bool bad_diff;
  73. circlebuf_peek_front(&monitor->delay_buffer, &cur_ts,
  74. sizeof(ts));
  75. front_ts = cur_ts - util_mul_div64(pad, 1000000000ULL,
  76. monitor->sample_rate);
  77. diff = (int64_t)front_ts - (int64_t)last_frame_ts;
  78. bad_diff = !last_frame_ts || llabs(diff) > 5000000000 ||
  79. monitor->time_since_prev > 100000000ULL;
  80. /* delay audio if rushing */
  81. if (!bad_diff && diff > 75000000) {
  82. #ifdef DEBUG_AUDIO
  83. blog(LOG_INFO,
  84. "audio rushing, cutting audio, "
  85. "diff: %lld, delay buffer size: %lu, "
  86. "v: %llu: a: %llu",
  87. diff, (int)monitor->delay_buffer.size,
  88. last_frame_ts, front_ts);
  89. #endif
  90. return false;
  91. }
  92. circlebuf_pop_front(&monitor->delay_buffer, NULL, sizeof(ts));
  93. circlebuf_pop_front(&monitor->delay_buffer, frames,
  94. sizeof(*frames));
  95. size = *frames * blocksize;
  96. da_resize(monitor->buf, size);
  97. circlebuf_pop_front(&monitor->delay_buffer, monitor->buf.array,
  98. size);
  99. /* cut audio if dragging */
  100. if (!bad_diff && diff < -75000000 &&
  101. monitor->delay_buffer.size > 0) {
  102. #ifdef DEBUG_AUDIO
  103. blog(LOG_INFO,
  104. "audio dragging, cutting audio, "
  105. "diff: %lld, delay buffer size: %lu, "
  106. "v: %llu: a: %llu",
  107. diff, (int)monitor->delay_buffer.size,
  108. last_frame_ts, front_ts);
  109. #endif
  110. continue;
  111. }
  112. *data = monitor->buf.array;
  113. return true;
  114. }
  115. return false;
  116. }
  117. static enum speaker_layout convert_speaker_layout(DWORD layout, WORD channels)
  118. {
  119. switch (layout) {
  120. case KSAUDIO_SPEAKER_2POINT1:
  121. return SPEAKERS_2POINT1;
  122. case KSAUDIO_SPEAKER_SURROUND:
  123. return SPEAKERS_4POINT0;
  124. case KSAUDIO_SPEAKER_4POINT1:
  125. return SPEAKERS_4POINT1;
  126. case KSAUDIO_SPEAKER_5POINT1:
  127. return SPEAKERS_5POINT1;
  128. case KSAUDIO_SPEAKER_7POINT1:
  129. return SPEAKERS_7POINT1;
  130. }
  131. return (enum speaker_layout)channels;
  132. }
  133. static bool audio_monitor_init_wasapi(struct audio_monitor *monitor)
  134. {
  135. bool success = false;
  136. IMMDeviceEnumerator *immde = NULL;
  137. WAVEFORMATEX *wfex = NULL;
  138. UINT32 frames;
  139. HRESULT hr;
  140. /* ------------------------------------------ *
  141. * Init device */
  142. hr = CoCreateInstance(&CLSID_MMDeviceEnumerator, NULL, CLSCTX_ALL,
  143. &IID_IMMDeviceEnumerator, (void **)&immde);
  144. if (FAILED(hr)) {
  145. warn("%s: Failed to create IMMDeviceEnumerator: %08lX",
  146. __FUNCTION__, hr);
  147. return false;
  148. }
  149. IMMDevice *device = NULL;
  150. const char *const id = obs->audio.monitoring_device_id;
  151. if (strcmp(id, "default") == 0) {
  152. hr = immde->lpVtbl->GetDefaultAudioEndpoint(immde, eRender,
  153. eConsole, &device);
  154. } else {
  155. wchar_t w_id[512];
  156. os_utf8_to_wcs(id, 0, w_id, 512);
  157. hr = immde->lpVtbl->GetDevice(immde, w_id, &device);
  158. }
  159. if (FAILED(hr)) {
  160. warn("%s: Failed to get device: %08lX", __FUNCTION__, hr);
  161. goto fail;
  162. }
  163. /* ------------------------------------------ *
  164. * Init client */
  165. hr = device->lpVtbl->Activate(device, &IID_IAudioClient, CLSCTX_ALL,
  166. NULL, (void **)&monitor->client);
  167. device->lpVtbl->Release(device);
  168. if (FAILED(hr)) {
  169. warn("%s: Failed to activate device: %08lX", __FUNCTION__, hr);
  170. goto fail;
  171. }
  172. hr = monitor->client->lpVtbl->GetMixFormat(monitor->client, &wfex);
  173. if (FAILED(hr)) {
  174. warn("%s: Failed to get mix format: %08lX", __FUNCTION__, hr);
  175. goto fail;
  176. }
  177. hr = monitor->client->lpVtbl->Initialize(monitor->client,
  178. AUDCLNT_SHAREMODE_SHARED, 0,
  179. 10000000, 0, wfex, NULL);
  180. if (FAILED(hr)) {
  181. warn("%s: Failed to initialize: %08lX", __FUNCTION__, hr);
  182. goto fail;
  183. }
  184. /* ------------------------------------------ *
  185. * Init resampler */
  186. const struct audio_output_info *info =
  187. audio_output_get_info(obs->audio.audio);
  188. WAVEFORMATEXTENSIBLE *ext = (WAVEFORMATEXTENSIBLE *)wfex;
  189. struct resample_info from;
  190. struct resample_info to;
  191. from.samples_per_sec = info->samples_per_sec;
  192. from.speakers = info->speakers;
  193. from.format = AUDIO_FORMAT_FLOAT_PLANAR;
  194. to.samples_per_sec = (uint32_t)wfex->nSamplesPerSec;
  195. to.speakers =
  196. convert_speaker_layout(ext->dwChannelMask, wfex->nChannels);
  197. to.format = AUDIO_FORMAT_FLOAT;
  198. monitor->sample_rate = (uint32_t)wfex->nSamplesPerSec;
  199. monitor->channels = wfex->nChannels;
  200. monitor->resampler = audio_resampler_create(&to, &from);
  201. if (!monitor->resampler) {
  202. goto fail;
  203. }
  204. /* ------------------------------------------ *
  205. * Init client */
  206. hr = monitor->client->lpVtbl->GetBufferSize(monitor->client, &frames);
  207. if (FAILED(hr)) {
  208. warn("%s: Failed to get buffer size: %08lX", __FUNCTION__, hr);
  209. goto fail;
  210. }
  211. hr = monitor->client->lpVtbl->GetService(monitor->client,
  212. &IID_IAudioRenderClient,
  213. (void **)&monitor->render);
  214. if (FAILED(hr)) {
  215. warn("%s: Failed to get IAudioRenderClient: %08lX",
  216. __FUNCTION__, hr);
  217. goto fail;
  218. }
  219. hr = monitor->client->lpVtbl->Start(monitor->client);
  220. if (FAILED(hr)) {
  221. warn("%s: Failed to start audio: %08lX", __FUNCTION__, hr);
  222. goto fail;
  223. }
  224. success = true;
  225. fail:
  226. safe_release(immde);
  227. if (wfex)
  228. CoTaskMemFree(wfex);
  229. return success;
  230. }
  231. static void audio_monitor_free_for_reconnect(struct audio_monitor *monitor)
  232. {
  233. if (monitor->client)
  234. monitor->client->lpVtbl->Stop(monitor->client);
  235. if (monitor->render) {
  236. monitor->render->lpVtbl->Release(monitor->render);
  237. monitor->render = NULL;
  238. }
  239. if (monitor->client) {
  240. monitor->client->lpVtbl->Stop(monitor->client);
  241. monitor->client->lpVtbl->Release(monitor->client);
  242. monitor->client = NULL;
  243. }
  244. audio_resampler_destroy(monitor->resampler);
  245. monitor->resampler = NULL;
  246. circlebuf_free(&monitor->delay_buffer);
  247. da_free(monitor->buf);
  248. }
  249. static void on_audio_playback(void *param, obs_source_t *source,
  250. const struct audio_data *audio_data, bool muted)
  251. {
  252. struct audio_monitor *monitor = param;
  253. uint8_t *resample_data[MAX_AV_PLANES];
  254. float vol = source->user_volume;
  255. uint32_t resample_frames;
  256. uint64_t ts_offset;
  257. bool success;
  258. BYTE *output;
  259. if (!TryAcquireSRWLockExclusive(&monitor->playback_mutex)) {
  260. return;
  261. }
  262. if (os_atomic_load_long(&source->activate_refs) == 0) {
  263. goto unlock;
  264. }
  265. if (!monitor->client && !audio_monitor_init_wasapi(monitor)) {
  266. goto free_for_reconnect;
  267. }
  268. success = audio_resampler_resample(
  269. monitor->resampler, resample_data, &resample_frames, &ts_offset,
  270. (const uint8_t *const *)audio_data->data,
  271. (uint32_t)audio_data->frames);
  272. if (!success) {
  273. goto unlock;
  274. }
  275. UINT32 pad = 0;
  276. HRESULT hr = monitor->client->lpVtbl->GetCurrentPadding(monitor->client,
  277. &pad);
  278. if (FAILED(hr)) {
  279. goto free_for_reconnect;
  280. }
  281. bool decouple_audio = source->async_unbuffered &&
  282. source->async_decoupled;
  283. if (monitor->source_has_video && !decouple_audio) {
  284. uint64_t ts = audio_data->timestamp - ts_offset;
  285. if (!process_audio_delay(monitor, (float **)(&resample_data[0]),
  286. &resample_frames, ts, pad)) {
  287. goto unlock;
  288. }
  289. }
  290. IAudioRenderClient *const render = monitor->render;
  291. hr = render->lpVtbl->GetBuffer(render, resample_frames, &output);
  292. if (FAILED(hr)) {
  293. goto free_for_reconnect;
  294. }
  295. if (!muted) {
  296. /* apply volume */
  297. if (!close_float(vol, 1.0f, EPSILON)) {
  298. register float *cur = (float *)resample_data[0];
  299. register float *end =
  300. cur + resample_frames * monitor->channels;
  301. while (cur < end)
  302. *(cur++) *= vol;
  303. }
  304. memcpy(output, resample_data[0],
  305. resample_frames * monitor->channels * sizeof(float));
  306. }
  307. hr = render->lpVtbl->ReleaseBuffer(render, resample_frames,
  308. muted ? AUDCLNT_BUFFERFLAGS_SILENT
  309. : 0);
  310. if (FAILED(hr)) {
  311. goto free_for_reconnect;
  312. }
  313. goto unlock;
  314. free_for_reconnect:
  315. audio_monitor_free_for_reconnect(monitor);
  316. unlock:
  317. ReleaseSRWLockExclusive(&monitor->playback_mutex);
  318. }
  319. static inline void audio_monitor_free(struct audio_monitor *monitor)
  320. {
  321. if (monitor->ignore)
  322. return;
  323. if (monitor->source) {
  324. obs_source_remove_audio_capture_callback(
  325. monitor->source, on_audio_playback, monitor);
  326. }
  327. if (monitor->client)
  328. monitor->client->lpVtbl->Stop(monitor->client);
  329. safe_release(monitor->client);
  330. safe_release(monitor->render);
  331. audio_resampler_destroy(monitor->resampler);
  332. circlebuf_free(&monitor->delay_buffer);
  333. da_free(monitor->buf);
  334. }
  335. extern bool devices_match(const char *id1, const char *id2);
  336. static bool audio_monitor_init(struct audio_monitor *monitor,
  337. obs_source_t *source)
  338. {
  339. monitor->source = source;
  340. const char *id = obs->audio.monitoring_device_id;
  341. if (!id) {
  342. warn("%s: No device ID set", __FUNCTION__);
  343. return false;
  344. }
  345. if (source->info.output_flags & OBS_SOURCE_DO_NOT_SELF_MONITOR) {
  346. obs_data_t *s = obs_source_get_settings(source);
  347. const char *s_dev_id = obs_data_get_string(s, "device_id");
  348. bool match = devices_match(s_dev_id, id);
  349. obs_data_release(s);
  350. if (match) {
  351. monitor->ignore = true;
  352. return true;
  353. }
  354. }
  355. InitializeSRWLock(&monitor->playback_mutex);
  356. return audio_monitor_init_wasapi(monitor);
  357. }
  358. static void audio_monitor_init_final(struct audio_monitor *monitor)
  359. {
  360. if (monitor->ignore)
  361. return;
  362. monitor->source_has_video =
  363. (monitor->source->info.output_flags & OBS_SOURCE_VIDEO) != 0;
  364. obs_source_add_audio_capture_callback(monitor->source,
  365. on_audio_playback, monitor);
  366. }
  367. struct audio_monitor *audio_monitor_create(obs_source_t *source)
  368. {
  369. struct audio_monitor monitor = {0};
  370. struct audio_monitor *out;
  371. if (!audio_monitor_init(&monitor, source)) {
  372. goto fail;
  373. }
  374. out = bmemdup(&monitor, sizeof(monitor));
  375. pthread_mutex_lock(&obs->audio.monitoring_mutex);
  376. da_push_back(obs->audio.monitors, &out);
  377. pthread_mutex_unlock(&obs->audio.monitoring_mutex);
  378. audio_monitor_init_final(out);
  379. return out;
  380. fail:
  381. audio_monitor_free(&monitor);
  382. return NULL;
  383. }
  384. void audio_monitor_reset(struct audio_monitor *monitor)
  385. {
  386. struct audio_monitor new_monitor = {0};
  387. bool success;
  388. AcquireSRWLockExclusive(&monitor->playback_mutex);
  389. success = audio_monitor_init(&new_monitor, monitor->source);
  390. ReleaseSRWLockExclusive(&monitor->playback_mutex);
  391. if (success) {
  392. obs_source_t *source = monitor->source;
  393. audio_monitor_free(monitor);
  394. *monitor = new_monitor;
  395. audio_monitor_init_final(monitor);
  396. } else {
  397. audio_monitor_free(&new_monitor);
  398. }
  399. }
  400. void audio_monitor_destroy(struct audio_monitor *monitor)
  401. {
  402. if (monitor) {
  403. audio_monitor_free(monitor);
  404. pthread_mutex_lock(&obs->audio.monitoring_mutex);
  405. da_erase_item(obs->audio.monitors, &monitor);
  406. pthread_mutex_unlock(&obs->audio.monitoring_mutex);
  407. bfree(monitor);
  408. }
  409. }