expander-filter.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440
  1. #include <stdint.h>
  2. #include <inttypes.h>
  3. #include <math.h>
  4. #include <obs-module.h>
  5. #include <media-io/audio-math.h>
  6. #include <util/platform.h>
  7. #include <util/circlebuf.h>
  8. #include <util/threading.h>
  9. /* -------------------------------------------------------- */
  10. #define do_log(level, format, ...) \
  11. blog(level, "[expander: '%s'] " format, \
  12. obs_source_get_name(cd->context), ##__VA_ARGS__)
  13. #define warn(format, ...) do_log(LOG_WARNING, format, ##__VA_ARGS__)
  14. #define info(format, ...) do_log(LOG_INFO, format, ##__VA_ARGS__)
  15. #ifdef _DEBUG
  16. #define debug(format, ...) do_log(LOG_DEBUG, format, ##__VA_ARGS__)
  17. #else
  18. #define debug(format, ...)
  19. #endif
  20. /* -------------------------------------------------------- */
  21. /* clang-format off */
  22. #define S_RATIO "ratio"
  23. #define S_THRESHOLD "threshold"
  24. #define S_ATTACK_TIME "attack_time"
  25. #define S_RELEASE_TIME "release_time"
  26. #define S_OUTPUT_GAIN "output_gain"
  27. #define S_DETECTOR "detector"
  28. #define S_PRESETS "presets"
  29. #define MT_ obs_module_text
  30. #define TEXT_RATIO MT_("expander.Ratio")
  31. #define TEXT_THRESHOLD MT_("expander.Threshold")
  32. #define TEXT_ATTACK_TIME MT_("expander.AttackTime")
  33. #define TEXT_RELEASE_TIME MT_("expander.ReleaseTime")
  34. #define TEXT_OUTPUT_GAIN MT_("expander.OutputGain")
  35. #define TEXT_DETECTOR MT_("expander.Detector")
  36. #define TEXT_PEAK MT_("expander.Peak")
  37. #define TEXT_RMS MT_("expander.RMS")
  38. #define TEXT_NONE MT_("expander.None")
  39. #define TEXT_PRESETS MT_("expander.Presets")
  40. #define TEXT_PRESETS_EXP MT_("expander.Presets.Expander")
  41. #define TEXT_PRESETS_GATE MT_("expander.Presets.Gate")
  42. #define MIN_RATIO 1.0f
  43. #define MAX_RATIO 20.0f
  44. #define MIN_THRESHOLD_DB -60.0f
  45. #define MAX_THRESHOLD_DB 0.0f
  46. #define MIN_OUTPUT_GAIN_DB -32.0f
  47. #define MAX_OUTPUT_GAIN_DB 32.0f
  48. #define MIN_ATK_RLS_MS 1
  49. #define MAX_RLS_MS 1000
  50. #define MAX_ATK_MS 100
  51. #define DEFAULT_AUDIO_BUF_MS 10
  52. #define MS_IN_S 1000
  53. #define MS_IN_S_F ((float)MS_IN_S)
  54. /* clang-format on */
  55. /* -------------------------------------------------------- */
  56. struct expander_data {
  57. obs_source_t *context;
  58. float *envelope_buf[MAX_AUDIO_CHANNELS];
  59. size_t envelope_buf_len;
  60. float ratio;
  61. float threshold;
  62. float attack_gain;
  63. float release_gain;
  64. float output_gain;
  65. size_t num_channels;
  66. size_t sample_rate;
  67. float envelope[MAX_AUDIO_CHANNELS];
  68. float slope;
  69. int detector;
  70. float runave[MAX_AUDIO_CHANNELS];
  71. bool is_gate;
  72. float *runaverage[MAX_AUDIO_CHANNELS];
  73. size_t runaverage_len;
  74. float *gaindB[MAX_AUDIO_CHANNELS];
  75. size_t gaindB_len;
  76. float gaindB_buf[MAX_AUDIO_CHANNELS];
  77. float *env_in;
  78. size_t env_in_len;
  79. };
  80. enum {
  81. RMS_DETECT,
  82. RMS_STILLWELL_DETECT,
  83. PEAK_DETECT,
  84. NO_DETECT,
  85. };
  86. /* -------------------------------------------------------- */
  87. static void resize_env_buffer(struct expander_data *cd, size_t len)
  88. {
  89. cd->envelope_buf_len = len;
  90. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++)
  91. cd->envelope_buf[i] =
  92. brealloc(cd->envelope_buf[i],
  93. cd->envelope_buf_len * sizeof(float));
  94. }
  95. static void resize_runaverage_buffer(struct expander_data *cd, size_t len)
  96. {
  97. cd->runaverage_len = len;
  98. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++)
  99. cd->runaverage[i] = brealloc(
  100. cd->runaverage[i], cd->runaverage_len * sizeof(float));
  101. }
  102. static void resize_env_in_buffer(struct expander_data *cd, size_t len)
  103. {
  104. cd->env_in_len = len;
  105. cd->env_in = brealloc(cd->env_in, cd->env_in_len * sizeof(float));
  106. }
  107. static void resize_gaindB_buffer(struct expander_data *cd, size_t len)
  108. {
  109. cd->gaindB_len = len;
  110. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++)
  111. cd->gaindB[i] =
  112. brealloc(cd->gaindB[i], cd->gaindB_len * sizeof(float));
  113. }
  114. static inline float gain_coefficient(uint32_t sample_rate, float time)
  115. {
  116. return expf(-1.0f / (sample_rate * time));
  117. }
  118. static const char *expander_name(void *unused)
  119. {
  120. UNUSED_PARAMETER(unused);
  121. return obs_module_text("Expander");
  122. }
  123. static void expander_defaults(obs_data_t *s)
  124. {
  125. const char *presets = obs_data_get_string(s, S_PRESETS);
  126. bool is_expander_preset = true;
  127. if (strcmp(presets, "gate") == 0)
  128. is_expander_preset = false;
  129. obs_data_set_default_string(s, S_PRESETS,
  130. is_expander_preset ? "expander" : "gate");
  131. obs_data_set_default_double(s, S_RATIO,
  132. is_expander_preset ? 2.0 : 10.0);
  133. obs_data_set_default_double(s, S_THRESHOLD, -40.0f);
  134. obs_data_set_default_int(s, S_ATTACK_TIME, 10);
  135. obs_data_set_default_int(s, S_RELEASE_TIME,
  136. is_expander_preset ? 50 : 125);
  137. obs_data_set_default_double(s, S_OUTPUT_GAIN, 0.0);
  138. obs_data_set_default_string(s, S_DETECTOR, "RMS");
  139. }
  140. static void expander_update(void *data, obs_data_t *s)
  141. {
  142. struct expander_data *cd = data;
  143. const char *presets = obs_data_get_string(s, S_PRESETS);
  144. if (strcmp(presets, "expander") == 0 && cd->is_gate) {
  145. obs_data_clear(s);
  146. obs_data_set_string(s, S_PRESETS, "expander");
  147. expander_defaults(s);
  148. cd->is_gate = false;
  149. }
  150. if (strcmp(presets, "gate") == 0 && !cd->is_gate) {
  151. obs_data_clear(s);
  152. obs_data_set_string(s, S_PRESETS, "gate");
  153. expander_defaults(s);
  154. cd->is_gate = true;
  155. }
  156. const uint32_t sample_rate =
  157. audio_output_get_sample_rate(obs_get_audio());
  158. const size_t num_channels = audio_output_get_channels(obs_get_audio());
  159. const float attack_time_ms = (float)obs_data_get_int(s, S_ATTACK_TIME);
  160. const float release_time_ms =
  161. (float)obs_data_get_int(s, S_RELEASE_TIME);
  162. const float output_gain_db =
  163. (float)obs_data_get_double(s, S_OUTPUT_GAIN);
  164. cd->ratio = (float)obs_data_get_double(s, S_RATIO);
  165. cd->threshold = (float)obs_data_get_double(s, S_THRESHOLD);
  166. cd->attack_gain =
  167. gain_coefficient(sample_rate, attack_time_ms / MS_IN_S_F);
  168. cd->release_gain =
  169. gain_coefficient(sample_rate, release_time_ms / MS_IN_S_F);
  170. cd->output_gain = db_to_mul(output_gain_db);
  171. cd->num_channels = num_channels;
  172. cd->sample_rate = sample_rate;
  173. cd->slope = 1.0f - cd->ratio;
  174. const char *detect_mode = obs_data_get_string(s, S_DETECTOR);
  175. if (strcmp(detect_mode, "RMS") == 0)
  176. cd->detector = RMS_DETECT;
  177. if (strcmp(detect_mode, "peak") == 0)
  178. cd->detector = PEAK_DETECT;
  179. size_t sample_len = sample_rate * DEFAULT_AUDIO_BUF_MS / MS_IN_S;
  180. if (cd->envelope_buf_len == 0)
  181. resize_env_buffer(cd, sample_len);
  182. if (cd->runaverage_len == 0)
  183. resize_runaverage_buffer(cd, sample_len);
  184. if (cd->env_in_len == 0)
  185. resize_env_in_buffer(cd, sample_len);
  186. if (cd->gaindB_len == 0)
  187. resize_gaindB_buffer(cd, sample_len);
  188. }
  189. static void *expander_create(obs_data_t *settings, obs_source_t *filter)
  190. {
  191. struct expander_data *cd = bzalloc(sizeof(struct expander_data));
  192. cd->context = filter;
  193. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++) {
  194. cd->runave[i] = 0;
  195. cd->envelope[i] = 0;
  196. cd->gaindB_buf[i] = 0;
  197. }
  198. cd->is_gate = false;
  199. const char *presets = obs_data_get_string(settings, S_PRESETS);
  200. if (strcmp(presets, "gate") == 0)
  201. cd->is_gate = true;
  202. expander_update(cd, settings);
  203. return cd;
  204. }
  205. static void expander_destroy(void *data)
  206. {
  207. struct expander_data *cd = data;
  208. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++) {
  209. bfree(cd->envelope_buf[i]);
  210. bfree(cd->runaverage[i]);
  211. bfree(cd->gaindB[i]);
  212. }
  213. bfree(cd->env_in);
  214. bfree(cd);
  215. }
  216. // detection stage
  217. static void analyze_envelope(struct expander_data *cd, float **samples,
  218. const uint32_t num_samples)
  219. {
  220. if (cd->envelope_buf_len < num_samples)
  221. resize_env_buffer(cd, num_samples);
  222. if (cd->runaverage_len < num_samples)
  223. resize_runaverage_buffer(cd, num_samples);
  224. if (cd->env_in_len < num_samples)
  225. resize_env_in_buffer(cd, num_samples);
  226. // 10 ms RMS window
  227. const float rmscoef = exp2f(-100.0f / cd->sample_rate);
  228. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++) {
  229. memset(cd->envelope_buf[i], 0,
  230. num_samples * sizeof(cd->envelope_buf[i][0]));
  231. memset(cd->runaverage[i], 0,
  232. num_samples * sizeof(cd->runaverage[i][0]));
  233. }
  234. memset(cd->env_in, 0, num_samples * sizeof(cd->env_in[0]));
  235. for (size_t chan = 0; chan < cd->num_channels; ++chan) {
  236. if (!samples[chan])
  237. continue;
  238. float *envelope_buf = cd->envelope_buf[chan];
  239. float *runave = cd->runaverage[chan];
  240. float *env_in = cd->env_in;
  241. if (cd->detector == RMS_DETECT) {
  242. runave[0] =
  243. rmscoef * cd->runave[chan] +
  244. (1 - rmscoef) * powf(samples[chan][0], 2.0f);
  245. env_in[0] = sqrtf(fmaxf(runave[0], 0));
  246. for (uint32_t i = 1; i < num_samples; ++i) {
  247. runave[i] =
  248. rmscoef * runave[i - 1] +
  249. (1 - rmscoef) *
  250. powf(samples[chan][i], 2.0f);
  251. env_in[i] = sqrtf(runave[i]);
  252. }
  253. } else if (cd->detector == PEAK_DETECT) {
  254. for (uint32_t i = 0; i < num_samples; ++i) {
  255. runave[i] = powf(samples[chan][i], 2);
  256. env_in[i] = fabsf(samples[chan][i]);
  257. }
  258. }
  259. cd->runave[chan] = runave[num_samples - 1];
  260. for (uint32_t i = 0; i < num_samples; ++i)
  261. envelope_buf[i] = fmaxf(envelope_buf[i], env_in[i]);
  262. cd->envelope[chan] = cd->envelope_buf[chan][num_samples - 1];
  263. }
  264. }
  265. // gain stage and ballistics in dB domain
  266. static inline void process_expansion(struct expander_data *cd, float **samples,
  267. uint32_t num_samples)
  268. {
  269. const float attack_gain = cd->attack_gain;
  270. const float release_gain = cd->release_gain;
  271. if (cd->gaindB_len < num_samples)
  272. resize_gaindB_buffer(cd, num_samples);
  273. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++)
  274. memset(cd->gaindB[i], 0,
  275. num_samples * sizeof(cd->gaindB[i][0]));
  276. for (size_t chan = 0; chan < cd->num_channels; chan++) {
  277. for (size_t i = 0; i < num_samples; ++i) {
  278. // gain stage of expansion
  279. float env_db = mul_to_db(cd->envelope_buf[chan][i]);
  280. float gain =
  281. cd->threshold - env_db > 0.0f
  282. ? fmaxf(cd->slope * (cd->threshold -
  283. env_db),
  284. -60.0f)
  285. : 0.0f;
  286. // ballistics (attack/release)
  287. if (i > 0) {
  288. if (gain > cd->gaindB[chan][i - 1])
  289. cd->gaindB[chan][i] =
  290. attack_gain *
  291. cd->gaindB[chan][i - 1] +
  292. (1.0f - attack_gain) * gain;
  293. else
  294. cd->gaindB[chan][i] =
  295. release_gain *
  296. cd->gaindB[chan][i - 1] +
  297. (1.0f - release_gain) * gain;
  298. } else {
  299. if (gain > cd->gaindB_buf[chan])
  300. cd->gaindB[chan][i] =
  301. attack_gain *
  302. cd->gaindB_buf[chan] +
  303. (1.0f - attack_gain) * gain;
  304. else
  305. cd->gaindB[chan][i] =
  306. release_gain *
  307. cd->gaindB_buf[chan] +
  308. (1.0f - release_gain) * gain;
  309. }
  310. gain = db_to_mul(fminf(0, cd->gaindB[chan][i]));
  311. if (samples[chan])
  312. samples[chan][i] *= gain * cd->output_gain;
  313. }
  314. cd->gaindB_buf[chan] = cd->gaindB[chan][num_samples - 1];
  315. }
  316. }
  317. static struct obs_audio_data *
  318. expander_filter_audio(void *data, struct obs_audio_data *audio)
  319. {
  320. struct expander_data *cd = data;
  321. const uint32_t num_samples = audio->frames;
  322. if (num_samples == 0)
  323. return audio;
  324. float **samples = (float **)audio->data;
  325. analyze_envelope(cd, samples, num_samples);
  326. process_expansion(cd, samples, num_samples);
  327. return audio;
  328. }
  329. static bool presets_changed(obs_properties_t *props, obs_property_t *prop,
  330. obs_data_t *settings)
  331. {
  332. UNUSED_PARAMETER(props);
  333. UNUSED_PARAMETER(prop);
  334. UNUSED_PARAMETER(settings);
  335. return true;
  336. }
  337. static obs_properties_t *expander_properties(void *data)
  338. {
  339. obs_properties_t *props = obs_properties_create();
  340. obs_property_t *p;
  341. obs_property_t *presets = obs_properties_add_list(
  342. props, S_PRESETS, TEXT_PRESETS, OBS_COMBO_TYPE_LIST,
  343. OBS_COMBO_FORMAT_STRING);
  344. obs_property_list_add_string(presets, TEXT_PRESETS_EXP, "expander");
  345. obs_property_list_add_string(presets, TEXT_PRESETS_GATE, "gate");
  346. obs_property_set_modified_callback(presets, presets_changed);
  347. p = obs_properties_add_float_slider(props, S_RATIO, TEXT_RATIO,
  348. MIN_RATIO, MAX_RATIO, 0.1);
  349. obs_property_float_set_suffix(p, ":1");
  350. p = obs_properties_add_float_slider(props, S_THRESHOLD, TEXT_THRESHOLD,
  351. MIN_THRESHOLD_DB, MAX_THRESHOLD_DB,
  352. 0.1);
  353. obs_property_float_set_suffix(p, " dB");
  354. p = obs_properties_add_int_slider(props, S_ATTACK_TIME,
  355. TEXT_ATTACK_TIME, MIN_ATK_RLS_MS,
  356. MAX_ATK_MS, 1);
  357. obs_property_int_set_suffix(p, " ms");
  358. p = obs_properties_add_int_slider(props, S_RELEASE_TIME,
  359. TEXT_RELEASE_TIME, MIN_ATK_RLS_MS,
  360. MAX_RLS_MS, 1);
  361. obs_property_int_set_suffix(p, " ms");
  362. p = obs_properties_add_float_slider(props, S_OUTPUT_GAIN,
  363. TEXT_OUTPUT_GAIN,
  364. MIN_OUTPUT_GAIN_DB,
  365. MAX_OUTPUT_GAIN_DB, 0.1);
  366. obs_property_float_set_suffix(p, " dB");
  367. obs_property_t *detect = obs_properties_add_list(
  368. props, S_DETECTOR, TEXT_DETECTOR, OBS_COMBO_TYPE_LIST,
  369. OBS_COMBO_FORMAT_STRING);
  370. obs_property_list_add_string(detect, TEXT_RMS, "RMS");
  371. obs_property_list_add_string(detect, TEXT_PEAK, "peak");
  372. UNUSED_PARAMETER(data);
  373. return props;
  374. }
  375. struct obs_source_info expander_filter = {
  376. .id = "expander_filter",
  377. .type = OBS_SOURCE_TYPE_FILTER,
  378. .output_flags = OBS_SOURCE_AUDIO,
  379. .get_name = expander_name,
  380. .create = expander_create,
  381. .destroy = expander_destroy,
  382. .update = expander_update,
  383. .filter_audio = expander_filter_audio,
  384. .get_defaults = expander_defaults,
  385. .get_properties = expander_properties,
  386. };