expander-filter.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494
  1. #include <stdint.h>
  2. #include <inttypes.h>
  3. #include <math.h>
  4. #include <obs-module.h>
  5. #include <media-io/audio-math.h>
  6. #include <util/platform.h>
  7. #include <util/deque.h>
  8. #include <util/threading.h>
  9. /* -------------------------------------------------------- */
  10. #define do_log(level, format, ...) \
  11. blog(level, "[expander/gate/upward compressor: '%s'] " format, obs_source_get_name(cd->context), ##__VA_ARGS__)
  12. #define warn(format, ...) do_log(LOG_WARNING, format, ##__VA_ARGS__)
  13. #define info(format, ...) do_log(LOG_INFO, format, ##__VA_ARGS__)
  14. #ifdef _DEBUG
  15. #define debug(format, ...) do_log(LOG_DEBUG, format, ##__VA_ARGS__)
  16. #else
  17. #define debug(format, ...)
  18. #endif
  19. /* -------------------------------------------------------- */
  20. /* clang-format off */
  21. #define S_RATIO "ratio"
  22. #define S_FILTER_THRESHOLD "threshold"
  23. #define S_ATTACK_TIME "attack_time"
  24. #define S_RELEASE_TIME "release_time"
  25. #define S_OUTPUT_GAIN "output_gain"
  26. #define S_DETECTOR "detector"
  27. #define S_PRESETS "presets"
  28. #define S_KNEE "knee_width"
  29. #define MT_ obs_module_text
  30. #define TEXT_RATIO MT_("Expander.Ratio")
  31. #define TEXT_THRESHOLD MT_("Expander.Threshold")
  32. #define TEXT_ATTACK_TIME MT_("Expander.AttackTime")
  33. #define TEXT_RELEASE_TIME MT_("Expander.ReleaseTime")
  34. #define TEXT_OUTPUT_GAIN MT_("Expander.OutputGain")
  35. #define TEXT_DETECTOR MT_("Expander.Detector")
  36. #define TEXT_PEAK MT_("Expander.Peak")
  37. #define TEXT_RMS MT_("Expander.RMS")
  38. #define TEXT_PRESETS MT_("Expander.Presets")
  39. #define TEXT_PRESETS_EXP MT_("Expander.Presets.Expander")
  40. #define TEXT_PRESETS_GATE MT_("Expander.Presets.Gate")
  41. #define TEXT_KNEE MT_("Expander.Knee.Width")
  42. #define MIN_RATIO 1.0f
  43. #define MAX_RATIO 20.0f
  44. #define MIN_RATIO_UPW 0.0f
  45. #define MAX_RATIO_UPW 1.0f
  46. #define MIN_THRESHOLD_DB -60.0f
  47. #define MAX_THRESHOLD_DB 0.0f
  48. #define MIN_OUTPUT_GAIN_DB -32.0f
  49. #define MAX_OUTPUT_GAIN_DB 32.0f
  50. #define MIN_ATK_RLS_MS 1
  51. #define MAX_RLS_MS 1000
  52. #define MAX_ATK_MS 100
  53. #define DEFAULT_AUDIO_BUF_MS 10
  54. #define MS_IN_S 1000
  55. #define MS_IN_S_F ((float)MS_IN_S)
  56. /* clang-format on */
  57. /* -------------------------------------------------------- */
  58. struct expander_data {
  59. obs_source_t *context;
  60. float *envelope_buf[MAX_AUDIO_CHANNELS];
  61. size_t envelope_buf_len;
  62. float ratio;
  63. float threshold;
  64. float attack_gain;
  65. float release_gain;
  66. float output_gain;
  67. size_t num_channels;
  68. size_t sample_rate;
  69. float envelope[MAX_AUDIO_CHANNELS];
  70. float slope;
  71. int detector;
  72. float runave[MAX_AUDIO_CHANNELS];
  73. bool is_gate;
  74. float *runaverage[MAX_AUDIO_CHANNELS];
  75. size_t runaverage_len;
  76. float *gain_db[MAX_AUDIO_CHANNELS];
  77. size_t gain_db_len;
  78. float gain_db_buf[MAX_AUDIO_CHANNELS];
  79. float *env_in;
  80. size_t env_in_len;
  81. bool is_upwcomp;
  82. float knee;
  83. };
  84. enum {
  85. RMS_DETECT,
  86. RMS_STILLWELL_DETECT,
  87. PEAK_DETECT,
  88. NO_DETECT,
  89. };
  90. /* -------------------------------------------------------- */
  91. static void resize_env_buffer(struct expander_data *cd, size_t len)
  92. {
  93. cd->envelope_buf_len = len;
  94. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++)
  95. cd->envelope_buf[i] = brealloc(cd->envelope_buf[i], cd->envelope_buf_len * sizeof(float));
  96. }
  97. static void resize_runaverage_buffer(struct expander_data *cd, size_t len)
  98. {
  99. cd->runaverage_len = len;
  100. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++)
  101. cd->runaverage[i] = brealloc(cd->runaverage[i], cd->runaverage_len * sizeof(float));
  102. }
  103. static void resize_env_in_buffer(struct expander_data *cd, size_t len)
  104. {
  105. cd->env_in_len = len;
  106. cd->env_in = brealloc(cd->env_in, cd->env_in_len * sizeof(float));
  107. }
  108. static void resize_gain_db_buffer(struct expander_data *cd, size_t len)
  109. {
  110. cd->gain_db_len = len;
  111. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++)
  112. cd->gain_db[i] = brealloc(cd->gain_db[i], cd->gain_db_len * sizeof(float));
  113. }
  114. static inline float gain_coefficient(uint32_t sample_rate, float time)
  115. {
  116. return expf(-1.0f / (sample_rate * time));
  117. }
  118. static const char *expander_name(void *unused)
  119. {
  120. UNUSED_PARAMETER(unused);
  121. return obs_module_text("Expander");
  122. }
  123. static const char *upward_compressor_name(void *unused)
  124. {
  125. UNUSED_PARAMETER(unused);
  126. return obs_module_text("Upward.Compressor");
  127. }
  128. static void expander_defaults(obs_data_t *s)
  129. {
  130. const char *presets = obs_data_get_string(s, S_PRESETS);
  131. bool is_expander_preset = true;
  132. if (strcmp(presets, "gate") == 0)
  133. is_expander_preset = false;
  134. obs_data_set_default_string(s, S_PRESETS, is_expander_preset ? "expander" : "gate");
  135. obs_data_set_default_double(s, S_RATIO, is_expander_preset ? 2.0 : 10.0);
  136. obs_data_set_default_double(s, S_FILTER_THRESHOLD, -40.0f);
  137. obs_data_set_default_int(s, S_ATTACK_TIME, 10);
  138. obs_data_set_default_int(s, S_RELEASE_TIME, is_expander_preset ? 50 : 125);
  139. obs_data_set_default_double(s, S_OUTPUT_GAIN, 0.0);
  140. obs_data_set_default_string(s, S_DETECTOR, "RMS");
  141. }
  142. static void upward_compressor_defaults(obs_data_t *s)
  143. {
  144. obs_data_set_default_double(s, S_RATIO, 0.5);
  145. obs_data_set_default_double(s, S_FILTER_THRESHOLD, -20.0f);
  146. obs_data_set_default_int(s, S_ATTACK_TIME, 10);
  147. obs_data_set_default_int(s, S_RELEASE_TIME, 50);
  148. obs_data_set_default_double(s, S_OUTPUT_GAIN, 0.0);
  149. obs_data_set_default_string(s, S_DETECTOR, "RMS");
  150. obs_data_set_default_int(s, S_KNEE, 10);
  151. }
  152. static void expander_update(void *data, obs_data_t *s)
  153. {
  154. struct expander_data *cd = data;
  155. if (!cd->is_upwcomp) {
  156. const char *presets = obs_data_get_string(s, S_PRESETS);
  157. if (strcmp(presets, "expander") == 0 && cd->is_gate) {
  158. obs_data_clear(s);
  159. obs_data_set_string(s, S_PRESETS, "expander");
  160. expander_defaults(s);
  161. cd->is_gate = false;
  162. }
  163. if (strcmp(presets, "gate") == 0 && !cd->is_gate) {
  164. obs_data_clear(s);
  165. obs_data_set_string(s, S_PRESETS, "gate");
  166. expander_defaults(s);
  167. cd->is_gate = true;
  168. }
  169. }
  170. const uint32_t sample_rate = audio_output_get_sample_rate(obs_get_audio());
  171. const size_t num_channels = audio_output_get_channels(obs_get_audio());
  172. const float attack_time_ms = (float)obs_data_get_int(s, S_ATTACK_TIME);
  173. const float release_time_ms = (float)obs_data_get_int(s, S_RELEASE_TIME);
  174. const float output_gain_db = (float)obs_data_get_double(s, S_OUTPUT_GAIN);
  175. const float knee = cd->is_upwcomp ? (float)obs_data_get_int(s, S_KNEE) : 0.0f;
  176. cd->ratio = (float)obs_data_get_double(s, S_RATIO);
  177. cd->threshold = (float)obs_data_get_double(s, S_FILTER_THRESHOLD);
  178. cd->attack_gain = gain_coefficient(sample_rate, attack_time_ms / MS_IN_S_F);
  179. cd->release_gain = gain_coefficient(sample_rate, release_time_ms / MS_IN_S_F);
  180. cd->output_gain = db_to_mul(output_gain_db);
  181. cd->num_channels = num_channels;
  182. cd->sample_rate = sample_rate;
  183. cd->slope = 1.0f - cd->ratio;
  184. cd->knee = knee;
  185. const char *detect_mode = obs_data_get_string(s, S_DETECTOR);
  186. if (strcmp(detect_mode, "RMS") == 0)
  187. cd->detector = RMS_DETECT;
  188. if (strcmp(detect_mode, "peak") == 0)
  189. cd->detector = PEAK_DETECT;
  190. size_t sample_len = sample_rate * DEFAULT_AUDIO_BUF_MS / MS_IN_S;
  191. if (cd->envelope_buf_len == 0)
  192. resize_env_buffer(cd, sample_len);
  193. if (cd->runaverage_len == 0)
  194. resize_runaverage_buffer(cd, sample_len);
  195. if (cd->env_in_len == 0)
  196. resize_env_in_buffer(cd, sample_len);
  197. if (cd->gain_db_len == 0)
  198. resize_gain_db_buffer(cd, sample_len);
  199. }
  200. static void *compressor_expander_create(obs_data_t *settings, obs_source_t *filter, bool is_compressor)
  201. {
  202. struct expander_data *cd = bzalloc(sizeof(struct expander_data));
  203. cd->context = filter;
  204. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++) {
  205. cd->runave[i] = 0;
  206. cd->envelope[i] = 0;
  207. cd->gain_db_buf[i] = 0;
  208. }
  209. cd->is_gate = false;
  210. const char *presets = obs_data_get_string(settings, S_PRESETS);
  211. if (strcmp(presets, "gate") == 0)
  212. cd->is_gate = true;
  213. cd->is_upwcomp = is_compressor;
  214. expander_update(cd, settings);
  215. return cd;
  216. }
  217. static void *expander_create(obs_data_t *settings, obs_source_t *filter)
  218. {
  219. return compressor_expander_create(settings, filter, false);
  220. }
  221. static void *upward_compressor_create(obs_data_t *settings, obs_source_t *filter)
  222. {
  223. return compressor_expander_create(settings, filter, true);
  224. }
  225. static void expander_destroy(void *data)
  226. {
  227. struct expander_data *cd = data;
  228. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++) {
  229. bfree(cd->envelope_buf[i]);
  230. bfree(cd->runaverage[i]);
  231. bfree(cd->gain_db[i]);
  232. }
  233. bfree(cd->env_in);
  234. bfree(cd);
  235. }
  236. // detection stage
  237. static void analyze_envelope(struct expander_data *cd, float **samples, const uint32_t num_samples)
  238. {
  239. if (cd->envelope_buf_len < num_samples)
  240. resize_env_buffer(cd, num_samples);
  241. if (cd->runaverage_len < num_samples)
  242. resize_runaverage_buffer(cd, num_samples);
  243. if (cd->env_in_len < num_samples)
  244. resize_env_in_buffer(cd, num_samples);
  245. // 10 ms RMS window
  246. const float rmscoef = exp2f(-100.0f / cd->sample_rate);
  247. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++) {
  248. memset(cd->envelope_buf[i], 0, num_samples * sizeof(cd->envelope_buf[i][0]));
  249. memset(cd->runaverage[i], 0, num_samples * sizeof(cd->runaverage[i][0]));
  250. }
  251. memset(cd->env_in, 0, num_samples * sizeof(cd->env_in[0]));
  252. for (size_t chan = 0; chan < cd->num_channels; ++chan) {
  253. if (!samples[chan])
  254. continue;
  255. float *envelope_buf = cd->envelope_buf[chan];
  256. float *runave = cd->runaverage[chan];
  257. float *env_in = cd->env_in;
  258. if (cd->detector == RMS_DETECT) {
  259. runave[0] = rmscoef * cd->runave[chan] + (1 - rmscoef) * powf(samples[chan][0], 2.0f);
  260. env_in[0] = sqrtf(fmaxf(runave[0], 0));
  261. for (uint32_t i = 1; i < num_samples; ++i) {
  262. runave[i] = rmscoef * runave[i - 1] + (1 - rmscoef) * powf(samples[chan][i], 2.0f);
  263. env_in[i] = sqrtf(runave[i]);
  264. }
  265. } else if (cd->detector == PEAK_DETECT) {
  266. for (uint32_t i = 0; i < num_samples; ++i) {
  267. runave[i] = powf(samples[chan][i], 2);
  268. env_in[i] = fabsf(samples[chan][i]);
  269. }
  270. }
  271. cd->runave[chan] = runave[num_samples - 1];
  272. for (uint32_t i = 0; i < num_samples; ++i)
  273. envelope_buf[i] = fmaxf(envelope_buf[i], env_in[i]);
  274. cd->envelope[chan] = cd->envelope_buf[chan][num_samples - 1];
  275. }
  276. }
  277. static inline void process_sample(size_t idx, float *samples, float *env_buf, float *gain_db, bool is_upwcomp,
  278. float channel_gain, float threshold, float slope, float attack_gain,
  279. float inv_attack_gain, float release_gain, float inv_release_gain, float output_gain,
  280. float knee)
  281. {
  282. /* --------------------------------- */
  283. /* gain stage of expansion */
  284. float env_db = mul_to_db(env_buf[idx]);
  285. float diff = threshold - env_db;
  286. if (is_upwcomp && env_db <= (threshold - 60.0f) / 2)
  287. diff = env_db + 60.0f > 0 ? env_db + 60.0f : 0.0f;
  288. float gain = 0.0f;
  289. float prev_gain = 0.0f;
  290. // Note that the gain is always >= 0 for the upward compressor
  291. // but is always <=0 for the expander.
  292. if (is_upwcomp) {
  293. prev_gain = idx > 0 ? fmaxf(gain_db[idx - 1], 0) : fmaxf(channel_gain, 0);
  294. // gain above knee (included for clarity):
  295. if (env_db >= threshold + knee / 2)
  296. gain = 0.0f;
  297. // gain below knee:
  298. if (threshold - knee / 2 >= env_db)
  299. gain = slope * diff;
  300. // gain in knee:
  301. if (env_db > threshold - knee / 2 && threshold + knee / 2 > env_db)
  302. gain = slope * powf(diff + knee / 2, 2) / (2.0f * knee);
  303. } else {
  304. prev_gain = idx > 0 ? gain_db[idx - 1] : channel_gain;
  305. gain = diff > 0.0f ? fmaxf(slope * diff, -60.0f) : 0.0f;
  306. }
  307. /* --------------------------------- */
  308. /* ballistics (attack/release) */
  309. if (gain > prev_gain)
  310. gain_db[idx] = attack_gain * prev_gain + inv_attack_gain * gain;
  311. else
  312. gain_db[idx] = release_gain * prev_gain + inv_release_gain * gain;
  313. /* --------------------------------- */
  314. /* output */
  315. if (!is_upwcomp) {
  316. gain = db_to_mul(fminf(0, gain_db[idx]));
  317. } else {
  318. gain = db_to_mul(gain_db[idx]);
  319. }
  320. samples[idx] *= gain * output_gain;
  321. }
  322. // gain stage and ballistics in dB domain
  323. static inline void process_expansion(struct expander_data *cd, float **samples, uint32_t num_samples)
  324. {
  325. const float attack_gain = cd->attack_gain;
  326. const float release_gain = cd->release_gain;
  327. const float inv_attack_gain = 1.0f - attack_gain;
  328. const float inv_release_gain = 1.0f - release_gain;
  329. const float threshold = cd->threshold;
  330. const float slope = cd->slope;
  331. const float output_gain = cd->output_gain;
  332. const bool is_upwcomp = cd->is_upwcomp;
  333. const float knee = cd->knee;
  334. if (cd->gain_db_len < num_samples)
  335. resize_gain_db_buffer(cd, num_samples);
  336. for (size_t i = 0; i < cd->num_channels; i++)
  337. memset(cd->gain_db[i], 0, num_samples * sizeof(cd->gain_db[i][0]));
  338. for (size_t chan = 0; chan < cd->num_channels; chan++) {
  339. float *channel_samples = samples[chan];
  340. float *env_buf = cd->envelope_buf[chan];
  341. float *gain_db = cd->gain_db[chan];
  342. float channel_gain = cd->gain_db_buf[chan];
  343. for (size_t i = 0; i < num_samples; ++i) {
  344. process_sample(i, channel_samples, env_buf, gain_db, is_upwcomp, channel_gain, threshold, slope,
  345. attack_gain, inv_attack_gain, release_gain, inv_release_gain, output_gain, knee);
  346. }
  347. cd->gain_db_buf[chan] = gain_db[num_samples - 1];
  348. }
  349. }
  350. static struct obs_audio_data *expander_filter_audio(void *data, struct obs_audio_data *audio)
  351. {
  352. struct expander_data *cd = data;
  353. const uint32_t num_samples = audio->frames;
  354. if (num_samples == 0)
  355. return audio;
  356. float **samples = (float **)audio->data;
  357. analyze_envelope(cd, samples, num_samples);
  358. process_expansion(cd, samples, num_samples);
  359. return audio;
  360. }
  361. static bool presets_changed(obs_properties_t *props, obs_property_t *prop, obs_data_t *settings)
  362. {
  363. UNUSED_PARAMETER(props);
  364. UNUSED_PARAMETER(prop);
  365. UNUSED_PARAMETER(settings);
  366. return true;
  367. }
  368. static obs_properties_t *expander_properties(void *data)
  369. {
  370. struct expander_data *cd = data;
  371. obs_properties_t *props = obs_properties_create();
  372. obs_property_t *p;
  373. if (!cd->is_upwcomp) {
  374. obs_property_t *presets = obs_properties_add_list(props, S_PRESETS, TEXT_PRESETS, OBS_COMBO_TYPE_LIST,
  375. OBS_COMBO_FORMAT_STRING);
  376. obs_property_list_add_string(presets, TEXT_PRESETS_EXP, "expander");
  377. obs_property_list_add_string(presets, TEXT_PRESETS_GATE, "gate");
  378. obs_property_set_modified_callback(presets, presets_changed);
  379. }
  380. p = obs_properties_add_float_slider(props, S_RATIO, TEXT_RATIO, !cd->is_upwcomp ? MIN_RATIO : MIN_RATIO_UPW,
  381. !cd->is_upwcomp ? MAX_RATIO : MAX_RATIO_UPW, 0.1);
  382. obs_property_float_set_suffix(p, ":1");
  383. p = obs_properties_add_float_slider(props, S_FILTER_THRESHOLD, TEXT_THRESHOLD, MIN_THRESHOLD_DB,
  384. MAX_THRESHOLD_DB, 0.1);
  385. obs_property_float_set_suffix(p, " dB");
  386. p = obs_properties_add_int_slider(props, S_ATTACK_TIME, TEXT_ATTACK_TIME, MIN_ATK_RLS_MS, MAX_ATK_MS, 1);
  387. obs_property_int_set_suffix(p, " ms");
  388. p = obs_properties_add_int_slider(props, S_RELEASE_TIME, TEXT_RELEASE_TIME, MIN_ATK_RLS_MS, MAX_RLS_MS, 1);
  389. obs_property_int_set_suffix(p, " ms");
  390. p = obs_properties_add_float_slider(props, S_OUTPUT_GAIN, TEXT_OUTPUT_GAIN, MIN_OUTPUT_GAIN_DB,
  391. MAX_OUTPUT_GAIN_DB, 0.1);
  392. obs_property_float_set_suffix(p, " dB");
  393. if (!cd->is_upwcomp) {
  394. obs_property_t *detect = obs_properties_add_list(props, S_DETECTOR, TEXT_DETECTOR, OBS_COMBO_TYPE_LIST,
  395. OBS_COMBO_FORMAT_STRING);
  396. obs_property_list_add_string(detect, TEXT_RMS, "RMS");
  397. obs_property_list_add_string(detect, TEXT_PEAK, "peak");
  398. } else {
  399. p = obs_properties_add_int_slider(props, S_KNEE, TEXT_KNEE, 0, 20, 1);
  400. obs_property_float_set_suffix(p, " dB");
  401. }
  402. return props;
  403. }
  404. struct obs_source_info expander_filter = {
  405. .id = "expander_filter",
  406. .type = OBS_SOURCE_TYPE_FILTER,
  407. .output_flags = OBS_SOURCE_AUDIO,
  408. .get_name = expander_name,
  409. .create = expander_create,
  410. .destroy = expander_destroy,
  411. .update = expander_update,
  412. .filter_audio = expander_filter_audio,
  413. .get_defaults = expander_defaults,
  414. .get_properties = expander_properties,
  415. };
  416. struct obs_source_info upward_compressor_filter = {
  417. .id = "upward_compressor_filter",
  418. .type = OBS_SOURCE_TYPE_FILTER,
  419. .output_flags = OBS_SOURCE_AUDIO,
  420. .get_name = upward_compressor_name,
  421. .create = upward_compressor_create,
  422. .destroy = expander_destroy,
  423. .update = expander_update,
  424. .filter_audio = expander_filter_audio,
  425. .get_defaults = upward_compressor_defaults,
  426. .get_properties = expander_properties,
  427. };