expander-filter.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439
  1. #include <stdint.h>
  2. #include <inttypes.h>
  3. #include <math.h>
  4. #include <obs-module.h>
  5. #include <media-io/audio-math.h>
  6. #include <util/platform.h>
  7. #include <util/circlebuf.h>
  8. #include <util/threading.h>
  9. /* -------------------------------------------------------- */
  10. #define do_log(level, format, ...) \
  11. blog(level, "[expander: '%s'] " format, \
  12. obs_source_get_name(cd->context), ##__VA_ARGS__)
  13. #define warn(format, ...) do_log(LOG_WARNING, format, ##__VA_ARGS__)
  14. #define info(format, ...) do_log(LOG_INFO, format, ##__VA_ARGS__)
  15. #ifdef _DEBUG
  16. #define debug(format, ...) do_log(LOG_DEBUG, format, ##__VA_ARGS__)
  17. #else
  18. #define debug(format, ...)
  19. #endif
  20. /* -------------------------------------------------------- */
  21. /* clang-format off */
  22. #define S_RATIO "ratio"
  23. #define S_THRESHOLD "threshold"
  24. #define S_ATTACK_TIME "attack_time"
  25. #define S_RELEASE_TIME "release_time"
  26. #define S_OUTPUT_GAIN "output_gain"
  27. #define S_DETECTOR "detector"
  28. #define S_PRESETS "presets"
  29. #define MT_ obs_module_text
  30. #define TEXT_RATIO MT_("expander.Ratio")
  31. #define TEXT_THRESHOLD MT_("expander.Threshold")
  32. #define TEXT_ATTACK_TIME MT_("expander.AttackTime")
  33. #define TEXT_RELEASE_TIME MT_("expander.ReleaseTime")
  34. #define TEXT_OUTPUT_GAIN MT_("expander.OutputGain")
  35. #define TEXT_DETECTOR MT_("expander.Detector")
  36. #define TEXT_PEAK MT_("expander.Peak")
  37. #define TEXT_RMS MT_("expander.RMS")
  38. #define TEXT_NONE MT_("expander.None")
  39. #define TEXT_PRESETS MT_("expander.Presets")
  40. #define TEXT_PRESETS_EXP MT_("expander.Presets.Expander")
  41. #define TEXT_PRESETS_GATE MT_("expander.Presets.Gate")
  42. #define MIN_RATIO 1.0f
  43. #define MAX_RATIO 20.0f
  44. #define MIN_THRESHOLD_DB -60.0f
  45. #define MAX_THRESHOLD_DB 0.0f
  46. #define MIN_OUTPUT_GAIN_DB -32.0f
  47. #define MAX_OUTPUT_GAIN_DB 32.0f
  48. #define MIN_ATK_RLS_MS 1
  49. #define MAX_RLS_MS 1000
  50. #define MAX_ATK_MS 100
  51. #define DEFAULT_AUDIO_BUF_MS 10
  52. #define MS_IN_S 1000
  53. #define MS_IN_S_F ((float)MS_IN_S)
  54. /* clang-format on */
  55. /* -------------------------------------------------------- */
  56. struct expander_data {
  57. obs_source_t *context;
  58. float *envelope_buf[MAX_AUDIO_CHANNELS];
  59. size_t envelope_buf_len;
  60. float ratio;
  61. float threshold;
  62. float attack_gain;
  63. float release_gain;
  64. float output_gain;
  65. size_t num_channels;
  66. size_t sample_rate;
  67. float envelope[MAX_AUDIO_CHANNELS];
  68. float slope;
  69. int detector;
  70. float runave[MAX_AUDIO_CHANNELS];
  71. bool is_gate;
  72. float *runaverage[MAX_AUDIO_CHANNELS];
  73. size_t runaverage_len;
  74. float *gaindB[MAX_AUDIO_CHANNELS];
  75. size_t gaindB_len;
  76. float gaindB_buf[MAX_AUDIO_CHANNELS];
  77. float *env_in;
  78. size_t env_in_len;
  79. };
  80. enum { RMS_DETECT,
  81. RMS_STILLWELL_DETECT,
  82. PEAK_DETECT,
  83. NO_DETECT,
  84. };
  85. /* -------------------------------------------------------- */
  86. static void resize_env_buffer(struct expander_data *cd, size_t len)
  87. {
  88. cd->envelope_buf_len = len;
  89. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++)
  90. cd->envelope_buf[i] =
  91. brealloc(cd->envelope_buf[i],
  92. cd->envelope_buf_len * sizeof(float));
  93. }
  94. static void resize_runaverage_buffer(struct expander_data *cd, size_t len)
  95. {
  96. cd->runaverage_len = len;
  97. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++)
  98. cd->runaverage[i] = brealloc(
  99. cd->runaverage[i], cd->runaverage_len * sizeof(float));
  100. }
  101. static void resize_env_in_buffer(struct expander_data *cd, size_t len)
  102. {
  103. cd->env_in_len = len;
  104. cd->env_in = brealloc(cd->env_in, cd->env_in_len * sizeof(float));
  105. }
  106. static void resize_gaindB_buffer(struct expander_data *cd, size_t len)
  107. {
  108. cd->gaindB_len = len;
  109. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++)
  110. cd->gaindB[i] =
  111. brealloc(cd->gaindB[i], cd->gaindB_len * sizeof(float));
  112. }
  113. static inline float gain_coefficient(uint32_t sample_rate, float time)
  114. {
  115. return expf(-1.0f / (sample_rate * time));
  116. }
  117. static const char *expander_name(void *unused)
  118. {
  119. UNUSED_PARAMETER(unused);
  120. return obs_module_text("Expander");
  121. }
  122. static void expander_defaults(obs_data_t *s)
  123. {
  124. const char *presets = obs_data_get_string(s, S_PRESETS);
  125. bool is_expander_preset = true;
  126. if (strcmp(presets, "gate") == 0)
  127. is_expander_preset = false;
  128. obs_data_set_default_string(s, S_PRESETS,
  129. is_expander_preset ? "expander" : "gate");
  130. obs_data_set_default_double(s, S_RATIO,
  131. is_expander_preset ? 2.0 : 10.0);
  132. obs_data_set_default_double(s, S_THRESHOLD, -40.0f);
  133. obs_data_set_default_int(s, S_ATTACK_TIME, 10);
  134. obs_data_set_default_int(s, S_RELEASE_TIME,
  135. is_expander_preset ? 50 : 125);
  136. obs_data_set_default_double(s, S_OUTPUT_GAIN, 0.0);
  137. obs_data_set_default_string(s, S_DETECTOR, "RMS");
  138. }
  139. static void expander_update(void *data, obs_data_t *s)
  140. {
  141. struct expander_data *cd = data;
  142. const char *presets = obs_data_get_string(s, S_PRESETS);
  143. if (strcmp(presets, "expander") == 0 && cd->is_gate) {
  144. obs_data_clear(s);
  145. obs_data_set_string(s, S_PRESETS, "expander");
  146. expander_defaults(s);
  147. cd->is_gate = false;
  148. }
  149. if (strcmp(presets, "gate") == 0 && !cd->is_gate) {
  150. obs_data_clear(s);
  151. obs_data_set_string(s, S_PRESETS, "gate");
  152. expander_defaults(s);
  153. cd->is_gate = true;
  154. }
  155. const uint32_t sample_rate =
  156. audio_output_get_sample_rate(obs_get_audio());
  157. const size_t num_channels = audio_output_get_channels(obs_get_audio());
  158. const float attack_time_ms = (float)obs_data_get_int(s, S_ATTACK_TIME);
  159. const float release_time_ms =
  160. (float)obs_data_get_int(s, S_RELEASE_TIME);
  161. const float output_gain_db =
  162. (float)obs_data_get_double(s, S_OUTPUT_GAIN);
  163. cd->ratio = (float)obs_data_get_double(s, S_RATIO);
  164. cd->threshold = (float)obs_data_get_double(s, S_THRESHOLD);
  165. cd->attack_gain =
  166. gain_coefficient(sample_rate, attack_time_ms / MS_IN_S_F);
  167. cd->release_gain =
  168. gain_coefficient(sample_rate, release_time_ms / MS_IN_S_F);
  169. cd->output_gain = db_to_mul(output_gain_db);
  170. cd->num_channels = num_channels;
  171. cd->sample_rate = sample_rate;
  172. cd->slope = 1.0f - cd->ratio;
  173. const char *detect_mode = obs_data_get_string(s, S_DETECTOR);
  174. if (strcmp(detect_mode, "RMS") == 0)
  175. cd->detector = RMS_DETECT;
  176. if (strcmp(detect_mode, "peak") == 0)
  177. cd->detector = PEAK_DETECT;
  178. size_t sample_len = sample_rate * DEFAULT_AUDIO_BUF_MS / MS_IN_S;
  179. if (cd->envelope_buf_len == 0)
  180. resize_env_buffer(cd, sample_len);
  181. if (cd->runaverage_len == 0)
  182. resize_runaverage_buffer(cd, sample_len);
  183. if (cd->env_in_len == 0)
  184. resize_env_in_buffer(cd, sample_len);
  185. if (cd->gaindB_len == 0)
  186. resize_gaindB_buffer(cd, sample_len);
  187. }
  188. static void *expander_create(obs_data_t *settings, obs_source_t *filter)
  189. {
  190. struct expander_data *cd = bzalloc(sizeof(struct expander_data));
  191. cd->context = filter;
  192. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++) {
  193. cd->runave[i] = 0;
  194. cd->envelope[i] = 0;
  195. cd->gaindB_buf[i] = 0;
  196. }
  197. cd->is_gate = false;
  198. const char *presets = obs_data_get_string(settings, S_PRESETS);
  199. if (strcmp(presets, "gate") == 0)
  200. cd->is_gate = true;
  201. expander_update(cd, settings);
  202. return cd;
  203. }
  204. static void expander_destroy(void *data)
  205. {
  206. struct expander_data *cd = data;
  207. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++) {
  208. bfree(cd->envelope_buf[i]);
  209. bfree(cd->runaverage[i]);
  210. bfree(cd->gaindB[i]);
  211. }
  212. bfree(cd->env_in);
  213. bfree(cd);
  214. }
  215. // detection stage
  216. static void analyze_envelope(struct expander_data *cd, float **samples,
  217. const uint32_t num_samples)
  218. {
  219. if (cd->envelope_buf_len < num_samples)
  220. resize_env_buffer(cd, num_samples);
  221. if (cd->runaverage_len < num_samples)
  222. resize_runaverage_buffer(cd, num_samples);
  223. if (cd->env_in_len < num_samples)
  224. resize_env_in_buffer(cd, num_samples);
  225. // 10 ms RMS window
  226. const float rmscoef = exp2f(-100.0f / cd->sample_rate);
  227. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++) {
  228. memset(cd->envelope_buf[i], 0,
  229. num_samples * sizeof(cd->envelope_buf[i][0]));
  230. memset(cd->runaverage[i], 0,
  231. num_samples * sizeof(cd->runaverage[i][0]));
  232. }
  233. memset(cd->env_in, 0, num_samples * sizeof(cd->env_in[0]));
  234. for (size_t chan = 0; chan < cd->num_channels; ++chan) {
  235. if (!samples[chan])
  236. continue;
  237. float *envelope_buf = cd->envelope_buf[chan];
  238. float *runave = cd->runaverage[chan];
  239. float *env_in = cd->env_in;
  240. if (cd->detector == RMS_DETECT) {
  241. runave[0] =
  242. rmscoef * cd->runave[chan] +
  243. (1 - rmscoef) * powf(samples[chan][0], 2.0f);
  244. env_in[0] = sqrtf(fmaxf(runave[0], 0));
  245. for (uint32_t i = 1; i < num_samples; ++i) {
  246. runave[i] =
  247. rmscoef * runave[i - 1] +
  248. (1 - rmscoef) *
  249. powf(samples[chan][i], 2.0f);
  250. env_in[i] = sqrtf(runave[i]);
  251. }
  252. } else if (cd->detector == PEAK_DETECT) {
  253. for (uint32_t i = 0; i < num_samples; ++i) {
  254. runave[i] = powf(samples[chan][i], 2);
  255. env_in[i] = fabsf(samples[chan][i]);
  256. }
  257. }
  258. cd->runave[chan] = runave[num_samples - 1];
  259. for (uint32_t i = 0; i < num_samples; ++i)
  260. envelope_buf[i] = fmaxf(envelope_buf[i], env_in[i]);
  261. cd->envelope[chan] = cd->envelope_buf[chan][num_samples - 1];
  262. }
  263. }
  264. // gain stage and ballistics in dB domain
  265. static inline void process_expansion(struct expander_data *cd, float **samples,
  266. uint32_t num_samples)
  267. {
  268. const float attack_gain = cd->attack_gain;
  269. const float release_gain = cd->release_gain;
  270. if (cd->gaindB_len < num_samples)
  271. resize_gaindB_buffer(cd, num_samples);
  272. for (int i = 0; i < MAX_AUDIO_CHANNELS; i++)
  273. memset(cd->gaindB[i], 0,
  274. num_samples * sizeof(cd->gaindB[i][0]));
  275. for (size_t chan = 0; chan < cd->num_channels; chan++) {
  276. for (size_t i = 0; i < num_samples; ++i) {
  277. // gain stage of expansion
  278. float env_db = mul_to_db(cd->envelope_buf[chan][i]);
  279. float gain =
  280. cd->threshold - env_db > 0.0f
  281. ? fmaxf(cd->slope * (cd->threshold -
  282. env_db),
  283. -60.0f)
  284. : 0.0f;
  285. // ballistics (attack/release)
  286. if (i > 0) {
  287. if (gain > cd->gaindB[chan][i - 1])
  288. cd->gaindB[chan][i] =
  289. attack_gain *
  290. cd->gaindB[chan][i - 1] +
  291. (1.0f - attack_gain) * gain;
  292. else
  293. cd->gaindB[chan][i] =
  294. release_gain *
  295. cd->gaindB[chan][i - 1] +
  296. (1.0f - release_gain) * gain;
  297. } else {
  298. if (gain > cd->gaindB_buf[chan])
  299. cd->gaindB[chan][i] =
  300. attack_gain *
  301. cd->gaindB_buf[chan] +
  302. (1.0f - attack_gain) * gain;
  303. else
  304. cd->gaindB[chan][i] =
  305. release_gain *
  306. cd->gaindB_buf[chan] +
  307. (1.0f - release_gain) * gain;
  308. }
  309. gain = db_to_mul(fminf(0, cd->gaindB[chan][i]));
  310. if (samples[chan])
  311. samples[chan][i] *= gain * cd->output_gain;
  312. }
  313. cd->gaindB_buf[chan] = cd->gaindB[chan][num_samples - 1];
  314. }
  315. }
  316. static struct obs_audio_data *
  317. expander_filter_audio(void *data, struct obs_audio_data *audio)
  318. {
  319. struct expander_data *cd = data;
  320. const uint32_t num_samples = audio->frames;
  321. if (num_samples == 0)
  322. return audio;
  323. float **samples = (float **)audio->data;
  324. analyze_envelope(cd, samples, num_samples);
  325. process_expansion(cd, samples, num_samples);
  326. return audio;
  327. }
  328. static bool presets_changed(obs_properties_t *props, obs_property_t *prop,
  329. obs_data_t *settings)
  330. {
  331. UNUSED_PARAMETER(props);
  332. UNUSED_PARAMETER(prop);
  333. UNUSED_PARAMETER(settings);
  334. return true;
  335. }
  336. static obs_properties_t *expander_properties(void *data)
  337. {
  338. obs_properties_t *props = obs_properties_create();
  339. obs_property_t *p;
  340. obs_property_t *presets = obs_properties_add_list(
  341. props, S_PRESETS, TEXT_PRESETS, OBS_COMBO_TYPE_LIST,
  342. OBS_COMBO_FORMAT_STRING);
  343. obs_property_list_add_string(presets, TEXT_PRESETS_EXP, "expander");
  344. obs_property_list_add_string(presets, TEXT_PRESETS_GATE, "gate");
  345. obs_property_set_modified_callback(presets, presets_changed);
  346. p = obs_properties_add_float_slider(props, S_RATIO, TEXT_RATIO,
  347. MIN_RATIO, MAX_RATIO, 0.1);
  348. obs_property_float_set_suffix(p, ":1");
  349. p = obs_properties_add_float_slider(props, S_THRESHOLD, TEXT_THRESHOLD,
  350. MIN_THRESHOLD_DB, MAX_THRESHOLD_DB,
  351. 0.1);
  352. obs_property_float_set_suffix(p, " dB");
  353. p = obs_properties_add_int_slider(props, S_ATTACK_TIME,
  354. TEXT_ATTACK_TIME, MIN_ATK_RLS_MS,
  355. MAX_ATK_MS, 1);
  356. obs_property_int_set_suffix(p, " ms");
  357. p = obs_properties_add_int_slider(props, S_RELEASE_TIME,
  358. TEXT_RELEASE_TIME, MIN_ATK_RLS_MS,
  359. MAX_RLS_MS, 1);
  360. obs_property_int_set_suffix(p, " ms");
  361. p = obs_properties_add_float_slider(props, S_OUTPUT_GAIN,
  362. TEXT_OUTPUT_GAIN,
  363. MIN_OUTPUT_GAIN_DB,
  364. MAX_OUTPUT_GAIN_DB, 0.1);
  365. obs_property_float_set_suffix(p, " dB");
  366. obs_property_t *detect = obs_properties_add_list(
  367. props, S_DETECTOR, TEXT_DETECTOR, OBS_COMBO_TYPE_LIST,
  368. OBS_COMBO_FORMAT_STRING);
  369. obs_property_list_add_string(detect, TEXT_RMS, "RMS");
  370. obs_property_list_add_string(detect, TEXT_PEAK, "peak");
  371. UNUSED_PARAMETER(data);
  372. return props;
  373. }
  374. struct obs_source_info expander_filter = {
  375. .id = "expander_filter",
  376. .type = OBS_SOURCE_TYPE_FILTER,
  377. .output_flags = OBS_SOURCE_AUDIO,
  378. .get_name = expander_name,
  379. .create = expander_create,
  380. .destroy = expander_destroy,
  381. .update = expander_update,
  382. .filter_audio = expander_filter_audio,
  383. .get_defaults = expander_defaults,
  384. .get_properties = expander_properties,
  385. };