audio-io.h 6.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243
  1. /******************************************************************************
  2. Copyright (C) 2023 by Lain Bailey <[email protected]>
  3. This program is free software: you can redistribute it and/or modify
  4. it under the terms of the GNU General Public License as published by
  5. the Free Software Foundation, either version 2 of the License, or
  6. (at your option) any later version.
  7. This program is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU General Public License for more details.
  11. You should have received a copy of the GNU General Public License
  12. along with this program. If not, see <http://www.gnu.org/licenses/>.
  13. ******************************************************************************/
  14. #pragma once
  15. #include "media-io-defs.h"
  16. #include "../util/c99defs.h"
  17. #include "../util/util_uint64.h"
  18. #ifdef __cplusplus
  19. extern "C" {
  20. #endif
  21. #define MAX_AUDIO_MIXES 6
  22. #define MAX_AUDIO_CHANNELS 8
  23. #define AUDIO_OUTPUT_FRAMES 1024
  24. #define TOTAL_AUDIO_SIZE \
  25. (MAX_AUDIO_MIXES * MAX_AUDIO_CHANNELS * AUDIO_OUTPUT_FRAMES * \
  26. sizeof(float))
  27. /*
  28. * Base audio output component. Use this to create an audio output track
  29. * for the media.
  30. */
  31. struct audio_output;
  32. typedef struct audio_output audio_t;
  33. enum audio_format {
  34. AUDIO_FORMAT_UNKNOWN,
  35. AUDIO_FORMAT_U8BIT,
  36. AUDIO_FORMAT_16BIT,
  37. AUDIO_FORMAT_32BIT,
  38. AUDIO_FORMAT_FLOAT,
  39. AUDIO_FORMAT_U8BIT_PLANAR,
  40. AUDIO_FORMAT_16BIT_PLANAR,
  41. AUDIO_FORMAT_32BIT_PLANAR,
  42. AUDIO_FORMAT_FLOAT_PLANAR,
  43. };
/**
 * The speaker layout describes where the speakers are located in the room.
 * For OBS it dictates:
 *  * how many channels are available and
 *  * which channels are used for which speakers.
 *
 * Standard channel layouts were retrieved from the ffmpeg documentation at:
 * https://trac.ffmpeg.org/wiki/AudioChannelManipulation
 */
  53. enum speaker_layout {
  54. SPEAKERS_UNKNOWN, /**< Unknown setting, fallback is stereo. */
  55. SPEAKERS_MONO, /**< Channels: MONO */
  56. SPEAKERS_STEREO, /**< Channels: FL, FR */
  57. SPEAKERS_2POINT1, /**< Channels: FL, FR, LFE */
  58. SPEAKERS_4POINT0, /**< Channels: FL, FR, FC, RC */
  59. SPEAKERS_4POINT1, /**< Channels: FL, FR, FC, LFE, RC */
  60. SPEAKERS_5POINT1, /**< Channels: FL, FR, FC, LFE, RL, RR */
  61. SPEAKERS_7POINT1 = 8, /**< Channels: FL, FR, FC, LFE, RL, RR, SL, SR */
  62. };
  63. struct audio_data {
  64. uint8_t *data[MAX_AV_PLANES];
  65. uint32_t frames;
  66. uint64_t timestamp;
  67. };
  68. struct audio_output_data {
  69. float *data[MAX_AUDIO_CHANNELS];
  70. };
  71. typedef bool (*audio_input_callback_t)(void *param, uint64_t start_ts,
  72. uint64_t end_ts, uint64_t *new_ts,
  73. uint32_t active_mixers,
  74. struct audio_output_data *mixes);
  75. struct audio_output_info {
  76. const char *name;
  77. uint32_t samples_per_sec;
  78. enum audio_format format;
  79. enum speaker_layout speakers;
  80. audio_input_callback_t input_callback;
  81. void *input_param;
  82. };
  83. struct audio_convert_info {
  84. uint32_t samples_per_sec;
  85. enum audio_format format;
  86. enum speaker_layout speakers;
  87. bool allow_clipping;
  88. };
  89. static inline uint32_t get_audio_channels(enum speaker_layout speakers)
  90. {
  91. switch (speakers) {
  92. case SPEAKERS_MONO:
  93. return 1;
  94. case SPEAKERS_STEREO:
  95. return 2;
  96. case SPEAKERS_2POINT1:
  97. return 3;
  98. case SPEAKERS_4POINT0:
  99. return 4;
  100. case SPEAKERS_4POINT1:
  101. return 5;
  102. case SPEAKERS_5POINT1:
  103. return 6;
  104. case SPEAKERS_7POINT1:
  105. return 8;
  106. case SPEAKERS_UNKNOWN:
  107. return 0;
  108. }
  109. return 0;
  110. }
  111. static inline size_t get_audio_bytes_per_channel(enum audio_format format)
  112. {
  113. switch (format) {
  114. case AUDIO_FORMAT_U8BIT:
  115. case AUDIO_FORMAT_U8BIT_PLANAR:
  116. return 1;
  117. case AUDIO_FORMAT_16BIT:
  118. case AUDIO_FORMAT_16BIT_PLANAR:
  119. return 2;
  120. case AUDIO_FORMAT_FLOAT:
  121. case AUDIO_FORMAT_FLOAT_PLANAR:
  122. case AUDIO_FORMAT_32BIT:
  123. case AUDIO_FORMAT_32BIT_PLANAR:
  124. return 4;
  125. case AUDIO_FORMAT_UNKNOWN:
  126. return 0;
  127. }
  128. return 0;
  129. }
  130. static inline bool is_audio_planar(enum audio_format format)
  131. {
  132. switch (format) {
  133. case AUDIO_FORMAT_U8BIT:
  134. case AUDIO_FORMAT_16BIT:
  135. case AUDIO_FORMAT_32BIT:
  136. case AUDIO_FORMAT_FLOAT:
  137. return false;
  138. case AUDIO_FORMAT_U8BIT_PLANAR:
  139. case AUDIO_FORMAT_FLOAT_PLANAR:
  140. case AUDIO_FORMAT_16BIT_PLANAR:
  141. case AUDIO_FORMAT_32BIT_PLANAR:
  142. return true;
  143. case AUDIO_FORMAT_UNKNOWN:
  144. return false;
  145. }
  146. return false;
  147. }
  148. static inline size_t get_audio_planes(enum audio_format format,
  149. enum speaker_layout speakers)
  150. {
  151. return (is_audio_planar(format) ? get_audio_channels(speakers) : 1);
  152. }
  153. static inline size_t get_audio_size(enum audio_format format,
  154. enum speaker_layout speakers,
  155. uint32_t frames)
  156. {
  157. bool planar = is_audio_planar(format);
  158. return (planar ? 1 : get_audio_channels(speakers)) *
  159. get_audio_bytes_per_channel(format) * frames;
  160. }
  161. static inline size_t get_total_audio_size(enum audio_format format,
  162. enum speaker_layout speakers,
  163. uint32_t frames)
  164. {
  165. return get_audio_channels(speakers) *
  166. get_audio_bytes_per_channel(format) * frames;
  167. }
  168. static inline uint64_t audio_frames_to_ns(size_t sample_rate, uint64_t frames)
  169. {
  170. return util_mul_div64(frames, 1000000000ULL, sample_rate);
  171. }
  172. static inline uint64_t ns_to_audio_frames(size_t sample_rate, uint64_t frames)
  173. {
  174. return util_mul_div64(frames, sample_rate, 1000000000ULL);
  175. }
  176. #define AUDIO_OUTPUT_SUCCESS 0
  177. #define AUDIO_OUTPUT_INVALIDPARAM -1
  178. #define AUDIO_OUTPUT_FAIL -2
  179. EXPORT int audio_output_open(audio_t **audio, struct audio_output_info *info);
  180. EXPORT void audio_output_close(audio_t *audio);
  181. typedef void (*audio_output_callback_t)(void *param, size_t mix_idx,
  182. struct audio_data *data);
  183. EXPORT bool audio_output_connect(audio_t *video, size_t mix_idx,
  184. const struct audio_convert_info *conversion,
  185. audio_output_callback_t callback, void *param);
  186. EXPORT void audio_output_disconnect(audio_t *video, size_t mix_idx,
  187. audio_output_callback_t callback,
  188. void *param);
  189. EXPORT bool audio_output_active(const audio_t *audio);
  190. EXPORT size_t audio_output_get_block_size(const audio_t *audio);
  191. EXPORT size_t audio_output_get_planes(const audio_t *audio);
  192. EXPORT size_t audio_output_get_channels(const audio_t *audio);
  193. EXPORT uint32_t audio_output_get_sample_rate(const audio_t *audio);
  194. EXPORT const struct audio_output_info *
  195. audio_output_get_info(const audio_t *audio);
  196. #ifdef __cplusplus
  197. }
  198. #endif