audio-io.h 6.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233
  1. /******************************************************************************
  2. Copyright (C) 2013 by Hugh Bailey <[email protected]>
  3. This program is free software: you can redistribute it and/or modify
  4. it under the terms of the GNU General Public License as published by
  5. the Free Software Foundation, either version 2 of the License, or
  6. (at your option) any later version.
  7. This program is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU General Public License for more details.
  11. You should have received a copy of the GNU General Public License
  12. along with this program. If not, see <http://www.gnu.org/licenses/>.
  13. ******************************************************************************/
  14. #pragma once
  15. #include "media-io-defs.h"
  16. #include "../util/c99defs.h"
  17. #include "../util/util_uint128.h"
  18. #ifdef __cplusplus
  19. extern "C" {
  20. #endif
  /*
   * Capacity constants for the audio output code.
   *
   * MAX_AUDIO_CHANNELS is also the length of audio_output_data::data.
   * NOTE(review): AUDIO_OUTPUT_FRAMES is presumably the number of frames
   * handled per output block -- confirm against the implementation.
   */
  #define MAX_AUDIO_MIXES     6
  #define MAX_AUDIO_CHANNELS  8
  #define AUDIO_OUTPUT_FRAMES 1024

  /*
   * Size in bytes (type size_t) of
   * MAX_AUDIO_MIXES * MAX_AUDIO_CHANNELS * AUDIO_OUTPUT_FRAMES float samples.
   */
  #define TOTAL_AUDIO_SIZE                                              \
      (MAX_AUDIO_MIXES * MAX_AUDIO_CHANNELS * AUDIO_OUTPUT_FRAMES *     \
       sizeof(float))
  /*
   * Base audio output component. Use this to create an audio output track
   * for the media.
   *
   * The structure is only declared here (incomplete type), so code including
   * this header can hold audio_t pointers but cannot access its members.
   */
  typedef struct audio_output audio_t;
  /*
   * Sample formats understood by the audio code.
   *
   * The first four real formats are non-planar; each one has a *_PLANAR
   * counterpart with the same sample width (see is_audio_planar() and
   * get_audio_bytes_per_channel()).
   */
  enum audio_format {
      AUDIO_FORMAT_UNKNOWN = 0,

      /* non-planar formats */
      AUDIO_FORMAT_U8BIT = 1,
      AUDIO_FORMAT_16BIT = 2,
      AUDIO_FORMAT_32BIT = 3,
      AUDIO_FORMAT_FLOAT = 4,

      /* planar formats */
      AUDIO_FORMAT_U8BIT_PLANAR = 5,
      AUDIO_FORMAT_16BIT_PLANAR = 6,
      AUDIO_FORMAT_32BIT_PLANAR = 7,
      AUDIO_FORMAT_FLOAT_PLANAR = 8,
  };
  /**
   * The speaker layout describes where the speakers are located in the room.
   * For OBS it dictates:
   *  * how many channels are available and
   *  * which channels are used for which speakers.
   *
   * Standard channel layouts were retrieved from the ffmpeg documentation at:
   * https://trac.ffmpeg.org/wiki/AudioChannelManipulation
   *
   * The numeric values are spelled out explicitly; note that 7 is unused and
   * SPEAKERS_7POINT1 is 8.
   */
  enum speaker_layout {
      /** Unknown setting, fallback is stereo. */
      SPEAKERS_UNKNOWN = 0,
      /** Channels: MONO */
      SPEAKERS_MONO = 1,
      /** Channels: FL, FR */
      SPEAKERS_STEREO = 2,
      /** Channels: FL, FR, LFE */
      SPEAKERS_2POINT1 = 3,
      /** Channels: FL, FR, FC, RC */
      SPEAKERS_4POINT0 = 4,
      /** Channels: FL, FR, FC, LFE, RC */
      SPEAKERS_4POINT1 = 5,
      /** Channels: FL, FR, FC, LFE, RL, RR */
      SPEAKERS_5POINT1 = 6,
      /** Channels: FL, FR, FC, LFE, RL, RR, SL, SR */
      SPEAKERS_7POINT1 = 8,
  };
  63. struct audio_data {
  64. uint8_t *data[MAX_AV_PLANES];
  65. uint32_t frames;
  66. uint64_t timestamp;
  67. };
  68. struct audio_output_data {
  69. float *data[MAX_AUDIO_CHANNELS];
  70. };
  /*
   * Callback type stored in audio_output_info::input_callback.
   *
   * param         - user pointer (audio_output_info::input_param)
   * start_ts      - start timestamp of the requested range
   * end_ts        - end timestamp of the requested range
   * new_ts        - out-parameter for a timestamp chosen by the callback
   * active_mixers - NOTE(review): presumably a bitmask of mixes to fill
   * mixes         - per-mix output buffers
   *
   * NOTE(review): timestamp units and the meaning of the bool result are not
   * visible in this header; confirm against the implementation.
   */
  typedef bool (*audio_input_callback_t)(
      void *param,
      uint64_t start_ts,
      uint64_t end_ts,
      uint64_t *new_ts,
      uint32_t active_mixers,
      struct audio_output_data *mixes);
  74. struct audio_output_info {
  75. const char *name;
  76. uint32_t samples_per_sec;
  77. enum audio_format format;
  78. enum speaker_layout speakers;
  79. audio_input_callback_t input_callback;
  80. void *input_param;
  81. };
  82. struct audio_convert_info {
  83. uint32_t samples_per_sec;
  84. enum audio_format format;
  85. enum speaker_layout speakers;
  86. };
  87. static inline uint32_t get_audio_channels(enum speaker_layout speakers)
  88. {
  89. switch (speakers) {
  90. case SPEAKERS_MONO: return 1;
  91. case SPEAKERS_STEREO: return 2;
  92. case SPEAKERS_2POINT1: return 3;
  93. case SPEAKERS_4POINT0: return 4;
  94. case SPEAKERS_4POINT1: return 5;
  95. case SPEAKERS_5POINT1: return 6;
  96. case SPEAKERS_7POINT1: return 8;
  97. case SPEAKERS_UNKNOWN: return 0;
  98. }
  99. return 0;
  100. }
  101. static inline size_t get_audio_bytes_per_channel(enum audio_format format)
  102. {
  103. switch (format) {
  104. case AUDIO_FORMAT_U8BIT:
  105. case AUDIO_FORMAT_U8BIT_PLANAR:
  106. return 1;
  107. case AUDIO_FORMAT_16BIT:
  108. case AUDIO_FORMAT_16BIT_PLANAR:
  109. return 2;
  110. case AUDIO_FORMAT_FLOAT:
  111. case AUDIO_FORMAT_FLOAT_PLANAR:
  112. case AUDIO_FORMAT_32BIT:
  113. case AUDIO_FORMAT_32BIT_PLANAR:
  114. return 4;
  115. case AUDIO_FORMAT_UNKNOWN:
  116. return 0;
  117. }
  118. return 0;
  119. }
  120. static inline bool is_audio_planar(enum audio_format format)
  121. {
  122. switch (format) {
  123. case AUDIO_FORMAT_U8BIT:
  124. case AUDIO_FORMAT_16BIT:
  125. case AUDIO_FORMAT_32BIT:
  126. case AUDIO_FORMAT_FLOAT:
  127. return false;
  128. case AUDIO_FORMAT_U8BIT_PLANAR:
  129. case AUDIO_FORMAT_FLOAT_PLANAR:
  130. case AUDIO_FORMAT_16BIT_PLANAR:
  131. case AUDIO_FORMAT_32BIT_PLANAR:
  132. return true;
  133. case AUDIO_FORMAT_UNKNOWN:
  134. return false;
  135. }
  136. return false;
  137. }
  138. static inline size_t get_audio_planes(enum audio_format format,
  139. enum speaker_layout speakers)
  140. {
  141. return (is_audio_planar(format) ? get_audio_channels(speakers) : 1);
  142. }
  143. static inline size_t get_audio_size(enum audio_format format,
  144. enum speaker_layout speakers, uint32_t frames)
  145. {
  146. bool planar = is_audio_planar(format);
  147. return (planar ? 1 : get_audio_channels(speakers)) *
  148. get_audio_bytes_per_channel(format) *
  149. frames;
  150. }
  151. static inline uint64_t audio_frames_to_ns(size_t sample_rate,
  152. uint64_t frames)
  153. {
  154. util_uint128_t val;
  155. val = util_mul64_64(frames, 1000000000ULL);
  156. val = util_div128_32(val, (uint32_t)sample_rate);
  157. return val.low;
  158. }
  159. static inline uint64_t ns_to_audio_frames(size_t sample_rate,
  160. uint64_t frames)
  161. {
  162. util_uint128_t val;
  163. val = util_mul64_64(frames, sample_rate);
  164. val = util_div128_32(val, 1000000000);
  165. return val.low;
  166. }
  /*
   * Integer status codes; audio_output_open() returns int.
   * NOTE(review): which code is returned under which condition is decided by
   * the implementation, which is not visible in this header.
   */
  #define AUDIO_OUTPUT_SUCCESS       0
  #define AUDIO_OUTPUT_INVALIDPARAM  -1
  #define AUDIO_OUTPUT_FAIL          -2
  170. EXPORT int audio_output_open(audio_t **audio, struct audio_output_info *info);
  171. EXPORT void audio_output_close(audio_t *audio);
  /*
   * Callback type accepted by audio_output_connect() and
   * audio_output_disconnect().
   *
   * param   - user pointer supplied when connecting
   * mix_idx - index of the mix the data belongs to
   * data    - the audio block being delivered
   */
  typedef void (*audio_output_callback_t)(
      void *param,
      size_t mix_idx,
      struct audio_data *data);
  174. EXPORT bool audio_output_connect(audio_t *video, size_t mix_idx,
  175. const struct audio_convert_info *conversion,
  176. audio_output_callback_t callback, void *param);
  177. EXPORT void audio_output_disconnect(audio_t *video, size_t mix_idx,
  178. audio_output_callback_t callback, void *param);
  179. EXPORT bool audio_output_active(const audio_t *audio);
  180. EXPORT size_t audio_output_get_block_size(const audio_t *audio);
  181. EXPORT size_t audio_output_get_planes(const audio_t *audio);
  182. EXPORT size_t audio_output_get_channels(const audio_t *audio);
  183. EXPORT uint32_t audio_output_get_sample_rate(const audio_t *audio);
  184. EXPORT const struct audio_output_info *audio_output_get_info(
  185. const audio_t *audio);
  186. #ifdef __cplusplus
  187. }
  188. #endif