audio-io.h 6.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234
  1. /******************************************************************************
  2. Copyright (C) 2013 by Hugh Bailey <[email protected]>
  3. This program is free software: you can redistribute it and/or modify
  4. it under the terms of the GNU General Public License as published by
  5. the Free Software Foundation, either version 2 of the License, or
  6. (at your option) any later version.
  7. This program is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU General Public License for more details.
  11. You should have received a copy of the GNU General Public License
  12. along with this program. If not, see <http://www.gnu.org/licenses/>.
  13. ******************************************************************************/
  14. #pragma once
  15. #include "media-io-defs.h"
  16. #include "../util/c99defs.h"
  17. #include "../util/util_uint64.h"
  18. #ifdef __cplusplus
  19. extern "C" {
  20. #endif
  /* Sizing constants shared by the audio output declarations in this header. */
  #define MAX_AUDIO_MIXES 6
  #define MAX_AUDIO_CHANNELS 8
  #define AUDIO_OUTPUT_FRAMES 1024

  /*
   * Size in bytes of AUDIO_OUTPUT_FRAMES float samples for each of
   * MAX_AUDIO_CHANNELS channels in each of MAX_AUDIO_MIXES mixes.
   */
  #define TOTAL_AUDIO_SIZE                                        \
      (sizeof(float) * AUDIO_OUTPUT_FRAMES * MAX_AUDIO_CHANNELS * \
       MAX_AUDIO_MIXES)
  /*
   * Base audio output component, exposed as an opaque handle.
   *
   * Only the struct tag is declared in this header (the typedef itself
   * introduces it), so users of this header hold audio_t pointers and go
   * through the audio_output_* functions.
   */
  typedef struct audio_output audio_t;
  /*
   * Sample formats handled by the helpers in this header.
   *
   * The numeric values are written out explicitly; they are the same values
   * the enumerators receive from implicit numbering (0 through 8).
   * The *_PLANAR enumerators are the ones is_audio_planar() reports as planar.
   */
  enum audio_format {
      AUDIO_FORMAT_UNKNOWN = 0,

      AUDIO_FORMAT_U8BIT = 1,
      AUDIO_FORMAT_16BIT = 2,
      AUDIO_FORMAT_32BIT = 3,
      AUDIO_FORMAT_FLOAT = 4,

      AUDIO_FORMAT_U8BIT_PLANAR = 5,
      AUDIO_FORMAT_16BIT_PLANAR = 6,
      AUDIO_FORMAT_32BIT_PLANAR = 7,
      AUDIO_FORMAT_FLOAT_PLANAR = 8,
  };
  44. /**
  45. * The speaker layout describes where the speakers are located in the room.
  46. * For OBS it dictates:
  47. * * how many channels are available and
  48. * * which channels are used for which speakers.
  49. *
  50. * Standard channel layouts were retrieved from ffmpeg documentation at:
  51. * https://trac.ffmpeg.org/wiki/AudioChannelManipulation
  52. */
  /*
   * Values are written out explicitly. Note the gap: there is no enumerator
   * with value 7, and SPEAKERS_7POINT1 is 8.
   */
  enum speaker_layout {
      SPEAKERS_UNKNOWN = 0, /**< Unknown setting, fallback is stereo. */
      SPEAKERS_MONO = 1,    /**< Channels: MONO */
      SPEAKERS_STEREO = 2,  /**< Channels: FL, FR */
      SPEAKERS_2POINT1 = 3, /**< Channels: FL, FR, LFE */
      SPEAKERS_4POINT0 = 4, /**< Channels: FL, FR, FC, RC */
      SPEAKERS_4POINT1 = 5, /**< Channels: FL, FR, FC, LFE, RC */
      SPEAKERS_5POINT1 = 6, /**< Channels: FL, FR, FC, LFE, RL, RR */
      SPEAKERS_7POINT1 = 8, /**< Channels: FL, FR, FC, LFE, RL, RR, SL, SR */
  };
  63. struct audio_data {
  64. uint8_t *data[MAX_AV_PLANES];
  65. uint32_t frames;
  66. uint64_t timestamp;
  67. };
  68. struct audio_output_data {
  69. float *data[MAX_AUDIO_CHANNELS];
  70. };
  /*
   * Signature of the input callback stored in audio_output_info.
   *
   * NOTE(review): the contract is not visible in this header. By name,
   * start_ts/end_ts look like the bounds of the requested time window,
   * new_ts an output timestamp, active_mixers a bit mask of mixes and
   * mixes the per-mix buffers to fill -- confirm against the implementation.
   */
  typedef bool (*audio_input_callback_t)(
      void *param,
      uint64_t start_ts,
      uint64_t end_ts,
      uint64_t *new_ts,
      uint32_t active_mixers,
      struct audio_output_data *mixes);
  75. struct audio_output_info {
  76. const char *name;
  77. uint32_t samples_per_sec;
  78. enum audio_format format;
  79. enum speaker_layout speakers;
  80. audio_input_callback_t input_callback;
  81. void *input_param;
  82. };
  83. struct audio_convert_info {
  84. uint32_t samples_per_sec;
  85. enum audio_format format;
  86. enum speaker_layout speakers;
  87. };
  88. static inline uint32_t get_audio_channels(enum speaker_layout speakers)
  89. {
  90. switch (speakers) {
  91. case SPEAKERS_MONO:
  92. return 1;
  93. case SPEAKERS_STEREO:
  94. return 2;
  95. case SPEAKERS_2POINT1:
  96. return 3;
  97. case SPEAKERS_4POINT0:
  98. return 4;
  99. case SPEAKERS_4POINT1:
  100. return 5;
  101. case SPEAKERS_5POINT1:
  102. return 6;
  103. case SPEAKERS_7POINT1:
  104. return 8;
  105. case SPEAKERS_UNKNOWN:
  106. return 0;
  107. }
  108. return 0;
  109. }
  110. static inline size_t get_audio_bytes_per_channel(enum audio_format format)
  111. {
  112. switch (format) {
  113. case AUDIO_FORMAT_U8BIT:
  114. case AUDIO_FORMAT_U8BIT_PLANAR:
  115. return 1;
  116. case AUDIO_FORMAT_16BIT:
  117. case AUDIO_FORMAT_16BIT_PLANAR:
  118. return 2;
  119. case AUDIO_FORMAT_FLOAT:
  120. case AUDIO_FORMAT_FLOAT_PLANAR:
  121. case AUDIO_FORMAT_32BIT:
  122. case AUDIO_FORMAT_32BIT_PLANAR:
  123. return 4;
  124. case AUDIO_FORMAT_UNKNOWN:
  125. return 0;
  126. }
  127. return 0;
  128. }
  129. static inline bool is_audio_planar(enum audio_format format)
  130. {
  131. switch (format) {
  132. case AUDIO_FORMAT_U8BIT:
  133. case AUDIO_FORMAT_16BIT:
  134. case AUDIO_FORMAT_32BIT:
  135. case AUDIO_FORMAT_FLOAT:
  136. return false;
  137. case AUDIO_FORMAT_U8BIT_PLANAR:
  138. case AUDIO_FORMAT_FLOAT_PLANAR:
  139. case AUDIO_FORMAT_16BIT_PLANAR:
  140. case AUDIO_FORMAT_32BIT_PLANAR:
  141. return true;
  142. case AUDIO_FORMAT_UNKNOWN:
  143. return false;
  144. }
  145. return false;
  146. }
  147. static inline size_t get_audio_planes(enum audio_format format,
  148. enum speaker_layout speakers)
  149. {
  150. return (is_audio_planar(format) ? get_audio_channels(speakers) : 1);
  151. }
  152. static inline size_t get_audio_size(enum audio_format format,
  153. enum speaker_layout speakers,
  154. uint32_t frames)
  155. {
  156. bool planar = is_audio_planar(format);
  157. return (planar ? 1 : get_audio_channels(speakers)) *
  158. get_audio_bytes_per_channel(format) * frames;
  159. }
  /**
   * Converts a frame count to a duration in nanoseconds at the given rate.
   *
   * Delegates to util_mul_div64(frames, 1000000000, sample_rate).
   * NOTE(review): util_mul_div64 is declared in ../util/util_uint64.h;
   * presumably it evaluates frames * 1e9 / sample_rate without intermediate
   * overflow -- confirm its rounding and its behavior for sample_rate == 0.
   *
   * @param sample_rate  Frames per second.
   * @param frames       Number of frames to convert.
   * @return The value produced by util_mul_div64.
   */
  static inline uint64_t audio_frames_to_ns(size_t sample_rate, uint64_t frames)
  {
      const uint64_t ns_per_second = 1000000000ULL;

      return util_mul_div64(frames, ns_per_second, sample_rate);
  }
  /**
   * Converts a duration in nanoseconds to a frame count at the given rate.
   *
   * Delegates to util_mul_div64(ns, sample_rate, 1000000000).
   * NOTE(review): util_mul_div64 is declared in ../util/util_uint64.h;
   * presumably it evaluates ns * sample_rate / 1e9 without intermediate
   * overflow -- confirm its rounding behavior.
   *
   * The second parameter was previously named `frames`, although it is the
   * nanosecond input; it is named `ns` here. Parameter names are not part of
   * a C function's type, so callers are unaffected.
   *
   * @param sample_rate  Frames per second.
   * @param ns           Duration in nanoseconds to convert.
   * @return The value produced by util_mul_div64.
   */
  static inline uint64_t ns_to_audio_frames(size_t sample_rate, uint64_t ns)
  {
      return util_mul_div64(ns, sample_rate, 1000000000ULL);
  }
  /*
   * Integer result codes defined alongside audio_output_open().
   * The negative values are parenthesized so each macro expands to a single
   * primary expression wherever it is used.
   */
  #define AUDIO_OUTPUT_SUCCESS 0
  #define AUDIO_OUTPUT_INVALIDPARAM (-1)
  #define AUDIO_OUTPUT_FAIL (-2)
  171. EXPORT int audio_output_open(audio_t **audio, struct audio_output_info *info);
  172. EXPORT void audio_output_close(audio_t *audio);
  /*
   * Signature of the callbacks registered with audio_output_connect().
   * The callback receives its user pointer, a mix index and a block of audio.
   */
  typedef void (*audio_output_callback_t)(
      void *param,
      size_t mix_idx,
      struct audio_data *data);
  175. EXPORT bool audio_output_connect(audio_t *video, size_t mix_idx,
  176. const struct audio_convert_info *conversion,
  177. audio_output_callback_t callback, void *param);
  178. EXPORT void audio_output_disconnect(audio_t *video, size_t mix_idx,
  179. audio_output_callback_t callback,
  180. void *param);
  181. EXPORT bool audio_output_active(const audio_t *audio);
  182. EXPORT size_t audio_output_get_block_size(const audio_t *audio);
  183. EXPORT size_t audio_output_get_planes(const audio_t *audio);
  184. EXPORT size_t audio_output_get_channels(const audio_t *audio);
  185. EXPORT uint32_t audio_output_get_sample_rate(const audio_t *audio);
  186. EXPORT const struct audio_output_info *
  187. audio_output_get_info(const audio_t *audio);
  188. #ifdef __cplusplus
  189. }
  190. #endif