1
0

rtmp-av1.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603
  1. /******************************************************************************
  2. Copyright (C) 2023 by Lain Bailey <[email protected]>
  3. This program is free software: you can redistribute it and/or modify
  4. it under the terms of the GNU General Public License as published by
  5. the Free Software Foundation, either version 2 of the License, or
  6. (at your option) any later version.
  7. This program is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU General Public License for more details.
  11. You should have received a copy of the GNU General Public License
  12. along with this program. If not, see <http://www.gnu.org/licenses/>.
  13. ******************************************************************************/
  14. #include "rtmp-av1.h"
  15. #include "utils.h"
  16. #include <obs.h>
  17. #include <util/array-serializer.h>
  18. /* Adapted from FFmpeg's libavformat/av1.c for our FLV muxer. */
  /*
   * OBU type codes, compared against the 4-bit type field that
   * parse_obu_header() extracts. Listed in ascending numeric order; each
   * constant is defined exactly once.
   */
  #define AV1_OBU_SEQUENCE_HEADER 1
  #define AV1_OBU_TEMPORAL_DELIMITER 2
  #define AV1_OBU_FRAME_HEADER 3
  #define AV1_OBU_TILE_GROUP 4
  #define AV1_OBU_METADATA 5
  #define AV1_OBU_FRAME 6
  #define AV1_OBU_REDUNDANT_FRAME_HEADER 7
  #define AV1_OBU_TILE_LIST 8
  #define AV1_OBU_PADDING 15

  /* Values of the 3-bit profile field read from the sequence header. */
  #define FF_PROFILE_AV1_MAIN 0
  #define FF_PROFILE_AV1_HIGH 1
  #define FF_PROFILE_AV1_PROFESSIONAL 2
  /*
   * Frame kinds, numbered to match the 2-bit value that
   * compute_av1_keyframe_priority() reads from the start of a frame header.
   */
  enum frame_type {
      AV1_KEY_FRAME = 0,
      AV1_INTER_FRAME = 1,
      AV1_INTRA_FRAME = 2,
      AV1_SWITCH_FRAME = 3,
  };
  /*
   * Subset of the sequence header that this file extracts. Filled in by
   * parse_sequence_header() / parse_color_config() and consumed when the
   * 4-byte configuration header is assembled.
   */
  struct AV1SequenceParameters {
      uint8_t profile;  /* 3-bit profile (FF_PROFILE_AV1_*) */
      uint8_t level;    /* 5-bit level index of the first operating point */
      uint8_t tier;     /* 1-bit tier of the first operating point */
      uint8_t bitdepth; /* 8, 10 or 12 */
      uint8_t monochrome;
      uint8_t chroma_subsampling_x;
      uint8_t chroma_subsampling_y;
      uint8_t chroma_sample_position; /* 2-bit field; only read when both subsampling flags are set */
      uint8_t color_description_present_flag;
      uint8_t color_primaries;          /* 8-bit code, or 2 when no description is present */
      uint8_t transfer_characteristics; /* 8-bit code, or 2 when no description is present */
      uint8_t matrix_coefficients;      /* 8-bit code, or 2 when no description is present */
      uint8_t color_range;
  };

  typedef struct AV1SequenceParameters AV1SequenceParameters;
  /*
   * Upper bound, in bytes, on what parse_obu_header() inspects: the header
   * byte plus the optional extension byte (2), followed by at most 8 bytes of
   * LEB128-coded size.
   */
  #define MAX_OBU_HEADER_SIZE (2 + 8)
  /*
   * Minimal MSB-first bit reader over a caller-owned byte buffer.
   *
   * The reader never reads outside [buffer, buffer_end): bits requested past
   * the end of the window are returned as 0. `index` still advances on such
   * reads (saturating at size_in_bits_plus8) so callers can detect an overrun
   * through a negative get_bits_left().
   */
  typedef struct Av1GetBitContext {
      const uint8_t *buffer, *buffer_end; /* first byte / one past the last byte of the window */
      int index;                          /* current read position, in bits */
      int size_in_bits;                   /* number of valid bits in the window */
      int size_in_bits_plus8;             /* value at which index stops advancing */
  } Av1GetBitContext;

  /*
   * Point `s` at `bit_size` bits starting at `buffer`.
   *
   * Returns 0 on success. If `buffer` is NULL or `bit_size` is negative or too
   * large, the reader is set up as an empty window and -1 is returned; reads
   * from such a reader yield zero bits.
   */
  static inline int init_get_bits_xe(Av1GetBitContext *s, const uint8_t *buffer, int bit_size)
  {
      int ret = 0;

      if (bit_size >= INT_MAX - 64 * 8 || bit_size < 0 || !buffer) {
          bit_size = 0;
          buffer = NULL;
          ret = -1;
      }

      s->buffer = buffer;
      /* Avoid pointer arithmetic on NULL for the rejected-input case. */
      s->buffer_end = buffer ? buffer + ((bit_size + 7) >> 3) : NULL;
      s->size_in_bits = bit_size;
      s->size_in_bits_plus8 = bit_size + 8;
      s->index = 0;

      return ret;
  }

  /* Same as init_get_bits_xe(); kept as a separate name for callers. */
  static inline int init_get_bits(Av1GetBitContext *s, const uint8_t *buffer, int bit_size)
  {
      return init_get_bits_xe(s, buffer, bit_size);
  }

  /*
   * Byte-count flavour of init_get_bits(). A `byte_size` that is negative or
   * would overflow when converted to bits is turned into an invalid size so
   * that initialisation fails with -1.
   */
  static inline int init_get_bits8(Av1GetBitContext *s, const uint8_t *buffer, int byte_size)
  {
      if (byte_size > INT_MAX / 8 || byte_size < 0)
          byte_size = -1;
      return init_get_bits(s, buffer, byte_size * 8);
  }

  /*
   * Read one bit (most significant bit of each byte first) and advance.
   *
   * Returns 0 without touching memory when the position lies outside the
   * window or the reader has no buffer. The position still advances, up to
   * size_in_bits_plus8, so overruns remain detectable.
   */
  static inline unsigned int get_bit1(Av1GetBitContext *s)
  {
      const unsigned int pos = (unsigned int)s->index;
      const unsigned int window_bytes = ((unsigned int)s->size_in_bits + 7u) >> 3;
      unsigned int bit = 0;

      if (s->buffer && (pos >> 3) < window_bytes)
          bit = (s->buffer[pos >> 3] >> (7u - (pos & 7u))) & 1u;

      if (s->index < s->size_in_bits_plus8)
          s->index++;

      return bit;
  }

  /* Read `n` bits, first bit read ending up most significant in the result. */
  static inline unsigned int get_bits(Av1GetBitContext *s, unsigned int n)
  {
      unsigned int out = 0;

      for (unsigned int i = 0; i < n; i++)
          out = (out << 1) | get_bit1(s);

      return out;
  }

  /* Skipping is implemented as a read whose result is discarded. */
  #define skip_bits get_bits

  /* Number of bits consumed so far. */
  static inline int get_bits_count(Av1GetBitContext *s)
  {
      return s->index;
  }

  /* Bits remaining in the window; negative once the reader has overrun. */
  static inline int get_bits_left(Av1GetBitContext *gb)
  {
      return gb->size_in_bits - get_bits_count(gb);
  }

  #define get_bits_long get_bits
  #define skip_bits_long get_bits_long

  /*
   * Decode a little-endian base-128 value: 7 payload bits per byte, high bit
   * set on every byte except the last. At most 8 bytes are consumed.
   */
  static inline int64_t leb128(Av1GetBitContext *gb)
  {
      int64_t ret = 0;

      for (int i = 0; i < 8; i++) {
          int byte = get_bits(gb, 8);

          ret |= (int64_t)(byte & 0x7f) << (i * 7);
          if (!(byte & 0x80))
              break;
      }

      return ret;
  }

  /*
   * Skip one variable-length code: count zero bits up to the first one bit,
   * then skip that many further bits (nothing further is skipped when 32 or
   * more leading zeros were seen).
   *
   * The scan only runs while bits are actually left, so it terminates even if
   * the reader has already overrun its window.
   */
  static inline void uvlc(Av1GetBitContext *gb)
  {
      int leading_zeros = 0;

      while (get_bits_left(gb) > 0) {
          if (get_bits(gb, 1))
              break;
          leading_zeros++;
      }

      if (leading_zeros >= 32)
          return;

      skip_bits_long(gb, leading_zeros);
  }
  140. static inline int parse_obu_header(const uint8_t *buf, int buf_size, int64_t *obu_size, int *start_pos, int *type,
  141. int *temporal_id, int *spatial_id)
  142. {
  143. Av1GetBitContext gb;
  144. int ret, extension_flag, has_size_flag;
  145. size_t size;
  146. ret = init_get_bits8(&gb, buf, min_i32(buf_size, MAX_OBU_HEADER_SIZE));
  147. if (ret < 0)
  148. return ret;
  149. if (get_bits(&gb, 1) != 0) // obu_forbidden_bit
  150. return -1;
  151. *type = get_bits(&gb, 4);
  152. extension_flag = get_bits(&gb, 1);
  153. has_size_flag = get_bits(&gb, 1);
  154. skip_bits(&gb, 1); // obu_reserved_1bit
  155. if (extension_flag) {
  156. *temporal_id = get_bits(&gb, 3);
  157. *spatial_id = get_bits(&gb, 2);
  158. skip_bits(&gb, 3); // extension_header_reserved_3bits
  159. } else {
  160. *temporal_id = *spatial_id = 0;
  161. }
  162. *obu_size = has_size_flag ? leb128(&gb) : buf_size - 1 - extension_flag;
  163. if (get_bits_left(&gb) < 0)
  164. return -1;
  165. *start_pos = get_bits_count(&gb) / 8;
  166. size = (size_t)(*obu_size + *start_pos);
  167. if (size > (size_t)buf_size)
  168. return -1;
  169. assert(size <= INT_MAX);
  170. return (int)size;
  171. }
  172. static inline int get_obu_bit_length(const uint8_t *buf, int size, int type)
  173. {
  174. int v;
  175. /* There are no trailing bits on these */
  176. if (type == AV1_OBU_TILE_GROUP || type == AV1_OBU_TILE_LIST || type == AV1_OBU_FRAME) {
  177. if (size > INT_MAX / 8)
  178. return -1;
  179. else
  180. return size * 8;
  181. }
  182. while (size > 0 && buf[size - 1] == 0)
  183. size--;
  184. if (!size)
  185. return 0;
  186. v = buf[size - 1];
  187. if (size > INT_MAX / 8)
  188. return -1;
  189. size *= 8;
  190. /* Remove the trailing_one_bit and following trailing zeros */
  191. if (v)
  192. size -= ctz32(v) + 1;
  193. return size;
  194. }
  195. static int parse_color_config(AV1SequenceParameters *seq_params, Av1GetBitContext *gb)
  196. {
  197. int twelve_bit = 0;
  198. int high_bitdepth = get_bits(gb, 1);
  199. if (seq_params->profile == FF_PROFILE_AV1_PROFESSIONAL && high_bitdepth)
  200. twelve_bit = get_bits(gb, 1);
  201. seq_params->bitdepth = 8 + (high_bitdepth * 2) + (twelve_bit * 2);
  202. if (seq_params->profile == FF_PROFILE_AV1_HIGH)
  203. seq_params->monochrome = 0;
  204. else
  205. seq_params->monochrome = get_bits(gb, 1);
  206. seq_params->color_description_present_flag = get_bits(gb, 1);
  207. if (seq_params->color_description_present_flag) {
  208. seq_params->color_primaries = get_bits(gb, 8);
  209. seq_params->transfer_characteristics = get_bits(gb, 8);
  210. seq_params->matrix_coefficients = get_bits(gb, 8);
  211. } else {
  212. seq_params->color_primaries = 2;
  213. seq_params->transfer_characteristics = 2;
  214. seq_params->matrix_coefficients = 2;
  215. }
  216. if (seq_params->monochrome) {
  217. seq_params->color_range = get_bits(gb, 1);
  218. seq_params->chroma_subsampling_x = 1;
  219. seq_params->chroma_subsampling_y = 1;
  220. seq_params->chroma_sample_position = 0;
  221. return 0;
  222. } else if (seq_params->color_primaries == 1 && seq_params->transfer_characteristics == 13 &&
  223. seq_params->matrix_coefficients == 0) {
  224. seq_params->chroma_subsampling_x = 0;
  225. seq_params->chroma_subsampling_y = 0;
  226. } else {
  227. seq_params->color_range = get_bits(gb, 1);
  228. if (seq_params->profile == FF_PROFILE_AV1_MAIN) {
  229. seq_params->chroma_subsampling_x = 1;
  230. seq_params->chroma_subsampling_y = 1;
  231. } else if (seq_params->profile == FF_PROFILE_AV1_HIGH) {
  232. seq_params->chroma_subsampling_x = 0;
  233. seq_params->chroma_subsampling_y = 0;
  234. } else {
  235. if (twelve_bit) {
  236. seq_params->chroma_subsampling_x = get_bits(gb, 1);
  237. if (seq_params->chroma_subsampling_x)
  238. seq_params->chroma_subsampling_y = get_bits(gb, 1);
  239. else
  240. seq_params->chroma_subsampling_y = 0;
  241. } else {
  242. seq_params->chroma_subsampling_x = 1;
  243. seq_params->chroma_subsampling_y = 0;
  244. }
  245. }
  246. if (seq_params->chroma_subsampling_x && seq_params->chroma_subsampling_y)
  247. seq_params->chroma_sample_position = get_bits(gb, 2);
  248. }
  249. skip_bits(gb, 1); // separate_uv_delta_q
  250. return 0;
  251. }
  252. static int parse_sequence_header(AV1SequenceParameters *seq_params, const uint8_t *buf, int size)
  253. {
  254. Av1GetBitContext gb;
  255. int reduced_still_picture_header;
  256. int frame_width_bits_minus_1, frame_height_bits_minus_1;
  257. int size_bits, ret;
  258. size_bits = get_obu_bit_length(buf, size, AV1_OBU_SEQUENCE_HEADER);
  259. if (size_bits < 0)
  260. return size_bits;
  261. ret = init_get_bits(&gb, buf, size_bits);
  262. if (ret < 0)
  263. return ret;
  264. memset(seq_params, 0, sizeof(*seq_params));
  265. seq_params->profile = get_bits(&gb, 3);
  266. skip_bits(&gb, 1); // still_picture
  267. reduced_still_picture_header = get_bits(&gb, 1);
  268. if (reduced_still_picture_header) {
  269. seq_params->level = get_bits(&gb, 5);
  270. seq_params->tier = 0;
  271. } else {
  272. int initial_display_delay_present_flag, operating_points_cnt_minus_1;
  273. int decoder_model_info_present_flag, buffer_delay_length_minus_1;
  274. if (get_bits(&gb, 1)) { // timing_info_present_flag
  275. skip_bits_long(&gb, 32); // num_units_in_display_tick
  276. skip_bits_long(&gb, 32); // time_scale
  277. if (get_bits(&gb, 1)) // equal_picture_interval
  278. uvlc(&gb); // num_ticks_per_picture_minus_1
  279. decoder_model_info_present_flag = get_bits(&gb, 1);
  280. if (decoder_model_info_present_flag) {
  281. buffer_delay_length_minus_1 = get_bits(&gb, 5);
  282. skip_bits_long(&gb, 32);
  283. skip_bits(&gb, 10);
  284. }
  285. } else
  286. decoder_model_info_present_flag = 0;
  287. initial_display_delay_present_flag = get_bits(&gb, 1);
  288. operating_points_cnt_minus_1 = get_bits(&gb, 5);
  289. for (int i = 0; i <= operating_points_cnt_minus_1; i++) {
  290. int seq_level_idx, seq_tier;
  291. skip_bits(&gb, 12);
  292. seq_level_idx = get_bits(&gb, 5);
  293. if (seq_level_idx > 7)
  294. seq_tier = get_bits(&gb, 1);
  295. else
  296. seq_tier = 0;
  297. if (decoder_model_info_present_flag) {
  298. if (get_bits(&gb, 1)) {
  299. skip_bits_long(&gb, buffer_delay_length_minus_1 + 1);
  300. skip_bits_long(&gb, buffer_delay_length_minus_1 + 1);
  301. skip_bits(&gb, 1);
  302. }
  303. }
  304. if (initial_display_delay_present_flag) {
  305. if (get_bits(&gb, 1))
  306. skip_bits(&gb, 4);
  307. }
  308. if (i == 0) {
  309. seq_params->level = seq_level_idx;
  310. seq_params->tier = seq_tier;
  311. }
  312. }
  313. }
  314. frame_width_bits_minus_1 = get_bits(&gb, 4);
  315. frame_height_bits_minus_1 = get_bits(&gb, 4);
  316. skip_bits(&gb, frame_width_bits_minus_1 + 1); // max_frame_width_minus_1
  317. skip_bits(&gb,
  318. frame_height_bits_minus_1 + 1); // max_frame_height_minus_1
  319. if (!reduced_still_picture_header) {
  320. if (get_bits(&gb, 1)) // frame_id_numbers_present_flag
  321. skip_bits(&gb, 7);
  322. }
  323. skip_bits(&gb,
  324. 3); // use_128x128_superblock (1), enable_filter_intra (1), enable_intra_edge_filter (1)
  325. if (!reduced_still_picture_header) {
  326. int enable_order_hint, seq_force_screen_content_tools;
  327. skip_bits(&gb, 4);
  328. enable_order_hint = get_bits(&gb, 1);
  329. if (enable_order_hint)
  330. skip_bits(&gb, 2);
  331. if (get_bits(&gb, 1)) // seq_choose_screen_content_tools
  332. seq_force_screen_content_tools = 2;
  333. else
  334. seq_force_screen_content_tools = get_bits(&gb, 1);
  335. if (seq_force_screen_content_tools) {
  336. if (!get_bits(&gb, 1)) // seq_choose_integer_mv
  337. skip_bits(&gb, 1); // seq_force_integer_mv
  338. }
  339. if (enable_order_hint)
  340. skip_bits(&gb, 3); // order_hint_bits_minus_1
  341. }
  342. skip_bits(&gb, 3);
  343. parse_color_config(seq_params, &gb);
  344. skip_bits(&gb, 1); // film_grain_params_present
  345. if (get_bits_left(&gb))
  346. return -1;
  347. return 0;
  348. }
  349. size_t obs_parse_av1_header(uint8_t **header, const uint8_t *data, size_t size)
  350. {
  351. if (data[0] & 0x80) {
  352. int config_record_version = data[0] & 0x7f;
  353. if (config_record_version != 1 || size < 4)
  354. return 0;
  355. *header = bmemdup(data, size);
  356. return size;
  357. }
  358. // AV1S init
  359. AV1SequenceParameters seq_params;
  360. int nb_seq = 0, seq_size = 0, meta_size = 0;
  361. const uint8_t *seq = 0, *meta = 0;
  362. uint8_t *buf = (uint8_t *)data;
  363. while (size > 0) {
  364. int64_t obu_size;
  365. int start_pos, type, temporal_id, spatial_id;
  366. assert(size <= INT_MAX);
  367. int len = parse_obu_header(buf, (int)size, &obu_size, &start_pos, &type, &temporal_id, &spatial_id);
  368. if (len < 0)
  369. return 0;
  370. switch (type) {
  371. case AV1_OBU_SEQUENCE_HEADER:
  372. nb_seq++;
  373. if (!obu_size || nb_seq > 1) {
  374. return 0;
  375. }
  376. assert(obu_size <= INT_MAX);
  377. if (parse_sequence_header(&seq_params, buf + start_pos, (int)obu_size) < 0)
  378. return 0;
  379. seq = buf;
  380. seq_size = len;
  381. break;
  382. case AV1_OBU_METADATA:
  383. if (!obu_size)
  384. return 0;
  385. meta = buf;
  386. meta_size = len;
  387. break;
  388. default:
  389. break;
  390. }
  391. size -= len;
  392. buf += len;
  393. }
  394. if (!nb_seq)
  395. return 0;
  396. uint8_t av1header[4];
  397. av1header[0] = (1 << 7) | 1; // marker and version
  398. av1header[1] = (seq_params.profile << 5) | (seq_params.level);
  399. av1header[2] = (seq_params.tier << 7) | (seq_params.bitdepth > 8) << 6 | (seq_params.bitdepth == 12) << 5 |
  400. (seq_params.monochrome) << 4 | (seq_params.chroma_subsampling_x) << 3 |
  401. (seq_params.chroma_subsampling_y) << 2 | (seq_params.chroma_sample_position);
  402. av1header[3] = 0;
  403. struct array_output_data output;
  404. struct serializer s;
  405. array_output_serializer_init(&s, &output);
  406. s_write(&s, av1header, sizeof(av1header));
  407. if (seq_size)
  408. s_write(&s, seq, seq_size);
  409. if (meta_size)
  410. s_write(&s, meta, meta_size);
  411. *header = output.bytes.array;
  412. return output.bytes.num;
  413. }
  414. static void compute_av1_keyframe_priority(const uint8_t *buf, bool *is_keyframe, int *priority)
  415. {
  416. /* Skip if the packet already has a priority, e.g., assigned by the
  417. * encoder implementation (currently QSV/AMF). */
  418. if (*priority)
  419. return;
  420. Av1GetBitContext gb;
  421. init_get_bits8(&gb, buf, 1);
  422. // show_existing_frame
  423. if (get_bit1(&gb))
  424. return;
  425. enum frame_type type = get_bits(&gb, 2);
  426. bool show_frame = get_bit1(&gb);
  427. switch (type) {
  428. case AV1_KEY_FRAME:
  429. *is_keyframe = true;
  430. *priority = 3;
  431. break;
  432. case AV1_INTER_FRAME:
  433. *priority = show_frame ? 1 : 2;
  434. break;
  435. case AV1_INTRA_FRAME:
  436. *priority = 3;
  437. break;
  438. case AV1_SWITCH_FRAME:
  439. *priority = 2;
  440. break;
  441. }
  442. }
  443. static void serialize_av1_data(struct serializer *s, const uint8_t *data, size_t size, bool *is_keyframe, int *priority)
  444. {
  445. uint8_t *buf = (uint8_t *)data;
  446. uint8_t *end = (uint8_t *)data + size;
  447. while (buf < end) {
  448. int64_t obu_size;
  449. int start_pos, type, temporal_id, spatial_id;
  450. assert(end - buf <= INT_MAX);
  451. int len = parse_obu_header(buf, (int)(end - buf), &obu_size, &start_pos, &type, &temporal_id,
  452. &spatial_id);
  453. if (len < 0)
  454. return;
  455. switch (type) {
  456. case AV1_OBU_TEMPORAL_DELIMITER:
  457. case AV1_OBU_REDUNDANT_FRAME_HEADER:
  458. case AV1_OBU_TILE_LIST:
  459. break;
  460. case AV1_OBU_FRAME:
  461. case AV1_OBU_FRAME_HEADER:
  462. compute_av1_keyframe_priority(buf + start_pos, is_keyframe, priority);
  463. /* Falls through. */
  464. default:
  465. s_write(s, buf, len);
  466. size += len;
  467. break;
  468. }
  469. buf += len;
  470. }
  471. }
  472. void obs_parse_av1_packet(struct encoder_packet *av1_packet, const struct encoder_packet *src)
  473. {
  474. struct array_output_data output;
  475. struct serializer s;
  476. long ref = 1;
  477. array_output_serializer_init(&s, &output);
  478. serialize(&s, &ref, sizeof(ref));
  479. *av1_packet = *src;
  480. serialize_av1_data(&s, src->data, src->size, &av1_packet->keyframe, &av1_packet->priority);
  481. av1_packet->data = output.bytes.array + sizeof(ref);
  482. av1_packet->size = output.bytes.num - sizeof(ref);
  483. av1_packet->drop_priority = av1_packet->priority;
  484. }