whip-output.cpp 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600
  1. #include "whip-output.h"
  2. #include "whip-utils.h"
  3. /*
  4. * Sets the maximum size for a video fragment. Effective range is
  5. * 576-1470, with a lower value equating to more packets created,
  6. * but also better network compatability.
  7. */
  8. static uint16_t MAX_VIDEO_FRAGMENT_SIZE = 1200;
  9. const int signaling_media_id_length = 16;
  10. const char signaling_media_id_valid_char[] = "0123456789"
  11. "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
  12. "abcdefghijklmnopqrstuvwxyz";
  13. const std::string user_agent = generate_user_agent();
  14. const char *audio_mid = "0";
  15. const uint8_t audio_payload_type = 111;
  16. const char *video_mid = "1";
  17. const uint8_t video_payload_type = 96;
  18. WHIPOutput::WHIPOutput(obs_data_t *, obs_output_t *output)
  19. : output(output),
  20. is_av1(false),
  21. endpoint_url(),
  22. bearer_token(),
  23. resource_url(),
  24. running(false),
  25. start_stop_mutex(),
  26. start_stop_thread(),
  27. base_ssrc(generate_random_u32()),
  28. peer_connection(nullptr),
  29. audio_track(nullptr),
  30. video_track(nullptr),
  31. total_bytes_sent(0),
  32. connect_time_ms(0),
  33. start_time_ns(0),
  34. last_audio_timestamp(0),
  35. last_video_timestamp(0)
  36. {
  37. }
  38. WHIPOutput::~WHIPOutput()
  39. {
  40. Stop();
  41. std::lock_guard<std::mutex> l(start_stop_mutex);
  42. if (start_stop_thread.joinable())
  43. start_stop_thread.join();
  44. }
  45. bool WHIPOutput::Start()
  46. {
  47. std::lock_guard<std::mutex> l(start_stop_mutex);
  48. auto encoder = obs_output_get_video_encoder2(output, 0);
  49. if (encoder == nullptr) {
  50. return false;
  51. }
  52. is_av1 = (strcmp("av1", obs_encoder_get_codec(encoder)) == 0);
  53. if (!obs_output_can_begin_data_capture(output, 0))
  54. return false;
  55. if (!obs_output_initialize_encoders(output, 0))
  56. return false;
  57. if (start_stop_thread.joinable())
  58. start_stop_thread.join();
  59. start_stop_thread = std::thread(&WHIPOutput::StartThread, this);
  60. return true;
  61. }
  62. void WHIPOutput::Stop(bool signal)
  63. {
  64. std::lock_guard<std::mutex> l(start_stop_mutex);
  65. if (start_stop_thread.joinable())
  66. start_stop_thread.join();
  67. start_stop_thread = std::thread(&WHIPOutput::StopThread, this, signal);
  68. }
  69. void WHIPOutput::Data(struct encoder_packet *packet)
  70. {
  71. if (!packet) {
  72. Stop(false);
  73. obs_output_signal_stop(output, OBS_OUTPUT_ENCODE_ERROR);
  74. return;
  75. }
  76. if (packet->type == OBS_ENCODER_AUDIO) {
  77. int64_t duration = packet->dts_usec - last_audio_timestamp;
  78. Send(packet->data, packet->size, duration, audio_track,
  79. audio_sr_reporter);
  80. last_audio_timestamp = packet->dts_usec;
  81. } else if (packet->type == OBS_ENCODER_VIDEO) {
  82. int64_t duration = packet->dts_usec - last_video_timestamp;
  83. Send(packet->data, packet->size, duration, video_track,
  84. video_sr_reporter);
  85. last_video_timestamp = packet->dts_usec;
  86. }
  87. }
  88. void WHIPOutput::ConfigureAudioTrack(std::string media_stream_id,
  89. std::string cname)
  90. {
  91. auto media_stream_track_id = std::string(media_stream_id + "-audio");
  92. uint32_t ssrc = base_ssrc;
  93. rtc::Description::Audio audio_description(
  94. audio_mid, rtc::Description::Direction::SendOnly);
  95. audio_description.addOpusCodec(audio_payload_type);
  96. audio_description.addSSRC(ssrc, cname, media_stream_id,
  97. media_stream_track_id);
  98. audio_track = peer_connection->addTrack(audio_description);
  99. auto rtp_config = std::make_shared<rtc::RtpPacketizationConfig>(
  100. ssrc, cname, audio_payload_type,
  101. rtc::OpusRtpPacketizer::DefaultClockRate);
  102. auto packetizer = std::make_shared<rtc::OpusRtpPacketizer>(rtp_config);
  103. audio_sr_reporter = std::make_shared<rtc::RtcpSrReporter>(rtp_config);
  104. auto nack_responder = std::make_shared<rtc::RtcpNackResponder>();
  105. packetizer->addToChain(audio_sr_reporter);
  106. packetizer->addToChain(nack_responder);
  107. audio_track->setMediaHandler(packetizer);
  108. }
  109. void WHIPOutput::ConfigureVideoTrack(std::string media_stream_id,
  110. std::string cname)
  111. {
  112. auto media_stream_track_id = std::string(media_stream_id + "-video");
  113. std::shared_ptr<rtc::RtpPacketizer> packetizer;
  114. // More predictable SSRC values between audio and video
  115. uint32_t ssrc = base_ssrc + 1;
  116. rtc::Description::Video video_description(
  117. video_mid, rtc::Description::Direction::SendOnly);
  118. video_description.addSSRC(ssrc, cname, media_stream_id,
  119. media_stream_track_id);
  120. auto rtp_config = std::make_shared<rtc::RtpPacketizationConfig>(
  121. ssrc, cname, video_payload_type,
  122. rtc::H264RtpPacketizer::defaultClockRate);
  123. if (is_av1) {
  124. video_description.addAV1Codec(video_payload_type);
  125. packetizer = std::make_shared<rtc::AV1RtpPacketizer>(
  126. rtc::AV1RtpPacketizer::Packetization::TemporalUnit,
  127. rtp_config, MAX_VIDEO_FRAGMENT_SIZE);
  128. } else {
  129. video_description.addH264Codec(video_payload_type);
  130. packetizer = std::make_shared<rtc::H264RtpPacketizer>(
  131. rtc::H264RtpPacketizer::Separator::StartSequence,
  132. rtp_config, MAX_VIDEO_FRAGMENT_SIZE);
  133. }
  134. video_sr_reporter = std::make_shared<rtc::RtcpSrReporter>(rtp_config);
  135. packetizer->addToChain(video_sr_reporter);
  136. packetizer->addToChain(std::make_shared<rtc::RtcpNackResponder>());
  137. video_track = peer_connection->addTrack(video_description);
  138. video_track->setMediaHandler(packetizer);
  139. }
  140. /**
  141. * @brief Initialize encoders and store connect info provided by the service.
  142. *
  143. * @return bool
  144. */
  145. bool WHIPOutput::Init()
  146. {
  147. if (!obs_output_can_begin_data_capture(output, 0))
  148. return false;
  149. if (!obs_output_initialize_encoders(output, 0))
  150. return false;
  151. obs_service_t *service = obs_output_get_service(output);
  152. if (!service) {
  153. obs_output_signal_stop(output, OBS_OUTPUT_ERROR);
  154. return false;
  155. }
  156. endpoint_url = obs_service_get_connect_info(
  157. service, OBS_SERVICE_CONNECT_INFO_SERVER_URL);
  158. if (endpoint_url.empty()) {
  159. obs_output_signal_stop(output, OBS_OUTPUT_BAD_PATH);
  160. return false;
  161. }
  162. bearer_token = obs_service_get_connect_info(
  163. service, OBS_SERVICE_CONNECT_INFO_BEARER_TOKEN);
  164. return true;
  165. }
  166. /**
  167. * @brief Set up the PeerConnection and media tracks.
  168. *
  169. * @return bool
  170. */
  171. bool WHIPOutput::Setup()
  172. {
  173. peer_connection = std::make_shared<rtc::PeerConnection>();
  174. peer_connection->onStateChange([this](rtc::PeerConnection::State state) {
  175. switch (state) {
  176. case rtc::PeerConnection::State::New:
  177. do_log(LOG_INFO, "PeerConnection state is now: New");
  178. break;
  179. case rtc::PeerConnection::State::Connecting:
  180. do_log(LOG_INFO,
  181. "PeerConnection state is now: Connecting");
  182. start_time_ns = os_gettime_ns();
  183. break;
  184. case rtc::PeerConnection::State::Connected:
  185. do_log(LOG_INFO,
  186. "PeerConnection state is now: Connected");
  187. connect_time_ms =
  188. (int)((os_gettime_ns() - start_time_ns) /
  189. 1000000.0);
  190. do_log(LOG_INFO, "Connect time: %dms",
  191. connect_time_ms.load());
  192. break;
  193. case rtc::PeerConnection::State::Disconnected:
  194. do_log(LOG_INFO,
  195. "PeerConnection state is now: Disconnected");
  196. Stop(false);
  197. obs_output_signal_stop(output, OBS_OUTPUT_DISCONNECTED);
  198. break;
  199. case rtc::PeerConnection::State::Failed:
  200. do_log(LOG_INFO, "PeerConnection state is now: Failed");
  201. Stop(false);
  202. obs_output_signal_stop(output, OBS_OUTPUT_ERROR);
  203. break;
  204. case rtc::PeerConnection::State::Closed:
  205. do_log(LOG_INFO, "PeerConnection state is now: Closed");
  206. break;
  207. }
  208. });
  209. std::string media_stream_id, cname;
  210. media_stream_id.reserve(signaling_media_id_length);
  211. cname.reserve(signaling_media_id_length);
  212. for (int i = 0; i < signaling_media_id_length; ++i) {
  213. media_stream_id += signaling_media_id_valid_char
  214. [rand() % (sizeof(signaling_media_id_valid_char) - 1)];
  215. cname += signaling_media_id_valid_char
  216. [rand() % (sizeof(signaling_media_id_valid_char) - 1)];
  217. }
  218. ConfigureAudioTrack(media_stream_id, cname);
  219. ConfigureVideoTrack(media_stream_id, cname);
  220. peer_connection->setLocalDescription();
  221. return true;
  222. }
  223. bool WHIPOutput::Connect()
  224. {
  225. struct curl_slist *headers = NULL;
  226. headers = curl_slist_append(headers, "Content-Type: application/sdp");
  227. if (!bearer_token.empty()) {
  228. auto bearer_token_header =
  229. std::string("Authorization: Bearer ") + bearer_token;
  230. headers =
  231. curl_slist_append(headers, bearer_token_header.c_str());
  232. }
  233. std::string read_buffer;
  234. std::vector<std::string> location_headers;
  235. auto offer_sdp =
  236. std::string(peer_connection->localDescription().value());
  237. #ifdef DEBUG_SDP
  238. do_log(LOG_DEBUG, "Offer SDP:\n%s", offer_sdp.c_str());
  239. #endif
  240. // Add user-agent to our requests
  241. headers = curl_slist_append(headers, user_agent.c_str());
  242. char error_buffer[CURL_ERROR_SIZE] = {};
  243. CURL *c = curl_easy_init();
  244. curl_easy_setopt(c, CURLOPT_WRITEFUNCTION, curl_writefunction);
  245. curl_easy_setopt(c, CURLOPT_WRITEDATA, (void *)&read_buffer);
  246. curl_easy_setopt(c, CURLOPT_HEADERFUNCTION,
  247. curl_header_location_function);
  248. curl_easy_setopt(c, CURLOPT_HEADERDATA, (void *)&location_headers);
  249. curl_easy_setopt(c, CURLOPT_HTTPHEADER, headers);
  250. curl_easy_setopt(c, CURLOPT_URL, endpoint_url.c_str());
  251. curl_easy_setopt(c, CURLOPT_POST, 1L);
  252. curl_easy_setopt(c, CURLOPT_COPYPOSTFIELDS, offer_sdp.c_str());
  253. curl_easy_setopt(c, CURLOPT_TIMEOUT, 8L);
  254. curl_easy_setopt(c, CURLOPT_FOLLOWLOCATION, 1L);
  255. curl_easy_setopt(c, CURLOPT_UNRESTRICTED_AUTH, 1L);
  256. curl_easy_setopt(c, CURLOPT_ERRORBUFFER, error_buffer);
  257. auto cleanup = [&]() {
  258. curl_easy_cleanup(c);
  259. curl_slist_free_all(headers);
  260. };
  261. CURLcode res = curl_easy_perform(c);
  262. if (res != CURLE_OK) {
  263. do_log(LOG_ERROR, "Connect failed: %s",
  264. error_buffer[0] ? error_buffer
  265. : curl_easy_strerror(res));
  266. cleanup();
  267. obs_output_signal_stop(output, OBS_OUTPUT_CONNECT_FAILED);
  268. return false;
  269. }
  270. long response_code;
  271. curl_easy_getinfo(c, CURLINFO_RESPONSE_CODE, &response_code);
  272. if (response_code != 201) {
  273. do_log(LOG_ERROR,
  274. "Connect failed: HTTP endpoint returned response code %ld",
  275. response_code);
  276. cleanup();
  277. obs_output_signal_stop(output, OBS_OUTPUT_INVALID_STREAM);
  278. return false;
  279. }
  280. if (read_buffer.empty()) {
  281. do_log(LOG_ERROR,
  282. "Connect failed: No data returned from HTTP endpoint request");
  283. cleanup();
  284. obs_output_signal_stop(output, OBS_OUTPUT_CONNECT_FAILED);
  285. return false;
  286. }
  287. long redirect_count = 0;
  288. curl_easy_getinfo(c, CURLINFO_REDIRECT_COUNT, &redirect_count);
  289. if (location_headers.size() < static_cast<size_t>(redirect_count) + 1) {
  290. do_log(LOG_ERROR,
  291. "WHIP server did not provide a resource URL via the Location header");
  292. cleanup();
  293. obs_output_signal_stop(output, OBS_OUTPUT_CONNECT_FAILED);
  294. return false;
  295. }
  296. CURLU *url_builder = curl_url();
  297. auto last_location_header = location_headers.back();
  298. // If Location header doesn't start with `http` it is a relative URL.
  299. // Construct a absolute URL using the host of the effective URL
  300. if (last_location_header.find("http") != 0) {
  301. char *effective_url = nullptr;
  302. curl_easy_getinfo(c, CURLINFO_EFFECTIVE_URL, &effective_url);
  303. if (effective_url == nullptr) {
  304. do_log(LOG_ERROR, "Failed to build Resource URL");
  305. cleanup();
  306. obs_output_signal_stop(output,
  307. OBS_OUTPUT_CONNECT_FAILED);
  308. return false;
  309. }
  310. curl_url_set(url_builder, CURLUPART_URL, effective_url, 0);
  311. curl_url_set(url_builder, CURLUPART_PATH,
  312. last_location_header.c_str(), 0);
  313. curl_url_set(url_builder, CURLUPART_QUERY, "", 0);
  314. } else {
  315. curl_url_set(url_builder, CURLUPART_URL,
  316. last_location_header.c_str(), 0);
  317. }
  318. char *url = nullptr;
  319. CURLUcode rc = curl_url_get(url_builder, CURLUPART_URL, &url,
  320. CURLU_NO_DEFAULT_PORT);
  321. if (rc) {
  322. do_log(LOG_ERROR,
  323. "WHIP server provided a invalid resource URL via the Location header");
  324. cleanup();
  325. obs_output_signal_stop(output, OBS_OUTPUT_CONNECT_FAILED);
  326. return false;
  327. }
  328. resource_url = url;
  329. curl_free(url);
  330. do_log(LOG_DEBUG, "WHIP Resource URL is: %s", resource_url.c_str());
  331. curl_url_cleanup(url_builder);
  332. #ifdef DEBUG_SDP
  333. do_log(LOG_DEBUG, "Answer SDP:\n%s", read_buffer.c_str());
  334. #endif
  335. auto response = std::string(read_buffer);
  336. response.erase(0, response.find("v=0"));
  337. rtc::Description answer(response, "answer");
  338. peer_connection->setRemoteDescription(answer);
  339. cleanup();
  340. return true;
  341. }
  342. void WHIPOutput::StartThread()
  343. {
  344. if (!Init())
  345. return;
  346. if (!Setup())
  347. return;
  348. if (!Connect()) {
  349. peer_connection->close();
  350. peer_connection = nullptr;
  351. audio_track = nullptr;
  352. video_track = nullptr;
  353. return;
  354. }
  355. obs_output_begin_data_capture(output, 0);
  356. running = true;
  357. }
  358. void WHIPOutput::SendDelete()
  359. {
  360. if (resource_url.empty()) {
  361. do_log(LOG_DEBUG,
  362. "No resource URL available, not sending DELETE");
  363. return;
  364. }
  365. struct curl_slist *headers = NULL;
  366. if (!bearer_token.empty()) {
  367. auto bearer_token_header =
  368. std::string("Authorization: Bearer ") + bearer_token;
  369. headers =
  370. curl_slist_append(headers, bearer_token_header.c_str());
  371. }
  372. // Add user-agent to our requests
  373. headers = curl_slist_append(headers, user_agent.c_str());
  374. char error_buffer[CURL_ERROR_SIZE] = {};
  375. CURL *c = curl_easy_init();
  376. curl_easy_setopt(c, CURLOPT_HTTPHEADER, headers);
  377. curl_easy_setopt(c, CURLOPT_URL, resource_url.c_str());
  378. curl_easy_setopt(c, CURLOPT_CUSTOMREQUEST, "DELETE");
  379. curl_easy_setopt(c, CURLOPT_TIMEOUT, 8L);
  380. curl_easy_setopt(c, CURLOPT_ERRORBUFFER, error_buffer);
  381. auto cleanup = [&]() {
  382. curl_easy_cleanup(c);
  383. curl_slist_free_all(headers);
  384. };
  385. CURLcode res = curl_easy_perform(c);
  386. if (res != CURLE_OK) {
  387. do_log(LOG_WARNING,
  388. "DELETE request for resource URL failed: %s",
  389. error_buffer[0] ? error_buffer
  390. : curl_easy_strerror(res));
  391. cleanup();
  392. return;
  393. }
  394. long response_code;
  395. curl_easy_getinfo(c, CURLINFO_RESPONSE_CODE, &response_code);
  396. if (response_code != 200) {
  397. do_log(LOG_WARNING,
  398. "DELETE request for resource URL failed. HTTP Code: %ld",
  399. response_code);
  400. cleanup();
  401. return;
  402. }
  403. do_log(LOG_DEBUG,
  404. "Successfully performed DELETE request for resource URL");
  405. resource_url.clear();
  406. cleanup();
  407. }
  408. void WHIPOutput::StopThread(bool signal)
  409. {
  410. if (peer_connection != nullptr) {
  411. peer_connection->close();
  412. peer_connection = nullptr;
  413. audio_track = nullptr;
  414. video_track = nullptr;
  415. }
  416. SendDelete();
  417. /*
  418. * "signal" exists because we have to preserve the "running" state
  419. * across reconnect attempts. If we don't emit a signal if
  420. * something calls obs_output_stop() and it's reconnecting, you'll
  421. * desync the UI, as the output will be "stopped" and not
  422. * "reconnecting", but the "stop" signal will have never been
  423. * emitted.
  424. */
  425. if (running && signal) {
  426. obs_output_signal_stop(output, OBS_OUTPUT_SUCCESS);
  427. running = false;
  428. }
  429. total_bytes_sent = 0;
  430. connect_time_ms = 0;
  431. start_time_ns = 0;
  432. last_audio_timestamp = 0;
  433. last_video_timestamp = 0;
  434. }
  435. void WHIPOutput::Send(void *data, uintptr_t size, uint64_t duration,
  436. std::shared_ptr<rtc::Track> track,
  437. std::shared_ptr<rtc::RtcpSrReporter> rtcp_sr_reporter)
  438. {
  439. if (track == nullptr || !track->isOpen())
  440. return;
  441. std::vector<rtc::byte> sample{(rtc::byte *)data,
  442. (rtc::byte *)data + size};
  443. auto rtp_config = rtcp_sr_reporter->rtpConfig;
  444. // Sample time is in microseconds, we need to convert it to seconds
  445. auto elapsed_seconds = double(duration) / (1000.0 * 1000.0);
  446. // Get elapsed time in clock rate
  447. uint32_t elapsed_timestamp =
  448. rtp_config->secondsToTimestamp(elapsed_seconds);
  449. // Set new timestamp
  450. rtp_config->timestamp = rtp_config->timestamp + elapsed_timestamp;
  451. // get elapsed time in clock rate from last RTCP sender report
  452. auto report_elapsed_timestamp =
  453. rtp_config->timestamp -
  454. rtcp_sr_reporter->lastReportedTimestamp();
  455. // check if last report was at least 1 second ago
  456. if (rtp_config->timestampToSeconds(report_elapsed_timestamp) > 1)
  457. rtcp_sr_reporter->setNeedsToReport();
  458. try {
  459. track->send(sample);
  460. total_bytes_sent += sample.size();
  461. } catch (const std::exception &e) {
  462. do_log(LOG_ERROR, "error: %s ", e.what());
  463. }
  464. }
  465. void register_whip_output()
  466. {
  467. struct obs_output_info info = {};
  468. info.id = "whip_output";
  469. info.flags = OBS_OUTPUT_AV | OBS_OUTPUT_ENCODED | OBS_OUTPUT_SERVICE;
  470. info.get_name = [](void *) -> const char * {
  471. return obs_module_text("Output.Name");
  472. };
  473. info.create = [](obs_data_t *settings, obs_output_t *output) -> void * {
  474. return new WHIPOutput(settings, output);
  475. };
  476. info.destroy = [](void *priv_data) {
  477. delete static_cast<WHIPOutput *>(priv_data);
  478. };
  479. info.start = [](void *priv_data) -> bool {
  480. return static_cast<WHIPOutput *>(priv_data)->Start();
  481. };
  482. info.stop = [](void *priv_data, uint64_t) {
  483. static_cast<WHIPOutput *>(priv_data)->Stop();
  484. };
  485. info.encoded_packet = [](void *priv_data,
  486. struct encoder_packet *packet) {
  487. static_cast<WHIPOutput *>(priv_data)->Data(packet);
  488. };
  489. info.get_defaults = [](obs_data_t *) {
  490. };
  491. info.get_properties = [](void *) -> obs_properties_t * {
  492. return obs_properties_create();
  493. };
  494. info.get_total_bytes = [](void *priv_data) -> uint64_t {
  495. return (uint64_t) static_cast<WHIPOutput *>(priv_data)
  496. ->GetTotalBytes();
  497. };
  498. info.get_connect_time_ms = [](void *priv_data) -> int {
  499. return static_cast<WHIPOutput *>(priv_data)->GetConnectTime();
  500. };
  501. info.encoded_video_codecs = "h264;av1";
  502. info.encoded_audio_codecs = "opus";
  503. info.protocols = "WHIP";
  504. obs_register_output(&info);
  505. }