whip-output.cpp 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579
  1. #include "whip-output.h"
  2. #include "whip-utils.h"
  3. /*
  4. * Sets the maximum size for a video fragment. Effective range is
  5. * 576-1470, with a lower value equating to more packets created,
  6. * but also better network compatability.
  7. */
  8. static uint16_t MAX_VIDEO_FRAGMENT_SIZE = 1200;
  9. const int signaling_media_id_length = 16;
  10. const char signaling_media_id_valid_char[] = "0123456789"
  11. "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
  12. "abcdefghijklmnopqrstuvwxyz";
  13. const std::string user_agent = generate_user_agent();
  14. const char *audio_mid = "0";
  15. const uint8_t audio_payload_type = 111;
  16. const char *video_mid = "1";
  17. const uint8_t video_payload_type = 96;
  18. WHIPOutput::WHIPOutput(obs_data_t *, obs_output_t *output)
  19. : output(output),
  20. endpoint_url(),
  21. bearer_token(),
  22. resource_url(),
  23. running(false),
  24. start_stop_mutex(),
  25. start_stop_thread(),
  26. base_ssrc(generate_random_u32()),
  27. peer_connection(nullptr),
  28. audio_track(nullptr),
  29. video_track(nullptr),
  30. total_bytes_sent(0),
  31. connect_time_ms(0),
  32. start_time_ns(0),
  33. last_audio_timestamp(0),
  34. last_video_timestamp(0)
  35. {
  36. }
  37. WHIPOutput::~WHIPOutput()
  38. {
  39. Stop();
  40. std::lock_guard<std::mutex> l(start_stop_mutex);
  41. if (start_stop_thread.joinable())
  42. start_stop_thread.join();
  43. }
  44. bool WHIPOutput::Start()
  45. {
  46. std::lock_guard<std::mutex> l(start_stop_mutex);
  47. if (!obs_output_can_begin_data_capture(output, 0))
  48. return false;
  49. if (!obs_output_initialize_encoders(output, 0))
  50. return false;
  51. if (start_stop_thread.joinable())
  52. start_stop_thread.join();
  53. start_stop_thread = std::thread(&WHIPOutput::StartThread, this);
  54. return true;
  55. }
  56. void WHIPOutput::Stop(bool signal)
  57. {
  58. std::lock_guard<std::mutex> l(start_stop_mutex);
  59. if (start_stop_thread.joinable())
  60. start_stop_thread.join();
  61. start_stop_thread = std::thread(&WHIPOutput::StopThread, this, signal);
  62. }
  63. void WHIPOutput::Data(struct encoder_packet *packet)
  64. {
  65. if (!packet) {
  66. Stop(false);
  67. obs_output_signal_stop(output, OBS_OUTPUT_ENCODE_ERROR);
  68. return;
  69. }
  70. if (packet->type == OBS_ENCODER_AUDIO) {
  71. int64_t duration = packet->dts_usec - last_audio_timestamp;
  72. Send(packet->data, packet->size, duration, audio_track,
  73. audio_sr_reporter);
  74. last_audio_timestamp = packet->dts_usec;
  75. } else if (packet->type == OBS_ENCODER_VIDEO) {
  76. int64_t duration = packet->dts_usec - last_video_timestamp;
  77. Send(packet->data, packet->size, duration, video_track,
  78. video_sr_reporter);
  79. last_video_timestamp = packet->dts_usec;
  80. }
  81. }
  82. void WHIPOutput::ConfigureAudioTrack(std::string media_stream_id,
  83. std::string cname)
  84. {
  85. auto media_stream_track_id = std::string(media_stream_id + "-audio");
  86. uint32_t ssrc = base_ssrc;
  87. rtc::Description::Audio audio_description(
  88. audio_mid, rtc::Description::Direction::SendOnly);
  89. audio_description.addOpusCodec(audio_payload_type);
  90. audio_description.addSSRC(ssrc, cname, media_stream_id,
  91. media_stream_track_id);
  92. audio_track = peer_connection->addTrack(audio_description);
  93. auto rtp_config = std::make_shared<rtc::RtpPacketizationConfig>(
  94. ssrc, cname, audio_payload_type,
  95. rtc::OpusRtpPacketizer::defaultClockRate);
  96. auto packetizer = std::make_shared<rtc::OpusRtpPacketizer>(rtp_config);
  97. audio_sr_reporter = std::make_shared<rtc::RtcpSrReporter>(rtp_config);
  98. auto nack_responder = std::make_shared<rtc::RtcpNackResponder>();
  99. auto opus_handler =
  100. std::make_shared<rtc::OpusPacketizationHandler>(packetizer);
  101. opus_handler->addToChain(audio_sr_reporter);
  102. opus_handler->addToChain(nack_responder);
  103. audio_track->setMediaHandler(opus_handler);
  104. }
  105. void WHIPOutput::ConfigureVideoTrack(std::string media_stream_id,
  106. std::string cname)
  107. {
  108. auto media_stream_track_id = std::string(media_stream_id + "-video");
  109. // More predictable SSRC values between audio and video
  110. uint32_t ssrc = base_ssrc + 1;
  111. rtc::Description::Video video_description(
  112. video_mid, rtc::Description::Direction::SendOnly);
  113. video_description.addH264Codec(video_payload_type);
  114. video_description.addSSRC(ssrc, cname, media_stream_id,
  115. media_stream_track_id);
  116. video_track = peer_connection->addTrack(video_description);
  117. auto rtp_config = std::make_shared<rtc::RtpPacketizationConfig>(
  118. ssrc, cname, video_payload_type,
  119. rtc::H264RtpPacketizer::defaultClockRate);
  120. auto packetizer = std::make_shared<rtc::H264RtpPacketizer>(
  121. rtc::H264RtpPacketizer::Separator::StartSequence, rtp_config,
  122. MAX_VIDEO_FRAGMENT_SIZE);
  123. video_sr_reporter = std::make_shared<rtc::RtcpSrReporter>(rtp_config);
  124. auto nack_responder = std::make_shared<rtc::RtcpNackResponder>();
  125. auto h264_handler =
  126. std::make_shared<rtc::H264PacketizationHandler>(packetizer);
  127. h264_handler->addToChain(video_sr_reporter);
  128. h264_handler->addToChain(nack_responder);
  129. video_track->setMediaHandler(h264_handler);
  130. }
  131. /**
  132. * @brief Initialize encoders and store connect info provided by the service.
  133. *
  134. * @return bool
  135. */
  136. bool WHIPOutput::Init()
  137. {
  138. if (!obs_output_can_begin_data_capture(output, 0))
  139. return false;
  140. if (!obs_output_initialize_encoders(output, 0))
  141. return false;
  142. obs_service_t *service = obs_output_get_service(output);
  143. if (!service) {
  144. obs_output_signal_stop(output, OBS_OUTPUT_ERROR);
  145. return false;
  146. }
  147. endpoint_url = obs_service_get_connect_info(
  148. service, OBS_SERVICE_CONNECT_INFO_SERVER_URL);
  149. if (endpoint_url.empty()) {
  150. obs_output_signal_stop(output, OBS_OUTPUT_BAD_PATH);
  151. return false;
  152. }
  153. bearer_token = obs_service_get_connect_info(
  154. service, OBS_SERVICE_CONNECT_INFO_BEARER_TOKEN);
  155. return true;
  156. }
  157. /**
  158. * @brief Set up the PeerConnection and media tracks.
  159. *
  160. * @return bool
  161. */
  162. bool WHIPOutput::Setup()
  163. {
  164. peer_connection = std::make_shared<rtc::PeerConnection>();
  165. peer_connection->onStateChange([this](rtc::PeerConnection::State state) {
  166. switch (state) {
  167. case rtc::PeerConnection::State::New:
  168. do_log(LOG_INFO, "PeerConnection state is now: New");
  169. break;
  170. case rtc::PeerConnection::State::Connecting:
  171. do_log(LOG_INFO,
  172. "PeerConnection state is now: Connecting");
  173. start_time_ns = os_gettime_ns();
  174. break;
  175. case rtc::PeerConnection::State::Connected:
  176. do_log(LOG_INFO,
  177. "PeerConnection state is now: Connected");
  178. connect_time_ms =
  179. (int)((os_gettime_ns() - start_time_ns) /
  180. 1000000.0);
  181. do_log(LOG_INFO, "Connect time: %dms",
  182. connect_time_ms.load());
  183. break;
  184. case rtc::PeerConnection::State::Disconnected:
  185. do_log(LOG_INFO,
  186. "PeerConnection state is now: Disconnected");
  187. Stop(false);
  188. obs_output_signal_stop(output, OBS_OUTPUT_DISCONNECTED);
  189. break;
  190. case rtc::PeerConnection::State::Failed:
  191. do_log(LOG_INFO, "PeerConnection state is now: Failed");
  192. Stop(false);
  193. obs_output_signal_stop(output, OBS_OUTPUT_ERROR);
  194. break;
  195. case rtc::PeerConnection::State::Closed:
  196. do_log(LOG_INFO, "PeerConnection state is now: Closed");
  197. break;
  198. }
  199. });
  200. std::string media_stream_id, cname;
  201. media_stream_id.reserve(signaling_media_id_length);
  202. cname.reserve(signaling_media_id_length);
  203. for (int i = 0; i < signaling_media_id_length; ++i) {
  204. media_stream_id += signaling_media_id_valid_char
  205. [rand() % (sizeof(signaling_media_id_valid_char) - 1)];
  206. cname += signaling_media_id_valid_char
  207. [rand() % (sizeof(signaling_media_id_valid_char) - 1)];
  208. }
  209. ConfigureAudioTrack(media_stream_id, cname);
  210. ConfigureVideoTrack(media_stream_id, cname);
  211. peer_connection->setLocalDescription();
  212. return true;
  213. }
  214. bool WHIPOutput::Connect()
  215. {
  216. struct curl_slist *headers = NULL;
  217. headers = curl_slist_append(headers, "Content-Type: application/sdp");
  218. if (!bearer_token.empty()) {
  219. auto bearer_token_header =
  220. std::string("Authorization: Bearer ") + bearer_token;
  221. headers =
  222. curl_slist_append(headers, bearer_token_header.c_str());
  223. }
  224. std::string read_buffer;
  225. std::vector<std::string> location_headers;
  226. auto offer_sdp =
  227. std::string(peer_connection->localDescription().value());
  228. #ifdef DEBUG_SDP
  229. do_log(LOG_DEBUG, "Offer SDP:\n%s", offer_sdp.c_str());
  230. #endif
  231. // Add user-agent to our requests
  232. headers = curl_slist_append(headers, user_agent.c_str());
  233. CURL *c = curl_easy_init();
  234. curl_easy_setopt(c, CURLOPT_WRITEFUNCTION, curl_writefunction);
  235. curl_easy_setopt(c, CURLOPT_WRITEDATA, (void *)&read_buffer);
  236. curl_easy_setopt(c, CURLOPT_HEADERFUNCTION,
  237. curl_header_location_function);
  238. curl_easy_setopt(c, CURLOPT_HEADERDATA, (void *)&location_headers);
  239. curl_easy_setopt(c, CURLOPT_HTTPHEADER, headers);
  240. curl_easy_setopt(c, CURLOPT_URL, endpoint_url.c_str());
  241. curl_easy_setopt(c, CURLOPT_POST, 1L);
  242. curl_easy_setopt(c, CURLOPT_COPYPOSTFIELDS, offer_sdp.c_str());
  243. curl_easy_setopt(c, CURLOPT_TIMEOUT, 8L);
  244. curl_easy_setopt(c, CURLOPT_FOLLOWLOCATION, 1L);
  245. curl_easy_setopt(c, CURLOPT_UNRESTRICTED_AUTH, 1L);
  246. auto cleanup = [&]() {
  247. curl_easy_cleanup(c);
  248. curl_slist_free_all(headers);
  249. };
  250. CURLcode res = curl_easy_perform(c);
  251. if (res != CURLE_OK) {
  252. do_log(LOG_ERROR,
  253. "Connect failed: CURL returned result not CURLE_OK");
  254. cleanup();
  255. obs_output_signal_stop(output, OBS_OUTPUT_CONNECT_FAILED);
  256. return false;
  257. }
  258. long response_code;
  259. curl_easy_getinfo(c, CURLINFO_RESPONSE_CODE, &response_code);
  260. if (response_code != 201) {
  261. do_log(LOG_ERROR,
  262. "Connect failed: HTTP endpoint returned response code %ld",
  263. response_code);
  264. cleanup();
  265. obs_output_signal_stop(output, OBS_OUTPUT_INVALID_STREAM);
  266. return false;
  267. }
  268. if (read_buffer.empty()) {
  269. do_log(LOG_ERROR,
  270. "Connect failed: No data returned from HTTP endpoint request");
  271. cleanup();
  272. obs_output_signal_stop(output, OBS_OUTPUT_CONNECT_FAILED);
  273. return false;
  274. }
  275. long redirect_count = 0;
  276. curl_easy_getinfo(c, CURLINFO_REDIRECT_COUNT, &redirect_count);
  277. if (location_headers.size() < static_cast<size_t>(redirect_count) + 1) {
  278. do_log(LOG_ERROR,
  279. "WHIP server did not provide a resource URL via the Location header");
  280. cleanup();
  281. obs_output_signal_stop(output, OBS_OUTPUT_CONNECT_FAILED);
  282. return false;
  283. }
  284. CURLU *url_builder = curl_url();
  285. auto last_location_header = location_headers.back();
  286. // If Location header doesn't start with `http` it is a relative URL.
  287. // Construct a absolute URL using the host of the effective URL
  288. if (last_location_header.find("http") != 0) {
  289. char *effective_url = nullptr;
  290. curl_easy_getinfo(c, CURLINFO_EFFECTIVE_URL, &effective_url);
  291. if (effective_url == nullptr) {
  292. do_log(LOG_ERROR, "Failed to build Resource URL");
  293. cleanup();
  294. obs_output_signal_stop(output,
  295. OBS_OUTPUT_CONNECT_FAILED);
  296. return false;
  297. }
  298. curl_url_set(url_builder, CURLUPART_URL, effective_url, 0);
  299. curl_url_set(url_builder, CURLUPART_PATH,
  300. last_location_header.c_str(), 0);
  301. curl_url_set(url_builder, CURLUPART_QUERY, "", 0);
  302. } else {
  303. curl_url_set(url_builder, CURLUPART_URL,
  304. last_location_header.c_str(), 0);
  305. }
  306. char *url = nullptr;
  307. CURLUcode rc = curl_url_get(url_builder, CURLUPART_URL, &url,
  308. CURLU_NO_DEFAULT_PORT);
  309. if (rc) {
  310. do_log(LOG_ERROR,
  311. "WHIP server provided a invalid resource URL via the Location header");
  312. cleanup();
  313. obs_output_signal_stop(output, OBS_OUTPUT_CONNECT_FAILED);
  314. return false;
  315. }
  316. resource_url = url;
  317. curl_free(url);
  318. do_log(LOG_DEBUG, "WHIP Resource URL is: %s", resource_url.c_str());
  319. curl_url_cleanup(url_builder);
  320. #ifdef DEBUG_SDP
  321. do_log(LOG_DEBUG, "Answer SDP:\n%s", read_buffer.c_str());
  322. #endif
  323. auto response = std::string(read_buffer);
  324. response.erase(0, response.find("v=0"));
  325. rtc::Description answer(response, "answer");
  326. peer_connection->setRemoteDescription(answer);
  327. cleanup();
  328. return true;
  329. }
  330. void WHIPOutput::StartThread()
  331. {
  332. if (!Init())
  333. return;
  334. if (!Setup())
  335. return;
  336. if (!Connect()) {
  337. peer_connection->close();
  338. peer_connection = nullptr;
  339. audio_track = nullptr;
  340. video_track = nullptr;
  341. return;
  342. }
  343. obs_output_begin_data_capture(output, 0);
  344. running = true;
  345. }
  346. void WHIPOutput::SendDelete()
  347. {
  348. if (resource_url.empty()) {
  349. do_log(LOG_DEBUG,
  350. "No resource URL available, not sending DELETE");
  351. return;
  352. }
  353. struct curl_slist *headers = NULL;
  354. if (!bearer_token.empty()) {
  355. auto bearer_token_header =
  356. std::string("Authorization: Bearer ") + bearer_token;
  357. headers =
  358. curl_slist_append(headers, bearer_token_header.c_str());
  359. }
  360. // Add user-agent to our requests
  361. headers = curl_slist_append(headers, user_agent.c_str());
  362. CURL *c = curl_easy_init();
  363. curl_easy_setopt(c, CURLOPT_HTTPHEADER, headers);
  364. curl_easy_setopt(c, CURLOPT_URL, resource_url.c_str());
  365. curl_easy_setopt(c, CURLOPT_CUSTOMREQUEST, "DELETE");
  366. curl_easy_setopt(c, CURLOPT_TIMEOUT, 8L);
  367. auto cleanup = [&]() {
  368. curl_easy_cleanup(c);
  369. curl_slist_free_all(headers);
  370. };
  371. CURLcode res = curl_easy_perform(c);
  372. if (res != CURLE_OK) {
  373. do_log(LOG_WARNING,
  374. "DELETE request for resource URL failed. Reason: %s",
  375. curl_easy_strerror(res));
  376. cleanup();
  377. return;
  378. }
  379. long response_code;
  380. curl_easy_getinfo(c, CURLINFO_RESPONSE_CODE, &response_code);
  381. if (response_code != 200) {
  382. do_log(LOG_WARNING,
  383. "DELETE request for resource URL failed. HTTP Code: %ld",
  384. response_code);
  385. cleanup();
  386. return;
  387. }
  388. do_log(LOG_DEBUG,
  389. "Successfully performed DELETE request for resource URL");
  390. resource_url.clear();
  391. cleanup();
  392. }
  393. void WHIPOutput::StopThread(bool signal)
  394. {
  395. if (peer_connection != nullptr) {
  396. peer_connection->close();
  397. peer_connection = nullptr;
  398. audio_track = nullptr;
  399. video_track = nullptr;
  400. }
  401. SendDelete();
  402. /*
  403. * "signal" exists because we have to preserve the "running" state
  404. * across reconnect attempts. If we don't emit a signal if
  405. * something calls obs_output_stop() and it's reconnecting, you'll
  406. * desync the UI, as the output will be "stopped" and not
  407. * "reconnecting", but the "stop" signal will have never been
  408. * emitted.
  409. */
  410. if (running && signal) {
  411. obs_output_signal_stop(output, OBS_OUTPUT_SUCCESS);
  412. running = false;
  413. }
  414. total_bytes_sent = 0;
  415. connect_time_ms = 0;
  416. start_time_ns = 0;
  417. last_audio_timestamp = 0;
  418. last_video_timestamp = 0;
  419. }
  420. void WHIPOutput::Send(void *data, uintptr_t size, uint64_t duration,
  421. std::shared_ptr<rtc::Track> track,
  422. std::shared_ptr<rtc::RtcpSrReporter> rtcp_sr_reporter)
  423. {
  424. if (track == nullptr || !track->isOpen())
  425. return;
  426. std::vector<rtc::byte> sample{(rtc::byte *)data,
  427. (rtc::byte *)data + size};
  428. auto rtp_config = rtcp_sr_reporter->rtpConfig;
  429. // Sample time is in microseconds, we need to convert it to seconds
  430. auto elapsed_seconds = double(duration) / (1000.0 * 1000.0);
  431. // Get elapsed time in clock rate
  432. uint32_t elapsed_timestamp =
  433. rtp_config->secondsToTimestamp(elapsed_seconds);
  434. // Set new timestamp
  435. rtp_config->timestamp = rtp_config->timestamp + elapsed_timestamp;
  436. // get elapsed time in clock rate from last RTCP sender report
  437. auto report_elapsed_timestamp =
  438. rtp_config->timestamp -
  439. rtcp_sr_reporter->lastReportedTimestamp();
  440. // check if last report was at least 1 second ago
  441. if (rtp_config->timestampToSeconds(report_elapsed_timestamp) > 1)
  442. rtcp_sr_reporter->setNeedsToReport();
  443. try {
  444. track->send(sample);
  445. total_bytes_sent += sample.size();
  446. } catch (const std::exception &e) {
  447. do_log(LOG_ERROR, "error: %s ", e.what());
  448. }
  449. }
  450. void register_whip_output()
  451. {
  452. struct obs_output_info info = {};
  453. info.id = "whip_output";
  454. info.flags = OBS_OUTPUT_AV | OBS_OUTPUT_ENCODED | OBS_OUTPUT_SERVICE;
  455. info.get_name = [](void *) -> const char * {
  456. return obs_module_text("Output.Name");
  457. };
  458. info.create = [](obs_data_t *settings, obs_output_t *output) -> void * {
  459. return new WHIPOutput(settings, output);
  460. };
  461. info.destroy = [](void *priv_data) {
  462. delete static_cast<WHIPOutput *>(priv_data);
  463. };
  464. info.start = [](void *priv_data) -> bool {
  465. return static_cast<WHIPOutput *>(priv_data)->Start();
  466. };
  467. info.stop = [](void *priv_data, uint64_t) {
  468. static_cast<WHIPOutput *>(priv_data)->Stop();
  469. };
  470. info.encoded_packet = [](void *priv_data,
  471. struct encoder_packet *packet) {
  472. static_cast<WHIPOutput *>(priv_data)->Data(packet);
  473. };
  474. info.get_defaults = [](obs_data_t *) {
  475. };
  476. info.get_properties = [](void *) -> obs_properties_t * {
  477. return obs_properties_create();
  478. };
  479. info.get_total_bytes = [](void *priv_data) -> uint64_t {
  480. return (uint64_t) static_cast<WHIPOutput *>(priv_data)
  481. ->GetTotalBytes();
  482. };
  483. info.get_connect_time_ms = [](void *priv_data) -> int {
  484. return static_cast<WHIPOutput *>(priv_data)->GetConnectTime();
  485. };
  486. info.encoded_video_codecs = "h264";
  487. info.encoded_audio_codecs = "opus";
  488. info.protocols = "WHIP";
  489. obs_register_output(&info);
  490. }