rtpenc.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507
  1. /*
  2. * RTP output format
  3. * Copyright (c) 2002 Fabrice Bellard
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include "avformat.h"
  22. #include "mpegts.h"
  23. #include "internal.h"
  24. #include "libavutil/mathematics.h"
  25. #include "libavutil/random_seed.h"
  26. #include "libavutil/opt.h"
  27. #include "rtpenc.h"
  28. //#define DEBUG
  29. static const AVOption options[] = {
  30. FF_RTP_FLAG_OPTS(RTPMuxContext, flags)
  31. { "payload_type", "Specify RTP payload type", offsetof(RTPMuxContext, payload_type), AV_OPT_TYPE_INT, {.dbl = -1 }, -1, 127, AV_OPT_FLAG_ENCODING_PARAM },
  32. { NULL },
  33. };
  34. static const AVClass rtp_muxer_class = {
  35. .class_name = "RTP muxer",
  36. .item_name = av_default_item_name,
  37. .option = options,
  38. .version = LIBAVUTIL_VERSION_INT,
  39. };
  40. #define RTCP_SR_SIZE 28
  41. static int is_supported(enum CodecID id)
  42. {
  43. switch(id) {
  44. case CODEC_ID_H263:
  45. case CODEC_ID_H263P:
  46. case CODEC_ID_H264:
  47. case CODEC_ID_MPEG1VIDEO:
  48. case CODEC_ID_MPEG2VIDEO:
  49. case CODEC_ID_MPEG4:
  50. case CODEC_ID_AAC:
  51. case CODEC_ID_MP2:
  52. case CODEC_ID_MP3:
  53. case CODEC_ID_PCM_ALAW:
  54. case CODEC_ID_PCM_MULAW:
  55. case CODEC_ID_PCM_S8:
  56. case CODEC_ID_PCM_S16BE:
  57. case CODEC_ID_PCM_S16LE:
  58. case CODEC_ID_PCM_U16BE:
  59. case CODEC_ID_PCM_U16LE:
  60. case CODEC_ID_PCM_U8:
  61. case CODEC_ID_MPEG2TS:
  62. case CODEC_ID_AMR_NB:
  63. case CODEC_ID_AMR_WB:
  64. case CODEC_ID_VORBIS:
  65. case CODEC_ID_THEORA:
  66. case CODEC_ID_VP8:
  67. case CODEC_ID_ADPCM_G722:
  68. case CODEC_ID_ADPCM_G726:
  69. return 1;
  70. default:
  71. return 0;
  72. }
  73. }
  74. static int rtp_write_header(AVFormatContext *s1)
  75. {
  76. RTPMuxContext *s = s1->priv_data;
  77. int n;
  78. AVStream *st;
  79. if (s1->nb_streams != 1) {
  80. av_log(s1, AV_LOG_ERROR, "Only one stream supported in the RTP muxer\n");
  81. return AVERROR(EINVAL);
  82. }
  83. st = s1->streams[0];
  84. if (!is_supported(st->codec->codec_id)) {
  85. av_log(s1, AV_LOG_ERROR, "Unsupported codec %s\n", avcodec_get_name(st->codec->codec_id));
  86. return -1;
  87. }
  88. if (s->payload_type < 0)
  89. s->payload_type = ff_rtp_get_payload_type(s1, st->codec);
  90. s->base_timestamp = av_get_random_seed();
  91. s->timestamp = s->base_timestamp;
  92. s->cur_timestamp = 0;
  93. s->ssrc = av_get_random_seed();
  94. s->first_packet = 1;
  95. s->first_rtcp_ntp_time = ff_ntp_time();
  96. if (s1->start_time_realtime)
  97. /* Round the NTP time to whole milliseconds. */
  98. s->first_rtcp_ntp_time = (s1->start_time_realtime / 1000) * 1000 +
  99. NTP_OFFSET_US;
  100. if (s1->packet_size) {
  101. if (s1->pb->max_packet_size)
  102. s1->packet_size = FFMIN(s1->packet_size,
  103. s1->pb->max_packet_size);
  104. } else
  105. s1->packet_size = s1->pb->max_packet_size;
  106. if (s1->packet_size <= 12) {
  107. av_log(s1, AV_LOG_ERROR, "Max packet size %d too low\n", s1->packet_size);
  108. return AVERROR(EIO);
  109. }
  110. s->buf = av_malloc(s1->packet_size);
  111. if (s->buf == NULL) {
  112. return AVERROR(ENOMEM);
  113. }
  114. s->max_payload_size = s1->packet_size - 12;
  115. s->max_frames_per_packet = 0;
  116. if (s1->max_delay > 0) {
  117. if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  118. int frame_size = av_get_audio_frame_duration(st->codec, 0);
  119. if (!frame_size)
  120. frame_size = st->codec->frame_size;
  121. if (frame_size == 0) {
  122. av_log(s1, AV_LOG_ERROR, "Cannot respect max delay: frame size = 0\n");
  123. } else {
  124. s->max_frames_per_packet =
  125. av_rescale_q_rnd(s1->max_delay,
  126. AV_TIME_BASE_Q,
  127. (AVRational){ frame_size, st->codec->sample_rate },
  128. AV_ROUND_DOWN);
  129. }
  130. }
  131. if (st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
  132. /* FIXME: We should round down here... */
  133. s->max_frames_per_packet = av_rescale_q(s1->max_delay, (AVRational){1, 1000000}, st->codec->time_base);
  134. }
  135. }
  136. avpriv_set_pts_info(st, 32, 1, 90000);
  137. switch(st->codec->codec_id) {
  138. case CODEC_ID_MP2:
  139. case CODEC_ID_MP3:
  140. s->buf_ptr = s->buf + 4;
  141. break;
  142. case CODEC_ID_MPEG1VIDEO:
  143. case CODEC_ID_MPEG2VIDEO:
  144. break;
  145. case CODEC_ID_MPEG2TS:
  146. n = s->max_payload_size / TS_PACKET_SIZE;
  147. if (n < 1)
  148. n = 1;
  149. s->max_payload_size = n * TS_PACKET_SIZE;
  150. s->buf_ptr = s->buf;
  151. break;
  152. case CODEC_ID_H264:
  153. /* check for H.264 MP4 syntax */
  154. if (st->codec->extradata_size > 4 && st->codec->extradata[0] == 1) {
  155. s->nal_length_size = (st->codec->extradata[4] & 0x03) + 1;
  156. }
  157. break;
  158. case CODEC_ID_VORBIS:
  159. case CODEC_ID_THEORA:
  160. if (!s->max_frames_per_packet) s->max_frames_per_packet = 15;
  161. s->max_frames_per_packet = av_clip(s->max_frames_per_packet, 1, 15);
  162. s->max_payload_size -= 6; // ident+frag+tdt/vdt+pkt_num+pkt_length
  163. s->num_frames = 0;
  164. goto defaultcase;
  165. case CODEC_ID_VP8:
  166. av_log(s1, AV_LOG_ERROR, "RTP VP8 payload implementation is "
  167. "incompatible with the latest spec drafts.\n");
  168. break;
  169. case CODEC_ID_ADPCM_G722:
  170. /* Due to a historical error, the clock rate for G722 in RTP is
  171. * 8000, even if the sample rate is 16000. See RFC 3551. */
  172. avpriv_set_pts_info(st, 32, 1, 8000);
  173. break;
  174. case CODEC_ID_AMR_NB:
  175. case CODEC_ID_AMR_WB:
  176. if (!s->max_frames_per_packet)
  177. s->max_frames_per_packet = 12;
  178. if (st->codec->codec_id == CODEC_ID_AMR_NB)
  179. n = 31;
  180. else
  181. n = 61;
  182. /* max_header_toc_size + the largest AMR payload must fit */
  183. if (1 + s->max_frames_per_packet + n > s->max_payload_size) {
  184. av_log(s1, AV_LOG_ERROR, "RTP max payload size too small for AMR\n");
  185. return -1;
  186. }
  187. if (st->codec->channels != 1) {
  188. av_log(s1, AV_LOG_ERROR, "Only mono is supported\n");
  189. return -1;
  190. }
  191. case CODEC_ID_AAC:
  192. s->num_frames = 0;
  193. default:
  194. defaultcase:
  195. if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  196. avpriv_set_pts_info(st, 32, 1, st->codec->sample_rate);
  197. }
  198. s->buf_ptr = s->buf;
  199. break;
  200. }
  201. return 0;
  202. }
  203. /* send an rtcp sender report packet */
  204. static void rtcp_send_sr(AVFormatContext *s1, int64_t ntp_time)
  205. {
  206. RTPMuxContext *s = s1->priv_data;
  207. uint32_t rtp_ts;
  208. av_dlog(s1, "RTCP: %02x %"PRIx64" %x\n", s->payload_type, ntp_time, s->timestamp);
  209. s->last_rtcp_ntp_time = ntp_time;
  210. rtp_ts = av_rescale_q(ntp_time - s->first_rtcp_ntp_time, (AVRational){1, 1000000},
  211. s1->streams[0]->time_base) + s->base_timestamp;
  212. avio_w8(s1->pb, (RTP_VERSION << 6));
  213. avio_w8(s1->pb, RTCP_SR);
  214. avio_wb16(s1->pb, 6); /* length in words - 1 */
  215. avio_wb32(s1->pb, s->ssrc);
  216. avio_wb32(s1->pb, ntp_time / 1000000);
  217. avio_wb32(s1->pb, ((ntp_time % 1000000) << 32) / 1000000);
  218. avio_wb32(s1->pb, rtp_ts);
  219. avio_wb32(s1->pb, s->packet_count);
  220. avio_wb32(s1->pb, s->octet_count);
  221. avio_flush(s1->pb);
  222. }
  223. /* send an rtp packet. sequence number is incremented, but the caller
  224. must update the timestamp itself */
  225. void ff_rtp_send_data(AVFormatContext *s1, const uint8_t *buf1, int len, int m)
  226. {
  227. RTPMuxContext *s = s1->priv_data;
  228. av_dlog(s1, "rtp_send_data size=%d\n", len);
  229. /* build the RTP header */
  230. avio_w8(s1->pb, (RTP_VERSION << 6));
  231. avio_w8(s1->pb, (s->payload_type & 0x7f) | ((m & 0x01) << 7));
  232. avio_wb16(s1->pb, s->seq);
  233. avio_wb32(s1->pb, s->timestamp);
  234. avio_wb32(s1->pb, s->ssrc);
  235. avio_write(s1->pb, buf1, len);
  236. avio_flush(s1->pb);
  237. s->seq++;
  238. s->octet_count += len;
  239. s->packet_count++;
  240. }
  241. /* send an integer number of samples and compute time stamp and fill
  242. the rtp send buffer before sending. */
  243. static void rtp_send_samples(AVFormatContext *s1,
  244. const uint8_t *buf1, int size, int sample_size_bits)
  245. {
  246. RTPMuxContext *s = s1->priv_data;
  247. int len, max_packet_size, n;
  248. /* Calculate the number of bytes to get samples aligned on a byte border */
  249. int aligned_samples_size = sample_size_bits/av_gcd(sample_size_bits, 8);
  250. max_packet_size = (s->max_payload_size / aligned_samples_size) * aligned_samples_size;
  251. /* Not needed, but who knows. Don't check if samples aren't an even number of bytes. */
  252. if ((sample_size_bits % 8) == 0 && ((8 * size) % sample_size_bits) != 0)
  253. av_abort();
  254. n = 0;
  255. while (size > 0) {
  256. s->buf_ptr = s->buf;
  257. len = FFMIN(max_packet_size, size);
  258. /* copy data */
  259. memcpy(s->buf_ptr, buf1, len);
  260. s->buf_ptr += len;
  261. buf1 += len;
  262. size -= len;
  263. s->timestamp = s->cur_timestamp + n * 8 / sample_size_bits;
  264. ff_rtp_send_data(s1, s->buf, s->buf_ptr - s->buf, 0);
  265. n += (s->buf_ptr - s->buf);
  266. }
  267. }
  268. static void rtp_send_mpegaudio(AVFormatContext *s1,
  269. const uint8_t *buf1, int size)
  270. {
  271. RTPMuxContext *s = s1->priv_data;
  272. int len, count, max_packet_size;
  273. max_packet_size = s->max_payload_size;
  274. /* test if we must flush because not enough space */
  275. len = (s->buf_ptr - s->buf);
  276. if ((len + size) > max_packet_size) {
  277. if (len > 4) {
  278. ff_rtp_send_data(s1, s->buf, s->buf_ptr - s->buf, 0);
  279. s->buf_ptr = s->buf + 4;
  280. }
  281. }
  282. if (s->buf_ptr == s->buf + 4) {
  283. s->timestamp = s->cur_timestamp;
  284. }
  285. /* add the packet */
  286. if (size > max_packet_size) {
  287. /* big packet: fragment */
  288. count = 0;
  289. while (size > 0) {
  290. len = max_packet_size - 4;
  291. if (len > size)
  292. len = size;
  293. /* build fragmented packet */
  294. s->buf[0] = 0;
  295. s->buf[1] = 0;
  296. s->buf[2] = count >> 8;
  297. s->buf[3] = count;
  298. memcpy(s->buf + 4, buf1, len);
  299. ff_rtp_send_data(s1, s->buf, len + 4, 0);
  300. size -= len;
  301. buf1 += len;
  302. count += len;
  303. }
  304. } else {
  305. if (s->buf_ptr == s->buf + 4) {
  306. /* no fragmentation possible */
  307. s->buf[0] = 0;
  308. s->buf[1] = 0;
  309. s->buf[2] = 0;
  310. s->buf[3] = 0;
  311. }
  312. memcpy(s->buf_ptr, buf1, size);
  313. s->buf_ptr += size;
  314. }
  315. }
  316. static void rtp_send_raw(AVFormatContext *s1,
  317. const uint8_t *buf1, int size)
  318. {
  319. RTPMuxContext *s = s1->priv_data;
  320. int len, max_packet_size;
  321. max_packet_size = s->max_payload_size;
  322. while (size > 0) {
  323. len = max_packet_size;
  324. if (len > size)
  325. len = size;
  326. s->timestamp = s->cur_timestamp;
  327. ff_rtp_send_data(s1, buf1, len, (len == size));
  328. buf1 += len;
  329. size -= len;
  330. }
  331. }
  332. /* NOTE: size is assumed to be an integer multiple of TS_PACKET_SIZE */
  333. static void rtp_send_mpegts_raw(AVFormatContext *s1,
  334. const uint8_t *buf1, int size)
  335. {
  336. RTPMuxContext *s = s1->priv_data;
  337. int len, out_len;
  338. while (size >= TS_PACKET_SIZE) {
  339. len = s->max_payload_size - (s->buf_ptr - s->buf);
  340. if (len > size)
  341. len = size;
  342. memcpy(s->buf_ptr, buf1, len);
  343. buf1 += len;
  344. size -= len;
  345. s->buf_ptr += len;
  346. out_len = s->buf_ptr - s->buf;
  347. if (out_len >= s->max_payload_size) {
  348. ff_rtp_send_data(s1, s->buf, out_len, 0);
  349. s->buf_ptr = s->buf;
  350. }
  351. }
  352. }
  353. static int rtp_write_packet(AVFormatContext *s1, AVPacket *pkt)
  354. {
  355. RTPMuxContext *s = s1->priv_data;
  356. AVStream *st = s1->streams[0];
  357. int rtcp_bytes;
  358. int size= pkt->size;
  359. av_dlog(s1, "%d: write len=%d\n", pkt->stream_index, size);
  360. rtcp_bytes = ((s->octet_count - s->last_octet_count) * RTCP_TX_RATIO_NUM) /
  361. RTCP_TX_RATIO_DEN;
  362. if ((s->first_packet || ((rtcp_bytes >= RTCP_SR_SIZE) &&
  363. (ff_ntp_time() - s->last_rtcp_ntp_time > 5000000))) &&
  364. !(s->flags & FF_RTP_FLAG_SKIP_RTCP)) {
  365. rtcp_send_sr(s1, ff_ntp_time());
  366. s->last_octet_count = s->octet_count;
  367. s->first_packet = 0;
  368. }
  369. s->cur_timestamp = s->base_timestamp + pkt->pts;
  370. switch(st->codec->codec_id) {
  371. case CODEC_ID_PCM_MULAW:
  372. case CODEC_ID_PCM_ALAW:
  373. case CODEC_ID_PCM_U8:
  374. case CODEC_ID_PCM_S8:
  375. rtp_send_samples(s1, pkt->data, size, 8 * st->codec->channels);
  376. break;
  377. case CODEC_ID_PCM_U16BE:
  378. case CODEC_ID_PCM_U16LE:
  379. case CODEC_ID_PCM_S16BE:
  380. case CODEC_ID_PCM_S16LE:
  381. rtp_send_samples(s1, pkt->data, size, 16 * st->codec->channels);
  382. break;
  383. case CODEC_ID_ADPCM_G722:
  384. /* The actual sample size is half a byte per sample, but since the
  385. * stream clock rate is 8000 Hz while the sample rate is 16000 Hz,
  386. * the correct parameter for send_samples_bits is 8 bits per stream
  387. * clock. */
  388. rtp_send_samples(s1, pkt->data, size, 8 * st->codec->channels);
  389. break;
  390. case CODEC_ID_ADPCM_G726:
  391. rtp_send_samples(s1, pkt->data, size,
  392. st->codec->bits_per_coded_sample * st->codec->channels);
  393. break;
  394. case CODEC_ID_MP2:
  395. case CODEC_ID_MP3:
  396. rtp_send_mpegaudio(s1, pkt->data, size);
  397. break;
  398. case CODEC_ID_MPEG1VIDEO:
  399. case CODEC_ID_MPEG2VIDEO:
  400. ff_rtp_send_mpegvideo(s1, pkt->data, size);
  401. break;
  402. case CODEC_ID_AAC:
  403. if (s->flags & FF_RTP_FLAG_MP4A_LATM)
  404. ff_rtp_send_latm(s1, pkt->data, size);
  405. else
  406. ff_rtp_send_aac(s1, pkt->data, size);
  407. break;
  408. case CODEC_ID_AMR_NB:
  409. case CODEC_ID_AMR_WB:
  410. ff_rtp_send_amr(s1, pkt->data, size);
  411. break;
  412. case CODEC_ID_MPEG2TS:
  413. rtp_send_mpegts_raw(s1, pkt->data, size);
  414. break;
  415. case CODEC_ID_H264:
  416. ff_rtp_send_h264(s1, pkt->data, size);
  417. break;
  418. case CODEC_ID_H263:
  419. if (s->flags & FF_RTP_FLAG_RFC2190) {
  420. int mb_info_size = 0;
  421. const uint8_t *mb_info =
  422. av_packet_get_side_data(pkt, AV_PKT_DATA_H263_MB_INFO,
  423. &mb_info_size);
  424. ff_rtp_send_h263_rfc2190(s1, pkt->data, size, mb_info, mb_info_size);
  425. break;
  426. }
  427. /* Fallthrough */
  428. case CODEC_ID_H263P:
  429. ff_rtp_send_h263(s1, pkt->data, size);
  430. break;
  431. case CODEC_ID_VORBIS:
  432. case CODEC_ID_THEORA:
  433. ff_rtp_send_xiph(s1, pkt->data, size);
  434. break;
  435. case CODEC_ID_VP8:
  436. ff_rtp_send_vp8(s1, pkt->data, size);
  437. break;
  438. default:
  439. /* better than nothing : send the codec raw data */
  440. rtp_send_raw(s1, pkt->data, size);
  441. break;
  442. }
  443. return 0;
  444. }
  445. static int rtp_write_trailer(AVFormatContext *s1)
  446. {
  447. RTPMuxContext *s = s1->priv_data;
  448. av_freep(&s->buf);
  449. return 0;
  450. }
  451. AVOutputFormat ff_rtp_muxer = {
  452. .name = "rtp",
  453. .long_name = NULL_IF_CONFIG_SMALL("RTP output format"),
  454. .priv_data_size = sizeof(RTPMuxContext),
  455. .audio_codec = CODEC_ID_PCM_MULAW,
  456. .video_codec = CODEC_ID_MPEG4,
  457. .write_header = rtp_write_header,
  458. .write_packet = rtp_write_packet,
  459. .write_trailer = rtp_write_trailer,
  460. .priv_class = &rtp_muxer_class,
  461. };