You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

570 lines
18KB

  1. /*
  2. * RTP input format
  3. * Copyright (c) 2002 Fabrice Bellard
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /* needed for gethostname() */
  22. #define _XOPEN_SOURCE 600
  23. #include "libavcodec/get_bits.h"
  24. #include "avformat.h"
  25. #include "mpegts.h"
  26. #include <unistd.h>
  27. #include "network.h"
  28. #include "rtpdec.h"
  29. #include "rtpdec_amr.h"
  30. #include "rtpdec_asf.h"
  31. #include "rtpdec_h263.h"
  32. #include "rtpdec_h264.h"
  33. #include "rtpdec_mpeg4.h"
  34. #include "rtpdec_svq3.h"
  35. #include "rtpdec_xiph.h"
  36. //#define DEBUG
  37. /* TODO: - add RTCP statistics reporting (should be optional).
  38. - add support for h263/mpeg4 packetized output : IDEA: send a
  39. buffer to 'rtp_write_packet' contains all the packets for ONE
  40. frame. Each packet should have a four byte header containing
  41. the length in big endian format (same trick as
  42. 'url_open_dyn_packet_buf')
  43. */
  44. /* statistics functions */
  45. RTPDynamicProtocolHandler *RTPFirstDynamicPayloadHandler= NULL;
  46. void ff_register_dynamic_payload_handler(RTPDynamicProtocolHandler *handler)
  47. {
  48. handler->next= RTPFirstDynamicPayloadHandler;
  49. RTPFirstDynamicPayloadHandler= handler;
  50. }
  51. void av_register_rtp_dynamic_payload_handlers(void)
  52. {
  53. ff_register_dynamic_payload_handler(&ff_mp4v_es_dynamic_handler);
  54. ff_register_dynamic_payload_handler(&ff_mpeg4_generic_dynamic_handler);
  55. ff_register_dynamic_payload_handler(&ff_amr_nb_dynamic_handler);
  56. ff_register_dynamic_payload_handler(&ff_amr_wb_dynamic_handler);
  57. ff_register_dynamic_payload_handler(&ff_h263_1998_dynamic_handler);
  58. ff_register_dynamic_payload_handler(&ff_h263_2000_dynamic_handler);
  59. ff_register_dynamic_payload_handler(&ff_h264_dynamic_handler);
  60. ff_register_dynamic_payload_handler(&ff_vorbis_dynamic_handler);
  61. ff_register_dynamic_payload_handler(&ff_theora_dynamic_handler);
  62. ff_register_dynamic_payload_handler(&ff_svq3_dynamic_handler);
  63. ff_register_dynamic_payload_handler(&ff_ms_rtp_asf_pfv_handler);
  64. ff_register_dynamic_payload_handler(&ff_ms_rtp_asf_pfa_handler);
  65. }
  66. static int rtcp_parse_packet(RTPDemuxContext *s, const unsigned char *buf, int len)
  67. {
  68. if (buf[1] != 200)
  69. return -1;
  70. s->last_rtcp_ntp_time = AV_RB64(buf + 8);
  71. if (s->first_rtcp_ntp_time == AV_NOPTS_VALUE)
  72. s->first_rtcp_ntp_time = s->last_rtcp_ntp_time;
  73. s->last_rtcp_timestamp = AV_RB32(buf + 16);
  74. return 0;
  75. }
  76. #define RTP_SEQ_MOD (1<<16)
  77. /**
  78. * called on parse open packet
  79. */
  80. static void rtp_init_statistics(RTPStatistics *s, uint16_t base_sequence) // called on parse open packet.
  81. {
  82. memset(s, 0, sizeof(RTPStatistics));
  83. s->max_seq= base_sequence;
  84. s->probation= 1;
  85. }
  86. /**
  87. * called whenever there is a large jump in sequence numbers, or when they get out of probation...
  88. */
  89. static void rtp_init_sequence(RTPStatistics *s, uint16_t seq)
  90. {
  91. s->max_seq= seq;
  92. s->cycles= 0;
  93. s->base_seq= seq -1;
  94. s->bad_seq= RTP_SEQ_MOD + 1;
  95. s->received= 0;
  96. s->expected_prior= 0;
  97. s->received_prior= 0;
  98. s->jitter= 0;
  99. s->transit= 0;
  100. }
  101. /**
  102. * returns 1 if we should handle this packet.
  103. */
  104. static int rtp_valid_packet_in_sequence(RTPStatistics *s, uint16_t seq)
  105. {
  106. uint16_t udelta= seq - s->max_seq;
  107. const int MAX_DROPOUT= 3000;
  108. const int MAX_MISORDER = 100;
  109. const int MIN_SEQUENTIAL = 2;
  110. /* source not valid until MIN_SEQUENTIAL packets with sequence seq. numbers have been received */
  111. if(s->probation)
  112. {
  113. if(seq==s->max_seq + 1) {
  114. s->probation--;
  115. s->max_seq= seq;
  116. if(s->probation==0) {
  117. rtp_init_sequence(s, seq);
  118. s->received++;
  119. return 1;
  120. }
  121. } else {
  122. s->probation= MIN_SEQUENTIAL - 1;
  123. s->max_seq = seq;
  124. }
  125. } else if (udelta < MAX_DROPOUT) {
  126. // in order, with permissible gap
  127. if(seq < s->max_seq) {
  128. //sequence number wrapped; count antother 64k cycles
  129. s->cycles += RTP_SEQ_MOD;
  130. }
  131. s->max_seq= seq;
  132. } else if (udelta <= RTP_SEQ_MOD - MAX_MISORDER) {
  133. // sequence made a large jump...
  134. if(seq==s->bad_seq) {
  135. // two sequential packets-- assume that the other side restarted without telling us; just resync.
  136. rtp_init_sequence(s, seq);
  137. } else {
  138. s->bad_seq= (seq + 1) & (RTP_SEQ_MOD-1);
  139. return 0;
  140. }
  141. } else {
  142. // duplicate or reordered packet...
  143. }
  144. s->received++;
  145. return 1;
  146. }
  147. #if 0
  148. /**
  149. * This function is currently unused; without a valid local ntp time, I don't see how we could calculate the
  150. * difference between the arrival and sent timestamp. As a result, the jitter and transit statistics values
  151. * never change. I left this in in case someone else can see a way. (rdm)
  152. */
  153. static void rtcp_update_jitter(RTPStatistics *s, uint32_t sent_timestamp, uint32_t arrival_timestamp)
  154. {
  155. uint32_t transit= arrival_timestamp - sent_timestamp;
  156. int d;
  157. s->transit= transit;
  158. d= FFABS(transit - s->transit);
  159. s->jitter += d - ((s->jitter + 8)>>4);
  160. }
  161. #endif
  162. int rtp_check_and_send_back_rr(RTPDemuxContext *s, int count)
  163. {
  164. ByteIOContext *pb;
  165. uint8_t *buf;
  166. int len;
  167. int rtcp_bytes;
  168. RTPStatistics *stats= &s->statistics;
  169. uint32_t lost;
  170. uint32_t extended_max;
  171. uint32_t expected_interval;
  172. uint32_t received_interval;
  173. uint32_t lost_interval;
  174. uint32_t expected;
  175. uint32_t fraction;
  176. uint64_t ntp_time= s->last_rtcp_ntp_time; // TODO: Get local ntp time?
  177. if (!s->rtp_ctx || (count < 1))
  178. return -1;
  179. /* TODO: I think this is way too often; RFC 1889 has algorithm for this */
  180. /* XXX: mpeg pts hardcoded. RTCP send every 0.5 seconds */
  181. s->octet_count += count;
  182. rtcp_bytes = ((s->octet_count - s->last_octet_count) * RTCP_TX_RATIO_NUM) /
  183. RTCP_TX_RATIO_DEN;
  184. rtcp_bytes /= 50; // mmu_man: that's enough for me... VLC sends much less btw !?
  185. if (rtcp_bytes < 28)
  186. return -1;
  187. s->last_octet_count = s->octet_count;
  188. if (url_open_dyn_buf(&pb) < 0)
  189. return -1;
  190. // Receiver Report
  191. put_byte(pb, (RTP_VERSION << 6) + 1); /* 1 report block */
  192. put_byte(pb, 201);
  193. put_be16(pb, 7); /* length in words - 1 */
  194. put_be32(pb, s->ssrc); // our own SSRC
  195. put_be32(pb, s->ssrc); // XXX: should be the server's here!
  196. // some placeholders we should really fill...
  197. // RFC 1889/p64
  198. extended_max= stats->cycles + stats->max_seq;
  199. expected= extended_max - stats->base_seq + 1;
  200. lost= expected - stats->received;
  201. lost= FFMIN(lost, 0xffffff); // clamp it since it's only 24 bits...
  202. expected_interval= expected - stats->expected_prior;
  203. stats->expected_prior= expected;
  204. received_interval= stats->received - stats->received_prior;
  205. stats->received_prior= stats->received;
  206. lost_interval= expected_interval - received_interval;
  207. if (expected_interval==0 || lost_interval<=0) fraction= 0;
  208. else fraction = (lost_interval<<8)/expected_interval;
  209. fraction= (fraction<<24) | lost;
  210. put_be32(pb, fraction); /* 8 bits of fraction, 24 bits of total packets lost */
  211. put_be32(pb, extended_max); /* max sequence received */
  212. put_be32(pb, stats->jitter>>4); /* jitter */
  213. if(s->last_rtcp_ntp_time==AV_NOPTS_VALUE)
  214. {
  215. put_be32(pb, 0); /* last SR timestamp */
  216. put_be32(pb, 0); /* delay since last SR */
  217. } else {
  218. uint32_t middle_32_bits= s->last_rtcp_ntp_time>>16; // this is valid, right? do we need to handle 64 bit values special?
  219. uint32_t delay_since_last= ntp_time - s->last_rtcp_ntp_time;
  220. put_be32(pb, middle_32_bits); /* last SR timestamp */
  221. put_be32(pb, delay_since_last); /* delay since last SR */
  222. }
  223. // CNAME
  224. put_byte(pb, (RTP_VERSION << 6) + 1); /* 1 report block */
  225. put_byte(pb, 202);
  226. len = strlen(s->hostname);
  227. put_be16(pb, (6 + len + 3) / 4); /* length in words - 1 */
  228. put_be32(pb, s->ssrc);
  229. put_byte(pb, 0x01);
  230. put_byte(pb, len);
  231. put_buffer(pb, s->hostname, len);
  232. // padding
  233. for (len = (6 + len) % 4; len % 4; len++) {
  234. put_byte(pb, 0);
  235. }
  236. put_flush_packet(pb);
  237. len = url_close_dyn_buf(pb, &buf);
  238. if ((len > 0) && buf) {
  239. int result;
  240. dprintf(s->ic, "sending %d bytes of RR\n", len);
  241. result= url_write(s->rtp_ctx, buf, len);
  242. dprintf(s->ic, "result from url_write: %d\n", result);
  243. av_free(buf);
  244. }
  245. return 0;
  246. }
  247. void rtp_send_punch_packets(URLContext* rtp_handle)
  248. {
  249. ByteIOContext *pb;
  250. uint8_t *buf;
  251. int len;
  252. /* Send a small RTP packet */
  253. if (url_open_dyn_buf(&pb) < 0)
  254. return;
  255. put_byte(pb, (RTP_VERSION << 6));
  256. put_byte(pb, 0); /* Payload type */
  257. put_be16(pb, 0); /* Seq */
  258. put_be32(pb, 0); /* Timestamp */
  259. put_be32(pb, 0); /* SSRC */
  260. put_flush_packet(pb);
  261. len = url_close_dyn_buf(pb, &buf);
  262. if ((len > 0) && buf)
  263. url_write(rtp_handle, buf, len);
  264. av_free(buf);
  265. /* Send a minimal RTCP RR */
  266. if (url_open_dyn_buf(&pb) < 0)
  267. return;
  268. put_byte(pb, (RTP_VERSION << 6));
  269. put_byte(pb, 201); /* receiver report */
  270. put_be16(pb, 1); /* length in words - 1 */
  271. put_be32(pb, 0); /* our own SSRC */
  272. put_flush_packet(pb);
  273. len = url_close_dyn_buf(pb, &buf);
  274. if ((len > 0) && buf)
  275. url_write(rtp_handle, buf, len);
  276. av_free(buf);
  277. }
  278. /**
  279. * open a new RTP parse context for stream 'st'. 'st' can be NULL for
  280. * MPEG2TS streams to indicate that they should be demuxed inside the
  281. * rtp demux (otherwise CODEC_ID_MPEG2TS packets are returned)
  282. */
  283. RTPDemuxContext *rtp_parse_open(AVFormatContext *s1, AVStream *st, URLContext *rtpc, int payload_type)
  284. {
  285. RTPDemuxContext *s;
  286. s = av_mallocz(sizeof(RTPDemuxContext));
  287. if (!s)
  288. return NULL;
  289. s->payload_type = payload_type;
  290. s->last_rtcp_ntp_time = AV_NOPTS_VALUE;
  291. s->first_rtcp_ntp_time = AV_NOPTS_VALUE;
  292. s->ic = s1;
  293. s->st = st;
  294. rtp_init_statistics(&s->statistics, 0); // do we know the initial sequence from sdp?
  295. if (!strcmp(ff_rtp_enc_name(payload_type), "MP2T")) {
  296. s->ts = ff_mpegts_parse_open(s->ic);
  297. if (s->ts == NULL) {
  298. av_free(s);
  299. return NULL;
  300. }
  301. } else {
  302. av_set_pts_info(st, 32, 1, 90000);
  303. switch(st->codec->codec_id) {
  304. case CODEC_ID_MPEG1VIDEO:
  305. case CODEC_ID_MPEG2VIDEO:
  306. case CODEC_ID_MP2:
  307. case CODEC_ID_MP3:
  308. case CODEC_ID_MPEG4:
  309. case CODEC_ID_H263:
  310. case CODEC_ID_H264:
  311. st->need_parsing = AVSTREAM_PARSE_FULL;
  312. break;
  313. default:
  314. if (st->codec->codec_type == AVMEDIA_TYPE_AUDIO) {
  315. av_set_pts_info(st, 32, 1, st->codec->sample_rate);
  316. }
  317. break;
  318. }
  319. }
  320. // needed to send back RTCP RR in RTSP sessions
  321. s->rtp_ctx = rtpc;
  322. gethostname(s->hostname, sizeof(s->hostname));
  323. return s;
  324. }
  325. void
  326. rtp_parse_set_dynamic_protocol(RTPDemuxContext *s, PayloadContext *ctx,
  327. RTPDynamicProtocolHandler *handler)
  328. {
  329. s->dynamic_protocol_context = ctx;
  330. s->parse_packet = handler->parse_packet;
  331. }
  332. /**
  333. * This was the second switch in rtp_parse packet. Normalizes time, if required, sets stream_index, etc.
  334. */
  335. static void finalize_packet(RTPDemuxContext *s, AVPacket *pkt, uint32_t timestamp)
  336. {
  337. if (s->last_rtcp_ntp_time != AV_NOPTS_VALUE) {
  338. int64_t addend;
  339. int delta_timestamp;
  340. /* compute pts from timestamp with received ntp_time */
  341. delta_timestamp = timestamp - s->last_rtcp_timestamp;
  342. /* convert to the PTS timebase */
  343. addend = av_rescale(s->last_rtcp_ntp_time - s->first_rtcp_ntp_time, s->st->time_base.den, (uint64_t)s->st->time_base.num << 32);
  344. pkt->pts = s->range_start_offset + addend + delta_timestamp;
  345. }
  346. }
  347. /**
  348. * Parse an RTP or RTCP packet directly sent as a buffer.
  349. * @param s RTP parse context.
  350. * @param pkt returned packet
  351. * @param buf input buffer or NULL to read the next packets
  352. * @param len buffer len
  353. * @return 0 if a packet is returned, 1 if a packet is returned and more can follow
  354. * (use buf as NULL to read the next). -1 if no packet (error or no more packet).
  355. */
  356. int rtp_parse_packet(RTPDemuxContext *s, AVPacket *pkt,
  357. const uint8_t *buf, int len)
  358. {
  359. unsigned int ssrc, h;
  360. int payload_type, seq, ret, flags = 0;
  361. AVStream *st;
  362. uint32_t timestamp;
  363. int rv= 0;
  364. if (!buf) {
  365. /* return the next packets, if any */
  366. if(s->st && s->parse_packet) {
  367. timestamp= 0; ///< Should not be used if buf is NULL, but should be set to the timestamp of the packet returned....
  368. rv= s->parse_packet(s->ic, s->dynamic_protocol_context,
  369. s->st, pkt, &timestamp, NULL, 0, flags);
  370. finalize_packet(s, pkt, timestamp);
  371. return rv;
  372. } else {
  373. // TODO: Move to a dynamic packet handler (like above)
  374. if (s->read_buf_index >= s->read_buf_size)
  375. return -1;
  376. ret = ff_mpegts_parse_packet(s->ts, pkt, s->buf + s->read_buf_index,
  377. s->read_buf_size - s->read_buf_index);
  378. if (ret < 0)
  379. return -1;
  380. s->read_buf_index += ret;
  381. if (s->read_buf_index < s->read_buf_size)
  382. return 1;
  383. else
  384. return 0;
  385. }
  386. }
  387. if (len < 12)
  388. return -1;
  389. if ((buf[0] & 0xc0) != (RTP_VERSION << 6))
  390. return -1;
  391. if (buf[1] >= 200 && buf[1] <= 204) {
  392. rtcp_parse_packet(s, buf, len);
  393. return -1;
  394. }
  395. payload_type = buf[1] & 0x7f;
  396. if (buf[1] & 0x80)
  397. flags |= RTP_FLAG_MARKER;
  398. seq = AV_RB16(buf + 2);
  399. timestamp = AV_RB32(buf + 4);
  400. ssrc = AV_RB32(buf + 8);
  401. /* store the ssrc in the RTPDemuxContext */
  402. s->ssrc = ssrc;
  403. /* NOTE: we can handle only one payload type */
  404. if (s->payload_type != payload_type)
  405. return -1;
  406. st = s->st;
  407. // only do something with this if all the rtp checks pass...
  408. if(!rtp_valid_packet_in_sequence(&s->statistics, seq))
  409. {
  410. av_log(st?st->codec:NULL, AV_LOG_ERROR, "RTP: PT=%02x: bad cseq %04x expected=%04x\n",
  411. payload_type, seq, ((s->seq + 1) & 0xffff));
  412. return -1;
  413. }
  414. s->seq = seq;
  415. len -= 12;
  416. buf += 12;
  417. if (!st) {
  418. /* specific MPEG2TS demux support */
  419. ret = ff_mpegts_parse_packet(s->ts, pkt, buf, len);
  420. if (ret < 0)
  421. return -1;
  422. if (ret < len) {
  423. s->read_buf_size = len - ret;
  424. memcpy(s->buf, buf + ret, s->read_buf_size);
  425. s->read_buf_index = 0;
  426. return 1;
  427. }
  428. return 0;
  429. } else if (s->parse_packet) {
  430. rv = s->parse_packet(s->ic, s->dynamic_protocol_context,
  431. s->st, pkt, &timestamp, buf, len, flags);
  432. } else {
  433. // at this point, the RTP header has been stripped; This is ASSUMING that there is only 1 CSRC, which in't wise.
  434. switch(st->codec->codec_id) {
  435. case CODEC_ID_MP2:
  436. case CODEC_ID_MP3:
  437. /* better than nothing: skip mpeg audio RTP header */
  438. if (len <= 4)
  439. return -1;
  440. h = AV_RB32(buf);
  441. len -= 4;
  442. buf += 4;
  443. av_new_packet(pkt, len);
  444. memcpy(pkt->data, buf, len);
  445. break;
  446. case CODEC_ID_MPEG1VIDEO:
  447. case CODEC_ID_MPEG2VIDEO:
  448. /* better than nothing: skip mpeg video RTP header */
  449. if (len <= 4)
  450. return -1;
  451. h = AV_RB32(buf);
  452. buf += 4;
  453. len -= 4;
  454. if (h & (1 << 26)) {
  455. /* mpeg2 */
  456. if (len <= 4)
  457. return -1;
  458. buf += 4;
  459. len -= 4;
  460. }
  461. av_new_packet(pkt, len);
  462. memcpy(pkt->data, buf, len);
  463. break;
  464. default:
  465. av_new_packet(pkt, len);
  466. memcpy(pkt->data, buf, len);
  467. break;
  468. }
  469. pkt->stream_index = st->index;
  470. }
  471. // now perform timestamp things....
  472. finalize_packet(s, pkt, timestamp);
  473. return rv;
  474. }
  475. void rtp_parse_close(RTPDemuxContext *s)
  476. {
  477. if (!strcmp(ff_rtp_enc_name(s->payload_type), "MP2T")) {
  478. ff_mpegts_parse_close(s->ts);
  479. }
  480. av_free(s);
  481. }
  482. int ff_parse_fmtp(AVStream *stream, PayloadContext *data, const char *p,
  483. int (*parse_fmtp)(AVStream *stream,
  484. PayloadContext *data,
  485. char *attr, char *value))
  486. {
  487. char attr[256];
  488. char *value;
  489. int res;
  490. int value_size = strlen(p) + 1;
  491. if (!(value = av_malloc(value_size))) {
  492. av_log(stream, AV_LOG_ERROR, "Failed to allocate data for FMTP.");
  493. return AVERROR(ENOMEM);
  494. }
  495. // remove protocol identifier
  496. while (*p && *p == ' ') p++; // strip spaces
  497. while (*p && *p != ' ') p++; // eat protocol identifier
  498. while (*p && *p == ' ') p++; // strip trailing spaces
  499. while (ff_rtsp_next_attr_and_value(&p,
  500. attr, sizeof(attr),
  501. value, value_size)) {
  502. res = parse_fmtp(stream, data, attr, value);
  503. if (res < 0 && res != AVERROR_PATCHWELCOME) {
  504. av_free(value);
  505. return res;
  506. }
  507. }
  508. av_free(value);
  509. return 0;
  510. }