You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

471 lines
15KB

  1. /*
  2. * Realmedia RTSP protocol (RDT) support.
  3. * Copyright (c) 2007 Ronald S. Bultje
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file rdt.c
  23. * @brief Realmedia RTSP protocol (RDT) support
  24. * @author Ronald S. Bultje <rbultje@ronald.bitfreak.net>
  25. */
  26. #include "avformat.h"
  27. #include "libavutil/avstring.h"
  28. #include "rtp_internal.h"
  29. #include "rdt.h"
  30. #include "libavutil/base64.h"
  31. #include "libavutil/md5.h"
  32. #include "rm.h"
  33. #include "internal.h"
  34. #include <libavcodec/bitstream.h>
  35. struct RDTDemuxContext {
  36. AVFormatContext *ic; /**< the containing (RTSP) demux context */
  37. /** Each RDT stream-set (represented by one RTSPStream) can contain
  38. * multiple streams (of the same content, but with possibly different
  39. * codecs/bitrates). Each such stream is represented by one AVStream
  40. * in the AVFormatContext, and this variable points to the offset in
  41. * that array such that the first is the first stream of this set. */
  42. AVStream **streams;
  43. int n_streams; /**< streams with identifical content in this set */
  44. void *dynamic_protocol_context;
  45. DynamicPayloadPacketHandlerProc parse_packet;
  46. uint32_t prev_timestamp;
  47. int prev_set_id, prev_stream_id;
  48. };
  49. RDTDemuxContext *
  50. ff_rdt_parse_open(AVFormatContext *ic, int first_stream_of_set_idx,
  51. void *priv_data, RTPDynamicProtocolHandler *handler)
  52. {
  53. RDTDemuxContext *s = av_mallocz(sizeof(RDTDemuxContext));
  54. if (!s)
  55. return NULL;
  56. s->ic = ic;
  57. s->streams = &ic->streams[first_stream_of_set_idx];
  58. do {
  59. s->n_streams++;
  60. } while (first_stream_of_set_idx + s->n_streams < ic->nb_streams &&
  61. s->streams[s->n_streams]->priv_data == s->streams[0]->priv_data);
  62. s->prev_set_id = -1;
  63. s->prev_stream_id = -1;
  64. s->prev_timestamp = -1;
  65. s->parse_packet = handler->parse_packet;
  66. s->dynamic_protocol_context = priv_data;
  67. return s;
  68. }
  69. void
  70. ff_rdt_parse_close(RDTDemuxContext *s)
  71. {
  72. av_free(s);
  73. }
  74. struct PayloadContext {
  75. AVFormatContext *rmctx;
  76. RMStream *rmst[MAX_STREAMS];
  77. uint8_t *mlti_data;
  78. unsigned int mlti_data_size;
  79. char buffer[RTP_MAX_PACKET_LENGTH + FF_INPUT_BUFFER_PADDING_SIZE];
  80. int audio_pkt_cnt; /**< remaining audio packets in rmdec */
  81. };
  82. void
  83. ff_rdt_calc_response_and_checksum(char response[41], char chksum[9],
  84. const char *challenge)
  85. {
  86. int ch_len = strlen (challenge), i;
  87. unsigned char zres[16],
  88. buf[64] = { 0xa1, 0xe9, 0x14, 0x9d, 0x0e, 0x6b, 0x3b, 0x59 };
  89. #define XOR_TABLE_SIZE 37
  90. const unsigned char xor_table[XOR_TABLE_SIZE] = {
  91. 0x05, 0x18, 0x74, 0xd0, 0x0d, 0x09, 0x02, 0x53,
  92. 0xc0, 0x01, 0x05, 0x05, 0x67, 0x03, 0x19, 0x70,
  93. 0x08, 0x27, 0x66, 0x10, 0x10, 0x72, 0x08, 0x09,
  94. 0x63, 0x11, 0x03, 0x71, 0x08, 0x08, 0x70, 0x02,
  95. 0x10, 0x57, 0x05, 0x18, 0x54 };
  96. /* some (length) checks */
  97. if (ch_len == 40) /* what a hack... */
  98. ch_len = 32;
  99. else if (ch_len > 56)
  100. ch_len = 56;
  101. memcpy(buf + 8, challenge, ch_len);
  102. /* xor challenge bytewise with xor_table */
  103. for (i = 0; i < XOR_TABLE_SIZE; i++)
  104. buf[8 + i] ^= xor_table[i];
  105. av_md5_sum(zres, buf, 64);
  106. ff_data_to_hex(response, zres, 16);
  107. for (i=0;i<32;i++) response[i] = tolower(response[i]);
  108. /* add tail */
  109. strcpy (response + 32, "01d0a8e3");
  110. /* calculate checksum */
  111. for (i = 0; i < 8; i++)
  112. chksum[i] = response[i * 4];
  113. chksum[8] = 0;
  114. }
  115. static int
  116. rdt_load_mdpr (PayloadContext *rdt, AVStream *st, int rule_nr)
  117. {
  118. ByteIOContext pb;
  119. int size;
  120. uint32_t tag;
  121. /**
  122. * Layout of the MLTI chunk:
  123. * 4:MLTI
  124. * 2:<number of streams>
  125. * Then for each stream ([number_of_streams] times):
  126. * 2:<mdpr index>
  127. * 2:<number of mdpr chunks>
  128. * Then for each mdpr chunk ([number_of_mdpr_chunks] times):
  129. * 4:<size>
  130. * [size]:<data>
  131. * we skip MDPR chunks until we reach the one of the stream
  132. * we're interested in, and forward that ([size]+[data]) to
  133. * the RM demuxer to parse the stream-specific header data.
  134. */
  135. if (!rdt->mlti_data)
  136. return -1;
  137. init_put_byte(&pb, rdt->mlti_data, rdt->mlti_data_size, 0,
  138. NULL, NULL, NULL, NULL);
  139. tag = get_le32(&pb);
  140. if (tag == MKTAG('M', 'L', 'T', 'I')) {
  141. int num, chunk_nr;
  142. /* read index of MDPR chunk numbers */
  143. num = get_be16(&pb);
  144. if (rule_nr < 0 || rule_nr >= num)
  145. return -1;
  146. url_fskip(&pb, rule_nr * 2);
  147. chunk_nr = get_be16(&pb);
  148. url_fskip(&pb, (num - 1 - rule_nr) * 2);
  149. /* read MDPR chunks */
  150. num = get_be16(&pb);
  151. if (chunk_nr >= num)
  152. return -1;
  153. while (chunk_nr--)
  154. url_fskip(&pb, get_be32(&pb));
  155. size = get_be32(&pb);
  156. } else {
  157. size = rdt->mlti_data_size;
  158. url_fseek(&pb, 0, SEEK_SET);
  159. }
  160. if (ff_rm_read_mdpr_codecdata(rdt->rmctx, &pb, st, rdt->rmst[0], size) < 0)
  161. return -1;
  162. return 0;
  163. }
  164. /**
  165. * Actual data handling.
  166. */
  167. int
  168. ff_rdt_parse_header(const uint8_t *buf, int len,
  169. int *pset_id, int *pseq_no, int *pstream_id,
  170. int *pis_keyframe, uint32_t *ptimestamp)
  171. {
  172. GetBitContext gb;
  173. int consumed = 0, set_id, seq_no, stream_id, is_keyframe,
  174. len_included, need_reliable;
  175. uint32_t timestamp;
  176. /* skip status packets */
  177. while (len >= 5 && buf[1] == 0xFF /* status packet */) {
  178. int pkt_len;
  179. if (!(buf[0] & 0x80))
  180. return -1; /* not followed by a data packet */
  181. pkt_len = AV_RB16(buf+3);
  182. buf += pkt_len;
  183. len -= pkt_len;
  184. consumed += pkt_len;
  185. }
  186. if (len < 16)
  187. return -1;
  188. /**
  189. * Layout of the header (in bits):
  190. * 1: len_included
  191. * Flag indicating whether this header includes a length field;
  192. * this can be used to concatenate multiple RDT packets in a
  193. * single UDP/TCP data frame and is used to precede RDT data
  194. * by stream status packets
  195. * 1: need_reliable
  196. * Flag indicating whether this header includes a "reliable
  197. * sequence number"; these are apparently sequence numbers of
  198. * data packets alone. For data packets, this flag is always
  199. * set, according to the Real documentation [1]
  200. * 5: set_id
  201. * ID of a set of streams of identical content, possibly with
  202. * different codecs or bitrates
  203. * 1: is_reliable
  204. * Flag set for certain streams deemed less tolerable for packet
  205. * loss
  206. * 16: seq_no
  207. * Packet sequence number; if >=0xFF00, this is a non-data packet
  208. * containing stream status info, the second byte indicates the
  209. * type of status packet (see wireshark docs / source code [2])
  210. * if (len_included) {
  211. * 16: packet_len
  212. * } else {
  213. * packet_len = remainder of UDP/TCP frame
  214. * }
  215. * 1: is_back_to_back
  216. * Back-to-Back flag; used for timing, set for one in every 10
  217. * packets, according to the Real documentation [1]
  218. * 1: is_slow_data
  219. * Slow-data flag; currently unused, according to Real docs [1]
  220. * 5: stream_id
  221. * ID of the stream within this particular set of streams
  222. * 1: is_no_keyframe
  223. * Non-keyframe flag (unset if packet belongs to a keyframe)
  224. * 32: timestamp (PTS)
  225. * if (set_id == 0x1F) {
  226. * 16: set_id (extended set-of-streams ID; see set_id)
  227. * }
  228. * if (need_reliable) {
  229. * 16: reliable_seq_no
  230. * Reliable sequence number (see need_reliable)
  231. * }
  232. * if (stream_id == 0x3F) {
  233. * 16: stream_id (extended stream ID; see stream_id)
  234. * }
  235. * [1] https://protocol.helixcommunity.org/files/2005/devdocs/RDT_Feature_Level_20.txt
  236. * [2] http://www.wireshark.org/docs/dfref/r/rdt.html and
  237. * http://anonsvn.wireshark.org/viewvc/trunk/epan/dissectors/packet-rdt.c
  238. */
  239. init_get_bits(&gb, buf, len << 3);
  240. len_included = get_bits1(&gb);
  241. need_reliable = get_bits1(&gb);
  242. set_id = get_bits(&gb, 5);
  243. skip_bits(&gb, 1);
  244. seq_no = get_bits(&gb, 16);
  245. if (len_included)
  246. skip_bits(&gb, 16);
  247. skip_bits(&gb, 2);
  248. stream_id = get_bits(&gb, 5);
  249. is_keyframe = !get_bits1(&gb);
  250. timestamp = get_bits_long(&gb, 32);
  251. if (set_id == 0x1f)
  252. set_id = get_bits(&gb, 16);
  253. if (need_reliable)
  254. skip_bits(&gb, 16);
  255. if (stream_id == 0x1f)
  256. stream_id = get_bits(&gb, 16);
  257. if (pset_id) *pset_id = set_id;
  258. if (pseq_no) *pseq_no = seq_no;
  259. if (pstream_id) *pstream_id = stream_id;
  260. if (pis_keyframe) *pis_keyframe = is_keyframe;
  261. if (ptimestamp) *ptimestamp = timestamp;
  262. return consumed + (get_bits_count(&gb) >> 3);
  263. }
  264. /**< return 0 on packet, no more left, 1 on packet, 1 on partial packet... */
  265. static int
  266. rdt_parse_packet (PayloadContext *rdt, AVStream *st,
  267. AVPacket *pkt, uint32_t *timestamp,
  268. const uint8_t *buf, int len, int flags)
  269. {
  270. int seq = 1, res;
  271. ByteIOContext pb;
  272. if (rdt->audio_pkt_cnt == 0) {
  273. int pos;
  274. init_put_byte(&pb, buf, len, 0, NULL, NULL, NULL, NULL);
  275. flags = (flags & PKT_FLAG_KEY) ? 2 : 0;
  276. res = ff_rm_parse_packet (rdt->rmctx, &pb, st, rdt->rmst[0], len, pkt,
  277. &seq, &flags, timestamp);
  278. pos = url_ftell(&pb);
  279. if (res < 0)
  280. return res;
  281. rdt->audio_pkt_cnt = res;
  282. if (rdt->audio_pkt_cnt > 0 &&
  283. st->codec->codec_id == CODEC_ID_AAC) {
  284. memcpy (rdt->buffer, buf + pos, len - pos);
  285. rdt->rmctx->pb = av_alloc_put_byte (rdt->buffer, len - pos, 0,
  286. NULL, NULL, NULL, NULL);
  287. }
  288. } else {
  289. rdt->audio_pkt_cnt =
  290. ff_rm_retrieve_cache (rdt->rmctx, rdt->rmctx->pb,
  291. st, rdt->rmst[0], pkt);
  292. if (rdt->audio_pkt_cnt == 0 &&
  293. st->codec->codec_id == CODEC_ID_AAC)
  294. av_freep(&rdt->rmctx->pb);
  295. }
  296. pkt->stream_index = st->index;
  297. pkt->pts = *timestamp;
  298. return rdt->audio_pkt_cnt > 0;
  299. }
  300. int
  301. ff_rdt_parse_packet(RDTDemuxContext *s, AVPacket *pkt,
  302. const uint8_t *buf, int len)
  303. {
  304. int seq_no, flags = 0, stream_id, set_id, is_keyframe;
  305. uint32_t timestamp;
  306. int rv= 0;
  307. if (!s->parse_packet)
  308. return -1;
  309. if (!buf && s->prev_stream_id != -1) {
  310. /* return the next packets, if any */
  311. timestamp= 0; ///< Should not be used if buf is NULL, but should be set to the timestamp of the packet returned....
  312. rv= s->parse_packet(s->dynamic_protocol_context,
  313. s->streams[s->prev_stream_id],
  314. pkt, &timestamp, NULL, 0, flags);
  315. return rv;
  316. }
  317. if (len < 12)
  318. return -1;
  319. rv = ff_rdt_parse_header(buf, len, &set_id, &seq_no, &stream_id, &is_keyframe, &timestamp);
  320. if (rv < 0)
  321. return rv;
  322. if (is_keyframe &&
  323. (set_id != s->prev_set_id || timestamp != s->prev_timestamp ||
  324. stream_id != s->prev_stream_id)) {
  325. flags |= PKT_FLAG_KEY;
  326. s->prev_set_id = set_id;
  327. s->prev_timestamp = timestamp;
  328. }
  329. s->prev_stream_id = stream_id;
  330. buf += rv;
  331. len -= rv;
  332. if (s->prev_stream_id >= s->n_streams) {
  333. s->prev_stream_id = -1;
  334. return -1;
  335. }
  336. rv = s->parse_packet(s->dynamic_protocol_context,
  337. s->streams[s->prev_stream_id],
  338. pkt, &timestamp, buf, len, flags);
  339. return rv;
  340. }
  341. void
  342. ff_rdt_subscribe_rule (char *cmd, int size,
  343. int stream_nr, int rule_nr)
  344. {
  345. av_strlcatf(cmd, size, "stream=%d;rule=%d,stream=%d;rule=%d",
  346. stream_nr, rule_nr * 2, stream_nr, rule_nr * 2 + 1);
  347. }
  348. void
  349. ff_rdt_subscribe_rule2 (RDTDemuxContext *s, char *cmd, int size,
  350. int stream_nr, int rule_nr)
  351. {
  352. PayloadContext *rdt = s->dynamic_protocol_context;
  353. rdt_load_mdpr(rdt, s->streams[0], rule_nr * 2);
  354. }
  355. static unsigned char *
  356. rdt_parse_b64buf (unsigned int *target_len, const char *p)
  357. {
  358. unsigned char *target;
  359. int len = strlen(p);
  360. if (*p == '\"') {
  361. p++;
  362. len -= 2; /* skip embracing " at start/end */
  363. }
  364. *target_len = len * 3 / 4;
  365. target = av_mallocz(*target_len + FF_INPUT_BUFFER_PADDING_SIZE);
  366. av_base64_decode(target, p, *target_len);
  367. return target;
  368. }
  369. static int
  370. rdt_parse_sdp_line (AVFormatContext *s, int st_index,
  371. PayloadContext *rdt, const char *line)
  372. {
  373. AVStream *stream = s->streams[st_index];
  374. const char *p = line;
  375. if (av_strstart(p, "OpaqueData:buffer;", &p)) {
  376. rdt->mlti_data = rdt_parse_b64buf(&rdt->mlti_data_size, p);
  377. } else if (av_strstart(p, "StartTime:integer;", &p))
  378. stream->first_dts = atoi(p);
  379. return 0;
  380. }
  381. static PayloadContext *
  382. rdt_new_extradata (void)
  383. {
  384. PayloadContext *rdt = av_mallocz(sizeof(PayloadContext));
  385. av_open_input_stream(&rdt->rmctx, NULL, "", &rdt_demuxer, NULL);
  386. rdt->rmst[0] = ff_rm_alloc_rmstream();
  387. return rdt;
  388. }
  389. static void
  390. rdt_free_extradata (PayloadContext *rdt)
  391. {
  392. ff_rm_free_rmstream(rdt->rmst[0]);
  393. av_free(rdt->rmst[0]);
  394. if (rdt->rmctx)
  395. av_close_input_stream(rdt->rmctx);
  396. av_freep(&rdt->mlti_data);
  397. av_free(rdt);
  398. }
  399. #define RDT_HANDLER(n, s, t) \
  400. static RTPDynamicProtocolHandler ff_rdt_ ## n ## _handler = { \
  401. s, \
  402. t, \
  403. CODEC_ID_NONE, \
  404. rdt_parse_sdp_line, \
  405. rdt_new_extradata, \
  406. rdt_free_extradata, \
  407. rdt_parse_packet \
  408. };
  409. RDT_HANDLER(live_video, "x-pn-multirate-realvideo-live", CODEC_TYPE_VIDEO);
  410. RDT_HANDLER(live_audio, "x-pn-multirate-realaudio-live", CODEC_TYPE_AUDIO);
  411. RDT_HANDLER(video, "x-pn-realvideo", CODEC_TYPE_VIDEO);
  412. RDT_HANDLER(audio, "x-pn-realaudio", CODEC_TYPE_AUDIO);
  413. void av_register_rdt_dynamic_payload_handlers(void)
  414. {
  415. ff_register_dynamic_payload_handler(&ff_rdt_video_handler);
  416. ff_register_dynamic_payload_handler(&ff_rdt_audio_handler);
  417. ff_register_dynamic_payload_handler(&ff_rdt_live_video_handler);
  418. ff_register_dynamic_payload_handler(&ff_rdt_live_audio_handler);
  419. }