You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

414 lines
14KB

  1. /*
  2. * RTP H264 Protocol (RFC3984)
  3. * Copyright (c) 2006 Ryan Martell
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file rtp_h264.c
  23. * @brief H.264 / RTP Code (RFC3984)
  24. * @author Ryan Martell <rdm4@martellventures.com>
  25. *
   * @note
   * This currently supports the following packetization modes:
   * Single NAL Unit Mode (0) and Non-Interleaved Mode (1).
   * Interleaved Mode (2) is not supported yet; it requires implementing
   * the STAP-B, MTAP16, MTAP24 and FU-B packet types.
  32. *
  33. * @note TODO:
  34. * 1) RTCP sender reports for udp streams are required..
  35. *
  36. */
  37. #include "libavutil/base64.h"
  38. #include "libavutil/avstring.h"
  39. #include "libavcodec/bitstream.h"
  40. #include "avformat.h"
  41. #include "mpegts.h"
  42. #include <unistd.h>
  43. #include "network.h"
  44. #include <assert.h>
  45. #include "rtp.h"
  46. #include "rtp_h264.h"
  /**
   * Private state of the RTP/H.264 payload handler.
   */
  struct PayloadContext {
      /** Sanity marker; compared against MAGIC_COOKIE before the context is used. */
      unsigned long cookie;

      /* Values taken from the SDP setup parameters. */
      uint8_t profile_idc;        ///< first byte of profile-level-id
      uint8_t profile_iop;        ///< second byte of profile-level-id
      uint8_t level_idc;          ///< third byte of profile-level-id
      int     packetization_mode; ///< value of the packetization-mode attribute

  #ifdef DEBUG
      /** Counters of received packets, indexed by the 5-bit NAL unit type. */
      int packet_types_received[32];
  #endif
  };

  /** Cookie value of a live context: proves the pointer is ours and has not been freed. */
  #define MAGIC_COOKIE (0xdeadbeef)
  /** Cookie value written into a context right before it is freed. */
  #define DEAD_COOKIE (0xdeaddead)
  63. /* ---------------- private code */
  64. static void sdp_parse_fmtp_config_h264(AVStream * stream,
  65. PayloadContext * h264_data,
  66. char *attr, char *value)
  67. {
  68. AVCodecContext *codec = stream->codec;
  69. assert(codec->codec_id == CODEC_ID_H264);
  70. assert(h264_data != NULL);
  71. if (!strcmp(attr, "packetization-mode")) {
  72. av_log(NULL, AV_LOG_DEBUG, "H.264/RTP Packetization Mode: %d\n", atoi(value));
  73. h264_data->packetization_mode = atoi(value);
  74. /*
  75. Packetization Mode:
  76. 0 or not present: Single NAL mode (Only nals from 1-23 are allowed)
  77. 1: Non-interleaved Mode: 1-23, 24 (STAP-A), 28 (FU-A) are allowed.
  78. 2: Interleaved Mode: 25 (STAP-B), 26 (MTAP16), 27 (MTAP24), 28 (FU-A), and 29 (FU-B) are allowed.
  79. */
  80. if (h264_data->packetization_mode > 1)
  81. av_log(stream, AV_LOG_ERROR,
  82. "H.264/RTP Interleaved RTP mode is not supported yet.");
  83. } else if (!strcmp(attr, "profile-level-id")) {
  84. if (strlen(value) == 6) {
  85. char buffer[3];
  86. // 6 characters=3 bytes, in hex.
  87. uint8_t profile_idc;
  88. uint8_t profile_iop;
  89. uint8_t level_idc;
  90. buffer[0] = value[0]; buffer[1] = value[1]; buffer[2] = '\0';
  91. profile_idc = strtol(buffer, NULL, 16);
  92. buffer[0] = value[2]; buffer[1] = value[3];
  93. profile_iop = strtol(buffer, NULL, 16);
  94. buffer[0] = value[4]; buffer[1] = value[5];
  95. level_idc = strtol(buffer, NULL, 16);
  96. // set the parameters...
  97. av_log(NULL, AV_LOG_DEBUG,
  98. "H.264/RTP Profile IDC: %x Profile IOP: %x Level: %x\n",
  99. profile_idc, profile_iop, level_idc);
  100. h264_data->profile_idc = profile_idc;
  101. h264_data->profile_iop = profile_iop;
  102. h264_data->level_idc = level_idc;
  103. }
  104. } else if (!strcmp(attr, "sprop-parameter-sets")) {
  105. uint8_t start_sequence[]= { 0, 0, 1 };
  106. codec->extradata_size= 0;
  107. codec->extradata= NULL;
  108. while (*value) {
  109. char base64packet[1024];
  110. uint8_t decoded_packet[1024];
  111. uint32_t packet_size;
  112. char *dst = base64packet;
  113. while (*value && *value != ','
  114. && (dst - base64packet) < sizeof(base64packet) - 1) {
  115. *dst++ = *value++;
  116. }
  117. *dst++ = '\0';
  118. if (*value == ',')
  119. value++;
  120. packet_size= av_base64_decode(decoded_packet, base64packet, sizeof(decoded_packet));
  121. if (packet_size) {
  122. uint8_t *dest= av_malloc(packet_size+sizeof(start_sequence)+codec->extradata_size);
  123. if(dest)
  124. {
  125. if(codec->extradata_size)
  126. {
  127. // av_realloc?
  128. memcpy(dest, codec->extradata, codec->extradata_size);
  129. av_free(codec->extradata);
  130. }
  131. memcpy(dest+codec->extradata_size, start_sequence, sizeof(start_sequence));
  132. memcpy(dest+codec->extradata_size+sizeof(start_sequence), decoded_packet, packet_size);
  133. codec->extradata= dest;
  134. codec->extradata_size+= sizeof(start_sequence)+packet_size;
  135. } else {
  136. av_log(NULL, AV_LOG_ERROR, "H.264/RTP Unable to allocate memory for extradata!");
  137. }
  138. }
  139. }
  140. av_log(NULL, AV_LOG_DEBUG, "H.264/RTP Extradata set to %p (size: %d)!", codec->extradata, codec->extradata_size);
  141. }
  142. }
  143. // return 0 on packet, no more left, 1 on packet, 1 on partial packet...
  144. static int h264_handle_packet(PayloadContext *data,
  145. AVStream *st,
  146. AVPacket * pkt,
  147. uint32_t * timestamp,
  148. const uint8_t * buf,
  149. int len, int flags)
  150. {
  151. uint8_t nal = buf[0];
  152. uint8_t type = (nal & 0x1f);
  153. int result= 0;
  154. uint8_t start_sequence[]= {0, 0, 1};
  155. #ifdef DEBUG
  156. assert(data);
  157. assert(data->cookie == MAGIC_COOKIE);
  158. #endif
  159. assert(buf);
  160. if (type >= 1 && type <= 23)
  161. type = 1; // simplify the case. (these are all the nal types used internally by the h264 codec)
  162. switch (type) {
  163. case 0: // undefined;
  164. result= -1;
  165. break;
  166. case 1:
  167. av_new_packet(pkt, len+sizeof(start_sequence));
  168. memcpy(pkt->data, start_sequence, sizeof(start_sequence));
  169. memcpy(pkt->data+sizeof(start_sequence), buf, len);
  170. #ifdef DEBUG
  171. data->packet_types_received[nal & 0x1f]++;
  172. #endif
  173. break;
  174. case 24: // STAP-A (one packet, multiple nals)
  175. // consume the STAP-A NAL
  176. buf++;
  177. len--;
  178. // first we are going to figure out the total size....
  179. {
  180. int pass= 0;
  181. int total_length= 0;
  182. uint8_t *dst= NULL;
  183. for(pass= 0; pass<2; pass++) {
  184. const uint8_t *src= buf;
  185. int src_len= len;
  186. do {
  187. uint16_t nal_size = AV_RB16(src); // this going to be a problem if unaligned (can it be?)
  188. // consume the length of the aggregate...
  189. src += 2;
  190. src_len -= 2;
  191. if (nal_size <= src_len) {
  192. if(pass==0) {
  193. // counting...
  194. total_length+= sizeof(start_sequence)+nal_size;
  195. } else {
  196. // copying
  197. assert(dst);
  198. memcpy(dst, start_sequence, sizeof(start_sequence));
  199. dst+= sizeof(start_sequence);
  200. memcpy(dst, src, nal_size);
  201. #ifdef DEBUG
  202. data->packet_types_received[*src & 0x1f]++;
  203. #endif
  204. dst+= nal_size;
  205. }
  206. } else {
  207. av_log(NULL, AV_LOG_ERROR,
  208. "nal size exceeds length: %d %d\n", nal_size, src_len);
  209. }
  210. // eat what we handled...
  211. src += nal_size;
  212. src_len -= nal_size;
  213. if (src_len < 0)
  214. av_log(NULL, AV_LOG_ERROR,
  215. "Consumed more bytes than we got! (%d)\n", src_len);
  216. } while (src_len > 2); // because there could be rtp padding..
  217. if(pass==0) {
  218. // now we know the total size of the packet (with the start sequences added)
  219. av_new_packet(pkt, total_length);
  220. dst= pkt->data;
  221. } else {
  222. assert(dst-pkt->data==total_length);
  223. }
  224. }
  225. }
  226. break;
  227. case 25: // STAP-B
  228. case 26: // MTAP-16
  229. case 27: // MTAP-24
  230. case 29: // FU-B
  231. av_log(NULL, AV_LOG_ERROR,
  232. "Unhandled type (%d) (See RFC for implementation details\n",
  233. type);
  234. result= -1;
  235. break;
  236. case 28: // FU-A (fragmented nal)
  237. buf++;
  238. len--; // skip the fu_indicator
  239. {
  240. // these are the same as above, we just redo them here for clarity...
  241. uint8_t fu_indicator = nal;
  242. uint8_t fu_header = *buf; // read the fu_header.
  243. uint8_t start_bit = fu_header >> 7;
  244. // uint8_t end_bit = (fu_header & 0x40) >> 6;
  245. uint8_t nal_type = (fu_header & 0x1f);
  246. uint8_t reconstructed_nal;
  247. // reconstruct this packet's true nal; only the data follows..
  248. reconstructed_nal = fu_indicator & (0xe0); // the original nal forbidden bit and NRI are stored in this packet's nal;
  249. reconstructed_nal |= nal_type;
  250. // skip the fu_header...
  251. buf++;
  252. len--;
  253. #ifdef DEBUG
  254. if (start_bit)
  255. data->packet_types_received[nal_type]++;
  256. #endif
  257. if(start_bit) {
  258. // copy in the start sequence, and the reconstructed nal....
  259. av_new_packet(pkt, sizeof(start_sequence)+sizeof(nal)+len);
  260. memcpy(pkt->data, start_sequence, sizeof(start_sequence));
  261. pkt->data[sizeof(start_sequence)]= reconstructed_nal;
  262. memcpy(pkt->data+sizeof(start_sequence)+sizeof(nal), buf, len);
  263. } else {
  264. av_new_packet(pkt, len);
  265. memcpy(pkt->data, buf, len);
  266. }
  267. }
  268. break;
  269. case 30: // undefined
  270. case 31: // undefined
  271. default:
  272. av_log(NULL, AV_LOG_ERROR, "Undefined type (%d)", type);
  273. result= -1;
  274. break;
  275. }
  276. return result;
  277. }
  278. /* ---------------- public code */
  279. static PayloadContext *h264_new_extradata(void)
  280. {
  281. PayloadContext *data =
  282. av_mallocz(sizeof(PayloadContext) +
  283. FF_INPUT_BUFFER_PADDING_SIZE);
  284. if (data) {
  285. data->cookie = MAGIC_COOKIE;
  286. }
  287. return data;
  288. }
  289. static void h264_free_extradata(PayloadContext *data)
  290. {
  291. #ifdef DEBUG
  292. int ii;
  293. for (ii = 0; ii < 32; ii++) {
  294. if (data->packet_types_received[ii])
  295. av_log(NULL, AV_LOG_DEBUG, "Received %d packets of type %d\n",
  296. data->packet_types_received[ii], ii);
  297. }
  298. #endif
  299. assert(data);
  300. assert(data->cookie == MAGIC_COOKIE);
  301. // avoid stale pointers (assert)
  302. data->cookie = DEAD_COOKIE;
  303. // and clear out this...
  304. av_free(data);
  305. }
  306. static int parse_h264_sdp_line(AVFormatContext *s, int st_index,
  307. PayloadContext *h264_data, const char *line)
  308. {
  309. AVStream *stream = s->streams[st_index];
  310. AVCodecContext *codec = stream->codec;
  311. const char *p = line;
  312. assert(h264_data->cookie == MAGIC_COOKIE);
  313. if (av_strstart(p, "framesize:", &p)) {
  314. char buf1[50];
  315. char *dst = buf1;
  316. // remove the protocol identifier..
  317. while (*p && *p == ' ') p++; // strip spaces.
  318. while (*p && *p != ' ') p++; // eat protocol identifier
  319. while (*p && *p == ' ') p++; // strip trailing spaces.
  320. while (*p && *p != '-' && (buf1 - dst) < sizeof(buf1) - 1) {
  321. *dst++ = *p++;
  322. }
  323. *dst = '\0';
  324. // a='framesize:96 320-240'
  325. // set our parameters..
  326. codec->width = atoi(buf1);
  327. codec->height = atoi(p + 1); // skip the -
  328. codec->pix_fmt = PIX_FMT_YUV420P;
  329. } else if (av_strstart(p, "fmtp:", &p)) {
  330. char attr[256];
  331. char value[4096];
  332. // remove the protocol identifier..
  333. while (*p && *p == ' ') p++; // strip spaces.
  334. while (*p && *p != ' ') p++; // eat protocol identifier
  335. while (*p && *p == ' ') p++; // strip trailing spaces.
  336. /* loop on each attribute */
  337. while (rtsp_next_attr_and_value
  338. (&p, attr, sizeof(attr), value, sizeof(value))) {
  339. /* grab the codec extra_data from the config parameter of the fmtp line */
  340. sdp_parse_fmtp_config_h264(stream, h264_data, attr, value);
  341. }
  342. } else if (av_strstart(p, "cliprect:", &p)) {
  343. // could use this if we wanted.
  344. }
  345. av_set_pts_info(stream, 33, 1, 90000); // 33 should be right, because the pts is 64 bit? (done elsewhere; this is a one time thing)
  346. return 0; // keep processing it the normal way...
  347. }
  348. /**
  349. This is the structure for expanding on the dynamic rtp protocols (makes everything static. yay!)
  350. */
  351. RTPDynamicProtocolHandler ff_h264_dynamic_handler = {
  352. "H264",
  353. CODEC_TYPE_VIDEO,
  354. CODEC_ID_H264,
  355. parse_h264_sdp_line,
  356. h264_new_extradata,
  357. h264_free_extradata,
  358. h264_handle_packet
  359. };