You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

635 lines
22KB

  1. /*
  2. * copyright (c) 2007 Luca Abeni
  3. *
  4. * This file is part of FFmpeg.
  5. *
  6. * FFmpeg is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU Lesser General Public
  8. * License as published by the Free Software Foundation; either
  9. * version 2.1 of the License, or (at your option) any later version.
  10. *
  11. * FFmpeg is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  14. * Lesser General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU Lesser General Public
  17. * License along with FFmpeg; if not, write to the Free Software
  18. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19. */
  20. #include <string.h>
  21. #include "libavutil/avstring.h"
  22. #include "libavutil/base64.h"
  23. #include "libavutil/dict.h"
  24. #include "libavutil/parseutils.h"
  25. #include "libavutil/opt.h"
  26. #include "libavcodec/xiph.h"
  27. #include "libavcodec/mpeg4audio.h"
  28. #include "avformat.h"
  29. #include "internal.h"
  30. #include "avc.h"
  31. #include "rtp.h"
  32. #if CONFIG_NETWORK
  33. #include "network.h"
  34. #endif
  35. #if CONFIG_RTP_MUXER
  36. #define MAX_EXTRADATA_SIZE ((INT_MAX - 10) / 2)
  /**
   * Session-level values used when emitting the leading lines of an SDP
   * description.
   */
  struct sdp_session_level {
      /** protocol version (currently 0) */
      int sdp_version;
      /** session ID */
      int id;
      /** session version */
      int version;
      /** session start time (NTP time, in seconds),
       *  or 0 in case of permanent session */
      int start_time;
      /** session end time (NTP time, in seconds),
       *  or 0 if the session is not bounded */
      int end_time;
      /** TTL, in case of multicast stream */
      int ttl;
      /** username of the session's creator */
      const char *user;
      /** IP address of the machine from which the session was created */
      const char *src_addr;
      /** address type of src_addr */
      const char *src_type;
      /** destination IP address (can be multicast) */
      const char *dst_addr;
      /** destination IP address type */
      const char *dst_type;
      /** session name (can be an empty string) */
      const char *name;
  };
  /**
   * Append an SDP connection line ("c=IN ...") to buff.
   *
   * Nothing is appended when dest_addr is NULL. A NULL dest_type is
   * treated as "IP4".
   *
   * @param buff      NUL-terminated buffer to append to
   * @param size      total size of buff
   * @param dest_addr destination address, or NULL for no connection line
   * @param dest_type address type string, or NULL for "IP4"
   * @param ttl       TTL; only written when positive and the type is "IP4"
   */
  static void sdp_write_address(char *buff, int size, const char *dest_addr,
                                const char *dest_type, int ttl)
  {
      const char *addr_type = dest_type ? dest_type : "IP4";

      if (!dest_addr)
          return;

      /* The TTL should only be specified for IPv4 multicast addresses,
       * not for IPv6. */
      if (ttl <= 0 || strcmp(addr_type, "IP4") != 0) {
          av_strlcatf(buff, size, "c=IN %s %s\r\n", addr_type, dest_addr);
          return;
      }

      av_strlcatf(buff, size, "c=IN %s %s/%d\r\n", addr_type, dest_addr, ttl);
  }
  68. static void sdp_write_header(char *buff, int size, struct sdp_session_level *s)
  69. {
  70. av_strlcatf(buff, size, "v=%d\r\n"
  71. "o=- %d %d IN %s %s\r\n"
  72. "s=%s\r\n",
  73. s->sdp_version,
  74. s->id, s->version, s->src_type, s->src_addr,
  75. s->name);
  76. sdp_write_address(buff, size, s->dst_addr, s->dst_type, s->ttl);
  77. av_strlcatf(buff, size, "t=%d %d\r\n"
  78. "a=tool:libavformat " AV_STRINGIFY(LIBAVFORMAT_VERSION) "\r\n",
  79. s->start_time, s->end_time);
  80. }
  #if CONFIG_NETWORK
  /**
   * Resolve dest_addr to a numeric IP address and report its address type.
   *
   * type is always set to "IP4" first, and changed to "IP6" when the
   * resolved address family is AF_INET6. On successful resolution dest_addr
   * is overwritten in place with the numeric host string.
   *
   * @param dest_addr host name or address; replaced by the numeric form
   * @param size      size of the dest_addr buffer
   * @param type      receives the address type string ("IP4" or "IP6")
   * @param type_size size of the type buffer
   * @return the result of ff_is_multicast_address() for the resolved
   *         address, or 0 when dest_addr is empty or cannot be resolved
   */
  static int resolve_destination(char *dest_addr, int size, char *type,
                                 int type_size)
  {
      struct addrinfo hints, *ai;
      int is_multicast;

      av_strlcpy(type, "IP4", type_size);
      if (!dest_addr[0])
          return 0;

      /* Resolve the destination, since it must be written
       * as a numeric IP address in the SDP. */
      memset(&hints, 0, sizeof(hints));
      if (getaddrinfo(dest_addr, NULL, &hints, &ai))
          return 0;
      getnameinfo(ai->ai_addr, ai->ai_addrlen, dest_addr, size,
                  NULL, 0, NI_NUMERICHOST);
  #ifdef AF_INET6
      if (ai->ai_family == AF_INET6)
          av_strlcpy(type, "IP6", type_size);
  #endif
      is_multicast = ff_is_multicast_address(ai->ai_addr);
      freeaddrinfo(ai);
      return is_multicast;
  }
  #else
  /**
   * Fallback used when network support is not compiled in.
   *
   * No resolution is performed and dest_addr is left untouched. type is
   * still set to "IP4", matching the default of the network-enabled
   * variant, so callers never read an uninitialised type buffer.
   *
   * @return always 0 (not multicast)
   */
  static int resolve_destination(char *dest_addr, int size, char *type,
                                 int type_size)
  {
      av_strlcpy(type, "IP4", type_size);
      return 0;
  }
  #endif
  /**
   * Extract the destination host, port and TTL from an output URL.
   *
   * The host part of url is always copied into dest_addr. The port and TTL
   * are only reported for "rtp" URLs; for any other protocol *ttl is 0 and
   * 0 is returned.
   *
   * @param dest_addr receives the host part of url
   * @param size      size of the dest_addr buffer
   * @param ttl       receives the "ttl" query value, 5 when a query string
   *                  exists without a "ttl" tag, or 0 otherwise
   * @param url       URL to parse
   * @return the port parsed by av_url_split() for rtp URLs, 0 otherwise
   */
  static int sdp_get_address(char *dest_addr, int size, int *ttl, const char *url)
  {
      char scheme[32];
      char ttl_text[64];
      const char *query;
      int port;

      av_url_split(scheme, sizeof(scheme), NULL, 0, dest_addr, size, &port,
                   NULL, 0, url);
      *ttl = 0;

      /* The url isn't for the actual rtp sessions,
       * don't parse out anything else than the destination. */
      if (strcmp(scheme, "rtp") != 0)
          return 0;

      query = strchr(url, '?');
      if (query) {
          if (av_find_info_tag(ttl_text, sizeof(ttl_text), "ttl", query))
              *ttl = strtol(ttl_text, NULL, 10);
          else
              *ttl = 5;
      }

      return port;
  }
  136. #define MAX_PSET_SIZE 1024
  137. static char *extradata2psets(AVCodecContext *c)
  138. {
  139. char *psets, *p;
  140. const uint8_t *r;
  141. const char *pset_string = "; sprop-parameter-sets=";
  142. if (c->extradata_size > MAX_EXTRADATA_SIZE) {
  143. av_log(c, AV_LOG_ERROR, "Too much extradata!\n");
  144. return NULL;
  145. }
  146. if (c->extradata[0] == 1) {
  147. uint8_t *dummy_p;
  148. int dummy_int;
  149. AVBitStreamFilterContext *bsfc= av_bitstream_filter_init("h264_mp4toannexb");
  150. if (!bsfc) {
  151. av_log(c, AV_LOG_ERROR, "Cannot open the h264_mp4toannexb BSF!\n");
  152. return NULL;
  153. }
  154. av_bitstream_filter_filter(bsfc, c, NULL, &dummy_p, &dummy_int, NULL, 0, 0);
  155. av_bitstream_filter_close(bsfc);
  156. }
  157. psets = av_mallocz(MAX_PSET_SIZE);
  158. if (psets == NULL) {
  159. av_log(c, AV_LOG_ERROR, "Cannot allocate memory for the parameter sets.\n");
  160. return NULL;
  161. }
  162. memcpy(psets, pset_string, strlen(pset_string));
  163. p = psets + strlen(pset_string);
  164. r = ff_avc_find_startcode(c->extradata, c->extradata + c->extradata_size);
  165. while (r < c->extradata + c->extradata_size) {
  166. const uint8_t *r1;
  167. uint8_t nal_type;
  168. while (!*(r++));
  169. nal_type = *r & 0x1f;
  170. r1 = ff_avc_find_startcode(r, c->extradata + c->extradata_size);
  171. if (nal_type != 7 && nal_type != 8) { /* Only output SPS and PPS */
  172. r = r1;
  173. continue;
  174. }
  175. if (p != (psets + strlen(pset_string))) {
  176. *p = ',';
  177. p++;
  178. }
  179. if (av_base64_encode(p, MAX_PSET_SIZE - (p - psets), r, r1 - r) == NULL) {
  180. av_log(c, AV_LOG_ERROR, "Cannot Base64-encode %td %td!\n", MAX_PSET_SIZE - (p - psets), r1 - r);
  181. av_free(psets);
  182. return NULL;
  183. }
  184. p += strlen(p);
  185. r = r1;
  186. }
  187. return psets;
  188. }
  189. static char *extradata2config(AVCodecContext *c)
  190. {
  191. char *config;
  192. if (c->extradata_size > MAX_EXTRADATA_SIZE) {
  193. av_log(c, AV_LOG_ERROR, "Too much extradata!\n");
  194. return NULL;
  195. }
  196. config = av_malloc(10 + c->extradata_size * 2);
  197. if (config == NULL) {
  198. av_log(c, AV_LOG_ERROR, "Cannot allocate memory for the config info.\n");
  199. return NULL;
  200. }
  201. memcpy(config, "; config=", 9);
  202. ff_data_to_hex(config + 9, c->extradata, c->extradata_size, 0);
  203. config[9 + c->extradata_size * 2] = 0;
  204. return config;
  205. }
  206. static char *xiph_extradata2config(AVCodecContext *c)
  207. {
  208. char *config, *encoded_config;
  209. uint8_t *header_start[3];
  210. int headers_len, header_len[3], config_len;
  211. int first_header_size;
  212. switch (c->codec_id) {
  213. case CODEC_ID_THEORA:
  214. first_header_size = 42;
  215. break;
  216. case CODEC_ID_VORBIS:
  217. first_header_size = 30;
  218. break;
  219. default:
  220. av_log(c, AV_LOG_ERROR, "Unsupported Xiph codec ID\n");
  221. return NULL;
  222. }
  223. if (avpriv_split_xiph_headers(c->extradata, c->extradata_size,
  224. first_header_size, header_start,
  225. header_len) < 0) {
  226. av_log(c, AV_LOG_ERROR, "Extradata corrupt.\n");
  227. return NULL;
  228. }
  229. headers_len = header_len[0] + header_len[2];
  230. config_len = 4 + // count
  231. 3 + // ident
  232. 2 + // packet size
  233. 1 + // header count
  234. 2 + // header size
  235. headers_len; // and the rest
  236. config = av_malloc(config_len);
  237. if (!config)
  238. goto xiph_fail;
  239. encoded_config = av_malloc(AV_BASE64_SIZE(config_len));
  240. if (!encoded_config) {
  241. av_free(config);
  242. goto xiph_fail;
  243. }
  244. config[0] = config[1] = config[2] = 0;
  245. config[3] = 1;
  246. config[4] = (RTP_XIPH_IDENT >> 16) & 0xff;
  247. config[5] = (RTP_XIPH_IDENT >> 8) & 0xff;
  248. config[6] = (RTP_XIPH_IDENT ) & 0xff;
  249. config[7] = (headers_len >> 8) & 0xff;
  250. config[8] = headers_len & 0xff;
  251. config[9] = 2;
  252. config[10] = header_len[0];
  253. config[11] = 0; // size of comment header; nonexistent
  254. memcpy(config + 12, header_start[0], header_len[0]);
  255. memcpy(config + 12 + header_len[0], header_start[2], header_len[2]);
  256. av_base64_encode(encoded_config, AV_BASE64_SIZE(config_len),
  257. config, config_len);
  258. av_free(config);
  259. return encoded_config;
  260. xiph_fail:
  261. av_log(c, AV_LOG_ERROR,
  262. "Not enough memory for configuration string\n");
  263. return NULL;
  264. }
  265. static int latm_context2profilelevel(AVCodecContext *c)
  266. {
  267. /* MP4A-LATM
  268. * The RTP payload format specification is described in RFC 3016
  269. * The encoding specifications are provided in ISO/IEC 14496-3 */
  270. int profile_level = 0x2B;
  271. /* TODO: AAC Profile only supports AAC LC Object Type.
  272. * Different Object Types should implement different Profile Levels */
  273. if (c->sample_rate <= 24000) {
  274. if (c->channels <= 2)
  275. profile_level = 0x28; // AAC Profile, Level 1
  276. } else if (c->sample_rate <= 48000) {
  277. if (c->channels <= 2) {
  278. profile_level = 0x29; // AAC Profile, Level 2
  279. } else if (c->channels <= 5) {
  280. profile_level = 0x2A; // AAC Profile, Level 4
  281. }
  282. } else if (c->sample_rate <= 96000) {
  283. if (c->channels <= 5) {
  284. profile_level = 0x2B; // AAC Profile, Level 5
  285. }
  286. }
  287. return profile_level;
  288. }
  289. static char *latm_context2config(AVCodecContext *c)
  290. {
  291. /* MP4A-LATM
  292. * The RTP payload format specification is described in RFC 3016
  293. * The encoding specifications are provided in ISO/IEC 14496-3 */
  294. uint8_t config_byte[6];
  295. int rate_index;
  296. char *config;
  297. for (rate_index = 0; rate_index < 16; rate_index++)
  298. if (avpriv_mpeg4audio_sample_rates[rate_index] == c->sample_rate)
  299. break;
  300. if (rate_index == 16) {
  301. av_log(c, AV_LOG_ERROR, "Unsupported sample rate\n");
  302. return NULL;
  303. }
  304. config_byte[0] = 0x40;
  305. config_byte[1] = 0;
  306. config_byte[2] = 0x20 | rate_index;
  307. config_byte[3] = c->channels << 4;
  308. config_byte[4] = 0x3f;
  309. config_byte[5] = 0xc0;
  310. config = av_malloc(6*2+1);
  311. if (!config) {
  312. av_log(c, AV_LOG_ERROR, "Cannot allocate memory for the config info.\n");
  313. return NULL;
  314. }
  315. ff_data_to_hex(config, config_byte, 6, 1);
  316. config[12] = 0;
  317. return config;
  318. }
  319. static char *sdp_write_media_attributes(char *buff, int size, AVCodecContext *c, int payload_type, AVFormatContext *fmt)
  320. {
  321. char *config = NULL;
  322. switch (c->codec_id) {
  323. case CODEC_ID_H264:
  324. if (c->extradata_size) {
  325. config = extradata2psets(c);
  326. }
  327. av_strlcatf(buff, size, "a=rtpmap:%d H264/90000\r\n"
  328. "a=fmtp:%d packetization-mode=1%s\r\n",
  329. payload_type,
  330. payload_type, config ? config : "");
  331. break;
  332. case CODEC_ID_H263:
  333. case CODEC_ID_H263P:
  334. /* a=framesize is required by 3GPP TS 26.234 (PSS). It
  335. * actually specifies the maximum video size, but we only know
  336. * the current size. This is required for playback on Android
  337. * stagefright and on Samsung bada. */
  338. av_strlcatf(buff, size, "a=rtpmap:%d H263-2000/90000\r\n"
  339. "a=framesize:%d %d-%d\r\n",
  340. payload_type,
  341. payload_type, c->width, c->height);
  342. break;
  343. case CODEC_ID_MPEG4:
  344. if (c->extradata_size) {
  345. config = extradata2config(c);
  346. }
  347. av_strlcatf(buff, size, "a=rtpmap:%d MP4V-ES/90000\r\n"
  348. "a=fmtp:%d profile-level-id=1%s\r\n",
  349. payload_type,
  350. payload_type, config ? config : "");
  351. break;
  352. case CODEC_ID_AAC:
  353. if (fmt && fmt->oformat && fmt->oformat->priv_class &&
  354. av_opt_flag_is_set(fmt->priv_data, "rtpflags", "latm")) {
  355. config = latm_context2config(c);
  356. if (!config)
  357. return NULL;
  358. av_strlcatf(buff, size, "a=rtpmap:%d MP4A-LATM/%d/%d\r\n"
  359. "a=fmtp:%d profile-level-id=%d;cpresent=0;config=%s\r\n",
  360. payload_type, c->sample_rate, c->channels,
  361. payload_type, latm_context2profilelevel(c), config);
  362. } else {
  363. if (c->extradata_size) {
  364. config = extradata2config(c);
  365. } else {
  366. /* FIXME: maybe we can forge config information based on the
  367. * codec parameters...
  368. */
  369. av_log(c, AV_LOG_ERROR, "AAC with no global headers is currently not supported.\n");
  370. return NULL;
  371. }
  372. if (config == NULL) {
  373. return NULL;
  374. }
  375. av_strlcatf(buff, size, "a=rtpmap:%d MPEG4-GENERIC/%d/%d\r\n"
  376. "a=fmtp:%d profile-level-id=1;"
  377. "mode=AAC-hbr;sizelength=13;indexlength=3;"
  378. "indexdeltalength=3%s\r\n",
  379. payload_type, c->sample_rate, c->channels,
  380. payload_type, config);
  381. }
  382. break;
  383. case CODEC_ID_PCM_S16BE:
  384. if (payload_type >= RTP_PT_PRIVATE)
  385. av_strlcatf(buff, size, "a=rtpmap:%d L16/%d/%d\r\n",
  386. payload_type,
  387. c->sample_rate, c->channels);
  388. break;
  389. case CODEC_ID_PCM_MULAW:
  390. if (payload_type >= RTP_PT_PRIVATE)
  391. av_strlcatf(buff, size, "a=rtpmap:%d PCMU/%d/%d\r\n",
  392. payload_type,
  393. c->sample_rate, c->channels);
  394. break;
  395. case CODEC_ID_PCM_ALAW:
  396. if (payload_type >= RTP_PT_PRIVATE)
  397. av_strlcatf(buff, size, "a=rtpmap:%d PCMA/%d/%d\r\n",
  398. payload_type,
  399. c->sample_rate, c->channels);
  400. break;
  401. case CODEC_ID_AMR_NB:
  402. av_strlcatf(buff, size, "a=rtpmap:%d AMR/%d/%d\r\n"
  403. "a=fmtp:%d octet-align=1\r\n",
  404. payload_type, c->sample_rate, c->channels,
  405. payload_type);
  406. break;
  407. case CODEC_ID_AMR_WB:
  408. av_strlcatf(buff, size, "a=rtpmap:%d AMR-WB/%d/%d\r\n"
  409. "a=fmtp:%d octet-align=1\r\n",
  410. payload_type, c->sample_rate, c->channels,
  411. payload_type);
  412. break;
  413. case CODEC_ID_VORBIS:
  414. if (c->extradata_size)
  415. config = xiph_extradata2config(c);
  416. else
  417. av_log(c, AV_LOG_ERROR, "Vorbis configuration info missing\n");
  418. if (!config)
  419. return NULL;
  420. av_strlcatf(buff, size, "a=rtpmap:%d vorbis/%d/%d\r\n"
  421. "a=fmtp:%d configuration=%s\r\n",
  422. payload_type, c->sample_rate, c->channels,
  423. payload_type, config);
  424. break;
  425. case CODEC_ID_THEORA: {
  426. const char *pix_fmt;
  427. if (c->extradata_size)
  428. config = xiph_extradata2config(c);
  429. else
  430. av_log(c, AV_LOG_ERROR, "Theora configuation info missing\n");
  431. if (!config)
  432. return NULL;
  433. switch (c->pix_fmt) {
  434. case PIX_FMT_YUV420P:
  435. pix_fmt = "YCbCr-4:2:0";
  436. break;
  437. case PIX_FMT_YUV422P:
  438. pix_fmt = "YCbCr-4:2:2";
  439. break;
  440. case PIX_FMT_YUV444P:
  441. pix_fmt = "YCbCr-4:4:4";
  442. break;
  443. default:
  444. av_log(c, AV_LOG_ERROR, "Unsupported pixel format.\n");
  445. return NULL;
  446. }
  447. av_strlcatf(buff, size, "a=rtpmap:%d theora/90000\r\n"
  448. "a=fmtp:%d delivery-method=inline; "
  449. "width=%d; height=%d; sampling=%s; "
  450. "configuration=%s\r\n",
  451. payload_type, payload_type,
  452. c->width, c->height, pix_fmt, config);
  453. break;
  454. }
  455. case CODEC_ID_VP8:
  456. av_strlcatf(buff, size, "a=rtpmap:%d VP8/90000\r\n",
  457. payload_type);
  458. break;
  459. case CODEC_ID_ADPCM_G722:
  460. if (payload_type >= RTP_PT_PRIVATE)
  461. av_strlcatf(buff, size, "a=rtpmap:%d G722/%d/%d\r\n",
  462. payload_type,
  463. 8000, c->channels);
  464. break;
  465. case CODEC_ID_ADPCM_G726: {
  466. if (payload_type >= RTP_PT_PRIVATE)
  467. av_strlcatf(buff, size, "a=rtpmap:%d G726-%d/%d\r\n",
  468. payload_type,
  469. c->bits_per_coded_sample*8,
  470. c->sample_rate);
  471. break;
  472. }
  473. default:
  474. /* Nothing special to do here... */
  475. break;
  476. }
  477. av_free(config);
  478. return buff;
  479. }
  480. void ff_sdp_write_media(char *buff, int size, AVCodecContext *c, const char *dest_addr, const char *dest_type, int port, int ttl, AVFormatContext *fmt)
  481. {
  482. const char *type;
  483. int payload_type;
  484. payload_type = ff_rtp_get_payload_type(fmt, c);
  485. switch (c->codec_type) {
  486. case AVMEDIA_TYPE_VIDEO : type = "video" ; break;
  487. case AVMEDIA_TYPE_AUDIO : type = "audio" ; break;
  488. case AVMEDIA_TYPE_SUBTITLE: type = "text" ; break;
  489. default : type = "application"; break;
  490. }
  491. av_strlcatf(buff, size, "m=%s %d RTP/AVP %d\r\n", type, port, payload_type);
  492. sdp_write_address(buff, size, dest_addr, dest_type, ttl);
  493. if (c->bit_rate) {
  494. av_strlcatf(buff, size, "b=AS:%d\r\n", c->bit_rate / 1000);
  495. }
  496. sdp_write_media_attributes(buff, size, c, payload_type, fmt);
  497. }
  498. int av_sdp_create(AVFormatContext *ac[], int n_files, char *buf, int size)
  499. {
  500. AVDictionaryEntry *title = av_dict_get(ac[0]->metadata, "title", NULL, 0);
  501. struct sdp_session_level s;
  502. int i, j, port, ttl, is_multicast;
  503. char dst[32], dst_type[5];
  504. memset(buf, 0, size);
  505. memset(&s, 0, sizeof(struct sdp_session_level));
  506. s.user = "-";
  507. s.src_addr = "127.0.0.1"; /* FIXME: Properly set this */
  508. s.src_type = "IP4";
  509. s.name = title ? title->value : "No Name";
  510. port = 0;
  511. ttl = 0;
  512. if (n_files == 1) {
  513. port = sdp_get_address(dst, sizeof(dst), &ttl, ac[0]->filename);
  514. is_multicast = resolve_destination(dst, sizeof(dst), dst_type,
  515. sizeof(dst_type));
  516. if (!is_multicast)
  517. ttl = 0;
  518. if (dst[0]) {
  519. s.dst_addr = dst;
  520. s.dst_type = dst_type;
  521. s.ttl = ttl;
  522. if (!strcmp(dst_type, "IP6")) {
  523. s.src_addr = "::1";
  524. s.src_type = "IP6";
  525. }
  526. }
  527. }
  528. sdp_write_header(buf, size, &s);
  529. dst[0] = 0;
  530. for (i = 0; i < n_files; i++) {
  531. if (n_files != 1) {
  532. port = sdp_get_address(dst, sizeof(dst), &ttl, ac[i]->filename);
  533. is_multicast = resolve_destination(dst, sizeof(dst), dst_type,
  534. sizeof(dst_type));
  535. if (!is_multicast)
  536. ttl = 0;
  537. }
  538. for (j = 0; j < ac[i]->nb_streams; j++) {
  539. ff_sdp_write_media(buf, size,
  540. ac[i]->streams[j]->codec, dst[0] ? dst : NULL,
  541. dst_type, (port > 0) ? port + j * 2 : 0, ttl,
  542. ac[i]);
  543. if (port <= 0) {
  544. av_strlcatf(buf, size,
  545. "a=control:streamid=%d\r\n", i + j);
  546. }
  547. }
  548. }
  549. return 0;
  550. }
  551. #else
  552. int av_sdp_create(AVFormatContext *ac[], int n_files, char *buf, int size)
  553. {
  554. return AVERROR(ENOSYS);
  555. }
  556. void ff_sdp_write_media(char *buff, int size, AVCodecContext *c, const char *dest_addr, const char *dest_type, int port, int ttl, AVFormatContext *fmt)
  557. {
  558. }
  559. #endif
  #if FF_API_SDP_CREATE
  /**
   * Alternative entry point, compiled only when FF_API_SDP_CREATE is set,
   * that forwards all arguments unchanged to av_sdp_create().
   *
   * @return the value returned by av_sdp_create()
   */
  int avf_sdp_create(AVFormatContext *ac[], int n_files, char *buff, int size)
  {
      int ret = av_sdp_create(ac, n_files, buff, size);

      return ret;
  }
  #endif