You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

639 lines
18KB

  1. /*
  2. * Apple HTTP Live Streaming segmenter
  3. * Copyright (c) 2012, Luca Barbato
  4. *
  5. * This file is part of Libav.
  6. *
  7. * Libav is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * Libav is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with Libav; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include <float.h>
  22. #include <stdint.h>
  23. #include <config.h>
  24. #if CONFIG_OPENSSL
  25. #include <openssl/rand.h>
  26. #endif
  27. #include "libavutil/mathematics.h"
  28. #include "libavutil/parseutils.h"
  29. #include "libavutil/avstring.h"
  30. #include "libavutil/intreadwrite.h"
  31. #include "libavutil/opt.h"
  32. #include "libavutil/random_seed.h"
  33. #include "libavutil/log.h"
  34. #include "avformat.h"
  35. #include "internal.h"
  /**
   * One media segment referenced by the playlist.
   *
   * Entries are chained into a singly linked list whose head and tail are
   * kept in HLSContext.
   */
  typedef struct ListEntry ListEntry;

  struct ListEntry {
      char       name[1024]; /* segment name as printed in the playlist */
      int64_t    duration;   /* segment duration in AV_TIME_BASE units */
      int        discont;    /* non-zero: an #EXT-X-DISCONTINUITY tag precedes the entry */
      ListEntry *next;       /* following entry, NULL for the last one */
  };
  42. typedef struct HLSContext {
  43. const AVClass *class; // Class for private options.
  44. unsigned number;
  45. int64_t sequence;
  46. int64_t start_sequence;
  47. AVOutputFormat *oformat;
  48. AVFormatContext *avf;
  49. float time; // Set by a private option.
  50. int size; // Set by a private option.
  51. int wrap; // Set by a private option.
  52. int version; // Set by a private option.
  53. int allowcache;
  54. int64_t recording_time;
  55. int has_video;
  56. // The following timestamps are in AV_TIME_BASE units.
  57. int64_t start_pts;
  58. int64_t end_pts;
  59. int64_t duration; // last segment duration computed so far.
  60. int nb_entries;
  61. ListEntry *list;
  62. ListEntry *end_list;
  63. char *basename;
  64. char *baseurl;
  65. int encrypt; // Set by a private option.
  66. char *key; // Set by a private option.
  67. int key_len;
  68. char *key_url; // Set by a private option.
  69. char *iv; // Set by a private option.
  70. int iv_len;
  71. int recovered;
  72. char *key_basename;
  73. AVDictionary *enc_opts;
  74. } HLSContext;
  /**
   * Fill a buffer with cryptographically strong random bytes.
   *
   * @param buf destination buffer
   * @param len number of bytes to generate
   * @return 0 on success, AVERROR(EIO) if OpenSSL could not provide the
   *         bytes, AVERROR(ENOSYS) when built without OpenSSL
   */
  static int randomize(uint8_t *buf, int len)
  {
  #if CONFIG_OPENSSL
      /*
       * RAND_bytes() returns 1 on success, 0 on failure and -1 when the
       * active RAND method does not support the operation, so only an
       * explicit 1 may be treated as success.
       */
      if (RAND_bytes(buf, len) == 1)
          return 0;
      return AVERROR(EIO);
  #else
      return AVERROR(ENOSYS);
  #endif
  }
  85. static void free_encryption(AVFormatContext *s)
  86. {
  87. HLSContext *hls = s->priv_data;
  88. av_dict_free(&hls->enc_opts);
  89. av_freep(&hls->key_basename);
  90. }
  91. static int dict_set_bin(AVDictionary **dict, const char *key,
  92. uint8_t *buf, size_t len)
  93. {
  94. char hex[33];
  95. ff_data_to_hex(hex, buf, len, 0);
  96. hex[32] = '\0';
  97. return av_dict_set(dict, key, hex, 0);
  98. }
  99. static int setup_encryption(AVFormatContext *s)
  100. {
  101. HLSContext *hls = s->priv_data;
  102. AVIOContext *out = NULL;
  103. int len, ret;
  104. uint8_t buf[16];
  105. uint8_t *k = NULL;
  106. len = strlen(hls->basename) + 4 + 1;
  107. hls->key_basename = av_mallocz(len);
  108. if (!hls->key_basename)
  109. return AVERROR(ENOMEM);
  110. av_strlcpy(hls->key_basename, hls->basename + 7, len);
  111. av_strlcat(hls->key_basename, ".key", len);
  112. if (hls->key) {
  113. if (hls->key_len != 16) {
  114. av_log(s, AV_LOG_ERROR,
  115. "Invalid key size %d, expected 16-bytes hex-coded key\n",
  116. hls->key_len);
  117. return AVERROR(EINVAL);
  118. }
  119. if ((ret = dict_set_bin(&hls->enc_opts, "key", hls->key, hls->key_len)) < 0)
  120. return ret;
  121. k = hls->key;
  122. } else {
  123. if (hls->start_sequence < 0) {
  124. ret = s->io_open(s, &out, hls->key_basename, AVIO_FLAG_READ, NULL);
  125. if (ret < 0) {
  126. av_log(s, AV_LOG_WARNING,
  127. "Cannot recover the key, generating a new one.\n");
  128. } else {
  129. avio_read(out, buf, 16);
  130. k = buf;
  131. avio_close(out);
  132. }
  133. }
  134. if (!k) {
  135. if ((ret = randomize(buf, sizeof(buf))) < 0) {
  136. av_log(s, AV_LOG_ERROR, "Cannot generate a strong random key\n");
  137. return ret;
  138. }
  139. }
  140. if ((ret = dict_set_bin(&hls->enc_opts, "key", buf, sizeof(buf))) < 0)
  141. return ret;
  142. k = buf;
  143. }
  144. if (hls->iv) {
  145. if (hls->iv_len != 16) {
  146. av_log(s, AV_LOG_ERROR,
  147. "Invalid key size %d, expected 16-bytes hex-coded initialization vector\n",
  148. hls->iv_len);
  149. return AVERROR(EINVAL);
  150. }
  151. if ((ret = dict_set_bin(&hls->enc_opts, "iv", hls->iv, hls->iv_len)) < 0)
  152. return ret;
  153. }
  154. if ((ret = s->io_open(s, &out, hls->key_basename, AVIO_FLAG_WRITE, NULL)) < 0)
  155. return ret;
  156. avio_write(out, k, 16);
  157. avio_close(out);
  158. return 0;
  159. }
  160. static int hls_mux_init(AVFormatContext *s)
  161. {
  162. HLSContext *hls = s->priv_data;
  163. AVFormatContext *oc;
  164. int i;
  165. hls->avf = oc = avformat_alloc_context();
  166. if (!oc)
  167. return AVERROR(ENOMEM);
  168. oc->oformat = hls->oformat;
  169. oc->interrupt_callback = s->interrupt_callback;
  170. oc->opaque = s->opaque;
  171. oc->io_open = s->io_open;
  172. oc->io_close = s->io_close;
  173. for (i = 0; i < s->nb_streams; i++) {
  174. AVStream *st;
  175. if (!(st = avformat_new_stream(oc, NULL)))
  176. return AVERROR(ENOMEM);
  177. avcodec_parameters_copy(st->codecpar, s->streams[i]->codecpar);
  178. st->sample_aspect_ratio = s->streams[i]->sample_aspect_ratio;
  179. st->time_base = s->streams[i]->time_base;
  180. }
  181. return 0;
  182. }
  183. static int append_entry(HLSContext *hls, int64_t duration, const char *name,
  184. int discont)
  185. {
  186. ListEntry *en = av_malloc(sizeof(*en));
  187. if (!en)
  188. return AVERROR(ENOMEM);
  189. av_strlcpy(en->name, name, sizeof(en->name));
  190. en->discont = discont;
  191. en->duration = duration;
  192. en->next = NULL;
  193. if (!hls->list)
  194. hls->list = en;
  195. else
  196. hls->end_list->next = en;
  197. hls->end_list = en;
  198. if (hls->nb_entries >= hls->size) {
  199. en = hls->list;
  200. hls->list = en->next;
  201. av_free(en);
  202. } else
  203. hls->nb_entries++;
  204. hls->sequence++;
  205. return 0;
  206. }
  207. static void free_entries(HLSContext *hls)
  208. {
  209. ListEntry *p = hls->list, *en;
  210. while(p) {
  211. en = p;
  212. p = p->next;
  213. av_free(en);
  214. }
  215. }
  216. static int hls_window(AVFormatContext *s, int last)
  217. {
  218. HLSContext *hls = s->priv_data;
  219. ListEntry *en;
  220. int64_t target_duration = 0;
  221. int ret = 0;
  222. AVIOContext *out = NULL;
  223. char temp_filename[1024];
  224. int64_t sequence = FFMAX(hls->start_sequence, hls->sequence - hls->size);
  225. snprintf(temp_filename, sizeof(temp_filename), "%s.tmp", s->filename);
  226. if ((ret = s->io_open(s, &out, temp_filename, AVIO_FLAG_WRITE, NULL)) < 0)
  227. goto fail;
  228. for (en = hls->list; en; en = en->next) {
  229. if (target_duration < en->duration)
  230. target_duration = en->duration;
  231. }
  232. avio_printf(out, "#EXTM3U\n");
  233. avio_printf(out, "#EXT-X-VERSION:%d\n", hls->version);
  234. if (hls->allowcache == 0 || hls->allowcache == 1) {
  235. avio_printf(out, "#EXT-X-ALLOW-CACHE:%s\n", hls->allowcache == 0 ? "NO" : "YES");
  236. }
  237. avio_printf(out, "#EXT-X-TARGETDURATION:%"PRId64"\n",
  238. av_rescale_rnd(target_duration, 1, AV_TIME_BASE,
  239. AV_ROUND_UP));
  240. avio_printf(out, "#EXT-X-MEDIA-SEQUENCE:%"PRId64"\n", sequence);
  241. av_log(s, AV_LOG_VERBOSE, "EXT-X-MEDIA-SEQUENCE:%"PRId64"\n",
  242. sequence);
  243. for (en = hls->list; en; en = en->next) {
  244. if (en->discont) {
  245. avio_printf(out, "#EXT-X-DISCONTINUITY\n");
  246. }
  247. if (hls->encrypt) {
  248. char *key_url;
  249. if (hls->key_url)
  250. key_url = hls->key_url;
  251. else
  252. key_url = hls->baseurl;
  253. avio_printf(out, "#EXT-X-KEY:METHOD=AES-128");
  254. avio_printf(out, ",URI=\"");
  255. if (key_url)
  256. avio_printf(out, "%s", key_url);
  257. avio_printf(out, "%s\"", av_basename(hls->key_basename));
  258. if (hls->iv)
  259. avio_printf(out, ",IV=\"0x%s\"", hls->iv);
  260. avio_printf(out, "\n");
  261. }
  262. if (hls->version > 2)
  263. avio_printf(out, "#EXTINF:%f\n",
  264. (double)en->duration / AV_TIME_BASE);
  265. else
  266. avio_printf(out, "#EXTINF:%"PRId64",\n",
  267. av_rescale(en->duration, 1, AV_TIME_BASE));
  268. if (hls->baseurl)
  269. avio_printf(out, "%s", hls->baseurl);
  270. avio_printf(out, "%s\n", en->name);
  271. }
  272. if (last)
  273. avio_printf(out, "#EXT-X-ENDLIST\n");
  274. fail:
  275. ff_format_io_close(s, &out);
  276. if (ret >= 0)
  277. ff_rename(temp_filename, s->filename);
  278. return ret;
  279. }
  280. static int hls_start(AVFormatContext *s)
  281. {
  282. HLSContext *c = s->priv_data;
  283. AVFormatContext *oc = c->avf;
  284. int err = 0;
  285. AVDictionary *opts = NULL;
  286. if (av_get_frame_filename(oc->filename, sizeof(oc->filename),
  287. c->basename, c->wrap ? c->sequence % c->wrap : c->sequence) < 0)
  288. return AVERROR(EINVAL);
  289. c->number++;
  290. if (c->encrypt) {
  291. if ((err = av_dict_copy(&opts, c->enc_opts, 0)) < 0)
  292. return err;
  293. if (!c->iv) {
  294. uint8_t iv[16] = { 0 };
  295. char buf[33];
  296. AV_WB64(iv + 8, c->sequence);
  297. ff_data_to_hex(buf, iv, sizeof(iv), 0);
  298. buf[32] = '\0';
  299. if ((err = av_dict_set(&opts, "iv", buf, 0)) < 0)
  300. goto fail;
  301. }
  302. }
  303. if ((err = s->io_open(s, &oc->pb, oc->filename, AVIO_FLAG_WRITE, &opts)) < 0)
  304. return err;
  305. if (oc->oformat->priv_class && oc->priv_data)
  306. av_opt_set(oc->priv_data, "mpegts_flags", "resend_headers", 0);
  307. fail:
  308. av_dict_free(&opts);
  309. return err;
  310. }
  311. static int read_chomp_line(AVIOContext *s, char *buf, int maxlen)
  312. {
  313. int len = ff_get_line(s, buf, maxlen);
  314. while (len > 0 && av_isspace(buf[len - 1]))
  315. buf[--len] = '\0';
  316. return len;
  317. }
  318. static int hls_recover(AVFormatContext *s)
  319. {
  320. HLSContext *hls = s->priv_data;
  321. char line[1024];
  322. AVIOContext *io;
  323. const char *ptr;
  324. int ret, is_segment = 0, is_discont = 0;
  325. int64_t duration = 0;
  326. ret = s->io_open(s, &io, s->filename, AVIO_FLAG_READ, NULL);
  327. if (ret < 0) {
  328. av_log(s, AV_LOG_WARNING,
  329. "Cannot recover the playlist, generating a new one.\n");
  330. hls->start_sequence = 0;
  331. hls->sequence = 0;
  332. return 0;
  333. }
  334. read_chomp_line(io, line, sizeof(line));
  335. if (strcmp(line, "#EXTM3U")) {
  336. av_log(s, AV_LOG_ERROR,
  337. "The playlist file is present but unparsable."
  338. " Please remove it.\n");
  339. return AVERROR_INVALIDDATA;
  340. }
  341. while (!io->eof_reached) {
  342. read_chomp_line(io, line, sizeof(line));
  343. if (av_strstart(line, "#EXT-X-MEDIA-SEQUENCE:", &ptr)) {
  344. hls->sequence = hls->start_sequence = atoi(ptr);
  345. } else if (av_strstart(line, "#EXTINF:", &ptr)) {
  346. is_segment = 1;
  347. duration = atof(ptr) * AV_TIME_BASE;
  348. } else if (av_strstart(line, "#EXT-X-DISCONTINUITY", NULL)) {
  349. is_discont = 1;
  350. } else if (av_strstart(line, "#", NULL)) {
  351. continue;
  352. } else if (line[0]) {
  353. if (is_segment) {
  354. append_entry(hls, duration, av_basename(line), is_discont);
  355. is_segment = 0;
  356. is_discont = 0;
  357. }
  358. }
  359. }
  360. hls->recovered = 1;
  361. return 0;
  362. }
  363. static int hls_setup(AVFormatContext *s)
  364. {
  365. HLSContext *hls = s->priv_data;
  366. const char *pattern = "%d.ts";
  367. int basename_size = strlen(s->filename) + strlen(pattern) + 1;
  368. char *p;
  369. int ret;
  370. if (hls->encrypt)
  371. basename_size += 7;
  372. hls->basename = av_mallocz(basename_size);
  373. if (!hls->basename)
  374. return AVERROR(ENOMEM);
  375. // TODO: support protocol nesting?
  376. if (hls->encrypt)
  377. strcpy(hls->basename, "crypto:");
  378. av_strlcat(hls->basename, s->filename, basename_size);
  379. p = strrchr(hls->basename, '.');
  380. if (p)
  381. *p = '\0';
  382. if (hls->encrypt) {
  383. ret = setup_encryption(s);
  384. if (ret < 0)
  385. return ret;
  386. }
  387. if (hls->start_sequence < 0) {
  388. ret = hls_recover(s);
  389. if (ret < 0)
  390. return ret;
  391. }
  392. av_strlcat(hls->basename, pattern, basename_size);
  393. return 0;
  394. }
  395. static int hls_write_header(AVFormatContext *s)
  396. {
  397. HLSContext *hls = s->priv_data;
  398. int ret, i;
  399. hls->sequence = hls->start_sequence;
  400. hls->recording_time = hls->time * AV_TIME_BASE;
  401. hls->start_pts = AV_NOPTS_VALUE;
  402. for (i = 0; i < s->nb_streams; i++)
  403. hls->has_video +=
  404. s->streams[i]->codecpar->codec_type == AVMEDIA_TYPE_VIDEO;
  405. if (hls->has_video > 1)
  406. av_log(s, AV_LOG_WARNING,
  407. "More than a single video stream present, "
  408. "expect issues decoding it.\n");
  409. hls->oformat = av_guess_format("mpegts", NULL, NULL);
  410. if (!hls->oformat) {
  411. ret = AVERROR_MUXER_NOT_FOUND;
  412. goto fail;
  413. }
  414. if ((ret = hls_setup(s)) < 0)
  415. goto fail;
  416. if ((ret = hls_mux_init(s)) < 0)
  417. goto fail;
  418. if ((ret = hls_start(s)) < 0)
  419. goto fail;
  420. if ((ret = avformat_write_header(hls->avf, NULL)) < 0)
  421. return ret;
  422. fail:
  423. if (ret) {
  424. av_free(hls->basename);
  425. if (hls->avf)
  426. avformat_free_context(hls->avf);
  427. free_encryption(s);
  428. }
  429. return ret;
  430. }
  431. static int hls_write_packet(AVFormatContext *s, AVPacket *pkt)
  432. {
  433. HLSContext *hls = s->priv_data;
  434. AVFormatContext *oc = hls->avf;
  435. AVStream *st = s->streams[pkt->stream_index];
  436. int64_t end_pts = hls->recording_time * hls->number;
  437. int64_t pts = av_rescale_q(pkt->pts, st->time_base, AV_TIME_BASE_Q);
  438. int ret, can_split = 1;
  439. if (hls->start_pts == AV_NOPTS_VALUE) {
  440. hls->start_pts = pts;
  441. hls->end_pts = pts;
  442. }
  443. if (hls->has_video) {
  444. can_split = st->codecpar->codec_type == AVMEDIA_TYPE_VIDEO &&
  445. pkt->flags & AV_PKT_FLAG_KEY;
  446. }
  447. if (pkt->pts == AV_NOPTS_VALUE)
  448. can_split = 0;
  449. else
  450. hls->duration = pts - hls->end_pts;
  451. if (can_split && pts - hls->start_pts >= end_pts) {
  452. ret = append_entry(hls, hls->duration, av_basename(hls->avf->filename), hls->recovered);
  453. hls->recovered = 0;
  454. if (ret)
  455. return ret;
  456. hls->end_pts = pts;
  457. hls->duration = 0;
  458. av_write_frame(oc, NULL); /* Flush any buffered data */
  459. ff_format_io_close(s, &oc->pb);
  460. ret = hls_start(s);
  461. if (ret)
  462. return ret;
  463. oc = hls->avf;
  464. if ((ret = hls_window(s, 0)) < 0)
  465. return ret;
  466. }
  467. ret = ff_write_chained(oc, pkt->stream_index, pkt, s);
  468. return ret;
  469. }
  470. static int hls_write_trailer(struct AVFormatContext *s)
  471. {
  472. HLSContext *hls = s->priv_data;
  473. AVFormatContext *oc = hls->avf;
  474. av_write_trailer(oc);
  475. ff_format_io_close(s, &oc->pb);
  476. avformat_free_context(oc);
  477. av_free(hls->basename);
  478. append_entry(hls, hls->duration, av_basename(hls->avf->filename), 0);
  479. hls_window(s, 1);
  480. free_entries(hls);
  481. free_encryption(s);
  482. return 0;
  483. }
  484. #define OFFSET(x) offsetof(HLSContext, x)
  485. #define E AV_OPT_FLAG_ENCODING_PARAM
  486. static const AVOption options[] = {
  487. {"start_number", "first number in the sequence", OFFSET(start_sequence),AV_OPT_TYPE_INT64, {.i64 = 0}, -1, INT64_MAX, E, "start_number"},
  488. {"recover", "If there is already a m3u8 file in the path, populate the sequence from it", 0, AV_OPT_TYPE_CONST, {.i64 = -1}, 0, 0, E, "start_number"},
  489. {"hls_time", "segment length in seconds", OFFSET(time), AV_OPT_TYPE_FLOAT, {.dbl = 2}, 0, FLT_MAX, E},
  490. {"hls_list_size", "maximum number of playlist entries", OFFSET(size), AV_OPT_TYPE_INT, {.i64 = 5}, 0, INT_MAX, E},
  491. {"hls_wrap", "number after which the index wraps", OFFSET(wrap), AV_OPT_TYPE_INT, {.i64 = 0}, 0, INT_MAX, E},
  492. {"hls_allow_cache", "explicitly set whether the client MAY (1) or MUST NOT (0) cache media segments", OFFSET(allowcache), AV_OPT_TYPE_INT, {.i64 = -1}, INT_MIN, INT_MAX, E},
  493. {"hls_base_url", "url to prepend to each playlist entry", OFFSET(baseurl), AV_OPT_TYPE_STRING, {.str = NULL}, 0, 0, E},
  494. {"hls_version", "protocol version", OFFSET(version), AV_OPT_TYPE_INT, {.i64 = 3}, 2, 3, E},
  495. {"hls_enc", "AES128 encryption support", OFFSET(encrypt), AV_OPT_TYPE_INT, {.i64 = 0}, 0, 1, E},
  496. {"hls_enc_key", "use the specified hex-coded 16byte key to encrypt the segments", OFFSET(key), AV_OPT_TYPE_BINARY, .flags = E},
  497. {"hls_enc_key_url", "url to access the key to decrypt the segments", OFFSET(key_url), AV_OPT_TYPE_STRING, {.str = NULL}, 0, 0, E},
  498. {"hls_enc_iv", "use the specified hex-coded 16byte initialization vector", OFFSET(iv), AV_OPT_TYPE_BINARY, .flags = E},
  499. { NULL },
  500. };
  501. static const AVClass hls_class = {
  502. .class_name = "hls muxer",
  503. .item_name = av_default_item_name,
  504. .option = options,
  505. .version = LIBAVUTIL_VERSION_INT,
  506. };
  507. AVOutputFormat ff_hls_muxer = {
  508. .name = "hls",
  509. .long_name = NULL_IF_CONFIG_SMALL("Apple HTTP Live Streaming"),
  510. .extensions = "m3u8",
  511. .priv_data_size = sizeof(HLSContext),
  512. .audio_codec = AV_CODEC_ID_AAC,
  513. .video_codec = AV_CODEC_ID_H264,
  514. .flags = AVFMT_NOFILE | AVFMT_ALLOW_FLUSH,
  515. .write_header = hls_write_header,
  516. .write_packet = hls_write_packet,
  517. .write_trailer = hls_write_trailer,
  518. .priv_class = &hls_class,
  519. };