2 * Apple HTTP Live Streaming demuxer
3 * Copyright (c) 2010 Martin Storsjo
5 * This file is part of FFmpeg.
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
24 * Apple HTTP Live Streaming demuxer
25 * http://tools.ietf.org/html/draft-pantos-http-live-streaming
28 #include "libavutil/avstring.h"
29 #include "libavutil/intreadwrite.h"
30 #include "libavutil/mathematics.h"
31 #include "libavutil/opt.h"
32 #include "libavutil/dict.h"
33 #include "libavutil/time.h"
36 #include "avio_internal.h"
39 #define INITIAL_BUFFER_SIZE 32768
42 * An apple http stream consists of a playlist with media segment files,
43 * played sequentially. There may be several playlists with the same
44 * video content, in different bandwidth variants, that are played in
45 * parallel (preferably only one bandwidth variant at a time). In this case,
46 * the user supplied the url to a main playlist that only lists the variant
49 * If the main playlist doesn't point at any variants, we still create
50 * one anonymous toplevel variant for this, to maintain the structure.
60 char url[MAX_URL_SIZE];
61 char key[MAX_URL_SIZE];
62 enum KeyType key_type;
67 * Each variant has its own demuxer. If it currently is active,
68 * it has an open AVIOContext too, and potentially an AVPacket
69 * containing the next packet from this stream.
73 char url[MAX_URL_SIZE];
77 AVFormatContext *parent;
84 int64_t target_duration;
87 struct segment **segments;
88 int needed, cur_needed;
90 int64_t last_load_time;
92 char key_url[MAX_URL_SIZE];
/* Private state of the HLS demuxer. The demuxer callbacks in this file
 * obtain it from the AVFormatContext's priv_data. Only part of the
 * member list is present in this excerpt. */
96 typedef struct HLSContext {
/* Array of variant pointers; walked elsewhere with n_variants as bound. */
98 struct variant **variants;
/* Derived from the dts of a buffered packet in hls_read_packet;
 * AV_NOPTS_VALUE until one has been recorded. */
102 int64_t first_timestamp;
/* Target of a pending seek; AV_NOPTS_VALUE when no seek is in progress. */
103 int64_t seek_timestamp;
/* Set in hls_read_header to the address of the parent context's
 * interrupt_callback. */
105 AVIOInterruptCB *interrupt_callback;
106 char *user_agent; ///< holds HTTP user agent set as an AVOption to the HTTP protocol context
107 char *cookies; ///< holds HTTP cookie values set in either the initial response or as an AVOption to the HTTP protocol context
108 char *headers; ///< holds HTTP headers set as an AVOption to the HTTP protocol context
/* Read one line from s into buf (bounded by maxlen, via ff_get_line) and
 * walk back over trailing whitespace characters. The loop body and the
 * return statement are not part of this excerpt; the callers visible in
 * this file ignore the return value. */
111 static int read_chomp_line(AVIOContext *s, char *buf, int maxlen)
113 int len = ff_get_line(s, buf, maxlen);
/* len > 0 guards the buf[len - 1] access on an empty line. */
114 while (len > 0 && av_isspace(buf[len - 1]))
/* Release every segment owned by var, then the segments array itself.
 * NOTE(review): parse_playlist appends to this list again after calling
 * this function, so n_segments presumably gets reset on a line that is
 * not shown here - confirm. */
119 static void free_segment_list(struct variant *var)
122 for (i = 0; i < var->n_segments; i++)
123 av_free(var->segments[i]);
124 av_freep(&var->segments);
/* Tear down all variants of c: for each one, free its segment list, its
 * buffered packet and its AVIOContext buffer, close its input and its
 * nested demuxer context. Afterwards free the variants array and the
 * brokered cookies / user_agent strings.
 * NOTE(review): hls_read_header also fills c->headers through av_opt_get,
 * but no matching release is visible in this excerpt - confirm it is
 * freed somewhere, otherwise it leaks. */
128 static void free_variant_list(HLSContext *c)
131 for (i = 0; i < c->n_variants; i++) {
132 struct variant *var = c->variants[i];
133 free_segment_list(var);
134 av_free_packet(&var->pkt);
135 av_free(var->pb.buffer);
137 ffurl_close(var->input);
140 avformat_close_input(&var->ctx);
144 av_freep(&c->variants);
145 av_freep(&c->cookies);
146 av_freep(&c->user_agent);
151 * Used to reset a statically allocated AVPacket to a clean slate,
152 * containing no data.
/* Only the signature is visible in this excerpt. Callers invoke it right
 * after av_free_packet() or after handing a packet to the caller, and
 * hls_read_packet tests pkt.data to decide whether a packet is buffered,
 * so this presumably clears pkt->data - verify against the body. */
154 static void reset_packet(AVPacket *pkt)
/* Allocate a zero-initialised variant, give it an empty packet, record
 * its bandwidth, resolve url against base into var->url and append the
 * variant to c->variants.
 * Callers treat a NULL result as out-of-memory; the allocation check and
 * the return statement themselves are not part of this excerpt. */
160 static struct variant *new_variant(HLSContext *c, int bandwidth,
161 const char *url, const char *base)
163 struct variant *var = av_mallocz(sizeof(struct variant));
166 reset_packet(&var->pkt);
167 var->bandwidth = bandwidth;
168 ff_make_absolute_url(var->url, sizeof(var->url), base, url);
169 dynarray_add(&c->variants, &c->n_variants, var);
173 struct variant_info {
/* Key/value callback passed to ff_parse_key_value for #EXT-X-STREAM-INF
 * attribute lists. For the BANDWIDTH attribute it points *dest at
 * info->bandwidth and reports that buffer's size through *dest_len.
 * Only the first key_len characters of key are compared. */
177 static void handle_variant_args(struct variant_info *info, const char *key,
178 int key_len, char **dest, int *dest_len)
180 if (!strncmp(key, "BANDWIDTH=", key_len)) {
181 *dest = info->bandwidth;
182 *dest_len = sizeof(info->bandwidth);
187 char uri[MAX_URL_SIZE];
/* Key/value callback passed to ff_parse_key_value for #EXT-X-KEY
 * attribute lists. Selects the destination buffer inside info for the
 * METHOD, URI and IV attributes and reports its size through *dest_len.
 * The *dest assignments for URI and IV are not part of this excerpt.
 * Only the first key_len characters of key are compared. */
192 static void handle_key_args(struct key_info *info, const char *key,
193 int key_len, char **dest, int *dest_len)
195 if (!strncmp(key, "METHOD=", key_len)) {
196 *dest = info->method;
197 *dest_len = sizeof(info->method);
198 } else if (!strncmp(key, "URI=", key_len)) {
200 *dest_len = sizeof(info->uri);
201 } else if (!strncmp(key, "IV=", key_len)) {
203 *dest_len = sizeof(info->iv);
/* Parse the playlist at url, either a main playlist listing variants or
 * a media playlist listing segments.
 *
 * c   - demuxer state; new variants are appended to it.
 * url - playlist location, also the base for resolving relative URLs.
 * var - variant being (re)loaded; callers pass NULL for the first parse.
 * in  - already opened input; callers pass NULL when the playlist has to
 *       be opened here (the guarding condition is not in this excerpt).
 *
 * Callers treat a negative return value as an AVERROR code. */
207 static int parse_playlist(HLSContext *c, const char *url,
208 struct variant *var, AVIOContext *in)
210 int ret = 0, is_segment = 0, is_variant = 0, bandwidth = 0;
211 int64_t duration = 0;
212 enum KeyType key_type = KEY_NONE;
215 char key[MAX_URL_SIZE] = "";
216 char line[MAX_URL_SIZE];
219 uint8_t *new_url = NULL;
222 AVDictionary *opts = NULL;
224 /* Some HLS servers don't like being sent the range header */
225 av_dict_set(&opts, "seekable", "0", 0);
227 // broker prior HTTP options that should be consistent across requests
228 av_dict_set(&opts, "user-agent", c->user_agent, 0);
229 av_dict_set(&opts, "cookies", c->cookies, 0);
230 av_dict_set(&opts, "headers", c->headers, 0);
232 ret = avio_open2(&in, url, AVIO_FLAG_READ,
233 c->interrupt_callback, &opts);
/* Ask the opened input for a "location" option; what is done with
 * new_url afterwards is not part of this excerpt. */
239 if (av_opt_get(in, "location", AV_OPT_SEARCH_CHILDREN, &new_url) >= 0)
/* The first line has to be exactly #EXTM3U. */
242 read_chomp_line(in, line, sizeof(line));
243 if (strcmp(line, "#EXTM3U")) {
244 ret = AVERROR_INVALIDDATA;
/* Drop the previous segment list before the playlist is re-read. */
249 free_segment_list(var);
252 while (!url_feof(in)) {
253 read_chomp_line(in, line, sizeof(line));
254 if (av_strstart(line, "#EXT-X-STREAM-INF:", &ptr)) {
255 struct variant_info info = {{0}};
257 ff_parse_key_value(ptr, (ff_parse_key_val_cb) handle_variant_args,
259 bandwidth = atoi(info.bandwidth);
260 } else if (av_strstart(line, "#EXT-X-KEY:", &ptr)) {
261 struct key_info info = {{0}};
262 ff_parse_key_value(ptr, (ff_parse_key_val_cb) handle_key_args,
266 if (!strcmp(info.method, "AES-128"))
267 key_type = KEY_AES_128;
/* An explicit IV is given as a hex string with a 0x / 0X prefix. */
268 if (!strncmp(info.iv, "0x", 2) || !strncmp(info.iv, "0X", 2)) {
269 ff_hex_to_data(iv, info.iv + 2);
272 av_strlcpy(key, info.uri, sizeof(key));
273 } else if (av_strstart(line, "#EXT-X-TARGETDURATION:", &ptr)) {
/* Creates a variant for the playlist URL itself; presumably only when
 * var is still NULL (the guard is not part of this excerpt). */
275 var = new_variant(c, 0, url, NULL);
277 ret = AVERROR(ENOMEM);
281 var->target_duration = atoi(ptr) * AV_TIME_BASE;
282 } else if (av_strstart(line, "#EXT-X-MEDIA-SEQUENCE:", &ptr)) {
284 var = new_variant(c, 0, url, NULL);
286 ret = AVERROR(ENOMEM);
290 var->start_seq_no = atoi(ptr);
291 } else if (av_strstart(line, "#EXT-X-ENDLIST", &ptr)) {
294 } else if (av_strstart(line, "#EXTINF:", &ptr)) {
/* Parsed value is scaled by AV_TIME_BASE before being stored. */
296 duration = atof(ptr) * AV_TIME_BASE;
297 } else if (av_strstart(line, "#", NULL)) {
/* Any other non-empty line is a URI: a variant playlist or a segment. */
299 } else if (line[0]) {
301 if (!new_variant(c, bandwidth, line, url)) {
302 ret = AVERROR(ENOMEM);
311 var = new_variant(c, 0, url, NULL);
313 ret = AVERROR(ENOMEM);
317 seg = av_malloc(sizeof(struct segment));
319 ret = AVERROR(ENOMEM);
322 seg->duration = duration;
323 seg->key_type = key_type;
325 memcpy(seg->iv, iv, sizeof(iv));
/* Alternative IV: all zero except the segment's sequence number written
 * as a big-endian 32-bit value at byte offset 12. */
327 int seq = var->start_seq_no + var->n_segments;
328 memset(seg->iv, 0, sizeof(seg->iv));
329 AV_WB32(seg->iv + 12, seq);
/* Key and segment URLs are resolved relative to the playlist URL. */
331 ff_make_absolute_url(seg->key, sizeof(seg->key), url, key);
332 ff_make_absolute_url(seg->url, sizeof(seg->url), url, line);
333 dynarray_add(&var->segments, &var->n_segments, seg);
/* Remember when the playlist was loaded; read_data uses this to decide
 * when a reload is due. */
339 var->last_load_time = av_gettime();
/* Open var->input for the segment that var->cur_seq_no refers to.
 *
 * Unencrypted segments are opened directly. For AES-128 segments the key
 * is fetched (unless the key URL equals the cached var->key_url), the
 * segment URL is wrapped in a "crypto" URL and key / IV are handed over
 * as hex-string options before connecting. Any other key type yields
 * AVERROR(ENOSYS).
 *
 * No bounds check on the segment index is visible here; read_data
 * compares cur_seq_no against the playlist range before calling. */
348 static int open_input(HLSContext *c, struct variant *var)
350 AVDictionary *opts = NULL;
352 struct segment *seg = var->segments[var->cur_seq_no - var->start_seq_no];
354 // broker prior HTTP options that should be consistent across requests
355 av_dict_set(&opts, "user-agent", c->user_agent, 0);
356 av_dict_set(&opts, "cookies", c->cookies, 0);
357 av_dict_set(&opts, "headers", c->headers, 0);
358 av_dict_set(&opts, "seekable", "0", 0);
360 if (seg->key_type == KEY_NONE) {
361 ret = ffurl_open(&var->input, seg->url, AVIO_FLAG_READ,
362 &var->parent->interrupt_callback, &opts);
364 } else if (seg->key_type == KEY_AES_128) {
/* iv / key hold 32 hex characters plus the terminator written below;
 * this assumes seg->iv and var->key are 16 bytes each (their
 * declarations are not part of this excerpt) - TODO confirm. */
365 char iv[33], key[33], url[MAX_URL_SIZE];
/* Only download the key when its URL differs from the cached one. */
366 if (strcmp(seg->key, var->key_url)) {
368 if (ffurl_open(&uc, seg->key, AVIO_FLAG_READ,
369 &var->parent->interrupt_callback, &opts) == 0) {
370 if (ffurl_read_complete(uc, var->key, sizeof(var->key))
371 != sizeof(var->key)) {
372 av_log(NULL, AV_LOG_ERROR, "Unable to read key file %s\n",
377 av_log(NULL, AV_LOG_ERROR, "Unable to open key file %s\n",
380 av_strlcpy(var->key_url, seg->key, sizeof(var->key_url));
382 ff_data_to_hex(iv, seg->iv, sizeof(seg->iv), 0);
383 ff_data_to_hex(key, var->key, sizeof(var->key), 0);
384 iv[32] = key[32] = '\0';
/* URLs that already carry a scheme get the "crypto+" prefix, all
 * others the "crypto:" prefix. */
385 if (strstr(seg->url, "://"))
386 snprintf(url, sizeof(url), "crypto+%s", seg->url);
388 snprintf(url, sizeof(url), "crypto:%s", seg->url);
389 if ((ret = ffurl_alloc(&var->input, url, AVIO_FLAG_READ,
390 &var->parent->interrupt_callback)) < 0)
392 av_opt_set(var->input->priv_data, "key", key, 0);
393 av_opt_set(var->input->priv_data, "iv", iv, 0);
394 /* Need to repopulate options */
396 av_dict_set(&opts, "seekable", "0", 0);
397 if ((ret = ffurl_connect(var->input, &opts)) < 0) {
398 ffurl_close(var->input);
405 ret = AVERROR(ENOSYS);
/* Read callback of a variant's AVIOContext (installed with
 * ffio_init_context in hls_read_header); opaque is the struct variant.
 *
 * Reloads the playlist when the reload interval has elapsed, skips over
 * segments that have dropped out of the playlist, waits for new segments
 * if the current sequence number is past the end of the list, opens the
 * current segment and reads from it. When a segment is closed, the
 * context is flagged with end_of_segment and the variant's sequence
 * number is copied to c->cur_seq_no. Several conditions and return
 * statements are not part of this excerpt. */
412 static int read_data(void *opaque, uint8_t *buf, int buf_size)
414 struct variant *v = opaque;
415 HLSContext *c = v->parent->priv_data;
420 /* If this is a live stream and the reload interval has elapsed since
421 * the last playlist reload, reload the variant playlists now. */
/* Starts out as the duration of the last listed segment when there is
 * one; the fallback operand is not part of this excerpt. */
422 int64_t reload_interval = v->n_segments > 0 ?
423 v->segments[v->n_segments - 1]->duration :
428 av_gettime() - v->last_load_time >= reload_interval) {
429 if ((ret = parse_playlist(c, v->url, v, NULL)) < 0)
431 /* If we need to reload the playlist again below (if
432 * there's still no more segments), switch to a reload
433 * interval of half the target duration. */
434 reload_interval = v->target_duration / 2;
/* The wanted segment is no longer listed: jump to the oldest one. */
436 if (v->cur_seq_no < v->start_seq_no) {
437 av_log(NULL, AV_LOG_WARNING,
438 "skipping %d segments ahead, expired from playlists\n",
439 v->start_seq_no - v->cur_seq_no);
440 v->cur_seq_no = v->start_seq_no;
/* Sequence number is past the last listed segment. */
442 if (v->cur_seq_no >= v->start_seq_no + v->n_segments) {
/* Wait out the reload interval, polling the interrupt callback. */
445 while (av_gettime() - v->last_load_time < reload_interval) {
446 if (ff_check_interrupt(c->interrupt_callback))
450 /* Enough time has elapsed since the last reload */
454 ret = open_input(c, v);
458 ret = ffurl_read(v->input, buf, buf_size);
461 ffurl_close(v->input);
465 c->end_of_segment = 1;
466 c->cur_seq_no = v->cur_seq_no;
/* Look at this variant's slice of the parent's streams, but only if the
 * parent already has all of them, to see whether any is still wanted. */
468 if (v->ctx && v->ctx->nb_streams &&
469 v->parent->nb_streams >= v->stream_offset + v->ctx->nb_streams) {
471 for (i = v->stream_offset; i < v->stream_offset + v->ctx->nb_streams;
473 if (v->parent->streams[i]->discard < AVDISCARD_ALL)
478 av_log(v->parent, AV_LOG_INFO, "No longer receiving variant %d\n",
/* read_header callback of the demuxer.
 *
 * Steps visible in this excerpt:
 *  1. copy user-agent / cookies / headers from the underlying URLContext
 *     so that later requests can reuse them;
 *  2. parse the playlist in s->filename, then each variant playlist if
 *     the first one only listed variants;
 *  3. for finished (non-live) playlists, sum the segment durations of
 *     the first variant into s->duration;
 *  4. per variant: probe and open a nested demuxer that reads through
 *     read_data, create a program and mirror the nested streams into s.
 * Also calls free_variant_list(c) near its end; the control flow that
 * leads there is not part of this excerpt. */
485 static int hls_read_header(AVFormatContext *s)
/* With custom I/O there is no URLContext to query for options. */
487 URLContext *u = (s->flags & AVFMT_FLAG_CUSTOM_IO) ? NULL : s->pb->opaque;
488 HLSContext *c = s->priv_data;
489 int ret = 0, i, j, stream_offset = 0;
491 c->interrupt_callback = &s->interrupt_callback;
493 // if the URL context is good, read important options we must broker later
494 if (u && u->prot->priv_data_class) {
495 // get the previous user agent & set back to null if string size is zero
496 av_freep(&c->user_agent);
497 av_opt_get(u->priv_data, "user-agent", 0, (uint8_t**)&(c->user_agent));
498 if (c->user_agent && !strlen(c->user_agent))
499 av_freep(&c->user_agent);
501 // get the previous cookies & set back to null if string size is zero
502 av_freep(&c->cookies);
503 av_opt_get(u->priv_data, "cookies", 0, (uint8_t**)&(c->cookies));
504 if (c->cookies && !strlen(c->cookies))
505 av_freep(&c->cookies);
507 // get the previous headers & set back to null if string size is zero
508 av_freep(&c->headers);
509 av_opt_get(u->priv_data, "headers", 0, (uint8_t**)&(c->headers));
510 if (c->headers && !strlen(c->headers))
511 av_freep(&c->headers);
/* First parse reuses the already opened s->pb and passes no variant. */
514 if ((ret = parse_playlist(c, s->filename, NULL, s->pb)) < 0)
517 if (c->n_variants == 0) {
518 av_log(NULL, AV_LOG_WARNING, "Empty playlist\n");
522 /* If the playlist only contained variants, parse each individual
523 * variant playlist. */
524 if (c->n_variants > 1 || c->variants[0]->n_segments == 0) {
525 for (i = 0; i < c->n_variants; i++) {
526 struct variant *v = c->variants[i];
527 if ((ret = parse_playlist(c, v->url, v, NULL)) < 0)
532 if (c->variants[0]->n_segments == 0) {
533 av_log(NULL, AV_LOG_WARNING, "Empty playlist\n");
538 /* If this isn't a live stream, calculate the total duration of the
540 if (c->variants[0]->finished) {
541 int64_t duration = 0;
542 for (i = 0; i < c->variants[0]->n_segments; i++)
543 duration += c->variants[0]->segments[i]->duration;
544 s->duration = duration;
547 /* Open the demuxer for each variant */
548 for (i = 0; i < c->n_variants; i++) {
549 struct variant *v = c->variants[i];
550 AVInputFormat *in_fmt = NULL;
551 char bitrate_str[20];
554 if (v->n_segments == 0)
557 if (!(v->ctx = avformat_alloc_context())) {
558 ret = AVERROR(ENOMEM);
566 /* If this is a live stream with more than 3 segments, start at the
567 * third last segment. */
568 v->cur_seq_no = v->start_seq_no;
569 if (!v->finished && v->n_segments > 3)
570 v->cur_seq_no = v->start_seq_no + v->n_segments - 3;
/* The nested demuxer pulls its data through read_data, with the variant
 * itself as the opaque pointer.
 * NOTE(review): no check of the av_malloc result is visible in this
 * excerpt - confirm. */
572 v->read_buffer = av_malloc(INITIAL_BUFFER_SIZE);
573 ffio_init_context(&v->pb, v->read_buffer, INITIAL_BUFFER_SIZE, 0, v,
574 read_data, NULL, NULL);
576 ret = av_probe_input_buffer(&v->pb, &in_fmt, v->segments[0]->url,
579 /* Free the ctx - it isn't initialized properly at this point,
580 * so avformat_close_input shouldn't be called. If
581 * avformat_open_input fails below, it frees and zeros the
582 * context, so it doesn't need any special treatment like this. */
583 av_log(s, AV_LOG_ERROR, "Error when loading first segment '%s'\n", v->segments[0]->url);
584 avformat_free_context(v->ctx);
/* Index in s->streams at which this variant's streams start. */
589 v->stream_offset = stream_offset;
590 ret = avformat_open_input(&v->ctx, v->segments[0]->url, in_fmt, NULL);
594 v->ctx->ctx_flags &= ~AVFMTCTX_NOHEADER;
595 ret = avformat_find_stream_info(v->ctx, NULL);
598 snprintf(bitrate_str, sizeof(bitrate_str), "%d", v->bandwidth);
/* One program per variant, using the variant index as program id. */
600 program = av_new_program(s, i);
603 av_dict_set(&program->metadata, "variant_bitrate", bitrate_str, 0);
605 /* Create new AVStreams for each stream in this variant */
606 for (j = 0; j < v->ctx->nb_streams; j++) {
607 AVStream *st = avformat_new_stream(s, NULL);
608 AVStream *ist = v->ctx->streams[j];
610 ret = AVERROR(ENOMEM);
613 ff_program_add_stream_index(s, i, stream_offset + j);
615 avpriv_set_pts_info(st, ist->pts_wrap_bits, ist->time_base.num, ist->time_base.den);
616 avcodec_copy_context(st->codec, v->ctx->streams[j]->codec);
618 av_dict_set(&st->metadata, "variant_bitrate", bitrate_str,
621 stream_offset += v->ctx->nb_streams;
/* No timestamp seen yet and no seek pending. */
625 c->first_timestamp = AV_NOPTS_VALUE;
626 c->seek_timestamp = AV_NOPTS_VALUE;
630 free_variant_list(c);
/* Recompute which variants are needed from the discard flags of the
 * streams in s, and start or stop variants whose status changed.
 *
 * first - non-zero for the initial check; stopping a variant that is no
 *         longer needed is only done in that case (see the else-if).
 *
 * hls_read_packet tests the return value for non-zero; the return
 * statements themselves are not part of this excerpt. */
634 static int recheck_discard_flags(AVFormatContext *s, int first)
636 HLSContext *c = s->priv_data;
639 /* Check if any new streams are needed */
640 for (i = 0; i < c->n_variants; i++)
641 c->variants[i]->cur_needed = 0;
643 for (i = 0; i < s->nb_streams; i++) {
644 AVStream *st = s->streams[i];
/* The stream id is used as index of the owning variant; where the id is
 * assigned is not part of this excerpt. */
645 struct variant *var = c->variants[s->streams[i]->id];
646 if (st->discard < AVDISCARD_ALL)
649 for (i = 0; i < c->n_variants; i++) {
650 struct variant *v = c->variants[i];
/* Newly needed variant: resume at the segment last recorded in the
 * context and clear the EOF flag of its AVIOContext. */
651 if (v->cur_needed && !v->needed) {
654 v->cur_seq_no = c->cur_seq_no;
655 v->pb.eof_reached = 0;
656 av_log(s, AV_LOG_INFO, "Now receiving variant %d\n", i);
657 } else if (first && !v->cur_needed && v->needed) {
659 ffurl_close(v->input);
663 av_log(s, AV_LOG_INFO, "No longer receiving variant %d\n", i);
/* read_packet callback of the demuxer.
 *
 * Keeps one buffered packet per needed variant, drops packets that lie
 * before a pending seek target, then picks the variant that is on the
 * lowest segment number or, on a tie, has the lowest dts, and hands its
 * packet to the caller with stream_index shifted by the variant's
 * stream_offset. When a segment ended, the discard flags are re-checked.
 * Loop constructs and return statements are partly missing from this
 * excerpt. */
669 static int hls_read_packet(AVFormatContext *s, AVPacket *pkt)
671 HLSContext *c = s->priv_data;
672 int ret, i, minvariant = -1;
674 if (c->first_packet) {
675 recheck_discard_flags(s, 1);
680 c->end_of_segment = 0;
681 for (i = 0; i < c->n_variants; i++) {
682 struct variant *var = c->variants[i];
683 /* Make sure we've got one buffered packet from each open variant
/* A NULL pkt.data marks the variant's packet slot as empty. */
685 if (var->needed && !var->pkt.data) {
689 ret = av_read_frame(var->ctx, &var->pkt);
691 if (!url_feof(&var->pb) && ret != AVERROR_EOF)
693 reset_packet(&var->pkt);
/* Record the first valid dts that is seen, rescaled from the packet's
 * stream time base. */
696 if (c->first_timestamp == AV_NOPTS_VALUE &&
697 var->pkt.dts != AV_NOPTS_VALUE)
698 c->first_timestamp = av_rescale_q(var->pkt.dts,
699 var->ctx->streams[var->pkt.stream_index]->time_base,
703 if (c->seek_timestamp == AV_NOPTS_VALUE)
706 if (var->pkt.dts == AV_NOPTS_VALUE) {
707 c->seek_timestamp = AV_NOPTS_VALUE;
/* NOTE(review): the rescale below uses only time_base.den, which looks
 * like it assumes time_base.num == 1 - confirm. */
711 st = var->ctx->streams[var->pkt.stream_index];
712 ts_diff = av_rescale_rnd(var->pkt.dts, AV_TIME_BASE,
713 st->time_base.den, AV_ROUND_DOWN) -
/* The seek is complete once a packet at or after the target arrives
 * that is a keyframe, or any packet if AVSEEK_FLAG_ANY was given. */
715 if (ts_diff >= 0 && (c->seek_flags & AVSEEK_FLAG_ANY ||
716 var->pkt.flags & AV_PKT_FLAG_KEY)) {
717 c->seek_timestamp = AV_NOPTS_VALUE;
720 av_free_packet(&var->pkt);
721 reset_packet(&var->pkt);
724 /* Check if this stream still is on an earlier segment number, or
725 * has the packet with the lowest dts */
727 struct variant *minvar = minvariant < 0 ?
728 NULL : c->variants[minvariant];
729 if (minvariant < 0 || var->cur_seq_no < minvar->cur_seq_no) {
731 } else if (var->cur_seq_no == minvar->cur_seq_no) {
732 int64_t dts = var->pkt.dts;
733 int64_t mindts = minvar->pkt.dts;
734 AVStream *st = var->ctx->streams[var->pkt.stream_index];
735 AVStream *minst = minvar->ctx->streams[minvar->pkt.stream_index];
737 if (dts == AV_NOPTS_VALUE) {
739 } else if (mindts != AV_NOPTS_VALUE) {
/* Compare timestamps relative to each stream's start_time. */
740 if (st->start_time != AV_NOPTS_VALUE)
741 dts -= st->start_time;
742 if (minst->start_time != AV_NOPTS_VALUE)
743 mindts -= minst->start_time;
745 if (av_compare_ts(dts, st->time_base,
746 mindts, minst->time_base) < 0)
752 if (c->end_of_segment) {
753 if (recheck_discard_flags(s, 0))
756 /* If we got a packet, return it */
757 if (minvariant >= 0) {
/* The packet is handed over by struct copy; the variant's slot is then
 * reset instead of freed. */
758 *pkt = c->variants[minvariant]->pkt;
759 pkt->stream_index += c->variants[minvariant]->stream_offset;
760 reset_packet(&c->variants[minvariant]->pkt);
/* read_close callback of the demuxer: releases all variants through
 * free_variant_list. The return statement is not part of this excerpt. */
766 static int hls_close(AVFormatContext *s)
768 HLSContext *c = s->priv_data;
770 free_variant_list(c);
/* read_seek callback of the demuxer.
 *
 * Byte seeking and seeking in unfinished (live) playlists are rejected
 * with AVERROR(ENOSYS). Otherwise the target is stored in
 * c->seek_timestamp for hls_read_packet, every variant's input, buffered
 * packet and I/O buffer are reset, and each variant's cur_seq_no is set
 * to the segment whose time range contains the target. Return statements
 * are partly missing from this excerpt. */
774 static int hls_read_seek(AVFormatContext *s, int stream_index,
775 int64_t timestamp, int flags)
777 HLSContext *c = s->priv_data;
780 if ((flags & AVSEEK_FLAG_BYTE) || !c->variants[0]->finished)
781 return AVERROR(ENOSYS);
783 c->seek_flags = flags;
/* With a negative stream_index the timestamp is taken as is.
 * NOTE(review): both rescales below use only time_base.den, which looks
 * like it assumes time_base.num == 1 - confirm. */
784 c->seek_timestamp = stream_index < 0 ? timestamp :
785 av_rescale_rnd(timestamp, AV_TIME_BASE,
786 s->streams[stream_index]->time_base.den,
787 flags & AVSEEK_FLAG_BACKWARD ?
788 AV_ROUND_DOWN : AV_ROUND_UP);
789 timestamp = av_rescale_rnd(timestamp, AV_TIME_BASE, stream_index >= 0 ?
790 s->streams[stream_index]->time_base.den :
791 AV_TIME_BASE, flags & AVSEEK_FLAG_BACKWARD ?
792 AV_ROUND_DOWN : AV_ROUND_UP);
/* A target beyond the total duration cancels the pending seek. */
793 if (s->duration < c->seek_timestamp) {
794 c->seek_timestamp = AV_NOPTS_VALUE;
799 for (i = 0; i < c->n_variants; i++) {
801 struct variant *var = c->variants[i];
/* Segment start times are accumulated from the first timestamp seen,
 * or from 0 if none has been recorded yet. */
802 int64_t pos = c->first_timestamp == AV_NOPTS_VALUE ?
803 0 : c->first_timestamp;
805 ffurl_close(var->input);
808 av_free_packet(&var->pkt);
809 reset_packet(&var->pkt);
810 var->pb.eof_reached = 0;
811 /* Clear any buffered data */
812 var->pb.buf_end = var->pb.buf_ptr = var->pb.buffer;
813 /* Reset the pos, to let the mpegts demuxer know we've seeked. */
816 /* Locate the segment that contains the target timestamp */
817 for (j = 0; j < var->n_segments; j++) {
818 if (timestamp >= pos &&
819 timestamp < pos + var->segments[j]->duration) {
820 var->cur_seq_no = var->start_seq_no + j;
824 pos += var->segments[j]->duration;
827 c->seek_timestamp = AV_NOPTS_VALUE;
/* read_probe callback: yields AVPROBE_SCORE_MAX when the buffer starts
 * with #EXTM3U and contains one of the three tags checked below. The
 * return statements for the non-matching cases are not part of this
 * excerpt.
 * NOTE(review): strstr relies on p->buf being NUL-terminated - confirm
 * against the AVProbeData contract. */
832 static int hls_probe(AVProbeData *p)
834 /* Require #EXTM3U at the start, and either one of the ones below
835 * somewhere for a proper match. */
836 if (strncmp(p->buf, "#EXTM3U", 7))
838 if (strstr(p->buf, "#EXT-X-STREAM-INF:") ||
839 strstr(p->buf, "#EXT-X-TARGETDURATION:") ||
840 strstr(p->buf, "#EXT-X-MEDIA-SEQUENCE:"))
841 return AVPROBE_SCORE_MAX;
/* Demuxer descriptor: registers the format under the names "hls" and
 * "applehttp", sizes the private data as an HLSContext and wires up the
 * probe / header / packet / close / seek callbacks defined in this file. */
845 AVInputFormat ff_hls_demuxer = {
846 .name = "hls,applehttp",
847 .long_name = NULL_IF_CONFIG_SMALL("Apple HTTP Live Streaming"),
848 .priv_data_size = sizeof(HLSContext),
849 .read_probe = hls_probe,
850 .read_header = hls_read_header,
851 .read_packet = hls_read_packet,
852 .read_close = hls_close,
853 .read_seek = hls_read_seek,