/* * TED Talks captions format decoder * Copyright (c) 2012 Nicolas George * * This file is part of FFmpeg. * * FFmpeg is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2.1 of the License, or (at your option) any later version. * * FFmpeg is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with FFmpeg; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA */ #include "libavutil/bprint.h" #include "libavutil/log.h" #include "libavutil/opt.h" #include "avformat.h" #include "demux.h" #include "internal.h" #include "subtitles.h" typedef struct { AVClass *class; int64_t start_time; FFDemuxSubtitlesQueue subs; } TEDCaptionsDemuxer; static const AVOption tedcaptions_options[] = { { "start_time", "set the start time (offset) of the subtitles, in ms", offsetof(TEDCaptionsDemuxer, start_time), AV_OPT_TYPE_INT64, { .i64 = 15000 }, INT64_MIN, INT64_MAX, AV_OPT_FLAG_SUBTITLE_PARAM | AV_OPT_FLAG_DECODING_PARAM }, { NULL }, }; static const AVClass tedcaptions_demuxer_class = { .class_name = "tedcaptions_demuxer", .option = tedcaptions_options, .version = LIBAVUTIL_VERSION_INT, }; #define BETWEEN(a, amin, amax) ((unsigned)((a) - (amin)) <= (amax) - (amin)) #define HEX_DIGIT_TEST(c) (BETWEEN(c, '0', '9') || BETWEEN((c) | 32, 'a', 'z')) #define HEX_DIGIT_VAL(c) ((c) <= '9' ? (c) - '0' : ((c) | 32) - 'a' + 10) #define ERR_CODE(c) ((c) < 0 ? (c) : AVERROR_INVALIDDATA) static void av_bprint_utf8(AVBPrint *bp, unsigned c) { int bytes, i; if (c <= 0x7F) { av_bprint_chars(bp, c, 1); return; } bytes = (av_log2(c) - 2) / 5; av_bprint_chars(bp, (c >> (bytes * 6)) | ((0xFF80 >> bytes) & 0xFF), 1); for (i = bytes - 1; i >= 0; i--) av_bprint_chars(bp, ((c >> (i * 6)) & 0x3F) | 0x80, 1); } static void next_byte(AVIOContext *pb, int *cur_byte) { uint8_t b; int ret = avio_read(pb, &b, 1); *cur_byte = ret > 0 ? b : ret == 0 ? AVERROR_EOF : ret; } static void skip_spaces(AVIOContext *pb, int *cur_byte) { while (*cur_byte == ' ' || *cur_byte == '\t' || *cur_byte == '\n' || *cur_byte == '\r') next_byte(pb, cur_byte); } static int expect_byte(AVIOContext *pb, int *cur_byte, uint8_t c) { skip_spaces(pb, cur_byte); if (*cur_byte != c) return ERR_CODE(*cur_byte); next_byte(pb, cur_byte); return 0; } static int parse_string(AVIOContext *pb, int *cur_byte, AVBPrint *bp, int full) { int ret; ret = expect_byte(pb, cur_byte, '"'); if (ret < 0) return ret; while (*cur_byte > 0 && *cur_byte != '"') { if (*cur_byte == '\\') { next_byte(pb, cur_byte); if (*cur_byte < 0) return AVERROR_INVALIDDATA; if ((*cur_byte | 32) == 'u') { unsigned chr = 0, i; for (i = 0; i < 4; i++) { next_byte(pb, cur_byte); if (!HEX_DIGIT_TEST(*cur_byte)) return ERR_CODE(*cur_byte); chr = chr * 16 + HEX_DIGIT_VAL(*cur_byte); } av_bprint_utf8(bp, chr); } else { av_bprint_chars(bp, *cur_byte, 1); } } else { av_bprint_chars(bp, *cur_byte, 1); } next_byte(pb, cur_byte); } ret = expect_byte(pb, cur_byte, '"'); if (ret < 0) return ret; if (full && !av_bprint_is_complete(bp)) return AVERROR(ENOMEM); return 0; } static int parse_label(AVIOContext *pb, int *cur_byte, AVBPrint *bp) { int ret; av_bprint_init(bp, 0, AV_BPRINT_SIZE_AUTOMATIC); ret = parse_string(pb, cur_byte, bp, 0); if (ret < 0) return ret; ret = expect_byte(pb, cur_byte, ':'); if (ret < 0) return ret; return 0; } static int parse_boolean(AVIOContext *pb, int *cur_byte, int *result) { static const char * const text[] = { "false", "true" }; const char *p; int i; skip_spaces(pb, cur_byte); for (i = 0; i < 2; i++) { p = text[i]; if (*cur_byte != *p) continue; for (; *p; p++, next_byte(pb, cur_byte)) if (*cur_byte != *p) return AVERROR_INVALIDDATA; if (BETWEEN(*cur_byte | 32, 'a', 'z')) return AVERROR_INVALIDDATA; *result = i; return 0; } return AVERROR_INVALIDDATA; } static int parse_int(AVIOContext *pb, int *cur_byte, int64_t *result) { int64_t val = 0; skip_spaces(pb, cur_byte); if ((unsigned)*cur_byte - '0' > 9) return AVERROR_INVALIDDATA; while (BETWEEN(*cur_byte, '0', '9')) { if (val > INT_MAX/10 - (*cur_byte - '0')) return AVERROR_INVALIDDATA; val = val * 10 + (*cur_byte - '0'); next_byte(pb, cur_byte); } *result = val; return 0; } static int parse_file(AVIOContext *pb, FFDemuxSubtitlesQueue *subs) { int ret, cur_byte, start_of_par; AVBPrint label, content; int64_t pos, start, duration; AVPacket *pkt; av_bprint_init(&content, 0, AV_BPRINT_SIZE_UNLIMITED); next_byte(pb, &cur_byte); ret = expect_byte(pb, &cur_byte, '{'); if (ret < 0) return AVERROR_INVALIDDATA; ret = parse_label(pb, &cur_byte, &label); if (ret < 0 || strcmp(label.str, "captions")) return AVERROR_INVALIDDATA; ret = expect_byte(pb, &cur_byte, '['); if (ret < 0) return AVERROR_INVALIDDATA; while (1) { start = duration = AV_NOPTS_VALUE; ret = expect_byte(pb, &cur_byte, '{'); if (ret < 0) goto fail; pos = avio_tell(pb) - 1; while (1) { ret = parse_label(pb, &cur_byte, &label); if (ret < 0) goto fail; if (!strcmp(label.str, "startOfParagraph")) { ret = parse_boolean(pb, &cur_byte, &start_of_par); if (ret < 0) goto fail; } else if (!strcmp(label.str, "content")) { ret = parse_string(pb, &cur_byte, &content, 1); if (ret < 0) goto fail; } else if (!strcmp(label.str, "startTime")) { ret = parse_int(pb, &cur_byte, &start); if (ret < 0) goto fail; } else if (!strcmp(label.str, "duration")) { ret = parse_int(pb, &cur_byte, &duration); if (ret < 0) goto fail; } else { ret = AVERROR_INVALIDDATA; goto fail; } skip_spaces(pb, &cur_byte); if (cur_byte != ',') break; next_byte(pb, &cur_byte); } ret = expect_byte(pb, &cur_byte, '}'); if (ret < 0) goto fail; if (!content.size || start == AV_NOPTS_VALUE || duration == AV_NOPTS_VALUE) { ret = AVERROR_INVALIDDATA; goto fail; } pkt = ff_subtitles_queue_insert_bprint(subs, &content, 0); if (!pkt) { ret = AVERROR(ENOMEM); goto fail; } pkt->pos = pos; pkt->pts = start; pkt->duration = duration; av_bprint_clear(&content); skip_spaces(pb, &cur_byte); if (cur_byte != ',') break; next_byte(pb, &cur_byte); } ret = expect_byte(pb, &cur_byte, ']'); if (ret < 0) goto fail; ret = expect_byte(pb, &cur_byte, '}'); if (ret < 0) goto fail; skip_spaces(pb, &cur_byte); if (cur_byte != AVERROR_EOF) ret = ERR_CODE(cur_byte); fail: av_bprint_finalize(&content, NULL); return ret; } static av_cold int tedcaptions_read_header(AVFormatContext *avf) { TEDCaptionsDemuxer *tc = avf->priv_data; AVStream *st = avformat_new_stream(avf, NULL); FFStream *sti; int ret, i; AVPacket *last; if (!st) return AVERROR(ENOMEM); sti = ffstream(st); ret = parse_file(avf->pb, &tc->subs); if (ret < 0) { if (ret == AVERROR_INVALIDDATA) av_log(avf, AV_LOG_ERROR, "Syntax error near offset %"PRId64".\n", avio_tell(avf->pb)); return ret; } ff_subtitles_queue_finalize(avf, &tc->subs); for (i = 0; i < tc->subs.nb_subs; i++) tc->subs.subs[i]->pts += tc->start_time; last = tc->subs.subs[tc->subs.nb_subs - 1]; st->codecpar->codec_type = AVMEDIA_TYPE_SUBTITLE; st->codecpar->codec_id = AV_CODEC_ID_TEXT; avpriv_set_pts_info(st, 64, 1, 1000); sti->probe_packets = 0; st->start_time = 0; st->duration = last->pts + last->duration; sti->cur_dts = 0; return 0; } static int tedcaptions_read_packet(AVFormatContext *avf, AVPacket *packet) { TEDCaptionsDemuxer *tc = avf->priv_data; return ff_subtitles_queue_read_packet(&tc->subs, packet); } static int tedcaptions_read_close(AVFormatContext *avf) { TEDCaptionsDemuxer *tc = avf->priv_data; ff_subtitles_queue_clean(&tc->subs); return 0; } static av_cold int tedcaptions_read_probe(const AVProbeData *p) { static const char *const tags[] = { "\"captions\"", "\"duration\"", "\"content\"", "\"startOfParagraph\"", "\"startTime\"", }; unsigned i, count = 0; const char *t; if (p->buf[strspn(p->buf, " \t\r\n")] != '{') return 0; for (i = 0; i < FF_ARRAY_ELEMS(tags); i++) { if (!(t = strstr(p->buf, tags[i]))) continue; t += strlen(tags[i]); t += strspn(t, " \t\r\n"); if (*t == ':') count++; } return count == FF_ARRAY_ELEMS(tags) ? AVPROBE_SCORE_MAX : count ? AVPROBE_SCORE_EXTENSION : 0; } static int tedcaptions_read_seek(AVFormatContext *avf, int stream_index, int64_t min_ts, int64_t ts, int64_t max_ts, int flags) { TEDCaptionsDemuxer *tc = avf->priv_data; return ff_subtitles_queue_seek(&tc->subs, avf, stream_index, min_ts, ts, max_ts, flags); } const FFInputFormat ff_tedcaptions_demuxer = { .p.name = "tedcaptions", .p.long_name = NULL_IF_CONFIG_SMALL("TED Talks captions"), .p.priv_class = &tedcaptions_demuxer_class, .priv_data_size = sizeof(TEDCaptionsDemuxer), .flags_internal = FF_INFMT_FLAG_INIT_CLEANUP, .read_header = tedcaptions_read_header, .read_packet = tedcaptions_read_packet, .read_close = tedcaptions_read_close, .read_probe = tedcaptions_read_probe, .read_seek2 = tedcaptions_read_seek, };