1cabdff1aSopenharmony_ci/*
2cabdff1aSopenharmony_ci * Copyright (c) 2012 Clément Bœsch
3cabdff1aSopenharmony_ci *
4cabdff1aSopenharmony_ci * This file is part of FFmpeg.
5cabdff1aSopenharmony_ci *
6cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or
7cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public
8cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either
9cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version.
10cabdff1aSopenharmony_ci *
11cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful,
12cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of
13cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14cabdff1aSopenharmony_ci * Lesser General Public License for more details.
15cabdff1aSopenharmony_ci *
16cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public
17cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software
18cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19cabdff1aSopenharmony_ci */
20cabdff1aSopenharmony_ci
21cabdff1aSopenharmony_ci/**
22cabdff1aSopenharmony_ci * @file
23cabdff1aSopenharmony_ci * WebVTT subtitle decoder
24cabdff1aSopenharmony_ci * @see http://dev.w3.org/html5/webvtt/
25cabdff1aSopenharmony_ci * @todo need to support extended markups and cue settings
26cabdff1aSopenharmony_ci */
27cabdff1aSopenharmony_ci
28cabdff1aSopenharmony_ci#include "avcodec.h"
29cabdff1aSopenharmony_ci#include "ass.h"
30cabdff1aSopenharmony_ci#include "codec_internal.h"
31cabdff1aSopenharmony_ci#include "libavutil/bprint.h"
32cabdff1aSopenharmony_ci
33cabdff1aSopenharmony_cistatic const struct {
34cabdff1aSopenharmony_ci    const char *from;
35cabdff1aSopenharmony_ci    const char *to;
36cabdff1aSopenharmony_ci} webvtt_tag_replace[] = {
37cabdff1aSopenharmony_ci    {"<i>", "{\\i1}"}, {"</i>", "{\\i0}"},
38cabdff1aSopenharmony_ci    {"<b>", "{\\b1}"}, {"</b>", "{\\b0}"},
39cabdff1aSopenharmony_ci    {"<u>", "{\\u1}"}, {"</u>", "{\\u0}"},
40cabdff1aSopenharmony_ci    {"{", "\\{"}, {"}", "\\}"}, // escape to avoid ASS markup conflicts
41cabdff1aSopenharmony_ci    {"&gt;", ">"}, {"&lt;", "<"},
42cabdff1aSopenharmony_ci    {"&lrm;", ""}, {"&rlm;", ""}, // FIXME: properly honor bidi marks
43cabdff1aSopenharmony_ci    {"&amp;", "&"}, {"&nbsp;", "\\h"},
44cabdff1aSopenharmony_ci};
45cabdff1aSopenharmony_ci
46cabdff1aSopenharmony_cistatic int webvtt_event_to_ass(AVBPrint *buf, const char *p)
47cabdff1aSopenharmony_ci{
48cabdff1aSopenharmony_ci    int i, again = 0, skip = 0;
49cabdff1aSopenharmony_ci
50cabdff1aSopenharmony_ci    while (*p) {
51cabdff1aSopenharmony_ci
52cabdff1aSopenharmony_ci        for (i = 0; i < FF_ARRAY_ELEMS(webvtt_tag_replace); i++) {
53cabdff1aSopenharmony_ci            const char *from = webvtt_tag_replace[i].from;
54cabdff1aSopenharmony_ci            const size_t len = strlen(from);
55cabdff1aSopenharmony_ci            if (!strncmp(p, from, len)) {
56cabdff1aSopenharmony_ci                av_bprintf(buf, "%s", webvtt_tag_replace[i].to);
57cabdff1aSopenharmony_ci                p += len;
58cabdff1aSopenharmony_ci                again = 1;
59cabdff1aSopenharmony_ci                break;
60cabdff1aSopenharmony_ci            }
61cabdff1aSopenharmony_ci        }
62cabdff1aSopenharmony_ci        if (!*p)
63cabdff1aSopenharmony_ci            break;
64cabdff1aSopenharmony_ci
65cabdff1aSopenharmony_ci        if (again) {
66cabdff1aSopenharmony_ci            again = 0;
67cabdff1aSopenharmony_ci            skip = 0;
68cabdff1aSopenharmony_ci            continue;
69cabdff1aSopenharmony_ci        }
70cabdff1aSopenharmony_ci        if (*p == '<')
71cabdff1aSopenharmony_ci            skip = 1;
72cabdff1aSopenharmony_ci        else if (*p == '>')
73cabdff1aSopenharmony_ci            skip = 0;
74cabdff1aSopenharmony_ci        else if (p[0] == '\n' && p[1])
75cabdff1aSopenharmony_ci            av_bprintf(buf, "\\N");
76cabdff1aSopenharmony_ci        else if (!skip && *p != '\r')
77cabdff1aSopenharmony_ci            av_bprint_chars(buf, *p, 1);
78cabdff1aSopenharmony_ci        p++;
79cabdff1aSopenharmony_ci    }
80cabdff1aSopenharmony_ci    return 0;
81cabdff1aSopenharmony_ci}
82cabdff1aSopenharmony_ci
83cabdff1aSopenharmony_cistatic int webvtt_decode_frame(AVCodecContext *avctx, AVSubtitle *sub,
84cabdff1aSopenharmony_ci                               int *got_sub_ptr, const AVPacket *avpkt)
85cabdff1aSopenharmony_ci{
86cabdff1aSopenharmony_ci    int ret = 0;
87cabdff1aSopenharmony_ci    const char *ptr = avpkt->data;
88cabdff1aSopenharmony_ci    FFASSDecoderContext *s = avctx->priv_data;
89cabdff1aSopenharmony_ci    AVBPrint buf;
90cabdff1aSopenharmony_ci
91cabdff1aSopenharmony_ci    av_bprint_init(&buf, 0, AV_BPRINT_SIZE_UNLIMITED);
92cabdff1aSopenharmony_ci    if (ptr && avpkt->size > 0 && !webvtt_event_to_ass(&buf, ptr))
93cabdff1aSopenharmony_ci        ret = ff_ass_add_rect(sub, buf.str, s->readorder++, 0, NULL, NULL);
94cabdff1aSopenharmony_ci    av_bprint_finalize(&buf, NULL);
95cabdff1aSopenharmony_ci    if (ret < 0)
96cabdff1aSopenharmony_ci        return ret;
97cabdff1aSopenharmony_ci    *got_sub_ptr = sub->num_rects > 0;
98cabdff1aSopenharmony_ci    return avpkt->size;
99cabdff1aSopenharmony_ci}
100cabdff1aSopenharmony_ci
101cabdff1aSopenharmony_ciconst FFCodec ff_webvtt_decoder = {
102cabdff1aSopenharmony_ci    .p.name         = "webvtt",
103cabdff1aSopenharmony_ci    .p.long_name    = NULL_IF_CONFIG_SMALL("WebVTT subtitle"),
104cabdff1aSopenharmony_ci    .p.type         = AVMEDIA_TYPE_SUBTITLE,
105cabdff1aSopenharmony_ci    .p.id           = AV_CODEC_ID_WEBVTT,
106cabdff1aSopenharmony_ci    FF_CODEC_DECODE_SUB_CB(webvtt_decode_frame),
107cabdff1aSopenharmony_ci    .init           = ff_ass_subtitle_header_default,
108cabdff1aSopenharmony_ci    .flush          = ff_ass_decoder_flush,
109cabdff1aSopenharmony_ci    .priv_data_size = sizeof(FFASSDecoderContext),
110cabdff1aSopenharmony_ci    .caps_internal  = FF_CODEC_CAP_INIT_THREADSAFE,
111cabdff1aSopenharmony_ci};
112