| Line | Branch | Exec | Source |
|---|---|---|---|
| 1 | /* | ||
| 2 | * Copyright (c) 2012 Clément Bœsch | ||
| 3 | * | ||
| 4 | * This file is part of FFmpeg. | ||
| 5 | * | ||
| 6 | * FFmpeg is free software; you can redistribute it and/or | ||
| 7 | * modify it under the terms of the GNU Lesser General Public | ||
| 8 | * License as published by the Free Software Foundation; either | ||
| 9 | * version 2.1 of the License, or (at your option) any later version. | ||
| 10 | * | ||
| 11 | * FFmpeg is distributed in the hope that it will be useful, | ||
| 12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
| 13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | ||
| 14 | * Lesser General Public License for more details. | ||
| 15 | * | ||
| 16 | * You should have received a copy of the GNU Lesser General Public | ||
| 17 | * License along with FFmpeg; if not, write to the Free Software | ||
| 18 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | ||
| 19 | */ | ||
| 20 | |||
| 21 | /** | ||
| 22 | * @file | ||
| 23 | * WebVTT subtitle decoder | ||
| 24 | * @see https://www.w3.org/TR/webvtt1/ | ||
| 25 | * @todo need to support extended markups and cue settings | ||
| 26 | */ | ||
| 27 | |||
#include "avcodec.h"
#include "ass.h"
#include "codec_internal.h"
#include "libavutil/bprint.h"
#include "libavutil/error.h"
| 32 | |||
/**
 * Literal substitutions applied to cue text outside of tags.
 *
 * Each entry maps a byte sequence found in the WebVTT input (from) to the
 * text written to the ASS output (to). Entries are tried in order and the
 * first one that prefixes the current input position wins.
 */
static const struct {
    const char *from;
    const char *to;
} webvtt_tag_replace[] = {
    /* escape to avoid ASS markup conflicts */
    {"{",      "\\{{}"},
    {"\\",     "\\\xe2\x81\xa0"},  /* backslash followed by U+2060 WORD JOINER */
    /* WebVTT character references; the names must stay spelled out */
    {"&gt;",   ">"},
    {"&lt;",   "<"},
    {"&lrm;",  "\xe2\x80\x8e"},    /* U+200E LEFT-TO-RIGHT MARK, UTF-8 encoded */
    {"&rlm;",  "\xe2\x80\x8f"},    /* U+200F RIGHT-TO-LEFT MARK, UTF-8 encoded */
    {"&amp;",  "&"},
    {"&nbsp;", "\\h"},             /* ASS escape for a non-breaking space */
};
/**
 * WebVTT tags that are translated instead of being dropped.
 *
 * from is compared against the text that follows the opening '<' of a tag;
 * to is the ASS override block written to the output when it matches.
 * Both fields are fixed 6-byte arrays, so every string here must fit in
 * 5 characters plus the terminating NUL.
 */
static const struct {
    const char from[6];
    const char to[6];
} webvtt_valid_tags[] = {
    { .from = "i",  .to = "{\\i1}" },  /* italic on     */
    { .from = "/i", .to = "{\\i0}" },  /* italic off    */
    { .from = "b",  .to = "{\\b1}" },  /* bold on       */
    { .from = "/b", .to = "{\\b0}" },  /* bold off      */
    { .from = "u",  .to = "{\\u1}" },  /* underline on  */
    { .from = "/u", .to = "{\\u0}" },  /* underline off */
};
| 50 | |||
| 51 | 27 | static int webvtt_event_to_ass(AVBPrint *buf, const char *p) | |
| 52 | { | ||
| 53 | 27 | int i, again = 0; | |
| 54 | |||
| 55 |
2/2✓ Branch 0 taken 1094 times.
✓ Branch 1 taken 27 times.
|
1121 | while (*p) { |
| 56 |
2/2✓ Branch 0 taken 49 times.
✓ Branch 1 taken 1045 times.
|
1094 | if (*p == '<') { |
| 57 | 49 | const char *tag_end = strchr(p, '>'); | |
| 58 | ptrdiff_t len; | ||
| 59 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 49 times.
|
49 | if (!tag_end) |
| 60 | ✗ | break; | |
| 61 | 49 | len = tag_end - p + 1; | |
| 62 |
2/2✓ Branch 0 taken 262 times.
✓ Branch 1 taken 41 times.
|
303 | for (i = 0; i < FF_ARRAY_ELEMS(webvtt_valid_tags); i++) { |
| 63 | 262 | const char *from = webvtt_valid_tags[i].from; | |
| 64 |
2/2✓ Branch 0 taken 8 times.
✓ Branch 1 taken 254 times.
|
262 | if(!strncmp(p + 1, from, strlen(from))) { |
| 65 | 8 | av_bprintf(buf, "%s", webvtt_valid_tags[i].to); | |
| 66 | 8 | break; | |
| 67 | } | ||
| 68 | } | ||
| 69 | 49 | p += len; | |
| 70 | 49 | again = 1; | |
| 71 | } | ||
| 72 | |||
| 73 |
2/2✓ Branch 0 taken 8729 times.
✓ Branch 1 taken 1084 times.
|
9813 | for (i = 0; i < FF_ARRAY_ELEMS(webvtt_tag_replace); i++) { |
| 74 | 8729 | const char *from = webvtt_tag_replace[i].from; | |
| 75 | 8729 | const size_t len = strlen(from); | |
| 76 |
2/2✓ Branch 0 taken 10 times.
✓ Branch 1 taken 8719 times.
|
8729 | if (!strncmp(p, from, len)) { |
| 77 | 10 | av_bprintf(buf, "%s", webvtt_tag_replace[i].to); | |
| 78 | 10 | p += len; | |
| 79 | 10 | again = 1; | |
| 80 | 10 | break; | |
| 81 | } | ||
| 82 | } | ||
| 83 | |||
| 84 |
2/2✓ Branch 0 taken 59 times.
✓ Branch 1 taken 1035 times.
|
1094 | if (again) { |
| 85 | 59 | again = 0; | |
| 86 | 59 | continue; | |
| 87 | } | ||
| 88 |
3/4✓ Branch 0 taken 9 times.
✓ Branch 1 taken 1026 times.
✓ Branch 2 taken 9 times.
✗ Branch 3 not taken.
|
1035 | if (p[0] == '\n' && p[1]) |
| 89 | 9 | av_bprintf(buf, "\\N"); | |
| 90 |
2/2✓ Branch 0 taken 1025 times.
✓ Branch 1 taken 1 times.
|
1026 | else if (*p != '\r') |
| 91 | 1025 | av_bprint_chars(buf, *p, 1); | |
| 92 | 1035 | p++; | |
| 93 | } | ||
| 94 | 27 | return 0; | |
| 95 | } | ||
| 96 | |||
| 97 | 27 | static int webvtt_decode_frame(AVCodecContext *avctx, AVSubtitle *sub, | |
| 98 | int *got_sub_ptr, const AVPacket *avpkt) | ||
| 99 | { | ||
| 100 | 27 | int ret = 0; | |
| 101 | 27 | const char *ptr = avpkt->data; | |
| 102 | 27 | FFASSDecoderContext *s = avctx->priv_data; | |
| 103 | AVBPrint buf; | ||
| 104 | |||
| 105 | 27 | av_bprint_init(&buf, 0, AV_BPRINT_SIZE_UNLIMITED); | |
| 106 |
3/6✓ Branch 0 taken 27 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 27 times.
✗ Branch 3 not taken.
✓ Branch 5 taken 27 times.
✗ Branch 6 not taken.
|
27 | if (ptr && avpkt->size > 0 && !webvtt_event_to_ass(&buf, ptr)) |
| 107 | 27 | ret = ff_ass_add_rect(sub, buf.str, s->readorder++, 0, NULL, NULL); | |
| 108 | 27 | av_bprint_finalize(&buf, NULL); | |
| 109 |
1/2✗ Branch 0 not taken.
✓ Branch 1 taken 27 times.
|
27 | if (ret < 0) |
| 110 | ✗ | return ret; | |
| 111 | 27 | *got_sub_ptr = sub->num_rects > 0; | |
| 112 | 27 | return avpkt->size; | |
| 113 | } | ||
| 114 | |||
| 115 | const FFCodec ff_webvtt_decoder = { | ||
| 116 | .p.name = "webvtt", | ||
| 117 | CODEC_LONG_NAME("WebVTT subtitle"), | ||
| 118 | .p.type = AVMEDIA_TYPE_SUBTITLE, | ||
| 119 | .p.id = AV_CODEC_ID_WEBVTT, | ||
| 120 | FF_CODEC_DECODE_SUB_CB(webvtt_decode_frame), | ||
| 121 | .init = ff_ass_subtitle_header_default, | ||
| 122 | .flush = ff_ass_decoder_flush, | ||
| 123 | .priv_data_size = sizeof(FFASSDecoderContext), | ||
| 124 | }; | ||
| 125 |