mirror of https://github.com/FFmpeg/FFmpeg.git
Based off the srt encoder. The following features are unimplemented: - fonts, colors, sizes - alignment and positioning The rest works well. For example, use ffmpeg to convert subtitles into the .vtt format: ffmpeg -i input.srt output.vtt Signed-off-by: Aman Gupta <ffmpeg@tmm1.net> Signed-off-by: Clément Bœsch <u@pkh.me>pull/72/head
parent
d94e255dd1
commit
4372fb7a57
9 changed files with 229 additions and 3 deletions
@ -0,0 +1,219 @@ |
||||
/*
|
||||
* WebVTT subtitle encoder |
||||
* Copyright (c) 2010 Aurelien Jacobs <aurel@gnuage.org> |
||||
* Copyright (c) 2014 Aman Gupta <ffmpeg@tmm1.net> |
||||
* |
||||
* This file is part of FFmpeg. |
||||
* |
||||
* FFmpeg is free software; you can redistribute it and/or |
||||
* modify it under the terms of the GNU Lesser General Public |
||||
* License as published by the Free Software Foundation; either |
||||
* version 2.1 of the License, or (at your option) any later version. |
||||
* |
||||
* FFmpeg is distributed in the hope that it will be useful, |
||||
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
||||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
||||
* Lesser General Public License for more details. |
||||
* |
||||
* You should have received a copy of the GNU Lesser General Public |
||||
* License along with FFmpeg; if not, write to the Free Software |
||||
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
||||
*/ |
||||
|
||||
#include <stdarg.h> |
||||
#include "avcodec.h" |
||||
#include "libavutil/avstring.h" |
||||
#include "libavutil/bprint.h" |
||||
#include "ass_split.h" |
||||
#include "ass.h" |
||||
|
||||
#define WEBVTT_STACK_SIZE 64 |
||||
typedef struct { |
||||
AVCodecContext *avctx; |
||||
ASSSplitContext *ass_ctx; |
||||
AVBPrint buffer; |
||||
unsigned timestamp_end; |
||||
int count; |
||||
char stack[WEBVTT_STACK_SIZE]; |
||||
int stack_ptr; |
||||
} WebVTTContext; |
||||
|
||||
#ifdef __GNUC__ |
||||
__attribute__ ((__format__ (__printf__, 2, 3))) |
||||
#endif |
||||
static void webvtt_print(WebVTTContext *s, const char *str, ...) |
||||
{ |
||||
va_list vargs; |
||||
va_start(vargs, str); |
||||
av_vbprintf(&s->buffer, str, vargs); |
||||
va_end(vargs); |
||||
} |
||||
|
||||
static int webvtt_stack_push(WebVTTContext *s, const char c) |
||||
{ |
||||
if (s->stack_ptr >= WEBVTT_STACK_SIZE) |
||||
return AVERROR(EOVERFLOW); |
||||
s->stack[s->stack_ptr++] = c; |
||||
return 0; |
||||
} |
||||
|
||||
static char webvtt_stack_pop(WebVTTContext *s) |
||||
{ |
||||
if (s->stack_ptr <= 0) |
||||
return 0; |
||||
return s->stack[--s->stack_ptr]; |
||||
} |
||||
|
||||
static int webvtt_stack_find(WebVTTContext *s, const char c) |
||||
{ |
||||
int i; |
||||
for (i = s->stack_ptr-1; i >= 0; i--) |
||||
if (s->stack[i] == c) |
||||
break; |
||||
return i; |
||||
} |
||||
|
||||
static void webvtt_close_tag(WebVTTContext *s, char tag) |
||||
{ |
||||
webvtt_print(s, "</%c>", tag); |
||||
} |
||||
|
||||
static void webvtt_stack_push_pop(WebVTTContext *s, const char c, int close) |
||||
{ |
||||
if (close) { |
||||
int i = c ? webvtt_stack_find(s, c) : 0; |
||||
if (i < 0) |
||||
return; |
||||
while (s->stack_ptr != i) |
||||
webvtt_close_tag(s, webvtt_stack_pop(s)); |
||||
} else if (webvtt_stack_push(s, c) < 0) |
||||
av_log(s->avctx, AV_LOG_ERROR, "tag stack overflow\n"); |
||||
} |
||||
|
||||
static void webvtt_style_apply(WebVTTContext *s, const char *style) |
||||
{ |
||||
ASSStyle *st = ff_ass_style_get(s->ass_ctx, style); |
||||
if (st) { |
||||
if (st->bold != ASS_DEFAULT_BOLD) { |
||||
webvtt_print(s, "<b>"); |
||||
webvtt_stack_push(s, 'b'); |
||||
} |
||||
if (st->italic != ASS_DEFAULT_ITALIC) { |
||||
webvtt_print(s, "<i>"); |
||||
webvtt_stack_push(s, 'i'); |
||||
} |
||||
if (st->underline != ASS_DEFAULT_UNDERLINE) { |
||||
webvtt_print(s, "<u>"); |
||||
webvtt_stack_push(s, 'u'); |
||||
} |
||||
} |
||||
} |
||||
|
||||
static void webvtt_text_cb(void *priv, const char *text, int len) |
||||
{ |
||||
WebVTTContext *s = priv; |
||||
av_bprint_append_data(&s->buffer, text, len); |
||||
} |
||||
|
||||
static void webvtt_new_line_cb(void *priv, int forced) |
||||
{ |
||||
webvtt_print(priv, "\n"); |
||||
} |
||||
|
||||
static void webvtt_style_cb(void *priv, char style, int close) |
||||
{ |
||||
if (style == 's') // strikethrough unsupported
|
||||
return; |
||||
|
||||
webvtt_stack_push_pop(priv, style, close); |
||||
if (!close) |
||||
webvtt_print(priv, "<%c>", style); |
||||
} |
||||
|
||||
static void webvtt_cancel_overrides_cb(void *priv, const char *style) |
||||
{ |
||||
webvtt_stack_push_pop(priv, 0, 1); |
||||
webvtt_style_apply(priv, style); |
||||
} |
||||
|
||||
static void webvtt_end_cb(void *priv) |
||||
{ |
||||
webvtt_stack_push_pop(priv, 0, 1); |
||||
} |
||||
|
||||
static const ASSCodesCallbacks webvtt_callbacks = { |
||||
.text = webvtt_text_cb, |
||||
.new_line = webvtt_new_line_cb, |
||||
.style = webvtt_style_cb, |
||||
.color = NULL, |
||||
.font_name = NULL, |
||||
.font_size = NULL, |
||||
.alignment = NULL, |
||||
.cancel_overrides = webvtt_cancel_overrides_cb, |
||||
.move = NULL, |
||||
.end = webvtt_end_cb, |
||||
}; |
||||
|
||||
static int webvtt_encode_frame(AVCodecContext *avctx, |
||||
unsigned char *buf, int bufsize, const AVSubtitle *sub) |
||||
{ |
||||
WebVTTContext *s = avctx->priv_data; |
||||
ASSDialog *dialog; |
||||
int i, num; |
||||
|
||||
av_bprint_clear(&s->buffer); |
||||
|
||||
for (i=0; i<sub->num_rects; i++) { |
||||
if (sub->rects[i]->type != SUBTITLE_ASS) { |
||||
av_log(avctx, AV_LOG_ERROR, "Only SUBTITLE_ASS type supported.\n"); |
||||
return AVERROR(ENOSYS); |
||||
} |
||||
|
||||
dialog = ff_ass_split_dialog(s->ass_ctx, sub->rects[i]->ass, 0, &num); |
||||
for (; dialog && num--; dialog++) { |
||||
webvtt_style_apply(s, dialog->style); |
||||
ff_ass_split_override_codes(&webvtt_callbacks, s, dialog->text); |
||||
} |
||||
} |
||||
|
||||
if (!av_bprint_is_complete(&s->buffer)) |
||||
return AVERROR(ENOMEM); |
||||
if (!s->buffer.len) |
||||
return 0; |
||||
|
||||
if (s->buffer.len > bufsize) { |
||||
av_log(avctx, AV_LOG_ERROR, "Buffer too small for ASS event.\n"); |
||||
return -1; |
||||
} |
||||
memcpy(buf, s->buffer.str, s->buffer.len); |
||||
|
||||
return s->buffer.len; |
||||
} |
||||
|
||||
static int webvtt_encode_close(AVCodecContext *avctx) |
||||
{ |
||||
WebVTTContext *s = avctx->priv_data; |
||||
ff_ass_split_free(s->ass_ctx); |
||||
av_bprint_finalize(&s->buffer, NULL); |
||||
return 0; |
||||
} |
||||
|
||||
static av_cold int webvtt_encode_init(AVCodecContext *avctx) |
||||
{ |
||||
WebVTTContext *s = avctx->priv_data; |
||||
s->avctx = avctx; |
||||
s->ass_ctx = ff_ass_split(avctx->subtitle_header); |
||||
av_bprint_init(&s->buffer, 0, AV_BPRINT_SIZE_UNLIMITED); |
||||
return s->ass_ctx ? 0 : AVERROR_INVALIDDATA; |
||||
} |
||||
|
||||
AVCodec ff_webvtt_encoder = { |
||||
.name = "webvtt", |
||||
.long_name = NULL_IF_CONFIG_SMALL("WebVTT subtitle"), |
||||
.type = AVMEDIA_TYPE_SUBTITLE, |
||||
.id = AV_CODEC_ID_WEBVTT, |
||||
.priv_data_size = sizeof(WebVTTContext), |
||||
.init = webvtt_encode_init, |
||||
.encode_sub = webvtt_encode_frame, |
||||
.close = webvtt_encode_close, |
||||
}; |
@ -0,0 +1 @@ |
||||
8683216a86e147a98f29dafee33a0987 |
Loading…
Reference in new issue