mirror of https://github.com/FFmpeg/FFmpeg.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
193 lines
5.8 KiB
193 lines
5.8 KiB
/* |
|
* Copyright (c) 2012 Clément Bœsch |
|
* |
|
* This file is part of FFmpeg. |
|
* |
|
* FFmpeg is free software; you can redistribute it and/or |
|
* modify it under the terms of the GNU Lesser General Public |
|
* License as published by the Free Software Foundation; either |
|
* version 2.1 of the License, or (at your option) any later version. |
|
* |
|
* FFmpeg is distributed in the hope that it will be useful, |
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
|
* Lesser General Public License for more details. |
|
* |
|
* You should have received a copy of the GNU Lesser General Public |
|
* License along with FFmpeg; if not, write to the Free Software |
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
|
*/ |
|
|
|
/** |
|
* @file |
|
* SAMI subtitle decoder |
|
* @see http://msdn.microsoft.com/en-us/library/ms971327.aspx |
|
*/ |
|
|
|
#include "ass.h" |
|
#include "libavutil/avstring.h" |
|
#include "libavutil/bprint.h" |
|
#include "codec_internal.h" |
|
#include "htmlsubtitles.h" |
|
|
|
typedef struct { |
|
AVBPrint source; |
|
AVBPrint content; |
|
AVBPrint encoded_source; |
|
AVBPrint encoded_content; |
|
AVBPrint full; |
|
int readorder; |
|
} SAMIContext; |
|
|
|
static int sami_paragraph_to_ass(AVCodecContext *avctx, const char *src) |
|
{ |
|
SAMIContext *sami = avctx->priv_data; |
|
int ret = 0; |
|
char *tag = NULL; |
|
char *dupsrc = av_strdup(src); |
|
char *p = dupsrc; |
|
AVBPrint *dst_content = &sami->encoded_content; |
|
AVBPrint *dst_source = &sami->encoded_source; |
|
|
|
if (!dupsrc) |
|
return AVERROR(ENOMEM); |
|
|
|
av_bprint_clear(&sami->encoded_content); |
|
av_bprint_clear(&sami->content); |
|
av_bprint_clear(&sami->encoded_source); |
|
for (;;) { |
|
char *saveptr = NULL; |
|
int prev_chr_is_space = 0; |
|
AVBPrint *dst = &sami->content; |
|
|
|
/* parse & extract paragraph tag */ |
|
p = av_stristr(p, "<P"); |
|
if (!p) |
|
break; |
|
if (p[2] != '>' && !av_isspace(p[2])) { // avoid confusion with tags such as <PRE> |
|
p++; |
|
continue; |
|
} |
|
if (dst->len) // add a separator with the previous paragraph if there was one |
|
av_bprintf(dst, "\\N"); |
|
tag = av_strtok(p, ">", &saveptr); |
|
if (!tag || !saveptr) |
|
break; |
|
p = saveptr; |
|
|
|
/* check if the current paragraph is the "source" (speaker name) */ |
|
if (av_stristr(tag, "ID=Source") || av_stristr(tag, "ID=\"Source\"")) { |
|
dst = &sami->source; |
|
av_bprint_clear(dst); |
|
} |
|
|
|
/* if empty event -> skip subtitle */ |
|
while (av_isspace(*p)) |
|
p++; |
|
if (!strncmp(p, " ", 6)) { |
|
ret = -1; |
|
goto end; |
|
} |
|
|
|
/* extract the text, stripping most of the tags */ |
|
while (*p) { |
|
if (*p == '<') { |
|
if (!av_strncasecmp(p, "<P", 2) && (p[2] == '>' || av_isspace(p[2]))) |
|
break; |
|
} |
|
if (!av_strncasecmp(p, "<BR", 3)) { |
|
av_bprintf(dst, "\\N"); |
|
p++; |
|
while (*p && *p != '>') |
|
p++; |
|
if (!*p) |
|
break; |
|
if (*p == '>') |
|
p++; |
|
continue; |
|
} |
|
if (!av_isspace(*p)) |
|
av_bprint_chars(dst, *p, 1); |
|
else if (!prev_chr_is_space) |
|
av_bprint_chars(dst, ' ', 1); |
|
prev_chr_is_space = av_isspace(*p); |
|
p++; |
|
} |
|
} |
|
|
|
av_bprint_clear(&sami->full); |
|
if (sami->source.len) { |
|
ret = ff_htmlmarkup_to_ass(avctx, dst_source, sami->source.str); |
|
if (ret < 0) |
|
goto end; |
|
av_bprintf(&sami->full, "{\\i1}%s{\\i0}\\N", sami->encoded_source.str); |
|
} |
|
ret = ff_htmlmarkup_to_ass(avctx, dst_content, sami->content.str); |
|
if (ret < 0) |
|
goto end; |
|
av_bprintf(&sami->full, "%s", sami->encoded_content.str); |
|
|
|
end: |
|
av_free(dupsrc); |
|
return ret; |
|
} |
|
|
|
static int sami_decode_frame(AVCodecContext *avctx, AVSubtitle *sub, |
|
int *got_sub_ptr, const AVPacket *avpkt) |
|
{ |
|
const char *ptr = avpkt->data; |
|
SAMIContext *sami = avctx->priv_data; |
|
|
|
if (ptr && avpkt->size > 0) { |
|
int ret = sami_paragraph_to_ass(avctx, ptr); |
|
if (ret < 0) |
|
return ret; |
|
// TODO: pass escaped sami->encoded_source.str as source |
|
ret = ff_ass_add_rect(sub, sami->full.str, sami->readorder++, 0, NULL, NULL); |
|
if (ret < 0) |
|
return ret; |
|
} |
|
*got_sub_ptr = sub->num_rects > 0; |
|
return avpkt->size; |
|
} |
|
|
|
static av_cold int sami_init(AVCodecContext *avctx) |
|
{ |
|
SAMIContext *sami = avctx->priv_data; |
|
av_bprint_init(&sami->source, 0, 2048); |
|
av_bprint_init(&sami->content, 0, 2048); |
|
av_bprint_init(&sami->encoded_source, 0, 2048); |
|
av_bprint_init(&sami->encoded_content, 0, 2048); |
|
av_bprint_init(&sami->full, 0, 2048); |
|
return ff_ass_subtitle_header_default(avctx); |
|
} |
|
|
|
static av_cold int sami_close(AVCodecContext *avctx) |
|
{ |
|
SAMIContext *sami = avctx->priv_data; |
|
av_bprint_finalize(&sami->source, NULL); |
|
av_bprint_finalize(&sami->content, NULL); |
|
av_bprint_finalize(&sami->encoded_source, NULL); |
|
av_bprint_finalize(&sami->encoded_content, NULL); |
|
av_bprint_finalize(&sami->full, NULL); |
|
return 0; |
|
} |
|
|
|
static void sami_flush(AVCodecContext *avctx) |
|
{ |
|
SAMIContext *sami = avctx->priv_data; |
|
if (!(avctx->flags2 & AV_CODEC_FLAG2_RO_FLUSH_NOOP)) |
|
sami->readorder = 0; |
|
} |
|
|
|
const FFCodec ff_sami_decoder = { |
|
.p.name = "sami", |
|
.p.long_name = NULL_IF_CONFIG_SMALL("SAMI subtitle"), |
|
.p.type = AVMEDIA_TYPE_SUBTITLE, |
|
.p.id = AV_CODEC_ID_SAMI, |
|
.priv_data_size = sizeof(SAMIContext), |
|
.init = sami_init, |
|
.close = sami_close, |
|
FF_CODEC_DECODE_SUB_CB(sami_decode_frame), |
|
.flush = sami_flush, |
|
};
|
|
|