mirror of https://github.com/FFmpeg/FFmpeg.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
514 lines
16 KiB
514 lines
16 KiB
/* |
|
* DVD subtitle encoding |
|
* Copyright (c) 2005 Wolfram Gloger |
|
* |
|
* This file is part of FFmpeg. |
|
* |
|
* FFmpeg is free software; you can redistribute it and/or |
|
* modify it under the terms of the GNU Lesser General Public |
|
* License as published by the Free Software Foundation; either |
|
* version 2.1 of the License, or (at your option) any later version. |
|
* |
|
* FFmpeg is distributed in the hope that it will be useful, |
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
|
* Lesser General Public License for more details. |
|
* |
|
* You should have received a copy of the GNU Lesser General Public |
|
* License along with FFmpeg; if not, write to the Free Software |
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
|
*/ |
|
#include "avcodec.h" |
|
#include "bytestream.h" |
|
#include "codec_internal.h" |
|
#include "dvdsub.h" |
|
#include "libavutil/avassert.h" |
|
#include "libavutil/bprint.h" |
|
#include "libavutil/imgutils.h" |
|
#include "libavutil/mem.h" |
|
#include "libavutil/opt.h" |
|
|
|
typedef struct { |
|
AVClass *class; |
|
uint32_t global_palette[16]; |
|
char *palette_str; |
|
int even_rows_fix; |
|
} DVDSubtitleContext; |
|
|
|
// ncnt is the nibble counter |
|
#define PUTNIBBLE(val)\ |
|
do {\ |
|
if (ncnt++ & 1)\ |
|
*q++ = bitbuf | ((val) & 0x0f);\ |
|
else\ |
|
bitbuf = (val) << 4;\ |
|
} while(0) |
|
|
|
static void dvd_encode_rle(uint8_t **pq, |
|
const uint8_t *bitmap, int linesize, |
|
int w, int h, |
|
const int cmap[256]) |
|
{ |
|
uint8_t *q; |
|
unsigned int bitbuf = 0; |
|
int ncnt; |
|
int x, y, len, color; |
|
|
|
q = *pq; |
|
|
|
for (y = 0; y < h; ++y) { |
|
ncnt = 0; |
|
for(x = 0; x < w; x += len) { |
|
color = bitmap[x]; |
|
for (len=1; x+len < w; ++len) |
|
if (bitmap[x+len] != color) |
|
break; |
|
color = cmap[color]; |
|
av_assert0(color < 4); |
|
if (len < 0x04) { |
|
PUTNIBBLE((len << 2)|color); |
|
} else if (len < 0x10) { |
|
PUTNIBBLE(len >> 2); |
|
PUTNIBBLE((len << 2)|color); |
|
} else if (len < 0x40) { |
|
PUTNIBBLE(0); |
|
PUTNIBBLE(len >> 2); |
|
PUTNIBBLE((len << 2)|color); |
|
} else if (x+len == w) { |
|
PUTNIBBLE(0); |
|
PUTNIBBLE(0); |
|
PUTNIBBLE(0); |
|
PUTNIBBLE(color); |
|
} else { |
|
if (len > 0xff) |
|
len = 0xff; |
|
PUTNIBBLE(0); |
|
PUTNIBBLE(len >> 6); |
|
PUTNIBBLE(len >> 2); |
|
PUTNIBBLE((len << 2)|color); |
|
} |
|
} |
|
/* end of line */ |
|
if (ncnt & 1) |
|
PUTNIBBLE(0); |
|
bitmap += linesize; |
|
} |
|
|
|
*pq = q; |
|
} |
|
|
|
static int color_distance(uint32_t a, uint32_t b) |
|
{ |
|
int r = 0, d, i; |
|
int alpha_a = 8, alpha_b = 8; |
|
|
|
for (i = 24; i >= 0; i -= 8) { |
|
d = alpha_a * (int)((a >> i) & 0xFF) - |
|
alpha_b * (int)((b >> i) & 0xFF); |
|
r += d * d; |
|
alpha_a = a >> 28; |
|
alpha_b = b >> 28; |
|
} |
|
return r; |
|
} |
|
|
|
/** |
|
* Count colors used in a rectangle, quantizing alpha and grouping by |
|
* nearest global palette entry. |
|
*/ |
|
static void count_colors(AVCodecContext *avctx, unsigned hits[33], |
|
const AVSubtitleRect *r) |
|
{ |
|
DVDSubtitleContext *dvdc = avctx->priv_data; |
|
unsigned count[256] = { 0 }; |
|
uint32_t *palette = (uint32_t *)r->data[1]; |
|
uint32_t color; |
|
int x, y, i, j, match, d, best_d, av_uninit(best_j); |
|
uint8_t *p = r->data[0]; |
|
|
|
for (y = 0; y < r->h; y++) { |
|
for (x = 0; x < r->w; x++) |
|
count[*(p++)]++; |
|
p += r->linesize[0] - r->w; |
|
} |
|
for (i = 0; i < 256; i++) { |
|
if (!count[i]) /* avoid useless search */ |
|
continue; |
|
color = palette[i]; |
|
/* 0: transparent, 1-16: semi-transparent, 17-33 opaque */ |
|
match = color < 0x33000000 ? 0 : color < 0xCC000000 ? 1 : 17; |
|
if (match) { |
|
best_d = INT_MAX; |
|
for (j = 0; j < 16; j++) { |
|
d = color_distance(0xFF000000 | color, |
|
0xFF000000 | dvdc->global_palette[j]); |
|
if (d < best_d) { |
|
best_d = d; |
|
best_j = j; |
|
} |
|
} |
|
match += best_j; |
|
} |
|
hits[match] += count[i]; |
|
} |
|
} |
|
|
|
static void select_palette(AVCodecContext *avctx, int out_palette[4], |
|
int out_alpha[4], unsigned hits[33]) |
|
{ |
|
DVDSubtitleContext *dvdc = avctx->priv_data; |
|
int i, j, bright, mult; |
|
uint32_t color; |
|
int selected[4] = { 0 }; |
|
uint32_t pseudopal[33] = { 0 }; |
|
uint32_t refcolor[3] = { 0x00000000, 0xFFFFFFFF, 0xFF000000 }; |
|
|
|
/* Bonus for transparent: if the rectangle fits tightly the text, the |
|
background color can be quite rare, but it would be ugly without it */ |
|
hits[0] *= 16; |
|
/* Bonus for bright colors */ |
|
for (i = 0; i < 16; i++) { |
|
if (!(hits[1 + i] + hits[17 + i])) |
|
continue; /* skip unused colors to gain time */ |
|
color = dvdc->global_palette[i]; |
|
bright = 0; |
|
for (j = 0; j < 3; j++, color >>= 8) |
|
bright += (color & 0xFF) < 0x40 || (color & 0xFF) >= 0xC0; |
|
mult = 2 + FFMIN(bright, 2); |
|
hits[ 1 + i] *= mult; |
|
hits[17 + i] *= mult; |
|
} |
|
|
|
/* Select four most frequent colors */ |
|
for (i = 0; i < 4; i++) { |
|
for (j = 0; j < 33; j++) |
|
if (hits[j] > hits[selected[i]]) |
|
selected[i] = j; |
|
hits[selected[i]] = 0; |
|
} |
|
|
|
/* Order the colors like in most DVDs: |
|
0: background, 1: foreground, 2: outline */ |
|
for (i = 0; i < 16; i++) { |
|
pseudopal[ 1 + i] = 0x80000000 | dvdc->global_palette[i]; |
|
pseudopal[17 + i] = 0xFF000000 | dvdc->global_palette[i]; |
|
} |
|
for (i = 0; i < 3; i++) { |
|
int best_d = color_distance(refcolor[i], pseudopal[selected[i]]); |
|
for (j = i + 1; j < 4; j++) { |
|
int d = color_distance(refcolor[i], pseudopal[selected[j]]); |
|
if (d < best_d) { |
|
FFSWAP(int, selected[i], selected[j]); |
|
best_d = d; |
|
} |
|
} |
|
} |
|
|
|
/* Output */ |
|
for (i = 0; i < 4; i++) { |
|
out_palette[i] = selected[i] ? (selected[i] - 1) & 0xF : 0; |
|
out_alpha [i] = !selected[i] ? 0 : selected[i] < 17 ? 0x80 : 0xFF; |
|
} |
|
} |
|
|
|
static void build_color_map(AVCodecContext *avctx, int cmap[], |
|
const uint32_t palette[], |
|
const int out_palette[], unsigned int const out_alpha[]) |
|
{ |
|
DVDSubtitleContext *dvdc = avctx->priv_data; |
|
int i, j, d, best_d; |
|
uint32_t pseudopal[4]; |
|
|
|
for (i = 0; i < 4; i++) |
|
pseudopal[i] = (out_alpha[i] << 24) | |
|
dvdc->global_palette[out_palette[i]]; |
|
for (i = 0; i < 256; i++) { |
|
best_d = INT_MAX; |
|
for (j = 0; j < 4; j++) { |
|
d = color_distance(pseudopal[j], palette[i]); |
|
if (d < best_d) { |
|
cmap[i] = j; |
|
best_d = d; |
|
} |
|
} |
|
} |
|
} |
|
|
|
static void copy_rectangle(AVSubtitleRect *dst, AVSubtitleRect *src, int cmap[]) |
|
{ |
|
int x, y; |
|
uint8_t *p, *q; |
|
|
|
p = src->data[0]; |
|
q = dst->data[0] + (src->x - dst->x) + |
|
(src->y - dst->y) * dst->linesize[0]; |
|
for (y = 0; y < src->h; y++) { |
|
for (x = 0; x < src->w; x++) |
|
*(q++) = cmap[*(p++)]; |
|
p += src->linesize[0] - src->w; |
|
q += dst->linesize[0] - src->w; |
|
} |
|
} |
|
|
|
static int encode_dvd_subtitles(AVCodecContext *avctx, |
|
uint8_t *outbuf, int outbuf_size, |
|
const AVSubtitle *h) |
|
{ |
|
DVDSubtitleContext *dvdc = avctx->priv_data; |
|
uint8_t *q, *qq; |
|
int offset1, offset2; |
|
int i, rects = h->num_rects, ret; |
|
unsigned global_palette_hits[33] = { 0 }; |
|
int cmap[256]; |
|
int out_palette[4]; |
|
int out_alpha[4]; |
|
AVSubtitleRect vrect; |
|
uint8_t *vrect_data = NULL; |
|
int x2, y2; |
|
int forced = 0; |
|
|
|
if (rects == 0 || !h->rects) |
|
return AVERROR(EINVAL); |
|
for (i = 0; i < rects; i++) |
|
if (h->rects[i]->type != SUBTITLE_BITMAP) { |
|
av_log(avctx, AV_LOG_ERROR, "Bitmap subtitle required\n"); |
|
return AVERROR(EINVAL); |
|
} |
|
/* Mark this subtitle forced if any of the rectangles is forced. */ |
|
for (i = 0; i < rects; i++) |
|
if ((h->rects[i]->flags & AV_SUBTITLE_FLAG_FORCED) != 0) { |
|
forced = 1; |
|
break; |
|
} |
|
|
|
vrect = *h->rects[0]; |
|
|
|
if (rects > 1) { |
|
/* DVD subtitles can have only one rectangle: build a virtual |
|
rectangle containing all actual rectangles. |
|
The data of the rectangles will be copied later, when the palette |
|
is decided, because the rectangles may have different palettes. */ |
|
int xmin = h->rects[0]->x, xmax = xmin + h->rects[0]->w; |
|
int ymin = h->rects[0]->y, ymax = ymin + h->rects[0]->h; |
|
for (i = 1; i < rects; i++) { |
|
xmin = FFMIN(xmin, h->rects[i]->x); |
|
ymin = FFMIN(ymin, h->rects[i]->y); |
|
xmax = FFMAX(xmax, h->rects[i]->x + h->rects[i]->w); |
|
ymax = FFMAX(ymax, h->rects[i]->y + h->rects[i]->h); |
|
} |
|
vrect.x = xmin; |
|
vrect.y = ymin; |
|
vrect.w = xmax - xmin; |
|
vrect.h = ymax - ymin; |
|
if ((ret = av_image_check_size(vrect.w, vrect.h, 0, avctx)) < 0) |
|
return ret; |
|
|
|
/* Count pixels outside the virtual rectangle as transparent */ |
|
global_palette_hits[0] = vrect.w * vrect.h; |
|
for (i = 0; i < rects; i++) |
|
global_palette_hits[0] -= h->rects[i]->w * h->rects[i]->h; |
|
} |
|
|
|
for (i = 0; i < rects; i++) |
|
count_colors(avctx, global_palette_hits, h->rects[i]); |
|
select_palette(avctx, out_palette, out_alpha, global_palette_hits); |
|
|
|
if (rects > 1) { |
|
if (!(vrect_data = av_calloc(vrect.w, vrect.h))) |
|
return AVERROR(ENOMEM); |
|
vrect.data [0] = vrect_data; |
|
vrect.linesize[0] = vrect.w; |
|
for (i = 0; i < rects; i++) { |
|
build_color_map(avctx, cmap, (uint32_t *)h->rects[i]->data[1], |
|
out_palette, out_alpha); |
|
copy_rectangle(&vrect, h->rects[i], cmap); |
|
} |
|
for (i = 0; i < 4; i++) |
|
cmap[i] = i; |
|
} else { |
|
build_color_map(avctx, cmap, (uint32_t *)h->rects[0]->data[1], |
|
out_palette, out_alpha); |
|
} |
|
|
|
av_log(avctx, AV_LOG_DEBUG, "Selected palette:"); |
|
for (i = 0; i < 4; i++) |
|
av_log(avctx, AV_LOG_DEBUG, " 0x%06"PRIx32"@@%02x (0x%x,0x%x)", |
|
dvdc->global_palette[out_palette[i]], out_alpha[i], |
|
out_palette[i], out_alpha[i] >> 4); |
|
av_log(avctx, AV_LOG_DEBUG, "\n"); |
|
|
|
// encode data block |
|
q = outbuf + 4; |
|
offset1 = q - outbuf; |
|
// worst case memory requirement: 1 nibble per pixel.. |
|
if ((q - outbuf) + vrect.w * vrect.h / 2 + 17 + 21 > outbuf_size) { |
|
av_log(NULL, AV_LOG_ERROR, "dvd_subtitle too big\n"); |
|
ret = AVERROR_BUFFER_TOO_SMALL; |
|
goto fail; |
|
} |
|
dvd_encode_rle(&q, vrect.data[0], vrect.w * 2, |
|
vrect.w, (vrect.h + 1) >> 1, cmap); |
|
offset2 = q - outbuf; |
|
dvd_encode_rle(&q, vrect.data[0] + vrect.w, vrect.w * 2, |
|
vrect.w, vrect.h >> 1, cmap); |
|
|
|
if (dvdc->even_rows_fix && (vrect.h & 1)) { |
|
// Work-around for some players that want the height to be even. |
|
vrect.h++; |
|
*q++ = 0x00; // 0x00 0x00 == empty row, i.e. fully transparent |
|
*q++ = 0x00; |
|
} |
|
|
|
// set data packet size |
|
qq = outbuf + 2; |
|
bytestream_put_be16(&qq, q - outbuf); |
|
|
|
// send start display command |
|
bytestream_put_be16(&q, (h->start_display_time*90) >> 10); |
|
bytestream_put_be16(&q, (q - outbuf) /*- 2 */ + 8 + 12 + 2); |
|
*q++ = 0x03; // palette - 4 nibbles |
|
*q++ = (out_palette[3] << 4) | out_palette[2]; |
|
*q++ = (out_palette[1] << 4) | out_palette[0]; |
|
*q++ = 0x04; // alpha - 4 nibbles |
|
*q++ = (out_alpha[3] & 0xF0) | (out_alpha[2] >> 4); |
|
*q++ = (out_alpha[1] & 0xF0) | (out_alpha[0] >> 4); |
|
|
|
// 12 bytes per rect |
|
x2 = vrect.x + vrect.w - 1; |
|
y2 = vrect.y + vrect.h - 1; |
|
|
|
if ((avctx->width > 0 && x2 > avctx->width) || |
|
(avctx->height > 0 && y2 > avctx->height)) { |
|
av_log(avctx, AV_LOG_ERROR, "canvas_size(%d:%d) is too small(%d:%d) for render\n", |
|
avctx->width, avctx->height, x2, y2); |
|
ret = AVERROR(EINVAL); |
|
goto fail; |
|
} |
|
*q++ = 0x05; |
|
// x1 x2 -> 6 nibbles |
|
*q++ = vrect.x >> 4; |
|
*q++ = (vrect.x << 4) | ((x2 >> 8) & 0xf); |
|
*q++ = x2; |
|
// y1 y2 -> 6 nibbles |
|
*q++ = vrect.y >> 4; |
|
*q++ = (vrect.y << 4) | ((y2 >> 8) & 0xf); |
|
*q++ = y2; |
|
|
|
*q++ = 0x06; |
|
// offset1, offset2 |
|
bytestream_put_be16(&q, offset1); |
|
bytestream_put_be16(&q, offset2); |
|
|
|
*q++ = forced ? 0x00 : 0x01; // start command |
|
*q++ = 0xff; // terminating command |
|
|
|
// send stop display command last |
|
bytestream_put_be16(&q, (h->end_display_time*90) >> 10); |
|
bytestream_put_be16(&q, (q - outbuf) - 2 /*+ 4*/); |
|
*q++ = 0x02; // set end |
|
*q++ = 0xff; // terminating command |
|
|
|
qq = outbuf; |
|
bytestream_put_be16(&qq, q - outbuf); |
|
|
|
av_log(NULL, AV_LOG_DEBUG, "subtitle_packet size=%"PTRDIFF_SPECIFIER"\n", q - outbuf); |
|
ret = q - outbuf; |
|
|
|
fail: |
|
av_free(vrect_data); |
|
return ret; |
|
} |
|
|
|
static int bprint_to_extradata(AVCodecContext *avctx, struct AVBPrint *buf) |
|
{ |
|
int ret; |
|
char *str; |
|
|
|
ret = av_bprint_finalize(buf, &str); |
|
if (ret < 0) |
|
return ret; |
|
if (!av_bprint_is_complete(buf)) { |
|
av_free(str); |
|
return AVERROR(ENOMEM); |
|
} |
|
|
|
avctx->extradata = str; |
|
/* Note: the string is NUL terminated (so extradata can be read as a |
|
* string), but the ending character is not accounted in the size (in |
|
* binary formats you are likely not supposed to mux that character). When |
|
* extradata is copied, it is also padded with AV_INPUT_BUFFER_PADDING_SIZE |
|
* zeros. */ |
|
avctx->extradata_size = buf->len; |
|
return 0; |
|
} |
|
|
|
static int dvdsub_init(AVCodecContext *avctx) |
|
{ |
|
DVDSubtitleContext *dvdc = avctx->priv_data; |
|
static const uint32_t default_palette[16] = { |
|
0x000000, 0x0000FF, 0x00FF00, 0xFF0000, |
|
0xFFFF00, 0xFF00FF, 0x00FFFF, 0xFFFFFF, |
|
0x808000, 0x8080FF, 0x800080, 0x80FF80, |
|
0x008080, 0xFF8080, 0x555555, 0xAAAAAA, |
|
}; |
|
AVBPrint extradata; |
|
int i, ret; |
|
|
|
av_assert0(sizeof(dvdc->global_palette) == sizeof(default_palette)); |
|
if (dvdc->palette_str) { |
|
ff_dvdsub_parse_palette(dvdc->global_palette, dvdc->palette_str); |
|
} else { |
|
memcpy(dvdc->global_palette, default_palette, sizeof(dvdc->global_palette)); |
|
} |
|
|
|
av_bprint_init(&extradata, 0, AV_BPRINT_SIZE_AUTOMATIC); |
|
if (avctx->width && avctx->height) |
|
av_bprintf(&extradata, "size: %dx%d\n", avctx->width, avctx->height); |
|
av_bprintf(&extradata, "palette:"); |
|
for (i = 0; i < 16; i++) |
|
av_bprintf(&extradata, " %06"PRIx32"%c", |
|
dvdc->global_palette[i] & 0xFFFFFF, i < 15 ? ',' : '\n'); |
|
|
|
ret = bprint_to_extradata(avctx, &extradata); |
|
if (ret < 0) |
|
return ret; |
|
|
|
return 0; |
|
} |
|
|
|
static int dvdsub_encode(AVCodecContext *avctx, |
|
unsigned char *buf, int buf_size, |
|
const AVSubtitle *sub) |
|
{ |
|
//DVDSubtitleContext *s = avctx->priv_data; |
|
int ret; |
|
|
|
ret = encode_dvd_subtitles(avctx, buf, buf_size, sub); |
|
return ret; |
|
} |
|
|
|
#define OFFSET(x) offsetof(DVDSubtitleContext, x) |
|
#define SE AV_OPT_FLAG_SUBTITLE_PARAM | AV_OPT_FLAG_ENCODING_PARAM |
|
static const AVOption options[] = { |
|
{"palette", "set the global palette", OFFSET(palette_str), AV_OPT_TYPE_STRING, { .str = NULL }, 0, 0, SE }, |
|
{"even_rows_fix", "Make number of rows even (workaround for some players)", OFFSET(even_rows_fix), AV_OPT_TYPE_BOOL, {.i64 = 0}, 0, 1, SE}, |
|
{ NULL }, |
|
}; |
|
|
|
static const AVClass dvdsubenc_class = { |
|
.class_name = "VOBSUB subtitle encoder", |
|
.item_name = av_default_item_name, |
|
.option = options, |
|
.version = LIBAVUTIL_VERSION_INT, |
|
}; |
|
|
|
const FFCodec ff_dvdsub_encoder = { |
|
.p.name = "dvdsub", |
|
CODEC_LONG_NAME("DVD subtitles"), |
|
.p.type = AVMEDIA_TYPE_SUBTITLE, |
|
.p.id = AV_CODEC_ID_DVD_SUBTITLE, |
|
.init = dvdsub_init, |
|
FF_CODEC_ENCODE_SUB_CB(dvdsub_encode), |
|
.p.priv_class = &dvdsubenc_class, |
|
.priv_data_size = sizeof(DVDSubtitleContext), |
|
};
|
|
|