You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

428 lines
12 KiB

/*
* USM demuxer
* Copyright (c) 2023 Paul B Mahol
*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#include "libavutil/intreadwrite.h"
#include "libavcodec/bytestream.h"
#include "avformat.h"
#include "demux.h"
#include "internal.h"
#define VIDEOI 0
#define AUDIOI 1
#define ALPHAI 2
#define SUBTTI 3
typedef struct USMChannel {
int index;
int used;
int type;
int codec_id;
int nb_channels;
int nb_frames;
AVRational rate;
int width, height;
int64_t duration;
int64_t extradata_pos;
} USMChannel;
typedef struct USMDemuxContext {
USMChannel ch[4][256];
int nb_channels[4];
uint8_t *header;
unsigned header_size;
} USMDemuxContext;
static int usm_probe(const AVProbeData *p)
{
if (AV_RL32(p->buf) != MKTAG('C','R','I','D'))
return 0;
if (AV_RN32(p->buf + 4) == 0)
return 0;
return AVPROBE_SCORE_MAX / 3;
}
static int usm_read_header(AVFormatContext *s)
{
s->ctx_flags |= AVFMTCTX_NOHEADER;
return 0;
}
static int parse_utf(AVFormatContext *s, AVIOContext *pb,
USMChannel *ch, int ch_type,
uint32_t parent_chunk_size)
{
USMDemuxContext *usm = s->priv_data;
GetByteContext gb, ugb, sgb;
uint32_t chunk_type, chunk_size, offset;
uint32_t unique_offset, string_offset;
int nb_items, unique_size, nb_dictionaries;
AVRational fps = { 0 };
int type;
chunk_type = avio_rb32(pb);
chunk_size = avio_rb32(pb);
if (chunk_type != MKBETAG('@','U','T','F'))
return AVERROR_INVALIDDATA;
if (!chunk_size || chunk_size >= parent_chunk_size)
return AVERROR_INVALIDDATA;
av_fast_malloc(&usm->header, &usm->header_size, chunk_size);
if (!usm->header)
return AVERROR(ENOMEM);
if (avio_read(pb, usm->header, chunk_size) != chunk_size)
return AVERROR_EOF;
bytestream2_init(&gb, usm->header, chunk_size);
ugb = gb;
sgb = gb;
unique_offset = bytestream2_get_be32(&gb);
string_offset = bytestream2_get_be32(&gb);
/*byte_offset =*/ bytestream2_get_be32(&gb);
/*payload_name_offset =*/ bytestream2_get_be32(&gb);
nb_items = bytestream2_get_be16(&gb);
unique_size = bytestream2_get_be16(&gb);
nb_dictionaries = bytestream2_get_be32(&gb);
if (nb_dictionaries == 0)
return AVERROR_INVALIDDATA;
bytestream2_skip(&ugb, unique_offset);
if (bytestream2_get_bytes_left(&ugb) < unique_size)
return AVERROR_INVALIDDATA;
bytestream2_init(&ugb, ugb.buffer, unique_size);
bytestream2_skip(&sgb, string_offset);
for (int i = 0; i < nb_items; i++) {
GetByteContext *xgb;
uint8_t key[256];
int64_t value;
int n = 0;
type = bytestream2_get_byte(&gb);
offset = bytestream2_get_be32(&gb);
bytestream2_seek(&sgb, string_offset + offset, SEEK_SET);
while (bytestream2_get_bytes_left(&sgb) > 0) {
key[n] = bytestream2_get_byte(&sgb);
if (!key[n])
break;
if (n >= sizeof(key) - 1)
break;
n++;
}
key[n] = '\0';
if ((type >> 5) == 1)
xgb = &gb;
else
xgb = &ugb;
switch (type & 0x1F) {
case 0x10:
case 0x11:
value = bytestream2_get_byte(xgb);
break;
case 0x12:
case 0x13:
value = bytestream2_get_be16(xgb);
break;
case 0x14:
case 0x15:
value = bytestream2_get_be32(xgb);
break;
case 0x16:
case 0x17:
value = bytestream2_get_be64(xgb);
break;
case 0x18:
value = av_int2float(bytestream2_get_be32(xgb));
break;
case 0x19:
value = av_int2double(bytestream2_get_be64(xgb));
break;
case 0x1A:
break;
}
if (ch_type == AUDIOI) {
if (!strcmp(key, "sampling_rate")) {
ch->rate.num = value;
ch->rate.den = 1;
} else if (!strcmp(key, "num_channels")) {
ch->nb_channels = value;
} else if (!strcmp(key, "total_samples")) {
ch->duration = value;
} else if (!strcmp(key, "audio_codec")) {
switch (value) {
case 2:
ch->codec_id = AV_CODEC_ID_ADPCM_ADX;
break;
case 4:
ch->codec_id = AV_CODEC_ID_HCA;
break;
default:
av_log(s, AV_LOG_ERROR, "unsupported audio: %d\n", (int)value);
break;
}
}
} else if (ch_type == VIDEOI || ch_type == ALPHAI) {
if (!strcmp(key, "width")) {
ch->width = value;
} else if (!strcmp(key, "height")) {
ch->height = value;
} else if (!strcmp(key, "total_frames")) {
ch->nb_frames = value;
} else if (!strcmp(key, "framerate_n")) {
fps.num = value;
} else if (!strcmp(key, "framerate_d")) {
fps.den = value;
} else if (!strcmp(key, "mpeg_codec")) {
switch (value) {
case 1:
ch->codec_id = AV_CODEC_ID_MPEG1VIDEO;
break;
case 5:
ch->codec_id = AV_CODEC_ID_H264;
break;
case 9:
ch->codec_id = AV_CODEC_ID_VP9;
break;
default:
av_log(s, AV_LOG_ERROR, "unsupported video: %d\n", (int)value);
break;
}
}
}
}
if (ch_type == VIDEOI && fps.num && fps.den)
ch->rate = fps;
return 0;
}
static int64_t parse_chunk(AVFormatContext *s, AVIOContext *pb,
uint32_t chunk_type, uint32_t chunk_size,
AVPacket *pkt)
{
const int is_audio = chunk_type == MKBETAG('@','S','F','A');
const int is_alpha = chunk_type == MKBETAG('@','A','L','P');
const int is_subtt = chunk_type == MKBETAG('@','S','B','T');
USMDemuxContext *usm = s->priv_data;
int padding_size, payload_type, payload_offset;
const int ch_type = is_subtt ? SUBTTI : is_audio ? AUDIOI : is_alpha ? ALPHAI : VIDEOI;
int stream_index, frame_rate;
int64_t chunk_start, ret;
ret = avio_tell(pb);
if (ret < 0)
return ret;
chunk_start = ret;
avio_skip(pb, 1);
payload_offset = avio_r8(pb);
padding_size = avio_rb16(pb);
stream_index = avio_r8(pb);
avio_skip(pb, 2);
payload_type = avio_r8(pb);
/*frame_time =*/ avio_rb32(pb);
frame_rate = avio_rb32(pb);
avio_skip(pb, 8);
ret = avio_tell(pb);
if (ret < 0)
return ret;
ret = avio_skip(pb, FFMAX(0, (ret - chunk_start) - payload_offset));
if (ret < 0)
return ret;
if (payload_type == 1) {
if (usm->ch[ch_type][stream_index].used == 0) {
USMChannel *ch = &usm->ch[ch_type][stream_index];
switch (ch_type) {
case ALPHAI:
case VIDEOI:
ch->type = AVMEDIA_TYPE_VIDEO;
break;
case AUDIOI:
ch->type = AVMEDIA_TYPE_AUDIO;
break;
case SUBTTI:
ch->type = AVMEDIA_TYPE_SUBTITLE;
break;
default:
return AVERROR_INVALIDDATA;
}
ch->used = 1;
ch->index = -1;
usm->nb_channels[ch_type]++;
ret = parse_utf(s, pb, ch, ch_type, chunk_size);
if (ret < 0)
return ret;
}
} else if (payload_type == 0) {
if (usm->ch[ch_type][stream_index].used == 1) {
USMChannel *ch = &usm->ch[ch_type][stream_index];
int get_extradata = 0;
uint32_t pkt_size;
AVStream *st;
if (ch->index < 0) {
AVCodecParameters *par;
st = avformat_new_stream(s, NULL);
if (!st)
return AVERROR(ENOMEM);
par = st->codecpar;
par->codec_type = ch->type;
par->codec_id = ch->codec_id;
st->start_time = 0;
switch (ch->type) {
case AVMEDIA_TYPE_VIDEO:
par->width = ch->width;
par->height = ch->height;
st->nb_frames = ch->nb_frames;
break;
case AVMEDIA_TYPE_AUDIO:
par->sample_rate = ch->rate.num;
par->ch_layout.nb_channels = ch->nb_channels;
st->duration = ch->duration;
break;
}
ch->index = st->index;
if (!ch->rate.num || !ch->rate.den)
ch->rate = av_make_q(frame_rate, 100);
avpriv_set_pts_info(st, 64, ch->rate.den, ch->rate.num);
ffstream(st)->need_parsing = AVSTREAM_PARSE_TIMESTAMPS;
get_extradata = ch->codec_id == AV_CODEC_ID_ADPCM_ADX;
ch->extradata_pos = avio_tell(pb);
}
ret = avio_tell(pb);
if (ret < 0)
return ret;
pkt_size = chunk_size - (ret - chunk_start) - padding_size;
if (get_extradata) {
if ((ret = ff_get_extradata(s, st->codecpar, pb, pkt_size)) < 0)
return ret;
} else {
if (ret == ch->extradata_pos && ch->codec_id == AV_CODEC_ID_ADPCM_ADX) {
avio_skip(pb, pkt_size);
ret = 0;
} else {
ret = av_get_packet(pb, pkt, pkt_size);
if (ret < 0)
return ret;
pkt->stream_index = ch->index;
}
}
avio_skip(pb, padding_size);
if (ret != pkt_size)
return AVERROR_EOF;
if (get_extradata == 0)
return ret;
}
}
ret = avio_tell(pb);
if (ret < 0)
return ret;
ret = avio_skip(pb, FFMAX(0, chunk_size - (ret - chunk_start)));
if (ret < 0)
return ret;
return FFERROR_REDO;
}
static int usm_read_packet(AVFormatContext *s, AVPacket *pkt)
{
AVIOContext *pb = s->pb;
int64_t ret = AVERROR_EOF;
while (!avio_feof(pb)) {
uint32_t chunk_type, chunk_size;
int got_packet = 0;
int64_t pos;
pos = avio_tell(pb);
if (pos < 0)
return pos;
chunk_type = avio_rb32(pb);
chunk_size = avio_rb32(pb);
if (!chunk_size)
return AVERROR_INVALIDDATA;
switch (chunk_type) {
case MKBETAG('C','R','I','D'):
default:
ret = avio_skip(pb, chunk_size);
break;
case MKBETAG('@','A','L','P'):
case MKBETAG('@','S','B','T'):
case MKBETAG('@','S','F','A'):
case MKBETAG('@','S','F','V'):
ret = parse_chunk(s, pb, chunk_type, chunk_size, pkt);
got_packet = ret > 0;
break;
}
if (got_packet)
pkt->pos = pos;
if (got_packet || ret < 0)
break;
}
return ret;
}
static int usm_read_close(AVFormatContext *s)
{
USMDemuxContext *usm = s->priv_data;
av_freep(&usm->header);
usm->header_size = 0;
return 0;
}
const AVInputFormat ff_usm_demuxer = {
.name = "usm",
.long_name = NULL_IF_CONFIG_SMALL("CRI USM"),
.priv_data_size = sizeof(USMDemuxContext),
.read_probe = usm_probe,
.read_header = usm_read_header,
.read_packet = usm_read_packet,
.read_close = usm_read_close,
.extensions = "usm",
.flags = AVFMT_GENERIC_INDEX | AVFMT_NO_BYTE_SEEK | AVFMT_NOBINSEARCH,
};