mirror of https://github.com/FFmpeg/FFmpeg.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
445 lines
14 KiB
445 lines
14 KiB
/*
 * AIFF/AIFF-C demuxer
 * Copyright (c) 2006 Patrick Guimond
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
|
|
|
#include <limits.h>

#include "libavutil/intreadwrite.h"
#include "libavutil/dict.h"
#include "avformat.h"
#include "demux.h"
#include "internal.h"
#include "pcm.h"
#include "aiff.h"
#include "id3v2.h"
#include "mov_chan.h"
#include "replaygain.h"
|
|
|
/* Version value used for plain AIFF files (selected by the 'AIFF' form type). */
#define AIFF                    0
/* Version value assumed for AIFF-C files unless an FVER chunk overrides it. */
#define AIFF_C_VERSION1         0xA2805140
|
|
|
/* Private demuxer state shared between header parsing and packet reading. */
typedef struct AIFFInputContext {
    /* Absolute byte position of the end of the sound data chunk. */
    int64_t data_end;
    /* Duration credited to each block_align-sized block of a packet. */
    int     block_duration;
} AIFFInputContext;
|
|
|
static enum AVCodecID aiff_codec_get_id(int bps) |
|
{ |
|
if (bps <= 8) |
|
return AV_CODEC_ID_PCM_S8; |
|
if (bps <= 16) |
|
return AV_CODEC_ID_PCM_S16BE; |
|
if (bps <= 24) |
|
return AV_CODEC_ID_PCM_S24BE; |
|
if (bps <= 32) |
|
return AV_CODEC_ID_PCM_S32BE; |
|
|
|
/* bigger than 32 isn't allowed */ |
|
return AV_CODEC_ID_NONE; |
|
} |
|
|
|
/* returns the size of the found tag */ |
|
static int64_t get_tag(AVIOContext *pb, uint32_t * tag) |
|
{ |
|
int64_t size; |
|
|
|
if (avio_feof(pb)) |
|
return AVERROR(EIO); |
|
|
|
*tag = avio_rl32(pb); |
|
size = avio_rb32(pb); |
|
|
|
return size; |
|
} |
|
|
|
/* Metadata string read */ |
|
static void get_meta(AVFormatContext *s, const char *key, int64_t size) |
|
{ |
|
uint8_t *str = NULL; |
|
|
|
if (size < SIZE_MAX) |
|
str = av_malloc(size+1); |
|
|
|
if (str) { |
|
int res = avio_read(s->pb, str, size); |
|
if (res < 0){ |
|
av_free(str); |
|
return; |
|
} |
|
size -= res; |
|
str[res] = 0; |
|
av_dict_set(&s->metadata, key, str, AV_DICT_DONT_STRDUP_VAL); |
|
} |
|
|
|
avio_skip(s->pb, size); |
|
} |
|
|
|
/* Returns the number of sound data frames or negative on error */ |
|
static int get_aiff_header(AVFormatContext *s, int64_t size, |
|
unsigned version) |
|
{ |
|
AVIOContext *pb = s->pb; |
|
AVCodecParameters *par = s->streams[0]->codecpar; |
|
AIFFInputContext *aiff = s->priv_data; |
|
int exp; |
|
uint64_t val; |
|
int sample_rate; |
|
unsigned int num_frames; |
|
int channels; |
|
|
|
if (size & 1) |
|
size++; |
|
par->codec_type = AVMEDIA_TYPE_AUDIO; |
|
channels = avio_rb16(pb); |
|
par->ch_layout.nb_channels = channels; |
|
num_frames = avio_rb32(pb); |
|
par->bits_per_coded_sample = avio_rb16(pb); |
|
|
|
exp = avio_rb16(pb) - 16383 - 63; |
|
val = avio_rb64(pb); |
|
if (exp <-63 || exp >63) { |
|
av_log(s, AV_LOG_ERROR, "exp %d is out of range\n", exp); |
|
return AVERROR_INVALIDDATA; |
|
} |
|
if (exp >= 0) |
|
sample_rate = val << exp; |
|
else |
|
sample_rate = (val + (1ULL<<(-exp-1))) >> -exp; |
|
if (sample_rate <= 0) |
|
return AVERROR_INVALIDDATA; |
|
|
|
par->sample_rate = sample_rate; |
|
if (size < 18) |
|
return AVERROR_INVALIDDATA; |
|
size -= 18; |
|
|
|
/* get codec id for AIFF-C */ |
|
if (size < 4) { |
|
version = AIFF; |
|
} else if (version == AIFF_C_VERSION1) { |
|
par->codec_tag = avio_rl32(pb); |
|
par->codec_id = ff_codec_get_id(ff_codec_aiff_tags, par->codec_tag); |
|
if (par->codec_id == AV_CODEC_ID_NONE) |
|
avpriv_request_sample(s, "unknown or unsupported codec tag: %s", |
|
av_fourcc2str(par->codec_tag)); |
|
size -= 4; |
|
} |
|
|
|
if (version != AIFF_C_VERSION1 || par->codec_id == AV_CODEC_ID_PCM_S16BE) { |
|
par->codec_id = aiff_codec_get_id(par->bits_per_coded_sample); |
|
par->bits_per_coded_sample = av_get_bits_per_sample(par->codec_id); |
|
aiff->block_duration = 1; |
|
} else { |
|
switch (par->codec_id) { |
|
case AV_CODEC_ID_PCM_F32BE: |
|
case AV_CODEC_ID_PCM_F64BE: |
|
case AV_CODEC_ID_PCM_S16LE: |
|
case AV_CODEC_ID_PCM_ALAW: |
|
case AV_CODEC_ID_PCM_MULAW: |
|
aiff->block_duration = 1; |
|
break; |
|
case AV_CODEC_ID_ADPCM_IMA_QT: |
|
par->block_align = 34 * channels; |
|
break; |
|
case AV_CODEC_ID_MACE3: |
|
par->block_align = 2 * channels; |
|
break; |
|
case AV_CODEC_ID_ADPCM_G726LE: |
|
par->bits_per_coded_sample = 5; |
|
case AV_CODEC_ID_ADPCM_IMA_WS: |
|
case AV_CODEC_ID_ADPCM_G722: |
|
case AV_CODEC_ID_MACE6: |
|
case AV_CODEC_ID_CBD2_DPCM: |
|
case AV_CODEC_ID_SDX2_DPCM: |
|
par->block_align = 1 * channels; |
|
break; |
|
case AV_CODEC_ID_GSM: |
|
par->block_align = 33; |
|
break; |
|
default: |
|
aiff->block_duration = 1; |
|
break; |
|
} |
|
if (par->block_align > 0) |
|
aiff->block_duration = av_get_audio_frame_duration2(par, |
|
par->block_align); |
|
} |
|
|
|
/* Block align needs to be computed in all cases, as the definition |
|
* is specific to applications -> here we use the WAVE format definition */ |
|
if (!par->block_align) |
|
par->block_align = (av_get_bits_per_sample(par->codec_id) * channels) >> 3; |
|
|
|
if (aiff->block_duration) { |
|
par->bit_rate = av_rescale(par->sample_rate, par->block_align * 8LL, |
|
aiff->block_duration); |
|
if (par->bit_rate < 0) |
|
par->bit_rate = 0; |
|
} |
|
|
|
/* Chunk is over */ |
|
if (size) |
|
avio_skip(pb, size); |
|
|
|
return num_frames; |
|
} |
|
|
|
static int aiff_probe(const AVProbeData *p) |
|
{ |
|
/* check file header */ |
|
if (AV_RL32(p->buf) == MKTAG('F', 'O', 'R', 'M') && |
|
AV_RB32(p->buf + 4) >= 4 && |
|
p->buf[8] == 'A' && p->buf[9] == 'I' && |
|
p->buf[10] == 'F' && (p->buf[11] == 'F' || p->buf[11] == 'C')) |
|
return AVPROBE_SCORE_MAX; |
|
else |
|
return 0; |
|
} |
|
|
|
/* aiff input */ |
|
static int aiff_read_header(AVFormatContext *s) |
|
{ |
|
int ret; |
|
int64_t filesize, size; |
|
int64_t offset = 0, position; |
|
uint32_t tag; |
|
unsigned version = AIFF_C_VERSION1; |
|
AVIOContext *pb = s->pb; |
|
AVStream * st; |
|
AIFFInputContext *aiff = s->priv_data; |
|
ID3v2ExtraMeta *id3v2_extra_meta; |
|
|
|
/* check FORM header */ |
|
filesize = get_tag(pb, &tag); |
|
if (filesize < 4 || tag != MKTAG('F', 'O', 'R', 'M')) |
|
return AVERROR_INVALIDDATA; |
|
|
|
/* AIFF data type */ |
|
tag = avio_rl32(pb); |
|
if (tag == MKTAG('A', 'I', 'F', 'F')) /* Got an AIFF file */ |
|
version = AIFF; |
|
else if (tag != MKTAG('A', 'I', 'F', 'C')) /* An AIFF-C file then */ |
|
return AVERROR_INVALIDDATA; |
|
|
|
filesize -= 4; |
|
|
|
st = avformat_new_stream(s, NULL); |
|
if (!st) |
|
return AVERROR(ENOMEM); |
|
|
|
while (filesize > 0) { |
|
/* parse different chunks */ |
|
size = get_tag(pb, &tag); |
|
|
|
if (size == AVERROR_EOF && offset > 0 && st->codecpar->block_align) { |
|
av_log(s, AV_LOG_WARNING, "header parser hit EOF\n"); |
|
goto got_sound; |
|
} |
|
if (size < 0) |
|
return size; |
|
|
|
filesize -= size + 8; |
|
|
|
switch (tag) { |
|
case MKTAG('C', 'O', 'M', 'M'): /* Common chunk */ |
|
/* Then for the complete header info */ |
|
st->nb_frames = get_aiff_header(s, size, version); |
|
if (st->nb_frames < 0) |
|
return st->nb_frames; |
|
if (offset > 0) // COMM is after SSND |
|
goto got_sound; |
|
break; |
|
case MKTAG('I', 'D', '3', ' '): |
|
position = avio_tell(pb); |
|
ff_id3v2_read(s, ID3v2_DEFAULT_MAGIC, &id3v2_extra_meta, size); |
|
if (id3v2_extra_meta) |
|
if ((ret = ff_id3v2_parse_apic(s, id3v2_extra_meta)) < 0 || |
|
(ret = ff_id3v2_parse_chapters(s, id3v2_extra_meta)) < 0) { |
|
ff_id3v2_free_extra_meta(&id3v2_extra_meta); |
|
return ret; |
|
} |
|
ff_id3v2_free_extra_meta(&id3v2_extra_meta); |
|
if (position + size > avio_tell(pb)) |
|
avio_skip(pb, position + size - avio_tell(pb)); |
|
break; |
|
case MKTAG('F', 'V', 'E', 'R'): /* Version chunk */ |
|
version = avio_rb32(pb); |
|
break; |
|
case MKTAG('N', 'A', 'M', 'E'): /* Sample name chunk */ |
|
get_meta(s, "title" , size); |
|
break; |
|
case MKTAG('A', 'U', 'T', 'H'): /* Author chunk */ |
|
get_meta(s, "author" , size); |
|
break; |
|
case MKTAG('(', 'c', ')', ' '): /* Copyright chunk */ |
|
get_meta(s, "copyright", size); |
|
break; |
|
case MKTAG('A', 'N', 'N', 'O'): /* Annotation chunk */ |
|
get_meta(s, "comment" , size); |
|
break; |
|
case MKTAG('S', 'S', 'N', 'D'): /* Sampled sound chunk */ |
|
if (size < 8) |
|
return AVERROR_INVALIDDATA; |
|
aiff->data_end = avio_tell(pb) + size; |
|
offset = avio_rb32(pb); /* Offset of sound data */ |
|
avio_rb32(pb); /* BlockSize... don't care */ |
|
offset += avio_tell(pb); /* Compute absolute data offset */ |
|
if (st->codecpar->block_align && !(pb->seekable & AVIO_SEEKABLE_NORMAL)) /* Assume COMM already parsed */ |
|
goto got_sound; |
|
if (!(pb->seekable & AVIO_SEEKABLE_NORMAL)) { |
|
av_log(s, AV_LOG_ERROR, "file is not seekable\n"); |
|
return -1; |
|
} |
|
avio_skip(pb, size - 8); |
|
break; |
|
case MKTAG('w', 'a', 'v', 'e'): |
|
if ((uint64_t)size > (1<<30)) |
|
return AVERROR_INVALIDDATA; |
|
if ((ret = ff_get_extradata(s, st->codecpar, pb, size)) < 0) |
|
return ret; |
|
if ( (st->codecpar->codec_id == AV_CODEC_ID_QDMC || st->codecpar->codec_id == AV_CODEC_ID_QDM2) |
|
&& size>=12*4 && !st->codecpar->block_align) { |
|
st->codecpar->block_align = AV_RB32(st->codecpar->extradata+11*4); |
|
aiff->block_duration = AV_RB32(st->codecpar->extradata+9*4); |
|
} else if (st->codecpar->codec_id == AV_CODEC_ID_QCELP) { |
|
char rate = 0; |
|
if (size >= 25) |
|
rate = st->codecpar->extradata[24]; |
|
switch (rate) { |
|
case 'H': // RATE_HALF |
|
st->codecpar->block_align = 17; |
|
break; |
|
case 'F': // RATE_FULL |
|
default: |
|
st->codecpar->block_align = 35; |
|
} |
|
aiff->block_duration = 160; |
|
st->codecpar->bit_rate = (int64_t)st->codecpar->sample_rate * (st->codecpar->block_align << 3) / |
|
aiff->block_duration; |
|
} |
|
break; |
|
case MKTAG('C','H','A','N'): |
|
if ((ret = ff_mov_read_chan(s, pb, st, size)) < 0) |
|
return ret; |
|
break; |
|
case MKTAG('A','P','C','M'): /* XA ADPCM compressed sound chunk */ |
|
st->codecpar->codec_id = AV_CODEC_ID_ADPCM_XA; |
|
aiff->data_end = avio_tell(pb) + size; |
|
offset = avio_tell(pb) + 8; |
|
/* This field is unknown and its data seems to be irrelevant */ |
|
avio_rb32(pb); |
|
st->codecpar->block_align = avio_rb32(pb); |
|
|
|
goto got_sound; |
|
break; |
|
case 0: |
|
if (offset > 0 && st->codecpar->block_align) // COMM && SSND |
|
goto got_sound; |
|
default: /* Jump */ |
|
avio_skip(pb, size); |
|
} |
|
|
|
/* Skip required padding byte for odd-sized chunks. */ |
|
if (size & 1) { |
|
filesize--; |
|
avio_skip(pb, 1); |
|
} |
|
} |
|
|
|
ret = ff_replaygain_export(st, s->metadata); |
|
if (ret < 0) |
|
return ret; |
|
|
|
got_sound: |
|
if (!st->codecpar->block_align && st->codecpar->codec_id == AV_CODEC_ID_QCELP) { |
|
av_log(s, AV_LOG_WARNING, "qcelp without wave chunk, assuming full rate\n"); |
|
st->codecpar->block_align = 35; |
|
} else if (st->codecpar->block_align <= 0) { |
|
av_log(s, AV_LOG_ERROR, "could not find COMM tag or invalid block_align value\n"); |
|
return AVERROR_INVALIDDATA; |
|
} |
|
if (aiff->block_duration < 0) |
|
return AVERROR_INVALIDDATA; |
|
|
|
/* Now positioned, get the sound data start and end */ |
|
avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate); |
|
st->start_time = 0; |
|
st->duration = st->nb_frames * aiff->block_duration; |
|
|
|
/* Position the stream at the first block */ |
|
avio_seek(pb, offset, SEEK_SET); |
|
|
|
return 0; |
|
} |
|
|
|
#define MAX_SIZE 4096 |
|
|
|
static int aiff_read_packet(AVFormatContext *s, |
|
AVPacket *pkt) |
|
{ |
|
AVStream *st = s->streams[0]; |
|
AIFFInputContext *aiff = s->priv_data; |
|
int64_t max_size; |
|
int res, size; |
|
|
|
/* calculate size of remaining data */ |
|
max_size = aiff->data_end - avio_tell(s->pb); |
|
if (max_size <= 0) |
|
return AVERROR_EOF; |
|
|
|
if (!st->codecpar->block_align) { |
|
av_log(s, AV_LOG_ERROR, "block_align not set\n"); |
|
return AVERROR_INVALIDDATA; |
|
} |
|
|
|
/* Now for that packet */ |
|
switch (st->codecpar->codec_id) { |
|
case AV_CODEC_ID_ADPCM_IMA_QT: |
|
case AV_CODEC_ID_GSM: |
|
case AV_CODEC_ID_QDM2: |
|
case AV_CODEC_ID_QCELP: |
|
size = st->codecpar->block_align; |
|
break; |
|
default: |
|
size = st->codecpar->block_align ? (MAX_SIZE / st->codecpar->block_align) * st->codecpar->block_align : MAX_SIZE; |
|
if (!size) |
|
return AVERROR_INVALIDDATA; |
|
} |
|
size = FFMIN(max_size, size); |
|
res = av_get_packet(s->pb, pkt, size); |
|
if (res < 0) |
|
return res; |
|
|
|
if (size >= st->codecpar->block_align) |
|
pkt->flags &= ~AV_PKT_FLAG_CORRUPT; |
|
/* Only one stream in an AIFF file */ |
|
pkt->stream_index = 0; |
|
pkt->duration = (res / st->codecpar->block_align) * (int64_t) aiff->block_duration; |
|
return 0; |
|
} |
|
|
|
const FFInputFormat ff_aiff_demuxer = { |
|
.p.name = "aiff", |
|
.p.long_name = NULL_IF_CONFIG_SMALL("Audio IFF"), |
|
.p.codec_tag = ff_aiff_codec_tags_list, |
|
.priv_data_size = sizeof(AIFFInputContext), |
|
.read_probe = aiff_probe, |
|
.read_header = aiff_read_header, |
|
.read_packet = aiff_read_packet, |
|
.read_seek = ff_pcm_read_seek, |
|
};
|
|
|