mirror of https://github.com/FFmpeg/FFmpeg.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
206 lines
7.0 KiB
206 lines
7.0 KiB
/* |
|
* Copyright (C) 2008 David Conrad |
|
* |
|
* This file is part of FFmpeg. |
|
* |
|
* FFmpeg is free software; you can redistribute it and/or |
|
* modify it under the terms of the GNU Lesser General Public |
|
* License as published by the Free Software Foundation; either |
|
* version 2.1 of the License, or (at your option) any later version. |
|
* |
|
* FFmpeg is distributed in the hope that it will be useful, |
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
|
* Lesser General Public License for more details. |
|
* |
|
* You should have received a copy of the GNU Lesser General Public |
|
* License along with FFmpeg; if not, write to the Free Software |
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
|
*/ |
|
|
|
#include <speex/speex.h> |
|
#include <speex/speex_header.h> |
|
#include <speex/speex_stereo.h> |
|
#include <speex/speex_callbacks.h> |
|
|
|
#include "libavutil/channel_layout.h" |
|
#include "libavutil/common.h" |
|
#include "avcodec.h" |
|
#include "codec_internal.h" |
|
#include "decode.h" |
|
|
|
typedef struct LibSpeexContext { |
|
SpeexBits bits; |
|
SpeexStereoState stereo; |
|
void *dec_state; |
|
int frame_size; |
|
int pktsize; |
|
} LibSpeexContext; |
|
|
|
|
|
static av_cold int libspeex_decode_init(AVCodecContext *avctx) |
|
{ |
|
LibSpeexContext *s = avctx->priv_data; |
|
const SpeexMode *mode; |
|
SpeexHeader *header = NULL; |
|
int spx_mode, channels = avctx->ch_layout.nb_channels; |
|
|
|
if (avctx->extradata && avctx->extradata_size >= 80) { |
|
header = speex_packet_to_header(avctx->extradata, |
|
avctx->extradata_size); |
|
if (!header) |
|
av_log(avctx, AV_LOG_WARNING, "Invalid Speex header\n"); |
|
} |
|
if (avctx->codec_tag == MKTAG('S', 'P', 'X', 'N')) { |
|
int quality; |
|
if (!avctx->extradata || avctx->extradata && avctx->extradata_size < 47) { |
|
av_log(avctx, AV_LOG_ERROR, "Missing or invalid extradata.\n"); |
|
return AVERROR_INVALIDDATA; |
|
} |
|
|
|
quality = avctx->extradata[37]; |
|
if (quality > 10) { |
|
av_log(avctx, AV_LOG_ERROR, "Unsupported quality mode %d.\n", quality); |
|
return AVERROR_PATCHWELCOME; |
|
} |
|
|
|
s->pktsize = ((const int[]){5,10,15,20,20,28,28,38,38,46,62})[quality]; |
|
|
|
spx_mode = 0; |
|
} else if (header) { |
|
avctx->sample_rate = header->rate; |
|
channels = header->nb_channels; |
|
spx_mode = header->mode; |
|
speex_header_free(header); |
|
} else { |
|
switch (avctx->sample_rate) { |
|
case 8000: spx_mode = 0; break; |
|
case 16000: spx_mode = 1; break; |
|
case 32000: spx_mode = 2; break; |
|
default: |
|
/* libspeex can handle any mode if initialized as ultra-wideband */ |
|
av_log(avctx, AV_LOG_WARNING, "Invalid sample rate: %d\n" |
|
"Decoding as 32kHz ultra-wideband\n", |
|
avctx->sample_rate); |
|
spx_mode = 2; |
|
} |
|
} |
|
|
|
mode = speex_lib_get_mode(spx_mode); |
|
if (!mode) { |
|
av_log(avctx, AV_LOG_ERROR, "Unknown Speex mode %d", spx_mode); |
|
return AVERROR_INVALIDDATA; |
|
} |
|
s->frame_size = 160 << spx_mode; |
|
if (!avctx->sample_rate) |
|
avctx->sample_rate = 8000 << spx_mode; |
|
|
|
if (channels < 1 || channels > 2) { |
|
/* libspeex can handle mono or stereo if initialized as stereo */ |
|
av_log(avctx, AV_LOG_ERROR, "Invalid channel count: %d.\n" |
|
"Decoding as stereo.\n", channels); |
|
channels = 2; |
|
} |
|
av_channel_layout_uninit(&avctx->ch_layout); |
|
avctx->ch_layout = channels == 2 ? (AVChannelLayout)AV_CHANNEL_LAYOUT_STEREO : |
|
(AVChannelLayout)AV_CHANNEL_LAYOUT_MONO; |
|
|
|
speex_bits_init(&s->bits); |
|
s->dec_state = speex_decoder_init(mode); |
|
if (!s->dec_state) { |
|
av_log(avctx, AV_LOG_ERROR, "Error initializing libspeex decoder.\n"); |
|
return -1; |
|
} |
|
|
|
if (channels == 2) { |
|
SpeexCallback callback; |
|
callback.callback_id = SPEEX_INBAND_STEREO; |
|
callback.func = speex_std_stereo_request_handler; |
|
callback.data = &s->stereo; |
|
s->stereo = (SpeexStereoState)SPEEX_STEREO_STATE_INIT; |
|
speex_decoder_ctl(s->dec_state, SPEEX_SET_HANDLER, &callback); |
|
} |
|
|
|
return 0; |
|
} |
|
|
|
static int libspeex_decode_frame(AVCodecContext *avctx, AVFrame *frame, |
|
int *got_frame_ptr, AVPacket *avpkt) |
|
{ |
|
uint8_t *buf = avpkt->data; |
|
int buf_size = avpkt->size; |
|
LibSpeexContext *s = avctx->priv_data; |
|
int16_t *output; |
|
int ret, consumed = 0; |
|
avctx->sample_fmt = AV_SAMPLE_FMT_S16; |
|
|
|
/* get output buffer */ |
|
frame->nb_samples = s->frame_size; |
|
if ((ret = ff_get_buffer(avctx, frame, 0)) < 0) |
|
return ret; |
|
output = (int16_t *)frame->data[0]; |
|
|
|
/* if there is not enough data left for the smallest possible frame or the |
|
next 5 bits are a terminator code, reset the libspeex buffer using the |
|
current packet, otherwise ignore the current packet and keep decoding |
|
frames from the libspeex buffer. */ |
|
if (speex_bits_remaining(&s->bits) < 5 || |
|
speex_bits_peek_unsigned(&s->bits, 5) == 0xF) { |
|
/* check for flush packet */ |
|
if (!buf || !buf_size) { |
|
*got_frame_ptr = 0; |
|
return buf_size; |
|
} |
|
if (s->pktsize && buf_size == 62) |
|
buf_size = s->pktsize; |
|
/* set new buffer */ |
|
speex_bits_read_from(&s->bits, buf, buf_size); |
|
consumed = avpkt->size; |
|
} |
|
|
|
/* decode a single frame */ |
|
ret = speex_decode_int(s->dec_state, &s->bits, output); |
|
if (ret <= -2) { |
|
av_log(avctx, AV_LOG_ERROR, "Error decoding Speex frame.\n"); |
|
return AVERROR_INVALIDDATA; |
|
} |
|
if (avctx->ch_layout.nb_channels == 2) |
|
speex_decode_stereo_int(output, s->frame_size, &s->stereo); |
|
|
|
*got_frame_ptr = 1; |
|
|
|
if (!avctx->bit_rate) |
|
speex_decoder_ctl(s->dec_state, SPEEX_GET_BITRATE, &avctx->bit_rate); |
|
return consumed; |
|
} |
|
|
|
static av_cold int libspeex_decode_close(AVCodecContext *avctx) |
|
{ |
|
LibSpeexContext *s = avctx->priv_data; |
|
|
|
speex_bits_destroy(&s->bits); |
|
speex_decoder_destroy(s->dec_state); |
|
|
|
return 0; |
|
} |
|
|
|
static av_cold void libspeex_decode_flush(AVCodecContext *avctx) |
|
{ |
|
LibSpeexContext *s = avctx->priv_data; |
|
speex_bits_reset(&s->bits); |
|
} |
|
|
|
const FFCodec ff_libspeex_decoder = { |
|
.p.name = "libspeex", |
|
.p.long_name = NULL_IF_CONFIG_SMALL("libspeex Speex"), |
|
.p.type = AVMEDIA_TYPE_AUDIO, |
|
.p.id = AV_CODEC_ID_SPEEX, |
|
.p.capabilities = AV_CODEC_CAP_SUBFRAMES | AV_CODEC_CAP_DELAY | AV_CODEC_CAP_DR1 | AV_CODEC_CAP_CHANNEL_CONF, |
|
.p.wrapper_name = "libspeex", |
|
.caps_internal = FF_CODEC_CAP_NOT_INIT_THREADSAFE, |
|
.priv_data_size = sizeof(LibSpeexContext), |
|
.init = libspeex_decode_init, |
|
.close = libspeex_decode_close, |
|
FF_CODEC_DECODE_CB(libspeex_decode_frame), |
|
.flush = libspeex_decode_flush, |
|
};
|
|
|