mirror of https://github.com/FFmpeg/FFmpeg.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
209 lines
7.9 KiB
209 lines
7.9 KiB
/* |
|
* Copyright (c) 2015 James Almer |
|
* |
|
* This file is part of FFmpeg. |
|
* |
|
* FFmpeg is free software; you can redistribute it and/or modify |
|
* it under the terms of the GNU General Public License as published by |
|
* the Free Software Foundation; either version 2 of the License, or |
|
* (at your option) any later version. |
|
* |
|
* FFmpeg is distributed in the hope that it will be useful, |
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
|
* GNU General Public License for more details. |
|
* |
|
* You should have received a copy of the GNU General Public License along |
|
* with FFmpeg; if not, write to the Free Software Foundation, Inc., |
|
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. |
|
*/ |
|
|
|
#include <string.h> |
|
#include "checkasm.h" |
|
#include "libavcodec/flacdsp.h" |
|
#include "libavcodec/mathops.h" |
|
#include "libavutil/common.h" |
|
#include "libavutil/internal.h" |
|
#include "libavutil/intreadwrite.h" |
|
#include "libavutil/mem_internal.h" |
|
|
|
#define BUF_SIZE 256 |
|
#define MAX_CHANNELS 8 |
|
|
|
#define randomize_buffers() \ |
|
do { \ |
|
int i, j; \ |
|
for (i = 0; i < BUF_SIZE; i += 4) { \ |
|
for (j = 0; j < channels; j++) { \ |
|
uint32_t r = rnd() & (1 << (bits - 2)) - 1; \ |
|
AV_WN32A(ref_src[j] + i, r); \ |
|
AV_WN32A(new_src[j] + i, r); \ |
|
} \ |
|
} \ |
|
} while (0) |
|
|
|
static void check_decorrelate(uint8_t **ref_dst, uint8_t **ref_src, uint8_t **new_dst, uint8_t **new_src, |
|
int channels, int bits) { |
|
declare_func(void, uint8_t **out, int32_t **in, int channels, int len, int shift); |
|
|
|
randomize_buffers(); |
|
call_ref(ref_dst, (int32_t **)ref_src, channels, BUF_SIZE / sizeof(int32_t), 8); |
|
call_new(new_dst, (int32_t **)new_src, channels, BUF_SIZE / sizeof(int32_t), 8); |
|
if (memcmp(*ref_dst, *new_dst, bits == 16 ? BUF_SIZE * (channels/2) : BUF_SIZE * channels) || |
|
memcmp(*ref_src, *new_src, BUF_SIZE * channels)) |
|
fail(); |
|
bench_new(new_dst, (int32_t **)new_src, channels, BUF_SIZE / sizeof(int32_t), 8); |
|
} |
|
|
|
static void check_lpc(int pred_order, int bps) |
|
{ |
|
int qlevel = rnd() % 16; |
|
int coeff_prec = (rnd() % 15) + 1; |
|
LOCAL_ALIGNED_16(int32_t, coeffs, [32]); |
|
LOCAL_ALIGNED_16(int32_t, dst, [BUF_SIZE]); |
|
LOCAL_ALIGNED_16(int32_t, dst0, [BUF_SIZE]); |
|
LOCAL_ALIGNED_16(int32_t, dst1, [BUF_SIZE]); |
|
|
|
declare_func(void, int32_t *, const int[32], int, int, int); |
|
|
|
if (bps <= 16) |
|
coeff_prec = av_clip(coeff_prec, 0, 32 - bps - av_log2(pred_order)); |
|
|
|
for (int i = 0; i < 32; i++) |
|
coeffs[i] = sign_extend(rnd(), coeff_prec); |
|
for (int i = 0; i < BUF_SIZE; i++) |
|
dst[i] = sign_extend(rnd(), bps); |
|
|
|
memcpy(dst0, dst, BUF_SIZE * sizeof (int32_t)); |
|
memcpy(dst1, dst, BUF_SIZE * sizeof (int32_t)); |
|
call_ref(dst0, coeffs, pred_order, qlevel, BUF_SIZE); |
|
call_new(dst1, coeffs, pred_order, qlevel, BUF_SIZE); |
|
if (memcmp(dst0, dst1, BUF_SIZE * sizeof (int32_t)) != 0) |
|
fail(); |
|
bench_new(dst, coeffs, pred_order, qlevel, BUF_SIZE); |
|
} |
|
|
|
static void check_lpc33(int pred_order) |
|
{ |
|
int qlevel = rnd() % 16; |
|
int coeff_prec = (rnd() % 15) + 1; |
|
LOCAL_ALIGNED_16(int64_t, dst, [BUF_SIZE]); |
|
LOCAL_ALIGNED_16(int64_t, dst0, [BUF_SIZE]); |
|
LOCAL_ALIGNED_16(int64_t, dst1, [BUF_SIZE]); |
|
LOCAL_ALIGNED_16(int32_t, residuals, [BUF_SIZE]); |
|
LOCAL_ALIGNED_16(int32_t, coeffs, [32]); |
|
|
|
declare_func(void, int64_t *, const int32_t *, const int[32], int, int, int); |
|
|
|
for (int i = 0; i < 32; i++) |
|
coeffs[i] = sign_extend(rnd(), coeff_prec); |
|
|
|
for (int i = 0; i < BUF_SIZE; i++) { |
|
residuals[i] = sign_extend(rnd(), pred_order); |
|
dst[i] = sign_extend64(((int64_t)rnd() << 1) | (rnd() & 1), 33); |
|
} |
|
|
|
memcpy(dst0, dst, BUF_SIZE * sizeof (int64_t)); |
|
memcpy(dst1, dst, BUF_SIZE * sizeof (int64_t)); |
|
call_ref(dst0, residuals, coeffs, pred_order, qlevel, BUF_SIZE); |
|
call_new(dst1, residuals, coeffs, pred_order, qlevel, BUF_SIZE); |
|
if (memcmp(dst0, dst1, BUF_SIZE * sizeof (int64_t)) != 0) |
|
fail(); |
|
bench_new(dst, residuals, coeffs, pred_order, qlevel, BUF_SIZE); |
|
} |
|
|
|
static void check_wasted32(void) |
|
{ |
|
int wasted = rnd() % 32; |
|
LOCAL_ALIGNED_16(int32_t, dst, [BUF_SIZE]); |
|
LOCAL_ALIGNED_16(int32_t, dst0, [BUF_SIZE]); |
|
LOCAL_ALIGNED_16(int32_t, dst1, [BUF_SIZE]); |
|
|
|
declare_func(void, int32_t *, int, int); |
|
|
|
for (int i = 0; i < BUF_SIZE; i++) |
|
dst[i] = rnd(); |
|
|
|
memcpy(dst0, dst, BUF_SIZE * sizeof (int32_t)); |
|
memcpy(dst1, dst, BUF_SIZE * sizeof (int32_t)); |
|
call_ref(dst0, wasted, BUF_SIZE); |
|
call_new(dst1, wasted, BUF_SIZE); |
|
if (memcmp(dst0, dst1, BUF_SIZE * sizeof (int32_t)) != 0) |
|
fail(); |
|
bench_new(dst, wasted, BUF_SIZE); |
|
} |
|
|
|
static void check_wasted33(void) |
|
{ |
|
int wasted = rnd() % 33; |
|
LOCAL_ALIGNED_16(int64_t, dst0, [BUF_SIZE]); |
|
LOCAL_ALIGNED_16(int64_t, dst1, [BUF_SIZE]); |
|
LOCAL_ALIGNED_16(int32_t, residuals, [BUF_SIZE]); |
|
|
|
declare_func(void, int64_t *, const int32_t *, int, int); |
|
|
|
for (int i = 0; i < BUF_SIZE; i++) |
|
residuals[i] = rnd(); |
|
|
|
call_ref(dst0, residuals, wasted, BUF_SIZE); |
|
call_new(dst1, residuals, wasted, BUF_SIZE); |
|
if (memcmp(dst0, dst1, BUF_SIZE * sizeof (int64_t)) != 0) |
|
fail(); |
|
bench_new(dst0, residuals, wasted, BUF_SIZE); |
|
} |
|
|
|
void checkasm_check_flacdsp(void) |
|
{ |
|
LOCAL_ALIGNED_16(uint8_t, ref_dst, [BUF_SIZE*MAX_CHANNELS]); |
|
LOCAL_ALIGNED_16(uint8_t, ref_buf, [BUF_SIZE*MAX_CHANNELS]); |
|
LOCAL_ALIGNED_16(uint8_t, new_dst, [BUF_SIZE*MAX_CHANNELS]); |
|
LOCAL_ALIGNED_16(uint8_t, new_buf, [BUF_SIZE*MAX_CHANNELS]); |
|
uint8_t *ref_src[] = { &ref_buf[BUF_SIZE*0], &ref_buf[BUF_SIZE*1], &ref_buf[BUF_SIZE*2], &ref_buf[BUF_SIZE*3], |
|
&ref_buf[BUF_SIZE*4], &ref_buf[BUF_SIZE*5], &ref_buf[BUF_SIZE*6], &ref_buf[BUF_SIZE*7] }; |
|
uint8_t *new_src[] = { &new_buf[BUF_SIZE*0], &new_buf[BUF_SIZE*1], &new_buf[BUF_SIZE*2], &new_buf[BUF_SIZE*3], |
|
&new_buf[BUF_SIZE*4], &new_buf[BUF_SIZE*5], &new_buf[BUF_SIZE*6], &new_buf[BUF_SIZE*7] }; |
|
static const char * const names[3] = { "ls", "rs", "ms" }; |
|
static const struct { |
|
enum AVSampleFormat fmt; |
|
int bits; |
|
} fmts[] = { |
|
{ AV_SAMPLE_FMT_S16, 16 }, |
|
{ AV_SAMPLE_FMT_S32, 32 }, |
|
}; |
|
static const signed char pred_orders[] = { 13, 16, 29, 32 }; |
|
FLACDSPContext h; |
|
int i, j; |
|
|
|
for (i = 0; i < 2; i++) { |
|
ff_flacdsp_init(&h, fmts[i].fmt, 2); |
|
for (j = 0; j < 3; j++) |
|
if (check_func(h.decorrelate[j + 1], "flac_decorrelate_%s_%d", names[j], fmts[i].bits)) |
|
check_decorrelate(&ref_dst, ref_src, &new_dst, new_src, 2, fmts[i].bits); |
|
for (j = 2; j <= MAX_CHANNELS; j += 2) { |
|
ff_flacdsp_init(&h, fmts[i].fmt, j); |
|
if (check_func(h.decorrelate[0], "flac_decorrelate_indep%d_%d", j, fmts[i].bits)) |
|
check_decorrelate(&ref_dst, ref_src, &new_dst, new_src, j, fmts[i].bits); |
|
} |
|
} |
|
|
|
report("decorrelate"); |
|
|
|
for (i = 0; i < FF_ARRAY_ELEMS(pred_orders); i++) |
|
if (check_func(h.lpc16, "flac_lpc_16_%d", pred_orders[i])) |
|
check_lpc(pred_orders[i], 16); |
|
for (i = 0; i < FF_ARRAY_ELEMS(pred_orders); i++) |
|
if (check_func(h.lpc32, "flac_lpc_32_%d", pred_orders[i])) |
|
check_lpc(pred_orders[i], 32); |
|
for (i = 0; i < FF_ARRAY_ELEMS(pred_orders); i++) |
|
if (check_func(h.lpc33, "flac_lpc_33_%d", pred_orders[i])) |
|
check_lpc33(pred_orders[i]); |
|
|
|
report("lpc"); |
|
|
|
if (check_func(h.wasted32, "flac_wasted_32")) |
|
check_wasted32(); |
|
if (check_func(h.wasted33, "flac_wasted_33")) |
|
check_wasted33(); |
|
|
|
report("wasted"); |
|
}
|
|
|