|
|
|
@ -47,6 +47,129 @@ extern void ff_mix_1_to_2_s16p_flt_sse4(int16_t **src, float **matrix, int len, |
|
|
|
|
extern void ff_mix_1_to_2_s16p_flt_avx (int16_t **src, float **matrix, int len, |
|
|
|
|
int out_ch, int in_ch); |
|
|
|
|
|
|
|
|
|
#define DEFINE_MIX_3_8_TO_1_2(chan) \ |
|
|
|
|
extern void ff_mix_ ## chan ## _to_1_fltp_flt_sse(float **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_2_fltp_flt_sse(float **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
\
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_1_s16p_flt_sse2(int16_t **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_2_s16p_flt_sse2(int16_t **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
\
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_1_s16p_flt_sse4(int16_t **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_2_s16p_flt_sse4(int16_t **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
\
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_1_fltp_flt_avx(float **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_2_fltp_flt_avx(float **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
\
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_1_s16p_flt_avx(int16_t **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_2_s16p_flt_avx(int16_t **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
\
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_1_fltp_flt_fma4(float **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_2_fltp_flt_fma4(float **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
\
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_1_s16p_flt_fma4(int16_t **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); \
|
|
|
|
|
extern void ff_mix_ ## chan ## _to_2_s16p_flt_fma4(int16_t **src, \
|
|
|
|
|
float **matrix, int len, \
|
|
|
|
|
int out_ch, int in_ch); |
|
|
|
|
|
|
|
|
|
DEFINE_MIX_3_8_TO_1_2(3) |
|
|
|
|
DEFINE_MIX_3_8_TO_1_2(4) |
|
|
|
|
DEFINE_MIX_3_8_TO_1_2(5) |
|
|
|
|
DEFINE_MIX_3_8_TO_1_2(6) |
|
|
|
|
DEFINE_MIX_3_8_TO_1_2(7) |
|
|
|
|
DEFINE_MIX_3_8_TO_1_2(8) |
|
|
|
|
|
|
|
|
|
#define SET_MIX_3_8_TO_1_2(chan) \ |
|
|
|
|
if (mm_flags & AV_CPU_FLAG_SSE && HAVE_SSE) { \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_FLTP, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 1, 16, 4, "SSE", \
|
|
|
|
|
ff_mix_ ## chan ## _to_1_fltp_flt_sse); \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_FLTP, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 2, 16, 4, "SSE", \
|
|
|
|
|
ff_mix_## chan ##_to_2_fltp_flt_sse); \
|
|
|
|
|
} \
|
|
|
|
|
if (mm_flags & AV_CPU_FLAG_SSE2 && HAVE_SSE) { \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_S16P, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 1, 16, 8, "SSE2", \
|
|
|
|
|
ff_mix_ ## chan ## _to_1_s16p_flt_sse2); \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_S16P, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 2, 16, 8, "SSE2", \
|
|
|
|
|
ff_mix_ ## chan ## _to_2_s16p_flt_sse2); \
|
|
|
|
|
} \
|
|
|
|
|
if (mm_flags & AV_CPU_FLAG_SSE4 && HAVE_SSE) { \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_S16P, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 1, 16, 8, "SSE4", \
|
|
|
|
|
ff_mix_ ## chan ## _to_1_s16p_flt_sse4); \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_S16P, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 2, 16, 8, "SSE4", \
|
|
|
|
|
ff_mix_ ## chan ## _to_2_s16p_flt_sse4); \
|
|
|
|
|
} \
|
|
|
|
|
if (mm_flags & AV_CPU_FLAG_AVX && HAVE_AVX) { \
|
|
|
|
|
int ptr_align = 32; \
|
|
|
|
|
int smp_align = 8; \
|
|
|
|
|
if (ARCH_X86_32 || chan >= 6) { \
|
|
|
|
|
ptr_align = 16; \
|
|
|
|
|
smp_align = 4; \
|
|
|
|
|
} \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_FLTP, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 1, ptr_align, smp_align, "AVX", \
|
|
|
|
|
ff_mix_ ## chan ## _to_1_fltp_flt_avx); \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_FLTP, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 2, ptr_align, smp_align, "AVX", \
|
|
|
|
|
ff_mix_ ## chan ## _to_2_fltp_flt_avx); \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_S16P, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 1, 16, 8, "AVX", \
|
|
|
|
|
ff_mix_ ## chan ## _to_1_s16p_flt_avx); \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_S16P, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 2, 16, 8, "AVX", \
|
|
|
|
|
ff_mix_ ## chan ## _to_2_s16p_flt_avx); \
|
|
|
|
|
} \
|
|
|
|
|
if (mm_flags & AV_CPU_FLAG_FMA4 && HAVE_FMA4) { \
|
|
|
|
|
int ptr_align = 32; \
|
|
|
|
|
int smp_align = 8; \
|
|
|
|
|
if (ARCH_X86_32 || chan >= 6) { \
|
|
|
|
|
ptr_align = 16; \
|
|
|
|
|
smp_align = 4; \
|
|
|
|
|
} \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_FLTP, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 1, ptr_align, smp_align, "FMA4", \
|
|
|
|
|
ff_mix_ ## chan ## _to_1_fltp_flt_fma4); \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_FLTP, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 2, ptr_align, smp_align, "FMA4", \
|
|
|
|
|
ff_mix_ ## chan ## _to_2_fltp_flt_fma4); \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_S16P, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 1, 16, 8, "FMA4", \
|
|
|
|
|
ff_mix_ ## chan ## _to_1_s16p_flt_fma4); \
|
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_S16P, AV_MIX_COEFF_TYPE_FLT,\
|
|
|
|
|
chan, 2, 16, 8, "FMA4", \
|
|
|
|
|
ff_mix_ ## chan ## _to_2_s16p_flt_fma4); \
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
av_cold void ff_audio_mix_init_x86(AudioMix *am) |
|
|
|
|
{ |
|
|
|
|
#if HAVE_YASM |
|
|
|
@ -80,5 +203,12 @@ av_cold void ff_audio_mix_init_x86(AudioMix *am) |
|
|
|
|
ff_audio_mix_set_func(am, AV_SAMPLE_FMT_S16P, AV_MIX_COEFF_TYPE_FLT, |
|
|
|
|
1, 2, 16, 8, "AVX", ff_mix_1_to_2_s16p_flt_avx); |
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
SET_MIX_3_8_TO_1_2(3) |
|
|
|
|
SET_MIX_3_8_TO_1_2(4) |
|
|
|
|
SET_MIX_3_8_TO_1_2(5) |
|
|
|
|
SET_MIX_3_8_TO_1_2(6) |
|
|
|
|
SET_MIX_3_8_TO_1_2(7) |
|
|
|
|
SET_MIX_3_8_TO_1_2(8) |
|
|
|
|
#endif |
|
|
|
|
} |
|
|
|
|