|
|
|
@ -38,6 +38,8 @@ TX_DECL_FN(fft32, avx) |
|
|
|
|
TX_DECL_FN(fft32_ns, avx) |
|
|
|
|
TX_DECL_FN(fft32, fma3) |
|
|
|
|
TX_DECL_FN(fft32_ns, fma3) |
|
|
|
|
TX_DECL_FN(fft_sr, avx) |
|
|
|
|
TX_DECL_FN(fft_sr_ns, avx) |
|
|
|
|
TX_DECL_FN(fft_sr, fma3) |
|
|
|
|
TX_DECL_FN(fft_sr_ns, fma3) |
|
|
|
|
TX_DECL_FN(fft_sr, avx2) |
|
|
|
@ -57,6 +59,7 @@ TX_DECL_FN(fft16_asm, avx) |
|
|
|
|
TX_DECL_FN(fft16_asm, fma3) |
|
|
|
|
TX_DECL_FN(fft32_asm, avx) |
|
|
|
|
TX_DECL_FN(fft32_asm, fma3) |
|
|
|
|
TX_DECL_FN(fft_sr_asm, avx) |
|
|
|
|
TX_DECL_FN(fft_sr_asm, fma3) |
|
|
|
|
TX_DECL_FN(fft_sr_asm, avx2) |
|
|
|
|
|
|
|
|
@ -214,6 +217,11 @@ const FFTXCodelet * const ff_tx_codelet_list_float_x86[] = { |
|
|
|
|
AV_TX_INPLACE | FF_TX_PRESHUFFLE | FF_TX_ASM_CALL, AV_CPU_FLAG_AVXSLOW), |
|
|
|
|
TX_DEF(fft32_ns, FFT, 32, 32, 2, 0, 352, b8_i2, fma3, FMA3, AV_TX_INPLACE | FF_TX_PRESHUFFLE, |
|
|
|
|
AV_CPU_FLAG_AVXSLOW), |
|
|
|
|
TX_DEF(fft_sr, FFT, 64, 131072, 2, 0, 256, b8_i2, avx, AVX, 0, AV_CPU_FLAG_AVXSLOW), |
|
|
|
|
TX_DEF(fft_sr_asm, FFT, 64, 131072, 2, 0, 320, b8_i2, avx, AVX, |
|
|
|
|
AV_TX_INPLACE | FF_TX_PRESHUFFLE | FF_TX_ASM_CALL, AV_CPU_FLAG_AVXSLOW), |
|
|
|
|
TX_DEF(fft_sr_ns, FFT, 64, 131072, 2, 0, 320, b8_i2, avx, AVX, AV_TX_INPLACE | FF_TX_PRESHUFFLE, |
|
|
|
|
AV_CPU_FLAG_AVXSLOW), |
|
|
|
|
TX_DEF(fft_sr, FFT, 64, 131072, 2, 0, 288, b8_i2, fma3, FMA3, 0, AV_CPU_FLAG_AVXSLOW), |
|
|
|
|
TX_DEF(fft_sr_asm, FFT, 64, 131072, 2, 0, 352, b8_i2, fma3, FMA3, |
|
|
|
|
AV_TX_INPLACE | FF_TX_PRESHUFFLE | FF_TX_ASM_CALL, AV_CPU_FLAG_AVXSLOW), |
|
|
|
|