|
|
|
@ -32,7 +32,7 @@ pd_32: times 4 dd 32 |
|
|
|
|
SECTION .text |
|
|
|
|
|
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
; void h264_idct_add(pixel *dst, dctcoef *block, int stride) |
|
|
|
|
; void h264_idct_add(pixel *dst, int16_t *block, int stride) |
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
%macro STORE_DIFFx2 6 |
|
|
|
|
psrad %1, 6 |
|
|
|
@ -87,7 +87,8 @@ INIT_XMM avx |
|
|
|
|
IDCT_ADD_10 |
|
|
|
|
|
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
; h264_idct_add16(pixel *dst, const int *block_offset, dctcoef *block, int stride, const uint8_t nnzc[6*8]) |
|
|
|
|
; h264_idct_add16(pixel *dst, const int *block_offset, int16_t *block, |
|
|
|
|
; int stride, const uint8_t nnzc[6*8]) |
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
;;;;;;; NO FATE SAMPLES TRIGGER THIS |
|
|
|
|
%macro ADD4x4IDCT 0 |
|
|
|
@ -157,7 +158,7 @@ INIT_XMM avx |
|
|
|
|
IDCT_ADD16_10 |
|
|
|
|
|
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
; void h264_idct_dc_add(pixel *dst, dctcoef *block, int stride) |
|
|
|
|
; void h264_idct_dc_add(pixel *dst, int16_t *block, int stride) |
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
%macro IDCT_DC_ADD_OP_10 3 |
|
|
|
|
pxor m5, m5 |
|
|
|
@ -199,7 +200,7 @@ cglobal h264_idct_dc_add_10,3,3 |
|
|
|
|
RET |
|
|
|
|
|
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
; void h264_idct8_dc_add(pixel *dst, dctcoef *block, int stride) |
|
|
|
|
; void h264_idct8_dc_add(pixel *dst, int16_t *block, int stride) |
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
%macro IDCT8_DC_ADD 0 |
|
|
|
|
cglobal h264_idct8_dc_add_10,3,4,7 |
|
|
|
@ -222,7 +223,8 @@ INIT_XMM avx |
|
|
|
|
IDCT8_DC_ADD |
|
|
|
|
|
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
; h264_idct_add16intra(pixel *dst, const int *block_offset, dctcoef *block, int stride, const uint8_t nnzc[6*8]) |
|
|
|
|
; h264_idct_add16intra(pixel *dst, const int *block_offset, int16_t *block, |
|
|
|
|
; int stride, const uint8_t nnzc[6*8]) |
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
%macro AC 1 |
|
|
|
|
.ac%1: |
|
|
|
@ -294,7 +296,8 @@ IDCT_ADD16INTRA_10 |
|
|
|
|
|
|
|
|
|
%assign last_block 36 |
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
; h264_idct_add8(pixel **dst, const int *block_offset, dctcoef *block, int stride, const uint8_t nnzc[6*8]) |
|
|
|
|
; h264_idct_add8(pixel **dst, const int *block_offset, int16_t *block, |
|
|
|
|
; int stride, const uint8_t nnzc[6*8]) |
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
%macro IDCT_ADD8 0 |
|
|
|
|
cglobal h264_idct_add8_10,5,8,7 |
|
|
|
@ -328,7 +331,7 @@ INIT_XMM avx |
|
|
|
|
IDCT_ADD8 |
|
|
|
|
|
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
; void h264_idct8_add(pixel *dst, dctcoef *block, int stride) |
|
|
|
|
; void h264_idct8_add(pixel *dst, int16_t *block, int stride) |
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
%macro IDCT8_1D 2 |
|
|
|
|
SWAP 0, 1 |
|
|
|
@ -535,7 +538,8 @@ INIT_XMM avx |
|
|
|
|
IDCT8_ADD |
|
|
|
|
|
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
; h264_idct8_add4(pixel **dst, const int *block_offset, dctcoef *block, int stride, const uint8_t nnzc[6*8]) |
|
|
|
|
; h264_idct8_add4(pixel **dst, const int *block_offset, int16_t *block, |
|
|
|
|
; int stride, const uint8_t nnzc[6*8]) |
|
|
|
|
;----------------------------------------------------------------------------- |
|
|
|
|
;;;;;;; NO FATE SAMPLES TRIGGER THIS |
|
|
|
|
%macro IDCT8_ADD4_OP 2 |
|
|
|
|