|
|
|
@ -56,8 +56,8 @@ static const vec_s8 h_subpel_filters_outer[3] = |
|
|
|
|
vec_s8 filter_outerl = vec_sld(filter_outerh, filter_outerh, 2) |
|
|
|
|
|
|
|
|
|
#define FILTER_H(dstv, off) \ |
|
|
|
|
a = vec_ld((off)-2, src); \
|
|
|
|
|
b = vec_ld((off)-2+15, src); \
|
|
|
|
|
a = vec_ld((off)-is6tap-1, src); \
|
|
|
|
|
b = vec_ld((off)-is6tap-1+15, src); \
|
|
|
|
|
\
|
|
|
|
|
pixh = vec_perm(a, b, permh##off); \
|
|
|
|
|
pixl = vec_perm(a, b, perml##off); \
|
|
|
|
@ -86,13 +86,15 @@ void put_vp8_epel_h_altivec_core(uint8_t *dst, int dst_stride, |
|
|
|
|
vec_s16 f16h, f16l; |
|
|
|
|
vec_s32 filth, filtl; |
|
|
|
|
|
|
|
|
|
vec_u8 perm_inner = { 1,2,3,4, 2,3,4,5, 3,4,5,6, 4,5,6,7 }; |
|
|
|
|
vec_u8 perm_inner6 = { 1,2,3,4, 2,3,4,5, 3,4,5,6, 4,5,6,7 }; |
|
|
|
|
vec_u8 perm_inner4 = { 0,1,2,3, 1,2,3,4, 2,3,4,5, 3,4,5,6 }; |
|
|
|
|
vec_u8 perm_inner = is6tap ? perm_inner6 : perm_inner4; |
|
|
|
|
vec_u8 perm_outer = { 4,9, 0,5, 5,10, 1,6, 6,11, 2,7, 7,12, 3,8 }; |
|
|
|
|
vec_s32 c64 = vec_sl(vec_splat_s32(1), vec_splat_u32(6)); |
|
|
|
|
vec_u16 c7 = vec_splat_u16(7); |
|
|
|
|
|
|
|
|
|
align_vec0 = vec_lvsl( -2, src); |
|
|
|
|
align_vec8 = vec_lvsl(8-2, src); |
|
|
|
|
align_vec0 = vec_lvsl( -is6tap-1, src); |
|
|
|
|
align_vec8 = vec_lvsl(8-is6tap-1, src); |
|
|
|
|
|
|
|
|
|
permh0 = vec_perm(align_vec0, align_vec0, perm_inner); |
|
|
|
|
permh8 = vec_perm(align_vec8, align_vec8, perm_inner); |
|
|
|
@ -239,8 +241,13 @@ void put_vp8_epel ## WIDTH ## _v ## TAPS ## _altivec(uint8_t *dst, int dst_strid |
|
|
|
|
static void put_vp8_epel ## WIDTH ## _h ## HTAPS ## v ## VTAPS ## _altivec(uint8_t *dst, int stride, uint8_t *src, int s, int h, int mx, int my) \
|
|
|
|
|
{ \
|
|
|
|
|
DECLARE_ALIGNED(16, uint8_t, tmp)[(2*WIDTH+5)*16]; \
|
|
|
|
|
if (VTAPS == 6) { \
|
|
|
|
|
put_vp8_epel ## WIDTH ## _h ## HTAPS ## _altivec(tmp, 16, src-2*stride, stride, h+5, mx, my); \
|
|
|
|
|
put_vp8_epel ## WIDTH ## _v ## VTAPS ## _altivec(dst, stride, tmp+2*16, 16, h, mx, my); \
|
|
|
|
|
} else { \
|
|
|
|
|
put_vp8_epel ## WIDTH ## _h ## HTAPS ## _altivec(tmp, 16, src-stride, stride, h+4, mx, my); \
|
|
|
|
|
put_vp8_epel ## WIDTH ## _v ## VTAPS ## _altivec(dst, stride, tmp+16, 16, h, mx, my); \
|
|
|
|
|
} \
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
EPEL_FUNCS(16,6) |
|
|
|
|