|
|
|
@ -32,8 +32,13 @@ |
|
|
|
|
|
|
|
|
|
static const vec_s16 constants = |
|
|
|
|
{0, 64277, 60547, 54491, 46341, 36410, 25080, 12785}; |
|
|
|
|
#if HAVE_BIGENDIAN |
|
|
|
|
static const vec_u8 interleave_high = |
|
|
|
|
{0, 1, 16, 17, 4, 5, 20, 21, 8, 9, 24, 25, 12, 13, 28, 29}; |
|
|
|
|
#else |
|
|
|
|
static const vec_u8 interleave_high = |
|
|
|
|
{2, 3, 18, 19, 6, 7, 22, 23, 10, 11, 26, 27, 14, 15, 30, 31}; |
|
|
|
|
#endif |
|
|
|
|
|
|
|
|
|
#define IDCT_START \ |
|
|
|
|
vec_s16 A, B, C, D, Ad, Bd, Cd, Dd, E, F, G, H;\
|
|
|
|
@ -156,9 +161,18 @@ static void vp3_idct_add_altivec(uint8_t *dst, int stride, int16_t block[64]) |
|
|
|
|
TRANSPOSE8(b0, b1, b2, b3, b4, b5, b6, b7); |
|
|
|
|
IDCT_1D(ADD8, SHIFT4) |
|
|
|
|
|
|
|
|
|
#define ADD(a)\ |
|
|
|
|
#if HAVE_BIGENDIAN |
|
|
|
|
#define GET_VDST16\ |
|
|
|
|
vdst = vec_ld(0, dst);\
|
|
|
|
|
vdst_16 = (vec_s16)vec_perm(vdst, zero_u8v, vdst_mask);\
|
|
|
|
|
vdst_16 = (vec_s16)vec_perm(vdst, zero_u8v, vdst_mask); |
|
|
|
|
#else |
|
|
|
|
#define GET_VDST16\ |
|
|
|
|
vdst = vec_vsx_ld(0,dst);\
|
|
|
|
|
vdst_16 = (vec_s16)vec_mergeh(vdst, zero_u8v); |
|
|
|
|
#endif |
|
|
|
|
|
|
|
|
|
#define ADD(a)\ |
|
|
|
|
GET_VDST16;\
|
|
|
|
|
vdst_16 = vec_adds(a, vdst_16);\
|
|
|
|
|
t = vec_packsu(vdst_16, vdst_16);\
|
|
|
|
|
vec_ste((vec_u32)t, 0, (unsigned int *)dst);\
|
|
|
|
|