FFmpeg/libavcodec/h264chroma_template.c

/*
 * Copyright (c) 2000, 2001 Fabrice Bellard
 * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include "libavutil/avassert.h"

#include "bit_depth_template.c"

/**
 * Generate the H.264 chroma motion-compensation kernels for one store
 * operator.
 *
 * H264_CHROMA_MC(OPNAME, OP) defines four static functions,
 * FUNCC(OPNAME ## h264_chroma_mc1 / mc2 / mc4 / mc8), handling blocks that
 * are 1, 2, 4 or 8 pixels wide and h rows high. `pixel` and `FUNCC` are not
 * defined here; they are expected to come from bit_depth_template.c.
 *
 * Every output pixel is a bilinear blend of a 2x2 source neighbourhood:
 *
 *     sum = A*src[0] + B*src[1] + C*src[stride] + D*src[stride+1]
 *
 * with weights built from the fractional offsets x and y:
 *
 *     A = (8-x)*(8-y)   B = x*(8-y)   C = (8-x)*y   D = x*y
 *
 * The weights always add up to 64. The unnormalised sum is handed to
 * OP(dst_pixel, sum), which is responsible for scaling and storing it.
 *
 * Three cases are distinguished so that only the source pixels that carry a
 * non-zero weight are read:
 *   - D != 0          : x and y are both non-zero, full 4-tap blend.
 *   - D == 0, B+C != 0: exactly one of x, y is non-zero, 2-tap blend with the
 *                       right-hand (step == 1) or lower (step == stride)
 *                       neighbour.
 *   - B == C == D == 0: x == 0 and y == 0, only src[0..width-1] of each row
 *                       is read. Routing this case through the 2-tap loop
 *                       would fetch src[width] with a zero weight, i.e. read
 *                       one pixel beyond the block, which can lie outside the
 *                       source buffer.
 *
 * Parameters of the generated functions:
 *   _dst, _src  destination / source, reinterpreted as pixel pointers
 *   stride      distance between rows, shared by dst and src; shifted right
 *               by sizeof(pixel)-1 before being used as a pixel index
 *   h           number of rows to process
 *   x, y        fractional offsets; av_assert2 checks 0 <= x,y < 8
 */
#define H264_CHROMA_MC(OPNAME, OP)\
static void FUNCC(OPNAME ## h264_chroma_mc1)(uint8_t *_dst/*align 8*/, uint8_t *_src/*align 1*/, int stride, int h, int x, int y){\
    pixel *dst = (pixel*)_dst;\
    pixel *src = (pixel*)_src;\
    const int A=(8-x)*(8-y);\
    const int B=(  x)*(8-y);\
    const int C=(8-x)*(  y);\
    const int D=(  x)*(  y);\
    int i;\
    stride >>= sizeof(pixel)-1;\
    \
    av_assert2(x<8 && y<8 && x>=0 && y>=0);\
\
    if(D){\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1]));\
            dst+= stride;\
            src+= stride;\
        }\
    }else if(B + C){\
        /* only one direction is fractional: blend with a single neighbour */\
        const int E= B+C;\
        const int step= C ? stride : 1;\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + E*src[step+0]));\
            dst+= stride;\
            src+= stride;\
        }\
    }else{\
        /* x == 0 && y == 0: no neighbour contributes, so none is read */\
        for(i=0; i<h; i++){\
            OP(dst[0], A*src[0]);\
            dst+= stride;\
            src+= stride;\
        }\
    }\
}\
static void FUNCC(OPNAME ## h264_chroma_mc2)(uint8_t *_dst/*align 8*/, uint8_t *_src/*align 1*/, int stride, int h, int x, int y){\
    pixel *dst = (pixel*)_dst;\
    pixel *src = (pixel*)_src;\
    const int A=(8-x)*(8-y);\
    const int B=(  x)*(8-y);\
    const int C=(8-x)*(  y);\
    const int D=(  x)*(  y);\
    int i;\
    stride >>= sizeof(pixel)-1;\
    \
    av_assert2(x<8 && y<8 && x>=0 && y>=0);\
\
    if(D){\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1]));\
            OP(dst[1], (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2]));\
            dst+= stride;\
            src+= stride;\
        }\
    }else if(B + C){\
        /* only one direction is fractional: blend with a single neighbour */\
        const int E= B+C;\
        const int step= C ? stride : 1;\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + E*src[step+0]));\
            OP(dst[1], (A*src[1] + E*src[step+1]));\
            dst+= stride;\
            src+= stride;\
        }\
    }else{\
        /* x == 0 && y == 0: no neighbour contributes, so none is read */\
        for(i=0; i<h; i++){\
            OP(dst[0], A*src[0]);\
            OP(dst[1], A*src[1]);\
            dst+= stride;\
            src+= stride;\
        }\
    }\
}\
\
static void FUNCC(OPNAME ## h264_chroma_mc4)(uint8_t *_dst/*align 8*/, uint8_t *_src/*align 1*/, int stride, int h, int x, int y){\
    pixel *dst = (pixel*)_dst;\
    pixel *src = (pixel*)_src;\
    const int A=(8-x)*(8-y);\
    const int B=(  x)*(8-y);\
    const int C=(8-x)*(  y);\
    const int D=(  x)*(  y);\
    int i;\
    stride >>= sizeof(pixel)-1;\
    \
    av_assert2(x<8 && y<8 && x>=0 && y>=0);\
\
    if(D){\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1]));\
            OP(dst[1], (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2]));\
            OP(dst[2], (A*src[2] + B*src[3] + C*src[stride+2] + D*src[stride+3]));\
            OP(dst[3], (A*src[3] + B*src[4] + C*src[stride+3] + D*src[stride+4]));\
            dst+= stride;\
            src+= stride;\
        }\
    }else if(B + C){\
        /* only one direction is fractional: blend with a single neighbour */\
        const int E= B+C;\
        const int step= C ? stride : 1;\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + E*src[step+0]));\
            OP(dst[1], (A*src[1] + E*src[step+1]));\
            OP(dst[2], (A*src[2] + E*src[step+2]));\
            OP(dst[3], (A*src[3] + E*src[step+3]));\
            dst+= stride;\
            src+= stride;\
        }\
    }else{\
        /* x == 0 && y == 0: no neighbour contributes, so none is read */\
        for(i=0; i<h; i++){\
            OP(dst[0], A*src[0]);\
            OP(dst[1], A*src[1]);\
            OP(dst[2], A*src[2]);\
            OP(dst[3], A*src[3]);\
            dst+= stride;\
            src+= stride;\
        }\
    }\
}\
\
static void FUNCC(OPNAME ## h264_chroma_mc8)(uint8_t *_dst/*align 8*/, uint8_t *_src/*align 1*/, int stride, int h, int x, int y){\
    pixel *dst = (pixel*)_dst;\
    pixel *src = (pixel*)_src;\
    const int A=(8-x)*(8-y);\
    const int B=(  x)*(8-y);\
    const int C=(8-x)*(  y);\
    const int D=(  x)*(  y);\
    int i;\
    stride >>= sizeof(pixel)-1;\
    \
    av_assert2(x<8 && y<8 && x>=0 && y>=0);\
\
    if(D){\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1]));\
            OP(dst[1], (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2]));\
            OP(dst[2], (A*src[2] + B*src[3] + C*src[stride+2] + D*src[stride+3]));\
            OP(dst[3], (A*src[3] + B*src[4] + C*src[stride+3] + D*src[stride+4]));\
            OP(dst[4], (A*src[4] + B*src[5] + C*src[stride+4] + D*src[stride+5]));\
            OP(dst[5], (A*src[5] + B*src[6] + C*src[stride+5] + D*src[stride+6]));\
            OP(dst[6], (A*src[6] + B*src[7] + C*src[stride+6] + D*src[stride+7]));\
            OP(dst[7], (A*src[7] + B*src[8] + C*src[stride+7] + D*src[stride+8]));\
            dst+= stride;\
            src+= stride;\
        }\
    }else if(B + C){\
        /* only one direction is fractional: blend with a single neighbour */\
        const int E= B+C;\
        const int step= C ? stride : 1;\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + E*src[step+0]));\
            OP(dst[1], (A*src[1] + E*src[step+1]));\
            OP(dst[2], (A*src[2] + E*src[step+2]));\
            OP(dst[3], (A*src[3] + E*src[step+3]));\
            OP(dst[4], (A*src[4] + E*src[step+4]));\
            OP(dst[5], (A*src[5] + E*src[step+5]));\
            OP(dst[6], (A*src[6] + E*src[step+6]));\
            OP(dst[7], (A*src[7] + E*src[step+7]));\
            dst+= stride;\
            src+= stride;\
        }\
    }else{\
        /* x == 0 && y == 0: no neighbour contributes, so none is read */\
        for(i=0; i<h; i++){\
            OP(dst[0], A*src[0]);\
            OP(dst[1], A*src[1]);\
            OP(dst[2], A*src[2]);\
            OP(dst[3], A*src[3]);\
            OP(dst[4], A*src[4]);\
            OP(dst[5], A*src[5]);\
            OP(dst[6], A*src[6]);\
            OP(dst[7], A*src[7]);\
            dst+= stride;\
            src+= stride;\
        }\
    }\
}

/*
 * Store operators passed as OP to H264_CHROMA_MC. The argument b is the
 * weighted sum computed by the kernels; its weights add up to 64, so
 * ((b) + 32) >> 6 divides by 64 with rounding to nearest.
 */
/* avg: average the rounded result with the value already stored in a,
 * rounding halves up via the +1 before the final shift. */
#define op_avg(a, b) a = (((a)+(((b) + 32)>>6)+1)>>1)
/* put: overwrite a with the rounded result. */
#define op_put(a, b) a = (((b) + 32)>>6)

/* Instantiate the put_ and avg_ variants of the mc1/mc2/mc4/mc8 functions. */
H264_CHROMA_MC(put_       , op_put)
H264_CHROMA_MC(avg_       , op_avg)
/* Remove the helper operators once the functions have been generated. */
#undef op_avg
#undef op_put
dsputil: Separate h264chroma 12 years ago			`/*`
			`* Copyright (c) 2000, 2001 Fabrice Bellard`
			`* Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at>`
			`*`
Merge commit '79dad2a932534d1155079f937649e099f9e5cc27' * commit '79dad2a932534d1155079f937649e099f9e5cc27': dsputil: Separate h264chroma Conflicts: libavcodec/dsputil_template.c libavcodec/ppc/dsputil_ppc.c libavcodec/vc1dec.c libavcodec/vc1dsp.c Merged-by: Michael Niedermayer <michaelni@gmx.at> 12 years ago			`* This file is part of FFmpeg.`
dsputil: Separate h264chroma 12 years ago			`*`
Merge commit '79dad2a932534d1155079f937649e099f9e5cc27' * commit '79dad2a932534d1155079f937649e099f9e5cc27': dsputil: Separate h264chroma Conflicts: libavcodec/dsputil_template.c libavcodec/ppc/dsputil_ppc.c libavcodec/vc1dec.c libavcodec/vc1dsp.c Merged-by: Michael Niedermayer <michaelni@gmx.at> 12 years ago			`* FFmpeg is free software; you can redistribute it and/or`
dsputil: Separate h264chroma 12 years ago			`* modify it under the terms of the GNU Lesser General Public`
			`* License as published by the Free Software Foundation; either`
			`* version 2.1 of the License, or (at your option) any later version.`
			`*`
Merge commit '79dad2a932534d1155079f937649e099f9e5cc27' * commit '79dad2a932534d1155079f937649e099f9e5cc27': dsputil: Separate h264chroma Conflicts: libavcodec/dsputil_template.c libavcodec/ppc/dsputil_ppc.c libavcodec/vc1dec.c libavcodec/vc1dsp.c Merged-by: Michael Niedermayer <michaelni@gmx.at> 12 years ago			`* FFmpeg is distributed in the hope that it will be useful,`
dsputil: Separate h264chroma 12 years ago			`* but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU`
			`* Lesser General Public License for more details.`
			`*`
			`* You should have received a copy of the GNU Lesser General Public`
Merge commit '79dad2a932534d1155079f937649e099f9e5cc27' * commit '79dad2a932534d1155079f937649e099f9e5cc27': dsputil: Separate h264chroma Conflicts: libavcodec/dsputil_template.c libavcodec/ppc/dsputil_ppc.c libavcodec/vc1dec.c libavcodec/vc1dsp.c Merged-by: Michael Niedermayer <michaelni@gmx.at> 12 years ago			`* License along with FFmpeg; if not, write to the Free Software`
dsputil: Separate h264chroma 12 years ago			`* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA`
			`*/`

Merge commit '79dad2a932534d1155079f937649e099f9e5cc27' * commit '79dad2a932534d1155079f937649e099f9e5cc27': dsputil: Separate h264chroma Conflicts: libavcodec/dsputil_template.c libavcodec/ppc/dsputil_ppc.c libavcodec/vc1dec.c libavcodec/vc1dsp.c Merged-by: Michael Niedermayer <michaelni@gmx.at> 12 years ago			`#include "libavutil/avassert.h"`
dsputil: Separate h264chroma 12 years ago
			`#include "bit_depth_template.c"`

			`#define H264_CHROMA_MC(OPNAME, OP)\`
mpegvideo: implement ff_put_h264_chroma_mc1 & ff_avg_h264_chroma_mc2 These are needed for lowres 3 This may fix Ticket2538 Signed-off-by: Michael Niedermayer <michaelni@gmx.at> 12 years ago			`static void FUNCC(OPNAME ## h264_chroma_mc1)(uint8_t _dst/align 8/, uint8_t _src/align 1/, int stride, int h, int x, int y){\`
			`pixel dst = (pixel)_dst;\`
			`pixel src = (pixel)_src;\`
			`const int A=(8-x)*(8-y);\`
			`const int B=( x)*(8-y);\`
			`const int C=(8-x)*( y);\`
			`const int D=( x)*( y);\`
			`int i;\`
			`stride >>= sizeof(pixel)-1;\`
			`\`
			`av_assert2(x<8 && y<8 && x>=0 && y>=0);\`
			`\`
			`if(D){\`
			`for(i=0; i<h; i++){\`
			`OP(dst[0], (Asrc[0] + Bsrc[1] + Csrc[stride+0] + Dsrc[stride+1]));\`
			`dst+= stride;\`
			`src+= stride;\`
			`}\`
			`}else{\`
			`const int E= B+C;\`
			`const int step= C ? stride : 1;\`
			`for(i=0; i<h; i++){\`
			`OP(dst[0], (Asrc[0] + Esrc[step+0]));\`
			`dst+= stride;\`
			`src+= stride;\`
			`}\`
			`}\`
			`}\`
dsputil: Separate h264chroma 12 years ago			`static void FUNCC(OPNAME ## h264_chroma_mc2)(uint8_t _dst/align 8/, uint8_t _src/align 1/, int stride, int h, int x, int y){\`
			`pixel dst = (pixel)_dst;\`
			`pixel src = (pixel)_src;\`
			`const int A=(8-x)*(8-y);\`
			`const int B=( x)*(8-y);\`
			`const int C=(8-x)*( y);\`
			`const int D=( x)*( y);\`
			`int i;\`
Merge commit '79dad2a932534d1155079f937649e099f9e5cc27' * commit '79dad2a932534d1155079f937649e099f9e5cc27': dsputil: Separate h264chroma Conflicts: libavcodec/dsputil_template.c libavcodec/ppc/dsputil_ppc.c libavcodec/vc1dec.c libavcodec/vc1dsp.c Merged-by: Michael Niedermayer <michaelni@gmx.at> 12 years ago			`stride >>= sizeof(pixel)-1;\`
dsputil: Separate h264chroma 12 years ago			`\`
Merge commit '79dad2a932534d1155079f937649e099f9e5cc27' * commit '79dad2a932534d1155079f937649e099f9e5cc27': dsputil: Separate h264chroma Conflicts: libavcodec/dsputil_template.c libavcodec/ppc/dsputil_ppc.c libavcodec/vc1dec.c libavcodec/vc1dsp.c Merged-by: Michael Niedermayer <michaelni@gmx.at> 12 years ago			`av_assert2(x<8 && y<8 && x>=0 && y>=0);\`
dsputil: Separate h264chroma 12 years ago			`\`
			`if(D){\`
			`for(i=0; i<h; i++){\`
			`OP(dst[0], (Asrc[0] + Bsrc[1] + Csrc[stride+0] + Dsrc[stride+1]));\`
			`OP(dst[1], (Asrc[1] + Bsrc[2] + Csrc[stride+1] + Dsrc[stride+2]));\`
			`dst+= stride;\`
			`src+= stride;\`
			`}\`
			`}else{\`
			`const int E= B+C;\`
			`const int step= C ? stride : 1;\`
			`for(i=0; i<h; i++){\`
			`OP(dst[0], (Asrc[0] + Esrc[step+0]));\`
			`OP(dst[1], (Asrc[1] + Esrc[step+1]));\`
			`dst+= stride;\`
			`src+= stride;\`
			`}\`
			`}\`
			`}\`
			`\`
			`static void FUNCC(OPNAME ## h264_chroma_mc4)(uint8_t _dst/align 8/, uint8_t _src/align 1/, int stride, int h, int x, int y){\`
			`pixel dst = (pixel)_dst;\`
			`pixel src = (pixel)_src;\`
			`const int A=(8-x)*(8-y);\`
			`const int B=( x)*(8-y);\`
			`const int C=(8-x)*( y);\`
			`const int D=( x)*( y);\`
			`int i;\`
Merge commit '79dad2a932534d1155079f937649e099f9e5cc27' * commit '79dad2a932534d1155079f937649e099f9e5cc27': dsputil: Separate h264chroma Conflicts: libavcodec/dsputil_template.c libavcodec/ppc/dsputil_ppc.c libavcodec/vc1dec.c libavcodec/vc1dsp.c Merged-by: Michael Niedermayer <michaelni@gmx.at> 12 years ago			`stride >>= sizeof(pixel)-1;\`
dsputil: Separate h264chroma 12 years ago			`\`
Merge commit '79dad2a932534d1155079f937649e099f9e5cc27' * commit '79dad2a932534d1155079f937649e099f9e5cc27': dsputil: Separate h264chroma Conflicts: libavcodec/dsputil_template.c libavcodec/ppc/dsputil_ppc.c libavcodec/vc1dec.c libavcodec/vc1dsp.c Merged-by: Michael Niedermayer <michaelni@gmx.at> 12 years ago			`av_assert2(x<8 && y<8 && x>=0 && y>=0);\`
dsputil: Separate h264chroma 12 years ago			`\`
			`if(D){\`
			`for(i=0; i<h; i++){\`
			`OP(dst[0], (Asrc[0] + Bsrc[1] + Csrc[stride+0] + Dsrc[stride+1]));\`
			`OP(dst[1], (Asrc[1] + Bsrc[2] + Csrc[stride+1] + Dsrc[stride+2]));\`
			`OP(dst[2], (Asrc[2] + Bsrc[3] + Csrc[stride+2] + Dsrc[stride+3]));\`
			`OP(dst[3], (Asrc[3] + Bsrc[4] + Csrc[stride+3] + Dsrc[stride+4]));\`
			`dst+= stride;\`
			`src+= stride;\`
			`}\`
			`}else{\`
			`const int E= B+C;\`
			`const int step= C ? stride : 1;\`
			`for(i=0; i<h; i++){\`
			`OP(dst[0], (Asrc[0] + Esrc[step+0]));\`
			`OP(dst[1], (Asrc[1] + Esrc[step+1]));\`
			`OP(dst[2], (Asrc[2] + Esrc[step+2]));\`
			`OP(dst[3], (Asrc[3] + Esrc[step+3]));\`
			`dst+= stride;\`
			`src+= stride;\`
			`}\`
			`}\`
			`}\`
			`\`
			`static void FUNCC(OPNAME ## h264_chroma_mc8)(uint8_t _dst/align 8/, uint8_t _src/align 1/, int stride, int h, int x, int y){\`
			`pixel dst = (pixel)_dst;\`
			`pixel src = (pixel)_src;\`
			`const int A=(8-x)*(8-y);\`
			`const int B=( x)*(8-y);\`
			`const int C=(8-x)*( y);\`
			`const int D=( x)*( y);\`
			`int i;\`
Merge commit '79dad2a932534d1155079f937649e099f9e5cc27' * commit '79dad2a932534d1155079f937649e099f9e5cc27': dsputil: Separate h264chroma Conflicts: libavcodec/dsputil_template.c libavcodec/ppc/dsputil_ppc.c libavcodec/vc1dec.c libavcodec/vc1dsp.c Merged-by: Michael Niedermayer <michaelni@gmx.at> 12 years ago			`stride >>= sizeof(pixel)-1;\`
dsputil: Separate h264chroma 12 years ago			`\`
Merge commit '79dad2a932534d1155079f937649e099f9e5cc27' * commit '79dad2a932534d1155079f937649e099f9e5cc27': dsputil: Separate h264chroma Conflicts: libavcodec/dsputil_template.c libavcodec/ppc/dsputil_ppc.c libavcodec/vc1dec.c libavcodec/vc1dsp.c Merged-by: Michael Niedermayer <michaelni@gmx.at> 12 years ago			`av_assert2(x<8 && y<8 && x>=0 && y>=0);\`
dsputil: Separate h264chroma 12 years ago			`\`
			`if(D){\`
			`for(i=0; i<h; i++){\`
			`OP(dst[0], (Asrc[0] + Bsrc[1] + Csrc[stride+0] + Dsrc[stride+1]));\`
			`OP(dst[1], (Asrc[1] + Bsrc[2] + Csrc[stride+1] + Dsrc[stride+2]));\`
			`OP(dst[2], (Asrc[2] + Bsrc[3] + Csrc[stride+2] + Dsrc[stride+3]));\`
			`OP(dst[3], (Asrc[3] + Bsrc[4] + Csrc[stride+3] + Dsrc[stride+4]));\`
			`OP(dst[4], (Asrc[4] + Bsrc[5] + Csrc[stride+4] + Dsrc[stride+5]));\`
			`OP(dst[5], (Asrc[5] + Bsrc[6] + Csrc[stride+5] + Dsrc[stride+6]));\`
			`OP(dst[6], (Asrc[6] + Bsrc[7] + Csrc[stride+6] + Dsrc[stride+7]));\`
			`OP(dst[7], (Asrc[7] + Bsrc[8] + Csrc[stride+7] + Dsrc[stride+8]));\`
			`dst+= stride;\`
			`src+= stride;\`
			`}\`
			`}else{\`
			`const int E= B+C;\`
			`const int step= C ? stride : 1;\`
			`for(i=0; i<h; i++){\`
			`OP(dst[0], (Asrc[0] + Esrc[step+0]));\`
			`OP(dst[1], (Asrc[1] + Esrc[step+1]));\`
			`OP(dst[2], (Asrc[2] + Esrc[step+2]));\`
			`OP(dst[3], (Asrc[3] + Esrc[step+3]));\`
			`OP(dst[4], (Asrc[4] + Esrc[step+4]));\`
			`OP(dst[5], (Asrc[5] + Esrc[step+5]));\`
			`OP(dst[6], (Asrc[6] + Esrc[step+6]));\`
			`OP(dst[7], (Asrc[7] + Esrc[step+7]));\`
			`dst+= stride;\`
			`src+= stride;\`
			`}\`
			`}\`
			`}`

			`#define op_avg(a, b) a = (((a)+(((b) + 32)>>6)+1)>>1)`
			`#define op_put(a, b) a = (((b) + 32)>>6)`

			`H264_CHROMA_MC(put_ , op_put)`
			`H264_CHROMA_MC(avg_ , op_avg)`
			`#undef op_avg`
			`#undef op_put`