@ -78,15 +78,15 @@ cglobal vector_clip_int32%5, 5,5,%1, dst, src, min, max, len
.loop:
% assign %%i 0
% rep %2
mova m0 , [ srcq + mmsize * ( 0 +%% i )]
mova m1 , [ srcq + mmsize * ( 1 +%% i )]
mova m2 , [ srcq + mmsize * ( 2 +%% i )]
mova m3 , [ srcq + mmsize * ( 3 +%% i )]
mova m0 , [ srcq + mmsize * ( 0 + %% i )]
mova m1 , [ srcq + mmsize * ( 1 + %% i )]
mova m2 , [ srcq + mmsize * ( 2 + %% i )]
mova m3 , [ srcq + mmsize * ( 3 + %% i )]
% if %3
mova m7 , [ srcq + mmsize * ( 4 +%% i )]
mova m8 , [ srcq + mmsize * ( 5 +%% i )]
mova m9 , [ srcq + mmsize * ( 6 +%% i )]
mova m10 , [ srcq + mmsize * ( 7 +%% i )]
mova m7 , [ srcq + mmsize * ( 4 + %% i )]
mova m8 , [ srcq + mmsize * ( 5 + %% i )]
mova m9 , [ srcq + mmsize * ( 6 + %% i )]
mova m10 , [ srcq + mmsize * ( 7 + %% i )]
% endif
CLIPD m0 , m4 , m5 , m6
CLIPD m1 , m4 , m5 , m6
@ -98,17 +98,17 @@ cglobal vector_clip_int32%5, 5,5,%1, dst, src, min, max, len
CLIPD m9 , m4 , m5 , m6
CLIPD m10 , m4 , m5 , m6
% endif
mova [ ds tq + mmsize * ( 0 +%% i )], m0
mova [ ds tq + mmsize * ( 1 +%% i )], m1
mova [ ds tq + mmsize * ( 2 +%% i )], m2
mova [ ds tq + mmsize * ( 3 +%% i )], m3
mova [ ds tq + mmsize * ( 0 + %% i )], m0
mova [ ds tq + mmsize * ( 1 + %% i )], m1
mova [ ds tq + mmsize * ( 2 + %% i )], m2
mova [ ds tq + mmsize * ( 3 + %% i )], m3
% if %3
mova [ ds tq + mmsize * ( 4 +%% i )], m7
mova [ ds tq + mmsize * ( 5 +%% i )], m8
mova [ ds tq + mmsize * ( 6 +%% i )], m9
mova [ ds tq + mmsize * ( 7 +%% i )], m10
mova [ ds tq + mmsize * ( 4 + %% i )], m7
mova [ ds tq + mmsize * ( 5 + %% i )], m8
mova [ ds tq + mmsize * ( 6 + %% i )], m9
mova [ ds tq + mmsize * ( 7 + %% i )], m10
% endif
% assign %%i %%i+4*(%3+1 )
% assign %%i (%%i + 4 * (1 + %3) )
% endrep
add srcq , mmsize * 4 * ( % 2 +% 3 )
add ds tq , mmsize * 4 * ( % 2 +% 3 )