@ -2166,6 +2166,10 @@ function ff_hevc_put_hevc_qpel_uni_hv4_8_neon_i8mm, export=1
ldp x4 , x6 , [ s p , #16 ]
ldp x0 , x1 , [ s p , #32 ]
ldr x30 , [ s p ] , #48
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v4 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v4 _ 8 _ e n d _ n e o n
mov x9 , #( M A X _ P B _ S I Z E * 2 )
load_ q p e l _ f i l t e r h x6 , x5
ldr d16 , [ s p ]
@ -2208,6 +2212,10 @@ function ff_hevc_put_hevc_qpel_uni_hv6_8_neon_i8mm, export=1
ldp x4 , x6 , [ s p , #16 ]
ldp x0 , x1 , [ s p , #32 ]
ldr x30 , [ s p ] , #48
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v6 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v6 _ 8 _ e n d _ n e o n
mov x9 , #( M A X _ P B _ S I Z E * 2 )
load_ q p e l _ f i l t e r h x6 , x5
sub x1 , x1 , #4
@ -2253,6 +2261,10 @@ function ff_hevc_put_hevc_qpel_uni_hv8_8_neon_i8mm, export=1
ldp x4 , x6 , [ s p , #16 ]
ldp x0 , x1 , [ s p , #32 ]
ldr x30 , [ s p ] , #48
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v8 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v8 _ 8 _ e n d _ n e o n
mov x9 , #( M A X _ P B _ S I Z E * 2 )
load_ q p e l _ f i l t e r h x6 , x5
ldr q16 , [ s p ]
@ -2296,6 +2308,10 @@ function ff_hevc_put_hevc_qpel_uni_hv12_8_neon_i8mm, export=1
ldp x4 , x6 , [ s p , #16 ]
ldp x0 , x1 , [ s p , #32 ]
ldp x7 , x30 , [ s p ] , #48
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v12 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v12 _ 8 _ e n d _ n e o n
mov x9 , #( M A X _ P B _ S I Z E * 2 )
load_ q p e l _ f i l t e r h x6 , x5
sub x1 , x1 , #8
@ -2339,7 +2355,10 @@ function ff_hevc_put_hevc_qpel_uni_hv16_8_neon_i8mm, export=1
ldp x4 , x6 , [ s p , #16 ]
ldp x0 , x1 , [ s p , #32 ]
ldp x7 , x30 , [ s p ] , #48
.Lqpel_uni_hv16_loop :
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v16 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v16 _ 8 _ e n d _ n e o n
mov x9 , #( M A X _ P B _ S I Z E * 2 )
load_ q p e l _ f i l t e r h x6 , x5
sub w12 , w9 , w7 , l s l #1
@ -2414,7 +2433,7 @@ function ff_hevc_put_hevc_qpel_uni_hv32_8_neon_i8mm, export=1
ldp x4 , x6 , [ s p , #16 ]
ldp x0 , x1 , [ s p , #32 ]
ldp x7 , x30 , [ s p ] , #48
b . L q p e l _ u n i _ h v16 _ l o o p
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v16 _ 8 _ e n d _ n e o n
endfunc
function f f _ h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v48 _ 8 _ n e o n _ i 8 m m , e x p o r t =1
@ -2434,7 +2453,7 @@ function ff_hevc_put_hevc_qpel_uni_hv48_8_neon_i8mm, export=1
ldp x4 , x6 , [ s p , #16 ]
ldp x0 , x1 , [ s p , #32 ]
ldp x7 , x30 , [ s p ] , #48
b . L q p e l _ u n i _ h v16 _ l o o p
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v16 _ 8 _ e n d _ n e o n
endfunc
function f f _ h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v64 _ 8 _ n e o n _ i 8 m m , e x p o r t =1
@ -2454,7 +2473,7 @@ function ff_hevc_put_hevc_qpel_uni_hv64_8_neon_i8mm, export=1
ldp x4 , x6 , [ s p , #16 ]
ldp x0 , x1 , [ s p , #32 ]
ldp x7 , x30 , [ s p ] , #48
b . L q p e l _ u n i _ h v16 _ l o o p
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ h v16 _ 8 _ e n d _ n e o n
endfunc
DISABLE_ I 8 M M
# endif
@ -3776,6 +3795,10 @@ function ff_hevc_put_hevc_qpel_hv4_8_neon_i8mm, export=1
bl X ( f f _ h e v c _ p u t _ h e v c _ q p e l _ h4 _ 8 _ n e o n _ i 8 m m )
ldp x0 , x3 , [ s p , #16 ]
ldp x5 , x30 , [ s p ] , #32
b h e v c _ p u t _ h e v c _ q p e l _ h v4 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ h v4 _ 8 _ e n d _ n e o n
load_ q p e l _ f i l t e r h x5 , x4
ldr d16 , [ s p ]
ldr d17 , [ s p , x7 ]
@ -3813,6 +3836,10 @@ function ff_hevc_put_hevc_qpel_hv6_8_neon_i8mm, export=1
bl X ( f f _ h e v c _ p u t _ h e v c _ q p e l _ h6 _ 8 _ n e o n _ i 8 m m )
ldp x0 , x3 , [ s p , #16 ]
ldp x5 , x30 , [ s p ] , #32
b h e v c _ p u t _ h e v c _ q p e l _ h v6 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ h v6 _ 8 _ e n d _ n e o n
mov x8 , #120
load_ q p e l _ f i l t e r h x5 , x4
ldr q16 , [ s p ]
@ -3852,6 +3879,10 @@ function ff_hevc_put_hevc_qpel_hv8_8_neon_i8mm, export=1
bl X ( f f _ h e v c _ p u t _ h e v c _ q p e l _ h8 _ 8 _ n e o n _ i 8 m m )
ldp x0 , x3 , [ s p , #16 ]
ldp x5 , x30 , [ s p ] , #32
b h e v c _ p u t _ h e v c _ q p e l _ h v8 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ h v8 _ 8 _ e n d _ n e o n
mov x7 , #128
load_ q p e l _ f i l t e r h x5 , x4
ldr q16 , [ s p ]
@ -3890,6 +3921,10 @@ function ff_hevc_put_hevc_qpel_hv12_8_neon_i8mm, export=1
bl X ( f f _ h e v c _ p u t _ h e v c _ q p e l _ h12 _ 8 _ n e o n _ i 8 m m )
ldp x0 , x3 , [ s p , #16 ]
ldp x5 , x30 , [ s p ] , #32
b h e v c _ p u t _ h e v c _ q p e l _ h v12 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ h v12 _ 8 _ e n d _ n e o n
mov x7 , #128
load_ q p e l _ f i l t e r h x5 , x4
mov x8 , #112
@ -3927,6 +3962,10 @@ function ff_hevc_put_hevc_qpel_hv16_8_neon_i8mm, export=1
bl X ( f f _ h e v c _ p u t _ h e v c _ q p e l _ h16 _ 8 _ n e o n _ i 8 m m )
ldp x0 , x3 , [ s p , #16 ]
ldp x5 , x30 , [ s p ] , #32
b h e v c _ p u t _ h e v c _ q p e l _ h v16 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ h v16 _ 8 _ e n d _ n e o n
mov x7 , #128
load_ q p e l _ f i l t e r h x5 , x4
ld1 { v16 . 8 h , v17 . 8 h } , [ s p ] , x7
@ -3979,6 +4018,10 @@ function ff_hevc_put_hevc_qpel_hv32_8_neon_i8mm, export=1
bl X ( f f _ h e v c _ p u t _ h e v c _ q p e l _ h32 _ 8 _ n e o n _ i 8 m m )
ldp x0 , x3 , [ s p , #16 ]
ldp x5 , x30 , [ s p ] , #32
b h e v c _ p u t _ h e v c _ q p e l _ h v32 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ h v32 _ 8 _ e n d _ n e o n
mov x7 , #128
load_ q p e l _ f i l t e r h x5 , x4
0 : mov x8 , s p / / s r c
@ -4127,6 +4170,10 @@ endfunc
// Exported entry point ff_hevc_put_hevc_qpel_uni_w_hv4_8_neon_i8mm.
// The whole body is the QPEL_UNI_W_HV_HEADER macro instantiated with the
// argument 4, followed by a tail branch into the non-exported routine
// hevc_put_hevc_qpel_uni_w_hv4_8_end_neon that is defined right after it.
// NOTE(review): the tokens on the lines below are letter-spaced, which looks
// like an extraction artifact; the names above are the de-spaced reading.
function f f _ h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v4 _ 8 _ n e o n _ i 8 m m , e x p o r t =1
// NOTE(review): QPEL_UNI_W_HV_HEADER is defined outside this view; what it
// sets up (stack, registers, any call it makes) must be checked there.
QPEL_ U N I _ W _ H V _ H E A D E R 4
// Plain `b`, not `bl`: this instruction does not write x30, so execution does
// not come back to this function. Whatever the tail routine needs (registers,
// sp) has to be in place once the header macro has finished.
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v4 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v4 _ 8 _ e n d _ n e o n
ldr d16 , [ s p ]
ldr d17 , [ s p , x10 ]
add s p , s p , x10 , l s l #1
@ -4217,6 +4264,10 @@ endfunc
// Exported entry point ff_hevc_put_hevc_qpel_uni_w_hv8_8_neon_i8mm.
// Consists only of QPEL_UNI_W_HV_HEADER invoked with the argument 8 and a
// tail branch to hevc_put_hevc_qpel_uni_w_hv8_8_end_neon, the non-exported
// routine that starts immediately after this function.
// NOTE(review): identifiers below appear letter-spaced by extraction; the
// names in this comment are the de-spaced reading.
function f f _ h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v8 _ 8 _ n e o n _ i 8 m m , e x p o r t =1
// NOTE(review): macro body is not visible here; confirm its register and
// stack effects against its definition.
QPEL_ U N I _ W _ H V _ H E A D E R 8
// Unconditional branch without link (x30 untouched by this instruction), so
// control is handed over to the tail routine and never resumes here.
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v8 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v8 _ 8 _ e n d _ n e o n
ldr q16 , [ s p ]
ldr q17 , [ s p , x10 ]
add s p , s p , x10 , l s l #1
@ -4327,6 +4378,10 @@ endfunc
// Exported entry point ff_hevc_put_hevc_qpel_uni_w_hv16_8_neon_i8mm.
// Expands QPEL_UNI_W_HV_HEADER with the argument 16 and then branches to
// hevc_put_hevc_qpel_uni_w_hv16_8_end_neon, the non-exported routine defined
// directly below this function.
// NOTE(review): the lines below are letter-spaced (the macro argument reads
// "1 6"); this looks like an extraction artifact, intended value 16.
function f f _ h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v16 _ 8 _ n e o n _ i 8 m m , e x p o r t =1
// NOTE(review): QPEL_UNI_W_HV_HEADER is defined elsewhere; its effects on
// sp and the general registers are not visible from here.
QPEL_ U N I _ W _ H V _ H E A D E R 1 6
// Tail branch: `b` leaves x30 as it is, so this function is not re-entered
// after the jump.
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v16 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v16 _ 8 _ e n d _ n e o n
ldp q16 , q1 , [ s p ]
add s p , s p , x10
ldp q17 , q2 , [ s p ]
@ -4430,6 +4485,10 @@ endfunc
// Exported entry point ff_hevc_put_hevc_qpel_uni_w_hv32_8_neon_i8mm.
// Body: QPEL_UNI_W_HV_HEADER with the argument 32, then a tail branch to the
// non-exported hevc_put_hevc_qpel_uni_w_hv32_8_end_neon that follows.
// NOTE(review): tokens below are letter-spaced (argument reads "3 2"),
// apparently from extraction; intended value 32.
function f f _ h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v32 _ 8 _ n e o n _ i 8 m m , e x p o r t =1
// NOTE(review): header macro is opaque from this view. The tail routine
// that follows reads sp, w22 and x20 in its first instructions, so those are
// presumably prepared by this macro; confirm against its definition.
QPEL_ U N I _ W _ H V _ H E A D E R 3 2
// `b` rather than `bl`: no return address is written, control does not
// return to this function.
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v32 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v32 _ 8 _ e n d _ n e o n
mov x11 , s p
mov w12 , w22
mov x13 , x20
@ -4543,6 +4602,10 @@ endfunc
// Exported entry point ff_hevc_put_hevc_qpel_uni_w_hv64_8_neon_i8mm.
// Nothing but QPEL_UNI_W_HV_HEADER invoked with the argument 64 and a tail
// branch into hevc_put_hevc_qpel_uni_w_hv64_8_end_neon, the non-exported
// routine placed immediately after this function.
// NOTE(review): tokens below are letter-spaced (argument reads "6 4"),
// apparently from extraction; intended value 64.
function f f _ h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v64 _ 8 _ n e o n _ i 8 m m , e x p o r t =1
// NOTE(review): header macro is defined outside this view. The following
// tail routine starts by reading sp, w22 and x20, so the macro presumably
// leaves them set up; verify there.
QPEL_ U N I _ W _ H V _ H E A D E R 6 4
// Branch without link: x30 is not modified here and execution continues in
// the tail routine only.
b h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v64 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ u n i _ w _ h v64 _ 8 _ e n d _ n e o n
mov x11 , s p
mov w12 , w22
mov x13 , x20
@ -4671,6 +4734,10 @@ function ff_hevc_put_hevc_qpel_bi_hv4_8_neon_i8mm, export=1
ldp x4 , x5 , [ s p , #16 ]
ldp x0 , x1 , [ s p , #32 ]
ldp x7 , x30 , [ s p ] , #48
b h e v c _ p u t _ h e v c _ q p e l _ b i _ h v4 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ b i _ h v4 _ 8 _ e n d _ n e o n
mov x9 , #( M A X _ P B _ S I Z E * 2 )
load_ q p e l _ f i l t e r h x7 , x6
ld1 { v16 . 4 h } , [ s p ] , x9
@ -4712,6 +4779,10 @@ function ff_hevc_put_hevc_qpel_bi_hv6_8_neon_i8mm, export=1
ldp x4 , x5 , [ s p , #16 ]
ldp x0 , x1 , [ s p , #32 ]
ldp x7 , x30 , [ s p ] , #48
b h e v c _ p u t _ h e v c _ q p e l _ b i _ h v6 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ b i _ h v6 _ 8 _ e n d _ n e o n
mov x9 , #( M A X _ P B _ S I Z E * 2 )
load_ q p e l _ f i l t e r h x7 , x6
sub x1 , x1 , #4
@ -4758,6 +4829,10 @@ function ff_hevc_put_hevc_qpel_bi_hv8_8_neon_i8mm, export=1
ldp x4 , x5 , [ s p , #16 ]
ldp x0 , x1 , [ s p , #32 ]
ldp x7 , x30 , [ s p ] , #48
b h e v c _ p u t _ h e v c _ q p e l _ b i _ h v8 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ b i _ h v8 _ 8 _ e n d _ n e o n
mov x9 , #( M A X _ P B _ S I Z E * 2 )
load_ q p e l _ f i l t e r h x7 , x6
ld1 { v16 . 8 h } , [ s p ] , x9
@ -4822,7 +4897,10 @@ function ff_hevc_put_hevc_qpel_bi_hv16_8_neon_i8mm, export=1
ldp x0 , x1 , [ s p , #32 ]
ldp x7 , x30 , [ s p ] , #48
mov x6 , #16 / / w i d t h
.Lqpel_bi_hv16_loop :
b h e v c _ p u t _ h e v c _ q p e l _ b i _ h v16 _ 8 _ e n d _ n e o n
endfunc
function h e v c _ p u t _ h e v c _ q p e l _ b i _ h v16 _ 8 _ e n d _ n e o n
load_ q p e l _ f i l t e r h x7 , x8
mov x9 , #( M A X _ P B _ S I Z E * 2 )
mov x10 , x6
@ -4908,7 +4986,7 @@ function ff_hevc_put_hevc_qpel_bi_hv32_8_neon_i8mm, export=1
ldp x0 , x1 , [ s p , #32 ]
ldp x7 , x30 , [ s p ] , #48
mov x6 , #32 / / w i d t h
b . L q p e l _ b i _ h v16 _ l o o p
b h e v c _ p u t _ h e v c _ q p e l _ b i _ h v16 _ 8 _ e n d _ n e o n
endfunc
function f f _ h e v c _ p u t _ h e v c _ q p e l _ b i _ h v48 _ 8 _ n e o n _ i 8 m m , e x p o r t =1
@ -4929,7 +5007,7 @@ function ff_hevc_put_hevc_qpel_bi_hv48_8_neon_i8mm, export=1
ldp x0 , x1 , [ s p , #32 ]
ldp x7 , x30 , [ s p ] , #48
mov x6 , #48 / / w i d t h
b . L q p e l _ b i _ h v16 _ l o o p
b h e v c _ p u t _ h e v c _ q p e l _ b i _ h v16 _ 8 _ e n d _ n e o n
endfunc
function f f _ h e v c _ p u t _ h e v c _ q p e l _ b i _ h v64 _ 8 _ n e o n _ i 8 m m , e x p o r t =1
@ -4950,7 +5028,7 @@ function ff_hevc_put_hevc_qpel_bi_hv64_8_neon_i8mm, export=1
ldp x0 , x1 , [ s p , #32 ]
ldp x7 , x30 , [ s p ] , #48
mov x6 , #64 / / w i d t h
b . L q p e l _ b i _ h v16 _ l o o p
b h e v c _ p u t _ h e v c _ q p e l _ b i _ h v16 _ 8 _ e n d _ n e o n
endfunc
DISABLE_ I 8 M M