1cabdff1aSopenharmony_ci/*
2cabdff1aSopenharmony_ci * Copyright (c) 2010 Mans Rullgard <mans@mansr.com>
3cabdff1aSopenharmony_ci *
4cabdff1aSopenharmony_ci * This file is part of FFmpeg.
5cabdff1aSopenharmony_ci *
6cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or
7cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public
8cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either
9cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version.
10cabdff1aSopenharmony_ci *
11cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful,
12cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of
13cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14cabdff1aSopenharmony_ci * Lesser General Public License for more details.
15cabdff1aSopenharmony_ci *
16cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public
17cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software
18cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19cabdff1aSopenharmony_ci */
20cabdff1aSopenharmony_ci
21cabdff1aSopenharmony_ci#include "libavutil/arm/asm.S"
22cabdff1aSopenharmony_ci
23cabdff1aSopenharmony_ci.macro  vp6_edge_filter
24cabdff1aSopenharmony_ci        vdup.16         q3,  r2                 @ t
25cabdff1aSopenharmony_ci        vmov.i16        q13, #1
26cabdff1aSopenharmony_ci        vsubl.u8        q0,  d20, d18           @ p[   0] - p[-s]
27cabdff1aSopenharmony_ci        vsubl.u8        q1,  d16, d22           @ p[-2*s] - p[ s]
28cabdff1aSopenharmony_ci        vsubl.u8        q14, d21, d19
29cabdff1aSopenharmony_ci        vsubl.u8        q15, d17, d23
30cabdff1aSopenharmony_ci        vadd.i16        q2,  q0,  q0            @ 2*(p[0]-p[-s])
31cabdff1aSopenharmony_ci        vadd.i16        d29, d28, d28
32cabdff1aSopenharmony_ci        vadd.i16        q0,  q0,  q1            @    p[0]-p[-s]  + p[-2*s]-p[s]
33cabdff1aSopenharmony_ci        vadd.i16        d28, d28, d30
34cabdff1aSopenharmony_ci        vadd.i16        q0,  q0,  q2            @ 3*(p[0]-p[-s]) + p[-2*s]-p[s]
35cabdff1aSopenharmony_ci        vadd.i16        d28, d28, d29
36cabdff1aSopenharmony_ci        vrshr.s16       q0,  q0,  #3            @ v
37cabdff1aSopenharmony_ci        vrshr.s16       d28, d28, #3
38cabdff1aSopenharmony_ci        vsub.i16        q8,  q3,  q13           @ t-1
39cabdff1aSopenharmony_ci        vabs.s16        q1,  q0                 @ V
40cabdff1aSopenharmony_ci        vshr.s16        q2,  q0,  #15           @ s
41cabdff1aSopenharmony_ci        vabs.s16        d30, d28
42cabdff1aSopenharmony_ci        vshr.s16        d29, d28, #15
43cabdff1aSopenharmony_ci        vsub.i16        q12, q1,  q3            @ V-t
44cabdff1aSopenharmony_ci        vsub.i16        d31, d30, d6
45cabdff1aSopenharmony_ci        vsub.i16        q12, q12, q13           @ V-t-1
46cabdff1aSopenharmony_ci        vsub.i16        d31, d31, d26
47cabdff1aSopenharmony_ci        vcge.u16        q12, q12, q8            @ V-t-1 >= t-1
48cabdff1aSopenharmony_ci        vcge.u16        d31, d31, d16
49cabdff1aSopenharmony_ci        vadd.i16        q13, q3,  q3            @ 2*t
50cabdff1aSopenharmony_ci        vadd.i16        d16, d6,  d6
51cabdff1aSopenharmony_ci        vsub.i16        q13, q13, q1            @ 2*t - V
52cabdff1aSopenharmony_ci        vsub.i16        d16, d16, d30
53cabdff1aSopenharmony_ci        vadd.i16        q13, q13, q2            @ += s
54cabdff1aSopenharmony_ci        vadd.i16        d16, d16, d29
55cabdff1aSopenharmony_ci        veor            q13, q13, q2            @ ^= s
56cabdff1aSopenharmony_ci        veor            d16, d16, d29
57cabdff1aSopenharmony_ci        vbif            q0,  q13, q12
58cabdff1aSopenharmony_ci        vbif            d28, d16, d31
59cabdff1aSopenharmony_ci        vmovl.u8        q1,  d20
60cabdff1aSopenharmony_ci        vmovl.u8        q15, d21
61cabdff1aSopenharmony_ci        vaddw.u8        q2,  q0,  d18
62cabdff1aSopenharmony_ci        vaddw.u8        q3,  q14, d19
63cabdff1aSopenharmony_ci        vsub.i16        q1,  q1,  q0
64cabdff1aSopenharmony_ci        vsub.i16        d30, d30, d28
65cabdff1aSopenharmony_ci        vqmovun.s16     d18, q2
66cabdff1aSopenharmony_ci        vqmovun.s16     d19, q3
67cabdff1aSopenharmony_ci        vqmovun.s16     d20, q1
68cabdff1aSopenharmony_ci        vqmovun.s16     d21, q15
69cabdff1aSopenharmony_ci.endm
70cabdff1aSopenharmony_ci
71cabdff1aSopenharmony_cifunction ff_vp6_edge_filter_ver_neon, export=1
72cabdff1aSopenharmony_ci        sub             r0,  r0,  r1,  lsl #1
73cabdff1aSopenharmony_ci        vld1.8          {q8},     [r0], r1      @ p[-2*s]
74cabdff1aSopenharmony_ci        vld1.8          {q9},     [r0], r1      @ p[-s]
75cabdff1aSopenharmony_ci        vld1.8          {q10},    [r0], r1      @ p[0]
76cabdff1aSopenharmony_ci        vld1.8          {q11},    [r0]          @ p[s]
77cabdff1aSopenharmony_ci        vp6_edge_filter
78cabdff1aSopenharmony_ci        sub             r0,  r0,  r1,  lsl #1
79cabdff1aSopenharmony_ci        sub             r1,  r1,  #8
80cabdff1aSopenharmony_ci        vst1.8          {d18},    [r0]!
81cabdff1aSopenharmony_ci        vst1.32         {d19[0]}, [r0], r1
82cabdff1aSopenharmony_ci        vst1.8          {d20},    [r0]!
83cabdff1aSopenharmony_ci        vst1.32         {d21[0]}, [r0]
84cabdff1aSopenharmony_ci        bx              lr
85cabdff1aSopenharmony_ciendfunc
86cabdff1aSopenharmony_ci
87cabdff1aSopenharmony_cifunction ff_vp6_edge_filter_hor_neon, export=1
88cabdff1aSopenharmony_ci        sub             r3,  r0,  #1
89cabdff1aSopenharmony_ci        sub             r0,  r0,  #2
90cabdff1aSopenharmony_ci        vld1.32         {d16[0]}, [r0], r1
91cabdff1aSopenharmony_ci        vld1.32         {d18[0]}, [r0], r1
92cabdff1aSopenharmony_ci        vld1.32         {d20[0]}, [r0], r1
93cabdff1aSopenharmony_ci        vld1.32         {d22[0]}, [r0], r1
94cabdff1aSopenharmony_ci        vld1.32         {d16[1]}, [r0], r1
95cabdff1aSopenharmony_ci        vld1.32         {d18[1]}, [r0], r1
96cabdff1aSopenharmony_ci        vld1.32         {d20[1]}, [r0], r1
97cabdff1aSopenharmony_ci        vld1.32         {d22[1]}, [r0], r1
98cabdff1aSopenharmony_ci        vld1.32         {d17[0]}, [r0], r1
99cabdff1aSopenharmony_ci        vld1.32         {d19[0]}, [r0], r1
100cabdff1aSopenharmony_ci        vld1.32         {d21[0]}, [r0], r1
101cabdff1aSopenharmony_ci        vld1.32         {d23[0]}, [r0], r1
102cabdff1aSopenharmony_ci        vtrn.8          q8,  q9
103cabdff1aSopenharmony_ci        vtrn.8          q10, q11
104cabdff1aSopenharmony_ci        vtrn.16         q8,  q10
105cabdff1aSopenharmony_ci        vtrn.16         q9,  q11
106cabdff1aSopenharmony_ci        vp6_edge_filter
107cabdff1aSopenharmony_ci        vtrn.8          q9,  q10
108cabdff1aSopenharmony_ci        vst1.16         {d18[0]}, [r3], r1
109cabdff1aSopenharmony_ci        vst1.16         {d20[0]}, [r3], r1
110cabdff1aSopenharmony_ci        vst1.16         {d18[1]}, [r3], r1
111cabdff1aSopenharmony_ci        vst1.16         {d20[1]}, [r3], r1
112cabdff1aSopenharmony_ci        vst1.16         {d18[2]}, [r3], r1
113cabdff1aSopenharmony_ci        vst1.16         {d20[2]}, [r3], r1
114cabdff1aSopenharmony_ci        vst1.16         {d18[3]}, [r3], r1
115cabdff1aSopenharmony_ci        vst1.16         {d20[3]}, [r3], r1
116cabdff1aSopenharmony_ci        vst1.16         {d19[0]}, [r3], r1
117cabdff1aSopenharmony_ci        vst1.16         {d21[0]}, [r3], r1
118cabdff1aSopenharmony_ci        vst1.16         {d19[1]}, [r3], r1
119cabdff1aSopenharmony_ci        vst1.16         {d21[1]}, [r3], r1
120cabdff1aSopenharmony_ci        bx              lr
121cabdff1aSopenharmony_ciendfunc
122