Skip to content
GitLab
Projects
Groups
Snippets
/
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Sign in
Toggle navigation
Menu
Open sidebar
VideoLAN
dav1d
Commits
65a1aafd
Commit
65a1aafd
authored
Sep 03, 2020
by
Martin Storsjö
Browse files
arm: mc: Avoid an unnecessary mov in 8tap_hv w2
This matches how the same logic is written for w4 and above.
parent
458273ed
Changes
3
Hide whitespace changes
Inline
Side-by-side
src/arm/32/mc.S
View file @
65a1aafd
...
...
@@ -1951,11 +1951,10 @@ L(\type\()_8tap_hv_tbl):
bl
L
(
\
type
\
()
_8tap_filter_2
)
vext.8
d18
,
d17
,
d26
,
#
4
vmov
d19
,
d26
vmull.s16
q2
,
d16
,
d2
[
0
]
vmlal.s16
q2
,
d17
,
d2
[
1
]
vmlal.s16
q2
,
d18
,
d2
[
2
]
vmlal.s16
q2
,
d
19
,
d2
[
3
]
vmlal.s16
q2
,
d
26
,
d2
[
3
]
vqrshrn.s32
d4
,
q2
,
#
\
shift_hv
vqmovun.s16
d4
,
q2
...
...
@@ -1964,7 +1963,7 @@ L(\type\()_8tap_hv_tbl):
vst1.16
{
d4
[
1
]},
[
\
ds2
,
:
16
],
\
d_strd
ble
0
f
vmov
d16
,
d18
vmov
d17
,
d
19
vmov
d17
,
d
26
b
2
b
280
:
//
2
x8
,
2
x16
,
2
x32
hv
...
...
@@ -2001,7 +2000,6 @@ L(\type\()_8tap_hv_tbl):
28
:
bl
L
(
\
type
\
()
_8tap_filter_2
)
vext.8
d22
,
d21
,
d26
,
#
4
vmov
d23
,
d26
vmull.s16
q2
,
d16
,
d2
[
0
]
vmlal.s16
q2
,
d17
,
d2
[
1
]
vmlal.s16
q2
,
d18
,
d2
[
2
]
...
...
@@ -2009,7 +2007,7 @@ L(\type\()_8tap_hv_tbl):
vmlal.s16
q2
,
d20
,
d3
[
0
]
vmlal.s16
q2
,
d21
,
d3
[
1
]
vmlal.s16
q2
,
d22
,
d3
[
2
]
vmlal.s16
q2
,
d2
3
,
d3
[
3
]
vmlal.s16
q2
,
d2
6
,
d3
[
3
]
vqrshrn.s32
d4
,
q2
,
#
\
shift_hv
vqmovun.s16
d4
,
q2
...
...
@@ -2022,7 +2020,7 @@ L(\type\()_8tap_hv_tbl):
vmov
d18
,
d20
vmov
d19
,
d21
vmov
d20
,
d22
vmov
d21
,
d2
3
vmov
d21
,
d2
6
b
28
b
0
:
...
...
src/arm/64/mc.S
View file @
65a1aafd
...
...
@@ -1906,11 +1906,10 @@ L(\type\()_8tap_hv):
bl
L
(
\
type
\
()
_8tap_filter_2
)
ext
v18
.8
b
,
v17
.8
b
,
v28
.8
b
,
#
4
mov
v19
.8
b
,
v28
.8
b
smull
v2
.4
s
,
v16
.4
h
,
v1
.
h
[
0
]
smlal
v2
.4
s
,
v17
.4
h
,
v1
.
h
[
1
]
smlal
v2
.4
s
,
v18
.4
h
,
v1
.
h
[
2
]
smlal
v2
.4
s
,
v
19
.4
h
,
v1
.
h
[
3
]
smlal
v2
.4
s
,
v
28
.4
h
,
v1
.
h
[
3
]
sqrshrn
v2
.4
h
,
v2
.4
s
,
#
\
shift_hv
sqxtun
v2
.8
b
,
v2
.8
h
...
...
@@ -1919,7 +1918,7 @@ L(\type\()_8tap_hv):
st1
{
v2
.
h
}[
1
],
[
\
ds2
],
\
d_strd
b.le
0
f
mov
v16
.8
b
,
v18
.8
b
mov
v17
.8
b
,
v
19
.8
b
mov
v17
.8
b
,
v
28
.8
b
b
2
b
280
:
//
2
x8
,
2
x16
,
2
x32
hv
...
...
@@ -1956,7 +1955,6 @@ L(\type\()_8tap_hv):
28
:
bl
L
(
\
type
\
()
_8tap_filter_2
)
ext
v22
.8
b
,
v21
.8
b
,
v28
.8
b
,
#
4
mov
v23
.8
b
,
v28
.8
b
smull
v2
.4
s
,
v16
.4
h
,
v1
.
h
[
0
]
smlal
v2
.4
s
,
v17
.4
h
,
v1
.
h
[
1
]
smlal
v2
.4
s
,
v18
.4
h
,
v1
.
h
[
2
]
...
...
@@ -1964,7 +1962,7 @@ L(\type\()_8tap_hv):
smlal
v2
.4
s
,
v20
.4
h
,
v1
.
h
[
4
]
smlal
v2
.4
s
,
v21
.4
h
,
v1
.
h
[
5
]
smlal
v2
.4
s
,
v22
.4
h
,
v1
.
h
[
6
]
smlal
v2
.4
s
,
v2
3
.4
h
,
v1
.
h
[
7
]
smlal
v2
.4
s
,
v2
8
.4
h
,
v1
.
h
[
7
]
sqrshrn
v2
.4
h
,
v2
.4
s
,
#
\
shift_hv
sqxtun
v2
.8
b
,
v2
.8
h
...
...
@@ -1977,7 +1975,7 @@ L(\type\()_8tap_hv):
mov
v18
.8
b
,
v20
.8
b
mov
v19
.8
b
,
v21
.8
b
mov
v20
.8
b
,
v22
.8
b
mov
v21
.8
b
,
v2
3
.8
b
mov
v21
.8
b
,
v2
8
.8
b
b
28
b
0
:
...
...
src/arm/64/mc16.S
View file @
65a1aafd
...
...
@@ -2057,11 +2057,10 @@ L(\type\()_8tap_hv):
bl
L
(
\
type
\
()
_8tap_filter_2
)
ext
v18
.16
b
,
v17
.16
b
,
v24
.16
b
,
#
8
mov
v19
.16
b
,
v24
.16
b
mul
v2
.4
s
,
v16
.4
s
,
v1
.
s
[
0
]
mla
v2
.4
s
,
v17
.4
s
,
v1
.
s
[
1
]
mla
v2
.4
s
,
v18
.4
s
,
v1
.
s
[
2
]
mla
v2
.4
s
,
v
19
.4
s
,
v1
.
s
[
3
]
mla
v2
.4
s
,
v
24
.4
s
,
v1
.
s
[
3
]
srshl
v2
.4
s
,
v2
.4
s
,
v29
.4
s
//
-(
6
+
intermediate_bits
)
sqxtun
v2
.4
h
,
v2
.4
s
...
...
@@ -2071,7 +2070,7 @@ L(\type\()_8tap_hv):
st1
{
v2
.
s
}[
1
],
[
\
ds2
],
\
d_strd
b.le
0
f
mov
v16
.16
b
,
v18
.16
b
mov
v17
.16
b
,
v
19
.16
b
mov
v17
.16
b
,
v
24
.16
b
b
2
b
280
:
//
2
x8
,
2
x16
,
2
x32
hv
...
...
@@ -2109,7 +2108,6 @@ L(\type\()_8tap_hv):
28
:
bl
L
(
\
type
\
()
_8tap_filter_2
)
ext
v22
.16
b
,
v21
.16
b
,
v24
.16
b
,
#
8
mov
v23
.16
b
,
v24
.16
b
mul
v3
.4
s
,
v16
.4
s
,
v1
.
s
[
0
]
mla
v3
.4
s
,
v17
.4
s
,
v1
.
s
[
1
]
mla
v3
.4
s
,
v18
.4
s
,
v1
.
s
[
2
]
...
...
@@ -2117,7 +2115,7 @@ L(\type\()_8tap_hv):
mla
v3
.4
s
,
v20
.4
s
,
v2
.
s
[
0
]
mla
v3
.4
s
,
v21
.4
s
,
v2
.
s
[
1
]
mla
v3
.4
s
,
v22
.4
s
,
v2
.
s
[
2
]
mla
v3
.4
s
,
v2
3
.4
s
,
v2
.
s
[
3
]
mla
v3
.4
s
,
v2
4
.4
s
,
v2
.
s
[
3
]
srshl
v3
.4
s
,
v3
.4
s
,
v29
.4
s
//
-(
6
+
intermediate_bits
)
sqxtun
v3
.4
h
,
v3
.4
s
...
...
@@ -2131,7 +2129,7 @@ L(\type\()_8tap_hv):
mov
v18
.16
b
,
v20
.16
b
mov
v19
.16
b
,
v21
.16
b
mov
v20
.16
b
,
v22
.16
b
mov
v21
.16
b
,
v2
3
.16
b
mov
v21
.16
b
,
v2
4
.16
b
b
28
b
0
:
...
...
Write
Preview
Supports
Markdown
0%
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment