Skip to content
GitLab
Projects
Groups
Snippets
Help
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
A
aom-rav1e
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Service Desk
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Operations
Operations
Incidents
Environments
Packages & Registries
Packages & Registries
Container Registry
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Xiph.Org
aom-rav1e
Commits
7725a7eb
Commit
7725a7eb
authored
Feb 14, 2011
by
Yunqing Wang
Committed by
Code Review
Feb 14, 2011
Browse files
Options
Browse Files
Download
Plain Diff
Merge "Improve vp8_sad16x16_sse3 function"
parents
27dad215
2debd5b5
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
25 additions
and
32 deletions
+25
-32
vp8/encoder/x86/sad_sse3.asm
vp8/encoder/x86/sad_sse3.asm
+25
-32
No files found.
vp8/encoder/x86/sad_sse3.asm
View file @
7725a7eb
...
...
@@ -586,52 +586,45 @@ sym(vp8_sad16x16_sse3):
STACK_FRAME_CREATE_X3
lea
end_ptr
,
[
src_ptr
+
src_stride
*
8
]
lea
end_ptr
,
[
end_ptr
+
src_stride
*
8
]
pxor
mm7
,
mm7
mov
end_ptr
,
4
pxor
xmm7
,
xmm7
.vp8_sad16x16_sse3_loop:
movdqa
xmm0
,
XMMWORD
PTR
[
src_ptr
]
movdqu
xmm1
,
XMMWORD
PTR
[
ref_ptr
]
movdqa
xmm2
,
XMMWORD
PTR
[
src_ptr
+
src_stride
]
movdqu
xmm3
,
XMMWORD
PTR
[
ref_ptr
+
ref_stride
]
movq
ret_var
,
mm7
cmp
ret_var
,
max_err
jg
.vp8_sad16x16_early_exit
movq
mm0
,
QWORD
PTR
[
src_ptr
]
movq
mm2
,
QWORD
PTR
[
src_ptr
+
8
]
movq
mm1
,
QWORD
PTR
[
ref_ptr
]
movq
mm3
,
QWORD
PTR
[
ref_ptr
+
8
]
lea
src_ptr
,
[
src_ptr
+
src_stride
*
2
]
lea
ref_ptr
,
[
ref_ptr
+
ref_stride
*
2
]
movq
mm4
,
QWORD
PTR
[
src_ptr
+
src_stride
]
movq
mm5
,
QWORD
PTR
[
ref_ptr
+
ref_stride
]
movdqa
xmm4
,
XMMWORD
PTR
[
src_ptr
]
movdqu
xmm5
,
XMMWORD
PTR
[
ref_ptr
]
movdqa
xmm6
,
XMMWORD
PTR
[
src_ptr
+
src_stride
]
psadbw
mm0
,
mm1
psadbw
mm2
,
mm3
psadbw
xmm0
,
xmm1
movq
mm1
,
QWORD
PTR
[
src_ptr
+
src_stride
+
8
]
movq
mm3
,
QWORD
PTR
[
ref_ptr
+
ref_stride
+
8
]
movdqu
xmm1
,
XMMWORD
PTR
[
ref_ptr
+
ref_stride
]
psadbw
mm4
,
mm5
psadbw
mm1
,
mm3
psadbw
xmm2
,
xmm3
psadbw
xmm4
,
xmm5
psadbw
xmm6
,
xmm1
lea
src_ptr
,
[
src_ptr
+
src_stride
*
2
]
lea
ref_ptr
,
[
ref_ptr
+
ref_stride
*
2
]
paddw
mm0
,
mm2
paddw
mm4
,
mm1
paddw
mm7
,
mm0
paddw
mm7
,
mm4
paddw
xmm7
,
xmm0
paddw
xmm7
,
xmm2
paddw
xmm7
,
xmm4
paddw
xmm7
,
xmm6
cmp
src_ptr
,
end_ptr
sub
end_ptr
,
1
jne
.vp8_sad16x16_sse3_loop
movq
ret_var
,
mm7
.vp8_sad16x16_early_exit:
mov
rax
,
ret_var
movq
xmm0
,
xmm7
psrldq
xmm7
,
8
paddw
xmm0
,
xmm7
movq
rax
,
xmm0
STACK_FRAME_DESTROY_X3
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment