Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Contribute to GitLab
Sign in / Register
Toggle navigation
F
ffmpeg.wasm-core
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Linshizhi
ffmpeg.wasm-core
Commits
a493f854
Commit
a493f854
authored
Jan 20, 2014
by
Michael Niedermayer
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
avcodec/x86/dsp: add_int16_mmx / add_int16_sse2
Signed-off-by:
Michael Niedermayer
<
michaelni@gmx.at
>
parent
da068482
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
70 additions
and
0 deletions
+70
-0
dsputil.asm
libavcodec/x86/dsputil.asm
+65
-0
dsputil_init.c
libavcodec/x86/dsputil_init.c
+3
-0
dsputil_x86.h
libavcodec/x86/dsputil_x86.h
+2
-0
No files found.
libavcodec/x86/dsputil.asm
View file @
a493f854
...
@@ -465,6 +465,71 @@ cglobal add_hfyu_left_prediction, 3,3,7, dst, src, w, left
...
@@ -465,6 +465,71 @@ cglobal add_hfyu_left_prediction, 3,3,7, dst, src, w, left
.
src_unaligned
:
.
src_unaligned
:
ADD_HFYU_LEFT_LOOP
0
,
0
ADD_HFYU_LEFT_LOOP
0
,
0
%macro
ADD_INT16_LOOP
1
; %1 = is_aligned
movd
m4
,
maskq
punpcklwd
m4
,
m4
punpcklwd
m4
,
m4
punpcklwd
m4
,
m4
add
wq
,
wq
test
wq
,
2
*
mmsize
-
1
jz
%%
.
tomainloop
%%
.
wordloop
:
sub
wq
,
2
mov
ax
,
[
srcq
+
wq
]
add
ax
,
[
dstq
+
wq
]
and
ax
,
maskw
mov
[
dstq
+
wq
]
,
ax
test
wq
,
2
*
mmsize
-
1
jnz
%%
.
wordloop
%%
.
tomainloop
:
add
srcq
,
wq
add
dstq
,
wq
neg
wq
jz
%%
.
end
%%
.
loop
:
%if
%1
mova
m0
,
[
srcq
+
wq
]
mova
m1
,
[
dstq
+
wq
]
mova
m2
,
[
srcq
+
wq
+
mmsize
]
mova
m3
,
[
dstq
+
wq
+
mmsize
]
%else
movu
m0
,
[
srcq
+
wq
]
movu
m1
,
[
dstq
+
wq
]
movu
m2
,
[
srcq
+
wq
+
mmsize
]
movu
m3
,
[
dstq
+
wq
+
mmsize
]
%endif
paddw
m0
,
m1
paddw
m2
,
m3
pand
m0
,
m4
pand
m2
,
m4
%if
%1
mova
[
dstq
+
wq
]
,
m0
mova
[
dstq
+
wq
+
mmsize
]
,
m2
%else
movu
[
dstq
+
wq
]
,
m0
movu
[
dstq
+
wq
+
mmsize
]
,
m2
%endif
add
wq
,
2
*
mmsize
jl
%%
.
loop
%%
.
end
:
RET
%endmacro
INIT_MMX
mmx
cglobal
add_int16
,
4
,
4
,
5
,
dst
,
src
,
mask
,
w
ADD_INT16_LOOP
1
INIT_XMM
sse2
cglobal
add_int16
,
4
,
4
,
5
,
dst
,
src
,
mask
,
w
test
srcq
,
mmsize
-
1
jnz
.
unaligned
test
dstq
,
mmsize
-
1
jnz
.
unaligned
ADD_INT16_LOOP
1
.
unaligned
:
ADD_INT16_LOOP
0
;-----------------------------------------------------------------------------
;-----------------------------------------------------------------------------
; void ff_vector_clip_int32(int32_t *dst, const int32_t *src, int32_t min,
; void ff_vector_clip_int32(int32_t *dst, const int32_t *src, int32_t min,
; int32_t max, unsigned int len)
; int32_t max, unsigned int len)
...
...
libavcodec/x86/dsputil_init.c
View file @
a493f854
...
@@ -542,6 +542,7 @@ static av_cold void dsputil_init_mmx(DSPContext *c, AVCodecContext *avctx,
...
@@ -542,6 +542,7 @@ static av_cold void dsputil_init_mmx(DSPContext *c, AVCodecContext *avctx,
#endif
/* HAVE_MMX_INLINE */
#endif
/* HAVE_MMX_INLINE */
#if HAVE_MMX_EXTERNAL
#if HAVE_MMX_EXTERNAL
c
->
add_int16
=
ff_add_int16_mmx
;
c
->
vector_clip_int32
=
ff_vector_clip_int32_mmx
;
c
->
vector_clip_int32
=
ff_vector_clip_int32_mmx
;
#endif
/* HAVE_MMX_EXTERNAL */
#endif
/* HAVE_MMX_EXTERNAL */
}
}
...
@@ -625,6 +626,8 @@ static av_cold void dsputil_init_sse2(DSPContext *c, AVCodecContext *avctx,
...
@@ -625,6 +626,8 @@ static av_cold void dsputil_init_sse2(DSPContext *c, AVCodecContext *avctx,
c
->
vector_clip_int32
=
ff_vector_clip_int32_sse2
;
c
->
vector_clip_int32
=
ff_vector_clip_int32_sse2
;
}
}
c
->
bswap_buf
=
ff_bswap32_buf_sse2
;
c
->
bswap_buf
=
ff_bswap32_buf_sse2
;
c
->
add_int16
=
ff_add_int16_sse2
;
#endif
/* HAVE_SSE2_EXTERNAL */
#endif
/* HAVE_SSE2_EXTERNAL */
}
}
...
...
libavcodec/x86/dsputil_x86.h
View file @
a493f854
...
@@ -116,6 +116,8 @@ void ff_clear_blocks_mmx(int16_t *blocks);
...
@@ -116,6 +116,8 @@ void ff_clear_blocks_mmx(int16_t *blocks);
void
ff_clear_blocks_sse
(
int16_t
*
blocks
);
void
ff_clear_blocks_sse
(
int16_t
*
blocks
);
void
ff_add_bytes_mmx
(
uint8_t
*
dst
,
uint8_t
*
src
,
int
w
);
void
ff_add_bytes_mmx
(
uint8_t
*
dst
,
uint8_t
*
src
,
int
w
);
void
ff_add_int16_mmx
(
uint16_t
*
dst
,
const
uint16_t
*
src
,
unsigned
mask
,
int
w
);
void
ff_add_int16_sse2
(
uint16_t
*
dst
,
const
uint16_t
*
src
,
unsigned
mask
,
int
w
);
void
ff_add_hfyu_median_prediction_cmov
(
uint8_t
*
dst
,
const
uint8_t
*
top
,
void
ff_add_hfyu_median_prediction_cmov
(
uint8_t
*
dst
,
const
uint8_t
*
top
,
const
uint8_t
*
diff
,
int
w
,
const
uint8_t
*
diff
,
int
w
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment