Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Contribute to GitLab
Sign in / Register
Toggle navigation
F
ffmpeg.wasm-core
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Linshizhi
ffmpeg.wasm-core
Commits
562653b7
Commit
562653b7
authored
Mar 27, 2016
by
Matthieu Bouron
Committed by
Matthieu Bouron
Apr 01, 2016
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
swscale/arm/yuv2rgb: macro-ify
parent
0286b56f
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
62 additions
and
79 deletions
+62
-79
yuv2rgb_neon.S
libswscale/arm/yuv2rgb_neon.S
+62
-79
No files found.
libswscale/arm/yuv2rgb_neon.S
View file @
562653b7
...
@@ -99,23 +99,23 @@
...
@@ -99,23 +99,23 @@
.endm
.endm
.macro process_1l_16px_internal dst src ofmt
vld1.8 {q7}, [\src]!
compute_16px \dst, d14, d15, \ofmt
.endm
.macro process_1l_16px ofmt
.macro process_1l_16px ofmt
compute_premult d28, d29, d30, d31
compute_premult d28, d29, d30, d31
vld1.8 {q7}, [r4]!
process_1l_16px_internal r2, r4, \ofmt
compute_16px r2, d14, d15, \ofmt
.endm
.endm
.macro process_2l_16px ofmt
.macro process_2l_16px ofmt
compute_premult d28, d29, d30, d31
compute_premult d28, d29, d30, d31
process_1l_16px_internal r2, r4, \ofmt
vld1.8 {q7}, [r4]! @ first line of luma
process_1l_16px_internal r11,r12,\ofmt
compute_16px r2, d14, d15, \ofmt
vld1.8 {q7}, [r12]! @ second line of luma
compute_16px r11, d14, d15, \ofmt
.endm
.endm
.macro load_args_nv
x
.macro load_args_nv
12
push {r4-r12, lr}
push {r4-r12, lr}
vpush {q4-q7}
vpush {q4-q7}
ldr r4, [sp, #104] @ r4 = srcY
ldr r4, [sp, #104] @ r4 = srcY
...
@@ -136,6 +136,10 @@
...
@@ -136,6 +136,10 @@
sub r7, r7, r0 @ r7 = linesizeC - width (paddingC)
sub r7, r7, r0 @ r7 = linesizeC - width (paddingC)
.endm
.endm
.macro load_args_nv21
load_args_nv12
.endm
.macro load_args_yuv420p
.macro load_args_yuv420p
push {r4-r12, lr}
push {r4-r12, lr}
vpush {q4-q7}
vpush {q4-q7}
...
@@ -176,55 +180,23 @@
...
@@ -176,55 +180,23 @@
ldr r10,[sp, #120] @ r10 = srcV
ldr r10,[sp, #120] @ r10 = srcV
.endm
.endm
.macro declare_func ifmt ofmt
.macro load_chroma_nv12
function ff_\ifmt\()_to_\ofmt\()_neon, export=1
.ifc \ifmt,nv12
load_args_nvx
.endif
.ifc \ifmt,nv21
load_args_nvx
.endif
.ifc \ifmt,yuv420p
load_args_yuv420p
.endif
.ifc \ifmt,yuv422p
load_args_yuv422p
.endif
1:
mov r8, r0 @ r8 = width
2:
pld [r6, #64*3]
pld [r4, #64*3]
vmov.i8 d10, #128
.ifc \ifmt,nv12
pld [r12, #64*3]
pld [r12, #64*3]
vld2.8 {d2, d3}, [r6]! @ q1: interleaved chroma line
vld2.8 {d2, d3}, [r6]! @ q1: interleaved chroma line
vsubl.u8 q14, d2, d10 @ q14 = U - 128
vsubl.u8 q14, d2, d10 @ q14 = U - 128
vsubl.u8 q15, d3, d10 @ q15 = V - 128
vsubl.u8 q15, d3, d10 @ q15 = V - 128
.endm
process_2l_16px \ofmt
.macro load_chroma_nv21
.endif
.ifc \ifmt,nv21
pld [r12, #64*3]
pld [r12, #64*3]
vld2.8 {d2, d3}, [r6]! @ q1: interleaved chroma line
vld2.8 {d2, d3}, [r6]! @ q1: interleaved chroma line
vsubl.u8 q14, d3, d10 @ q14 = U - 128
vsubl.u8 q14, d3, d10 @ q14 = U - 128
vsubl.u8 q15, d2, d10 @ q15 = V - 128
vsubl.u8 q15, d2, d10 @ q15 = V - 128
.endm
process_2l_16px \ofmt
.macro load_chroma_yuv420p
.endif
.ifc \ifmt,yuv420p
pld [r10, #64*3]
pld [r10, #64*3]
pld [r12, #64*3]
pld [r12, #64*3]
...
@@ -232,68 +204,79 @@ function ff_\ifmt\()_to_\ofmt\()_neon, export=1
...
@@ -232,68 +204,79 @@ function ff_\ifmt\()_to_\ofmt\()_neon, export=1
vld1.8 d3, [r10]! @ d3: chroma blue line
vld1.8 d3, [r10]! @ d3: chroma blue line
vsubl.u8 q14, d2, d10 @ q14 = U - 128
vsubl.u8 q14, d2, d10 @ q14 = U - 128
vsubl.u8 q15, d3, d10 @ q15 = V - 128
vsubl.u8 q15, d3, d10 @ q15 = V - 128
.endm
process_2l_16px \ofmt
.macro load_chroma_yuv422p
.endif
.ifc \ifmt,yuv422p
pld [r10, #64*3]
pld [r10, #64*3]
vld1.8 d2, [r6]! @ d2: chroma red line
vld1.8 d2, [r6]! @ d2: chroma red line
vld1.8 d3, [r10]! @ d3: chroma blue line
vld1.8 d3, [r10]! @ d3: chroma blue line
vsubl.u8 q14, d2, d10 @ q14 = U - 128
vsubl.u8 q14, d2, d10 @ q14 = U - 128
vsubl.u8 q15, d3, d10 @ q15 = V - 128
vsubl.u8 q15, d3, d10 @ q15 = V - 128
.endm
process_1l_16px \ofmt
.macro increment_and_test_nv12
.endif
subs r8, r8, #16 @ width -= 16
bgt 2b
add r2, r2, r3 @ dst += padding
add r4, r4, r5 @ srcY += paddingY
.ifc \ifmt,nv12
add r11, r11, r3 @ dst2 += padding
add r11, r11, r3 @ dst2 += padding
add r12, r12, r5 @ srcY2 += paddingY
add r12, r12, r5 @ srcY2 += paddingY
add r6, r6, r7 @ srcC += paddingC
add r6, r6, r7 @ srcC += paddingC
subs r1, r1, #2 @ height -= 2
subs r1, r1, #2 @ height -= 2
.endif
.endm
.ifc \ifmt,nv21
add r11, r11, r3 @ dst2 += padding
add r12, r12, r5 @ srcY2 += paddingY
add r6, r6, r7 @ srcC += paddingC
.macro increment_and_test_nv21
subs r1, r1, #2 @ height -=
2
increment_and_test_nv1
2
.end
if
.end
m
.
ifc \ifmt,
yuv420p
.
macro increment_and_test_
yuv420p
add r11, r11, r3 @ dst2 += padding
add r11, r11, r3 @ dst2 += padding
add r12, r12, r5 @ srcY2 += paddingY
add r12, r12, r5 @ srcY2 += paddingY
ldr r7, [sp, #116] @ r7 = linesizeU
ldr r7, [sp, #116] @ r7 = linesizeU
sub r7, r7, r0, lsr #1 @ r7 = linesizeU - width / 2 (paddingU)
sub r7, r7, r0, lsr #1 @ r7 = linesizeU - width / 2 (paddingU)
add r6, r6, r7 @ srcU += paddingU
add r6, r6, r7 @ srcU += paddingU
ldr r7, [sp, #124] @ r7 = linesizeV
ldr r7, [sp, #124] @ r7 = linesizeV
sub r7, r7, r0, lsr #1 @ r7 = linesizeV - width / 2 (paddingV)
sub r7, r7, r0, lsr #1 @ r7 = linesizeV - width / 2 (paddingV)
add r10, r10, r7 @ srcV += paddingV
add r10, r10, r7 @ srcV += paddingV
subs r1, r1, #2 @ height -= 2
subs r1, r1, #2 @ height -= 2
.end
if
.end
m
.
ifc \ifmt,
yuv422p
.
macro increment_and_test_
yuv422p
add r6, r6, r7 @ srcU += paddingU
add r6, r6, r7 @ srcU += paddingU
add r10,r10,r12 @ srcV += paddingV
add r10,r10,r12 @ srcV += paddingV
subs r1, r1, #1 @ height -= 1
subs r1, r1, #1 @ height -= 1
.end
if
.end
m
bgt 1b
.macro process_nv12 ofmt
process_2l_16px \ofmt
.endm
.macro process_nv21 ofmt
process_2l_16px \ofmt
.endm
.macro process_yuv420p ofmt
process_2l_16px \ofmt
.endm
.macro process_yuv422p ofmt
process_1l_16px \ofmt
.endm
.macro declare_func ifmt ofmt
function ff_\ifmt\()_to_\ofmt\()_neon, export=1
load_args_\ifmt
1:
mov r8, r0 @ r8 = width
2:
pld [r6, #64*3]
pld [r4, #64*3]
vmov.i8 d10, #128
load_chroma_\ifmt
process_\ifmt \ofmt
subs r8, r8, #16 @ width -= 16
bgt 2b
add r2, r2, r3 @ dst += padding
add r4, r4, r5 @ srcY += paddingY
increment_and_test_\ifmt
bgt 1b
vpop {q4-q7}
vpop {q4-q7}
pop {r4-r12, lr}
pop {r4-r12, lr}
mov pc, lr
mov pc, lr
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment