Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
F
ffmpeg
Project
Project
Details
Activity
Releases
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Stefan Westerfeld
ffmpeg
Commits
28840cf4
Commit
28840cf4
authored
Oct 28, 2023
by
Rémi Denis-Courmont
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
lavc/jpeg2000dsp: R-V V rct_int
jpeg2000_rct_int_c: 2592.2 jpeg2000_rct_int_rvv_i32: 1154.2
parent
73dea2bb
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
29 additions
and
2 deletions
+29
-2
jpeg2000dsp_init.c
libavcodec/riscv/jpeg2000dsp_init.c
+6
-2
jpeg2000dsp_rvv.S
libavcodec/riscv/jpeg2000dsp_rvv.S
+23
-0
No files found.
libavcodec/riscv/jpeg2000dsp_init.c
View file @
28840cf4
...
...
@@ -24,13 +24,17 @@
#include "libavcodec/jpeg2000dsp.h"
void
ff_ict_float_rvv
(
void
*
src0
,
void
*
src1
,
void
*
src2
,
int
csize
);
void
ff_rct_int_rvv
(
void
*
src0
,
void
*
src1
,
void
*
src2
,
int
csize
);
av_cold
void
ff_jpeg2000dsp_init_riscv
(
Jpeg2000DSPContext
*
c
)
{
#if HAVE_RVV
int
flags
=
av_get_cpu_flags
();
if
((
flags
&
AV_CPU_FLAG_RVV_F32
)
&&
(
flags
&
AV_CPU_FLAG_RVB_ADDR
))
c
->
mct_decode
[
FF_DWT97
]
=
ff_ict_float_rvv
;
if
((
flags
&
AV_CPU_FLAG_RVV_I32
)
&&
(
flags
&
AV_CPU_FLAG_RVB_ADDR
))
{
if
(
flags
&
AV_CPU_FLAG_RVV_F32
)
c
->
mct_decode
[
FF_DWT97
]
=
ff_ict_float_rvv
;
c
->
mct_decode
[
FF_DWT53
]
=
ff_rct_int_rvv
;
}
#endif
}
libavcodec/riscv/jpeg2000dsp_rvv.S
View file @
28840cf4
...
...
@@ -47,3 +47,26 @@ func ff_ict_float_rvv, zve32f
ret
endfunc
func ff_rct_int_rvv, zve32x
1:
vsetvli t0, a3, e32, m8, ta, ma
vle32.v v16, (a1)
sub a3, a3, t0
vle32.v v24, (a2)
vle32.v v8, (a0)
vadd.vv v0, v16, v24
vsra.vi v0, v0, 2
vsub.vv v0, v8, v0
vadd.vv v8, v0, v24
vadd.vv v24, v0, v16
vse32.v v8, (a0)
sh2add a0, t0, a0
vse32.v v0, (a1)
sh2add a1, t0, a1
vse32.v v24, (a2)
sh2add a2, t0, a2
bnez a3, 1b
ret
endfunc
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment