diff options
author | Martin Storsjö <martin@martin.st> | 2019-02-08 15:19:55 +0300 |
---|---|---|
committer | Martin Storsjö <martin@martin.st> | 2019-02-14 01:00:41 +0300 |
commit | b3f0c9844be8610e23b0aa29e52f499de4eda083 (patch) | |
tree | 9adefc7c537e0618c718b402910f8a6306c12982 /src/arm/cdef_init_tmpl.c | |
parent | d1c56da1d1c65767924d6752e802380409a38d17 (diff) |
arm64: cdef: NEON implementation of the dir function
Speedup vs C code:
                     Cortex A53    A72    A73
cdef_dir_8bpc_neon:        4.43   3.51   4.39
Diffstat (limited to 'src/arm/cdef_init_tmpl.c')
-rw-r--r-- | src/arm/cdef_init_tmpl.c | 3 |
1 files changed, 3 insertions, 0 deletions
diff --git a/src/arm/cdef_init_tmpl.c b/src/arm/cdef_init_tmpl.c
index 44beb08..a7d58ff 100644
--- a/src/arm/cdef_init_tmpl.c
+++ b/src/arm/cdef_init_tmpl.c
@@ -29,6 +29,8 @@
 #include "src/cdef.h"
 
 #if BITDEPTH == 8 && ARCH_AARCH64
+decl_cdef_dir_fn(dav1d_cdef_find_dir_neon);
+
 void dav1d_cdef_padding4_neon(uint16_t *tmp, const pixel *src,
                               ptrdiff_t src_stride, const pixel (*left)[2],
                               /*const*/ pixel *const top[2], int h,
@@ -76,6 +78,7 @@ void bitfn(dav1d_cdef_dsp_init_arm)(Dav1dCdefDSPContext *const c) {
     if (!(flags & DAV1D_ARM_CPU_FLAG_NEON)) return;
 
 #if BITDEPTH == 8 && ARCH_AARCH64
+    c->dir = dav1d_cdef_find_dir_neon;
     c->fb[0] = cdef_filter_8x8_neon;
     c->fb[1] = cdef_filter_4x8_neon;
     c->fb[2] = cdef_filter_4x4_neon;