diff options
author | Martin Storsjö <martin@martin.st> | 2019-02-04 17:00:27 +0300 |
---|---|---|
committer | Martin Storsjö <martin@martin.st> | 2019-02-11 00:11:03 +0300 |
commit | 0d18b15aa084d180aa41f3c4b2cff7bf8cb68fdc (patch) | |
tree | 0b59a7bec4dc1f68ce204944b01f50fa7dbe1204 /src/cdef_tmpl.c | |
parent | 109ee5139931072df0a37021c61e32b3f8ab1172 (diff) |
arm64: cdef: NEON optimized cdef filter function
Speedup vs C code:
                           Cortex A53   A72    A73
cdef_filter_4x4_8bpc_neon:        4.62  4.48   4.76
cdef_filter_4x8_8bpc_neon:        4.82  4.80   5.08
cdef_filter_8x8_8bpc_neon:        5.29  5.33   5.79
Diffstat (limited to 'src/cdef_tmpl.c')
-rw-r--r-- | src/cdef_tmpl.c | 6 |
1 files changed, 5 insertions, 1 deletions
```diff
diff --git a/src/cdef_tmpl.c b/src/cdef_tmpl.c
index cb0b649..c6f8a9e 100644
--- a/src/cdef_tmpl.c
+++ b/src/cdef_tmpl.c
@@ -257,7 +257,11 @@ void bitfn(dav1d_cdef_dsp_init)(Dav1dCdefDSPContext *const c) {
     c->fb[1] = cdef_filter_block_4x8_c;
     c->fb[2] = cdef_filter_block_4x4_c;
 
-#if HAVE_ASM && ARCH_X86 && BITDEPTH == 8
+#if HAVE_ASM
+#if ARCH_AARCH64 || ARCH_ARM
+    bitfn(dav1d_cdef_dsp_init_arm)(c);
+#elif ARCH_X86
     bitfn(dav1d_cdef_dsp_init_x86)(c);
 #endif
+#endif
 }
```