diff options
author | Johann <johann.koenig@duck.com> | 2013-05-23 12:50:41 -0700 |
---|---|---|
committer | Johann <johann.koenig@duck.com> | 2013-07-11 11:08:19 -0700 |
commit | 158c80cbb0aa6ab5e054d64917900a4422165777 (patch) | |
tree | 51986b0bbbd5be9c9bba32da9f9bca34c788ef5a /vp9/common/x86 | |
parent | c9b25dcae4f492b558f2025d96664f4d4b2b42ea (diff) | |
download | libvpx-158c80cbb0aa6ab5e054d64917900a4422165777.tar libvpx-158c80cbb0aa6ab5e054d64917900a4422165777.tar.gz libvpx-158c80cbb0aa6ab5e054d64917900a4422165777.tar.bz2 libvpx-158c80cbb0aa6ab5e054d64917900a4422165777.zip |
convolve8 optimizations for neon
Independent horizontal and vertical implementations.
Requires that blocks be built from 4x4 and [xy]_step_q4 == 16
6-10% improvement. CIF improved the least.
Change-Id: I137f5ceae4440adc0960bf88e4453e55a618bcda
Diffstat (limited to 'vp9/common/x86')
-rw-r--r-- | vp9/common/x86/vp9_asm_stubs.c | 1 |
1 file changed, 1 insertion, 0 deletions
diff --git a/vp9/common/x86/vp9_asm_stubs.c b/vp9/common/x86/vp9_asm_stubs.c
index 98fc4dc83..3f1c19828 100644
--- a/vp9/common/x86/vp9_asm_stubs.c
+++ b/vp9/common/x86/vp9_asm_stubs.c
@@ -126,6 +126,7 @@ void vp9_convolve8_horiz_ssse3(const uint8_t *src, ptrdiff_t src_stride,
                                const int16_t *filter_x, int x_step_q4,
                                const int16_t *filter_y, int y_step_q4,
                                int w, int h) {
+  /* Ensure the filter can be compressed to int16_t. */
   if (x_step_q4 == 16 && filter_x[3] != 128) {
     while (w >= 16) {
       vp9_filter_block1d16_h8_ssse3(src, src_stride,