summaryrefslogtreecommitdiff
path: root/vp9/common/x86
diff options
context:
space:
mode:
author Johann <johann.koenig@duck.com> 2013-05-23 12:50:41 -0700
committer Johann <johann.koenig@duck.com> 2013-07-11 11:08:19 -0700
commit 158c80cbb0aa6ab5e054d64917900a4422165777 (patch)
tree 51986b0bbbd5be9c9bba32da9f9bca34c788ef5a /vp9/common/x86
parent c9b25dcae4f492b558f2025d96664f4d4b2b42ea (diff)
downloadlibvpx-158c80cbb0aa6ab5e054d64917900a4422165777.tar
libvpx-158c80cbb0aa6ab5e054d64917900a4422165777.tar.gz
libvpx-158c80cbb0aa6ab5e054d64917900a4422165777.tar.bz2
libvpx-158c80cbb0aa6ab5e054d64917900a4422165777.zip
convolve8 optimizations for neon
Independent horizontal and vertical implementations. Requires that blocks be built from 4x4 and [xy]_step_q4 == 16. 6-10% improvement. CIF improved the least. Change-Id: I137f5ceae4440adc0960bf88e4453e55a618bcda
Diffstat (limited to 'vp9/common/x86')
-rw-r--r--vp9/common/x86/vp9_asm_stubs.c1
1 files changed, 1 insertions, 0 deletions
diff --git a/vp9/common/x86/vp9_asm_stubs.c b/vp9/common/x86/vp9_asm_stubs.c
index 98fc4dc83..3f1c19828 100644
--- a/vp9/common/x86/vp9_asm_stubs.c
+++ b/vp9/common/x86/vp9_asm_stubs.c
@@ -126,6 +126,7 @@ void vp9_convolve8_horiz_ssse3(const uint8_t *src, ptrdiff_t src_stride,
const int16_t *filter_x, int x_step_q4,
const int16_t *filter_y, int y_step_q4,
int w, int h) {
+ /* Ensure the filter can be compressed to int16_t. */
if (x_step_q4 == 16 && filter_x[3] != 128) {
while (w >= 16) {
vp9_filter_block1d16_h8_ssse3(src, src_stride,