summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Yunqing Wang <yunqingwang@google.com> 2011-03-11 08:24:23 -0500
committer: Yunqing Wang <yunqingwang@google.com> 2011-03-11 08:24:23 -0500
commit: b2aa4017760c9bf9d267470ac235650e24b8adc5 (patch)
tree: 2e0af83e9567fa226af483d8332d9b622edbd3d3
parent: 6daacdb785f34efcf3c8600c65590199e79847d6 (diff)
download: libvpx-b2aa4017760c9bf9d267470ac235650e24b8adc5.tar
libvpx-b2aa4017760c9bf9d267470ac235650e24b8adc5.tar.gz
libvpx-b2aa4017760c9bf9d267470ac235650e24b8adc5.tar.bz2
libvpx-b2aa4017760c9bf9d267470ac235650e24b8adc5.zip
Align SAD output array to be 16-byte aligned

Use aligned store.

Change-Id: Icab4c0c53da811d0c52bb7e8134927f249ba2499
-rw-r--r-- vp8/encoder/mcomp.c 2
-rw-r--r-- vp8/encoder/x86/sad_sse4.asm 10
2 files changed, 6 insertions, 6 deletions
diff --git a/vp8/encoder/mcomp.c b/vp8/encoder/mcomp.c
index 33aaa2ca9..c210c1de2 100644
--- a/vp8/encoder/mcomp.c
+++ b/vp8/encoder/mcomp.c
@@ -1415,7 +1415,7 @@ int vp8_full_search_sadx8(MACROBLOCK *x, BLOCK *b, BLOCKD *d, MV *ref_mv, int er
int col_min = ref_col - distance;
int col_max = ref_col + distance;
- unsigned short sad_array8[8];
+ DECLARE_ALIGNED_ARRAY(16, unsigned short, sad_array8, 8);
unsigned int sad_array[3];
// Work out the mid point for the search
diff --git a/vp8/encoder/x86/sad_sse4.asm b/vp8/encoder/x86/sad_sse4.asm
index 21e2e5007..03ecec4b3 100644
--- a/vp8/encoder/x86/sad_sse4.asm
+++ b/vp8/encoder/x86/sad_sse4.asm
@@ -186,7 +186,7 @@ sym(vp8_sad16x16x8_sse4):
PROCESS_16X2X8 0
mov rdi, arg(4) ;Results
- movdqu XMMWORD PTR [rdi], xmm1
+ movdqa XMMWORD PTR [rdi], xmm1
; begin epilog
pop rdi
@@ -224,7 +224,7 @@ sym(vp8_sad16x8x8_sse4):
PROCESS_16X2X8 0
mov rdi, arg(4) ;Results
- movdqu XMMWORD PTR [rdi], xmm1
+ movdqa XMMWORD PTR [rdi], xmm1
; begin epilog
pop rdi
@@ -262,7 +262,7 @@ sym(vp8_sad8x8x8_sse4):
PROCESS_8X2X8 0
mov rdi, arg(4) ;Results
- movdqu XMMWORD PTR [rdi], xmm1
+ movdqa XMMWORD PTR [rdi], xmm1
; begin epilog
pop rdi
@@ -303,7 +303,7 @@ sym(vp8_sad8x16x8_sse4):
PROCESS_8X2X8 0
PROCESS_8X2X8 0
mov rdi, arg(4) ;Results
- movdqu XMMWORD PTR [rdi], xmm1
+ movdqa XMMWORD PTR [rdi], xmm1
; begin epilog
pop rdi
@@ -339,7 +339,7 @@ sym(vp8_sad4x4x8_sse4):
PROCESS_4X2X8 0
mov rdi, arg(4) ;Results
- movdqu XMMWORD PTR [rdi], xmm1
+ movdqa XMMWORD PTR [rdi], xmm1
; begin epilog
pop rdi