From 09673deba953627af2f7ae12a8447136c77a62e4 Mon Sep 17 00:00:00 2001 From: JackyChen Date: Tue, 13 Jan 2015 10:50:50 -0800 Subject: SSE2 code for the filter in MFQE. The SSE2 code is taken from VP8 MFQE and reused in VP9. No change on the VP8 side. In our testing, we achieve a 2x speedup by adopting this change. Change-Id: Ib2b14144ae57c892005c1c4b84e3379d02e56716 --- vp9/common/vp9_rtcd_defs.pl | 6 ++++++ 1 file changed, 6 insertions(+) (limited to 'vp9/common/vp9_rtcd_defs.pl') diff --git a/vp9/common/vp9_rtcd_defs.pl b/vp9/common/vp9_rtcd_defs.pl index 88f85a86d..f715c9f28 100644 --- a/vp9/common/vp9_rtcd_defs.pl +++ b/vp9/common/vp9_rtcd_defs.pl @@ -274,6 +274,12 @@ $vp9_post_proc_down_and_across_sse2=vp9_post_proc_down_and_across_xmm; add_proto qw/void vp9_plane_add_noise/, "uint8_t *Start, char *noise, char blackclamp[16], char whiteclamp[16], char bothclamp[16], unsigned int Width, unsigned int Height, int Pitch"; specialize qw/vp9_plane_add_noise sse2/; $vp9_plane_add_noise_sse2=vp9_plane_add_noise_wmt; + +add_proto qw/void vp9_filter_by_weight16x16/, "const uint8_t *src, int src_stride, uint8_t *dst, int dst_stride, int src_weight"; +specialize qw/vp9_filter_by_weight16x16 sse2/; + +add_proto qw/void vp9_filter_by_weight8x8/, "const uint8_t *src, int src_stride, uint8_t *dst, int dst_stride, int src_weight"; +specialize qw/vp9_filter_by_weight8x8 sse2/; } # -- cgit v1.2.3