diff options
author | Dragan Mrdjan <dmrdjan@mips.com> | 2012-04-11 09:53:15 -0700 |
---|---|---|
committer | Johann <johannkoenig@google.com> | 2012-07-10 10:01:54 -0700 |
commit | 07ff7fa8114d1d569e5b08d665c887af9bb9495f (patch) | |
tree | fab1f11267c2356b2449c86ed96cc899fa428a4b /vp8/common/rtcd_defs.sh | |
parent | bb3d510a18350eb44038897187b1c4b28da86200 (diff) | |
download | libvpx-07ff7fa8114d1d569e5b08d665c887af9bb9495f.tar libvpx-07ff7fa8114d1d569e5b08d665c887af9bb9495f.tar.gz libvpx-07ff7fa8114d1d569e5b08d665c887af9bb9495f.tar.bz2 libvpx-07ff7fa8114d1d569e5b08d665c887af9bb9495f.zip |
VP8 optimizations for MIPS dspr2
Signed-off-by: Raghu Gandham <raghu@mips.com>
Change-Id: I3a8bca425cd3dab746a6328c8fc8843c8e87aea6
Diffstat (limited to 'vp8/common/rtcd_defs.sh')
-rw-r--r-- | vp8/common/rtcd_defs.sh | 53 |
1 file changed, 36 insertions, 17 deletions
diff --git a/vp8/common/rtcd_defs.sh b/vp8/common/rtcd_defs.sh index d6cbd4ad5..f252d98fa 100644 --- a/vp8/common/rtcd_defs.sh +++ b/vp8/common/rtcd_defs.sh @@ -22,35 +22,42 @@ specialize vp8_dequantize_b mmx media neon vp8_dequantize_b_media=vp8_dequantize_b_v6 prototype void vp8_dequant_idct_add "short *input, short *dq, unsigned char *output, int stride" -specialize vp8_dequant_idct_add mmx media neon +specialize vp8_dequant_idct_add mmx media neon dspr2 vp8_dequant_idct_add_media=vp8_dequant_idct_add_v6 +vp8_dequant_idct_add_dspr2=vp8_dequant_idct_add_dspr2 prototype void vp8_dequant_idct_add_y_block "short *q, short *dq, unsigned char *dst, int stride, char *eobs" -specialize vp8_dequant_idct_add_y_block mmx sse2 media neon +specialize vp8_dequant_idct_add_y_block mmx sse2 media neon dspr2 vp8_dequant_idct_add_y_block_media=vp8_dequant_idct_add_y_block_v6 +vp8_dequant_idct_add_y_block_dspr2=vp8_dequant_idct_add_y_block_dspr2 prototype void vp8_dequant_idct_add_uv_block "short *q, short *dq, unsigned char *dst_u, unsigned char *dst_v, int stride, char *eobs" -specialize vp8_dequant_idct_add_uv_block mmx sse2 media neon +specialize vp8_dequant_idct_add_uv_block mmx sse2 media neon dspr2 vp8_dequant_idct_add_uv_block_media=vp8_dequant_idct_add_uv_block_v6 +vp8_dequant_idct_add_y_block_dspr2=vp8_dequant_idct_add_y_block_dspr2 # # Loopfilter # prototype void vp8_loop_filter_mbv "unsigned char *y, unsigned char *u, unsigned char *v, int ystride, int uv_stride, struct loop_filter_info *lfi" -specialize vp8_loop_filter_mbv mmx sse2 media neon +specialize vp8_loop_filter_mbv mmx sse2 media neon dspr2 vp8_loop_filter_mbv_media=vp8_loop_filter_mbv_armv6 +vp8_loop_filter_mbv_dspr2=vp8_loop_filter_mbv_dspr2 prototype void vp8_loop_filter_bv "unsigned char *y, unsigned char *u, unsigned char *v, int ystride, int uv_stride, struct loop_filter_info *lfi" -specialize vp8_loop_filter_bv mmx sse2 media neon +specialize vp8_loop_filter_bv mmx sse2 media neon dspr2 
vp8_loop_filter_bv_media=vp8_loop_filter_bv_armv6 +vp8_loop_filter_bv_dspr2=vp8_loop_filter_bv_dspr2 prototype void vp8_loop_filter_mbh "unsigned char *y, unsigned char *u, unsigned char *v, int ystride, int uv_stride, struct loop_filter_info *lfi" -specialize vp8_loop_filter_mbh mmx sse2 media neon +specialize vp8_loop_filter_mbh mmx sse2 media neon dspr2 vp8_loop_filter_mbh_media=vp8_loop_filter_mbh_armv6 +vp8_loop_filter_mbh_dspr2=vp8_loop_filter_mbh_dspr2 prototype void vp8_loop_filter_bh "unsigned char *y, unsigned char *u, unsigned char *v, int ystride, int uv_stride, struct loop_filter_info *lfi" -specialize vp8_loop_filter_bh mmx sse2 media neon +specialize vp8_loop_filter_bh mmx sse2 media neon dspr2 vp8_loop_filter_bh_media=vp8_loop_filter_bh_armv6 +vp8_loop_filter_bh_dspr2=vp8_loop_filter_bh_dspr2 prototype void vp8_loop_filter_simple_mbv "unsigned char *y, int ystride, const unsigned char *blimit" @@ -90,37 +97,45 @@ vp8_loop_filter_simple_bh_neon=vp8_loop_filter_bhs_neon # #idct16 prototype void vp8_short_idct4x4llm "short *input, unsigned char *pred, int pitch, unsigned char *dst, int dst_stride" -specialize vp8_short_idct4x4llm mmx media neon +specialize vp8_short_idct4x4llm mmx media neon dspr2 vp8_short_idct4x4llm_media=vp8_short_idct4x4llm_v6_dual +vp8_short_idct4x4llm_dspr2=vp8_short_idct4x4llm_dspr2 #iwalsh1 prototype void vp8_short_inv_walsh4x4_1 "short *input, short *output" +specialize vp8_short_inv_walsh4x4_1 dspr2 +vp8_short_inv_walsh4x4_1_dspr2=vp8_short_inv_walsh4x4_1_dspr2 # no asm yet #iwalsh16 prototype void vp8_short_inv_walsh4x4 "short *input, short *output" -specialize vp8_short_inv_walsh4x4 mmx sse2 media neon +specialize vp8_short_inv_walsh4x4 mmx sse2 media neon dspr2 vp8_short_inv_walsh4x4_media=vp8_short_inv_walsh4x4_v6 +vp8_short_inv_walsh4x4_dspr2=vp8_short_inv_walsh4x4_dspr2 #idct1_scalar_add prototype void vp8_dc_only_idct_add "short input, unsigned char *pred, int pred_stride, unsigned char *dst, int dst_stride" 
-specialize vp8_dc_only_idct_add mmx media neon +specialize vp8_dc_only_idct_add mmx media neon dspr2 vp8_dc_only_idct_add_media=vp8_dc_only_idct_add_v6 +vp8_dc_only_idct_add_dspr2=vp8_dc_only_idct_add_dspr2 # # RECON # prototype void vp8_copy_mem16x16 "unsigned char *src, int src_pitch, unsigned char *dst, int dst_pitch" -specialize vp8_copy_mem16x16 mmx sse2 media neon +specialize vp8_copy_mem16x16 mmx sse2 media neon dspr2 vp8_copy_mem16x16_media=vp8_copy_mem16x16_v6 +vp8_copy_mem16x16_dspr2=vp8_copy_mem16x16_dspr2 prototype void vp8_copy_mem8x8 "unsigned char *src, int src_pitch, unsigned char *dst, int dst_pitch" -specialize vp8_copy_mem8x8 mmx media neon +specialize vp8_copy_mem8x8 mmx media neon dspr2 vp8_copy_mem8x8_media=vp8_copy_mem8x8_v6 +vp8_copy_mem8x8_dspr2=vp8_copy_mem8x8_dspr2 prototype void vp8_copy_mem8x4 "unsigned char *src, int src_pitch, unsigned char *dst, int dst_pitch" -specialize vp8_copy_mem8x4 mmx media neon +specialize vp8_copy_mem8x4 mmx media neon dspr2 vp8_copy_mem8x4_media=vp8_copy_mem8x4_v6 +vp8_copy_mem8x4_dspr2=vp8_copy_mem8x4_dspr2 prototype void vp8_build_intra_predictors_mby_s "struct macroblockd *x, unsigned char * yabove_row, unsigned char * yleft, int left_stride, unsigned char * ypred_ptr, int y_stride" specialize vp8_build_intra_predictors_mby_s sse2 ssse3 @@ -177,20 +192,24 @@ fi # Subpixel # prototype void vp8_sixtap_predict16x16 "unsigned char *src, int src_pitch, int xofst, int yofst, unsigned char *dst, int dst_pitch" -specialize vp8_sixtap_predict16x16 mmx sse2 ssse3 media neon +specialize vp8_sixtap_predict16x16 mmx sse2 ssse3 media neon dspr2 vp8_sixtap_predict16x16_media=vp8_sixtap_predict16x16_armv6 +vp8_sixtap_predict16x16_dspr2=vp8_sixtap_predict16x16_dspr2 prototype void vp8_sixtap_predict8x8 "unsigned char *src, int src_pitch, int xofst, int yofst, unsigned char *dst, int dst_pitch" -specialize vp8_sixtap_predict8x8 mmx sse2 ssse3 media neon +specialize vp8_sixtap_predict8x8 mmx sse2 ssse3 media neon dspr2 
vp8_sixtap_predict8x8_media=vp8_sixtap_predict8x8_armv6 +vp8_sixtap_predict8x8_dspr2=vp8_sixtap_predict8x8_dspr2 prototype void vp8_sixtap_predict8x4 "unsigned char *src, int src_pitch, int xofst, int yofst, unsigned char *dst, int dst_pitch" -specialize vp8_sixtap_predict8x4 mmx sse2 ssse3 media neon +specialize vp8_sixtap_predict8x4 mmx sse2 ssse3 media neon dspr2 vp8_sixtap_predict8x4_media=vp8_sixtap_predict8x4_armv6 +vp8_sixtap_predict8x4_dspr2=vp8_sixtap_predict8x4_dspr2 prototype void vp8_sixtap_predict4x4 "unsigned char *src, int src_pitch, int xofst, int yofst, unsigned char *dst, int dst_pitch" -specialize vp8_sixtap_predict4x4 mmx ssse3 media neon +specialize vp8_sixtap_predict4x4 mmx ssse3 media neon dspr2 vp8_sixtap_predict4x4_media=vp8_sixtap_predict4x4_armv6 +vp8_sixtap_predict4x4_dspr2=vp8_sixtap_predict4x4_dspr2 prototype void vp8_bilinear_predict16x16 "unsigned char *src, int src_pitch, int xofst, int yofst, unsigned char *dst, int dst_pitch" specialize vp8_bilinear_predict16x16 mmx sse2 ssse3 media neon |