diff --git a/vp8/common/x86/idctllm_mmx.asm b/vp8/common/x86/idctllm_mmx.asm index 815ee8eb9328c8591207421f043d0a79f7a59749..15e81addb3d6628231adccd5f6d2f2ccaa271ecc 100644 --- a/vp8/common/x86/idctllm_mmx.asm +++ b/vp8/common/x86/idctllm_mmx.asm @@ -196,7 +196,12 @@ cglobal short_idct4x4llm_1_mmx,3,3,0,inp,out,pit ;void dc_only_idct_add_mmx(short input_dc, unsigned char *pred_ptr, unsigned char *dst_ptr, int pitch, int stride) -cglobal dc_only_idct_add_mmx, 5,5,0,in_dc,pred,dst,pit,stride +cglobal dc_only_idct_add_mmx, 4,5,0,in_dc,pred,dst,pit,stride +%if ARCH_X86_64 + movsxd strideq, dword stridem +%else + mov strideq, stridem +%endif pxor m0, m0 movh m5, in_dcq ; dc diff --git a/vp8/decoder/x86/dequantize_mmx.asm b/vp8/decoder/x86/dequantize_mmx.asm index cc5bd156cad28a45c6efc716783cb74d471e112a..23080bfee88d2d5c70a425e9c4f9f447858281f3 100644 --- a/vp8/decoder/x86/dequantize_mmx.asm +++ b/vp8/decoder/x86/dequantize_mmx.asm @@ -44,7 +44,16 @@ cglobal dequantize_b_impl_mmx, 3,3,0,sq,dq,arg3 ;void dequant_idct_add_mmx(short *input, short *dq, unsigned char *pred, unsigned char *dest, int pitch, int stride) -cglobal dequant_idct_add_mmx, 6,6,0,inp,dq,pred,dest,pit,stride +cglobal dequant_idct_add_mmx, 4,6,0,inp,dq,pred,dest,pit,stride + +%if ARCH_X86_64 + movsxd strideq, dword stridem + movsxd pitq, dword pitm +%else + mov strideq, stridem + mov pitq, pitm +%endif + mova m0, [inpq+ 0] pmullw m0, [dqq] @@ -213,7 +222,17 @@ cglobal dequant_idct_add_mmx, 6,6,0,inp,dq,pred,dest,pit,stride ;void dequant_dc_idct_add_mmx(short *input, short *dq, unsigned char *pred, unsigned char *dest, int pitch, int stride, int Dc) -cglobal dequant_dc_idct_add_mmx, 7,7,0,inp,dq,pred,dest,pit,stride,Dc +cglobal dequant_dc_idct_add_mmx, 4,7,0,inp,dq,pred,dest,pit,stride,Dc + +%if ARCH_X86_64 + movsxd strideq, dword stridem + movsxd pitq, dword pitm +%else + mov strideq, stridem + mov pitq, pitm +%endif + + mov Dcq, Dcm mova m0, [inpq+ 0] pmullw m0, [dqq+ 0]