Mercurial > libavcodec.hg
diff x86/vp8dsp.asm @ 11992:da388061b227 libavcodec
Add x86 asm functions for VP8 put_pixels
author | darkshikari |
---|---|
date | Mon, 28 Jun 2010 19:14:40 +0000 |
parents | a6d24fc1deb7 |
children | a717c1a93036 |
line wrap: on
line diff
--- a/x86/vp8dsp.asm Mon Jun 28 18:56:24 2010 +0000 +++ b/x86/vp8dsp.asm Mon Jun 28 19:14:40 2010 +0000 @@ -810,6 +810,46 @@ jg .nextrow REP_RET +cglobal put_vp8_pixels8_mmx, 5,5 +.nextrow: + movq mm0, [r2+r3*0] + movq mm1, [r2+r3*1] + lea r2, [r2+r3*2] + movq [r0+r1*0], mm0 + movq [r0+r1*1], mm1 + lea r0, [r0+r1*2] + sub r4d, 2 + jg .nextrow + REP_RET + +cglobal put_vp8_pixels16_mmx, 5,5 +.nextrow: + movq mm0, [r2+r3*0+0] + movq mm1, [r2+r3*0+8] + movq mm2, [r2+r3*1+0] + movq mm3, [r2+r3*1+8] + lea r2, [r2+r3*2] + movq [r0+r1*0+0], mm0 + movq [r0+r1*0+8], mm1 + movq [r0+r1*1+0], mm2 + movq [r0+r1*1+8], mm3 + lea r0, [r0+r1*2] + sub r4d, 2 + jg .nextrow + REP_RET + +cglobal put_vp8_pixels16_sse, 5,5,2 +.nextrow: + movups xmm0, [r2+r3*0] + movups xmm1, [r2+r3*1] + lea r2, [r2+r3*2] + movaps [r0+r1*0], xmm0 + movaps [r0+r1*1], xmm1 + lea r0, [r0+r1*2] + sub r4d, 2 + jg .nextrow + REP_RET + ;----------------------------------------------------------------------------- ; IDCT functions: ;