Mercurial > libavcodec.hg
changeset 8542:5a923bd4f5c6 libavcodec
Add Altivec version of vector_fmul_window.
Patch by David Conrad %lessen42 A gmail P com%
author | gpoirier |
---|---|
date | Tue, 06 Jan 2009 23:03:33 +0000 |
parents | 16a315fdad0b |
children | 2cc3cf7b09b1 |
files | ppc/float_altivec.c |
diffstat | 1 files changed, 39 insertions(+), 0 deletions(-) [+] |
line wrap: on
line diff
```diff
--- a/ppc/float_altivec.c Tue Jan 06 22:29:26 2009 +0000
+++ b/ppc/float_altivec.c Tue Jan 06 23:03:33 2009 +0000
@@ -23,6 +23,7 @@
 #include "gcc_fixes.h"
 #include "dsputil_altivec.h"
+#include "util_altivec.h"
 static void vector_fmul_altivec(float *dst, const float *src, int len)
 {
@@ -149,6 +150,43 @@
     ff_vector_fmul_add_add_c(dst, src0, src1, src2, src3, len, step);
 }
+static void vector_fmul_window_altivec(float *dst, const float *src0, const float *src1, const float *win, float add_bias, int len)
+{
+    union {
+        vector float v;
+        float s[4];
+    } vadd;
+    vector float vadd_bias, zero, t0, t1, s0, s1, wi, wj;
+    const vector unsigned char reverse = vcprm(3,2,1,0);
+    int i,j;
+
+    dst += len;
+    win += len;
+    src0+= len;
+
+    vadd.s[0] = add_bias;
+    vadd_bias = vec_splat(vadd.v, 0);
+    zero = (vector float)vec_splat_u32(0);
+
+    for(i=-len*4, j=len*4-16; i<0; i+=16, j-=16) {
+        s0 = vec_ld(i, src0);
+        s1 = vec_ld(j, src1);
+        wi = vec_ld(i, win);
+        wj = vec_ld(j, win);
+
+        s1 = vec_perm(s1, s1, reverse);
+        wj = vec_perm(wj, wj, reverse);
+
+        t0 = vec_madd(s0, wj, vadd_bias);
+        t0 = vec_nmsub(s1, wi, t0);
+        t1 = vec_madd(s0, wi, vadd_bias);
+        t1 = vec_madd(s1, wj, t1);
+        t1 = vec_perm(t1, t1, reverse);
+
+        vec_st(t0, i, dst);
+        vec_st(t1, j, dst);
+    }
+}
 static void int32_to_float_fmul_scalar_altivec(float *dst, const int *src, float mul, int len)
 {
@@ -266,6 +304,7 @@
     c->vector_fmul_add_add = vector_fmul_add_add_altivec;
     c->int32_to_float_fmul_scalar = int32_to_float_fmul_scalar_altivec;
     if(!(avctx->flags & CODEC_FLAG_BITEXACT)) {
+        c->vector_fmul_window = vector_fmul_window_altivec;
         c->float_to_int16 = float_to_int16_altivec;
         c->float_to_int16_interleave = float_to_int16_interleave_altivec;
     }
```