libavcodec.hg: ppc/gmc_altivec.c comparison

comparison ppc/gmc_altivec.c @ 1352:e8ff4783f188 libavcodec

1) Remove TBL support from the PPC performance code: it's much more useful to use the PMCs, and with Apple's CHUD it's fairly easy too, so there is no reason to keep useless code around. 2) Make the PPC perf stuff a configure option. 3) Make put_pixels16_altivec a bit faster by unrolling the loop by 4. Patch by Romain Dolbeau <dolbeau at irisa dot fr>.

author	michaelni
date	Wed, 09 Jul 2003 20:18:13 +0000
parents	09b8fe0f0139
children	b370288f004d

comparison

equal deleted inserted replaced

-:0fc1a6f8ca94
+:e8ff4783f188
 to preserve proper dst alignment.
 */
 #define GMC1_PERF_COND (h==8)
 void gmc1_altivec(uint8_t *dst /* align 8 */, uint8_t *src /* align1 */, int stride, int h, int x16, int y16, int rounder)
 {
-POWERPC_TBL_DECLARE(altivec_gmc1_num, GMC1_PERF_COND);
+POWERPC_PERF_DECLARE(altivec_gmc1_num, GMC1_PERF_COND);
 #ifdef ALTIVEC_USE_REFERENCE_C_CODE
 const int A=(16-x16)*(16-y16);
 const int B=(   x16)*(16-y16);
 const int C=(16-x16)*(   y16);
 const int D=(   x16)*(   y16);
 int i;
-POWERPC_TBL_START_COUNT(altivec_gmc1_num, GMC1_PERF_COND);
+POWERPC_PERF_START_COUNT(altivec_gmc1_num, GMC1_PERF_COND);
 for(i=0; i<h; i++)
 {
 dst[0]= (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1] + rounder)>>8;
 dst[1]= (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2] + rounder)>>8;
 dst[7]= (A*src[7] + B*src[8] + C*src[stride+7] + D*src[stride+8] + rounder)>>8;
 dst+= stride;
 src+= stride;
 }
-POWERPC_TBL_STOP_COUNT(altivec_gmc1_num, GMC1_PERF_COND);
+POWERPC_PERF_STOP_COUNT(altivec_gmc1_num, GMC1_PERF_COND);
 #else /* ALTIVEC_USE_REFERENCE_C_CODE */
 const unsigned short __attribute__ ((aligned(16))) rounder_a[8] =
 {rounder, rounder, rounder, rounder,
 rounder, rounder, rounder, rounder};
 int i;
 unsigned long dst_odd = (unsigned long)dst & 0x0000000F;
 unsigned long src_really_odd = (unsigned long)src & 0x0000000F;
-POWERPC_TBL_START_COUNT(altivec_gmc1_num, GMC1_PERF_COND);
+POWERPC_PERF_START_COUNT(altivec_gmc1_num, GMC1_PERF_COND);
 tempA = vec_ld(0, (unsigned short*)ABCD);
 Av = vec_splat(tempA, 0);
 Bv = vec_splat(tempA, 1);
 Cv = vec_splat(tempA, 2);
 dst += stride;
 src += stride;
 }
-POWERPC_TBL_STOP_COUNT(altivec_gmc1_num, GMC1_PERF_COND);
+POWERPC_PERF_STOP_COUNT(altivec_gmc1_num, GMC1_PERF_COND);
 #endif /* ALTIVEC_USE_REFERENCE_C_CODE */
 }

Mercurial > libavcodec.hg

comparison ppc/gmc_altivec.c @ 1352:e8ff4783f188 libavcodec