# HG changeset patch # User diego # Date 1158445569 0 # Node ID 4d346abd723c9ccf3e4de0b4667fb2cfc8c7de4c # Parent eae401c5bf30a7e32952ef75627784138666b72c ADI Blackfin optimizations patch by Michael Benjamin, neuroptik gmail com diff -r eae401c5bf30 -r 4d346abd723c Makefile --- a/Makefile Sat Sep 16 00:51:49 2006 +0000 +++ b/Makefile Sat Sep 16 22:26:09 2006 +0000 @@ -357,6 +357,7 @@ ppc/snow_altivec.o \ ppc/vc1dsp_altivec.o \ ppc/float_altivec.o +OBJS-$(TARGET_ARCH_BFIN) += bfin/dsputil_bfin.o CFLAGS += $(CFLAGS-yes) OBJS += $(OBJS-yes) diff -r eae401c5bf30 -r 4d346abd723c bfin/dsputil_bfin.c --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/bfin/dsputil_bfin.c Sat Sep 16 22:26:09 2006 +0000 @@ -0,0 +1,53 @@ +/* + * Copyright (c) 2006 Michael Benjamin + * + * This library is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2 of the License, or (at your option) any later version. + * + * This library is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with this library; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +#include "../avcodec.h" +#include "../dsputil.h" + +static int sad8x8_bfin( void *c, uint8_t *blk1, uint8_t *blk2, int line_size, int h ) +{ + int sum; + __asm__ __volatile__ ( + "P0 = %1;" // blk1 + "P1 = %2;" // blk2 + "P2 = %3;\n" // h + "I0 = P0;" + "I1 = P1;\n" + "A0 = 0;" + "A1 = 0;\n" + "M0 = P2;\n" + "P3 = 32;\n" + "LSETUP (sad8x8LoopBegin, sad8x8LoopEnd) LC0=P3;\n" + "sad8x8LoopBegin:\n" + " DISALGNEXCPT || R0 = [I0] || R2 = [I1];\n" + " DISALGNEXCPT || R1 = [I0++] || R3 = [I1++];\n" + "sad8x8LoopEnd:\n" + " SAA ( R1:0 , R3:2 );\n" + "R3 = A1.L + A1.H, R2 = A0.L + A0.H;\n" + "%0 = R2 + R3 (S);\n" + : "=&d" (sum) + : "m"(blk1), "m"(blk2), "m"(h) + : "P0","P1","P2","I0","I1","A0","A1","R0","R1","R2","R3"); + return sum; +} + +void dsputil_init_bfin( DSPContext* c, AVCodecContext *avctx ) +{ + c->pix_abs[1][0] = sad8x8_bfin; + c->sad[1] = sad8x8_bfin; +} diff -r eae401c5bf30 -r 4d346abd723c dsputil.c --- a/dsputil.c Sat Sep 16 00:51:49 2006 +0000 +++ b/dsputil.c Sat Sep 16 22:26:09 2006 +0000 @@ -4189,6 +4189,9 @@ #ifdef ARCH_SH4 dsputil_init_sh4(c,avctx); #endif +#ifdef ARCH_BFIN + dsputil_init_bfin(c,avctx); +#endif switch(c->idct_permutation_type){ case FF_NO_IDCT_PERM: diff -r eae401c5bf30 -r 4d346abd723c dsputil.h --- a/dsputil.h Sat Sep 16 00:51:49 2006 +0000 +++ b/dsputil.h Sat Sep 16 22:26:09 2006 +0000 @@ -571,6 +571,13 @@ void dsputil_init_sh4(DSPContext* c, AVCodecContext *avctx); +#elif defined(ARCH_BFIN) + +#define DECLARE_ALIGNED_8(t,v) t v __attribute__ ((aligned (8))) +#define STRIDE_ALIGN 8 + +void dsputil_init_bfin(DSPContext* c, AVCodecContext *avctx); + #else #define DECLARE_ALIGNED_8(t,v) t v __attribute__ ((aligned (8)))