Mercurial > libavcodec.hg
annotate bfin/dsputil_bfin.h @ 12049:e6305257ceb6 libavcodec
PPC: Altivec IMDCT
Patch by Loren Merritt
author | mru |
---|---|
date | Thu, 01 Jul 2010 23:21:49 +0000 |
parents | 9f2381fb271b |
children |
rev | line source |
---|---|
5131 | 1 /* |
2 * BlackFin DSPUTILS COMMON OPTIMIZATIONS HEADER | |
3 * | |
4 * Copyright (C) 2007 Marc Hoffman <mmh@pleasantst.com> | |
5 * | |
6 * This file is part of FFmpeg. | |
7 * | |
8 * FFmpeg is free software; you can redistribute it and/or | |
9 * modify it under the terms of the GNU Lesser General Public | |
10 * License as published by the Free Software Foundation; either | |
11 * version 2.1 of the License, or (at your option) any later version. | |
12 * | |
13 * FFmpeg is distributed in the hope that it will be useful, | |
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
16 * Lesser General Public License for more details. | |
17 * | |
18 * You should have received a copy of the GNU Lesser General Public | |
19 * License along with FFmpeg; if not, write to the Free Software | |
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | |
21 */ | |
22 | |
23 | |
7760 | 24 #ifndef AVCODEC_BFIN_DSPUTIL_BFIN_H |
25 #define AVCODEC_BFIN_DSPUTIL_BFIN_H | |
5131 | 26 |
11416 | 27 #include "config.h" |
28 #include "libavcodec/dsputil.h" | |
29 | |
/* attribute_l1_text and attribute_l1_data_b expand to the l1_text and
 * l1_data_B attributes only when __FDPIC__ is defined and CONFIG_SRAM is
 * non-zero; in every other configuration both expand to nothing, so the
 * declarations that use them stay valid either way. */
11063 | 30 #if defined(__FDPIC__) && CONFIG_SRAM |
5131 | 31 #define attribute_l1_text __attribute__ ((l1_text)) |
6362
78aa57eba353
FLAT objects cannot have multiple sections, so using the L1 attributes breaks
diego
parents:
5830
diff
changeset
|
32 #define attribute_l1_data_b __attribute__((l1_data_B)) |
78aa57eba353
FLAT objects cannot have multiple sections, so using the L1 attributes breaks
diego
parents:
5830
diff
changeset
|
33 #else |
78aa57eba353
FLAT objects cannot have multiple sections, so using the L1 attributes breaks
diego
parents:
5830
diff
changeset
|
34 #define attribute_l1_text |
78aa57eba353
FLAT objects cannot have multiple sections, so using the L1 attributes breaks
diego
parents:
5830
diff
changeset
|
35 #define attribute_l1_data_b |
78aa57eba353
FLAT objects cannot have multiple sections, so using the L1 attributes breaks
diego
parents:
5830
diff
changeset
|
36 #endif |
5131 | 37 |
/* Prototypes for the ff_bfin_* routines; only the declarations are visible
 * here, the definitions live elsewhere. Every prototype except the three
 * ff_bfin_vp3_idct* ones carries attribute_l1_text, which may expand to
 * nothing depending on the build configuration.
 * NOTE(review): the dest_size/dsz parameters of the z_* and *uc variants are
 * not described anywhere in this header -- confirm their meaning against the
 * implementations. */
11398 | 38 void ff_bfin_idct (DCTELEM *block) attribute_l1_text; |
39 void ff_bfin_fdct (DCTELEM *block) attribute_l1_text; | |
40 void ff_bfin_vp3_idct (DCTELEM *block); | |
41 void ff_bfin_vp3_idct_put (uint8_t *dest, int line_size, DCTELEM *block); | |
42 void ff_bfin_vp3_idct_add (uint8_t *dest, int line_size, DCTELEM *block); | |
43 void ff_bfin_add_pixels_clamped (const DCTELEM *block, uint8_t *dest, int line_size) attribute_l1_text; | |
44 void ff_bfin_put_pixels_clamped (const DCTELEM *block, uint8_t *dest, int line_size) attribute_l1_text; | |
45 void ff_bfin_diff_pixels (DCTELEM *block, const uint8_t *s1, const uint8_t *s2, int stride) attribute_l1_text; | |
46 void ff_bfin_get_pixels (DCTELEM *restrict block, const uint8_t *pixels, int line_size) attribute_l1_text; | |
47 int ff_bfin_pix_norm1 (uint8_t * pix, int line_size) attribute_l1_text; | |
48 int ff_bfin_z_sad8x8 (uint8_t *blk1, uint8_t *blk2, int dsz, int line_size, int h) attribute_l1_text; | |
49 int ff_bfin_z_sad16x16 (uint8_t *blk1, uint8_t *blk2, int dsz, int line_size, int h) attribute_l1_text; | |
50 | |
51 void ff_bfin_z_put_pixels16_xy2 (uint8_t *block, const uint8_t *s0, int dest_size, int line_size, int h) attribute_l1_text; | |
52 void ff_bfin_z_put_pixels8_xy2 (uint8_t *block, const uint8_t *s0, int dest_size, int line_size, int h) attribute_l1_text; | |
53 void ff_bfin_put_pixels16_xy2_nornd (uint8_t *block, const uint8_t *s0, int line_size, int h) attribute_l1_text; | |
54 void ff_bfin_put_pixels8_xy2_nornd (uint8_t *block, const uint8_t *s0, int line_size, int h) attribute_l1_text; | |
55 | |
56 | |
57 int ff_bfin_pix_sum (uint8_t *p, int stride) attribute_l1_text; | |
58 | |
59 void ff_bfin_put_pixels8uc (uint8_t *block, const uint8_t *s0, const uint8_t *s1, int dest_size, int line_size, int h) attribute_l1_text; | |
60 void ff_bfin_put_pixels16uc (uint8_t *block, const uint8_t *s0, const uint8_t *s1, int dest_size, int line_size, int h) attribute_l1_text; | |
61 void ff_bfin_put_pixels8uc_nornd (uint8_t *block, const uint8_t *s0, const uint8_t *s1, int line_size, int h) attribute_l1_text; | |
62 void ff_bfin_put_pixels16uc_nornd (uint8_t *block, const uint8_t *s0, const uint8_t *s1, int line_size, int h) attribute_l1_text; | |
63 | |
64 int ff_bfin_sse4 (void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h) attribute_l1_text; | |
65 int ff_bfin_sse8 (void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h) attribute_l1_text; | |
66 int ff_bfin_sse16 (void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h) attribute_l1_text; | |
68 | |
5131 | 69 #ifdef BFIN_PROFILE |
70 | |
/* Profiling state, only present when BFIN_PROFILE is defined. The objects are
 * static and defined in this header, so each file including it gets its own
 * private copy.
 *   Telem[]      per-slot sum of read_time() deltas, accumulated by EPROF()
 *   TelemNames[] per-slot label, stored by EPROF(); prof_report() skips slots
 *                whose entry is still NULL
 *   TelemCnt     incremented by bfprof(); the divisor used by prof_report() */
71 static double Telem[16]; | |
72 static char *TelemNames[16]; | |
73 static int TelemCnt; | |
74 | |
5138
189a1229a7a6
removing underscores from block profiling renaming to xx_
mhoffman
parents:
5131
diff
changeset
|
/* PROF(lab,e) ... EPROF() bracket a timed region. PROF opens a brace scope
 * and records the slot index e, the label lab and the current read_time()
 * value; EPROF turns xx_t0 into the elapsed time, adds it to Telem[xx_e],
 * stores the label in TelemNames[xx_e] and closes the scope. Since the braces
 * are split across the two macros, they must be used as a matched pair inside
 * the same block.
 * NOTE(review): xx_e is not range-checked against the 16-entry arrays. */
75 #define PROF(lab,e) { int xx_e = e; char*xx_lab = lab; uint64_t xx_t0 = read_time(); |
189a1229a7a6
removing underscores from block profiling renaming to xx_
mhoffman
parents:
5131
diff
changeset
|
76 #define EPROF() xx_t0 = read_time()-xx_t0; Telem[xx_e] = Telem[xx_e] + xx_t0; TelemNames[xx_e] = xx_lab; } |
5131 | 77 |
/* Log the accumulated profiling counters through av_log at AV_LOG_DEBUG.
 * For every slot whose TelemNames entry is non-NULL, one line is printed with
 * the label, Telem[i]/TelemCnt, and that quotient divided by 64. A final
 * "total" line prints the same two figures for the sum over those slots,
 * followed by the raw sum and TelemCnt.
 * NOTE(review): the divisor 64 is presumably the number of samples in an 8x8
 * block -- confirm. TelemCnt is used as a divisor without a zero check; the
 * only registration visible here is in bfprof(), which increments it. */
78 static void prof_report (void) | |
79 { | |
80 int i; | |
81 double s = 0; | |
82 for (i=0;i<16;i++) { | |
83 double v; | |
84 if (TelemNames[i]) { | |
85 v = Telem[i]/TelemCnt; | |
86 av_log (NULL,AV_LOG_DEBUG,"%-20s: %12.4f\t%12.4f\n", TelemNames[i],v,v/64); | |
87 s = s + Telem[i]; | |
88 } | |
89 } | |
90 av_log (NULL,AV_LOG_DEBUG,"%-20s: %12.4f\t%12.4f\n%20.4f\t%d\n", | |
91 "total",s/TelemCnt,s/TelemCnt/64,s,TelemCnt); | |
92 } | |
93 | |
/* Count one profiled invocation. The first call registers prof_report() with
 * atexit(); every call, including the first, increments TelemCnt, which
 * prof_report() later uses as its averaging divisor.
 * NOTE(review): the return value of atexit() is not checked, and the static
 * init flag is not protected against concurrent callers. */
94 static void bfprof (void) | |
95 { | |
96 static int init; | |
97 if (!init) atexit (prof_report); | |
98 init=1; | |
99 TelemCnt++; | |
100 } | |
101 | |
102 #else | |
/* BFIN_PROFILE is not defined: the profiling hooks expand to nothing, so
 * call sites need no conditional compilation of their own. */
103 #define PROF(a,b) | |
104 #define EPROF() | |
105 #define bfprof() | |
106 #endif | |
107 | |
7760 | 108 #endif /* AVCODEC_BFIN_DSPUTIL_BFIN_H */ |