diff fft.c @ 10400:866dffa620d1 libavcodec

Use hardcoded instead of runtime-calculated ff_cos_* tables if --enable-hardcoded-tables was used. Due to the size, the code for the tables is generated at compile time.
author reimar
date Wed, 14 Oct 2009 21:41:24 +0000
parents 74715d4288ad
children 57acce8b1380
line wrap: on
line diff
--- a/fft.c	Wed Oct 14 05:28:24 2009 +0000
+++ b/fft.c	Wed Oct 14 21:41:24 2009 +0000
@@ -28,20 +28,31 @@
 
 #include "dsputil.h"
 
+#if CONFIG_HARDCODED_TABLES
+#define COSTABLE(size) \
+    extern const DECLARE_ALIGNED_16(FFTSample, ff_cos_##size[size/2]);
+#else
+#define COSTABLE(size) \
+    DECLARE_ALIGNED_16(FFTSample, ff_cos_##size[size/2]);
+#endif
+
 /* cos(2*pi*x/n) for 0<=x<=n/4, followed by its reverse */
-DECLARE_ALIGNED_16(FFTSample, ff_cos_16[8]);
-DECLARE_ALIGNED_16(FFTSample, ff_cos_32[16]);
-DECLARE_ALIGNED_16(FFTSample, ff_cos_64[32]);
-DECLARE_ALIGNED_16(FFTSample, ff_cos_128[64]);
-DECLARE_ALIGNED_16(FFTSample, ff_cos_256[128]);
-DECLARE_ALIGNED_16(FFTSample, ff_cos_512[256]);
-DECLARE_ALIGNED_16(FFTSample, ff_cos_1024[512]);
-DECLARE_ALIGNED_16(FFTSample, ff_cos_2048[1024]);
-DECLARE_ALIGNED_16(FFTSample, ff_cos_4096[2048]);
-DECLARE_ALIGNED_16(FFTSample, ff_cos_8192[4096]);
-DECLARE_ALIGNED_16(FFTSample, ff_cos_16384[8192]);
-DECLARE_ALIGNED_16(FFTSample, ff_cos_32768[16384]);
-DECLARE_ALIGNED_16(FFTSample, ff_cos_65536[32768]);
+COSTABLE(16)
+COSTABLE(32)
+COSTABLE(64)
+COSTABLE(128)
+COSTABLE(256)
+COSTABLE(512)
+COSTABLE(1024)
+COSTABLE(2048)
+COSTABLE(4096)
+COSTABLE(8192)
+COSTABLE(16384)
+COSTABLE(32768)
+COSTABLE(65536)
+#if CONFIG_HARDCODED_TABLES
+const
+#endif
 FFTSample * const ff_cos_tabs[] = {
     ff_cos_16, ff_cos_32, ff_cos_64, ff_cos_128, ff_cos_256, ff_cos_512, ff_cos_1024,
     ff_cos_2048, ff_cos_4096, ff_cos_8192, ff_cos_16384, ff_cos_32768, ff_cos_65536,
@@ -93,6 +104,7 @@
     if (HAVE_MMX)     ff_fft_init_mmx(s);
 
     if (s->split_radix) {
+#if !CONFIG_HARDCODED_TABLES
         for(j=4; j<=nbits; j++) {
             int m = 1<<j;
             double freq = 2*M_PI/m;
@@ -102,6 +114,7 @@
             for(i=1; i<m/4; i++)
                 tab[m/2-i] = tab[i];
         }
+#endif
         for(i=0; i<n; i++)
             s->revtab[-split_radix_permutation(i, n, s->inverse) & (n-1)] = i;
         s->tmp_buf = av_malloc(n * sizeof(FFTComplex));