changeset 2082:3dc9bbe1b152 libavcodec

polyphase kaiser windowed sinc and blackman nuttall windowed sinc audio resample filters
author michael
date Thu, 17 Jun 2004 15:43:23 +0000
parents d3015863f745
children 76cdbe832239
files avcodec.h imgresample.c resample.c resample2.c
diffstat 4 files changed, 249 insertions(+), 174 deletions(-) [+]
line wrap: on
line diff
--- a/avcodec.h	Wed Jun 16 02:53:12 2004 +0000
+++ b/avcodec.h	Thu Jun 17 15:43:23 2004 +0000
@@ -1846,6 +1846,7 @@
 /* resample.c */
 
 struct ReSampleContext;
+struct AVResampleContext;
 
 typedef struct ReSampleContext ReSampleContext;
 
@@ -1854,6 +1855,9 @@
 int audio_resample(ReSampleContext *s, short *output, short *input, int nb_samples);
 void audio_resample_close(ReSampleContext *s);
 
+struct AVResampleContext *av_resample_init(int out_rate, int in_rate);
+int av_resample(struct AVResampleContext *c, short *dst, short *src, int *consumed, int src_size, int dst_size, int update_ctx);
+
 /* YUV420 format is assumed ! */
 
 struct ImgReSampleContext;
--- a/imgresample.c	Wed Jun 16 02:53:12 2004 +0000
+++ b/imgresample.c	Thu Jun 17 15:43:23 2004 +0000
@@ -55,6 +55,8 @@
     uint8_t *line_buf;
 };
 
+void av_build_filter(int16_t *filter, double factor, int tap_count, int phase_count, int scale, int type);
+
 static inline int get_phase(int pos)
 {
     return ((pos) >> (POS_FRAC_BITS - PHASE_BITS)) & ((1 << PHASE_BITS) - 1);
@@ -540,48 +542,6 @@
     }
 }
 
-/* XXX: the following filter is quite naive, but it seems to suffice
-   for 4 taps */
-static void build_filter(int16_t *filter, float factor)
-{
-    int ph, i, v;
-    float x, y, tab[NB_TAPS], norm, mult, target;
-
-    /* if upsampling, only need to interpolate, no filter */
-    if (factor > 1.0)
-        factor = 1.0;
-
-    for(ph=0;ph<NB_PHASES;ph++) {
-        norm = 0;
-        for(i=0;i<NB_TAPS;i++) {
-#if 1
-            const float d= -0.5; //first order derivative = -0.5
-            x = fabs(((float)(i - FCENTER) - (float)ph / NB_PHASES) * factor);
-            if(x<1.0) y= 1 - 3*x*x + 2*x*x*x + d*(            -x*x + x*x*x);
-            else      y=                       d*(-4 + 8*x - 5*x*x + x*x*x);
-#else
-            x = M_PI * ((float)(i - FCENTER) - (float)ph / NB_PHASES) * factor;
-            if (x == 0)
-                y = 1.0;
-            else
-                y = sin(x) / x;
-#endif
-            tab[i] = y;
-            norm += y;
-        }
-
-        /* normalize so that an uniform color remains the same */
-        target= 1 << FILTER_BITS;
-        for(i=0;i<NB_TAPS;i++) {
-            mult = target / norm;
-            v = lrintf(tab[i] * mult);
-            filter[ph * NB_TAPS + i] = v;
-            norm -= tab[i];
-            target -= v;
-        }
-    }
-}
-
 ImgReSampleContext *img_resample_init(int owidth, int oheight,
                                       int iwidth, int iheight)
 {
@@ -626,10 +586,10 @@
     s->h_incr = ((iwidth - leftBand - rightBand) * POS_FRAC) / s->pad_owidth;
     s->v_incr = ((iheight - topBand - bottomBand) * POS_FRAC) / s->pad_oheight; 
 
-    build_filter(&s->h_filters[0][0], (float) s->pad_owidth  / 
-            (float) (iwidth - leftBand - rightBand));
-    build_filter(&s->v_filters[0][0], (float) s->pad_oheight / 
-            (float) (iheight - topBand - bottomBand));
+    av_build_filter(&s->h_filters[0][0], (float) s->pad_owidth  / 
+            (float) (iwidth - leftBand - rightBand), NB_TAPS, NB_PHASES, 1<<FILTER_BITS, 0);
+    av_build_filter(&s->v_filters[0][0], (float) s->pad_oheight / 
+            (float) (iheight - topBand - bottomBand), NB_TAPS, NB_PHASES, 1<<FILTER_BITS, 0);
 
     return s;
 fail:
--- a/resample.c	Wed Jun 16 02:53:12 2004 +0000
+++ b/resample.c	Thu Jun 17 15:43:23 2004 +0000
@@ -24,103 +24,17 @@
 
 #include "avcodec.h"
 
-typedef struct {
-    /* fractional resampling */
-    uint32_t incr; /* fractional increment */
-    uint32_t frac;
-    int last_sample;
-    /* integer down sample */
-    int iratio;  /* integer divison ratio */
-    int icount, isum;
-    int inv;
-} ReSampleChannelContext;
+struct AVResampleContext;
 
 struct ReSampleContext {
-    ReSampleChannelContext channel_ctx[2];
+    struct AVResampleContext *resample_context;
+    short *temp[2];
+    int temp_len;
     float ratio;
     /* channel convert */
     int input_channels, output_channels, filter_channels;
 };
 
-
-#define FRAC_BITS 16
-#define FRAC (1 << FRAC_BITS)
-
-static void init_mono_resample(ReSampleChannelContext *s, float ratio)
-{
-    ratio = 1.0 / ratio;
-    s->iratio = (int)floorf(ratio);
-    if (s->iratio == 0)
-        s->iratio = 1;
-    s->incr = (int)((ratio / s->iratio) * FRAC);
-    s->frac = FRAC;
-    s->last_sample = 0;
-    s->icount = s->iratio;
-    s->isum = 0;
-    s->inv = (FRAC / s->iratio);
-}
-
-/* fractional audio resampling */
-static int fractional_resample(ReSampleChannelContext *s, short *output, short *input, int nb_samples)
-{
-    unsigned int frac, incr;
-    int l0, l1;
-    short *q, *p, *pend;
-
-    l0 = s->last_sample;
-    incr = s->incr;
-    frac = s->frac;
-
-    p = input;
-    pend = input + nb_samples;
-    q = output;
-
-    l1 = *p++;
-    for(;;) {
-        /* interpolate */
-        *q++ = (l0 * (FRAC - frac) + l1 * frac) >> FRAC_BITS;
-        frac = frac + s->incr;
-        while (frac >= FRAC) {
-            frac -= FRAC;
-            if (p >= pend)
-                goto the_end;
-            l0 = l1;
-            l1 = *p++;
-        }
-    }
- the_end:
-    s->last_sample = l1;
-    s->frac = frac;
-    return q - output;
-}
-
-static int integer_downsample(ReSampleChannelContext *s, short *output, short *input, int nb_samples)
-{
-    short *q, *p, *pend;
-    int c, sum;
-
-    p = input;
-    pend = input + nb_samples;
-    q = output;
-
-    c = s->icount;
-    sum = s->isum;
-
-    for(;;) {
-        sum += *p++;
-        if (--c == 0) {
-            *q++ = (sum * s->inv) >> FRAC_BITS;
-            c = s->iratio;
-            sum = 0;
-        }
-        if (p >= pend)
-            break;
-    }
-    s->isum = sum;
-    s->icount = c;
-    return q - output;
-}
-
 /* n1: number of samples */
 static void stereo_to_mono(short *output, short *input, int n1)
 {
@@ -210,31 +124,6 @@
     }
 }
 
-static int mono_resample(ReSampleChannelContext *s, short *output, short *input, int nb_samples)
-{
-    short *buf1;
-    short *buftmp;
-
-    buf1= (short*)av_malloc( nb_samples * sizeof(short) );
-
-    /* first downsample by an integer factor with averaging filter */
-    if (s->iratio > 1) {
-        buftmp = buf1;
-        nb_samples = integer_downsample(s, buftmp, input, nb_samples);
-    } else {
-        buftmp = input;
-    }
-
-    /* then do a fractional resampling with linear interpolation */
-    if (s->incr != FRAC) {
-        nb_samples = fractional_resample(s, output, buftmp, nb_samples);
-    } else {
-        memcpy(output, buftmp, nb_samples * sizeof(short));
-    }
-    av_free(buf1);
-    return nb_samples;
-}
-
 ReSampleContext *audio_resample_init(int output_channels, int input_channels, 
                                       int output_rate, int input_rate)
 {
@@ -271,16 +160,13 @@
     if(s->filter_channels>2)
       s->filter_channels = 2;
 
-    for(i=0;i<s->filter_channels;i++) {
-        init_mono_resample(&s->channel_ctx[i], s->ratio);
-    }
+    s->resample_context= av_resample_init(output_rate, input_rate);
+    
     return s;
 }
 
 /* resample audio. 'nb_samples' is the number of input samples */
 /* XXX: optimize it ! */
-/* XXX: do it with polyphase filters, since the quality here is
-   HORRIBLE. Return the number of samples available in output */
 int audio_resample(ReSampleContext *s, short *output, short *input, int nb_samples)
 {
     int i, nb_samples1;
@@ -296,8 +182,11 @@
     }
 
     /* XXX: move those malloc to resample init code */
-    bufin[0]= (short*) av_malloc( nb_samples * sizeof(short) );
-    bufin[1]= (short*) av_malloc( nb_samples * sizeof(short) );
+    for(i=0; i<s->filter_channels; i++){
+        bufin[i]= (short*) av_malloc( (nb_samples + s->temp_len) * sizeof(short) );
+        memcpy(bufin[i], s->temp[i], s->temp_len * sizeof(short));
+        buftmp2[i] = bufin[i] + s->temp_len;
+    }
     
     /* make some zoom to avoid round pb */
     lenout= (int)(nb_samples * s->ratio) + 16;
@@ -306,27 +195,32 @@
 
     if (s->input_channels == 2 &&
         s->output_channels == 1) {
-        buftmp2[0] = bufin[0];
         buftmp3[0] = output;
         stereo_to_mono(buftmp2[0], input, nb_samples);
     } else if (s->output_channels >= 2 && s->input_channels == 1) {
-        buftmp2[0] = input;
         buftmp3[0] = bufout[0];
+        memcpy(buftmp2[0], input, nb_samples*sizeof(short));
     } else if (s->output_channels >= 2) {
-        buftmp2[0] = bufin[0];
-        buftmp2[1] = bufin[1];
         buftmp3[0] = bufout[0];
         buftmp3[1] = bufout[1];
         stereo_split(buftmp2[0], buftmp2[1], input, nb_samples);
     } else {
-        buftmp2[0] = input;
         buftmp3[0] = output;
+        memcpy(buftmp2[0], input, nb_samples*sizeof(short));
     }
 
+    nb_samples += s->temp_len;
+
     /* resample each channel */
     nb_samples1 = 0; /* avoid warning */
     for(i=0;i<s->filter_channels;i++) {
-        nb_samples1 = mono_resample(&s->channel_ctx[i], buftmp3[i], buftmp2[i], nb_samples);
+        int consumed;
+        int is_last= i+1 == s->filter_channels;
+
+        nb_samples1 = av_resample(s->resample_context, buftmp3[i], bufin[i], &consumed, nb_samples, lenout, is_last);
+        s->temp_len= nb_samples - consumed;
+        s->temp[i]= av_realloc(s->temp[i], s->temp_len*sizeof(short));
+        memcpy(s->temp[i], bufin[i] + consumed, s->temp_len*sizeof(short));
     }
 
     if (s->output_channels == 2 && s->input_channels == 1) {
@@ -347,5 +241,8 @@
 
 void audio_resample_close(ReSampleContext *s)
 {
+    av_resample_close(s->resample_context);
+    av_freep(&s->temp[0]);
+    av_freep(&s->temp[1]);
     av_free(s);
 }
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/resample2.c	Thu Jun 17 15:43:23 2004 +0000
@@ -0,0 +1,214 @@
+/*
+ * audio resampling
+ * Copyright (c) 2004 Michael Niedermayer <michaelni@gmx.at>
+ *
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2 of the License, or (at your option) any later version.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with this library; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+ *
+ */
+ 
+/**
+ * @file resample2.c
+ * audio resampling
+ * @author Michael Niedermayer <michaelni@gmx.at>
+ */
+
+#include "avcodec.h"
+#include "common.h"
+
+#define PHASE_SHIFT 10
+#define PHASE_COUNT (1<<PHASE_SHIFT)
+#define PHASE_MASK (PHASE_COUNT-1)
+#define FILTER_SHIFT 15
+
+typedef struct AVResampleContext{
+    short *filter_bank;
+    int filter_length;
+    int ideal_dst_incr;
+    int dst_incr;
+    int index;
+    int frac;
+    int src_incr;
+    int compensation_distance;
+}AVResampleContext;
+
+/**
+ * 0th order modified bessel function of the first kind.
+ */
+double bessel(double x){
+    double v=1;
+    double t=1;
+    int i;
+    
+    for(i=1; i<50; i++){
+        t *= i;
+        v += pow(x*x/4, i)/(t*t);
+    }
+    return v;
+}
+
+/**
+ * builds a polyphase filterbank.
+ * @param factor resampling factor
+ * @param scale wanted sum of coefficients for each filter
+ * @param type 0->cubic, 1->blackman nuttall windowed sinc, 2->kaiser windowed sinc beta=16
+ */
+void av_build_filter(int16_t *filter, double factor, int tap_count, int phase_count, int scale, int type){
+    int ph, i, v;
+    double x, y, w, tab[tap_count];
+    const int center= (tap_count-1)/2;
+
+    /* if upsampling, only need to interpolate, no filter */
+    if (factor > 1.0)
+        factor = 1.0;
+
+    for(ph=0;ph<phase_count;ph++) {
+        double norm = 0;
+        double e= 0;
+        for(i=0;i<tap_count;i++) {
+            x = M_PI * ((double)(i - center) - (double)ph / phase_count) * factor;
+            if (x == 0) y = 1.0;
+            else        y = sin(x) / x;
+            switch(type){
+            case 0:{
+                const float d= -0.5; //first order derivative = -0.5
+                x = fabs(((double)(i - center) - (double)ph / phase_count) * factor);
+                if(x<1.0) y= 1 - 3*x*x + 2*x*x*x + d*(            -x*x + x*x*x);
+                else      y=                       d*(-4 + 8*x - 5*x*x + x*x*x);
+                break;}
+            case 1:
+                w = 2.0*x / (factor*tap_count) + M_PI;
+                y *= 0.3635819 - 0.4891775 * cos(w) + 0.1365995 * cos(2*w) - 0.0106411 * cos(3*w);
+                break;
+            case 2:
+                w = 2.0*x / (factor*tap_count*M_PI);
+                y *= bessel(16*sqrt(FFMAX(1-w*w, 0))) / bessel(16);
+                break;
+            }
+
+            tab[i] = y;
+            norm += y;
+        }
+
+        /* normalize so that an uniform color remains the same */
+        for(i=0;i<tap_count;i++) {
+            v = clip(lrintf(tab[i] * scale / norm) + e, -32768, 32767);
+            filter[ph * tap_count + i] = v;
+            e += tab[i] * scale / norm - v;
+        }
+    }
+}
+
+/**
+ * initalizes a audio resampler.
+ * note, if either rate is not a integer then simply scale both rates up so they are
+ */
+AVResampleContext *av_resample_init(int out_rate, int in_rate){
+    AVResampleContext *c= av_mallocz(sizeof(AVResampleContext));
+    double factor= FFMIN(out_rate / (double)in_rate, 1.0);
+
+    memset(c, 0, sizeof(AVResampleContext));
+
+    c->filter_length= ceil(16.0/factor);
+    c->filter_bank= av_mallocz(c->filter_length*(PHASE_COUNT+1)*sizeof(short));
+    av_build_filter(c->filter_bank, factor, c->filter_length, PHASE_COUNT, 1<<FILTER_SHIFT, 1);
+    c->filter_bank[c->filter_length*PHASE_COUNT + (c->filter_length-1) + 1]= (1<<FILTER_SHIFT)-1;
+    c->filter_bank[c->filter_length*PHASE_COUNT + (c->filter_length-1) + 2]= 1;
+
+    c->src_incr= out_rate;
+    c->ideal_dst_incr= c->dst_incr= in_rate * PHASE_COUNT;
+    c->index= -PHASE_COUNT*((c->filter_length-1)/2);
+
+    return c;
+}
+
+void av_resample_close(AVResampleContext *c){
+    av_freep(&c->filter_bank);
+    av_freep(&c);
+}
+
+void av_resample_compensate(AVResampleContext *c, int sample_delta, int compensation_distance){
+    assert(!c->compensation_distance); //FIXME
+
+    c->compensation_distance= compensation_distance;
+    c->dst_incr-= c->ideal_dst_incr * sample_delta / compensation_distance;
+}
+
+/**
+ * resamples.
+ * @param src an array of unconsumed samples
+ * @param consumed the number of samples of src which have been consumed are returned here
+ * @param src_size the number of unconsumed samples available
+ * @param dst_size the amount of space in samples available in dst
+ * @param update_ctx if this is 0 then the context wont be modified, that way several channels can be resampled with the same context
+ * @return the number of samples written in dst or -1 if an error occured
+ */
+int av_resample(AVResampleContext *c, short *dst, short *src, int *consumed, int src_size, int dst_size, int update_ctx){
+    int dst_index, i;
+    int index= c->index;
+    int frac= c->frac;
+    int dst_incr_frac= c->dst_incr % c->src_incr;
+    int dst_incr=      c->dst_incr / c->src_incr;
+    
+    if(c->compensation_distance && c->compensation_distance < dst_size)
+        dst_size= c->compensation_distance;
+    
+    for(dst_index=0; dst_index < dst_size; dst_index++){
+        short *filter= c->filter_bank + c->filter_length*(index & PHASE_MASK);
+        int sample_index= index >> PHASE_SHIFT;
+        int val=0;
+        
+        if(sample_index < 0){
+            for(i=0; i<c->filter_length; i++)
+                val += src[ABS(sample_index + i)] * filter[i];
+        }else if(sample_index + c->filter_length > src_size){
+            break;
+        }else{
+#if 0
+            int64_t v=0;
+            int sub_phase= (frac<<12) / c->src_incr;
+            for(i=0; i<c->filter_length; i++){
+                int64_t coeff= filter[i]*(4096 - sub_phase) + filter[i + c->filter_length]*sub_phase;
+                v += src[sample_index + i] * coeff;
+            }
+            val= v>>12;
+#else
+            for(i=0; i<c->filter_length; i++){
+                val += src[sample_index + i] * filter[i];
+            }
+#endif
+        }
+
+        val = (val + (1<<(FILTER_SHIFT-1)))>>FILTER_SHIFT;
+        dst[dst_index] = (unsigned)(val + 32768) > 65535 ? (val>>31) ^ 32767 : val;
+
+        frac += dst_incr_frac;
+        index += dst_incr;
+        if(frac >= c->src_incr){
+            frac -= c->src_incr;
+            index++;
+        }
+    }
+    if(update_ctx){
+        if(c->compensation_distance){
+            c->compensation_distance -= index;
+            if(!c->compensation_distance)
+                c->dst_incr= c->ideal_dst_incr;
+        }
+        c->frac= frac;
+        c->index=0;
+    }
+    *consumed= index >> PHASE_SHIFT;
+    return dst_index;
+}