view ra144.c @ 6833:37464a7b3f59 libavcodec

Use ff_sqrt() function instead of using a table
author vitor
date Wed, 21 May 2008 16:33:49 +0000
parents 9584a95fefcd
children bf3bc36715e6
line wrap: on
line source

/*
 * Real Audio 1.0 (14.4K)
 * Copyright (c) 2003 the ffmpeg project
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include "avcodec.h"
#include "bitstream.h"
#include "ra144.h"

#define NBLOCKS         4       /* number of segments within a block */
#define BLOCKSIZE       40      /* (quarter) block size in 16-bit words (80 bytes) */
#define HALFBLOCK       20      /* BLOCKSIZE/2 */
#define BUFFERSIZE      146     /* for do_output */


/* internal globals */
typedef struct {
    unsigned int     oldval;
    unsigned int     gbuf1[8];
    unsigned short   gbuf2[120];
    unsigned int    *decptr;                /* decoder ptr */
    signed   short  *decsp;

    /* the swapped buffers */
    unsigned int     swapbuffers[4][10];
    unsigned int    *swapbuf1;
    unsigned int    *swapbuf2;
    unsigned int    *swapbuf1alt;
    unsigned int    *swapbuf2alt;

    unsigned int buffer[5];
    unsigned short int buffer_2[148];

    unsigned short *sptr;
} Real144_internal;

static int ra144_decode_init(AVCodecContext * avctx)
{
    Real144_internal *glob = avctx->priv_data;

    glob->swapbuf1    = glob->swapbuffers[0];
    glob->swapbuf2    = glob->swapbuffers[1];
    glob->swapbuf1alt = glob->swapbuffers[2];
    glob->swapbuf2alt = glob->swapbuffers[3];

    return 0;
}

/* lookup square roots in table */
static int t_sqrt(unsigned int x)
{
    int s = 0;
    while (x > 0xfff) {
        s++;
        x = x >> 2;
    }

    return (ff_sqrt(x << 20) << s) << 2;
}

/* do 'voice' */
static void do_voice(const int *a1, int *a2)
{
    int buffer[10];
    int *b1 = buffer;
    int *b2 = a2;
    int x, y;

    for (x=0; x < 10; x++) {
        b1[x] = a1[x] << 4;

        for (y=0; y < x; y++)
            b1[y] = ((a1[x] * b2[x-y-1]) >> 12) + b2[y];

        FFSWAP(int *, b1, b2);
    }

    for (x=0; x < 10; x++)
        a2[x] >>= 4;
}

/* rotate block */
static void rotate_block(const short *source, short *target, int offset)
{
    int i=0, k=0;
    source += BUFFERSIZE - offset;

    while (i<BLOCKSIZE) {
        target[i++] = source[k++];

        if (k == offset)
            k = 0;
    }
}

/* inverse root mean square */
static int irms(const short *data, int factor)
{
    const short *p1, *p2;
    unsigned int sum;

    p2 = (p1 = data) + BLOCKSIZE;
    for (sum=0; p2 > p1; p1++)
        sum += (*p1) * (*p1);

    if (sum == 0)
        return 0; /* OOPS - division by zero */

    return (0x20000000 / (t_sqrt(sum) >> 8)) * factor;
}

/* multiply/add wavetable */
static void add_wav(int n, int f, int m1, int m2, int m3, const short *s1,
                    const short *s2, const short *s3, short *dest)
{
    int a, b, c, i;
    const short *ptr, *ptr2;

    ptr  = wavtable1 + n * 9;
    ptr2 = wavtable2 + n * 9;

    if (f != 0)
        a = ((*ptr) * m1) >> ((*ptr2) + 1);
    else
        a = 0;

    ptr++;
    ptr2++;
    b = ((*ptr) * m2) >> ((*ptr2) + 1);
    ptr++;
    ptr2++;
    c = ((*ptr) * m3) >> ((*ptr2) + 1);

    if (f != 0)
        for (i=0; i < BLOCKSIZE; i++)
            dest[i] = ((*(s1++)) * a + (*(s2++)) * b + (*(s3++)) * c) >> 12;
    else
        for (i=0; i < BLOCKSIZE; i++)
            dest[i] = ((*(s2++)) * b + (*(s3++)) * c) >> 12;
}


static void final(const short *i1, const short *i2,
                  void *out, int *statbuf, int len)
{
    int x, sum, i;
    int buffer[10];
    short *ptr;
    short *ptr2;
    unsigned short int work[50];

    memcpy(work, statbuf,20);
    memcpy(work + 10, i2, len * 2);

    for(i=0; i<10; i++)
        buffer[9-i] = i1[i];

    ptr2 = (ptr = work) + len;

    while (ptr < ptr2) {
        for(sum=0, x=0; x<=9; x++)
            sum += buffer[x] * (ptr[x]);

        sum = sum >> 12;
        x = ptr[10] - sum;

        if (x<-32768 || x>32767) {
            memset(out, 0, len * 2);
            memset(statbuf, 0, 20);
            return;
        }

        ptr[10] = x;
        ptr++;
    }
    memcpy(out, ptr+10 - len, len * 2);
    memcpy(statbuf, ptr, 20);
}

static unsigned int rms(const int *data, int f)
{
    const int *c;
    int x;
    unsigned int res;
    int b;

    c = data;
    b = 0;
    res = 0x10000;
    for (x=0; x<10; x++) {
        res = (((0x1000000 - (*c) * (*c)) >> 12) * res) >> 12;

        if (res == 0)
            return 0;

        if (res <= 0x3fff) {
            while (res <= 0x3fff) {
                b++;
                res <<= 2;
            }
        } else {
            if (res > 0x10000)
                return 0; /* We're screwed, might as well go out with a bang. :P */
        }
        c++;
    }

    if (res > 0)
        res = t_sqrt(res);

    res >>= (b + 10);
    res = (res * f) >> 10;
    return res;
}

/* do quarter-block output */
static void do_output_subblock(Real144_internal *glob, const unsigned short  *gsp, unsigned int gval, signed short *output_buffer, GetBitContext *gb)
{
    unsigned short int buffer_a[40];
    unsigned short int *block;
    int e, f, g;
    int a = get_bits(gb, 7);
    int d = get_bits(gb, 8);
    int b = get_bits(gb, 7);
    int c = get_bits(gb, 7);

    if (a) {
        a += HALFBLOCK - 1;
        rotate_block(glob->buffer_2, buffer_a, a);
    }

    e = ((ftable1[b] >> 4) * gval) >> 8;
    f = ((ftable2[c] >> 4) * gval) >> 8;

    if (a)
        g = irms(buffer_a, gval) >> 12;
    else
        g = 0;

    memmove(glob->buffer_2, glob->buffer_2 + BLOCKSIZE, (BUFFERSIZE - BLOCKSIZE) * 2);
    block = glob->buffer_2 + BUFFERSIZE - BLOCKSIZE;

    add_wav(d, a, g, e, f, buffer_a, etable1 + b*BLOCKSIZE,
            etable2 + c*BLOCKSIZE, block);

    final(gsp, block, output_buffer, glob->buffer, BLOCKSIZE);
}

static void dec1(Real144_internal *glob, const int *data, const int *inp,
                 int n, int f)
{
    short *ptr,*end;

    *(glob->decptr++) = rms(data, f);
    glob->decptr++;
    end = (ptr = glob->decsp) + (n * 10);

    while (ptr < end)
        *(ptr++) = *(inp++);
}

static int eq(const short *in, int *target)
{
    int retval;
    int a;
    int b;
    int c;
    unsigned int u;
    const short *sptr;
    int *ptr1, *ptr2, *ptr3;
    int *bp1, *bp2;
    int buffer1[10];
    int buffer2[10];

    retval = 0;
    bp1 = buffer1;
    bp2 = buffer2;
    ptr2 = (ptr3 = buffer2) + 9;
    sptr = in;

    while (ptr2 >= ptr3)
        *(ptr3++) = *(sptr++);

    target += 9;
    a = bp2[9];
    *target = a;

    if (a + 0x1000 > 0x1fff)
        return 0; /* We're screwed, might as well go out with a bang. :P */

    c = 8;
    u = a;

    while (c >= 0) {
        if (u == 0x1000)
            u++;

        if (u == 0xfffff000)
            u--;

        b = 0x1000-((u * u) >> 12);

        if (b == 0)
            b++;

        ptr2 = bp1;
        ptr1 = (ptr3 = bp2) + c;

        for (u=0; u<=c; u++)
            *(ptr2++) = ((*(ptr3++) - (((*target) * (*(ptr1--))) >> 12)) * (0x1000000 / b)) >> 12;

        *(--target) = u = bp1[(c--)];

        if ((u + 0x1000) > 0x1fff)
            retval = 1;

        FFSWAP(int *, bp1, bp2);
    }
    return retval;
}

static void dec2(Real144_internal *glob, const int *data, const int *inp,
                 int n, int f, const int *inp2, int l)
{
    unsigned const int *ptr1,*ptr2;
    int work[10];
    int a,b;
    int x;
    int result;

    if(l + 1 < NBLOCKS / 2)
        a = NBLOCKS - (l + 1);
    else
        a = l + 1;

    b = NBLOCKS - a;

    if (l == 0) {
        glob->decsp = glob->sptr = glob->gbuf2;
        glob->decptr = glob->gbuf1;
    }
    ptr1 = inp;
    ptr2 = inp2;

    for (x=0; x<10*n; x++)
        *(glob->sptr++) = (a * (*ptr1++) + b * (*ptr2++)) >> 2;

    result = eq(glob->decsp, work);

    if (result == 1) {
        dec1(glob, data, inp, n, f);
    } else {
        *(glob->decptr++) = rms(work, f);
        glob->decptr++;
    }
    glob->decsp += n * 10;
}

/* Uncompress one block (20 bytes -> 160*2 bytes) */
static int ra144_decode_frame(AVCodecContext * avctx,
            void *vdata, int *data_size,
            const uint8_t * buf, int buf_size)
{
    static const uint8_t sizes[10] = {6, 5, 5, 4, 4, 3, 3, 3, 3, 2};
    unsigned int a, b, c;
    int i;
    signed short *shptr;
    int16_t *data = vdata;
    unsigned int val;

    Real144_internal *glob = avctx->priv_data;
    GetBitContext gb;

    if(buf_size == 0)
        return 0;

    init_get_bits(&gb, buf, 20 * 8);

    for (i=0; i<10; i++)
        // "<< 1"? Doesn't this make one value out of two of the table useless?
        glob->swapbuf1[i] = decodetable[i][get_bits(&gb, sizes[i]) << 1];

    do_voice(glob->swapbuf1, glob->swapbuf2);

    val = decodeval[get_bits(&gb, 5) << 1]; // Useless table entries?
    a = t_sqrt(val*glob->oldval) >> 12;

    for (c=0; c < NBLOCKS; c++) {
        if (c == (NBLOCKS - 1)) {
            dec1(glob, glob->swapbuf1, glob->swapbuf2, 3, val);
        } else {
            if (c * 2 == (NBLOCKS - 2)) {
                if (glob->oldval < val) {
                    dec2(glob, glob->swapbuf1, glob->swapbuf2, 3, a, glob->swapbuf2alt, c);
                } else {
                    dec2(glob, glob->swapbuf1alt, glob->swapbuf2alt, 3, a, glob->swapbuf2, c);
                }
            } else {
                if (c * 2 < (NBLOCKS - 2)) {
                    dec2(glob, glob->swapbuf1alt, glob->swapbuf2alt, 3, glob->oldval, glob->swapbuf2, c);
                } else {
                    dec2(glob, glob->swapbuf1, glob->swapbuf2, 3, val, glob->swapbuf2alt, c);
                }
            }
        }
    }

    /* do output */
    for (b=0, c=0; c<4; c++) {
        unsigned int gval = glob->gbuf1[c * 2];
        unsigned short *gsp = glob->gbuf2 + b;
        signed short output_buffer[40];

        do_output_subblock(glob, gsp, gval, output_buffer, &gb);

        shptr = output_buffer;
        while (shptr < output_buffer + BLOCKSIZE)
            *data++ = av_clip_int16(*(shptr++) << 2);
        b += 30;
    }

    glob->oldval = val;

    FFSWAP(unsigned int *, glob->swapbuf1alt, glob->swapbuf1);
    FFSWAP(unsigned int *, glob->swapbuf2alt, glob->swapbuf2);

    *data_size = 2*160;
    return 20;
}


AVCodec ra_144_decoder =
{
    "real_144",
    CODEC_TYPE_AUDIO,
    CODEC_ID_RA_144,
    sizeof(Real144_internal),
    ra144_decode_init,
    NULL,
    NULL,
    ra144_decode_frame,
    .long_name = "RealAudio 1.0 (14.4K)",
};