# HG changeset patch
# User tmmm
# Date 1065072007 0
# Node ID b78a9ba6a568622762e53f1b2eaebaf8c31e6d7d
# Parent 07029b2cd44fc907136f560d1d0a52326b08d787
first pass at a VQA video decoder

diff -r 07029b2cd44f -r b78a9ba6a568 Makefile
--- a/Makefile	Thu Oct 02 04:19:56 2003 +0000
+++ b/Makefile	Thu Oct 02 05:20:07 2003 +0000
@@ -18,7 +18,7 @@
       fft.o mdct.o mace.o huffyuv.o cyuv.o opts.o raw.o h264.o golomb.o \
       vp3.o asv1.o 4xm.o cabac.o ffv1.o ra144.o ra288.o vcr1.o cljr.o \
       roqvideo.o dpcm.o interplayvideo.o xan.o rpza.o cinepak.o msrle.o \
-      msvideo1.o
+      msvideo1.o vqavideo.o
 
 ifeq ($(AMR_NB),yes)
 ifeq ($(AMR_NB_FIXED),yes)
diff -r 07029b2cd44f -r b78a9ba6a568 allcodecs.c
--- a/allcodecs.c	Thu Oct 02 04:19:56 2003 +0000
+++ b/allcodecs.c	Thu Oct 02 05:20:07 2003 +0000
@@ -127,6 +127,7 @@
     register_avcodec(&cinepak_decoder);
     register_avcodec(&msrle_decoder);
     register_avcodec(&msvideo1_decoder);
+    register_avcodec(&vqa_decoder);
 #ifdef CONFIG_AC3
     register_avcodec(&ac3_decoder);
 #endif
diff -r 07029b2cd44f -r b78a9ba6a568 avcodec.h
--- a/avcodec.h	Thu Oct 02 04:19:56 2003 +0000
+++ b/avcodec.h	Thu Oct 02 05:20:07 2003 +0000
@@ -1432,6 +1432,7 @@
 extern AVCodec cinepak_decoder;
 extern AVCodec msrle_decoder;
 extern AVCodec msvideo1_decoder;
+extern AVCodec vqa_decoder;
 extern AVCodec ra_144_decoder;
 extern AVCodec ra_288_decoder;
 extern AVCodec roq_dpcm_decoder;
diff -r 07029b2cd44f -r b78a9ba6a568 vqavideo.c
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/vqavideo.c	Thu Oct 02 05:20:07 2003 +0000
@@ -0,0 +1,745 @@
+/*
+ * Westwood Studios VQA Video Decoder
+ * Copyright (C) 2003 the ffmpeg project
+ *
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2 of the License, or (at your option) any later version.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with this library; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ *
+ */
+
+/**
+ * @file vqavideo.c
+ * VQA Video Decoder by Mike Melanson (melanson@pcisys.net)
+ * For more information about the VQA format, visit:
+ *   http://www.pcisys.net/~melanson/codecs/
+ *
+ * The VQA video decoder outputs PAL8 colorspace data.
+ *
+ * This decoder needs the 42-byte VQHD header from the beginning
+ * of the VQA file passed through the extradata field. The VQHD header
+ * is laid out as:
+ *
+ *   bytes 0-3   chunk fourcc: 'VQHD'
+ *   bytes 4-7   chunk size in big-endian format, should be 0x0000002A
+ *   bytes 8-49  VQHD chunk data
+ *
+ * Bytes 8-49 are what this decoder expects to see.
+ *
+ * Briefly, VQA is a vector quantized animation format that operates in a
+ * 6-bit VGA palettized colorspace. It operates on pixel vectors (blocks)
+ * of either 4x2 or 4x4 in size. Compressed VQA chunks can contain vector
+ * codebooks, palette information, and code maps for rendering vectors onto
+ * frames. Any of these components can also be compressed with a run-length
+ * encoding (RLE) algorithm commonly referred to as "format80".
+ *
+ * VQA takes a novel approach to rate control. Each group of n frames
+ * (usually, n = 8) relies on a different vector codebook. Rather than
+ * transporting an entire codebook every 8th frame, the new codebook is
+ * broken up into 8 pieces and sent along with the compressed video chunks
+ * for each of the 8 frames preceding the 8 frames which require the
+ * codebook. A full codebook is also sent on the very first frame of a
+ * file. This is an interesting technique, although it makes random file
+ * seeking difficult despite the fact that the frames are all intracoded.
+ *
+ * V1,2 VQA uses 12-bit codebook indices. If the 12-bit indices were
+ * packed into bytes and then RLE compressed, bytewise, the results would
+ * be poor. That is why the coding method divides each index into 2 parts,
+ * the top 4 bits and the bottom 8 bits, then RL encodes the 4-bit pieces
+ * together and the 8-bit pieces together. If most of the vectors are
+ * clustered into one group of 256 vectors, most of the 4-bit index pieces
+ * should be the same.
+ */
+
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <unistd.h>
+
+#include "common.h"
+#include "avcodec.h"
+#include "dsputil.h"
+
+#define PALETTE_COUNT 256
+#define VQA_HEADER_SIZE 0x2A
+#define CHUNK_PREAMBLE_SIZE 8
+
+/* v1, v2 files: each vector codebook entry is 4x2=8 pixels = 8 bytes */
+#define V1_2_VECTOR_SIZE 8
+#define V1_2_MAX_VECTORS 0xF00
+/* v3 files: each vector codebook entry is 4x4=16 pixels = 16 bytes */
+#define V3_VECTOR_SIZE 16
+#define V3_MAX_VECTORS 0xFF00
+
+/* byte-order readers; BE_32 widens each byte to unsigned before shifting so
+ * that a leading byte >= 0x80 is never shifted into the sign bit of an int */
+#define LE_16(x)  ((((uint8_t*)(x))[1] << 8) | ((uint8_t*)(x))[0])
+#define BE_16(x)  ((((uint8_t*)(x))[0] << 8) | ((uint8_t*)(x))[1])
+#define BE_32(x)  (((unsigned int)((uint8_t*)(x))[0] << 24) | \
+                   ((unsigned int)((uint8_t*)(x))[1] << 16) | \
+                   ((unsigned int)((uint8_t*)(x))[2] << 8) | \
+                    (unsigned int)((uint8_t*)(x))[3])
+
+#define FOURCC_TAG( ch0, ch1, ch2, ch3 ) \
+        ( (long)(unsigned char)(ch3) | \
+        ( (long)(unsigned char)(ch2) << 8 ) | \
+        ( (long)(unsigned char)(ch1) << 16 ) | \
+        ( (long)(unsigned char)(ch0) << 24 ) )
+
+#define CBF0_TAG FOURCC_TAG('C', 'B', 'F', '0')
+#define CBFZ_TAG FOURCC_TAG('C', 'B', 'F', 'Z')
+#define CBP0_TAG FOURCC_TAG('C', 'B', 'P', '0')
+#define CBPZ_TAG FOURCC_TAG('C', 'B', 'P', 'Z')
+#define CPL0_TAG FOURCC_TAG('C', 'P', 'L', '0')
+#define CPLZ_TAG FOURCC_TAG('C', 'P', 'L', 'Z')
+#define VPTZ_TAG FOURCC_TAG('V', 'P', 'T', 'Z')
+
+#define VQA_DEBUG 0
+
+#if VQA_DEBUG
+#define vqa_debug printf
+#else
+static inline void vqa_debug(const char *format, ...) { }
+#endif
+
+typedef struct VqaContext {
+
+    AVCodecContext *avctx;
+    DSPContext dsp;
+    AVFrame frame;
+
+    unsigned char *buf;
+    int size;
+
+    unsigned char palette[PALETTE_COUNT * 4];
+
+    int width;   /* width of a frame */
+    int height;   /* height of a frame */
+    int vector_width;  /* width of individual vector */
+    int vector_height;  /* height of individual vector */
+    int vqa_version;  /* this should be either 1, 2 or 3 */
+
+    unsigned char *codebook;         /* the current codebook */
+    unsigned char *next_codebook_buffer;  /* accumulator for next codebook */
+    int codebook_size;  /* bytes allocated for each of the two codebooks */
+    int next_codebook_buffer_index;
+
+    unsigned char *decode_buffer;
+    int decode_buffer_size;
+
+    /* number of frames to go before replacing codebook */
+    int partial_countdown;
+    int partial_count;
+
+} VqaContext;
+
+/**
+ * Read the VQHD header from the extradata and allocate the codebook and
+ * code map buffers.
+ *
+ * @param avctx codec context; its extradata must be the 42 VQHD data bytes
+ * @return 0 on success, -1 if the header is missing or describes something
+ *         this decoder cannot handle, or if a buffer cannot be allocated
+ */
+static int vqa_decode_init(AVCodecContext *avctx)
+{
+    VqaContext *s = (VqaContext *)avctx->priv_data;
+    unsigned char *vqa_header;
+
+    s->avctx = avctx;
+    avctx->pix_fmt = PIX_FMT_PAL8;
+    avctx->has_b_frames = 0;
+    dsputil_init(&s->dsp, avctx);
+
+    /* make sure the extradata made it */
+    if (s->avctx->extradata_size != VQA_HEADER_SIZE) {
+        printf(" VQA video: expected extradata size of %d\n", VQA_HEADER_SIZE);
+        return -1;
+    }
+
+    /* load up the VQA parameters from the header */
+    vqa_header = (unsigned char *)s->avctx->extradata;
+    s->vqa_version = vqa_header[0];
+    s->width = LE_16(&vqa_header[6]);
+    s->height = LE_16(&vqa_header[8]);
+    s->vector_width = vqa_header[10];
+    s->vector_height = vqa_header[11];
+    s->partial_count = s->partial_countdown = vqa_header[13];
+
+    /* the renderer below only handles versions 1-3 */
+    if ((s->vqa_version < 1) || (s->vqa_version > 3)) {
+        printf (" VQA video: unsupported VQA version %d\n", s->vqa_version);
+        return -1;
+    }
+
+    /* the vector dimensions have to meet very stringent requirements */
+    if ((s->vector_width != 4) ||
+        ((s->vector_height != 2) && (s->vector_height != 4))) {
+        /* return without further initialization */
+        return -1;
+    }
+
+    /* the code map has one entry per whole vector, so the frame has to be
+     * a non-empty, whole number of vectors in each direction */
+    if ((s->width == 0) || (s->height == 0) ||
+        (s->width % s->vector_width) || (s->height % s->vector_height)) {
+        printf (" VQA video: unsupported frame size %dx%d\n",
+            s->width, s->height);
+        return -1;
+    }
+
+    /* allocate codebooks; zeroed so that a stream which never delivers a
+     * full codebook still renders from defined data */
+    if (s->vqa_version == 3)
+        s->codebook_size = V3_VECTOR_SIZE * V3_MAX_VECTORS;
+    else
+        s->codebook_size = V1_2_VECTOR_SIZE * V1_2_MAX_VECTORS;
+    s->codebook = av_mallocz(s->codebook_size);
+    s->next_codebook_buffer = av_mallocz(s->codebook_size);
+    s->next_codebook_buffer_index = 0;
+
+    /* allocate decode buffer */
+    s->decode_buffer_size = (s->width / s->vector_width) *
+        (s->height / s->vector_height) * 2;
+    s->decode_buffer = av_mallocz(s->decode_buffer_size);
+
+    if (!s->codebook || !s->next_codebook_buffer || !s->decode_buffer) {
+        printf (" VQA video: could not allocate decoder buffers\n");
+        av_free(s->codebook);
+        av_free(s->next_codebook_buffer);
+        av_free(s->decode_buffer);
+        s->codebook = s->next_codebook_buffer = s->decode_buffer = NULL;
+        return -1;
+    }
+
+    s->frame.data[0] = NULL;
+
+    return 0;
+}
+
+/* leave decode_format80() if the next op would write past the end of dest */
+#define CHECK_COUNT() \
+    do { \
+        if (dest_index + count > dest_size) { \
+            printf ("vqavideo: decode_format80 problem: next op would overflow dest_index\n"); \
+            printf ("vqavideo: current dest_index = %d, count = %d, dest_size = %d\n", \
+                dest_index, count, dest_size); \
+            return; \
+        } \
+    } while (0)
+
+/* leave decode_format80() if the current opcode and its operands, n bytes
+ * in all, do not lie entirely inside the source buffer */
+#define CHECK_SOURCE(n) \
+    do { \
+        if (src_index + (n) > src_size) { \
+            printf ("vqavideo: decode_format80 problem: opcode at %d needs %d bytes, source has %d\n", \
+                src_index, (n), src_size); \
+            return; \
+        } \
+    } while (0)
+
+/* leave decode_format80() if an absolute copy would read past the end of
+ * dest */
+#define CHECK_ABSOLUTE_COPY() \
+    do { \
+        if (src_pos + count > dest_size) { \
+            printf ("vqavideo: decode_format80 problem: copy of %d bytes from pos %d would overread dest (%d bytes)\n", \
+                count, src_pos, dest_size); \
+            return; \
+        } \
+    } while (0)
+
+/**
+ * Decompress a "format80" RLE stream.
+ *
+ * Decoding stops at the 0x80 end marker, at the end of the source, or at
+ * the first opcode that would read or write outside either buffer. In the
+ * last case a diagnostic is printed and dest keeps what was decoded so far.
+ *
+ * @param src       compressed data
+ * @param src_size  number of bytes available at src
+ * @param dest      output buffer; also the source of back-reference copies
+ * @param dest_size capacity of dest in bytes
+ */
+static void decode_format80(unsigned char *src, int src_size,
+    unsigned char *dest, int dest_size) {
+
+    int src_index = 0;
+    int dest_index = 0;
+    int count;
+    int src_pos;
+    unsigned char color;
+    int i;
+
+    while (src_index < src_size) {
+
+        vqa_debug(" opcode %02X: ", src[src_index]);
+
+        /* 0x80 means that frame is finished */
+        if (src[src_index] == 0x80)
+            return;
+
+        if (dest_index >= dest_size) {
+            printf ("vqavideo: decode_format80 problem: dest_index (%d) exceeded dest_size (%d)\n",
+                dest_index, dest_size);
+            return;
+        }
+
+        if (src[src_index] == 0xFF) {
+
+            /* opcode, 16-bit count, 16-bit absolute position */
+            CHECK_SOURCE(5);
+            src_index++;
+            count = LE_16(&src[src_index]);
+            src_index += 2;
+            src_pos = LE_16(&src[src_index]);
+            src_index += 2;
+            vqa_debug("(1) copy %X bytes from absolute pos %X\n", count, src_pos);
+            CHECK_COUNT();
+            CHECK_ABSOLUTE_COPY();
+            for (i = 0; i < count; i++)
+                dest[dest_index + i] = dest[src_pos + i];
+            dest_index += count;
+
+        } else if (src[src_index] == 0xFE) {
+
+            /* opcode, 16-bit count, fill value */
+            CHECK_SOURCE(4);
+            src_index++;
+            count = LE_16(&src[src_index]);
+            src_index += 2;
+            color = src[src_index++];
+            vqa_debug("(2) set %X bytes to %02X\n", count, color);
+            CHECK_COUNT();
+            memset(&dest[dest_index], color, count);
+            dest_index += count;
+
+        } else if ((src[src_index] & 0xC0) == 0xC0) {
+
+            /* opcode holding a 6-bit count, 16-bit absolute position */
+            CHECK_SOURCE(3);
+            count = (src[src_index++] & 0x3F) + 3;
+            src_pos = LE_16(&src[src_index]);
+            src_index += 2;
+            vqa_debug("(3) copy %X bytes from absolute pos %X\n", count, src_pos);
+            CHECK_COUNT();
+            CHECK_ABSOLUTE_COPY();
+            for (i = 0; i < count; i++)
+                dest[dest_index + i] = dest[src_pos + i];
+            dest_index += count;
+
+        } else if (src[src_index] > 0x80) {
+
+            /* opcode holding a 6-bit count, then that many literal bytes */
+            count = src[src_index] & 0x3F;
+            CHECK_SOURCE(1 + count);
+            src_index++;
+            vqa_debug("(4) copy %X bytes from source to dest\n", count);
+            CHECK_COUNT();
+            memcpy(&dest[dest_index], &src[src_index], count);
+            src_index += count;
+            dest_index += count;
+
+        } else {
+
+            /* two bytes: 3-bit count, 12-bit distance back from dest_index */
+            CHECK_SOURCE(2);
+            count = ((src[src_index] & 0x70) >> 4) + 3;
+            src_pos = BE_16(&src[src_index]) & 0x0FFF;
+            src_index += 2;
+            vqa_debug("(5) copy %X bytes from relpos %X\n", count, src_pos);
+            CHECK_COUNT();
+            if (src_pos > dest_index) {
+                printf ("vqavideo: decode_format80 problem: relative copy reaches %d bytes back with only %d decoded\n",
+                    src_pos, dest_index);
+                return;
+            }
+            for (i = 0; i < count; i++)
+                dest[dest_index + i] = dest[dest_index - src_pos + i];
+            dest_index += count;
+        }
+    }
+
+    if (dest_index < dest_size)
+        printf ("vqavideo: decode_format80 problem: decode finished with dest_index (%d) < dest_size (%d)\n",
+            dest_index, dest_size);
+}
+
+/**
+ * Decode the chunks of one frame from s->buf and render into s->frame.
+ *
+ * In order: locate the sub-chunks, load a raw palette (CPL0), load a raw
+ * full codebook (CBF0), decompress the code map (VPTZ), render the frame,
+ * then accumulate a raw partial codebook (CBP0). The compressed variants
+ * CPLZ, CBFZ and CBPZ are located but not decoded yet. When a chunk is
+ * unusable a diagnostic is printed and the rest of the work is skipped.
+ *
+ * @param s decoder context with buf/size set to the current packet
+ */
+static void vqa_decode_chunk(VqaContext *s)
+{
+    unsigned int chunk_type;
+    unsigned int chunk_size;
+    unsigned int bytes_left;
+    int byte_skip;
+    unsigned int index = 0;
+    int i;
+    unsigned char r, g, b;
+    unsigned int *palette32;
+
+    int cbf0_chunk = -1;
+    int cbfz_chunk = -1;
+    int cbp0_chunk = -1;
+    int cbpz_chunk = -1;
+    int cpl0_chunk = -1;
+    int cplz_chunk = -1;
+    int vptz_chunk = -1;
+
+    int x, y;
+    int lines = 0;
+    int pixel_ptr;
+    int vector_index = 0;
+    int lobyte = 0;
+    int hibyte = 0;
+    int lobytes = 0;
+    int hibytes = s->decode_buffer_size / 2;
+
+    /* first, traverse through the frame and find the subchunks */
+    while ((int)index < s->size) {
+
+        /* a chunk preamble is a fourcc followed by a big-endian size */
+        bytes_left = s->size - index;
+        if (bytes_left < CHUNK_PREAMBLE_SIZE) {
+            printf (" VQA video: problem: %u stray bytes at end of frame\n",
+                bytes_left);
+            break;
+        }
+
+        chunk_type = BE_32(&s->buf[index]);
+        chunk_size = BE_32(&s->buf[index + 4]);
+
+        /* everything below trusts chunk_size, so the payload has to fit
+         * inside the frame; ignore this chunk and whatever follows it */
+        if (chunk_size > bytes_left - CHUNK_PREAMBLE_SIZE) {
+            printf (" VQA video: problem: chunk size 0x%X runs past end of frame\n",
+                chunk_size);
+            break;
+        }
+
+        switch (chunk_type) {
+
+        case CBF0_TAG:
+            cbf0_chunk = index;
+            break;
+
+        case CBFZ_TAG:
+            cbfz_chunk = index;
+            break;
+
+        case CBP0_TAG:
+            cbp0_chunk = index;
+            break;
+
+        case CBPZ_TAG:
+            cbpz_chunk = index;
+            break;
+
+        case CPL0_TAG:
+            cpl0_chunk = index;
+            break;
+
+        case CPLZ_TAG:
+            cplz_chunk = index;
+            break;
+
+        case VPTZ_TAG:
+            vptz_chunk = index;
+            break;
+
+        default:
+            printf (" VQA video: Found unknown chunk type: %c%c%c%c (%08X)\n",
+                (chunk_type >> 24) & 0xFF,
+                (chunk_type >> 16) & 0xFF,
+                (chunk_type >>  8) & 0xFF,
+                (chunk_type >>  0) & 0xFF,
+                chunk_type);
+            break;
+        }
+
+        byte_skip = chunk_size & 0x01;
+        index += (CHUNK_PREAMBLE_SIZE + chunk_size + byte_skip);
+    }
+
+    /* next, deal with the palette */
+    if ((cpl0_chunk != -1) && (cplz_chunk != -1)) {
+
+        /* a chunk should not have both chunk types */
+        printf (" VQA video: problem: found both CPL0 and CPLZ chunks\n");
+        return;
+    }
+
+    /* decompress the palette chunk */
+    if (cplz_chunk != -1) {
+
+/* yet to be handled */
+
+    }
+
+    /* convert the RGB palette into the machine's endian format */
+    if (cpl0_chunk != -1) {
+
+        chunk_size = BE_32(&s->buf[cpl0_chunk + 4]);
+        /* sanity check the palette size */
+        if (chunk_size / 3 > PALETTE_COUNT) {
+            printf ("vqavideo: problem: found a palette chunk with %d colors\n",
+                chunk_size / 3);
+            return;
+        }
+        cpl0_chunk += CHUNK_PREAMBLE_SIZE;
+        palette32 = (unsigned int *)s->palette;
+        for (i = 0; i < chunk_size / 3; i++) {
+            /* scale by 4 to transform 6-bit palette -> 8-bit */
+            r = s->buf[cpl0_chunk++] * 4;
+            g = s->buf[cpl0_chunk++] * 4;
+            b = s->buf[cpl0_chunk++] * 4;
+            palette32[i] = (r << 16) | (g << 8) | (b);
+        }
+    }
+
+    /* next, look for a full codebook */
+    if ((cbf0_chunk != -1) && (cbfz_chunk != -1)) {
+
+        /* a chunk should not have both chunk types */
+        printf (" VQA video: problem: found both CBF0 and CBFZ chunks\n");
+        return;
+    }
+
+    /* decompress the full codebook chunk into the codebook accumulation
+     * buffer; this is safe since only the first frame is supposed to have
+     * a full codebook */
+    if (cbfz_chunk != -1) {
+
+/* yet to be handled */
+
+    }
+
+    /* copy a full codebook */
+    if (cbf0_chunk != -1) {
+
+        chunk_size = BE_32(&s->buf[cbf0_chunk + 4]);
+        /* sanity check the full codebook size against the allocation */
+        if (chunk_size > (unsigned int)s->codebook_size) {
+            printf (" VQA video: problem: CBF0 chunk too large (0x%X bytes)\n",
+                chunk_size);
+            return;
+        }
+        cbf0_chunk += CHUNK_PREAMBLE_SIZE;
+
+        memcpy(s->codebook, &s->buf[cbf0_chunk], chunk_size);
+    }
+
+    /* decode the frame */
+    if (vptz_chunk == -1) {
+
+        /* something is wrong if there is no VPTZ chunk */
+        printf (" VQA video: problem: no VPTZ chunk found\n");
+        return;
+    }
+
+    /* decode frame */
+    chunk_size = BE_32(&s->buf[vptz_chunk + 4]);
+    vptz_chunk += CHUNK_PREAMBLE_SIZE;
+    decode_format80(&s->buf[vptz_chunk], chunk_size,
+        s->decode_buffer, s->decode_buffer_size);
+
+    /* render the final PAL8 frame */
+    for (y = 0; y < s->frame.linesize[0] * s->height;
+        y += s->frame.linesize[0] * s->vector_height) {
+
+        for (x = y; x < y + s->width; x += 4, lobytes++, hibytes++) {
+            pixel_ptr = x;
+
+            /* get the vector index, the method for which varies according to
+             * VQA file version */
+            switch (s->vqa_version) {
+
+            case 1:
+/* still need sample media for this case (only one game, "Legend of
+ * Kyrandia III : Malcolm's Revenge", is known to use this version) */
+                lines = 0;
+                break;
+
+            case 2:
+                lobyte = s->decode_buffer[lobytes];
+                hibyte = s->decode_buffer[hibytes];
+                if (hibyte > 0x0F) {
+                    printf (" VQA video: problem: vector #%d/%d high byte out of range (0x%X > 0x0F)\n",
+                        lobytes, s->decode_buffer_size / 2, hibyte);
+                    hibyte = lobyte = 0;
+                } else if (hibyte == 0x0F)
+                    hibyte = 0;
+                vector_index = (hibyte << 8) | lobyte;
+                vector_index *= V1_2_VECTOR_SIZE;
+                lines = 2;
+                break;
+
+            case 3:
+/* not implemented yet */
+                lines = 0;
+                break;
+
+            default:
+                /* init rejects other versions; without this case the loop
+                 * below would count down from the stale value -1 */
+                lines = 0;
+                break;
+            }
+
+            while (lines--) {
+                s->frame.data[0][pixel_ptr + 0] = s->codebook[vector_index++];
+                s->frame.data[0][pixel_ptr + 1] = s->codebook[vector_index++];
+                s->frame.data[0][pixel_ptr + 2] = s->codebook[vector_index++];
+                s->frame.data[0][pixel_ptr + 3] = s->codebook[vector_index++];
+                pixel_ptr += s->frame.linesize[0];
+            }
+        }
+    }
+
+    /* handle partial codebook */
+    if ((cbp0_chunk != -1) && (cbpz_chunk != -1)) {
+        /* a chunk should not have both chunk types */
+        printf (" VQA video: problem: found both CBP0 and CBPZ chunks\n");
+        return;
+    }
+
+    if (cbp0_chunk != -1) {
+
+        chunk_size = BE_32(&s->buf[cbp0_chunk + 4]);
+        cbp0_chunk += CHUNK_PREAMBLE_SIZE;
+
+        /* the pieces may never add up to more than one whole codebook */
+        if (chunk_size >
+            (unsigned int)(s->codebook_size - s->next_codebook_buffer_index)) {
+            printf (" VQA video: problem: CBP0 chunk too large (0x%X bytes)\n",
+                chunk_size);
+            /* throw the damaged codebook away and start over */
+            s->next_codebook_buffer_index = 0;
+            s->partial_countdown = s->partial_count;
+            return;
+        }
+
+        /* accumulate partial codebook */
+        memcpy(&s->next_codebook_buffer[s->next_codebook_buffer_index],
+            &s->buf[cbp0_chunk], chunk_size);
+        s->next_codebook_buffer_index += chunk_size;
+
+        s->partial_countdown--;
+        if (s->partial_countdown <= 0) {
+
+            /* time to replace codebook */
+            memcpy(s->codebook, s->next_codebook_buffer,
+                s->next_codebook_buffer_index);
+
+            /* reset accounting */
+            s->next_codebook_buffer_index = 0;
+            s->partial_countdown = s->partial_count;
+        }
+    }
+
+    if (cbpz_chunk != -1) {
+
+/* more partial codebook handling ... */
+
+    }
+}
+
+/**
+ * Decode one packet into a PAL8 frame.
+ *
+ * @param avctx     codec context
+ * @param data      receives the decoded AVFrame
+ * @param data_size receives sizeof(AVFrame)
+ * @param buf       packet data
+ * @param buf_size  packet size in bytes
+ * @return buf_size, or -1 if the picture does not fit or get_buffer() fails
+ */
+static int vqa_decode_frame(AVCodecContext *avctx,
+                            void *data, int *data_size,
+                            uint8_t *buf, int buf_size)
+{
+    VqaContext *s = (VqaContext *)avctx->priv_data;
+
+    s->buf = buf;
+    s->size = buf_size;
+
+    /* the renderer writes s->width x s->height pixels; refuse to run if
+     * the codec context describes a smaller picture, since that is what
+     * the frame buffer is presumably sized from (NOTE(review): confirm) */
+    if ((s->width > avctx->width) || (s->height > avctx->height)) {
+        printf (" VQA Video: header size %dx%d exceeds codec size %dx%d\n",
+            s->width, s->height, avctx->width, avctx->height);
+        return -1;
+    }
+
+    if (s->frame.data[0])
+        avctx->release_buffer(avctx, &s->frame);
+
+    if (avctx->get_buffer(avctx, &s->frame)) {
+        printf (" VQA Video: get_buffer() failed\n");
+        return -1;
+    }
+
+    vqa_decode_chunk(s);
+
+    /* make the palette available on the way out */
+    memcpy(s->frame.data[1], s->palette, PALETTE_COUNT * 4);
+
+    *data_size = sizeof(AVFrame);
+    *(AVFrame*)data = s->frame;
+
+    /* report that the buffer was completely consumed */
+    return buf_size;
+}
+
+/**
+ * Release the decoder's buffers and any frame it still holds.
+ *
+ * @param avctx codec context
+ * @return always 0
+ */
+static int vqa_decode_end(AVCodecContext *avctx)
+{
+    VqaContext *s = (VqaContext *)avctx->priv_data;
+
+    av_free(s->codebook);
+    av_free(s->next_codebook_buffer);
+    av_free(s->decode_buffer);
+
+    if (s->frame.data[0])
+        avctx->release_buffer(avctx, &s->frame);
+
+    return 0;
+}
+
+AVCodec vqa_decoder = {
+    "vqavideo",
+    CODEC_TYPE_VIDEO,
+    CODEC_ID_WS_VQA,
+    sizeof(VqaContext),
+    vqa_decode_init,
+    NULL,
+    vqa_decode_end,
+    vqa_decode_frame,
+    CODEC_CAP_DR1,
+};