Mercurial > libavcodec.hg
changeset 675:9008cbe229ce libavcodec
alignment info
author | michaelni |
---|---|
date | Sat, 14 Sep 2002 19:00:09 +0000 |
parents | 4490bfbb932d |
children | c3bdb00a98a9 |
files | dsputil.h |
diffstat | 1 files changed, 23 insertions(+), 13 deletions(-) [+] |
line wrap: on
line diff
--- a/dsputil.h Sat Sep 14 17:18:26 2002 +0000
+++ b/dsputil.h Sat Sep 14 19:00:09 2002 +0000
@@ -50,17 +50,26 @@
 void dsputil_init(void);
-/* pixel ops : interface with DCT */
+/* minimum alignment rules ;)
+if u notice errors in the align stuff, need more alignment for some asm code for some cpu
+or need to use a function with less aligned data then send a mail to the ffmpeg-dev list, ...
+
+!warning these alignments might not match reallity, (missing attribute((align)) stuff somewhere possible)
+i (michael) didnt check them, these are just the alignents which i think could be reached easily ...
+
+!future video codecs might need functions with less strict alignment
+*/
-extern void (*ff_idct)(DCTELEM *block);
-extern void (*ff_idct_put)(UINT8 *dest, int line_size, DCTELEM *block);
-extern void (*ff_idct_add)(UINT8 *dest, int line_size, DCTELEM *block);
-extern void (*get_pixels)(DCTELEM *block, const UINT8 *pixels, int line_size);
-extern void (*diff_pixels)(DCTELEM *block, const UINT8 *s1, const UINT8 *s2, int stride);
-extern void (*put_pixels_clamped)(const DCTELEM *block, UINT8 *pixels, int line_size);
-extern void (*add_pixels_clamped)(const DCTELEM *block, UINT8 *pixels, int line_size);
-extern void (*gmc1)(UINT8 *dst, UINT8 *src, int srcStride, int h, int x16, int y16, int rounder);
-extern void (*clear_blocks)(DCTELEM *blocks);
+/* pixel ops : interface with DCT */
+extern void (*ff_idct)(DCTELEM *block/*align 16*/);
+extern void (*ff_idct_put)(UINT8 *dest/*align 8*/, int line_size, DCTELEM *block/*align 16*/);
+extern void (*ff_idct_add)(UINT8 *dest/*align 8*/, int line_size, DCTELEM *block/*align 16*/);
+extern void (*get_pixels)(DCTELEM *block/*align 16*/, const UINT8 *pixels/*align 8*/, int line_size);
+extern void (*diff_pixels)(DCTELEM *block/*align 16*/, const UINT8 *s1/*align 8*/, const UINT8 *s2/*align 8*/, int stride);
+extern void (*put_pixels_clamped)(const DCTELEM *block/*align 16*/, UINT8 *pixels/*align 8*/, int line_size);
+extern void (*add_pixels_clamped)(const DCTELEM *block/*align 16*/, UINT8 *pixels/*align 8*/, int line_size);
+extern void (*gmc1)(UINT8 *dst/*align 8*/, UINT8 *src/*align 1*/, int srcStride, int h, int x16, int y16, int rounder);
+extern void (*clear_blocks)(DCTELEM *blocks/*align 16*/);
 extern int (*pix_sum)(UINT8 * pix, int line_size);
 extern int (*pix_norm1)(UINT8 * pix, int line_size);
@@ -73,8 +82,9 @@
 void clear_blocks_c(DCTELEM *blocks);
 /* add and put pixel (decoding) */
-typedef void (*op_pixels_func)(UINT8 *block, const UINT8 *pixels, int line_size, int h);
-typedef void (*qpel_mc_func)(UINT8 *dst, UINT8 *src, int stride);
+// blocksizes for op_pixels_func are 8x4,8x8 16x8 16x16
+typedef void (*op_pixels_func)(UINT8 *block/*align width (8 or 16)*/, const UINT8 *pixels/*align 1*/, int line_size, int h);
+typedef void (*qpel_mc_func)(UINT8 *dst/*align width (8 or 16)*/, UINT8 *src/*align 1*/, int stride);
 extern op_pixels_func put_pixels_tab[2][4];
 extern op_pixels_func avg_pixels_tab[2][4];
@@ -93,7 +103,7 @@
 /* motion estimation */
-typedef int (*op_pixels_abs_func)(UINT8 *blk1, UINT8 *blk2, int line_size);
+typedef int (*op_pixels_abs_func)(UINT8 *blk1/*align width (8 or 16)*/, UINT8 *blk2/*align 1*/, int line_size);
 extern op_pixels_abs_func pix_abs16x16;
 extern op_pixels_abs_func pix_abs16x16_x2;