mplayer.hg: postproc/rgb2rgb.c annotate

annotate postproc/rgb2rgb.c @ 6484:c5cf988c6d6f

pre-yvu9toyv12 converter, only grayscale Y-plane coping :)

author	alex
date	Fri, 21 Jun 2002 17:37:00 +0000
parents	f0fa3373f616
children	e7635c03910f

rev	line source
2694 2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	1 /*
2538 71320898b333 Finish mmx2, 3dnow optimiz. 15to16 should be tested. Better fix of can't compile nick parents: 2535 diff changeset	2 *
71320898b333 Finish mmx2, 3dnow optimiz. 15to16 should be tested. Better fix of can't compile nick parents: 2535 diff changeset	3 * rgb2rgb.c, Software RGB to RGB convertor
2732 ae79207a3055 Move yuv2rgb to postprocess nick parents: 2725 diff changeset	4 * Software PAL8 to RGB convertor
ae79207a3055 Move yuv2rgb to postprocess nick parents: 2725 diff changeset	5 * Software YUV to YUV convertor
ae79207a3055 Move yuv2rgb to postprocess nick parents: 2725 diff changeset	6 * Software YUV to RGB convertor
2538 71320898b333 Finish mmx2, 3dnow optimiz. 15to16 should be tested. Better fix of can't compile nick parents: 2535 diff changeset	7 * Written by Nick Kurshev.
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	8 * palette & yuv & runtime cpu stuff by Michael (michaelni@gmx.at) (under GPL)
2538 71320898b333 Finish mmx2, 3dnow optimiz. 15to16 should be tested. Better fix of can't compile nick parents: 2535 diff changeset	9 */
2504 13e1c5ab417a vo_vesa: rgb2rgb support nick parents: diff changeset	10 #include <inttypes.h>
13e1c5ab417a vo_vesa: rgb2rgb support nick parents: diff changeset	11 #include "../config.h"
13e1c5ab417a vo_vesa: rgb2rgb support nick parents: diff changeset	12 #include "rgb2rgb.h"
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	13 #include "../cpudetect.h"
4923 3cc0f4938be1 add mangling atmos4 parents: 4622 diff changeset	14 #include "../mangle.h"
2538 71320898b333 Finish mmx2, 3dnow optimiz. 15to16 should be tested. Better fix of can't compile nick parents: 2535 diff changeset	15
/*
 * Build-time feature switches.
 *
 * CAN_COMPILE_X86_ASM is derived from ARCH_X86 here, before ARCH_X86 gets
 * undefined/redefined further down for the per-CPU template instantiations,
 * so it stays a stable "x86 asm variants are built" flag for the dispatchers.
 */
#ifdef ARCH_X86
#define CAN_COMPILE_X86_ASM
#endif

#define FAST_BGR2YV12 // use 7 bit coeffs instead of 15bit
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	22 #ifdef CAN_COMPILE_X86_ASM
/*
 * 64-bit, 8-byte aligned bit masks for the MMX code paths.
 * Each constant covers one quadword, i.e. two 32-bit pixels or four 16-bit
 * pixels at a time.
 */

/* per-byte masks inside each 32-bit half of the quadword */
static const uint64_t mask32b  __attribute__((aligned(8))) = 0x000000FF000000FFULL;
static const uint64_t mask32g  __attribute__((aligned(8))) = 0x0000FF000000FF00ULL;
static const uint64_t mask32r  __attribute__((aligned(8))) = 0x00FF000000FF0000ULL;
static const uint64_t mask32   __attribute__((aligned(8))) = 0x00FFFFFF00FFFFFFULL;

/* every-third-byte masks for packed 24-bit data */
static const uint64_t mask24b  __attribute__((aligned(8))) = 0x00FF0000FF0000FFULL;
static const uint64_t mask24g  __attribute__((aligned(8))) = 0xFF0000FF0000FF00ULL;
static const uint64_t mask24r  __attribute__((aligned(8))) = 0x0000FF0000FF0000ULL;

/* low / high 24-bit groups and progressively wider high-part masks */
static const uint64_t mask24l  __attribute__((aligned(8))) = 0x0000000000FFFFFFULL;
static const uint64_t mask24h  __attribute__((aligned(8))) = 0x0000FFFFFF000000ULL;
static const uint64_t mask24hh  __attribute__((aligned(8))) = 0xffff000000000000ULL;
static const uint64_t mask24hhh  __attribute__((aligned(8))) = 0xffffffff00000000ULL;
static const uint64_t mask24hhhh  __attribute__((aligned(8))) = 0xffffffffffff0000ULL;

/* masks applied to four packed 15-bit pixels */
static const uint64_t mask15b  __attribute__((aligned(8))) = 0x001F001F001F001FULL; /* 00000000 00011111  xxB */
static const uint64_t mask15rg __attribute__((aligned(8))) = 0x7FE07FE07FE07FE0ULL; /* 01111111 11100000  RGx */
static const uint64_t mask15s  __attribute__((aligned(8))) = 0xFFE0FFE0FFE0FFE0ULL;

/* 5-6-5 component masks, one 16-bit pixel per 32-bit lane */
static const uint64_t red_16mask  __attribute__((aligned(8))) = 0x0000f8000000f800ULL;
static const uint64_t green_16mask __attribute__((aligned(8)))= 0x000007e0000007e0ULL;
static const uint64_t blue_16mask __attribute__((aligned(8))) = 0x0000001f0000001fULL;

/*
 * 5-5-5 component masks, one 15-bit pixel per 32-bit lane.
 * NOTE(review): red/green previously carried the 16-bit masks (f800 / 07e0)
 * in the low lane while the high lane had the 15-bit ones, so the two pixels
 * of a quadword would be masked differently. Both lanes now use 7c00 / 03e0.
 * Confirm against the users in rgb2rgb_template.c.
 */
static const uint64_t red_15mask  __attribute__((aligned(8))) = 0x00007c0000007c00ULL;
static const uint64_t green_15mask __attribute__((aligned(8)))= 0x000003e0000003e0ULL;
static const uint64_t blue_15mask __attribute__((aligned(8))) = 0x0000001f0000001fULL;
4622 e3a9fae516e4 rgb24toyv12 in MMX (untested) michael parents: 3132 diff changeset	44
/*
 * BGR -> Y/U/V multiplier sets, packed as four signed 16-bit words per
 * quadword. With FAST_BGR2YV12 the factors are scaled to 7 bits, otherwise
 * to 15 bits. The lowest word lines up with the blue factor, then green,
 * then red (compare with the BY/GY/RY ... macros below); the top word is 0.
 */
#ifdef FAST_BGR2YV12
static const uint64_t bgr2YCoeff  __attribute__((aligned(8))) = 0x000000210041000DULL;
static const uint64_t bgr2UCoeff  __attribute__((aligned(8))) = 0x0000FFEEFFDC0038ULL;
static const uint64_t bgr2VCoeff  __attribute__((aligned(8))) = 0x00000038FFD2FFF8ULL;
#else
static const uint64_t bgr2YCoeff  __attribute__((aligned(8))) = 0x000020E540830C8BULL;
static const uint64_t bgr2UCoeff  __attribute__((aligned(8))) = 0x0000ED0FDAC23831ULL;
static const uint64_t bgr2VCoeff  __attribute__((aligned(8))) = 0x00003831D0E6F6EAULL;
#endif
/* 16 in every byte (luma offset) and 128 in every byte (chroma offset) */
static const uint64_t bgr2YOffset __attribute__((aligned(8))) = 0x1010101010101010ULL;
static const uint64_t bgr2UVOffset __attribute__((aligned(8)))= 0x8080808080808080ULL;
/* four 16-bit words, each equal to 1 */
static const uint64_t w1111       __attribute__((aligned(8))) = 0x0001000100010001ULL;

/* Dither state and tables; compiled out. */
#if 0
static volatile uint64_t __attribute__((aligned(8))) b5Dither;
static volatile uint64_t __attribute__((aligned(8))) g5Dither;
static volatile uint64_t __attribute__((aligned(8))) g6Dither;
static volatile uint64_t __attribute__((aligned(8))) r5Dither;

static uint64_t __attribute__((aligned(8))) dither4[2]={
	0x0103010301030103LL,
	0x0200020002000200LL,};

static uint64_t __attribute__((aligned(8))) dither8[2]={
	0x0602060206020602LL,
	0x0004000400040004LL,};
#endif
2535 b44113f46c96 cant compile on non x86 bugfix michael parents: 2517 diff changeset	72 #endif
2513 d3c6b9ae24b1 sfence nick parents: 2512 diff changeset	73
/*
 * Fixed-point RGB -> YUV factors.
 * Each factor is the real coefficient scaled by 2^RGB2YUV_SHIFT, with 0.5
 * added before the cast to int. The cast truncates toward zero, so the
 * negative factors end up one step closer to zero than true rounding would
 * give (e.g. BV evaluates to -17, not -18).
 * Naming is <source channel><destination component>, e.g. GY = green
 * contribution to Y (inferred from the names -- confirm at the use sites).
 */
#define RGB2YUV_SHIFT 8
#define BY ((int)( 0.098*(1<<RGB2YUV_SHIFT)+0.5))
#define BV ((int)(-0.071*(1<<RGB2YUV_SHIFT)+0.5))
#define BU ((int)( 0.439*(1<<RGB2YUV_SHIFT)+0.5))
#define GY ((int)( 0.504*(1<<RGB2YUV_SHIFT)+0.5))
#define GV ((int)(-0.368*(1<<RGB2YUV_SHIFT)+0.5))
#define GU ((int)(-0.291*(1<<RGB2YUV_SHIFT)+0.5))
#define RY ((int)( 0.257*(1<<RGB2YUV_SHIFT)+0.5))
#define RV ((int)( 0.439*(1<<RGB2YUV_SHIFT)+0.5))
#define RU ((int)(-0.148*(1<<RGB2YUV_SHIFT)+0.5))
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	84
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	85 //Note: we have C, MMX, MMX2, 3DNOW version therse no 3DNOW+MMX2 one
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	86 //Plain C versions
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	87 #undef HAVE_MMX
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	88 #undef HAVE_MMX2
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	89 #undef HAVE_3DNOW
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	90 #undef ARCH_X86
5338 2819346c6049 10l michael parents: 5337 diff changeset	91 #undef HAVE_SSE2
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	92 #define RENAME(a) a ## _C
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	93 #include "rgb2rgb_template.c"
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	94
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	95 #ifdef CAN_COMPILE_X86_ASM
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	96
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	97 //MMX versions
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	98 #undef RENAME
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	99 #define HAVE_MMX
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	100 #undef HAVE_MMX2
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	101 #undef HAVE_3DNOW
5338 2819346c6049 10l michael parents: 5337 diff changeset	102 #undef HAVE_SSE2
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	103 #define ARCH_X86
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	104 #define RENAME(a) a ## _MMX
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	105 #include "rgb2rgb_template.c"
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	106
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	107 //MMX2 versions
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	108 #undef RENAME
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	109 #define HAVE_MMX
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	110 #define HAVE_MMX2
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	111 #undef HAVE_3DNOW
5338 2819346c6049 10l michael parents: 5337 diff changeset	112 #undef HAVE_SSE2
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	113 #define ARCH_X86
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	114 #define RENAME(a) a ## _MMX2
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	115 #include "rgb2rgb_template.c"
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	116
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	117 //3DNOW versions
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	118 #undef RENAME
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	119 #define HAVE_MMX
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	120 #undef HAVE_MMX2
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	121 #define HAVE_3DNOW
5338 2819346c6049 10l michael parents: 5337 diff changeset	122 #undef HAVE_SSE2
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	123 #define ARCH_X86
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	124 #define RENAME(a) a ## _3DNow
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	125 #include "rgb2rgb_template.c"
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	126
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	127 #endif //CAN_COMPILE_X86_ASM
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	128
/**
 * Runtime-dispatching entry point for the rgb24to32 converter.
 *
 * When the x86 asm variants are built, the variant is chosen from the CPU
 * flags in gCpuCaps (MMX2, then 3DNow, then MMX, else plain C); otherwise
 * the plain C variant is always used. All arguments are forwarded unchanged.
 *
 * @param src      source pixel buffer (read only)
 * @param dst      destination pixel buffer
 * @param src_size size of the source data (presumably in bytes -- confirm
 *                 against rgb2rgb_template.c)
 */
void rgb24to32(const uint8_t *src, uint8_t *dst, unsigned src_size)
{
#ifdef CAN_COMPILE_X86_ASM
	// ordered by speed, fastest first
	if(gCpuCaps.hasMMX2)
		rgb24to32_MMX2(src, dst, src_size);
	else if(gCpuCaps.has3DNow)
		rgb24to32_3DNow(src, dst, src_size);
	else if(gCpuCaps.hasMMX)
		rgb24to32_MMX(src, dst, src_size);
	else
		rgb24to32_C(src, dst, src_size);
#else
	rgb24to32_C(src, dst, src_size);
#endif
}
2505 2aaa11d22f91 vo_vesa: more rgb2rgb support nick parents: 2504 diff changeset	145
/**
 * Runtime-dispatching entry point for the rgb32to24 converter.
 *
 * When the x86 asm variants are built, the variant is chosen from the CPU
 * flags in gCpuCaps (MMX2, then 3DNow, then MMX, else plain C); otherwise
 * the plain C variant is always used. All arguments are forwarded unchanged.
 *
 * @param src      source pixel buffer (read only)
 * @param dst      destination pixel buffer
 * @param src_size size of the source data (presumably in bytes -- confirm
 *                 against rgb2rgb_template.c)
 */
void rgb32to24(const uint8_t *src, uint8_t *dst, unsigned src_size)
{
#ifdef CAN_COMPILE_X86_ASM
	// ordered by speed, fastest first
	if(gCpuCaps.hasMMX2)
		rgb32to24_MMX2(src, dst, src_size);
	else if(gCpuCaps.has3DNow)
		rgb32to24_3DNow(src, dst, src_size);
	else if(gCpuCaps.hasMMX)
		rgb32to24_MMX(src, dst, src_size);
	else
		rgb32to24_C(src, dst, src_size);
#else
	rgb32to24_C(src, dst, src_size);
#endif
}
2506 501752469c39 vo_vesa: more rgb2rgb support nick parents: 2505 diff changeset	162
/*
 Original by Strepto/Astral
 ported to gcc & bugfixed : A'rpi
 MMX2, 3DNOW optimization by Nick Kurshev
 32bit c version, and and&add trick by Michael Niedermayer
*/
/**
 * Runtime-dispatching entry point for the rgb15to16 converter.
 *
 * When the x86 asm variants are built, the variant is chosen from the CPU
 * flags in gCpuCaps (MMX2, then 3DNow, then MMX, else plain C); otherwise
 * the plain C variant is always used. All arguments are forwarded unchanged.
 *
 * @param src      source pixel buffer (read only)
 * @param dst      destination pixel buffer
 * @param src_size size of the source data (presumably in bytes -- confirm
 *                 against rgb2rgb_template.c)
 */
void rgb15to16(const uint8_t *src, uint8_t *dst, unsigned src_size)
{
#ifdef CAN_COMPILE_X86_ASM
	// ordered by speed, fastest first
	if(gCpuCaps.hasMMX2)
		rgb15to16_MMX2(src, dst, src_size);
	else if(gCpuCaps.has3DNow)
		rgb15to16_3DNow(src, dst, src_size);
	else if(gCpuCaps.hasMMX)
		rgb15to16_MMX(src, dst, src_size);
	else
		rgb15to16_C(src, dst, src_size);
#else
	rgb15to16_C(src, dst, src_size);
#endif
}
2694 2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	185
/**
 * Expands 8-bit palette indices into 4-byte pixels.
 *
 * Palette is assumed to contain bgr32, i.e. 4 bytes per entry; entry k is
 * read from palette[4*k .. 4*k+3] and copied verbatim to the output.
 * The copy is done byte by byte, so neither dst nor palette needs any
 * particular alignment and no type-punned access is involved.
 *
 * @param src        num_pixels palette indices
 * @param dst        output buffer, receives 4*num_pixels bytes
 * @param num_pixels number of pixels to convert (0 is a no-op)
 * @param palette    palette table, 4 bytes per entry
 */
void palette8torgb32(const uint8_t *src, uint8_t *dst, unsigned num_pixels, const uint8_t *palette)
{
	unsigned i;
	for(i=0; i<num_pixels; i++)
	{
		const uint8_t *entry= palette + 4*(unsigned)src[i];
		dst[0]= entry[0];
		dst[1]= entry[1];
		dst[2]= entry[2];
		dst[3]= entry[3];
		dst+= 4;
	}
}
2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	195
/**
 * Expands 8-bit palette indices into 3-byte pixels.
 *
 * Palette is assumed to contain bgr32, i.e. 4 bytes per entry; only the
 * first three bytes of each entry are copied, the fourth is dropped.
 *
 * A one-store-per-pixel variant (writing a whole 32-bit palette entry at
 * dst + i*3) is deliberately not used: it writes 1 byte too much and might
 * cause alignment issues on some architectures.
 *
 * @param src        num_pixels palette indices
 * @param dst        output buffer, receives 3*num_pixels bytes
 * @param num_pixels number of pixels to convert (0 is a no-op)
 * @param palette    palette table, 4 bytes per entry
 */
void palette8torgb24(const uint8_t *src, uint8_t *dst, unsigned num_pixels, const uint8_t *palette)
{
	unsigned i;
	for(i=0; i<num_pixels; i++)
	{
		//FIXME slow?
		const uint8_t *entry= palette + 4*(unsigned)src[i];
		dst[0]= entry[0];
		dst[1]= entry[1];
		dst[2]= entry[2];
		dst+= 3;
	}
}
1eaf3f89e49f palette to bgr24 michael parents: 2694 diff changeset	216
/**
 * Runtime-dispatching entry point for the bgr24torgb24 converter.
 *
 * When the x86 asm variants are built, the variant is chosen from the CPU
 * flags in gCpuCaps (MMX2, then 3DNow, then MMX, else plain C); otherwise
 * the plain C variant is always used. All arguments are forwarded unchanged.
 *
 * @param src      source pixel buffer (read only)
 * @param dst      destination pixel buffer
 * @param src_size size of the source data (presumably in bytes -- confirm
 *                 against rgb2rgb_template.c)
 */
void bgr24torgb24(const uint8_t *src, uint8_t *dst, unsigned src_size)
{
#ifdef CAN_COMPILE_X86_ASM
	// ordered by speed, fastest first
	if(gCpuCaps.hasMMX2)
		bgr24torgb24_MMX2(src, dst, src_size);
	else if(gCpuCaps.has3DNow)
		bgr24torgb24_3DNow(src, dst, src_size);
	else if(gCpuCaps.hasMMX)
		bgr24torgb24_MMX(src, dst, src_size);
	else
		bgr24torgb24_C(src, dst, src_size);
#else
	bgr24torgb24_C(src, dst, src_size);
#endif
}
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	233
/**
 * Runtime-dispatching entry point for the rgb32to16 converter.
 *
 * When the x86 asm variants are built, the variant is chosen from the CPU
 * flags in gCpuCaps (MMX2, then 3DNow, then MMX, else plain C); otherwise
 * the plain C variant is always used. All arguments are forwarded unchanged.
 *
 * @param src      source pixel buffer (read only)
 * @param dst      destination pixel buffer
 * @param src_size size of the source data (presumably in bytes -- confirm
 *                 against rgb2rgb_template.c)
 */
void rgb32to16(const uint8_t *src, uint8_t *dst, unsigned src_size)
{
#ifdef CAN_COMPILE_X86_ASM
	// ordered by speed, fastest first
	if(gCpuCaps.hasMMX2)
		rgb32to16_MMX2(src, dst, src_size);
	else if(gCpuCaps.has3DNow)
		rgb32to16_3DNow(src, dst, src_size);
	else if(gCpuCaps.hasMMX)
		rgb32to16_MMX(src, dst, src_size);
	else
		rgb32to16_C(src, dst, src_size);
#else
	rgb32to16_C(src, dst, src_size);
#endif
}
2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	250
/**
 * Runtime-dispatching entry point for the rgb32to15 converter.
 *
 * When the x86 asm variants are built, the variant is chosen from the CPU
 * flags in gCpuCaps (MMX2, then 3DNow, then MMX, else plain C); otherwise
 * the plain C variant is always used. All arguments are forwarded unchanged.
 *
 * @param src      source pixel buffer (read only)
 * @param dst      destination pixel buffer
 * @param src_size size of the source data (presumably in bytes -- confirm
 *                 against rgb2rgb_template.c)
 */
void rgb32to15(const uint8_t *src, uint8_t *dst, unsigned src_size)
{
#ifdef CAN_COMPILE_X86_ASM
	// ordered by speed, fastest first
	if(gCpuCaps.hasMMX2)
		rgb32to15_MMX2(src, dst, src_size);
	else if(gCpuCaps.has3DNow)
		rgb32to15_3DNow(src, dst, src_size);
	else if(gCpuCaps.hasMMX)
		rgb32to15_MMX(src, dst, src_size);
	else
		rgb32to15_C(src, dst, src_size);
#else
	rgb32to15_C(src, dst, src_size);
#endif
}
2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	267
2718 9c5e64493742 Well - old algorithms and new stuff rgb24to16(15) nick parents: 2711 diff changeset	268 void rgb24to16(const uint8_t src, uint8_t dst, unsigned src_size)
9c5e64493742 Well - old algorithms and new stuff rgb24to16(15) nick parents: 2711 diff changeset	269 {
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	270 #ifdef CAN_COMPILE_X86_ASM
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	271 // ordered by speed, fastest first
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	272 if(gCpuCaps.hasMMX2)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	273 rgb24to16_MMX2(src, dst, src_size);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	274 else if(gCpuCaps.has3DNow)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	275 rgb24to16_3DNow(src, dst, src_size);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	276 else if(gCpuCaps.hasMMX)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	277 rgb24to16_MMX(src, dst, src_size);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	278 else
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	279 rgb24to16_C(src, dst, src_size);
2740 1583214489a2 optimized rgb24to16 stuff nick parents: 2738 diff changeset	280 #else
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	281 rgb24to16_C(src, dst, src_size);
2740 1583214489a2 optimized rgb24to16 stuff nick parents: 2738 diff changeset	282 #endif
2718 9c5e64493742 Well - old algorithms and new stuff rgb24to16(15) nick parents: 2711 diff changeset	283 }
9c5e64493742 Well - old algorithms and new stuff rgb24to16(15) nick parents: 2711 diff changeset	284
9c5e64493742 Well - old algorithms and new stuff rgb24to16(15) nick parents: 2711 diff changeset	285 void rgb24to15(const uint8_t *src, uint8_t *dst, unsigned src_size)
9c5e64493742 Well - old algorithms and new stuff rgb24to16(15) nick parents: 2711 diff changeset	286 {
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	287 #ifdef CAN_COMPILE_X86_ASM
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	288 // ordered by speed, fastest first
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	289 if(gCpuCaps.hasMMX2)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	290 rgb24to15_MMX2(src, dst, src_size);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	291 else if(gCpuCaps.has3DNow)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	292 rgb24to15_3DNow(src, dst, src_size);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	293 else if(gCpuCaps.hasMMX)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	294 rgb24to15_MMX(src, dst, src_size);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	295 else
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	296 rgb24to15_C(src, dst, src_size);
2741 b8a692c59b64 MMX2, 3DNOW, MMX optimized rgb32(24)to16(15) stuff nick parents: 2740 diff changeset	297 #else
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	298 rgb24to15_C(src, dst, src_size);
2741 b8a692c59b64 MMX2, 3DNOW, MMX optimized rgb32(24)to16(15) stuff nick parents: 2740 diff changeset	299 #endif
2718 9c5e64493742 Well - old algorithms and new stuff rgb24to16(15) nick parents: 2711 diff changeset	300 }
2694 2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	301
2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	302 /**
2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	303 * Palette is assumed to contain bgr16, see rgb32to16 to convert the palette
2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	304 */
2718 9c5e64493742 Well - old algorithms and new stuff rgb24to16(15) nick parents: 2711 diff changeset	305 void palette8torgb16(const uint8_t *src, uint8_t *dst, unsigned num_pixels, const uint8_t *palette)
2694 2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	306 {
2718 9c5e64493742 Well - old algorithms and new stuff rgb24to16(15) nick parents: 2711 diff changeset	307 unsigned i;
2702 440312d953a8 yv12toyuy2 in MMX michael parents: 2701 diff changeset	308 for(i=0; i<num_pixels; i++)
2694 2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	309 ((uint16_t *)dst)[i] = ((uint16_t *)palette)[ src[i] ];
2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	310 }
2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	311
2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	312 /**
2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	313 * Palette is assumed to contain bgr15, see rgb32to15 to convert the palette
2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	314 */
2718 9c5e64493742 Well - old algorithms and new stuff rgb24to16(15) nick parents: 2711 diff changeset	315 void palette8torgb15(const uint8_t *src, uint8_t *dst, unsigned num_pixels, const uint8_t *palette)
2694 2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	316 {
2718 9c5e64493742 Well - old algorithms and new stuff rgb24to16(15) nick parents: 2711 diff changeset	317 unsigned i;
2702 440312d953a8 yv12toyuy2 in MMX michael parents: 2701 diff changeset	318 for(i=0; i<num_pixels; i++)
2694 2924350d92ed bgr32to16, bgr32to15 (needed for palette stuff) michael parents: 2677 diff changeset	319 ((uint16_t *)dst)[i] = ((uint16_t *)palette)[ src[i] ];
2697 1eaf3f89e49f palette to bgr24 michael parents: 2694 diff changeset	320 }
2755 2f93f4351765 rgb32tobgr32 / bgr32torgb32 michael parents: 2746 diff changeset	321
2f93f4351765 rgb32tobgr32 / bgr32torgb32 michael parents: 2746 diff changeset	322 void rgb32tobgr32(const uint8_t *src, uint8_t *dst, unsigned int src_size)
2f93f4351765 rgb32tobgr32 / bgr32torgb32 michael parents: 2746 diff changeset	323 {
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	324 #ifdef CAN_COMPILE_X86_ASM
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	325 // ordered by speed, fastest first
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	326 if(gCpuCaps.hasMMX2)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	327 rgb32tobgr32_MMX2(src, dst, src_size);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	328 else if(gCpuCaps.has3DNow)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	329 rgb32tobgr32_3DNow(src, dst, src_size);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	330 else if(gCpuCaps.hasMMX)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	331 rgb32tobgr32_MMX(src, dst, src_size);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	332 else
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	333 rgb32tobgr32_C(src, dst, src_size);
2755 2f93f4351765 rgb32tobgr32 / bgr32torgb32 michael parents: 2746 diff changeset	334 #else
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	335 rgb32tobgr32_C(src, dst, src_size);
2755 2f93f4351765 rgb32tobgr32 / bgr32torgb32 michael parents: 2746 diff changeset	336 #endif
2f93f4351765 rgb32tobgr32 / bgr32torgb32 michael parents: 2746 diff changeset	337 }
2f93f4351765 rgb32tobgr32 / bgr32torgb32 michael parents: 2746 diff changeset	338
5582 21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	339 void rgb24tobgr24(const uint8_t *src, uint8_t *dst, unsigned int src_size)
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	340 {
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	341 #ifdef CAN_COMPILE_X86_ASM
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	342 // ordered by speed, fastest first
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	343 if(gCpuCaps.hasMMX2)
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	344 rgb24tobgr24_MMX2(src, dst, src_size);
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	345 else if(gCpuCaps.has3DNow)
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	346 rgb24tobgr24_3DNow(src, dst, src_size);
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	347 else if(gCpuCaps.hasMMX)
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	348 rgb24tobgr24_MMX(src, dst, src_size);
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	349 else
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	350 rgb24tobgr24_C(src, dst, src_size);
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	351 #else
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	352 rgb24tobgr24_C(src, dst, src_size);
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	353 #endif
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	354 }
21bd4b32abb4 rgb24->bgr24 michael parents: 5338 diff changeset	355
2702 440312d953a8 yv12toyuy2 in MMX michael parents: 2701 diff changeset	356 /**
440312d953a8 yv12toyuy2 in MMX michael parents: 2701 diff changeset	357 *
2724 c08b7af26782 yuy2toyv12 fixed and speedup michael parents: 2723 diff changeset	358 * height should be a multiple of 2 and width should be a multiple of 16 (if this is a
c08b7af26782 yuy2toyv12 fixed and speedup michael parents: 2723 diff changeset	359 * problem for anyone then tell me, and I'll fix it)
2702 440312d953a8 yv12toyuy2 in MMX michael parents: 2701 diff changeset	360 */
2723 22aba8af94af fixed yv12toyuy2 michael parents: 2720 diff changeset	361 void yv12toyuy2(const uint8_t *ysrc, const uint8_t *usrc, const uint8_t *vsrc, uint8_t *dst,
2725 5bba527c9a4c unsigned stuff michael parents: 2724 diff changeset	362 unsigned int width, unsigned int height,
5bba527c9a4c unsigned stuff michael parents: 2724 diff changeset	363 unsigned int lumStride, unsigned int chromStride, unsigned int dstStride)
2701 9b47bc409083 yv12 <-> yuy2 in C michael parents: 2698 diff changeset	364 {
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	365 #ifdef CAN_COMPILE_X86_ASM
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	366 // ordered by speed, fastest first
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	367 if(gCpuCaps.hasMMX2)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	368 yv12toyuy2_MMX2(ysrc, usrc, vsrc, dst, width, height, lumStride, chromStride, dstStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	369 else if(gCpuCaps.has3DNow)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	370 yv12toyuy2_3DNow(ysrc, usrc, vsrc, dst, width, height, lumStride, chromStride, dstStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	371 else if(gCpuCaps.hasMMX)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	372 yv12toyuy2_MMX(ysrc, usrc, vsrc, dst, width, height, lumStride, chromStride, dstStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	373 else
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	374 yv12toyuy2_C(ysrc, usrc, vsrc, dst, width, height, lumStride, chromStride, dstStride);
2702 440312d953a8 yv12toyuy2 in MMX michael parents: 2701 diff changeset	375 #else
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	376 yv12toyuy2_C(ysrc, usrc, vsrc, dst, width, height, lumStride, chromStride, dstStride);
2702 440312d953a8 yv12toyuy2 in MMX michael parents: 2701 diff changeset	377 #endif
2701 9b47bc409083 yv12 <-> yuy2 in C michael parents: 2698 diff changeset	378 }
9b47bc409083 yv12 <-> yuy2 in C michael parents: 2698 diff changeset	379
2724 c08b7af26782 yuy2toyv12 fixed and speedup michael parents: 2723 diff changeset	380 /**
c08b7af26782 yuy2toyv12 fixed and speedup michael parents: 2723 diff changeset	381 *
5588 f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	382 * width should be a multiple of 16
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	383 */
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	384 void yuv422ptoyuy2(const uint8_t *ysrc, const uint8_t *usrc, const uint8_t *vsrc, uint8_t *dst,
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	385 unsigned int width, unsigned int height,
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	386 unsigned int lumStride, unsigned int chromStride, unsigned int dstStride)
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	387 {
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	388 #ifdef CAN_COMPILE_X86_ASM
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	389 // ordered by speed, fastest first
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	390 if(gCpuCaps.hasMMX2)
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	391 yuv422ptoyuy2_MMX2(ysrc, usrc, vsrc, dst, width, height, lumStride, chromStride, dstStride);
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	392 else if(gCpuCaps.has3DNow)
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	393 yuv422ptoyuy2_3DNow(ysrc, usrc, vsrc, dst, width, height, lumStride, chromStride, dstStride);
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	394 else if(gCpuCaps.hasMMX)
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	395 yuv422ptoyuy2_MMX(ysrc, usrc, vsrc, dst, width, height, lumStride, chromStride, dstStride);
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	396 else
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	397 yuv422ptoyuy2_C(ysrc, usrc, vsrc, dst, width, height, lumStride, chromStride, dstStride);
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	398 #else
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	399 yuv422ptoyuy2_C(ysrc, usrc, vsrc, dst, width, height, lumStride, chromStride, dstStride);
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	400 #endif
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	401 }
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	402
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	403 /**
f0fa3373f616 yuv422p -> yuy2 (untested) michael parents: 5582 diff changeset	404 *
2724 c08b7af26782 yuy2toyv12 fixed and speedup michael parents: 2723 diff changeset	405 * height should be a multiple of 2 and width should be a multiple of 16 (if this is a
c08b7af26782 yuy2toyv12 fixed and speedup michael parents: 2723 diff changeset	406 * problem for anyone then tell me, and I'll fix it)
c08b7af26782 yuy2toyv12 fixed and speedup michael parents: 2723 diff changeset	407 */
c08b7af26782 yuy2toyv12 fixed and speedup michael parents: 2723 diff changeset	408 void yuy2toyv12(const uint8_t *src, uint8_t *ydst, uint8_t *udst, uint8_t *vdst,
2725 5bba527c9a4c unsigned stuff michael parents: 2724 diff changeset	409 unsigned int width, unsigned int height,
5bba527c9a4c unsigned stuff michael parents: 2724 diff changeset	410 unsigned int lumStride, unsigned int chromStride, unsigned int srcStride)
2701 9b47bc409083 yv12 <-> yuy2 in C michael parents: 2698 diff changeset	411 {
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	412 #ifdef CAN_COMPILE_X86_ASM
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	413 // ordered by speed, fastest first
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	414 if(gCpuCaps.hasMMX2)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	415 yuy2toyv12_MMX2(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	416 else if(gCpuCaps.has3DNow)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	417 yuy2toyv12_3DNow(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	418 else if(gCpuCaps.hasMMX)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	419 yuy2toyv12_MMX(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	420 else
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	421 yuy2toyv12_C(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
2704 b4c6699d3893 yuy2toyv12 in MMX michael parents: 2702 diff changeset	422 #else
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	423 yuy2toyv12_C(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
2704 b4c6699d3893 yuy2toyv12 in MMX michael parents: 2702 diff changeset	424 #endif
2723 22aba8af94af fixed yv12toyuy2 michael parents: 2720 diff changeset	425 }
2801 318c240363c7 uyvy->uv12 added arpi parents: 2800 diff changeset	426
318c240363c7 uyvy->uv12 added arpi parents: 2800 diff changeset	427 /**
318c240363c7 uyvy->uv12 added arpi parents: 2800 diff changeset	428 *
318c240363c7 uyvy->uv12 added arpi parents: 2800 diff changeset	429 * height should be a multiple of 2 and width should be a multiple of 16 (if this is a
318c240363c7 uyvy->uv12 added arpi parents: 2800 diff changeset	430 * problem for anyone then tell me, and I'll fix it)
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	431 * chrominance data is only taken from every second line; others are ignored. FIXME: write HQ version
2801 318c240363c7 uyvy->uv12 added arpi parents: 2800 diff changeset	432 */
318c240363c7 uyvy->uv12 added arpi parents: 2800 diff changeset	433 void uyvytoyv12(const uint8_t *src, uint8_t *ydst, uint8_t *udst, uint8_t *vdst,
318c240363c7 uyvy->uv12 added arpi parents: 2800 diff changeset	434 unsigned int width, unsigned int height,
318c240363c7 uyvy->uv12 added arpi parents: 2800 diff changeset	435 unsigned int lumStride, unsigned int chromStride, unsigned int srcStride)
318c240363c7 uyvy->uv12 added arpi parents: 2800 diff changeset	436 {
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	437 #ifdef CAN_COMPILE_X86_ASM
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	438 // ordered by speed, fastest first
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	439 if(gCpuCaps.hasMMX2)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	440 uyvytoyv12_MMX2(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	441 else if(gCpuCaps.has3DNow)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	442 uyvytoyv12_3DNow(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	443 else if(gCpuCaps.hasMMX)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	444 uyvytoyv12_MMX(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	445 else
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	446 uyvytoyv12_C(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
2847 1d92268eb8fc uyvytoyv12 in MMX (untested) michael parents: 2806 diff changeset	447 #else
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	448 uyvytoyv12_C(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
2847 1d92268eb8fc uyvytoyv12 in MMX (untested) michael parents: 2806 diff changeset	449 #endif
2801 318c240363c7 uyvy->uv12 added arpi parents: 2800 diff changeset	450 }
318c240363c7 uyvy->uv12 added arpi parents: 2800 diff changeset	451
6484 c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	452 void yvu9toyv12(const uint8_t *ysrc, const uint8_t *usrc, const uint8_t *vsrc,
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	453 uint8_t *ydst, uint8_t *udst, uint8_t *vdst,
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	454 unsigned int width, unsigned int height,
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	455 unsigned int lumStride, unsigned int chromStride)
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	456 {
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	457 #ifdef CAN_COMPILE_X86_ASM
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	458 // ordered by speed, fastest first
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	459 if(gCpuCaps.hasMMX2)
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	460 yvu9toyv12_MMX2(ysrc, usrc, vsrc, ydst, udst, vdst, width, height, lumStride, chromStride);
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	461 else if(gCpuCaps.has3DNow)
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	462 yvu9toyv12_3DNow(ysrc, usrc, vsrc, ydst, udst, vdst, width, height, lumStride, chromStride);
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	463 else if(gCpuCaps.hasMMX)
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	464 yvu9toyv12_MMX(ysrc, usrc, vsrc, ydst, udst, vdst, width, height, lumStride, chromStride);
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	465 else
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	466 yvu9toyv12_C(ysrc, usrc, vsrc, ydst, udst, vdst, width, height, lumStride, chromStride);
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	467 #else
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	468 yvu9toyv12_C(ysrc, usrc, vsrc, ydst, udst, vdst, width, height, lumStride, chromStride);
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	469 #endif
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	470 }
c5cf988c6d6f pre-yvu9toyv12 converter, only grayscale Y-plane coping :) alex parents: 5588 diff changeset	471
3132 ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	472 /**
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	473 *
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	474 * height should be a multiple of 2 and width should be a multiple of 2 (if this is a
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	475 * problem for anyone then tell me, and I'll fix it)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	476 * chrominance data is only taken from every second line; others are ignored. FIXME: write HQ version
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	477 */
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	478 void rgb24toyv12(const uint8_t *src, uint8_t *ydst, uint8_t *udst, uint8_t *vdst,
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	479 unsigned int width, unsigned int height,
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	480 unsigned int lumStride, unsigned int chromStride, unsigned int srcStride)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	481 {
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	482 #ifdef CAN_COMPILE_X86_ASM
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	483 // ordered by speed, fastest first
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	484 if(gCpuCaps.hasMMX2)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	485 rgb24toyv12_MMX2(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	486 else if(gCpuCaps.has3DNow)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	487 rgb24toyv12_3DNow(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	488 else if(gCpuCaps.hasMMX)
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	489 rgb24toyv12_MMX(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	490 else
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	491 rgb24toyv12_C(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	492 #else
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	493 rgb24toyv12_C(src, ydst, udst, vdst, width, height, lumStride, chromStride, srcStride);
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	494 #endif
ab67556586fa runtime cpu detection michael parents: 2847 diff changeset	495 }
5337 0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	496
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	497 void interleaveBytes(uint8_t *src1, uint8_t *src2, uint8_t *dst,
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	498 int width, int height, int src1Stride, int src2Stride, int dstStride)
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	499 {
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	500 #ifdef CAN_COMPILE_X86_ASM
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	501 // ordered by speed, fastest first
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	502 if(gCpuCaps.hasMMX2)
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	503 interleaveBytes_MMX2(src1, src2, dst, width, height, src1Stride, src2Stride, dstStride);
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	504 else if(gCpuCaps.has3DNow)
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	505 interleaveBytes_3DNow(src1, src2, dst, width, height, src1Stride, src2Stride, dstStride);
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	506 else if(gCpuCaps.hasMMX)
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	507 interleaveBytes_MMX(src1, src2, dst, width, height, src1Stride, src2Stride, dstStride);
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	508 else
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	509 interleaveBytes_C(src1, src2, dst, width, height, src1Stride, src2Stride, dstStride);
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	510 #else
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	511 interleaveBytes_C(src1, src2, dst, width, height, src1Stride, src2Stride, dstStride);
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	512 #endif
0bd1c35aa42c byte interleaving for mga michael parents: 4923 diff changeset	513 }

Mercurial > mplayer.hg

annotate postproc/rgb2rgb.c @ 6484:c5cf988c6d6f