mplayer.hg: libvo/yuv2rgb

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

2 /*

3b5f5d1c5041 Initial revision

arpi_esp

parents:

3 * yuv2rgb_mmx.c, Software YUV to RGB converter with Intel MMX "technology"

3b5f5d1c5041 Initial revision

arpi_esp

parents:

4 *

3b5f5d1c5041 Initial revision

arpi_esp

parents:

3b5f5d1c5041 Initial revision

arpi_esp

parents:

3b5f5d1c5041 Initial revision

arpi_esp

parents:

7 *

3b5f5d1c5041 Initial revision

arpi_esp

parents:

8 * Author: Olie Lho <ollie@sis.com.tw>

3b5f5d1c5041 Initial revision

arpi_esp

parents:

9 *

3b5f5d1c5041 Initial revision

arpi_esp

parents:

10 * This file is part of mpeg2dec, a free MPEG-2 video decoder

3b5f5d1c5041 Initial revision

arpi_esp

parents:

11 *

3b5f5d1c5041 Initial revision

arpi_esp

parents:

12 * mpeg2dec is free software; you can redistribute it and/or modify

3b5f5d1c5041 Initial revision

arpi_esp

parents:

13 * it under the terms of the GNU General Public License as published by

3b5f5d1c5041 Initial revision

arpi_esp

parents:

14 * the Free Software Foundation; either version 2, or (at your option)

3b5f5d1c5041 Initial revision

arpi_esp

parents:

15 * any later version.

3b5f5d1c5041 Initial revision

arpi_esp

parents:

16 *

3b5f5d1c5041 Initial revision

arpi_esp

parents:

17 * mpeg2dec is distributed in the hope that it will be useful,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

18 * but WITHOUT ANY WARRANTY; without even the implied warranty of

3b5f5d1c5041 Initial revision

arpi_esp

parents:

19 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

3b5f5d1c5041 Initial revision

arpi_esp

parents:

20 * GNU General Public License for more details.

3b5f5d1c5041 Initial revision

arpi_esp

parents:

21 *

3b5f5d1c5041 Initial revision

arpi_esp

parents:

22 * You should have received a copy of the GNU General Public License

3b5f5d1c5041 Initial revision

arpi_esp

parents:

23 * along with GNU Make; see the file COPYING. If not, write to

3b5f5d1c5041 Initial revision

arpi_esp

parents:

24 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.

3b5f5d1c5041 Initial revision

arpi_esp

parents:

25 *

3b5f5d1c5041 Initial revision

arpi_esp

parents:

26 */

3b5f5d1c5041 Initial revision

arpi_esp

parents:

27

3b5f5d1c5041 Initial revision

arpi_esp

parents:

28 #include <stdio.h>

3b5f5d1c5041 Initial revision

arpi_esp

parents:

29 #include <stdlib.h>

3b5f5d1c5041 Initial revision

arpi_esp

parents:

30

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

31 #include "../config.h"

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

32

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

33 #include "mmx.h"

3b5f5d1c5041 Initial revision

arpi_esp

parents:

34 //#include "libmpeg2/mpeg2.h"

3b5f5d1c5041 Initial revision

arpi_esp

parents:

35 //#include "libmpeg2/mpeg2_internal.h"

3b5f5d1c5041 Initial revision

arpi_esp

parents:

36 #include <inttypes.h>

3b5f5d1c5041 Initial revision

arpi_esp

parents:

37

3b5f5d1c5041 Initial revision

arpi_esp

parents:

38 #include "yuv2rgb.h"

3b5f5d1c5041 Initial revision

arpi_esp

parents:

39

3b5f5d1c5041 Initial revision

arpi_esp

parents:

40 /* hope these constant values are cache line aligned */

3b5f5d1c5041 Initial revision

arpi_esp

parents:

41 uint64_t mmx_80w = 0x0080008000800080;

3b5f5d1c5041 Initial revision

arpi_esp

parents:

42 uint64_t mmx_10w = 0x1010101010101010;

3b5f5d1c5041 Initial revision

arpi_esp

parents:

43 uint64_t mmx_00ffw = 0x00ff00ff00ff00ff;

3b5f5d1c5041 Initial revision

arpi_esp

parents:

44 uint64_t mmx_Y_coeff = 0x253f253f253f253f;

3b5f5d1c5041 Initial revision

arpi_esp

parents:

45

3b5f5d1c5041 Initial revision

arpi_esp

parents:

46 /* hope these constant values are cache line aligned */

3b5f5d1c5041 Initial revision

arpi_esp

parents:

47 uint64_t mmx_U_green = 0xf37df37df37df37d;

3b5f5d1c5041 Initial revision

arpi_esp

parents:

48 uint64_t mmx_U_blue = 0x4093409340934093;

3b5f5d1c5041 Initial revision

arpi_esp

parents:

49 uint64_t mmx_V_red = 0x3312331233123312;

3b5f5d1c5041 Initial revision

arpi_esp

parents:

50 uint64_t mmx_V_green = 0xe5fce5fce5fce5fc;

3b5f5d1c5041 Initial revision

arpi_esp

parents:

51

3b5f5d1c5041 Initial revision

arpi_esp

parents:

52 /* hope these constant values are cache line aligned */

3b5f5d1c5041 Initial revision

arpi_esp

parents:

53 uint64_t mmx_redmask = 0xf8f8f8f8f8f8f8f8;

3b5f5d1c5041 Initial revision

arpi_esp

parents:

54 uint64_t mmx_grnmask = 0xfcfcfcfcfcfcfcfc;

3b5f5d1c5041 Initial revision

arpi_esp

parents:

55 uint64_t mmx_grnshift = 0x03;

3b5f5d1c5041 Initial revision

arpi_esp

parents:

56 uint64_t mmx_blueshift = 0x03;

3b5f5d1c5041 Initial revision

arpi_esp

parents:

57

688

1a016347010a movntq causes SIGILL on k6-3. Lets it be for K7, P3 cpus only

nickols_k

parents: 1

58 #ifdef HAVE_MMX2

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

59 /* use this for K7 and p3 only */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

60 #define MOVNTQ "movntq"

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

61 #else

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

62 /* for MMX-only processors */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

63 #define MOVNTQ "movq"

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

64 #endif

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

65

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

66 #if !defined( HAVE_MMX2) && defined( HAVE_3DNOW)

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

67 /* for K6 2/2+/3 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

68 #define EMMS "femms;"

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

69 #else

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

70 #define EMMS "emms;"

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

71 #endif

3b5f5d1c5041 Initial revision

arpi_esp

parents:

72

3b5f5d1c5041 Initial revision

arpi_esp

parents:

73 static void yuv420_rgb16_mmx (uint8_t * image, uint8_t * py,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

74 uint8_t * pu, uint8_t * pv,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

75 int h_size, int v_size,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

76 int rgb_stride, int y_stride, int uv_stride)

3b5f5d1c5041 Initial revision

arpi_esp

parents:

77 {

3b5f5d1c5041 Initial revision

arpi_esp

parents:

78 int even = 1;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

79 int x, y;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

80

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

81 __asm__ __volatile__ ("pxor %mm4, %mm4;" /* zero mm4 */ );

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

82

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

83 for (y = v_size; --y >= 0; ) {

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

84 uint8_t *_image = image;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

85 uint8_t *_py = py;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

86 uint8_t *_pu = pu;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

87 uint8_t *_pv = pv;

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

88

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

89 /* load data for start of next scan line */

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

90 __asm__ __volatile__ (

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

91 "movd (%1), %%mm0;" /* Load 4 Cb 00 00 00 00 u3 u2 u1 u0 */

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

92 "movd (%2), %%mm1;" /* Load 4 Cr 00 00 00 00 v3 v2 v1 v0 */

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

93 "movq (%0), %%mm6;" /* Load 8 Y Y7 Y6 Y5 Y4 Y3 Y2 Y1 Y0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

94

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

95 : : "r" (_py), "r" (_pu), "r" (_pv));

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

96

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

97 for (x = h_size >> 3; --x >= 0; ) {

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

98 /* this mmx assembly code deals with a SINGLE scan line at a time; it converts 8

3b5f5d1c5041 Initial revision

arpi_esp

parents:

99 pixels in each iteration */

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

100

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

101 __asm__ __volatile__ (

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

102 /* Do the multiply part of the conversion for even and odd pixels,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

103 register usage:

3b5f5d1c5041 Initial revision

arpi_esp

parents:

104 mm0 -> Cblue, mm1 -> Cred, mm2 -> Cgreen even pixels,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

105 mm3 -> Cblue, mm4 -> Cred, mm5 -> Cgreen odd pixels,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

106 mm6 -> Y even, mm7 -> Y odd */

3b5f5d1c5041 Initial revision

arpi_esp

parents:

107 /* convert the chroma part */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

108 "punpcklbw %%mm4, %%mm0;" /* scatter 4 Cb 00 u3 00 u2 00 u1 00 u0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

109 "punpcklbw %%mm4, %%mm1;" /* scatter 4 Cr 00 v3 00 v2 00 v1 00 v0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

110

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

111 "psubsw mmx_80w, %%mm0;" /* Cb -= 128 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

112 "psubsw mmx_80w, %%mm1;" /* Cr -= 128 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

113

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

114 "psllw $3, %%mm0;" /* Promote precision */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

115 "psllw $3, %%mm1;" /* Promote precision */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

116

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

117 "movq %%mm0, %%mm2;" /* Copy 4 Cb 00 u3 00 u2 00 u1 00 u0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

118 "movq %%mm1, %%mm3;" /* Copy 4 Cr 00 v3 00 v2 00 v1 00 v0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

119

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

120 "pmulhw mmx_U_green, %%mm2;" /* Mul Cb with green coeff -> Cb green */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

121 "pmulhw mmx_V_green, %%mm3;" /* Mul Cr with green coeff -> Cr green */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

122

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

123 "pmulhw mmx_U_blue, %%mm0;" /* Mul Cb -> Cblue 00 b3 00 b2 00 b1 00 b0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

124 "pmulhw mmx_V_red, %%mm1;" /* Mul Cr -> Cred 00 r3 00 r2 00 r1 00 r0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

125

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

126 "paddsw %%mm3, %%mm2;" /* Cb green + Cr green -> Cgreen */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

127

3b5f5d1c5041 Initial revision

arpi_esp

parents:

128 /* convert the luma part */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

129 "psubusb mmx_10w, %%mm6;" /* Y -= 16 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

130

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

131 "movq %%mm6, %%mm7;" /* Copy 8 Y Y7 Y6 Y5 Y4 Y3 Y2 Y1 Y0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

132 "pand mmx_00ffw, %%mm6;" /* get Y even 00 Y6 00 Y4 00 Y2 00 Y0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

133

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

134 "psrlw $8, %%mm7;" /* get Y odd 00 Y7 00 Y5 00 Y3 00 Y1 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

135

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

136 "psllw $3, %%mm6;" /* Promote precision */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

137 "psllw $3, %%mm7;" /* Promote precision */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

138

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

139 "pmulhw mmx_Y_coeff, %%mm6;" /* Mul 4 Y even 00 y6 00 y4 00 y2 00 y0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

140 "pmulhw mmx_Y_coeff, %%mm7;" /* Mul 4 Y odd 00 y7 00 y5 00 y3 00 y1 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

141

3b5f5d1c5041 Initial revision

arpi_esp

parents:

142 /* Do the addition part of the conversion for even and odd pixels,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

143 register usage:

3b5f5d1c5041 Initial revision

arpi_esp

parents:

144 mm0 -> Cblue, mm1 -> Cred, mm2 -> Cgreen even pixels,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

145 mm3 -> Cblue, mm4 -> Cred, mm5 -> Cgreen odd pixels,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

146 mm6 -> Y even, mm7 -> Y odd */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

147 "movq %%mm0, %%mm3;" /* Copy Cblue */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

148 "movq %%mm1, %%mm4;" /* Copy Cred */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

149 "movq %%mm2, %%mm5;" /* Copy Cgreen */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

150

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

151 "paddsw %%mm6, %%mm0;" /* Y even + Cblue 00 B6 00 B4 00 B2 00 B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

152 "paddsw %%mm7, %%mm3;" /* Y odd + Cblue 00 B7 00 B5 00 B3 00 B1 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

153

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

154 "paddsw %%mm6, %%mm1;" /* Y even + Cred 00 R6 00 R4 00 R2 00 R0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

155 "paddsw %%mm7, %%mm4;" /* Y odd + Cred 00 R7 00 R5 00 R3 00 R1 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

156

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

157 "paddsw %%mm6, %%mm2;" /* Y even + Cgreen 00 G6 00 G4 00 G2 00 G0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

158 "paddsw %%mm7, %%mm5;" /* Y odd + Cgreen 00 G7 00 G5 00 G3 00 G1 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

159

3b5f5d1c5041 Initial revision

arpi_esp

parents:

160 /* Limit RGB even to 0..255 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

161 "packuswb %%mm0, %%mm0;" /* B6 B4 B2 B0 B6 B4 B2 B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

162 "packuswb %%mm1, %%mm1;" /* R6 R4 R2 R0 R6 R4 R2 R0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

163 "packuswb %%mm2, %%mm2;" /* G6 G4 G2 G0 G6 G4 G2 G0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

164

3b5f5d1c5041 Initial revision

arpi_esp

parents:

165 /* Limit RGB odd to 0..255 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

166 "packuswb %%mm3, %%mm3;" /* B7 B5 B3 B1 B7 B5 B3 B1 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

167 "packuswb %%mm4, %%mm4;" /* R7 R5 R3 R1 R7 R5 R3 R1 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

168 "packuswb %%mm5, %%mm5;" /* G7 G5 G3 G1 G7 G5 G3 G1 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

169

3b5f5d1c5041 Initial revision

arpi_esp

parents:

170 /* Interleave RGB even and odd */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

171 "punpcklbw %%mm3, %%mm0;" /* B7 B6 B5 B4 B3 B2 B1 B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

172 "punpcklbw %%mm4, %%mm1;" /* R7 R6 R5 R4 R3 R2 R1 R0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

173 "punpcklbw %%mm5, %%mm2;" /* G7 G6 G5 G4 G3 G2 G1 G0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

174

3b5f5d1c5041 Initial revision

arpi_esp

parents:

175 /* mask unneeded bits off */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

176 "pand mmx_redmask, %%mm0;" /* b7b6b5b4 b3_0_0_0 b7b6b5b4 b3_0_0_0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

177 "pand mmx_grnmask, %%mm2;" /* g7g6g5g4 g3g2_0_0 g7g6g5g4 g3g2_0_0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

178 "pand mmx_redmask, %%mm1;" /* r7r6r5r4 r3_0_0_0 r7r6r5r4 r3_0_0_0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

179

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

180 "psrlw mmx_blueshift,%%mm0;" /* 0_0_0_b7 b6b5b4b3 0_0_0_b7 b6b5b4b3 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

181 "pxor %%mm4, %%mm4;" /* zero mm4 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

182

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

183 "movq %%mm0, %%mm5;" /* Copy B7-B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

184 "movq %%mm2, %%mm7;" /* Copy G7-G0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

185

3b5f5d1c5041 Initial revision

arpi_esp

parents:

186 /* convert rgb24 plane to rgb16 pack for pixel 0-3 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

187 "punpcklbw %%mm4, %%mm2;" /* 0_0_0_0 0_0_0_0 g7g6g5g4 g3g2_0_0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

188 "punpcklbw %%mm1, %%mm0;" /* r7r6r5r4 r3_0_0_0 0_0_0_b7 b6b5b4b3 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

189

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

190 "psllw mmx_blueshift,%%mm2;" /* 0_0_0_0 0_g7g6g5 g4g3g2_0 0_0_0_0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

191 "por %%mm2, %%mm0;" /* r7r6r5r4 r3g7g6g5 g4g3g2b7 b6b5b4b3 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

192

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

193 "movq 8 (%0), %%mm6;" /* Load 8 Y Y7 Y6 Y5 Y4 Y3 Y2 Y1 Y0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

194 MOVNTQ " %%mm0, (%3);" /* store pixel 0-3 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

195

3b5f5d1c5041 Initial revision

arpi_esp

parents:

196 /* convert rgb24 plane to rgb16 pack for pixel 4-7 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

197 "punpckhbw %%mm4, %%mm7;" /* 0_0_0_0 0_0_0_0 g7g6g5g4 g3g2_0_0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

198 "punpckhbw %%mm1, %%mm5;" /* r7r6r5r4 r3_0_0_0 0_0_0_b7 b6b5b4b3 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

199

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

200 "psllw mmx_blueshift,%%mm7;" /* 0_0_0_0 0_g7g6g5 g4g3g2_0 0_0_0_0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

201 "movd 4 (%1), %%mm0;" /* Load 4 Cb 00 00 00 00 u3 u2 u1 u0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

202

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

203 "por %%mm7, %%mm5;" /* r7r6r5r4 r3g7g6g5 g4g3g2b7 b6b5b4b3 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

204 "movd 4 (%2), %%mm1;" /* Load 4 Cr 00 00 00 00 v3 v2 v1 v0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

205

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

206 MOVNTQ " %%mm5, 8 (%3);" /* store pixel 4-7 */

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

207 : : "r" (_py), "r" (_pu), "r" (_pv), "r" (_image));

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

208

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

209 _py += 8;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

210 _pu += 4;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

211 _pv += 4;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

212 _image += 16;

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

213 }

3b5f5d1c5041 Initial revision

arpi_esp

parents:

214

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

215 if (!even) {

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

216 pu += uv_stride;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

217 pv += uv_stride;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

218 }

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

219

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

220 py += y_stride;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

221 image += rgb_stride;

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

222

3b5f5d1c5041 Initial revision

arpi_esp

parents:

223 even = (!even);

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

224 }

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

225

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

226 __asm__ __volatile__ (EMMS);

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

227 }

3b5f5d1c5041 Initial revision

arpi_esp

parents:

228

3b5f5d1c5041 Initial revision

arpi_esp

parents:

229 static void yuv420_argb32_mmx (uint8_t * image, uint8_t * py,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

230 uint8_t * pu, uint8_t * pv,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

231 int h_size, int v_size,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

232 int rgb_stride, int y_stride, int uv_stride)

3b5f5d1c5041 Initial revision

arpi_esp

parents:

233 {

3b5f5d1c5041 Initial revision

arpi_esp

parents:

234 int even = 1;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

235 int x, y;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

236

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

237 __asm__ __volatile__ ("pxor %mm4, %mm4;" /* zero mm4 */ );

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

238

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

239 for (y = v_size; --y >= 0; ) {

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

240 uint8_t *_image = image;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

241 uint8_t *_py = py;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

242 uint8_t *_pu = pu;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

243 uint8_t *_pv = pv;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

244

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

245 /* load data for start of next scan line */

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

246 __asm__ __volatile__

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

247 (

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

248 "movd (%1), %%mm0;" /* Load 4 Cb 00 00 00 00 u3 u2 u1 u0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

249 "movd (%2), %%mm1;" /* Load 4 Cr 00 00 00 00 v3 v2 v1 v0 */

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

250 "movq (%0), %%mm6;" /* Load 8 Y Y7 Y6 Y5 Y4 Y3 Y2 Y1 Y0 */

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

251 : : "r" (_py), "r" (_pu), "r" (_pv)

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

252 );

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

253

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

254 for (x = h_size >> 3; --x >= 0; ) {

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

255 /* this mmx assembly code deals with a SINGLE scan line at a time; it converts 8

3b5f5d1c5041 Initial revision

arpi_esp

parents:

256 pixels in each iteration */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

257 __asm__ __volatile__ (

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

258 /* Do the multiply part of the conversion for even and odd pixels,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

259 register usage:

3b5f5d1c5041 Initial revision

arpi_esp

parents:

260 mm0 -> Cblue, mm1 -> Cred, mm2 -> Cgreen even pixels,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

261 mm3 -> Cblue, mm4 -> Cred, mm5 -> Cgreen odd pixels,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

262 mm6 -> Y even, mm7 -> Y odd */

3b5f5d1c5041 Initial revision

arpi_esp

parents:

263

3b5f5d1c5041 Initial revision

arpi_esp

parents:

264 /* convert the chroma part */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

265 "punpcklbw %%mm4, %%mm0;" /* scatter 4 Cb 00 u3 00 u2 00 u1 00 u0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

266 "punpcklbw %%mm4, %%mm1;" /* scatter 4 Cr 00 v3 00 v2 00 v1 00 v0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

267

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

268 "psubsw mmx_80w, %%mm0;" /* Cb -= 128 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

269 "psubsw mmx_80w, %%mm1;" /* Cr -= 128 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

270

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

271 "psllw $3, %%mm0;" /* Promote precision */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

272 "psllw $3, %%mm1;" /* Promote precision */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

273

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

274 "movq %%mm0, %%mm2;" /* Copy 4 Cb 00 u3 00 u2 00 u1 00 u0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

275 "movq %%mm1, %%mm3;" /* Copy 4 Cr 00 v3 00 v2 00 v1 00 v0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

276

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

277 "pmulhw mmx_U_green, %%mm2;" /* Mul Cb with green coeff -> Cb green */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

278 "pmulhw mmx_V_green, %%mm3;" /* Mul Cr with green coeff -> Cr green */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

279

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

280 "pmulhw mmx_U_blue, %%mm0;" /* Mul Cb -> Cblue 00 b3 00 b2 00 b1 00 b0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

281 "pmulhw mmx_V_red, %%mm1;" /* Mul Cr -> Cred 00 r3 00 r2 00 r1 00 r0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

282

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

283 "paddsw %%mm3, %%mm2;" /* Cb green + Cr green -> Cgreen */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

284

3b5f5d1c5041 Initial revision

arpi_esp

parents:

285 /* convert the luma part */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

286 "psubusb mmx_10w, %%mm6;" /* Y -= 16 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

287

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

288 "movq %%mm6, %%mm7;" /* Copy 8 Y Y7 Y6 Y5 Y4 Y3 Y2 Y1 Y0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

289 "pand mmx_00ffw, %%mm6;" /* get Y even 00 Y6 00 Y4 00 Y2 00 Y0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

290

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

291 "psrlw $8, %%mm7;" /* get Y odd 00 Y7 00 Y5 00 Y3 00 Y1 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

292

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

293 "psllw $3, %%mm6;" /* Promote precision */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

294 "psllw $3, %%mm7;" /* Promote precision */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

295

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

296 "pmulhw mmx_Y_coeff, %%mm6;" /* Mul 4 Y even 00 y6 00 y4 00 y2 00 y0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

297 "pmulhw mmx_Y_coeff, %%mm7;" /* Mul 4 Y odd 00 y7 00 y5 00 y3 00 y1 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

298

3b5f5d1c5041 Initial revision

arpi_esp

parents:

299 /* Do the addition part of the conversion for even and odd pixels,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

300 register usage:

3b5f5d1c5041 Initial revision

arpi_esp

parents:

301 mm0 -> Cblue, mm1 -> Cred, mm2 -> Cgreen even pixels,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

302 mm3 -> Cblue, mm4 -> Cred, mm5 -> Cgreen odd pixels,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

303 mm6 -> Y even, mm7 -> Y odd */

3b5f5d1c5041 Initial revision

arpi_esp

parents:

304

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

305 "movq %%mm0, %%mm3;" /* Copy Cblue */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

306 "movq %%mm1, %%mm4;" /* Copy Cred */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

307 "movq %%mm2, %%mm5;" /* Copy Cgreen */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

308

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

309 "paddsw %%mm6, %%mm0;" /* Y even + Cblue 00 B6 00 B4 00 B2 00 B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

310 "paddsw %%mm7, %%mm3;" /* Y odd + Cblue 00 B7 00 B5 00 B3 00 B1 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

311

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

312 "paddsw %%mm6, %%mm1;" /* Y even + Cred 00 R6 00 R4 00 R2 00 R0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

313 "paddsw %%mm7, %%mm4;" /* Y odd + Cred 00 R7 00 R5 00 R3 00 R1 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

314

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

315 "paddsw %%mm6, %%mm2;" /* Y even + Cgreen 00 G6 00 G4 00 G2 00 G0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

316 "paddsw %%mm7, %%mm5;" /* Y odd + Cgreen 00 G7 00 G5 00 G3 00 G1 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

317

3b5f5d1c5041 Initial revision

arpi_esp

parents:

318 /* Limit RGB even to 0..255 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

319 "packuswb %%mm0, %%mm0;" /* B6 B4 B2 B0 B6 B4 B2 B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

320 "packuswb %%mm1, %%mm1;" /* R6 R4 R2 R0 R6 R4 R2 R0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

321 "packuswb %%mm2, %%mm2;" /* G6 G4 G2 G0 G6 G4 G2 G0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

322

3b5f5d1c5041 Initial revision

arpi_esp

parents:

323 /* Limit RGB odd to 0..255 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

324 "packuswb %%mm3, %%mm3;" /* B7 B5 B3 B1 B7 B5 B3 B1 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

325 "packuswb %%mm4, %%mm4;" /* R7 R5 R3 R1 R7 R5 R3 R1 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

326 "packuswb %%mm5, %%mm5;" /* G7 G5 G3 G1 G7 G5 G3 G1 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

327

3b5f5d1c5041 Initial revision

arpi_esp

parents:

328 /* Interleave RGB even and odd */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

329 "punpcklbw %%mm3, %%mm0;" /* B7 B6 B5 B4 B3 B2 B1 B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

330 "punpcklbw %%mm4, %%mm1;" /* R7 R6 R5 R4 R3 R2 R1 R0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

331 "punpcklbw %%mm5, %%mm2;" /* G7 G6 G5 G4 G3 G2 G1 G0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

332

3b5f5d1c5041 Initial revision

arpi_esp

parents:

333 /* convert RGB plane to RGB packed format,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

334 mm0 -> B, mm1 -> R, mm2 -> G, mm3 -> 0,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

335 mm4 -> GB, mm5 -> AR pixel 4-7,

3b5f5d1c5041 Initial revision

arpi_esp

parents:

336 mm6 -> GB, mm7 -> AR pixel 0-3 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

337 "pxor %%mm3, %%mm3;" /* zero mm3 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

338

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

339 "movq %%mm0, %%mm6;" /* B7 B6 B5 B4 B3 B2 B1 B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

340 "movq %%mm1, %%mm7;" /* R7 R6 R5 R4 R3 R2 R1 R0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

341

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

342 "movq %%mm0, %%mm4;" /* B7 B6 B5 B4 B3 B2 B1 B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

343 "movq %%mm1, %%mm5;" /* R7 R6 R5 R4 R3 R2 R1 R0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

344

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

345 "punpcklbw %%mm2, %%mm6;" /* G3 B3 G2 B2 G1 B1 G0 B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

346 "punpcklbw %%mm3, %%mm7;" /* 00 R3 00 R2 00 R1 00 R0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

347

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

348 "punpcklwd %%mm7, %%mm6;" /* 00 R1 G1 B1 00 R0 G0 B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

349 MOVNTQ " %%mm6, (%3);" /* Store ARGB1 ARGB0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

350

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

351 "movq %%mm0, %%mm6;" /* B7 B6 B5 B4 B3 B2 B1 B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

352 "punpcklbw %%mm2, %%mm6;" /* G3 B3 G2 B2 G1 B1 G0 B0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

353

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

354 "punpckhwd %%mm7, %%mm6;" /* 00 R3 G3 B3 00 R2 G2 B2 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

355 MOVNTQ " %%mm6, 8 (%3);" /* Store ARGB3 ARGB2 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

356

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

357 "punpckhbw %%mm2, %%mm4;" /* G7 B7 G6 B6 G5 B5 G4 B4 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

358 "punpckhbw %%mm3, %%mm5;" /* 00 R7 00 R6 00 R5 00 R4 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

359

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

360 "punpcklwd %%mm5, %%mm4;" /* 00 R5 G5 B5 00 R4 G4 B4 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

361 MOVNTQ " %%mm4, 16 (%3);" /* Store ARGB5 ARGB4 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

362

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

363 "movq %%mm0, %%mm4;" /* B7 B6 B5 B4 B3 B2 B1 B0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

364 "punpckhbw %%mm2, %%mm4;" /* G7 B7 G6 B6 G5 B5 G4 B4 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

365

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

366 "punpckhwd %%mm5, %%mm4;" /* 00 R7 G7 B7 00 R6 G6 B6 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

367 MOVNTQ " %%mm4, 24 (%3);" /* Store ARGB7 ARGB6 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

368

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

369 "movd 4 (%1), %%mm0;" /* Load 4 Cb 00 00 00 00 u3 u2 u1 u0 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

370 "movd 4 (%2), %%mm1;" /* Load 4 Cr 00 00 00 00 v3 v2 v1 v0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

371

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

372 "pxor %%mm4, %%mm4;" /* zero mm4 */

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

373 "movq 8 (%0), %%mm6;" /* Load 8 Y Y7 Y6 Y5 Y4 Y3 Y2 Y1 Y0 */

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

374

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

375 : : "r" (_py), "r" (_pu), "r" (_pv), "r" (_image));

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

376

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

377 _py += 8;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

378 _pu += 4;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

379 _pv += 4;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

380 _image += 32;

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

381 }

3b5f5d1c5041 Initial revision

arpi_esp

parents:

382

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

383 if (!even) {

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

384 pu += uv_stride;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

385 pv += uv_stride;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

386 }

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

387

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

388 py += y_stride;

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

389 image += rgb_stride;

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

390

3b5f5d1c5041 Initial revision

arpi_esp

parents:

391 even = (!even);

7ce37211e454 yuv2rgb_mmx crashes with ffdivx codec, when we play back avi files that have

jkeil

parents: 1101

392 }

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

393

961f53221ffc Code cleanup and fix missing config.h and use femms on K6 2/2+/3.

atmosfear

parents: 1098

394 __asm__ __volatile__ (EMMS);

1

3b5f5d1c5041 Initial revision

arpi_esp

parents:

395 }

3b5f5d1c5041 Initial revision

arpi_esp

parents:

396

3b5f5d1c5041 Initial revision

arpi_esp

parents:

397 yuv2rgb_fun yuv2rgb_init_mmx (int bpp, int mode) /* Pick the MMX converter matching bpp/mode; NULL when none matches. */

3b5f5d1c5041 Initial revision

arpi_esp

parents:

398 {

3b5f5d1c5041 Initial revision

arpi_esp

parents:

399 // if (bpp == 15 || bpp == 16) {

3b5f5d1c5041 Initial revision

arpi_esp

parents:

400 if (bpp == 16 && mode == MODE_RGB) return yuv420_rgb16_mmx; /* 16 bpp, RGB mode */

3b5f5d1c5041 Initial revision

arpi_esp

parents:

401 if (bpp == 32 && mode == MODE_RGB) return yuv420_argb32_mmx; /* 32 bpp, RGB mode */

3b5f5d1c5041 Initial revision

arpi_esp

parents:

402 return NULL; // No MMX routine for this bpp/mode combination: fall back to C.

3b5f5d1c5041 Initial revision

arpi_esp

parents:

403 }

3b5f5d1c5041 Initial revision

arpi_esp

parents: