annotate postproc/swscale.h @ 5452:eb87391a5292

overread in the mmx2 horizontal scaler fixed 2% faster horizontal mmx2 scaler
author michael
date Mon, 01 Apr 2002 14:01:22 +0000
parents 16fdb694cf13
children 5ac294a77a87
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
4295
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
1 /*
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
2 Copyright (C) 2001-2002 Michael Niedermayer <michaelni@gmx.at>
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
3
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
4 This program is free software; you can redistribute it and/or modify
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
5 it under the terms of the GNU General Public License as published by
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
6 the Free Software Foundation; either version 2 of the License, or
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
7 (at your option) any later version.
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
8
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
9 This program is distributed in the hope that it will be useful,
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
12 GNU General Public License for more details.
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
13
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
14 You should have received a copy of the GNU General Public License
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
15 along with this program; if not, write to the Free Software
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
16 Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
67c56df76a44 copyright(swscaler) = GPL
michael
parents: 4294
diff changeset
17 */
3272
7e4399d1eb65 horizontal up/downscale linear & cubic
michael
parents: 3209
diff changeset
18
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
19 /* values for the flags, the stuff on the command line is different */
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
20 #define SWS_FAST_BILINEAR 1
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
21 #define SWS_BILINEAR 2
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
22 #define SWS_BICUBIC 4
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
23 #define SWS_X 8
4401
8d00348d0d6b nearest neighbor / sdl emulation ;) scaling (-sws 4)
michael
parents: 4297
diff changeset
24 #define SWS_POINT 0x10
4402
67abbf501b02 area averageing scaling support (-sws 5) (is identical to bilinear for upscale)
michael
parents: 4401
diff changeset
25 #define SWS_AREA 0x20
4467
9512d6832b38 YUY2, BGR24, BGR32 input support (no mmx yet)
michael
parents: 4419
diff changeset
26
9512d6832b38 YUY2, BGR24, BGR32 input support (no mmx yet)
michael
parents: 4419
diff changeset
27 //the following 4 flags are not completely implemented
9512d6832b38 YUY2, BGR24, BGR32 input support (no mmx yet)
michael
parents: 4419
diff changeset
28 //internal chrominance subsampling info
9512d6832b38 YUY2, BGR24, BGR32 input support (no mmx yet)
michael
parents: 4419
diff changeset
29 #define SWS_FULL_CHR_V 0x100
9512d6832b38 YUY2, BGR24, BGR32 input support (no mmx yet)
michael
parents: 4419
diff changeset
30 #define SWS_FULL_CHR_H_INT 0x200
9512d6832b38 YUY2, BGR24, BGR32 input support (no mmx yet)
michael
parents: 4419
diff changeset
31 //input subsampling info
9512d6832b38 YUY2, BGR24, BGR32 input support (no mmx yet)
michael
parents: 4419
diff changeset
32 #define SWS_FULL_CHR_H_INP 0x400
9512d6832b38 YUY2, BGR24, BGR32 input support (no mmx yet)
michael
parents: 4419
diff changeset
33 #define SWS_DIRECT_BGR 0x800
9512d6832b38 YUY2, BGR24, BGR32 input support (no mmx yet)
michael
parents: 4419
diff changeset
34
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
35 #define SWS_PRINT_INFO 0x1000
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
36
4290
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
37 #define SWS_MAX_REDUCE_CUTOFF 0.002
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
38
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
39 /* this struct should be aligned on at least a 32-byte boundary */
4554
16fdb694cf13 swScale internally uses yuv2rgb now if possible
michael
parents: 4467
diff changeset
40 typedef struct SwsContext{
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
41 int srcW, srcH, dstW, dstH;
4467
9512d6832b38 YUY2, BGR24, BGR32 input support (no mmx yet)
michael
parents: 4419
diff changeset
42 int chrSrcW, chrSrcH, chrDstW, chrDstH;
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
43 int lumXInc, chrXInc;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
44 int lumYInc, chrYInc;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
45 int dstFormat, srcFormat;
4290
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
46
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
47 int16_t **lumPixBuf;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
48 int16_t **chrPixBuf;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
49 int16_t *hLumFilter;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
50 int16_t *hLumFilterPos;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
51 int16_t *hChrFilter;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
52 int16_t *hChrFilterPos;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
53 int16_t *vLumFilter;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
54 int16_t *vLumFilterPos;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
55 int16_t *vChrFilter;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
56 int16_t *vChrFilterPos;
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
57
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
58 // Simply contains the values from v(Lum|Chr)Filter, just nicely packed for MMX
4290
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
59 int16_t *lumMmxFilter;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
60 int16_t *chrMmxFilter;
4467
9512d6832b38 YUY2, BGR24, BGR32 input support (no mmx yet)
michael
parents: 4419
diff changeset
61 uint8_t formatConvBuffer[4000]; //FIXME dynamic alloc, but we have to change a lot of code for this to be useful
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
62
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
63 int hLumFilterSize;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
64 int hChrFilterSize;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
65 int vLumFilterSize;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
66 int vChrFilterSize;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
67 int vLumBufSize;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
68 int vChrBufSize;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
69
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
70 uint8_t __attribute__((aligned(32))) funnyYCode[10000];
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
71 uint8_t __attribute__((aligned(32))) funnyUVCode[10000];
5452
eb87391a5292 overread in the mmx2 horizontal scaler fixed
michael
parents: 4554
diff changeset
72 int32_t *lumMmx2FilterPos;
eb87391a5292 overread in the mmx2 horizontal scaler fixed
michael
parents: 4554
diff changeset
73 int32_t *chrMmx2FilterPos;
eb87391a5292 overread in the mmx2 horizontal scaler fixed
michael
parents: 4554
diff changeset
74 int16_t *lumMmx2Filter;
eb87391a5292 overread in the mmx2 horizontal scaler fixed
michael
parents: 4554
diff changeset
75 int16_t *chrMmx2Filter;
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
76
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
77 int canMMX2BeUsed;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
78
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
79 int lastInLumBuf;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
80 int lastInChrBuf;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
81 int lumBufIndex;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
82 int chrBufIndex;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
83 int dstY;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
84 int flags;
4554
16fdb694cf13 swScale internally uses yuv2rgb now if possible
michael
parents: 4467
diff changeset
85
16fdb694cf13 swScale internally uses yuv2rgb now if possible
michael
parents: 4467
diff changeset
86 void (*swScale)(struct SwsContext *context, uint8_t* src[], int srcStride[], int srcSliceY,
16fdb694cf13 swScale internally uses yuv2rgb now if possible
michael
parents: 4467
diff changeset
87 int srcSliceH, uint8_t* dst[], int dstStride[]);
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
88 } SwsContext;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
89 //FIXME check init (where 0)
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
90
4290
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
91 // when used for filters they must have an odd number of elements
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
92 // coeffs cannot be shared between vectors
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
93 typedef struct {
4290
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
94 double *coeff;
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
95 int length;
4290
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
96 } SwsVector;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
97
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
98 // vectors can be shared
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
99 typedef struct {
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
100 SwsVector *lumH;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
101 SwsVector *lumV;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
102 SwsVector *chrH;
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
103 SwsVector *chrV;
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
104 } SwsFilter;
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
105
2217
fd9311c3fa42 header for swscale.c
arpi
parents:
diff changeset
106
2519
6f3fa9bc3b27 yv12 to yv12 scaler
michael
parents: 2217
diff changeset
107 // *** bilinear scaling and yuv->rgb & yuv->yuv conversion of yv12 slices:
2217
fd9311c3fa42 header for swscale.c
arpi
parents:
diff changeset
108 // *** Note: it's called multiple times while decoding a frame, first time y==0
2519
6f3fa9bc3b27 yv12 to yv12 scaler
michael
parents: 2217
diff changeset
109 // dstbpp == 12 -> yv12 output
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
110 // will use sws_flags
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
111 void SwScale_YV12slice(unsigned char* src[],int srcStride[], int srcSliceY,
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
112 int srcSliceH, uint8_t* dst[], int dstStride, int dstbpp,
3209
0b172eb639f1 swscaler cleanup
michael
parents: 2519
diff changeset
113 int srcW, int srcH, int dstW, int dstH);
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
114
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
115 // Obsolete, will be removed soon
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
116 void SwScale_Init();
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
117
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
118
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
119
4290
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
120 void freeSwsContext(SwsContext *swsContext);
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
121
4419
f002407e298d YV12 like formats support (I420/IYUV)
michael
parents: 4402
diff changeset
122 SwsContext *getSwsContextFromCmdLine(int srcW, int srcH, int srcFormat, int dstW, int dstH, int dstFormat);
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
123 SwsContext *getSwsContext(int srcW, int srcH, int srcFormat, int dstW, int dstH, int dstFormat, int flags,
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
124 SwsFilter *srcFilter, SwsFilter *dstFilter);
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
125
4290
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
126 SwsVector *getGaussianVec(double variance, double quality);
4297
29fef3982238 15/16 bit dithering in C (5% slower, can be disabled by comenting #define DITHER1XBPP out)
michael
parents: 4295
diff changeset
127 SwsVector *getConstVec(double c, int length);
4290
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
128 SwsVector *getIdentityVec(void);
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
129 void scaleVec(SwsVector *a, double scalar);
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
130 void normalizeVec(SwsVector *a, double height);
4294
21dbbbbd5479 a few filters (should be removed/merged when arpis videofilter stuff is finished)
michael
parents: 4290
diff changeset
131 void convVec(SwsVector *a, SwsVector *b);
21dbbbbd5479 a few filters (should be removed/merged when arpis videofilter stuff is finished)
michael
parents: 4290
diff changeset
132 void addVec(SwsVector *a, SwsVector *b);
21dbbbbd5479 a few filters (should be removed/merged when arpis videofilter stuff is finished)
michael
parents: 4290
diff changeset
133 void subVec(SwsVector *a, SwsVector *b);
21dbbbbd5479 a few filters (should be removed/merged when arpis videofilter stuff is finished)
michael
parents: 4290
diff changeset
134 void shiftVec(SwsVector *a, int shift);
21dbbbbd5479 a few filters (should be removed/merged when arpis videofilter stuff is finished)
michael
parents: 4290
diff changeset
135 SwsVector *cloneVec(SwsVector *a);
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
136
4290
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
137 void printVec(SwsVector *a);
1f8ceb12284d general convolution filtering of the source picture
michael
parents: 4276
diff changeset
138 void freeVec(SwsVector *a);
4276
9199d15cb4e0 removed global vars so that multiple swscalers can be used
michael
parents: 3344
diff changeset
139