Rename "funny" code to "mmx2 filter" code.
[libav.git] / libswscale / swscale_internal.h
CommitLineData
5427e242 1/*
d026b45e
DB
2 * Copyright (C) 2001-2003 Michael Niedermayer <michaelni@gmx.at>
3 *
4 * This file is part of FFmpeg.
5 *
807e0c66
LA
6 * FFmpeg is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
d026b45e
DB
10 *
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
807e0c66
LA
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
d026b45e 15 *
807e0c66
LA
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with FFmpeg; if not, write to the Free Software
b19bcbaa 18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
d026b45e 19 */
5427e242 20
0eaf5235
SS
21#ifndef SWSCALE_SWSCALE_INTERNAL_H
22#define SWSCALE_SWSCALE_INTERNAL_H
5427e242 23
4706949c
DB
24#include "config.h"
25
b63f641e 26#if HAVE_ALTIVEC_H
f2015f0c
AB
27#include <altivec.h>
28#endif
29
83da2c6f 30#include "libavutil/avutil.h"
94c4def2 31
59ded10c 32#define STR(s) AV_TOSTRING(s) //AV_STRINGIFY is too long
1625216e 33
5427e242
MN
34#define MAX_FILTER_SIZE 256
35
9507d911
MN
36#if ARCH_X86
37#define VOFW 5120
38#else
39#define VOFW 2048 // faster on PPC and not tested on others
40#endif
41
710af50e 42#define VOF (VOFW*2)
8b2fce0d 43
a898cdc9 44#if HAVE_BIGENDIAN
9990e426
MN
45#define ALT32_CORR (-1)
46#else
47#define ALT32_CORR 1
1625216e
MN
48#endif
49
b63f641e 50#if ARCH_X86_64
1625216e
MN
51# define APCK_PTR2 8
52# define APCK_COEF 16
53# define APCK_SIZE 24
54#else
55# define APCK_PTR2 4
56# define APCK_COEF 8
57# define APCK_SIZE 16
9990e426
MN
58#endif
59
1615fb91
DB
60struct SwsContext;
61
457eed72
DB
62typedef int (*SwsFunc)(struct SwsContext *context, uint8_t* src[],
63 int srcStride[], int srcSliceY, int srcSliceH,
64 uint8_t* dst[], int dstStride[]);
5427e242 65
8a322796 66/* This struct should be aligned on at least a 32-byte boundary. */
5427e242 67typedef struct SwsContext{
221b804f
DB
68 /**
69 * info on struct for av_log
70 */
635a8cd2 71 const AVClass *av_class;
221b804f
DB
72
73 /**
56b69633
DB
74 * Note that src, dst, srcStride, dstStride will be copied in the
75 * sws_scale() wrapper so they can be freely modified here.
221b804f
DB
76 */
77 SwsFunc swScale;
78 int srcW, srcH, dstH;
79 int chrSrcW, chrSrcH, chrDstW, chrDstH;
80 int lumXInc, chrXInc;
81 int lumYInc, chrYInc;
58e4b706 82 enum PixelFormat dstFormat, srcFormat; ///< format 4:2:0 type is always YV12
221b804f
DB
83 int origDstFormat, origSrcFormat; ///< format
84 int chrSrcHSubSample, chrSrcVSubSample;
221b804f
DB
85 int chrDstHSubSample, chrDstVSubSample;
86 int vChrDrop;
87 int sliceDir;
88 double param[2];
89
49004617
VS
90 uint32_t pal_yuv[256];
91 uint32_t pal_rgb[256];
92
221b804f
DB
93 int16_t **lumPixBuf;
94 int16_t **chrPixBuf;
6858492e 95 int16_t **alpPixBuf;
221b804f
DB
96 int16_t *hLumFilter;
97 int16_t *hLumFilterPos;
98 int16_t *hChrFilter;
99 int16_t *hChrFilterPos;
100 int16_t *vLumFilter;
101 int16_t *vLumFilterPos;
102 int16_t *vChrFilter;
103 int16_t *vChrFilterPos;
104
8a322796 105 uint8_t formatConvBuffer[VOF]; //FIXME dynamic allocation, but we have to change a lot of code for this to be useful
221b804f
DB
106
107 int hLumFilterSize;
108 int hChrFilterSize;
109 int vLumFilterSize;
110 int vChrFilterSize;
111 int vLumBufSize;
112 int vChrBufSize;
113
bcdedf67
RP
114 uint8_t *lumMmx2FilterCode;
115 uint8_t *chrMmx2FilterCode;
221b804f
DB
116 int32_t *lumMmx2FilterPos;
117 int32_t *chrMmx2FilterPos;
118 int16_t *lumMmx2Filter;
119 int16_t *chrMmx2Filter;
120
121 int canMMX2BeUsed;
122
123 int lastInLumBuf;
124 int lastInChrBuf;
125 int lumBufIndex;
126 int chrBufIndex;
127 int dstY;
128 int flags;
129 void * yuvTable; // pointer to the yuv->rgb table start so it can be freed()
130 uint8_t * table_rV[256];
131 uint8_t * table_gU[256];
132 int table_gV[256];
133 uint8_t * table_bU[256];
134
135 //Colorspace stuff
136 int contrast, brightness, saturation; // for sws_getColorspaceDetails
137 int srcColorspaceTable[4];
138 int dstColorspaceTable[4];
139 int srcRange, dstRange;
43c16478
MN
140 int yuv2rgb_y_offset;
141 int yuv2rgb_y_coeff;
142 int yuv2rgb_v2r_coeff;
143 int yuv2rgb_v2g_coeff;
144 int yuv2rgb_u2g_coeff;
145 int yuv2rgb_u2b_coeff;
221b804f
DB
146
147#define RED_DITHER "0*8"
148#define GREEN_DITHER "1*8"
149#define BLUE_DITHER "2*8"
150#define Y_COEFF "3*8"
151#define VR_COEFF "4*8"
152#define UB_COEFF "5*8"
153#define VG_COEFF "6*8"
154#define UG_COEFF "7*8"
155#define Y_OFFSET "8*8"
156#define U_OFFSET "9*8"
157#define V_OFFSET "10*8"
8bae9ddc
MN
158#define LUM_MMX_FILTER_OFFSET "11*8"
159#define CHR_MMX_FILTER_OFFSET "11*8+4*4*256"
8a322796 160#define DSTW_OFFSET "11*8+4*4*256*2" //do not change, it is hardcoded in the ASM
221b804f
DB
161#define ESP_OFFSET "11*8+4*4*256*2+8"
162#define VROUNDER_OFFSET "11*8+4*4*256*2+16"
163#define U_TEMP "11*8+4*4*256*2+24"
164#define V_TEMP "11*8+4*4*256*2+32"
6858492e
CS
165#define Y_TEMP "11*8+4*4*256*2+40"
166#define ALP_MMX_FILTER_OFFSET "11*8+4*4*256*2+48"
221b804f 167
92db6235
PP
168 DECLARE_ALIGNED(8, uint64_t, redDither);
169 DECLARE_ALIGNED(8, uint64_t, greenDither);
170 DECLARE_ALIGNED(8, uint64_t, blueDither);
171
172 DECLARE_ALIGNED(8, uint64_t, yCoeff);
173 DECLARE_ALIGNED(8, uint64_t, vrCoeff);
174 DECLARE_ALIGNED(8, uint64_t, ubCoeff);
175 DECLARE_ALIGNED(8, uint64_t, vgCoeff);
176 DECLARE_ALIGNED(8, uint64_t, ugCoeff);
177 DECLARE_ALIGNED(8, uint64_t, yOffset);
178 DECLARE_ALIGNED(8, uint64_t, uOffset);
179 DECLARE_ALIGNED(8, uint64_t, vOffset);
221b804f
DB
180 int32_t lumMmxFilter[4*MAX_FILTER_SIZE];
181 int32_t chrMmxFilter[4*MAX_FILTER_SIZE];
182 int dstW;
92db6235
PP
183 DECLARE_ALIGNED(8, uint64_t, esp);
184 DECLARE_ALIGNED(8, uint64_t, vRounder);
185 DECLARE_ALIGNED(8, uint64_t, u_temp);
186 DECLARE_ALIGNED(8, uint64_t, v_temp);
187 DECLARE_ALIGNED(8, uint64_t, y_temp);
6858492e 188 int32_t alpMmxFilter[4*MAX_FILTER_SIZE];
a31de956 189
b63f641e 190#if HAVE_ALTIVEC
a31de956
MN
191 vector signed short CY;
192 vector signed short CRV;
193 vector signed short CBU;
194 vector signed short CGU;
195 vector signed short CGV;
196 vector signed short OY;
197 vector unsigned short CSHIFT;
221b804f 198 vector signed short *vYCoeffsBank, *vCCoeffsBank;
a31de956
MN
199#endif
200
b63f641e 201#if ARCH_BFIN
92db6235
PP
202 DECLARE_ALIGNED(4, uint32_t, oy);
203 DECLARE_ALIGNED(4, uint32_t, oc);
204 DECLARE_ALIGNED(4, uint32_t, zero);
205 DECLARE_ALIGNED(4, uint32_t, cy);
206 DECLARE_ALIGNED(4, uint32_t, crv);
207 DECLARE_ALIGNED(4, uint32_t, rmask);
208 DECLARE_ALIGNED(4, uint32_t, cbu);
209 DECLARE_ALIGNED(4, uint32_t, bmask);
210 DECLARE_ALIGNED(4, uint32_t, cgu);
211 DECLARE_ALIGNED(4, uint32_t, cgv);
212 DECLARE_ALIGNED(4, uint32_t, gmask);
d3f3eea9
MH
213#endif
214
b63f641e 215#if HAVE_VIS
92db6235 216 DECLARE_ALIGNED(8, uint64_t, sparc_coeffs[10]);
90c1d7b4 217#endif
d3f3eea9 218
40fa5140
RP
219 /* function pointers for swScale() */
220 void (*yuv2nv12X )(struct SwsContext *c,
221 const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize,
222 const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize,
223 uint8_t *dest, uint8_t *uDest,
224 int dstW, int chrDstW, int dstFormat);
225 void (*yuv2yuv1 )(struct SwsContext *c,
226 const int16_t *lumSrc, const int16_t *chrSrc, const int16_t *alpSrc,
227 uint8_t *dest,
228 uint8_t *uDest, uint8_t *vDest, uint8_t *aDest,
229 long dstW, long chrDstW);
230 void (*yuv2yuvX )(struct SwsContext *c,
231 const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize,
232 const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize,
233 const int16_t **alpSrc,
234 uint8_t *dest,
235 uint8_t *uDest, uint8_t *vDest, uint8_t *aDest,
236 long dstW, long chrDstW);
237 void (*yuv2packed1)(struct SwsContext *c,
238 const uint16_t *buf0,
239 const uint16_t *uvbuf0, const uint16_t *uvbuf1,
240 const uint16_t *abuf0,
241 uint8_t *dest,
242 int dstW, int uvalpha, int dstFormat, int flags, int y);
243 void (*yuv2packed2)(struct SwsContext *c,
244 const uint16_t *buf0, const uint16_t *buf1,
245 const uint16_t *uvbuf0, const uint16_t *uvbuf1,
246 const uint16_t *abuf0, const uint16_t *abuf1,
247 uint8_t *dest,
248 int dstW, int yalpha, int uvalpha, int y);
249 void (*yuv2packedX)(struct SwsContext *c,
250 const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize,
251 const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize,
252 const int16_t **alpSrc, uint8_t *dest,
253 long dstW, long dstY);
254
255 void (*hyscale_internal)(uint8_t *dst, const uint8_t *src,
256 long width, uint32_t *pal);
39e5f87b
CS
257 void (*hascale_internal)(uint8_t *dst, const uint8_t *src,
258 long width, uint32_t *pal);
40fa5140
RP
259 void (*hcscale_internal)(uint8_t *dstU, uint8_t *dstV,
260 const uint8_t *src1, const uint8_t *src2,
261 long width, uint32_t *pal);
262 void (*hyscale_fast)(struct SwsContext *c,
263 int16_t *dst, int dstWidth,
264 const uint8_t *src, int srcW, int xInc);
265 void (*hcscale_fast)(struct SwsContext *c,
266 int16_t *dst, int dstWidth,
457eed72
DB
267 const uint8_t *src1, const uint8_t *src2,
268 int srcW, int xInc);
40fa5140
RP
269
270 void (*hScale)(int16_t *dst, int dstW, const uint8_t *src, int srcW,
457eed72
DB
271 int xInc, const int16_t *filter, const int16_t *filterPos,
272 long filterSize);
40fa5140 273
5427e242
MN
274} SwsContext;
275//FIXME check init (where 0)
5427e242 276
780daf2b 277SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c);
457eed72
DB
278int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4],
279 int fullRange, int brightness,
280 int contrast, int saturation);
5427e242 281
457eed72
DB
282void ff_yuv2rgb_init_tables_altivec(SwsContext *c, const int inv_table[4],
283 int brightness, int contrast, int saturation);
befa8e66
RP
284SwsFunc ff_yuv2rgb_init_mmx(SwsContext *c);
285SwsFunc ff_yuv2rgb_init_vis(SwsContext *c);
286SwsFunc ff_yuv2rgb_init_mlib(SwsContext *c);
780daf2b 287SwsFunc ff_yuv2rgb_init_altivec(SwsContext *c);
befa8e66 288SwsFunc ff_yuv2rgb_get_func_ptr_bfin(SwsContext *c);
d5e9bc06 289void ff_bfin_get_unscaled_swscale(SwsContext *c);
780daf2b 290void ff_yuv2packedX_altivec(SwsContext *c,
f1933e43
DB
291 const int16_t *lumFilter, int16_t **lumSrc, int lumFilterSize,
292 const int16_t *chrFilter, int16_t **chrSrc, int chrFilterSize,
457eed72 293 uint8_t *dest, int dstW, int dstY);
c95a3a9f 294
b4b91702 295const char *sws_format_name(enum PixelFormat format);
94c4def2 296
e9e12f0e 297//FIXME replace this with something faster
714f32bf
MN
298#define is16BPS(x) ( \
299 (x)==PIX_FMT_GRAY16BE \
300 || (x)==PIX_FMT_GRAY16LE \
5b21719e
KS
301 || (x)==PIX_FMT_RGB48BE \
302 || (x)==PIX_FMT_RGB48LE \
de1275d5
MN
303 || (x)==PIX_FMT_YUV420PLE \
304 || (x)==PIX_FMT_YUV422PLE \
305 || (x)==PIX_FMT_YUV444PLE \
306 || (x)==PIX_FMT_YUV420PBE \
307 || (x)==PIX_FMT_YUV422PBE \
308 || (x)==PIX_FMT_YUV444PBE \
714f32bf 309 )
c3dc6c5a 310#define isBE(x) ((x)&1)
de1275d5 311#define isPlanar8YUV(x) ( \
9d9de37d
IP
312 (x)==PIX_FMT_YUV410P \
313 || (x)==PIX_FMT_YUV420P \
9621f2f5 314 || (x)==PIX_FMT_YUVA420P \
9d9de37d
IP
315 || (x)==PIX_FMT_YUV411P \
316 || (x)==PIX_FMT_YUV422P \
317 || (x)==PIX_FMT_YUV444P \
9ba7fe6d 318 || (x)==PIX_FMT_YUV440P \
9d9de37d
IP
319 || (x)==PIX_FMT_NV12 \
320 || (x)==PIX_FMT_NV21 \
321 )
de1275d5
MN
322#define isPlanarYUV(x) ( \
323 isPlanar8YUV(x) \
324 || (x)==PIX_FMT_YUV420PLE \
325 || (x)==PIX_FMT_YUV422PLE \
326 || (x)==PIX_FMT_YUV444PLE \
327 || (x)==PIX_FMT_YUV420PBE \
328 || (x)==PIX_FMT_YUV422PBE \
329 || (x)==PIX_FMT_YUV444PBE \
330 )
9d9de37d
IP
331#define isYUV(x) ( \
332 (x)==PIX_FMT_UYVY422 \
333 || (x)==PIX_FMT_YUYV422 \
334 || isPlanarYUV(x) \
335 )
336#define isGray(x) ( \
337 (x)==PIX_FMT_GRAY8 \
338 || (x)==PIX_FMT_GRAY16BE \
339 || (x)==PIX_FMT_GRAY16LE \
340 )
341#define isGray16(x) ( \
342 (x)==PIX_FMT_GRAY16BE \
343 || (x)==PIX_FMT_GRAY16LE \
344 )
345#define isRGB(x) ( \
e8417235
KS
346 (x)==PIX_FMT_RGB48BE \
347 || (x)==PIX_FMT_RGB48LE \
348 || (x)==PIX_FMT_RGB32 \
9990e426 349 || (x)==PIX_FMT_RGB32_1 \
9d9de37d
IP
350 || (x)==PIX_FMT_RGB24 \
351 || (x)==PIX_FMT_RGB565 \
352 || (x)==PIX_FMT_RGB555 \
353 || (x)==PIX_FMT_RGB8 \
354 || (x)==PIX_FMT_RGB4 \
355 || (x)==PIX_FMT_RGB4_BYTE \
356 || (x)==PIX_FMT_MONOBLACK \
ec1bca2a 357 || (x)==PIX_FMT_MONOWHITE \
9d9de37d
IP
358 )
359#define isBGR(x) ( \
d52337af 360 (x)==PIX_FMT_BGR32 \
9990e426 361 || (x)==PIX_FMT_BGR32_1 \
9d9de37d
IP
362 || (x)==PIX_FMT_BGR24 \
363 || (x)==PIX_FMT_BGR565 \
364 || (x)==PIX_FMT_BGR555 \
365 || (x)==PIX_FMT_BGR8 \
366 || (x)==PIX_FMT_BGR4 \
367 || (x)==PIX_FMT_BGR4_BYTE \
368 || (x)==PIX_FMT_MONOBLACK \
ec1bca2a 369 || (x)==PIX_FMT_MONOWHITE \
9d9de37d 370 )
c2751600
CS
371#define isALPHA(x) ( \
372 (x)==PIX_FMT_BGR32 \
373 || (x)==PIX_FMT_BGR32_1 \
374 || (x)==PIX_FMT_RGB32 \
375 || (x)==PIX_FMT_RGB32_1 \
376 || (x)==PIX_FMT_YUVA420P \
377 )
e9e12f0e
LA
378
379static inline int fmt_depth(int fmt)
380{
381 switch(fmt) {
075ec82c
KS
382 case PIX_FMT_RGB48BE:
383 case PIX_FMT_RGB48LE:
384 return 48;
e9e12f0e
LA
385 case PIX_FMT_BGRA:
386 case PIX_FMT_ABGR:
387 case PIX_FMT_RGBA:
388 case PIX_FMT_ARGB:
389 return 32;
390 case PIX_FMT_BGR24:
391 case PIX_FMT_RGB24:
392 return 24;
393 case PIX_FMT_BGR565:
394 case PIX_FMT_RGB565:
4884b9e5
KS
395 case PIX_FMT_GRAY16BE:
396 case PIX_FMT_GRAY16LE:
e9e12f0e
LA
397 return 16;
398 case PIX_FMT_BGR555:
399 case PIX_FMT_RGB555:
400 return 15;
401 case PIX_FMT_BGR8:
402 case PIX_FMT_RGB8:
403 return 8;
404 case PIX_FMT_BGR4:
405 case PIX_FMT_RGB4:
406 case PIX_FMT_BGR4_BYTE:
407 case PIX_FMT_RGB4_BYTE:
408 return 4;
409 case PIX_FMT_MONOBLACK:
ec1bca2a 410 case PIX_FMT_MONOWHITE:
e9e12f0e
LA
411 return 1;
412 default:
413 return 0;
414 }
415}
416
43175f50
DB
417extern const uint64_t ff_dither4[2];
418extern const uint64_t ff_dither8[2];
0cb25594 419
e40b183d
LB
420extern const AVClass sws_context_class;
421
0eaf5235 422#endif /* SWSCALE_SWSCALE_INTERNAL_H */