Commit | Line | Data |
---|---|---|
5427e242 | 1 | /* |
d026b45e DB |
2 | * Copyright (C) 2001-2003 Michael Niedermayer <michaelni@gmx.at> |
3 | * | |
4 | * This file is part of FFmpeg. | |
5 | * | |
807e0c66 LA |
6 | * FFmpeg is free software; you can redistribute it and/or |
7 | * modify it under the terms of the GNU Lesser General Public | |
8 | * License as published by the Free Software Foundation; either | |
9 | * version 2.1 of the License, or (at your option) any later version. | |
d026b45e DB |
10 | * |
11 | * FFmpeg is distributed in the hope that it will be useful, | |
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
807e0c66 LA |
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
14 | * Lesser General Public License for more details. | |
d026b45e | 15 | * |
807e0c66 LA |
16 | * You should have received a copy of the GNU Lesser General Public |
17 | * License along with FFmpeg; if not, write to the Free Software | |
b19bcbaa | 18 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
d026b45e | 19 | */ |
5427e242 | 20 | |
0eaf5235 SS |
21 | #ifndef SWSCALE_SWSCALE_INTERNAL_H |
22 | #define SWSCALE_SWSCALE_INTERNAL_H | |
5427e242 | 23 | |
4706949c DB |
24 | #include "config.h" |
25 | ||
b63f641e | 26 | #if HAVE_ALTIVEC_H |
f2015f0c AB |
27 | #include <altivec.h> |
28 | #endif | |
29 | ||
83da2c6f | 30 | #include "libavutil/avutil.h" |
94c4def2 | 31 | |
59ded10c | 32 | #define STR(s) AV_TOSTRING(s) //AV_STRINGIFY is too long |
1625216e | 33 | |
5427e242 MN |
34 | #define MAX_FILTER_SIZE 256 |
35 | ||
9507d911 MN |
36 | #if ARCH_X86 |
37 | #define VOFW 5120 | |
38 | #else | |
39 | #define VOFW 2048 // faster on PPC and not tested on others | |
40 | #endif | |
41 | ||
710af50e | 42 | #define VOF (VOFW*2) |
8b2fce0d | 43 | |
a898cdc9 | 44 | #if HAVE_BIGENDIAN |
9990e426 MN |
45 | #define ALT32_CORR (-1) |
46 | #else | |
47 | #define ALT32_CORR 1 | |
1625216e MN |
48 | #endif |
49 | ||
b63f641e | 50 | #if ARCH_X86_64 |
1625216e MN |
51 | # define APCK_PTR2 8 |
52 | # define APCK_COEF 16 | |
53 | # define APCK_SIZE 24 | |
54 | #else | |
55 | # define APCK_PTR2 4 | |
56 | # define APCK_COEF 8 | |
57 | # define APCK_SIZE 16 | |
9990e426 MN |
58 | #endif |
59 | ||
1615fb91 DB |
60 | struct SwsContext; |
61 | ||
457eed72 DB |
62 | typedef int (*SwsFunc)(struct SwsContext *context, uint8_t* src[], |
63 | int srcStride[], int srcSliceY, int srcSliceH, | |
64 | uint8_t* dst[], int dstStride[]); | |
5427e242 | 65 | |
8a322796 | 66 | /* This struct should be aligned on at least a 32-byte boundary. */ |
5427e242 | 67 | typedef struct SwsContext{ |
221b804f DB |
68 | /** |
69 | * info on struct for av_log | |
70 | */ | |
635a8cd2 | 71 | const AVClass *av_class; |
221b804f DB |
72 | |
73 | /** | |
56b69633 DB |
74 | * Note that src, dst, srcStride, dstStride will be copied in the |
75 | * sws_scale() wrapper so they can be freely modified here. | |
221b804f DB |
76 | */ |
77 | SwsFunc swScale; | |
78 | int srcW, srcH, dstH; | |
79 | int chrSrcW, chrSrcH, chrDstW, chrDstH; | |
80 | int lumXInc, chrXInc; | |
81 | int lumYInc, chrYInc; | |
58e4b706 | 82 | enum PixelFormat dstFormat, srcFormat; ///< format 4:2:0 type is always YV12 |
221b804f DB |
83 | int origDstFormat, origSrcFormat; ///< format |
84 | int chrSrcHSubSample, chrSrcVSubSample; | |
221b804f DB |
85 | int chrDstHSubSample, chrDstVSubSample; |
86 | int vChrDrop; | |
87 | int sliceDir; | |
88 | double param[2]; | |
89 | ||
49004617 VS |
90 | uint32_t pal_yuv[256]; |
91 | uint32_t pal_rgb[256]; | |
92 | ||
221b804f DB |
93 | int16_t **lumPixBuf; |
94 | int16_t **chrPixBuf; | |
6858492e | 95 | int16_t **alpPixBuf; |
221b804f DB |
96 | int16_t *hLumFilter; |
97 | int16_t *hLumFilterPos; | |
98 | int16_t *hChrFilter; | |
99 | int16_t *hChrFilterPos; | |
100 | int16_t *vLumFilter; | |
101 | int16_t *vLumFilterPos; | |
102 | int16_t *vChrFilter; | |
103 | int16_t *vChrFilterPos; | |
104 | ||
8a322796 | 105 | uint8_t formatConvBuffer[VOF]; //FIXME dynamic allocation, but we have to change a lot of code for this to be useful |
221b804f DB |
106 | |
107 | int hLumFilterSize; | |
108 | int hChrFilterSize; | |
109 | int vLumFilterSize; | |
110 | int vChrFilterSize; | |
111 | int vLumBufSize; | |
112 | int vChrBufSize; | |
113 | ||
bcdedf67 RP |
114 | uint8_t *lumMmx2FilterCode; |
115 | uint8_t *chrMmx2FilterCode; | |
221b804f DB |
116 | int32_t *lumMmx2FilterPos; |
117 | int32_t *chrMmx2FilterPos; | |
118 | int16_t *lumMmx2Filter; | |
119 | int16_t *chrMmx2Filter; | |
120 | ||
121 | int canMMX2BeUsed; | |
122 | ||
123 | int lastInLumBuf; | |
124 | int lastInChrBuf; | |
125 | int lumBufIndex; | |
126 | int chrBufIndex; | |
127 | int dstY; | |
128 | int flags; | |
129 | void * yuvTable; // pointer to the yuv->rgb table start so it can be freed() | |
130 | uint8_t * table_rV[256]; | |
131 | uint8_t * table_gU[256]; | |
132 | int table_gV[256]; | |
133 | uint8_t * table_bU[256]; | |
134 | ||
135 | //Colorspace stuff | |
136 | int contrast, brightness, saturation; // for sws_getColorspaceDetails | |
137 | int srcColorspaceTable[4]; | |
138 | int dstColorspaceTable[4]; | |
139 | int srcRange, dstRange; | |
43c16478 MN |
140 | int yuv2rgb_y_offset; |
141 | int yuv2rgb_y_coeff; | |
142 | int yuv2rgb_v2r_coeff; | |
143 | int yuv2rgb_v2g_coeff; | |
144 | int yuv2rgb_u2g_coeff; | |
145 | int yuv2rgb_u2b_coeff; | |
221b804f DB |
146 | |
147 | #define RED_DITHER "0*8" | |
148 | #define GREEN_DITHER "1*8" | |
149 | #define BLUE_DITHER "2*8" | |
150 | #define Y_COEFF "3*8" | |
151 | #define VR_COEFF "4*8" | |
152 | #define UB_COEFF "5*8" | |
153 | #define VG_COEFF "6*8" | |
154 | #define UG_COEFF "7*8" | |
155 | #define Y_OFFSET "8*8" | |
156 | #define U_OFFSET "9*8" | |
157 | #define V_OFFSET "10*8" | |
8bae9ddc MN |
158 | #define LUM_MMX_FILTER_OFFSET "11*8" |
159 | #define CHR_MMX_FILTER_OFFSET "11*8+4*4*256" | |
8a322796 | 160 | #define DSTW_OFFSET "11*8+4*4*256*2" //do not change, it is hardcoded in the ASM |
221b804f DB |
161 | #define ESP_OFFSET "11*8+4*4*256*2+8" |
162 | #define VROUNDER_OFFSET "11*8+4*4*256*2+16" | |
163 | #define U_TEMP "11*8+4*4*256*2+24" | |
164 | #define V_TEMP "11*8+4*4*256*2+32" | |
6858492e CS |
165 | #define Y_TEMP "11*8+4*4*256*2+40" |
166 | #define ALP_MMX_FILTER_OFFSET "11*8+4*4*256*2+48" | |
221b804f | 167 | |
92db6235 PP |
168 | DECLARE_ALIGNED(8, uint64_t, redDither); |
169 | DECLARE_ALIGNED(8, uint64_t, greenDither); | |
170 | DECLARE_ALIGNED(8, uint64_t, blueDither); | |
171 | ||
172 | DECLARE_ALIGNED(8, uint64_t, yCoeff); | |
173 | DECLARE_ALIGNED(8, uint64_t, vrCoeff); | |
174 | DECLARE_ALIGNED(8, uint64_t, ubCoeff); | |
175 | DECLARE_ALIGNED(8, uint64_t, vgCoeff); | |
176 | DECLARE_ALIGNED(8, uint64_t, ugCoeff); | |
177 | DECLARE_ALIGNED(8, uint64_t, yOffset); | |
178 | DECLARE_ALIGNED(8, uint64_t, uOffset); | |
179 | DECLARE_ALIGNED(8, uint64_t, vOffset); | |
221b804f DB |
180 | int32_t lumMmxFilter[4*MAX_FILTER_SIZE]; |
181 | int32_t chrMmxFilter[4*MAX_FILTER_SIZE]; | |
182 | int dstW; | |
92db6235 PP |
183 | DECLARE_ALIGNED(8, uint64_t, esp); |
184 | DECLARE_ALIGNED(8, uint64_t, vRounder); | |
185 | DECLARE_ALIGNED(8, uint64_t, u_temp); | |
186 | DECLARE_ALIGNED(8, uint64_t, v_temp); | |
187 | DECLARE_ALIGNED(8, uint64_t, y_temp); | |
6858492e | 188 | int32_t alpMmxFilter[4*MAX_FILTER_SIZE]; |
a31de956 | 189 | |
b63f641e | 190 | #if HAVE_ALTIVEC |
a31de956 MN |
191 | vector signed short CY; |
192 | vector signed short CRV; | |
193 | vector signed short CBU; | |
194 | vector signed short CGU; | |
195 | vector signed short CGV; | |
196 | vector signed short OY; | |
197 | vector unsigned short CSHIFT; | |
221b804f | 198 | vector signed short *vYCoeffsBank, *vCCoeffsBank; |
a31de956 MN |
199 | #endif |
200 | ||
b63f641e | 201 | #if ARCH_BFIN |
92db6235 PP |
202 | DECLARE_ALIGNED(4, uint32_t, oy); |
203 | DECLARE_ALIGNED(4, uint32_t, oc); | |
204 | DECLARE_ALIGNED(4, uint32_t, zero); | |
205 | DECLARE_ALIGNED(4, uint32_t, cy); | |
206 | DECLARE_ALIGNED(4, uint32_t, crv); | |
207 | DECLARE_ALIGNED(4, uint32_t, rmask); | |
208 | DECLARE_ALIGNED(4, uint32_t, cbu); | |
209 | DECLARE_ALIGNED(4, uint32_t, bmask); | |
210 | DECLARE_ALIGNED(4, uint32_t, cgu); | |
211 | DECLARE_ALIGNED(4, uint32_t, cgv); | |
212 | DECLARE_ALIGNED(4, uint32_t, gmask); | |
d3f3eea9 MH |
213 | #endif |
214 | ||
b63f641e | 215 | #if HAVE_VIS |
92db6235 | 216 | DECLARE_ALIGNED(8, uint64_t, sparc_coeffs[10]); |
90c1d7b4 | 217 | #endif |
d3f3eea9 | 218 | |
40fa5140 RP |
219 | /* function pointers for swScale() */ |
220 | void (*yuv2nv12X )(struct SwsContext *c, | |
221 | const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, | |
222 | const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize, | |
223 | uint8_t *dest, uint8_t *uDest, | |
224 | int dstW, int chrDstW, int dstFormat); | |
225 | void (*yuv2yuv1 )(struct SwsContext *c, | |
226 | const int16_t *lumSrc, const int16_t *chrSrc, const int16_t *alpSrc, | |
227 | uint8_t *dest, | |
228 | uint8_t *uDest, uint8_t *vDest, uint8_t *aDest, | |
229 | long dstW, long chrDstW); | |
230 | void (*yuv2yuvX )(struct SwsContext *c, | |
231 | const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, | |
232 | const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize, | |
233 | const int16_t **alpSrc, | |
234 | uint8_t *dest, | |
235 | uint8_t *uDest, uint8_t *vDest, uint8_t *aDest, | |
236 | long dstW, long chrDstW); | |
237 | void (*yuv2packed1)(struct SwsContext *c, | |
238 | const uint16_t *buf0, | |
239 | const uint16_t *uvbuf0, const uint16_t *uvbuf1, | |
240 | const uint16_t *abuf0, | |
241 | uint8_t *dest, | |
242 | int dstW, int uvalpha, int dstFormat, int flags, int y); | |
243 | void (*yuv2packed2)(struct SwsContext *c, | |
244 | const uint16_t *buf0, const uint16_t *buf1, | |
245 | const uint16_t *uvbuf0, const uint16_t *uvbuf1, | |
246 | const uint16_t *abuf0, const uint16_t *abuf1, | |
247 | uint8_t *dest, | |
248 | int dstW, int yalpha, int uvalpha, int y); | |
249 | void (*yuv2packedX)(struct SwsContext *c, | |
250 | const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, | |
251 | const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize, | |
252 | const int16_t **alpSrc, uint8_t *dest, | |
253 | long dstW, long dstY); | |
254 | ||
255 | void (*hyscale_internal)(uint8_t *dst, const uint8_t *src, | |
256 | long width, uint32_t *pal); | |
39e5f87b CS |
257 | void (*hascale_internal)(uint8_t *dst, const uint8_t *src, |
258 | long width, uint32_t *pal); | |
40fa5140 RP |
259 | void (*hcscale_internal)(uint8_t *dstU, uint8_t *dstV, |
260 | const uint8_t *src1, const uint8_t *src2, | |
261 | long width, uint32_t *pal); | |
262 | void (*hyscale_fast)(struct SwsContext *c, | |
263 | int16_t *dst, int dstWidth, | |
264 | const uint8_t *src, int srcW, int xInc); | |
265 | void (*hcscale_fast)(struct SwsContext *c, | |
266 | int16_t *dst, int dstWidth, | |
457eed72 DB |
267 | const uint8_t *src1, const uint8_t *src2, |
268 | int srcW, int xInc); | |
40fa5140 RP |
269 | |
270 | void (*hScale)(int16_t *dst, int dstW, const uint8_t *src, int srcW, | |
457eed72 DB |
271 | int xInc, const int16_t *filter, const int16_t *filterPos, |
272 | long filterSize); | |
40fa5140 | 273 | |
5427e242 MN |
274 | } SwsContext; |
275 | //FIXME check init (where 0) | |
5427e242 | 276 | |
780daf2b | 277 | SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c); |
457eed72 DB |
278 | int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4], |
279 | int fullRange, int brightness, | |
280 | int contrast, int saturation); | |
5427e242 | 281 | |
457eed72 DB |
282 | void ff_yuv2rgb_init_tables_altivec(SwsContext *c, const int inv_table[4], |
283 | int brightness, int contrast, int saturation); | |
befa8e66 RP |
284 | SwsFunc ff_yuv2rgb_init_mmx(SwsContext *c); |
285 | SwsFunc ff_yuv2rgb_init_vis(SwsContext *c); | |
286 | SwsFunc ff_yuv2rgb_init_mlib(SwsContext *c); | |
780daf2b | 287 | SwsFunc ff_yuv2rgb_init_altivec(SwsContext *c); |
befa8e66 | 288 | SwsFunc ff_yuv2rgb_get_func_ptr_bfin(SwsContext *c); |
d5e9bc06 | 289 | void ff_bfin_get_unscaled_swscale(SwsContext *c); |
780daf2b | 290 | void ff_yuv2packedX_altivec(SwsContext *c, |
f1933e43 DB |
291 | const int16_t *lumFilter, int16_t **lumSrc, int lumFilterSize, |
292 | const int16_t *chrFilter, int16_t **chrSrc, int chrFilterSize, | |
457eed72 | 293 | uint8_t *dest, int dstW, int dstY); |
c95a3a9f | 294 | |
b4b91702 | 295 | const char *sws_format_name(enum PixelFormat format); |
94c4def2 | 296 | |
e9e12f0e | 297 | //FIXME replace this with something faster |
714f32bf MN |
298 | #define is16BPS(x) ( \ |
299 | (x)==PIX_FMT_GRAY16BE \ | |
300 | || (x)==PIX_FMT_GRAY16LE \ | |
5b21719e KS |
301 | || (x)==PIX_FMT_RGB48BE \ |
302 | || (x)==PIX_FMT_RGB48LE \ | |
de1275d5 MN |
303 | || (x)==PIX_FMT_YUV420PLE \ |
304 | || (x)==PIX_FMT_YUV422PLE \ | |
305 | || (x)==PIX_FMT_YUV444PLE \ | |
306 | || (x)==PIX_FMT_YUV420PBE \ | |
307 | || (x)==PIX_FMT_YUV422PBE \ | |
308 | || (x)==PIX_FMT_YUV444PBE \ | |
714f32bf | 309 | ) |
c3dc6c5a | 310 | #define isBE(x) ((x)&1) |
de1275d5 | 311 | #define isPlanar8YUV(x) ( \ |
9d9de37d IP |
312 | (x)==PIX_FMT_YUV410P \ |
313 | || (x)==PIX_FMT_YUV420P \ | |
9621f2f5 | 314 | || (x)==PIX_FMT_YUVA420P \ |
9d9de37d IP |
315 | || (x)==PIX_FMT_YUV411P \ |
316 | || (x)==PIX_FMT_YUV422P \ | |
317 | || (x)==PIX_FMT_YUV444P \ | |
9ba7fe6d | 318 | || (x)==PIX_FMT_YUV440P \ |
9d9de37d IP |
319 | || (x)==PIX_FMT_NV12 \ |
320 | || (x)==PIX_FMT_NV21 \ | |
321 | ) | |
de1275d5 MN |
322 | #define isPlanarYUV(x) ( \ |
323 | isPlanar8YUV(x) \ | |
324 | || (x)==PIX_FMT_YUV420PLE \ | |
325 | || (x)==PIX_FMT_YUV422PLE \ | |
326 | || (x)==PIX_FMT_YUV444PLE \ | |
327 | || (x)==PIX_FMT_YUV420PBE \ | |
328 | || (x)==PIX_FMT_YUV422PBE \ | |
329 | || (x)==PIX_FMT_YUV444PBE \ | |
330 | ) | |
9d9de37d IP |
331 | #define isYUV(x) ( \ |
332 | (x)==PIX_FMT_UYVY422 \ | |
333 | || (x)==PIX_FMT_YUYV422 \ | |
334 | || isPlanarYUV(x) \ | |
335 | ) | |
336 | #define isGray(x) ( \ | |
337 | (x)==PIX_FMT_GRAY8 \ | |
338 | || (x)==PIX_FMT_GRAY16BE \ | |
339 | || (x)==PIX_FMT_GRAY16LE \ | |
340 | ) | |
341 | #define isGray16(x) ( \ | |
342 | (x)==PIX_FMT_GRAY16BE \ | |
343 | || (x)==PIX_FMT_GRAY16LE \ | |
344 | ) | |
345 | #define isRGB(x) ( \ | |
e8417235 KS |
346 | (x)==PIX_FMT_RGB48BE \ |
347 | || (x)==PIX_FMT_RGB48LE \ | |
348 | || (x)==PIX_FMT_RGB32 \ | |
9990e426 | 349 | || (x)==PIX_FMT_RGB32_1 \ |
9d9de37d IP |
350 | || (x)==PIX_FMT_RGB24 \ |
351 | || (x)==PIX_FMT_RGB565 \ | |
352 | || (x)==PIX_FMT_RGB555 \ | |
353 | || (x)==PIX_FMT_RGB8 \ | |
354 | || (x)==PIX_FMT_RGB4 \ | |
355 | || (x)==PIX_FMT_RGB4_BYTE \ | |
356 | || (x)==PIX_FMT_MONOBLACK \ | |
ec1bca2a | 357 | || (x)==PIX_FMT_MONOWHITE \ |
9d9de37d IP |
358 | ) |
359 | #define isBGR(x) ( \ | |
d52337af | 360 | (x)==PIX_FMT_BGR32 \ |
9990e426 | 361 | || (x)==PIX_FMT_BGR32_1 \ |
9d9de37d IP |
362 | || (x)==PIX_FMT_BGR24 \ |
363 | || (x)==PIX_FMT_BGR565 \ | |
364 | || (x)==PIX_FMT_BGR555 \ | |
365 | || (x)==PIX_FMT_BGR8 \ | |
366 | || (x)==PIX_FMT_BGR4 \ | |
367 | || (x)==PIX_FMT_BGR4_BYTE \ | |
368 | || (x)==PIX_FMT_MONOBLACK \ | |
ec1bca2a | 369 | || (x)==PIX_FMT_MONOWHITE \ |
9d9de37d | 370 | ) |
c2751600 CS |
371 | #define isALPHA(x) ( \ |
372 | (x)==PIX_FMT_BGR32 \ | |
373 | || (x)==PIX_FMT_BGR32_1 \ | |
374 | || (x)==PIX_FMT_RGB32 \ | |
375 | || (x)==PIX_FMT_RGB32_1 \ | |
376 | || (x)==PIX_FMT_YUVA420P \ | |
377 | ) | |
e9e12f0e LA |
378 | |
379 | static inline int fmt_depth(int fmt) | |
380 | { | |
381 | switch(fmt) { | |
075ec82c KS |
382 | case PIX_FMT_RGB48BE: |
383 | case PIX_FMT_RGB48LE: | |
384 | return 48; | |
e9e12f0e LA |
385 | case PIX_FMT_BGRA: |
386 | case PIX_FMT_ABGR: | |
387 | case PIX_FMT_RGBA: | |
388 | case PIX_FMT_ARGB: | |
389 | return 32; | |
390 | case PIX_FMT_BGR24: | |
391 | case PIX_FMT_RGB24: | |
392 | return 24; | |
393 | case PIX_FMT_BGR565: | |
394 | case PIX_FMT_RGB565: | |
4884b9e5 KS |
395 | case PIX_FMT_GRAY16BE: |
396 | case PIX_FMT_GRAY16LE: | |
e9e12f0e LA |
397 | return 16; |
398 | case PIX_FMT_BGR555: | |
399 | case PIX_FMT_RGB555: | |
400 | return 15; | |
401 | case PIX_FMT_BGR8: | |
402 | case PIX_FMT_RGB8: | |
403 | return 8; | |
404 | case PIX_FMT_BGR4: | |
405 | case PIX_FMT_RGB4: | |
406 | case PIX_FMT_BGR4_BYTE: | |
407 | case PIX_FMT_RGB4_BYTE: | |
408 | return 4; | |
409 | case PIX_FMT_MONOBLACK: | |
ec1bca2a | 410 | case PIX_FMT_MONOWHITE: |
e9e12f0e LA |
411 | return 1; |
412 | default: | |
413 | return 0; | |
414 | } | |
415 | } | |
416 | ||
43175f50 DB |
417 | extern const uint64_t ff_dither4[2]; |
418 | extern const uint64_t ff_dither8[2]; | |
0cb25594 | 419 | |
e40b183d LB |
420 | extern const AVClass sws_context_class; |
421 | ||
0eaf5235 | 422 | #endif /* SWSCALE_SWSCALE_INTERNAL_H */ |