Commit | Line | Data |
---|---|---|
5427e242 | 1 | /* |
d026b45e DB |
2 | * Copyright (C) 2001-2003 Michael Niedermayer <michaelni@gmx.at> |
3 | * | |
4 | * This file is part of FFmpeg. | |
5 | * | |
807e0c66 LA |
6 | * FFmpeg is free software; you can redistribute it and/or |
7 | * modify it under the terms of the GNU Lesser General Public | |
8 | * License as published by the Free Software Foundation; either | |
9 | * version 2.1 of the License, or (at your option) any later version. | |
d026b45e DB |
10 | * |
11 | * FFmpeg is distributed in the hope that it will be useful, | |
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
807e0c66 LA |
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
14 | * Lesser General Public License for more details. | |
d026b45e | 15 | * |
807e0c66 LA |
16 | * You should have received a copy of the GNU Lesser General Public |
17 | * License along with FFmpeg; if not, write to the Free Software | |
b19bcbaa | 18 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
d026b45e | 19 | */ |
5427e242 | 20 | |
0eaf5235 SS |
21 | #ifndef SWSCALE_SWSCALE_INTERNAL_H |
22 | #define SWSCALE_SWSCALE_INTERNAL_H | |
5427e242 | 23 | |
4706949c DB |
24 | #include "config.h" |
25 | ||
b63f641e | 26 | #if HAVE_ALTIVEC_H |
f2015f0c AB |
27 | #include <altivec.h> |
28 | #endif | |
29 | ||
83da2c6f | 30 | #include "libavutil/avutil.h" |
94c4def2 | 31 | |
59ded10c | 32 | #define STR(s) AV_TOSTRING(s) //AV_STRINGIFY is too long |
1625216e | 33 | |
5427e242 MN |
34 | #define MAX_FILTER_SIZE 256 |
35 | ||
9507d911 MN |
36 | #if ARCH_X86 |
37 | #define VOFW 5120 | |
38 | #else | |
39 | #define VOFW 2048 // faster on PPC and not tested on others | |
40 | #endif | |
41 | ||
710af50e | 42 | #define VOF (VOFW*2) |
8b2fce0d | 43 | |
9990e426 MN |
44 | #ifdef WORDS_BIGENDIAN |
45 | #define ALT32_CORR (-1) | |
46 | #else | |
47 | #define ALT32_CORR 1 | |
1625216e MN |
48 | #endif |
49 | ||
b63f641e | 50 | #if ARCH_X86_64 |
1625216e MN |
51 | # define APCK_PTR2 8 |
52 | # define APCK_COEF 16 | |
53 | # define APCK_SIZE 24 | |
54 | #else | |
55 | # define APCK_PTR2 4 | |
56 | # define APCK_COEF 8 | |
57 | # define APCK_SIZE 16 | |
9990e426 MN |
58 | #endif |
59 | ||
1615fb91 DB |
60 | struct SwsContext; |
61 | ||
457eed72 DB |
62 | typedef int (*SwsFunc)(struct SwsContext *context, uint8_t* src[], |
63 | int srcStride[], int srcSliceY, int srcSliceH, | |
64 | uint8_t* dst[], int dstStride[]); | |
5427e242 | 65 | |
8a322796 | 66 | /* This struct should be aligned on at least a 32-byte boundary. */ |
5427e242 | 67 | typedef struct SwsContext{ |
221b804f DB |
68 | /** |
69 | * info on struct for av_log | |
70 | */ | |
635a8cd2 | 71 | const AVClass *av_class; |
221b804f DB |
72 | |
73 | /** | |
56b69633 DB |
74 | * Note that src, dst, srcStride, dstStride will be copied in the |
75 | * sws_scale() wrapper so they can be freely modified here. | |
221b804f DB |
76 | */ |
77 | SwsFunc swScale; | |
78 | int srcW, srcH, dstH; | |
79 | int chrSrcW, chrSrcH, chrDstW, chrDstH; | |
80 | int lumXInc, chrXInc; | |
81 | int lumYInc, chrYInc; | |
58e4b706 | 82 | enum PixelFormat dstFormat, srcFormat; ///< format 4:2:0 type is always YV12 |
221b804f DB |
83 | int origDstFormat, origSrcFormat; ///< format |
84 | int chrSrcHSubSample, chrSrcVSubSample; | |
85 | int chrIntHSubSample, chrIntVSubSample; | |
86 | int chrDstHSubSample, chrDstVSubSample; | |
87 | int vChrDrop; | |
88 | int sliceDir; | |
89 | double param[2]; | |
90 | ||
49004617 VS |
91 | uint32_t pal_yuv[256]; |
92 | uint32_t pal_rgb[256]; | |
93 | ||
221b804f DB |
94 | int16_t **lumPixBuf; |
95 | int16_t **chrPixBuf; | |
6858492e | 96 | int16_t **alpPixBuf; |
221b804f DB |
97 | int16_t *hLumFilter; |
98 | int16_t *hLumFilterPos; | |
99 | int16_t *hChrFilter; | |
100 | int16_t *hChrFilterPos; | |
101 | int16_t *vLumFilter; | |
102 | int16_t *vLumFilterPos; | |
103 | int16_t *vChrFilter; | |
104 | int16_t *vChrFilterPos; | |
105 | ||
8a322796 | 106 | uint8_t formatConvBuffer[VOF]; //FIXME dynamic allocation, but we have to change a lot of code for this to be useful |
221b804f DB |
107 | |
108 | int hLumFilterSize; | |
109 | int hChrFilterSize; | |
110 | int vLumFilterSize; | |
111 | int vChrFilterSize; | |
112 | int vLumBufSize; | |
113 | int vChrBufSize; | |
114 | ||
115 | uint8_t *funnyYCode; | |
116 | uint8_t *funnyUVCode; | |
117 | int32_t *lumMmx2FilterPos; | |
118 | int32_t *chrMmx2FilterPos; | |
119 | int16_t *lumMmx2Filter; | |
120 | int16_t *chrMmx2Filter; | |
121 | ||
122 | int canMMX2BeUsed; | |
123 | ||
124 | int lastInLumBuf; | |
125 | int lastInChrBuf; | |
126 | int lumBufIndex; | |
127 | int chrBufIndex; | |
128 | int dstY; | |
129 | int flags; | |
130 | void * yuvTable; // pointer to the yuv->rgb table start so it can be freed() | |
131 | uint8_t * table_rV[256]; | |
132 | uint8_t * table_gU[256]; | |
133 | int table_gV[256]; | |
134 | uint8_t * table_bU[256]; | |
135 | ||
136 | //Colorspace stuff | |
137 | int contrast, brightness, saturation; // for sws_getColorspaceDetails | |
138 | int srcColorspaceTable[4]; | |
139 | int dstColorspaceTable[4]; | |
140 | int srcRange, dstRange; | |
43c16478 MN |
141 | int yuv2rgb_y_offset; |
142 | int yuv2rgb_y_coeff; | |
143 | int yuv2rgb_v2r_coeff; | |
144 | int yuv2rgb_v2g_coeff; | |
145 | int yuv2rgb_u2g_coeff; | |
146 | int yuv2rgb_u2b_coeff; | |
221b804f DB |
147 | |
148 | #define RED_DITHER "0*8" | |
149 | #define GREEN_DITHER "1*8" | |
150 | #define BLUE_DITHER "2*8" | |
151 | #define Y_COEFF "3*8" | |
152 | #define VR_COEFF "4*8" | |
153 | #define UB_COEFF "5*8" | |
154 | #define VG_COEFF "6*8" | |
155 | #define UG_COEFF "7*8" | |
156 | #define Y_OFFSET "8*8" | |
157 | #define U_OFFSET "9*8" | |
158 | #define V_OFFSET "10*8" | |
8bae9ddc MN |
159 | #define LUM_MMX_FILTER_OFFSET "11*8" |
160 | #define CHR_MMX_FILTER_OFFSET "11*8+4*4*256" | |
8a322796 | 161 | #define DSTW_OFFSET "11*8+4*4*256*2" //do not change, it is hardcoded in the ASM |
221b804f DB |
162 | #define ESP_OFFSET "11*8+4*4*256*2+8" |
163 | #define VROUNDER_OFFSET "11*8+4*4*256*2+16" | |
164 | #define U_TEMP "11*8+4*4*256*2+24" | |
165 | #define V_TEMP "11*8+4*4*256*2+32" | |
6858492e CS |
166 | #define Y_TEMP "11*8+4*4*256*2+40" |
167 | #define ALP_MMX_FILTER_OFFSET "11*8+4*4*256*2+48" | |
221b804f DB |
168 | |
169 | uint64_t redDither __attribute__((aligned(8))); | |
170 | uint64_t greenDither __attribute__((aligned(8))); | |
171 | uint64_t blueDither __attribute__((aligned(8))); | |
172 | ||
173 | uint64_t yCoeff __attribute__((aligned(8))); | |
174 | uint64_t vrCoeff __attribute__((aligned(8))); | |
175 | uint64_t ubCoeff __attribute__((aligned(8))); | |
176 | uint64_t vgCoeff __attribute__((aligned(8))); | |
177 | uint64_t ugCoeff __attribute__((aligned(8))); | |
178 | uint64_t yOffset __attribute__((aligned(8))); | |
179 | uint64_t uOffset __attribute__((aligned(8))); | |
180 | uint64_t vOffset __attribute__((aligned(8))); | |
181 | int32_t lumMmxFilter[4*MAX_FILTER_SIZE]; | |
182 | int32_t chrMmxFilter[4*MAX_FILTER_SIZE]; | |
183 | int dstW; | |
184 | uint64_t esp __attribute__((aligned(8))); | |
185 | uint64_t vRounder __attribute__((aligned(8))); | |
186 | uint64_t u_temp __attribute__((aligned(8))); | |
187 | uint64_t v_temp __attribute__((aligned(8))); | |
6858492e CS |
188 | uint64_t y_temp __attribute__((aligned(8))); |
189 | int32_t alpMmxFilter[4*MAX_FILTER_SIZE]; | |
a31de956 | 190 | |
b63f641e | 191 | #if HAVE_ALTIVEC |
a31de956 MN |
192 | vector signed short CY; |
193 | vector signed short CRV; | |
194 | vector signed short CBU; | |
195 | vector signed short CGU; | |
196 | vector signed short CGV; | |
197 | vector signed short OY; | |
198 | vector unsigned short CSHIFT; | |
221b804f | 199 | vector signed short *vYCoeffsBank, *vCCoeffsBank; |
a31de956 MN |
200 | #endif |
201 | ||
b63f641e | 202 | #if ARCH_BFIN |
d3f3eea9 MH |
203 | uint32_t oy __attribute__((aligned(4))); |
204 | uint32_t oc __attribute__((aligned(4))); | |
205 | uint32_t zero __attribute__((aligned(4))); | |
206 | uint32_t cy __attribute__((aligned(4))); | |
207 | uint32_t crv __attribute__((aligned(4))); | |
208 | uint32_t rmask __attribute__((aligned(4))); | |
209 | uint32_t cbu __attribute__((aligned(4))); | |
210 | uint32_t bmask __attribute__((aligned(4))); | |
211 | uint32_t cgu __attribute__((aligned(4))); | |
212 | uint32_t cgv __attribute__((aligned(4))); | |
213 | uint32_t gmask __attribute__((aligned(4))); | |
214 | #endif | |
215 | ||
b63f641e | 216 | #if HAVE_VIS |
90c1d7b4 DB |
217 | uint64_t sparc_coeffs[10] __attribute__((aligned(8))); |
218 | #endif | |
d3f3eea9 | 219 | |
40fa5140 RP |
220 | /* function pointers for swScale() */ |
221 | void (*yuv2nv12X )(struct SwsContext *c, | |
222 | const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, | |
223 | const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize, | |
224 | uint8_t *dest, uint8_t *uDest, | |
225 | int dstW, int chrDstW, int dstFormat); | |
226 | void (*yuv2yuv1 )(struct SwsContext *c, | |
227 | const int16_t *lumSrc, const int16_t *chrSrc, const int16_t *alpSrc, | |
228 | uint8_t *dest, | |
229 | uint8_t *uDest, uint8_t *vDest, uint8_t *aDest, | |
230 | long dstW, long chrDstW); | |
231 | void (*yuv2yuvX )(struct SwsContext *c, | |
232 | const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, | |
233 | const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize, | |
234 | const int16_t **alpSrc, | |
235 | uint8_t *dest, | |
236 | uint8_t *uDest, uint8_t *vDest, uint8_t *aDest, | |
237 | long dstW, long chrDstW); | |
238 | void (*yuv2packed1)(struct SwsContext *c, | |
239 | const uint16_t *buf0, | |
240 | const uint16_t *uvbuf0, const uint16_t *uvbuf1, | |
241 | const uint16_t *abuf0, | |
242 | uint8_t *dest, | |
243 | int dstW, int uvalpha, int dstFormat, int flags, int y); | |
244 | void (*yuv2packed2)(struct SwsContext *c, | |
245 | const uint16_t *buf0, const uint16_t *buf1, | |
246 | const uint16_t *uvbuf0, const uint16_t *uvbuf1, | |
247 | const uint16_t *abuf0, const uint16_t *abuf1, | |
248 | uint8_t *dest, | |
249 | int dstW, int yalpha, int uvalpha, int y); | |
250 | void (*yuv2packedX)(struct SwsContext *c, | |
251 | const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, | |
252 | const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize, | |
253 | const int16_t **alpSrc, uint8_t *dest, | |
254 | long dstW, long dstY); | |
255 | ||
256 | void (*hyscale_internal)(uint8_t *dst, const uint8_t *src, | |
257 | long width, uint32_t *pal); | |
39e5f87b CS |
258 | void (*hascale_internal)(uint8_t *dst, const uint8_t *src, |
259 | long width, uint32_t *pal); | |
40fa5140 RP |
260 | void (*hcscale_internal)(uint8_t *dstU, uint8_t *dstV, |
261 | const uint8_t *src1, const uint8_t *src2, | |
262 | long width, uint32_t *pal); | |
263 | void (*hyscale_fast)(struct SwsContext *c, | |
264 | int16_t *dst, int dstWidth, | |
265 | const uint8_t *src, int srcW, int xInc); | |
266 | void (*hcscale_fast)(struct SwsContext *c, | |
267 | int16_t *dst, int dstWidth, | |
457eed72 DB |
268 | const uint8_t *src1, const uint8_t *src2, |
269 | int srcW, int xInc); | |
40fa5140 RP |
270 | |
271 | void (*hScale)(int16_t *dst, int dstW, const uint8_t *src, int srcW, | |
457eed72 DB |
272 | int xInc, const int16_t *filter, const int16_t *filterPos, |
273 | long filterSize); | |
40fa5140 | 274 | |
5427e242 MN |
275 | } SwsContext; |
276 | //FIXME check init (where 0) | |
5427e242 | 277 | |
780daf2b | 278 | SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c); |
457eed72 DB |
279 | int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4], |
280 | int fullRange, int brightness, | |
281 | int contrast, int saturation); | |
5427e242 | 282 | |
457eed72 DB |
283 | void ff_yuv2rgb_init_tables_altivec(SwsContext *c, const int inv_table[4], |
284 | int brightness, int contrast, int saturation); | |
befa8e66 RP |
285 | SwsFunc ff_yuv2rgb_init_mmx(SwsContext *c); |
286 | SwsFunc ff_yuv2rgb_init_vis(SwsContext *c); | |
287 | SwsFunc ff_yuv2rgb_init_mlib(SwsContext *c); | |
780daf2b | 288 | SwsFunc ff_yuv2rgb_init_altivec(SwsContext *c); |
befa8e66 | 289 | SwsFunc ff_yuv2rgb_get_func_ptr_bfin(SwsContext *c); |
d5e9bc06 | 290 | void ff_bfin_get_unscaled_swscale(SwsContext *c); |
780daf2b | 291 | void ff_yuv2packedX_altivec(SwsContext *c, |
f1933e43 DB |
292 | const int16_t *lumFilter, int16_t **lumSrc, int lumFilterSize, |
293 | const int16_t *chrFilter, int16_t **chrSrc, int chrFilterSize, | |
457eed72 | 294 | uint8_t *dest, int dstW, int dstY); |
c95a3a9f | 295 | |
8055ede6 | 296 | const char *sws_format_name(int format); |
94c4def2 | 297 | |
e9e12f0e | 298 | //FIXME replace this with something faster |
714f32bf MN |
299 | #define is16BPS(x) ( \ |
300 | (x)==PIX_FMT_GRAY16BE \ | |
301 | || (x)==PIX_FMT_GRAY16LE \ | |
5b21719e KS |
302 | || (x)==PIX_FMT_RGB48BE \ |
303 | || (x)==PIX_FMT_RGB48LE \ | |
de1275d5 MN |
304 | || (x)==PIX_FMT_YUV420PLE \ |
305 | || (x)==PIX_FMT_YUV422PLE \ | |
306 | || (x)==PIX_FMT_YUV444PLE \ | |
307 | || (x)==PIX_FMT_YUV420PBE \ | |
308 | || (x)==PIX_FMT_YUV422PBE \ | |
309 | || (x)==PIX_FMT_YUV444PBE \ | |
714f32bf | 310 | ) |
c3dc6c5a | 311 | #define isBE(x) ((x)&1) |
de1275d5 | 312 | #define isPlanar8YUV(x) ( \ |
9d9de37d IP |
313 | (x)==PIX_FMT_YUV410P \ |
314 | || (x)==PIX_FMT_YUV420P \ | |
9621f2f5 | 315 | || (x)==PIX_FMT_YUVA420P \ |
9d9de37d IP |
316 | || (x)==PIX_FMT_YUV411P \ |
317 | || (x)==PIX_FMT_YUV422P \ | |
318 | || (x)==PIX_FMT_YUV444P \ | |
9ba7fe6d | 319 | || (x)==PIX_FMT_YUV440P \ |
9d9de37d IP |
320 | || (x)==PIX_FMT_NV12 \ |
321 | || (x)==PIX_FMT_NV21 \ | |
322 | ) | |
de1275d5 MN |
323 | #define isPlanarYUV(x) ( \ |
324 | isPlanar8YUV(x) \ | |
325 | || (x)==PIX_FMT_YUV420PLE \ | |
326 | || (x)==PIX_FMT_YUV422PLE \ | |
327 | || (x)==PIX_FMT_YUV444PLE \ | |
328 | || (x)==PIX_FMT_YUV420PBE \ | |
329 | || (x)==PIX_FMT_YUV422PBE \ | |
330 | || (x)==PIX_FMT_YUV444PBE \ | |
331 | ) | |
9d9de37d IP |
332 | #define isYUV(x) ( \ |
333 | (x)==PIX_FMT_UYVY422 \ | |
334 | || (x)==PIX_FMT_YUYV422 \ | |
335 | || isPlanarYUV(x) \ | |
336 | ) | |
337 | #define isGray(x) ( \ | |
338 | (x)==PIX_FMT_GRAY8 \ | |
339 | || (x)==PIX_FMT_GRAY16BE \ | |
340 | || (x)==PIX_FMT_GRAY16LE \ | |
341 | ) | |
342 | #define isGray16(x) ( \ | |
343 | (x)==PIX_FMT_GRAY16BE \ | |
344 | || (x)==PIX_FMT_GRAY16LE \ | |
345 | ) | |
346 | #define isRGB(x) ( \ | |
e8417235 KS |
347 | (x)==PIX_FMT_RGB48BE \ |
348 | || (x)==PIX_FMT_RGB48LE \ | |
349 | || (x)==PIX_FMT_RGB32 \ | |
9990e426 | 350 | || (x)==PIX_FMT_RGB32_1 \ |
9d9de37d IP |
351 | || (x)==PIX_FMT_RGB24 \ |
352 | || (x)==PIX_FMT_RGB565 \ | |
353 | || (x)==PIX_FMT_RGB555 \ | |
354 | || (x)==PIX_FMT_RGB8 \ | |
355 | || (x)==PIX_FMT_RGB4 \ | |
356 | || (x)==PIX_FMT_RGB4_BYTE \ | |
357 | || (x)==PIX_FMT_MONOBLACK \ | |
ec1bca2a | 358 | || (x)==PIX_FMT_MONOWHITE \ |
9d9de37d IP |
359 | ) |
360 | #define isBGR(x) ( \ | |
d52337af | 361 | (x)==PIX_FMT_BGR32 \ |
9990e426 | 362 | || (x)==PIX_FMT_BGR32_1 \ |
9d9de37d IP |
363 | || (x)==PIX_FMT_BGR24 \ |
364 | || (x)==PIX_FMT_BGR565 \ | |
365 | || (x)==PIX_FMT_BGR555 \ | |
366 | || (x)==PIX_FMT_BGR8 \ | |
367 | || (x)==PIX_FMT_BGR4 \ | |
368 | || (x)==PIX_FMT_BGR4_BYTE \ | |
369 | || (x)==PIX_FMT_MONOBLACK \ | |
ec1bca2a | 370 | || (x)==PIX_FMT_MONOWHITE \ |
9d9de37d | 371 | ) |
c2751600 CS |
372 | #define isALPHA(x) ( \ |
373 | (x)==PIX_FMT_BGR32 \ | |
374 | || (x)==PIX_FMT_BGR32_1 \ | |
375 | || (x)==PIX_FMT_RGB32 \ | |
376 | || (x)==PIX_FMT_RGB32_1 \ | |
377 | || (x)==PIX_FMT_YUVA420P \ | |
378 | ) | |
e9e12f0e LA |
379 | |
380 | static inline int fmt_depth(int fmt) | |
381 | { | |
382 | switch(fmt) { | |
075ec82c KS |
383 | case PIX_FMT_RGB48BE: |
384 | case PIX_FMT_RGB48LE: | |
385 | return 48; | |
e9e12f0e LA |
386 | case PIX_FMT_BGRA: |
387 | case PIX_FMT_ABGR: | |
388 | case PIX_FMT_RGBA: | |
389 | case PIX_FMT_ARGB: | |
390 | return 32; | |
391 | case PIX_FMT_BGR24: | |
392 | case PIX_FMT_RGB24: | |
393 | return 24; | |
394 | case PIX_FMT_BGR565: | |
395 | case PIX_FMT_RGB565: | |
4884b9e5 KS |
396 | case PIX_FMT_GRAY16BE: |
397 | case PIX_FMT_GRAY16LE: | |
e9e12f0e LA |
398 | return 16; |
399 | case PIX_FMT_BGR555: | |
400 | case PIX_FMT_RGB555: | |
401 | return 15; | |
402 | case PIX_FMT_BGR8: | |
403 | case PIX_FMT_RGB8: | |
404 | return 8; | |
405 | case PIX_FMT_BGR4: | |
406 | case PIX_FMT_RGB4: | |
407 | case PIX_FMT_BGR4_BYTE: | |
408 | case PIX_FMT_RGB4_BYTE: | |
409 | return 4; | |
410 | case PIX_FMT_MONOBLACK: | |
ec1bca2a | 411 | case PIX_FMT_MONOWHITE: |
e9e12f0e LA |
412 | return 1; |
413 | default: | |
414 | return 0; | |
415 | } | |
416 | } | |
417 | ||
43175f50 DB |
418 | extern const uint64_t ff_dither4[2]; |
419 | extern const uint64_t ff_dither8[2]; | |
0cb25594 | 420 | |
e40b183d LB |
421 | extern const AVClass sws_context_class; |
422 | ||
0eaf5235 | 423 | #endif /* SWSCALE_SWSCALE_INTERNAL_H */ |