a401175a263805cc433edbc99876bbff9cb4e3f5
[libav.git] / libswscale / swscale_internal.h
1 /*
2 * Copyright (C) 2001-2003 Michael Niedermayer <michaelni@gmx.at>
3 *
4 * This file is part of FFmpeg.
5 *
6 * FFmpeg is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
10 *
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with FFmpeg; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19 */
20
21 #ifndef SWSCALE_SWSCALE_INTERNAL_H
22 #define SWSCALE_SWSCALE_INTERNAL_H
23
24 #include "config.h"
25
26 #ifdef HAVE_ALTIVEC_H
27 #include <altivec.h>
28 #endif
29
30 #include "libavutil/avutil.h"
31
/* Short alias for AV_TOSTRING (AV_STRINGIFY is too long). */
#define STR(s) AV_TOSTRING(s)

/* Sizes the lumMmxFilter / chrMmxFilter arrays of SwsContext (4 entries each). */
#define MAX_FILTER_SIZE 256

/* VOF, twice VOFW, is the byte size of SwsContext.formatConvBuffer. */
#define VOFW 2048
#define VOF  (VOFW*2)

/* Sign chosen by byte order: -1 when WORDS_BIGENDIAN is defined, 1 otherwise. */
#ifndef WORDS_BIGENDIAN
#define ALT32_CORR 1
#else
#define ALT32_CORR (-1)
#endif

/*
 * APCK_* constants; the larger set applies when ARCH_X86_64 is defined.
 * NOTE(review): presumably byte offsets/size that follow the pointer width
 * and are used from assembly -- confirm against the users of these macros.
 */
#ifndef ARCH_X86_64
#  define APCK_PTR2 4
#  define APCK_COEF 8
#  define APCK_SIZE 16
#else
#  define APCK_PTR2 8
#  define APCK_COEF 16
#  define APCK_SIZE 24
#endif
54
/*
 * Declare the tag at file scope before it is used in a parameter list.
 * Without this, and unless an earlier include already declared it, the
 * `struct SwsContext` named in the prototype below would only have
 * prototype scope and would be a different type from the struct defined
 * later in this header.
 */
struct SwsContext;

/**
 * Pointer type of the function stored in SwsContext.swScale.
 *
 * @param context    scaler context
 * @param src        array of source pointers
 * @param srcStride  array of source strides
 * @param srcSliceY  integer slice position argument
 * @param srcSliceH  integer slice height argument
 * @param dst        array of destination pointers
 * @param dstStride  array of destination strides
 * @return an int; its meaning is defined by the implementations, which are
 *         not visible in this header
 */
typedef int (*SwsFunc)(struct SwsContext *context, uint8_t *src[],
                       int srcStride[], int srcSliceY, int srcSliceH,
                       uint8_t *dst[], int dstStride[]);
57
58 /* This struct should be aligned on at least a 32-byte boundary. */
59 typedef struct SwsContext{
60 /**
61 * info on struct for av_log
62 */
63 const AVClass *av_class;
64
65 /**
66 * Note that src, dst, srcStride, dstStride will be copied in the
67 * sws_scale() wrapper so they can be freely modified here.
68 */
69 SwsFunc swScale;
70 int srcW, srcH, dstH;
71 int chrSrcW, chrSrcH, chrDstW, chrDstH;
72 int lumXInc, chrXInc;
73 int lumYInc, chrYInc;
74 int dstFormat, srcFormat; ///< format 4:2:0 type is always YV12
75 int origDstFormat, origSrcFormat; ///< format
76 int chrSrcHSubSample, chrSrcVSubSample;
77 int chrIntHSubSample, chrIntVSubSample;
78 int chrDstHSubSample, chrDstVSubSample;
79 int vChrDrop;
80 int sliceDir;
81 double param[2];
82
83 int16_t **lumPixBuf;
84 int16_t **chrPixBuf;
85 int16_t *hLumFilter;
86 int16_t *hLumFilterPos;
87 int16_t *hChrFilter;
88 int16_t *hChrFilterPos;
89 int16_t *vLumFilter;
90 int16_t *vLumFilterPos;
91 int16_t *vChrFilter;
92 int16_t *vChrFilterPos;
93
94 uint8_t formatConvBuffer[VOF]; //FIXME dynamic allocation, but we have to change a lot of code for this to be useful
95
96 int hLumFilterSize;
97 int hChrFilterSize;
98 int vLumFilterSize;
99 int vChrFilterSize;
100 int vLumBufSize;
101 int vChrBufSize;
102
103 uint8_t *funnyYCode;
104 uint8_t *funnyUVCode;
105 int32_t *lumMmx2FilterPos;
106 int32_t *chrMmx2FilterPos;
107 int16_t *lumMmx2Filter;
108 int16_t *chrMmx2Filter;
109
110 int canMMX2BeUsed;
111
112 int lastInLumBuf;
113 int lastInChrBuf;
114 int lumBufIndex;
115 int chrBufIndex;
116 int dstY;
117 int flags;
118 void * yuvTable; // pointer to the yuv->rgb table start so it can be freed()
119 uint8_t * table_rV[256];
120 uint8_t * table_gU[256];
121 int table_gV[256];
122 uint8_t * table_bU[256];
123
124 //Colorspace stuff
125 int contrast, brightness, saturation; // for sws_getColorspaceDetails
126 int srcColorspaceTable[4];
127 int dstColorspaceTable[4];
128 int srcRange, dstRange;
129 int oy,cy,cvr,cvg,cug,cub;
130
131 #define RED_DITHER "0*8"
132 #define GREEN_DITHER "1*8"
133 #define BLUE_DITHER "2*8"
134 #define Y_COEFF "3*8"
135 #define VR_COEFF "4*8"
136 #define UB_COEFF "5*8"
137 #define VG_COEFF "6*8"
138 #define UG_COEFF "7*8"
139 #define Y_OFFSET "8*8"
140 #define U_OFFSET "9*8"
141 #define V_OFFSET "10*8"
142 #define LUM_MMX_FILTER_OFFSET "11*8"
143 #define CHR_MMX_FILTER_OFFSET "11*8+4*4*256"
144 #define DSTW_OFFSET "11*8+4*4*256*2" //do not change, it is hardcoded in the ASM
145 #define ESP_OFFSET "11*8+4*4*256*2+8"
146 #define VROUNDER_OFFSET "11*8+4*4*256*2+16"
147 #define U_TEMP "11*8+4*4*256*2+24"
148 #define V_TEMP "11*8+4*4*256*2+32"
149
150 uint64_t redDither __attribute__((aligned(8)));
151 uint64_t greenDither __attribute__((aligned(8)));
152 uint64_t blueDither __attribute__((aligned(8)));
153
154 uint64_t yCoeff __attribute__((aligned(8)));
155 uint64_t vrCoeff __attribute__((aligned(8)));
156 uint64_t ubCoeff __attribute__((aligned(8)));
157 uint64_t vgCoeff __attribute__((aligned(8)));
158 uint64_t ugCoeff __attribute__((aligned(8)));
159 uint64_t yOffset __attribute__((aligned(8)));
160 uint64_t uOffset __attribute__((aligned(8)));
161 uint64_t vOffset __attribute__((aligned(8)));
162 int32_t lumMmxFilter[4*MAX_FILTER_SIZE];
163 int32_t chrMmxFilter[4*MAX_FILTER_SIZE];
164 int dstW;
165 uint64_t esp __attribute__((aligned(8)));
166 uint64_t vRounder __attribute__((aligned(8)));
167 uint64_t u_temp __attribute__((aligned(8)));
168 uint64_t v_temp __attribute__((aligned(8)));
169
170 #ifdef HAVE_ALTIVEC
171
172 vector signed short CY;
173 vector signed short CRV;
174 vector signed short CBU;
175 vector signed short CGU;
176 vector signed short CGV;
177 vector signed short OY;
178 vector unsigned short CSHIFT;
179 vector signed short *vYCoeffsBank, *vCCoeffsBank;
180
181 #endif
182
183
184 #ifdef ARCH_BFIN
185 uint32_t oy __attribute__((aligned(4)));
186 uint32_t oc __attribute__((aligned(4)));
187 uint32_t zero __attribute__((aligned(4)));
188 uint32_t cy __attribute__((aligned(4)));
189 uint32_t crv __attribute__((aligned(4)));
190 uint32_t rmask __attribute__((aligned(4)));
191 uint32_t cbu __attribute__((aligned(4)));
192 uint32_t bmask __attribute__((aligned(4)));
193 uint32_t cgu __attribute__((aligned(4)));
194 uint32_t cgv __attribute__((aligned(4)));
195 uint32_t gmask __attribute__((aligned(4)));
196 #endif
197
198 #ifdef HAVE_VIS
199 uint64_t sparc_coeffs[10] __attribute__((aligned(8)));
200 #endif
201
202 } SwsContext;
203 //FIXME check init (where 0)
204
205 SwsFunc yuv2rgb_get_func_ptr (SwsContext *c);
206 int yuv2rgb_c_init_tables (SwsContext *c, const int inv_table[4], int fullRange, int brightness, int contrast, int saturation);
207
208 void yuv2rgb_altivec_init_tables (SwsContext *c, const int inv_table[4],int brightness,int contrast, int saturation);
209 SwsFunc yuv2rgb_init_altivec (SwsContext *c);
210 void altivec_yuv2packedX (SwsContext *c,
211 int16_t *lumFilter, int16_t **lumSrc, int lumFilterSize,
212 int16_t *chrFilter, int16_t **chrSrc, int chrFilterSize,
213 uint8_t *dest, int dstW, int dstY);
214
215 const char *sws_format_name(int format);
216
/*
 * Pixel-format classification macros. Each one expands to a chain of
 * equality tests, so the argument is evaluated more than once: do not pass
 * an expression with side effects.
 */
//FIXME replace this with something faster

/* True for the planar YUV formats listed below (NV12 / NV21 included). */
#define isPlanarYUV(x) (            \
    (x) == PIX_FMT_YUV410P ||       \
    (x) == PIX_FMT_YUV420P ||       \
    (x) == PIX_FMT_YUV411P ||       \
    (x) == PIX_FMT_YUV422P ||       \
    (x) == PIX_FMT_YUV444P ||       \
    (x) == PIX_FMT_YUV440P ||       \
    (x) == PIX_FMT_NV12    ||       \
    (x) == PIX_FMT_NV21             \
)

/* True for UYVY422, YUYV422 and everything isPlanarYUV() accepts. */
#define isYUV(x) (                  \
    (x) == PIX_FMT_UYVY422 ||       \
    (x) == PIX_FMT_YUYV422 ||       \
    isPlanarYUV(x)                  \
)

/* True for GRAY8 and for both 16-bit gray formats. */
#define isGray(x) (                 \
    (x) == PIX_FMT_GRAY8 ||         \
    isGray16(x)                     \
)

/* True for the two 16-bit gray formats only. */
#define isGray16(x) (               \
    (x) == PIX_FMT_GRAY16BE ||      \
    (x) == PIX_FMT_GRAY16LE         \
)

/* True for the RGB-ordered formats; MONOBLACK is accepted here as well. */
#define isRGB(x) (                  \
    (x) == PIX_FMT_RGB32     ||     \
    (x) == PIX_FMT_RGB32_1   ||     \
    (x) == PIX_FMT_RGB24     ||     \
    (x) == PIX_FMT_RGB565    ||     \
    (x) == PIX_FMT_RGB555    ||     \
    (x) == PIX_FMT_RGB8      ||     \
    (x) == PIX_FMT_RGB4      ||     \
    (x) == PIX_FMT_RGB4_BYTE ||     \
    (x) == PIX_FMT_MONOBLACK        \
)

/* True for the BGR-ordered formats; MONOBLACK is accepted here as well. */
#define isBGR(x) (                  \
    (x) == PIX_FMT_BGR32     ||     \
    (x) == PIX_FMT_BGR32_1   ||     \
    (x) == PIX_FMT_BGR24     ||     \
    (x) == PIX_FMT_BGR565    ||     \
    (x) == PIX_FMT_BGR555    ||     \
    (x) == PIX_FMT_BGR8      ||     \
    (x) == PIX_FMT_BGR4      ||     \
    (x) == PIX_FMT_BGR4_BYTE ||     \
    (x) == PIX_FMT_MONOBLACK        \
)
264
265 static inline int fmt_depth(int fmt)
266 {
267 switch(fmt) {
268 case PIX_FMT_BGRA:
269 case PIX_FMT_ABGR:
270 case PIX_FMT_RGBA:
271 case PIX_FMT_ARGB:
272 return 32;
273 case PIX_FMT_BGR24:
274 case PIX_FMT_RGB24:
275 return 24;
276 case PIX_FMT_BGR565:
277 case PIX_FMT_RGB565:
278 case PIX_FMT_GRAY16BE:
279 case PIX_FMT_GRAY16LE:
280 return 16;
281 case PIX_FMT_BGR555:
282 case PIX_FMT_RGB555:
283 return 15;
284 case PIX_FMT_BGR8:
285 case PIX_FMT_RGB8:
286 return 8;
287 case PIX_FMT_BGR4:
288 case PIX_FMT_RGB4:
289 case PIX_FMT_BGR4_BYTE:
290 case PIX_FMT_RGB4_BYTE:
291 return 4;
292 case PIX_FMT_MONOBLACK:
293 return 1;
294 default:
295 return 0;
296 }
297 }
298
299 extern const DECLARE_ALIGNED(8, uint64_t, ff_dither4[2]);
300 extern const DECLARE_ALIGNED(8, uint64_t, ff_dither8[2]);
301
302 extern const AVClass sws_context_class;
303
304 #endif /* SWSCALE_SWSCALE_INTERNAL_H */