Commit | Line | Data |
---|---|---|
ff4ec49e FB |
1 | /* |
2 | * DSP utils | |
3 | * Copyright (c) 2000, 2001, 2002 Fabrice Bellard. | |
4 | * | |
5 | * This library is free software; you can redistribute it and/or | |
6 | * modify it under the terms of the GNU Lesser General Public | |
7 | * License as published by the Free Software Foundation; either | |
8 | * version 2 of the License, or (at your option) any later version. | |
9 | * | |
10 | * This library is distributed in the hope that it will be useful, | |
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
13 | * Lesser General Public License for more details. | |
14 | * | |
15 | * You should have received a copy of the GNU Lesser General Public | |
16 | * License along with this library; if not, write to the Free Software | |
17 | * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA | |
18 | */ | |
de6d9b64 FB |
19 | #ifndef DSPUTIL_H |
20 | #define DSPUTIL_H | |
21 | ||
22 | #include "common.h" | |
43f1708f | 23 | #include "avcodec.h" |
de6d9b64 | 24 | |
44eb4951 | 25 | //#define DEBUG |
de6d9b64 FB |
26 | /* dct code */ |
27 | typedef short DCTELEM; | |
28 | ||
03c94ede | 29 | void fdct_ifast (DCTELEM *data); |
de6d9b64 FB |
30 | |
31 | void j_rev_dct (DCTELEM *data); | |
32 | ||
33 | void fdct_mmx(DCTELEM *block); | |
34 | ||
03c94ede | 35 | extern void (*av_fdct)(DCTELEM *block); |
de6d9b64 | 36 | |
e0eac44e FB |
37 | /* encoding scans */ |
38 | extern UINT8 ff_alternate_horizontal_scan[64]; | |
39 | extern UINT8 ff_alternate_vertical_scan[64]; | |
40 | extern UINT8 zigzag_direct[64]; | |
41 | ||
5a240838 MN |
42 | /* permutation table */ |
43 | extern UINT8 permutation[64]; | |
44 | ||
de6d9b64 FB |
45 | /* pixel operations */ |
46 | #define MAX_NEG_CROP 384 | |
47 | ||
48 | /* temporary */ | |
49 | extern UINT32 squareTbl[512]; | |
0cfa9713 | 50 | extern UINT8 cropTbl[256 + 2 * MAX_NEG_CROP]; |
de6d9b64 FB |
51 | |
52 | void dsputil_init(void); | |
53 | ||
54 | /* pixel ops : interface with DCT */ | |
55 | ||
4af7bcc1 | 56 | extern void (*ff_idct)(DCTELEM *block); |
8ee14970 FB |
57 | extern void (*ff_idct_put)(UINT8 *dest, int line_size, DCTELEM *block); |
58 | extern void (*ff_idct_add)(UINT8 *dest, int line_size, DCTELEM *block); | |
de6d9b64 | 59 | extern void (*get_pixels)(DCTELEM *block, const UINT8 *pixels, int line_size); |
9dbcbd92 | 60 | extern void (*diff_pixels)(DCTELEM *block, const UINT8 *s1, const UINT8 *s2, int stride); |
de6d9b64 FB |
61 | extern void (*put_pixels_clamped)(const DCTELEM *block, UINT8 *pixels, int line_size); |
62 | extern void (*add_pixels_clamped)(const DCTELEM *block, UINT8 *pixels, int line_size); | |
44eb4951 | 63 | extern void (*gmc1)(UINT8 *dst, UINT8 *src, int srcStride, int h, int x16, int y16, int rounder); |
649c00c9 | 64 | extern void (*clear_blocks)(DCTELEM *blocks); |
3aa102be MN |
65 | extern int (*pix_sum)(UINT8 * pix, int line_size); |
66 | extern int (*pix_norm1)(UINT8 * pix, int line_size); | |
67 | ||
44eb4951 | 68 | |
de6d9b64 FB |
69 | |
70 | void get_pixels_c(DCTELEM *block, const UINT8 *pixels, int line_size); | |
9dbcbd92 | 71 | void diff_pixels_c(DCTELEM *block, const UINT8 *s1, const UINT8 *s2, int stride); |
de6d9b64 FB |
72 | void put_pixels_clamped_c(const DCTELEM *block, UINT8 *pixels, int line_size); |
73 | void add_pixels_clamped_c(const DCTELEM *block, UINT8 *pixels, int line_size); | |
649c00c9 | 74 | void clear_blocks_c(DCTELEM *blocks); |
de6d9b64 FB |
75 | |
76 | /* add and put pixel (decoding) */ | |
77 | typedef void (*op_pixels_func)(UINT8 *block, const UINT8 *pixels, int line_size, int h); | |
44eb4951 | 78 | typedef void (*qpel_mc_func)(UINT8 *dst, UINT8 *src, int dstStride, int srcStride, int mx, int my); |
de6d9b64 FB |
79 | |
80 | extern op_pixels_func put_pixels_tab[4]; | |
81 | extern op_pixels_func avg_pixels_tab[4]; | |
82 | extern op_pixels_func put_no_rnd_pixels_tab[4]; | |
83 | extern op_pixels_func avg_no_rnd_pixels_tab[4]; | |
44eb4951 MN |
84 | extern qpel_mc_func qpel_mc_rnd_tab[16]; |
85 | extern qpel_mc_func qpel_mc_no_rnd_tab[16]; | |
86 | ||
de6d9b64 FB |
87 | /* motion estimation */ |
88 | ||
ba6802de | 89 | typedef int (*op_pixels_abs_func)(UINT8 *blk1, UINT8 *blk2, int line_size); |
de6d9b64 FB |
90 | |
91 | extern op_pixels_abs_func pix_abs16x16; | |
92 | extern op_pixels_abs_func pix_abs16x16_x2; | |
93 | extern op_pixels_abs_func pix_abs16x16_y2; | |
94 | extern op_pixels_abs_func pix_abs16x16_xy2; | |
ba6802de MN |
95 | extern op_pixels_abs_func pix_abs8x8; |
96 | extern op_pixels_abs_func pix_abs8x8_x2; | |
97 | extern op_pixels_abs_func pix_abs8x8_y2; | |
98 | extern op_pixels_abs_func pix_abs8x8_xy2; | |
99 | ||
100 | int pix_abs16x16_c(UINT8 *blk1, UINT8 *blk2, int lx); | |
101 | int pix_abs16x16_x2_c(UINT8 *blk1, UINT8 *blk2, int lx); | |
102 | int pix_abs16x16_y2_c(UINT8 *blk1, UINT8 *blk2, int lx); | |
103 | int pix_abs16x16_xy2_c(UINT8 *blk1, UINT8 *blk2, int lx); | |
de6d9b64 | 104 | |
e0eac44e FB |
105 | static inline int block_permute_op(int j) |
106 | { | |
5a240838 | 107 | return permutation[j]; |
e0eac44e FB |
108 | } |
109 | ||
110 | void block_permute(INT16 *block); | |
111 | ||
3d03c0a2 | 112 | #if defined(HAVE_MMX) |
de6d9b64 FB |
113 | |
114 | #define MM_MMX 0x0001 /* standard MMX */ | |
115 | #define MM_3DNOW 0x0004 /* AMD 3DNOW */ | |
116 | #define MM_MMXEXT 0x0002 /* SSE integer functions or AMD MMX ext */ | |
117 | #define MM_SSE 0x0008 /* SSE functions */ | |
118 | #define MM_SSE2 0x0010 /* PIV SSE2 functions */ | |
119 | ||
120 | extern int mm_flags; | |
121 | ||
122 | int mm_support(void); | |
123 | ||
/*
 * Issue the x86 "emms" instruction.
 * The statement is volatile and lists "memory" as a clobber, so the
 * compiler neither drops it nor caches memory values across it.
 */
static inline void emms(void)
{
    __asm__ __volatile__ ("emms;" : : : "memory");
}
128 | ||
/*
 * Call emms() when the MM_MMX bit is set in mm_flags; otherwise do nothing.
 *
 * The body is wrapped in do { } while (0) so that "emms_c();" expands to
 * exactly one statement.  A bare { } block followed by ';' is two statements
 * and breaks an unbraced "if (x) emms_c(); else ..." construct.
 */
#define emms_c() \
do {\
    if (mm_flags & MM_MMX)\
        emms();\
} while (0)
134 | ||
135 | #define __align8 __attribute__ ((aligned (8))) | |
136 | ||
137 | void dsputil_init_mmx(void); | |
57060b1e | 138 | void dsputil_set_bit_exact_mmx(void); |
de6d9b64 | 139 | |
3d03c0a2 FB |
140 | #elif defined(ARCH_ARMV4L) |
141 | ||
142 | #define emms_c() | |
143 | ||
144 | /* This is to use 4-byte reads on the IDCT pointers for some 'zero' | |
145 | line optimizations */ | |
146 | #define __align8 __attribute__ ((aligned (4))) | |
147 | ||
148 | void dsputil_init_armv4l(void); | |
149 | ||
c34270f5 FB |
150 | #elif defined(HAVE_MLIB) |
151 | ||
152 | #define emms_c() | |
153 | ||
154 | /* SPARC/VIS IDCT needs 8-byte aligned DCT blocks */ | |
155 | #define __align8 __attribute__ ((aligned (8))) | |
156 | ||
157 | void dsputil_init_mlib(void); | |
158 | ||
1e98dffb NK |
159 | #elif defined(ARCH_ALPHA) |
160 | ||
161 | #define emms_c() | |
162 | #define __align8 __attribute__ ((aligned (8))) | |
163 | ||
164 | void dsputil_init_alpha(void); | |
165 | ||
59925ef2 BF |
166 | #elif defined(ARCH_POWERPC) |
167 | ||
168 | #define emms_c() | |
169 | #define __align8 __attribute__ ((aligned (16))) | |
170 | ||
171 | void dsputil_init_altivec(void); | |
172 | ||
de6d9b64 FB |
173 | #else |
174 | ||
fb16b7e7 FB |
175 | #define emms_c() |
176 | ||
de6d9b64 FB |
177 | #define __align8 |
178 | ||
179 | #endif | |
180 | ||
6d4985bb FB |
/*
 * Helpers for reading and writing 32/64-bit values through arbitrary
 * pointers.
 *
 *   LD32(a) / LD64(a)  - read a 32-/64-bit value at address a
 *   ST32(a, b)         - store the 32-bit value b at address a
 *
 * Every expansion is a single, fully parenthesized expression, so the macros
 * can be used inside larger expressions (e.g. either arm of ?:) as well as
 * stand-alone statements.
 */
#ifdef __GNUC__

/* Packed wrappers: the access goes through a struct declared packed, so the
   compiler does not assume natural alignment for the member. */
struct unaligned_64 { uint64_t l; } __attribute__((packed));
struct unaligned_32 { uint32_t l; } __attribute__((packed));

#define LD32(a) (((const struct unaligned_32 *) (a))->l)
#define LD64(a) (((const struct unaligned_64 *) (a))->l)

#define ST32(a, b) ((((struct unaligned_32 *) (a))->l) = (b))

#else /* __GNUC__ */

/* Fallback: plain pointer casts.
   NOTE(review): presumably relies on the target tolerating unaligned
   loads/stores -- confirm for each non-GCC platform. */
#define LD32(a) (*((const uint32_t*)(a)))
#define LD64(a) (*((const uint64_t*)(a)))

#define ST32(a, b) (*((uint32_t*)(a)) = (b))

#endif /* !__GNUC__ */
199 | ||
43f1708f J |
200 | /* PSNR */ |
201 | void get_psnr(UINT8 *orig_image[3], UINT8 *coded_image[3], | |
202 | int orig_linesize[3], int coded_linesize, | |
203 | AVCodecContext *avctx); | |
204 | ||
de6d9b64 | 205 | #endif |