/*
 * Copyright (c) 2002 Brian Foley
 * Copyright (c) 2002 Dieter Shirley
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 */
20 #ifndef _DSPUTIL_ALTIVEC_
21 #define _DSPUTIL_ALTIVEC_
23 #include "dsputil_ppc.h"
/*
 * AltiVec "pix_abs" block-comparison entry points (16x16 and 8x8).
 * Only the prototypes are declared here; the bodies are defined elsewhere.
 *
 * Each takes two pixel pointers and a line size, and returns an int.
 * NOTE(review): going by the names, these presumably return a sum of
 * absolute differences, with the _x2/_y2/_xy2 variants comparing against a
 * half-pel interpolated reference -- confirm against the implementation.
 */
extern int pix_abs16x16_x2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size);
extern int pix_abs16x16_y2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size);
extern int pix_abs16x16_xy2_altivec(uint8_t *pix1, uint8_t *pix2, int line_size);
extern int pix_abs16x16_altivec(uint8_t *pix1, uint8_t *pix2, int line_size);
extern int pix_abs8x8_altivec(uint8_t *pix1, uint8_t *pix2, int line_size);
/*
 * AltiVec "sad" entry points for 16x16 and 8x8 blocks.
 *
 * s      - opaque pointer; its use is not visible from this header
 * a, b   - the two pixel buffers
 * stride - NOTE(review): presumably the byte distance between rows of
 *          a and b -- confirm against the implementation
 *
 * Returns an int (presumably the sum of absolute differences -- TODO confirm).
 */
extern int sad16x16_altivec(void *s, uint8_t *a, uint8_t *b, int stride);
extern int sad8x8_altivec(void *s, uint8_t *a, uint8_t *b, int stride);
/*
 * AltiVec pix_norm1 entry point: takes a pixel pointer and a line size and
 * returns an int.
 * NOTE(review): the name suggests a norm (e.g. sum of squares) over a pixel
 * block; the block size and exact metric are not visible here -- confirm.
 */
extern int pix_norm1_altivec(uint8_t *pix, int line_size);
/*
 * AltiVec "sse" entry points (8- and 16-wide variants).
 *
 * v          - opaque pointer; its use is not visible from this header
 * pix1, pix2 - the two pixel buffers
 * line_size  - NOTE(review): presumably the byte distance between rows --
 *              confirm against the implementation
 *
 * Returns an int (presumably the sum of squared errors -- TODO confirm).
 */
extern int sse8_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size);
extern int sse16_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size);
37 extern int pix_sum_altivec(UINT8
* pix
, int line_size
);
38 extern void diff_pixels_altivec(DCTELEM
* block
, const UINT8
* s1
, const UINT8
* s2
, int stride
);
39 extern void get_pixels_altivec(DCTELEM
* block
, const UINT8
* pixels
, int line_size
);
/*
 * AltiVec add_bytes entry point: takes a destination buffer, a source buffer
 * and an int w.
 * NOTE(review): presumably adds w bytes of src into dst element-wise --
 * confirm against the implementation.
 */
extern void add_bytes_altivec(uint8_t *dst, uint8_t *src, int w);
42 extern void put_pixels_clamped_altivec(const DCTELEM
*block
, UINT8
*restrict pixels
, int line_size
);
/*
 * AltiVec put/avg pixel-block entry points.
 *
 * All share one signature:
 *   block     - destination pixels (written)
 *   pixels    - source pixels (read-only)
 *   line_size - NOTE(review): presumably the byte distance between rows
 *   h         - NOTE(review): presumably the number of rows to process
 *
 * NOTE(review): from the names, "put" stores and "avg" averages into block,
 * 8/16 is the block width, "_xy2" is a diagonal half-pel interpolation and
 * "no_rnd" selects the non-rounding variant -- confirm against the
 * implementation.
 */
extern void put_pixels16_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
extern void avg_pixels16_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
extern void avg_pixels8_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
extern void put_pixels8_xy2_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
extern void put_no_rnd_pixels8_xy2_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
extern void put_pixels16_xy2_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
extern void put_no_rnd_pixels16_xy2_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
51 extern void gmc1_altivec(UINT8
*dst
, UINT8
*src
, int stride
, int h
, int x16
, int y16
, int rounder
);
/*
 * AltiVec availability query: takes no arguments and returns an int.
 * NOTE(review): presumably non-zero when AltiVec can be used -- confirm
 * against the implementation.
 */
extern int has_altivec(void);
// Byte-index groups used to build register permutation vectors (see vcprm).
// Each WORD_<n> expands to the four consecutive byte indices of one 32-bit
// word: WORD_0..WORD_3 cover bytes 0x00-0x0f, and the 's' variants
// WORD_s0..WORD_s3 cover bytes 0x10-0x1f, i.e. words in the _s_econd vector.
#define WORD_0 0x00,0x01,0x02,0x03
#define WORD_1 0x04,0x05,0x06,0x07
#define WORD_2 0x08,0x09,0x0a,0x0b
#define WORD_3 0x0c,0x0d,0x0e,0x0f
#define WORD_s0 0x10,0x11,0x12,0x13
#define WORD_s1 0x14,0x15,0x16,0x17
#define WORD_s2 0x18,0x19,0x1a,0x1b
#define WORD_s3 0x1c,0x1d,0x1e,0x1f
// vcprm(a,b,c,d) builds a constant `vector unsigned char` by pasting each
// argument onto WORD_ (so arguments are 0..3 or s0..s3) and listing the
// resulting byte indices.
// NOTE(review): vcprm is defined twice below, once with a parenthesised
// vector literal and once with a braced one. The preprocessor conditional
// that should select exactly one of them is not visible in this view --
// confirm against the complete header before relying on either form.
67 #define vcprm(a,b,c,d) (const vector unsigned char)(WORD_ ## a, WORD_ ## b, WORD_ ## c, WORD_ ## d)
69 #define vcprm(a,b,c,d) (const vector unsigned char){WORD_ ## a, WORD_ ## b, WORD_ ## c, WORD_ ## d}
// vcprmle takes its word selectors in the same order as the SSE version
// and forwards them to vcprm in reversed order
// ('le' stands for Little Endian).
#define vcprmle(a,b,c,d) vcprm(d,c,b,a)
// used to build inverse/identity vectors (vcii)
// n is _n_egative, p is _p_ositive
// vcii(a,b,c,d) builds a constant `vector float` by pasting each argument
// onto FLOAT_ and listing the four resulting values.
// NOTE(review): the FLOAT_<x> macros these names resolve to are not defined
// in the visible part of this header -- confirm where they come from.
// NOTE(review): vcii is defined twice below, once with a parenthesised
// vector literal and once with a braced one. The preprocessor conditional
// that should select exactly one of them is not visible in this view --
// confirm against the complete header before relying on either form.
84 #define vcii(a,b,c,d) (const vector float)(FLOAT_ ## a, FLOAT_ ## b, FLOAT_ ## c, FLOAT_ ## d)
86 #define vcii(a,b,c,d) (const vector float){FLOAT_ ## a, FLOAT_ ## b, FLOAT_ ## c, FLOAT_ ## d}
89 #else /* HAVE_ALTIVEC */
/*
 * Configuration sanity check: abort the build with an explicit message when
 * ALTIVEC_USE_REFERENCE_C_CODE is defined on this branch, which the
 * surrounding #else / #endif comments label as the HAVE_ALTIVEC alternative.
 * NOTE(review): the directive that opens that conditional is not visible in
 * this view -- confirm it tests HAVE_ALTIVEC.
 */
90 #ifdef ALTIVEC_USE_REFERENCE_C_CODE
91 #error "I can't use ALTIVEC_USE_REFERENCE_C_CODE if I don't use HAVE_ALTIVEC"
92 #endif /* ALTIVEC_USE_REFERENCE_C_CODE */
93 #endif /* HAVE_ALTIVEC */
95 #endif /* _DSPUTIL_ALTIVEC_ */