/*
 * Copyright (c) 2002 Brian Foley
 * Copyright (c) 2002 Dieter Shirley
 * Copyright (c) 2003-2004 Romain Dolbeau <[email protected]>
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

21 | #ifndef _DSPUTIL_ALTIVEC_
|
---|
22 | #define _DSPUTIL_ALTIVEC_
|
---|
23 |
|
---|
24 | #include "dsputil_ppc.h"
|
---|
25 |
|
---|
26 | #ifdef HAVE_ALTIVEC
|
---|
27 |
|
---|
/*
 * Pixel-block comparison entry points (declarations only; the definitions
 * are not part of this header).  All five share one signature: an untyped
 * pointer `v`, two byte pointers `pix1` / `pix2`, `line_size` and `h`,
 * returning an int.
 * NOTE(review): the names suggest sum-of-absolute-differences over 16- or
 * 8-pixel-wide blocks, with _x2 / _y2 / _xy2 as interpolated variants --
 * confirm against the implementation.
 */
extern int sad16_x2_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
extern int sad16_y2_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
extern int sad16_xy2_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
extern int sad16_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
extern int sad8_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
/*
 * Further int-returning pixel routines (declarations only).
 * pix_norm1 / pix_sum take a single byte pointer plus a line size;
 * sse8 / sse16 use the same five-argument shape as the sad* prototypes.
 * NOTE(review): presumably squared-norm, sum-of-squared-errors and plain
 * pixel sum respectively -- verify against the implementation.
 */
extern int pix_norm1_altivec(uint8_t *pix, int line_size);
extern int sse8_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
extern int sse16_altivec(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h);
extern int pix_sum_altivec(uint8_t *pix, int line_size);
37 | extern void diff_pixels_altivec(DCTELEM* block, const uint8_t* s1, const uint8_t* s2, int stride);
|
---|
38 | extern void get_pixels_altivec(DCTELEM* block, const uint8_t * pixels, int line_size);
|
---|
39 |
|
---|
/*
 * Declaration only.  Takes a destination and a source byte pointer plus `w`.
 * NOTE(review): presumably adds `w` bytes of src into dst -- confirm
 * against the implementation.
 */
extern void add_bytes_altivec(uint8_t *dst, uint8_t *src, int w);
41 | extern void put_pixels_clamped_altivec(const DCTELEM *block, uint8_t *restrict pixels, int line_size);
|
---|
/*
 * put / avg pixel routines (declarations only).  All share one signature:
 * a writable `block`, read-only `pixels`, `line_size` and `h`.
 * NOTE(review): the 8 / 16 and _xy2 / no_rnd suffixes presumably select
 * block width, interpolation and rounding mode -- confirm against the
 * implementation.
 */
extern void put_pixels16_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
extern void avg_pixels16_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
extern void avg_pixels8_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
extern void put_pixels8_xy2_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
extern void put_no_rnd_pixels8_xy2_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
extern void put_pixels16_xy2_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
extern void put_no_rnd_pixels16_xy2_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);
/*
 * Declarations only.  The first argument is typed void * here; the inline
 * marker records that an MpegEncContext is what is meant.
 * NOTE(review): presumably a Hadamard-transformed difference metric over
 * 8x8 / 16-wide blocks -- confirm against the implementation.
 */
extern int hadamard8_diff8x8_altivec(/*MpegEncContext*/ void *s, uint8_t *dst, uint8_t *src, int stride, int h);
extern int hadamard8_diff16_altivec(/*MpegEncContext*/ void *s, uint8_t *dst, uint8_t *src, int stride, int h);
/*
 * Declaration only.  Writable `block`, read-only `pixels`, `line_size`
 * and `h`.
 */
extern void avg_pixels8_xy2_altivec(uint8_t *block, const uint8_t *pixels, int line_size, int h);

/*
 * Declaration only.  Takes destination and source byte pointers, a stride,
 * `h`, and three further int parameters (`x16`, `y16`, `rounder`).
 * NOTE(review): presumably single-point global motion compensation with
 * 1/16-pel offsets -- confirm against the implementation.
 */
extern void gmc1_altivec(uint8_t *dst, uint8_t *src, int stride, int h, int x16, int y16, int rounder);

/*
 * Declaration only; takes no arguments and returns an int.
 * NOTE(review): presumably a runtime AltiVec capability probe (non-zero
 * when available) -- confirm against the implementation.
 */
extern int has_altivec(void);

// Building blocks for register permutation vectors (vcprm).
// Each WORD_x expands to four consecutive byte indices:
// WORD_0..WORD_3 cover 0x00-0x0f, WORD_s0..WORD_s3 cover 0x10-0x1f
// (the 's' marks words taken from the _s_econd vector).
#define WORD_0 0x00,0x01,0x02,0x03
#define WORD_1 0x04,0x05,0x06,0x07
#define WORD_2 0x08,0x09,0x0a,0x0b
#define WORD_3 0x0c,0x0d,0x0e,0x0f
#define WORD_s0 0x10,0x11,0x12,0x13
#define WORD_s1 0x14,0x15,0x16,0x17
#define WORD_s2 0x18,0x19,0x1a,0x1b
#define WORD_s3 0x1c,0x1d,0x1e,0x1f

// vcprm(a,b,c,d) pastes each argument onto WORD_ and emits the resulting
// 16 byte indices as a const vector unsigned char literal.  The literal is
// spelled with parentheses when CONFIG_DARWIN is defined and with braces
// otherwise; the element list is the same in both spellings.
#ifdef CONFIG_DARWIN
#define vcprm(a,b,c,d) (const vector unsigned char)(WORD_ ## a, WORD_ ## b, WORD_ ## c, WORD_ ## d)
#else
#define vcprm(a,b,c,d) (const vector unsigned char){WORD_ ## a, WORD_ ## b, WORD_ ## c, WORD_ ## d}
#endif

// vcprmle is used to keep the same index as in the SSE version.
// It is vcprm with the argument order reversed
// ('le' is Little Endian).
#define vcprmle(a,b,c,d) vcprm(d,c,b,a)

// Building blocks for inverse/identity vectors (vcii).
// n is _n_egative (-1.), p is _p_ositive (1.)
#define FLOAT_n -1.
#define FLOAT_p 1.


// vcii(a,b,c,d) pastes each argument (n or p) onto FLOAT_ and emits the
// four resulting constants as a const vector float literal.  The literal is
// spelled with parentheses when CONFIG_DARWIN is defined and with braces
// otherwise; the element list is the same in both spellings.
#ifdef CONFIG_DARWIN
#define vcii(a,b,c,d) (const vector float)(FLOAT_ ## a, FLOAT_ ## b, FLOAT_ ## c, FLOAT_ ## d)
#else
#define vcii(a,b,c,d) (const vector float){FLOAT_ ## a, FLOAT_ ## b, FLOAT_ ## c, FLOAT_ ## d}
#endif

91 | #else /* HAVE_ALTIVEC */
|
---|
92 | #ifdef ALTIVEC_USE_REFERENCE_C_CODE
|
---|
93 | #error "I can't use ALTIVEC_USE_REFERENCE_C_CODE if I don't use HAVE_ALTIVEC"
|
---|
94 | #endif /* ALTIVEC_USE_REFERENCE_C_CODE */
|
---|
95 | #endif /* HAVE_ALTIVEC */
|
---|
96 |
|
---|
97 | #endif /* _DSPUTIL_ALTIVEC_ */
|
---|