Go to most recent revision | Details | Last modification | View Log | RSS feed
Rev | Author | Line No. | Line |
---|---|---|---|
4349 | Serge | 1 | /* |
2 | * This file is part of FFmpeg. |
||
3 | * |
||
4 | * FFmpeg is free software; you can redistribute it and/or |
||
5 | * modify it under the terms of the GNU Lesser General Public |
||
6 | * License as published by the Free Software Foundation; either |
||
7 | * version 2.1 of the License, or (at your option) any later version. |
||
8 | * |
||
9 | * FFmpeg is distributed in the hope that it will be useful, |
||
10 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
||
11 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
||
12 | * Lesser General Public License for more details. |
||
13 | * |
||
14 | * You should have received a copy of the GNU Lesser General Public |
||
15 | * License along with FFmpeg; if not, write to the Free Software |
||
16 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
||
17 | */ |
||
18 | |||
19 | #ifndef AVUTIL_FLOAT_DSP_H |
||
20 | #define AVUTIL_FLOAT_DSP_H |
||
21 | |||
22 | #include "config.h" |
||
23 | |||
24 | typedef struct AVFloatDSPContext { /* table of function pointers for float/double vector operations */ |
||
25 | /** |
||
26 | * Calculate the product of two vectors of floats and store the result in |
||
27 | * a vector of floats. |
||
28 | * |
||
29 | * @param dst output vector |
||
30 | * constraints: 32-byte aligned |
||
31 | * @param src0 first input vector |
||
32 | * constraints: 32-byte aligned |
||
33 | * @param src1 second input vector |
||
34 | * constraints: 32-byte aligned |
||
35 | * @param len number of elements in the input |
||
36 | * constraints: multiple of 16 |
||
37 | */ |
||
38 | void (*vector_fmul)(float *dst, const float *src0, const float *src1, |
||
39 | int len); |
||
40 | |||
41 | /** |
||
42 | * Multiply a vector of floats by a scalar float and add to |
||
43 | * destination vector. Source and destination vectors must |
||
44 | * overlap exactly or not at all. |
||
45 | * |
||
46 | * @param dst result vector |
||
47 | * constraints: 32-byte aligned |
||
48 | * @param src input vector |
||
49 | * constraints: 32-byte aligned |
||
50 | * @param mul scalar value |
||
51 | * @param len length of vector |
||
52 | * constraints: multiple of 16 |
||
53 | */ |
||
54 | void (*vector_fmac_scalar)(float *dst, const float *src, float mul, |
||
55 | int len); |
||
56 | |||
57 | /** |
||
58 | * Multiply a vector of floats by a scalar float. Source and |
||
59 | * destination vectors must overlap exactly or not at all. |
||
60 | * |
||
61 | * @param dst result vector |
||
62 | * constraints: 16-byte aligned |
||
63 | * @param src input vector |
||
64 | * constraints: 16-byte aligned |
||
65 | * @param mul scalar value |
||
66 | * @param len length of vector |
||
67 | * constraints: multiple of 4 |
||
68 | */ |
||
69 | void (*vector_fmul_scalar)(float *dst, const float *src, float mul, |
||
70 | int len); |
||
71 | |||
72 | /** |
||
73 | * Multiply a vector of doubles by a scalar double. Source and |
||
74 | * destination vectors must overlap exactly or not at all. |
||
75 | * |
||
76 | * @param dst result vector |
||
77 | * constraints: 32-byte aligned |
||
78 | * @param src input vector |
||
79 | * constraints: 32-byte aligned |
||
80 | * @param mul scalar value |
||
81 | * @param len length of vector |
||
82 | * constraints: multiple of 8 |
||
83 | */ |
||
84 | void (*vector_dmul_scalar)(double *dst, const double *src, double mul, |
||
85 | int len); |
||
86 | |||
87 | /** |
||
88 | * Overlap/add with window function. |
||
89 | * Used primarily by MDCT-based audio codecs. |
||
90 | * Source and destination vectors must overlap exactly or not at all. |
||
91 | * |
||
92 | * @param dst result vector |
||
93 | * constraints: 16-byte aligned |
||
94 | * @param src0 first source vector |
||
95 | * constraints: 16-byte aligned |
||
96 | * @param src1 second source vector |
||
97 | * constraints: 16-byte aligned |
||
98 | * @param win half-window vector |
||
99 | * constraints: 16-byte aligned |
||
100 | * @param len length of vector |
||
101 | * constraints: multiple of 4 |
||
102 | */ |
||
103 | void (*vector_fmul_window)(float *dst, const float *src0, |
||
104 | const float *src1, const float *win, int len); |
||
105 | |||
106 | /** |
||
107 | * Calculate the product of two vectors of floats, add a third vector of |
||
108 | * floats and store the result in a vector of floats. |
||
109 | * |
||
110 | * @param dst output vector |
||
111 | * constraints: 32-byte aligned |
||
112 | * @param src0 first input vector |
||
113 | * constraints: 32-byte aligned |
||
114 | * @param src1 second input vector |
||
115 | * constraints: 32-byte aligned |
||
116 | * @param src2 third input vector |
||
117 | * constraints: 32-byte aligned |
||
118 | * @param len number of elements in the input |
||
119 | * constraints: multiple of 16 |
||
120 | */ |
||
121 | void (*vector_fmul_add)(float *dst, const float *src0, const float *src1, |
||
122 | const float *src2, int len); |
||
123 | |||
124 | /** |
||
125 | * Calculate the product of two vectors of floats, and store the result |
||
126 | * in a vector of floats. The second vector of floats is iterated over |
||
127 | * in reverse order. |
||
128 | * |
||
129 | * @param dst output vector |
||
130 | * constraints: 32-byte aligned |
||
131 | * @param src0 first input vector |
||
132 | * constraints: 32-byte aligned |
||
133 | * @param src1 second input vector |
||
134 | * constraints: 32-byte aligned |
||
135 | * note: this is the vector that is iterated |
||
136 | * over in reverse order |
||
137 | * @param len number of elements in the input |
||
138 | * constraints: multiple of 16 |
||
139 | */ |
||
140 | void (*vector_fmul_reverse)(float *dst, const float *src0, |
||
141 | const float *src1, int len); |
||
142 | |||
143 | /** |
||
144 | * Calculate the sum and difference of two vectors of floats. |
||
145 | * |
||
146 | * @param v1 first input vector, sum output, 16-byte aligned |
||
147 | * @param v2 second input vector, difference output, 16-byte aligned |
||
148 | * @param len length of vectors, multiple of 4 |
||
149 | */ |
||
150 | void (*butterflies_float)(float *av_restrict v1, float *av_restrict v2, int len); |
||
151 | |||
152 | /** |
||
153 | * Calculate the scalar product of two vectors of floats. |
||
154 | * |
||
155 | * @param v1 first vector, 16-byte aligned |
||
156 | * @param v2 second vector, 16-byte aligned |
||
157 | * @param len length of vectors, multiple of 4 |
||
158 | * |
||
159 | * @return sum of elementwise products |
||
160 | */ |
||
161 | float (*scalarproduct_float)(const float *v1, const float *v2, int len); |
||
162 | } AVFloatDSPContext; |
||
163 | |||
164 | /** |
||
165 | * Return the scalar product of two vectors of floats. |
||
166 | * |
||
167 | * @param v1 first input vector |
||
168 | * @param v2 second input vector |
||
169 | * @param len number of elements |
||
170 | * |
||
171 | * @return sum of elementwise products |
||
172 | */ |
||
173 | float avpriv_scalarproduct_float_c(const float *v1, const float *v2, int len); |
||
174 | |||
175 | /** |
||
176 | * Initialize a float DSP context. |
||
177 | * |
||
178 | * @param fdsp float DSP context to initialize |
||
179 | * @param strict if non-zero, avoid using functions which may not be IEEE-754 compliant |
||
180 | */ |
||
181 | void avpriv_float_dsp_init(AVFloatDSPContext *fdsp, int strict); |
||
182 | |||
183 | |||
184 | void ff_float_dsp_init_arm(AVFloatDSPContext *fdsp); /* NOTE(review): presumably per-architecture init hooks (judging by the name suffixes); defined outside this header */ |
||
185 | void ff_float_dsp_init_ppc(AVFloatDSPContext *fdsp, int strict); /* the only one of these four that also takes the strict flag */ |
||
186 | void ff_float_dsp_init_x86(AVFloatDSPContext *fdsp); |
||
187 | void ff_float_dsp_init_mips(AVFloatDSPContext *fdsp); |
||
188 | |||
189 | #endif /* AVUTIL_FLOAT_DSP_H */ |