Commit | Line | Data |
---|---|---|
2ba45a60 DM |
1 | /* |
2 | * Copyright (c) 2010 Alex Converse <alex.converse@gmail.com> | |
3 | * | |
4 | * This file is part of FFmpeg. | |
5 | * | |
6 | * FFmpeg is free software; you can redistribute it and/or | |
7 | * modify it under the terms of the GNU Lesser General Public | |
8 | * License as published by the Free Software Foundation; either | |
9 | * version 2.1 of the License, or (at your option) any later version. | |
10 | * | |
11 | * FFmpeg is distributed in the hope that it will be useful, | |
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
14 | * Lesser General Public License for more details. | |
15 | * | |
16 | * You should have received a copy of the GNU Lesser General Public | |
17 | * License along with FFmpeg; if not, write to the Free Software | |
18 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | |
19 | */ | |
20 | ||
21 | #include "config.h" | |
22 | #include "libavutil/attributes.h" | |
23 | #include "aacpsdsp.h" | |
24 | ||
25 | static void ps_add_squares_c(float *dst, const float (*src)[2], int n) | |
26 | { | |
27 | int i; | |
28 | for (i = 0; i < n; i++) | |
29 | dst[i] += src[i][0] * src[i][0] + src[i][1] * src[i][1]; | |
30 | } | |
31 | ||
32 | static void ps_mul_pair_single_c(float (*dst)[2], float (*src0)[2], float *src1, | |
33 | int n) | |
34 | { | |
35 | int i; | |
36 | for (i = 0; i < n; i++) { | |
37 | dst[i][0] = src0[i][0] * src1[i]; | |
38 | dst[i][1] = src0[i][1] * src1[i]; | |
39 | } | |
40 | } | |
41 | ||
42 | static void ps_hybrid_analysis_c(float (*out)[2], float (*in)[2], | |
43 | const float (*filter)[8][2], | |
44 | int stride, int n) | |
45 | { | |
46 | int i, j; | |
47 | ||
48 | for (i = 0; i < n; i++) { | |
49 | float sum_re = filter[i][6][0] * in[6][0]; | |
50 | float sum_im = filter[i][6][0] * in[6][1]; | |
51 | ||
52 | for (j = 0; j < 6; j++) { | |
53 | float in0_re = in[j][0]; | |
54 | float in0_im = in[j][1]; | |
55 | float in1_re = in[12-j][0]; | |
56 | float in1_im = in[12-j][1]; | |
57 | sum_re += filter[i][j][0] * (in0_re + in1_re) - | |
58 | filter[i][j][1] * (in0_im - in1_im); | |
59 | sum_im += filter[i][j][0] * (in0_im + in1_im) + | |
60 | filter[i][j][1] * (in0_re - in1_re); | |
61 | } | |
62 | out[i * stride][0] = sum_re; | |
63 | out[i * stride][1] = sum_im; | |
64 | } | |
65 | } | |
66 | ||
67 | static void ps_hybrid_analysis_ileave_c(float (*out)[32][2], float L[2][38][64], | |
68 | int i, int len) | |
69 | { | |
70 | int j; | |
71 | ||
72 | for (; i < 64; i++) { | |
73 | for (j = 0; j < len; j++) { | |
74 | out[i][j][0] = L[0][j][i]; | |
75 | out[i][j][1] = L[1][j][i]; | |
76 | } | |
77 | } | |
78 | } | |
79 | ||
80 | static void ps_hybrid_synthesis_deint_c(float out[2][38][64], | |
81 | float (*in)[32][2], | |
82 | int i, int len) | |
83 | { | |
84 | int n; | |
85 | ||
86 | for (; i < 64; i++) { | |
87 | for (n = 0; n < len; n++) { | |
88 | out[0][n][i] = in[i][n][0]; | |
89 | out[1][n][i] = in[i][n][1]; | |
90 | } | |
91 | } | |
92 | } | |
93 | ||
94 | static void ps_decorrelate_c(float (*out)[2], float (*delay)[2], | |
95 | float (*ap_delay)[PS_QMF_TIME_SLOTS + PS_MAX_AP_DELAY][2], | |
96 | const float phi_fract[2], const float (*Q_fract)[2], | |
97 | const float *transient_gain, | |
98 | float g_decay_slope, | |
99 | int len) | |
100 | { | |
101 | static const float a[] = { 0.65143905753106f, | |
102 | 0.56471812200776f, | |
103 | 0.48954165955695f }; | |
104 | float ag[PS_AP_LINKS]; | |
105 | int m, n; | |
106 | ||
107 | for (m = 0; m < PS_AP_LINKS; m++) | |
108 | ag[m] = a[m] * g_decay_slope; | |
109 | ||
110 | for (n = 0; n < len; n++) { | |
111 | float in_re = delay[n][0] * phi_fract[0] - delay[n][1] * phi_fract[1]; | |
112 | float in_im = delay[n][0] * phi_fract[1] + delay[n][1] * phi_fract[0]; | |
113 | for (m = 0; m < PS_AP_LINKS; m++) { | |
114 | float a_re = ag[m] * in_re; | |
115 | float a_im = ag[m] * in_im; | |
116 | float link_delay_re = ap_delay[m][n+2-m][0]; | |
117 | float link_delay_im = ap_delay[m][n+2-m][1]; | |
118 | float fractional_delay_re = Q_fract[m][0]; | |
119 | float fractional_delay_im = Q_fract[m][1]; | |
120 | float apd_re = in_re; | |
121 | float apd_im = in_im; | |
122 | in_re = link_delay_re * fractional_delay_re - | |
123 | link_delay_im * fractional_delay_im - a_re; | |
124 | in_im = link_delay_re * fractional_delay_im + | |
125 | link_delay_im * fractional_delay_re - a_im; | |
126 | ap_delay[m][n+5][0] = apd_re + ag[m] * in_re; | |
127 | ap_delay[m][n+5][1] = apd_im + ag[m] * in_im; | |
128 | } | |
129 | out[n][0] = transient_gain[n] * in_re; | |
130 | out[n][1] = transient_gain[n] * in_im; | |
131 | } | |
132 | } | |
133 | ||
134 | static void ps_stereo_interpolate_c(float (*l)[2], float (*r)[2], | |
135 | float h[2][4], float h_step[2][4], | |
136 | int len) | |
137 | { | |
138 | float h0 = h[0][0]; | |
139 | float h1 = h[0][1]; | |
140 | float h2 = h[0][2]; | |
141 | float h3 = h[0][3]; | |
142 | float hs0 = h_step[0][0]; | |
143 | float hs1 = h_step[0][1]; | |
144 | float hs2 = h_step[0][2]; | |
145 | float hs3 = h_step[0][3]; | |
146 | int n; | |
147 | ||
148 | for (n = 0; n < len; n++) { | |
149 | //l is s, r is d | |
150 | float l_re = l[n][0]; | |
151 | float l_im = l[n][1]; | |
152 | float r_re = r[n][0]; | |
153 | float r_im = r[n][1]; | |
154 | h0 += hs0; | |
155 | h1 += hs1; | |
156 | h2 += hs2; | |
157 | h3 += hs3; | |
158 | l[n][0] = h0 * l_re + h2 * r_re; | |
159 | l[n][1] = h0 * l_im + h2 * r_im; | |
160 | r[n][0] = h1 * l_re + h3 * r_re; | |
161 | r[n][1] = h1 * l_im + h3 * r_im; | |
162 | } | |
163 | } | |
164 | ||
165 | static void ps_stereo_interpolate_ipdopd_c(float (*l)[2], float (*r)[2], | |
166 | float h[2][4], float h_step[2][4], | |
167 | int len) | |
168 | { | |
169 | float h00 = h[0][0], h10 = h[1][0]; | |
170 | float h01 = h[0][1], h11 = h[1][1]; | |
171 | float h02 = h[0][2], h12 = h[1][2]; | |
172 | float h03 = h[0][3], h13 = h[1][3]; | |
173 | float hs00 = h_step[0][0], hs10 = h_step[1][0]; | |
174 | float hs01 = h_step[0][1], hs11 = h_step[1][1]; | |
175 | float hs02 = h_step[0][2], hs12 = h_step[1][2]; | |
176 | float hs03 = h_step[0][3], hs13 = h_step[1][3]; | |
177 | int n; | |
178 | ||
179 | for (n = 0; n < len; n++) { | |
180 | //l is s, r is d | |
181 | float l_re = l[n][0]; | |
182 | float l_im = l[n][1]; | |
183 | float r_re = r[n][0]; | |
184 | float r_im = r[n][1]; | |
185 | h00 += hs00; | |
186 | h01 += hs01; | |
187 | h02 += hs02; | |
188 | h03 += hs03; | |
189 | h10 += hs10; | |
190 | h11 += hs11; | |
191 | h12 += hs12; | |
192 | h13 += hs13; | |
193 | ||
194 | l[n][0] = h00 * l_re + h02 * r_re - h10 * l_im - h12 * r_im; | |
195 | l[n][1] = h00 * l_im + h02 * r_im + h10 * l_re + h12 * r_re; | |
196 | r[n][0] = h01 * l_re + h03 * r_re - h11 * l_im - h13 * r_im; | |
197 | r[n][1] = h01 * l_im + h03 * r_im + h11 * l_re + h13 * r_re; | |
198 | } | |
199 | } | |
200 | ||
201 | av_cold void ff_psdsp_init(PSDSPContext *s) | |
202 | { | |
203 | s->add_squares = ps_add_squares_c; | |
204 | s->mul_pair_single = ps_mul_pair_single_c; | |
205 | s->hybrid_analysis = ps_hybrid_analysis_c; | |
206 | s->hybrid_analysis_ileave = ps_hybrid_analysis_ileave_c; | |
207 | s->hybrid_synthesis_deint = ps_hybrid_synthesis_deint_c; | |
208 | s->decorrelate = ps_decorrelate_c; | |
209 | s->stereo_interpolate[0] = ps_stereo_interpolate_c; | |
210 | s->stereo_interpolate[1] = ps_stereo_interpolate_ipdopd_c; | |
211 | ||
212 | if (ARCH_ARM) | |
213 | ff_psdsp_init_arm(s); | |
214 | if (ARCH_MIPS) | |
215 | ff_psdsp_init_mips(s); | |
216 | } |