[deb_ffmpeg.git] / ffmpeg / libavcodec / acelp_pitch_delay.h

/*
 * gain code, gain pitch and pitch delay decoding
 *
 * Copyright (c) 2008 Vladimir Voroshilov
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#ifndef AVCODEC_ACELP_PITCH_DELAY_H
#define AVCODEC_ACELP_PITCH_DELAY_H

#include <stdint.h>

#include "audiodsp.h"

#define PITCH_DELAY_MIN             20
#define PITCH_DELAY_MAX             143

/**
 * @brief Decode pitch delay of the first subframe encoded by 8 bits with 1/3
 *        resolution.
 * @param ac_index adaptive codebook index (8 bits)
 *
 * @return pitch delay in 1/3 units
 *
 * Pitch delay is coded:
 *    with 1/3 resolution, 19  < pitch_delay <  85
 *    integers only,       85 <= pitch_delay <= 143
 */
int ff_acelp_decode_8bit_to_1st_delay3(int ac_index);

/**
 * @brief Decode pitch delay of the second subframe encoded by 5 or 6 bits
 *        with 1/3 precision.
 * @param ac_index adaptive codebook index (5 or 6 bits)
 * @param pitch_delay_min lower bound (integer) of pitch delay interval
 *                      for second subframe
 *
 * @return pitch delay in 1/3 units
 *
 * Pitch delay is coded:
 *    with 1/3 resolution, -6 < pitch_delay - int(prev_pitch_delay) < 5
 *
 * @remark The routine is used in G.729 @@8k, AMR @@10.2k, AMR @@7.95k,
 *         AMR @@7.4k for the second subframe.
 */
int ff_acelp_decode_5_6_bit_to_2nd_delay3(
        int ac_index,
        int pitch_delay_min);

/**
 * @brief Decode pitch delay with 1/3 precision.
 * @param ac_index adaptive codebook index (4 bits)
 * @param pitch_delay_min lower bound (integer) of pitch delay interval for
 *                      second subframe
 *
 * @return pitch delay in 1/3 units
 *
 * Pitch delay is coded:
 *    integers only,          -6  < pitch_delay - int(prev_pitch_delay) <= -2
 *    with 1/3 resolution,    -2  < pitch_delay - int(prev_pitch_delay) <  1
 *    integers only,           1 <= pitch_delay - int(prev_pitch_delay) <  5
 *
 * @remark The routine is used in G.729 @@6.4k, AMR @@6.7k, AMR @@5.9k,
 *         AMR @@5.15k, AMR @@4.75k for the second subframe.
 */
int ff_acelp_decode_4bit_to_2nd_delay3(
        int ac_index,
        int pitch_delay_min);

/**
 * @brief Decode pitch delay of the first subframe encoded by 9 bits
 *        with 1/6 precision.
 * @param ac_index adaptive codebook index (9 bits)
 *
 * @return pitch delay in 1/6 units
 *
 * Pitch delay is coded:
 *    with 1/6 resolution,  17  < pitch_delay <  95
 *    integers only,        95 <= pitch_delay <= 143
 *
 * @remark The routine is used in AMR @@12.2k for the first and third subframes.
 */
int ff_acelp_decode_9bit_to_1st_delay6(int ac_index);

/**
 * @brief Decode pitch delay of the second subframe encoded by 6 bits
 *        with 1/6 precision.
 * @param ac_index adaptive codebook index (6 bits)
 * @param pitch_delay_min lower bound (integer) of pitch delay interval for
 *                      second subframe
 *
 * @return pitch delay in 1/6 units
 *
 * Pitch delay is coded:
 *    with 1/6 resolution, -6 < pitch_delay - int(prev_pitch_delay) < 5
 *
 * @remark The routine is used in AMR @@12.2k for the second and fourth subframes.
 */
int ff_acelp_decode_6bit_to_2nd_delay6(
        int ac_index,
        int pitch_delay_min);

/**
 * @brief Update past quantized energies
 * @param[in,out]  quant_energy  past quantized energies (5.10)
 * @param gain_corr_factor gain correction factor
 * @param log2_ma_pred_order log2() of MA prediction order
 * @param erasure frame erasure flag
 *
 * If frame erasure flag is not equal to zero, memory is updated with
 * averaged energy, attenuated by 4dB:
 *     max(avg(quant_energy[i])-4, -14), i=0,ma_pred_order
 *
 * In normal mode memory is updated with
 *     Er - Ep = 20 * log10(gain_corr_factor)
 *
 * @remark The routine is used in G.729 and AMR (all modes).
 */
void ff_acelp_update_past_gain(
        int16_t* quant_energy,
        int gain_corr_factor,
        int log2_ma_pred_order,
        int erasure);

/**
 * @brief Decode the adaptive codebook gain and add
 *        correction (4.1.5 and 3.9.1 of G.729).
 * @param adsp initialized audio DSP context
 * @param gain_corr_factor gain correction factor (2.13)
 * @param fc_v fixed-codebook vector (2.13)
 * @param mr_energy mean innovation energy and fixed-point correction (7.13)
 * @param[in,out]  quant_energy  past quantized energies (5.10)
 * @param subframe_size length of subframe
 *
 * @return quantized fixed-codebook gain (14.1)
 *
 * The routine implements equations 69, 66 and 71 of the G.729 specification (3.9.1)
 *
 *    Em   - mean innovation energy (dB, constant, depends on decoding algorithm)
 *    Ep   - mean-removed predicted energy (dB)
 *    Er   - mean-removed innovation energy (dB)
 *    Ei   - mean energy of the fixed-codebook contribution (dB)
 *    N    - subframe_size
 *    M    - MA (Moving Average) prediction order
 *    gc   - fixed-codebook gain
 *    gc_p - predicted fixed-codebook gain
 *
 *    Fixed codebook gain is computed using predicted gain gc_p and
 *    correction factor gain_corr_factor as shown below:
 *
 *        gc = gc_p * gain_corr_factor
 *
 *    The predicted fixed codebook gain gc_p is found by predicting
 *    the energy of the fixed-codebook contribution from the energy
 *    of previous fixed-codebook contributions.
 *
 *        mean = 1/N * sum(i,0,N){ fc_v[i] * fc_v[i] }
 *
 *        Ei = 10log(mean)
 *
 *        Er = 10log(1/N * gc^2 * mean) - Em = 20log(gc) + Ei - Em
 *
 *    Replacing Er with Ep and gc with gc_p we will receive:
 *
 *        Ep = 10log(1/N * gc_p^2 * mean) - Em = 20log(gc_p) + Ei - Em
 *
 *    and from above:
 *
 *        gc_p = 10^((Ep - Ei + Em) / 20)
 *
 *    Ep is predicted using past energies and prediction coefficients:
 *
 *        Ep = sum(i,0,M){ ma_prediction_coeff[i] * quant_energy[i] }
 *
 *    gc_p in fixed-point arithmetic is calculated as following:
 *
 *        mean = 1/N * sum(i,0,N){ (fc_v[i] / 2^13) * (fc_v[i] / 2^13) } =
 *        = 1/N * sum(i,0,N) { fc_v[i] * fc_v[i] } / 2^26
 *
 *        Ei = 10log(mean) = -10log(N) - 10log(2^26) +
 *        + 10log(sum(i,0,N) { fc_v[i] * fc_v[i] })
 *
 *        Ep - Ei + Em = Ep + Em + 10log(N) + 10log(2^26) -
 *        - 10log(sum(i,0,N) { fc_v[i] * fc_v[i] }) =
 *        = Ep + mr_energy - 10log(sum(i,0,N) { fc_v[i] * fc_v[i] })
 *
 *        gc_p = 10 ^ ((Ep - Ei + Em) / 20) =
 *        = 2 ^ (3.3219 * (Ep - Ei + Em) / 20) = 2 ^ (0.166 * (Ep - Ei + Em))
 *
 *    where
 *
 *        mr_energy = Em + 10log(N) + 10log(2^26)
 *
 * @remark The routine is used in G.729 and AMR (all modes).
 */
int16_t ff_acelp_decode_gain_code(
    AudioDSPContext *adsp,
    int gain_corr_factor,
    const int16_t* fc_v,
    int mr_energy,
    const int16_t* quant_energy,
    const int16_t* ma_prediction_coeff,
    int subframe_size,
    int max_pred_order);

/**
 * Calculate fixed gain (part of section 6.1.3 of AMR spec)
 *
 * @param fixed_gain_factor gain correction factor
 * @param fixed_mean_energy mean decoded algebraic codebook vector energy
 * @param prediction_error vector of the quantified predictor errors of
 *        the four previous subframes. It is updated by this function.
 * @param energy_mean desired mean innovation energy
 * @param pred_table table of four moving average coefficients
 */
float ff_amr_set_fixed_gain(float fixed_gain_factor, float fixed_mean_energy,
                            float *prediction_error, float energy_mean,
                            const float *pred_table);


/**
 * Decode the adaptive codebook index to the integer and fractional parts
 * of the pitch lag for one subframe at 1/3 fractional precision.
 *
 * The choice of pitch lag is described in 3GPP TS 26.090 section 5.6.1.
 *
 * @param lag_int             integer part of pitch lag of the current subframe
 * @param lag_frac            fractional part of pitch lag of the current subframe
 * @param pitch_index         parsed adaptive codebook (pitch) index
 * @param prev_lag_int        integer part of pitch lag for the previous subframe
 * @param subframe            current subframe number
 * @param third_as_first      treat the third frame the same way as the first
 */
void ff_decode_pitch_lag(int *lag_int, int *lag_frac, int pitch_index,
                         const int prev_lag_int, const int subframe,
                         int third_as_first, int resolution);

#endif /* AVCODEC_ACELP_PITCH_DELAY_H */
Commit	Line	Data
2ba45a60 DM	1	/*
	2	* gain code, gain pitch and pitch delay decoding
	3	*
	4	* Copyright (c) 2008 Vladimir Voroshilov
	5	*
	6	* This file is part of FFmpeg.
	7	*
	8	* FFmpeg is free software; you can redistribute it and/or
	9	* modify it under the terms of the GNU Lesser General Public
	10	* License as published by the Free Software Foundation; either
	11	* version 2.1 of the License, or (at your option) any later version.
	12	*
	13	* FFmpeg is distributed in the hope that it will be useful,
	14	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	15	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
	16	* Lesser General Public License for more details.
	17	*
	18	* You should have received a copy of the GNU Lesser General Public
	19	* License along with FFmpeg; if not, write to the Free Software
	20	* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
	21	*/
	22
	23	#ifndef AVCODEC_ACELP_PITCH_DELAY_H
	24	#define AVCODEC_ACELP_PITCH_DELAY_H
	25
	26	#include <stdint.h>
	27
	28	#include "audiodsp.h"
	29
	30	#define PITCH_DELAY_MIN 20
	31	#define PITCH_DELAY_MAX 143
	32
	33	/**
	34	* @brief Decode pitch delay of the first subframe encoded by 8 bits with 1/3
	35	* resolution.
	36	* @param ac_index adaptive codebook index (8 bits)
	37	*
	38	* @return pitch delay in 1/3 units
	39	*
	40	* Pitch delay is coded:
	41	* with 1/3 resolution, 19 < pitch_delay < 85
	42	* integers only, 85 <= pitch_delay <= 143
	43	*/
	44	int ff_acelp_decode_8bit_to_1st_delay3(int ac_index);
	45
	46	/**
	47	* @brief Decode pitch delay of the second subframe encoded by 5 or 6 bits
	48	* with 1/3 precision.
	49	* @param ac_index adaptive codebook index (5 or 6 bits)
	50	* @param pitch_delay_min lower bound (integer) of pitch delay interval
	51	* for second subframe
	52	*
	53	* @return pitch delay in 1/3 units
	54	*
	55	* Pitch delay is coded:
	56	* with 1/3 resolution, -6 < pitch_delay - int(prev_pitch_delay) < 5
	57	*
	58	* @remark The routine is used in G.729 @@8k, AMR @@10.2k, AMR @@7.95k,
	59	* AMR @@7.4k for the second subframe.
	60	*/
	61	int ff_acelp_decode_5_6_bit_to_2nd_delay3(
	62	int ac_index,
	63	int pitch_delay_min);
	64
65	/**
66	* @brief Decode pitch delay with 1/3 precision.
67	* @param ac_index adaptive codebook index (4 bits)
68	* @param pitch_delay_min lower bound (integer) of pitch delay interval for
69	* second subframe
70	*
71	* @return pitch delay in 1/3 units
72	*
73	* Pitch delay is coded:
74	* integers only, -6 < pitch_delay - int(prev_pitch_delay) <= -2
75	* with 1/3 resolution, -2 < pitch_delay - int(prev_pitch_delay) < 1
76	* integers only, 1 <= pitch_delay - int(prev_pitch_delay) < 5
77	*
78	* @remark The routine is used in G.729 @@6.4k, AMR @@6.7k, AMR @@5.9k,
79	* AMR @@5.15k, AMR @@4.75k for the second subframe.
80	*/
81	int ff_acelp_decode_4bit_to_2nd_delay3(
82	int ac_index,
83	int pitch_delay_min);
84
85	/**
86	* @brief Decode pitch delay of the first subframe encoded by 9 bits
87	* with 1/6 precision.
88	* @param ac_index adaptive codebook index (9 bits)
89	*
90	* @return pitch delay in 1/6 units
91	*
92	* Pitch delay is coded:
93	* with 1/6 resolution, 17 < pitch_delay < 95
94	* integers only, 95 <= pitch_delay <= 143
95	*
96	* @remark The routine is used in AMR @@12.2k for the first and third subframes.
97	*/
98	int ff_acelp_decode_9bit_to_1st_delay6(int ac_index);
99
100	/**
101	* @brief Decode pitch delay of the second subframe encoded by 6 bits
102	* with 1/6 precision.
103	* @param ac_index adaptive codebook index (6 bits)
104	* @param pitch_delay_min lower bound (integer) of pitch delay interval for
105	* second subframe
106	*
107	* @return pitch delay in 1/6 units
108	*
109	* Pitch delay is coded:
110	* with 1/6 resolution, -6 < pitch_delay - int(prev_pitch_delay) < 5
111	*
112	* @remark The routine is used in AMR @@12.2k for the second and fourth subframes.
113	*/
114	int ff_acelp_decode_6bit_to_2nd_delay6(
115	int ac_index,
116	int pitch_delay_min);
117
118	/**
119	* @brief Update past quantized energies
120	* @param[in,out] quant_energy past quantized energies (5.10)
121	* @param gain_corr_factor gain correction factor
122	* @param log2_ma_pred_order log2() of MA prediction order
123	* @param erasure frame erasure flag
124	*
125	* If frame erasure flag is not equal to zero, memory is updated with
126	* averaged energy, attenuated by 4dB:
127	* max(avg(quant_energy[i])-4, -14), i=0,ma_pred_order
128	*
129	* In normal mode memory is updated with
130	* Er - Ep = 20 * log10(gain_corr_factor)
131	*
132	* @remark The routine is used in G.729 and AMR (all modes).
133	*/
134	void ff_acelp_update_past_gain(
135	int16_t* quant_energy,
136	int gain_corr_factor,
137	int log2_ma_pred_order,
138	int erasure);
139
140	/**
141	* @brief Decode the adaptive codebook gain and add
142	* correction (4.1.5 and 3.9.1 of G.729).
143	* @param adsp initialized audio DSP context
144	* @param gain_corr_factor gain correction factor (2.13)
145	* @param fc_v fixed-codebook vector (2.13)
146	* @param mr_energy mean innovation energy and fixed-point correction (7.13)
147	* @param[in,out] quant_energy past quantized energies (5.10)
148	* @param subframe_size length of subframe
149	*
150	* @return quantized fixed-codebook gain (14.1)
151	*
152	* The routine implements equations 69, 66 and 71 of the G.729 specification (3.9.1)
153	*
154	* Em - mean innovation energy (dB, constant, depends on decoding algorithm)
155	* Ep - mean-removed predicted energy (dB)
156	* Er - mean-removed innovation energy (dB)
157	* Ei - mean energy of the fixed-codebook contribution (dB)
158	* N - subframe_size
159	* M - MA (Moving Average) prediction order
160	* gc - fixed-codebook gain
161	* gc_p - predicted fixed-codebook gain
162	*
163	* Fixed codebook gain is computed using predicted gain gc_p and
164	* correction factor gain_corr_factor as shown below:
165	*
166	* gc = gc_p * gain_corr_factor
167	*
168	* The predicted fixed codebook gain gc_p is found by predicting
169	* the energy of the fixed-codebook contribution from the energy
170	* of previous fixed-codebook contributions.
171	*
172	* mean = 1/N * sum(i,0,N){ fc_v[i] * fc_v[i] }
173	*
174	* Ei = 10log(mean)
175	*
176	* Er = 10log(1/N * gc^2 * mean) - Em = 20log(gc) + Ei - Em
177	*
178	* Replacing Er with Ep and gc with gc_p we will receive:
179	*
180	* Ep = 10log(1/N * gc_p^2 * mean) - Em = 20log(gc_p) + Ei - Em
181	*
182	* and from above:
183	*
184	* gc_p = 10^((Ep - Ei + Em) / 20)
185	*
186	* Ep is predicted using past energies and prediction coefficients:
187	*
188	* Ep = sum(i,0,M){ ma_prediction_coeff[i] * quant_energy[i] }
189	*
190	* gc_p in fixed-point arithmetic is calculated as following:
191	*
192	* mean = 1/N * sum(i,0,N){ (fc_v[i] / 2^13) * (fc_v[i] / 2^13) } =
193	* = 1/N * sum(i,0,N) { fc_v[i] * fc_v[i] } / 2^26
194	*
195	* Ei = 10log(mean) = -10log(N) - 10log(2^26) +
196	* + 10log(sum(i,0,N) { fc_v[i] * fc_v[i] })
197	*
198	* Ep - Ei + Em = Ep + Em + 10log(N) + 10log(2^26) -
199	* - 10log(sum(i,0,N) { fc_v[i] * fc_v[i] }) =
200	* = Ep + mr_energy - 10log(sum(i,0,N) { fc_v[i] * fc_v[i] })
201	*
202	* gc_p = 10 ^ ((Ep - Ei + Em) / 20) =
203	* = 2 ^ (3.3219 * (Ep - Ei + Em) / 20) = 2 ^ (0.166 * (Ep - Ei + Em))
204	*
205	* where
206	*
207	* mr_energy = Em + 10log(N) + 10log(2^26)
208	*
209	* @remark The routine is used in G.729 and AMR (all modes).
210	*/
211	int16_t ff_acelp_decode_gain_code(
212	AudioDSPContext *adsp,
213	int gain_corr_factor,
214	const int16_t* fc_v,
215	int mr_energy,
216	const int16_t* quant_energy,
217	const int16_t* ma_prediction_coeff,
218	int subframe_size,
219	int max_pred_order);
220
221	/**
222	* Calculate fixed gain (part of section 6.1.3 of AMR spec)
223	*
224	* @param fixed_gain_factor gain correction factor
225	* @param fixed_mean_energy mean decoded algebraic codebook vector energy
226	* @param prediction_error vector of the quantified predictor errors of
227	* the four previous subframes. It is updated by this function.
228	* @param energy_mean desired mean innovation energy
229	* @param pred_table table of four moving average coefficients
230	*/
231	float ff_amr_set_fixed_gain(float fixed_gain_factor, float fixed_mean_energy,
232	float *prediction_error, float energy_mean,
233	const float *pred_table);
234
235
236	/**
237	* Decode the adaptive codebook index to the integer and fractional parts
238	* of the pitch lag for one subframe at 1/3 fractional precision.
239	*
240	* The choice of pitch lag is described in 3GPP TS 26.090 section 5.6.1.
241	*
242	* @param lag_int integer part of pitch lag of the current subframe
243	* @param lag_frac fractional part of pitch lag of the current subframe
244	* @param pitch_index parsed adaptive codebook (pitch) index
245	* @param prev_lag_int integer part of pitch lag for the previous subframe
246	* @param subframe current subframe number
247	* @param third_as_first treat the third frame the same way as the first
248	*/
249	void ff_decode_pitch_lag(int lag_int, int lag_frac, int pitch_index,
250	const int prev_lag_int, const int subframe,
251	int third_as_first, int resolution);
252
253	#endif /* AVCODEC_ACELP_PITCH_DELAY_H */