[deb_ffmpeg.git] / lpc.c

/*
 * LPC utility code
 * Copyright (c) 2006  Justin Ruggles <justin.ruggles@gmail.com>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include "libavutil/common.h"
#include "libavutil/lls.h"

#define LPC_USE_DOUBLE
#include "lpc.h"
#include "libavutil/avassert.h"


/**
 * Apply Welch window function to audio block
 */
static void lpc_apply_welch_window_c(const int32_t *data, int len,
                                     double *w_data)
{
    int i, n2;
    double w;
    double c;

    /* The optimization in commit fa4ed8c does not support odd len.
     * If someone wants odd len extend that change. */
    av_assert2(!(len & 1));

    n2 = (len >> 1);
    c = 2.0 / (len - 1.0);

    w_data+=n2;
      data+=n2;
    for(i=0; i<n2; i++) {
        w = c - n2 + i;
        w = 1.0 - (w * w);
        w_data[-i-1] = data[-i-1] * w;
        w_data[+i  ] = data[+i  ] * w;
    }
}

/**
 * Calculate autocorrelation data from audio samples
 * A Welch window function is applied before calculation.
 */
static void lpc_compute_autocorr_c(const double *data, int len, int lag,
                                   double *autoc)
{
    int i, j;

    for(j=0; j<lag; j+=2){
        double sum0 = 1.0, sum1 = 1.0;
        for(i=j; i<len; i++){
            sum0 += data[i] * data[i-j];
            sum1 += data[i] * data[i-j-1];
        }
        autoc[j  ] = sum0;
        autoc[j+1] = sum1;
    }

    if(j==lag){
        double sum = 1.0;
        for(i=j-1; i<len; i+=2){
            sum += data[i  ] * data[i-j  ]
                 + data[i+1] * data[i-j+1];
        }
        autoc[j] = sum;
    }
}

/**
 * Quantize LPC coefficients
 */
static void quantize_lpc_coefs(double *lpc_in, int order, int precision,
                               int32_t *lpc_out, int *shift, int max_shift, int zero_shift)
{
    int i;
    double cmax, error;
    int32_t qmax;
    int sh;

    /* define maximum levels */
    qmax = (1 << (precision - 1)) - 1;

    /* find maximum coefficient value */
    cmax = 0.0;
    for(i=0; i<order; i++) {
        cmax= FFMAX(cmax, fabs(lpc_in[i]));
    }

    /* if maximum value quantizes to zero, return all zeros */
    if(cmax * (1 << max_shift) < 1.0) {
        *shift = zero_shift;
        memset(lpc_out, 0, sizeof(int32_t) * order);
        return;
    }

    /* calculate level shift which scales max coeff to available bits */
    sh = max_shift;
    while((cmax * (1 << sh) > qmax) && (sh > 0)) {
        sh--;
    }

    /* since negative shift values are unsupported in decoder, scale down
       coefficients instead */
    if(sh == 0 && cmax > qmax) {
        double scale = ((double)qmax) / cmax;
        for(i=0; i<order; i++) {
            lpc_in[i] *= scale;
        }
    }

    /* output quantized coefficients and level shift */
    error=0;
    for(i=0; i<order; i++) {
        error -= lpc_in[i] * (1 << sh);
        lpc_out[i] = av_clip(lrintf(error), -qmax, qmax);
        error -= lpc_out[i];
    }
    *shift = sh;
}

static int estimate_best_order(double *ref, int min_order, int max_order)
{
    int i, est;

    est = min_order;
    for(i=max_order-1; i>=min_order-1; i--) {
        if(ref[i] > 0.10) {
            est = i+1;
            break;
        }
    }
    return est;
}

int ff_lpc_calc_ref_coefs(LPCContext *s,
                          const int32_t *samples, int order, double *ref)
{
    double autoc[MAX_LPC_ORDER + 1];

    s->lpc_apply_welch_window(samples, s->blocksize, s->windowed_samples);
    s->lpc_compute_autocorr(s->windowed_samples, s->blocksize, order, autoc);
    compute_ref_coefs(autoc, order, ref, NULL);

    return order;
}

/**
 * Calculate LPC coefficients for multiple orders
 *
 * @param lpc_type LPC method for determining coefficients,
 *                 see #FFLPCType for details
 */
int ff_lpc_calc_coefs(LPCContext *s,
                      const int32_t *samples, int blocksize, int min_order,
                      int max_order, int precision,
                      int32_t coefs[][MAX_LPC_ORDER], int *shift,
                      enum FFLPCType lpc_type, int lpc_passes,
                      int omethod, int max_shift, int zero_shift)
{
    double autoc[MAX_LPC_ORDER+1];
    double ref[MAX_LPC_ORDER];
    double lpc[MAX_LPC_ORDER][MAX_LPC_ORDER];
    int i, j, pass = 0;
    int opt_order;

    av_assert2(max_order >= MIN_LPC_ORDER && max_order <= MAX_LPC_ORDER &&
           lpc_type > FF_LPC_TYPE_FIXED);
    av_assert0(lpc_type == FF_LPC_TYPE_CHOLESKY || lpc_type == FF_LPC_TYPE_LEVINSON);

    /* reinit LPC context if parameters have changed */
    if (blocksize != s->blocksize || max_order != s->max_order ||
        lpc_type  != s->lpc_type) {
        ff_lpc_end(s);
        ff_lpc_init(s, blocksize, max_order, lpc_type);
    }

    if(lpc_passes <= 0)
        lpc_passes = 2;

    if (lpc_type == FF_LPC_TYPE_LEVINSON || (lpc_type == FF_LPC_TYPE_CHOLESKY && lpc_passes > 1)) {
        s->lpc_apply_welch_window(samples, blocksize, s->windowed_samples);

        s->lpc_compute_autocorr(s->windowed_samples, blocksize, max_order, autoc);

        compute_lpc_coefs(autoc, max_order, &lpc[0][0], MAX_LPC_ORDER, 0, 1);

        for(i=0; i<max_order; i++)
            ref[i] = fabs(lpc[i][i]);

        pass++;
    }

    if (lpc_type == FF_LPC_TYPE_CHOLESKY) {
        LLSModel m[2];
        LOCAL_ALIGNED(32, double, var, [FFALIGN(MAX_LPC_ORDER+1,4)]);
        double av_uninit(weight);
        memset(var, 0, FFALIGN(MAX_LPC_ORDER+1,4)*sizeof(*var));

        for(j=0; j<max_order; j++)
            m[0].coeff[max_order-1][j] = -lpc[max_order-1][j];

        for(; pass<lpc_passes; pass++){
            avpriv_init_lls(&m[pass&1], max_order);

            weight=0;
            for(i=max_order; i<blocksize; i++){
                for(j=0; j<=max_order; j++)
                    var[j]= samples[i-j];

                if(pass){
                    double eval, inv, rinv;
                    eval= m[pass&1].evaluate_lls(&m[(pass-1)&1], var+1, max_order-1);
                    eval= (512>>pass) + fabs(eval - var[0]);
                    inv = 1/eval;
                    rinv = sqrt(inv);
                    for(j=0; j<=max_order; j++)
                        var[j] *= rinv;
                    weight += inv;
                }else
                    weight++;

                m[pass&1].update_lls(&m[pass&1], var);
            }
            avpriv_solve_lls(&m[pass&1], 0.001, 0);
        }

        for(i=0; i<max_order; i++){
            for(j=0; j<max_order; j++)
                lpc[i][j]=-m[(pass-1)&1].coeff[i][j];
            ref[i]= sqrt(m[(pass-1)&1].variance[i] / weight) * (blocksize - max_order) / 4000;
        }
        for(i=max_order-1; i>0; i--)
            ref[i] = ref[i-1] - ref[i];
    }

    opt_order = max_order;

    if(omethod == ORDER_METHOD_EST) {
        opt_order = estimate_best_order(ref, min_order, max_order);
        i = opt_order-1;
        quantize_lpc_coefs(lpc[i], i+1, precision, coefs[i], &shift[i], max_shift, zero_shift);
    } else {
        for(i=min_order-1; i<max_order; i++) {
            quantize_lpc_coefs(lpc[i], i+1, precision, coefs[i], &shift[i], max_shift, zero_shift);
        }
    }

    return opt_order;
}

av_cold int ff_lpc_init(LPCContext *s, int blocksize, int max_order,
                        enum FFLPCType lpc_type)
{
    s->blocksize = blocksize;
    s->max_order = max_order;
    s->lpc_type  = lpc_type;

    s->windowed_buffer = av_mallocz((blocksize + 2 + FFALIGN(max_order, 4)) *
                                    sizeof(*s->windowed_samples));
    if (!s->windowed_buffer)
        return AVERROR(ENOMEM);
    s->windowed_samples = s->windowed_buffer + FFALIGN(max_order, 4);

    s->lpc_apply_welch_window = lpc_apply_welch_window_c;
    s->lpc_compute_autocorr   = lpc_compute_autocorr_c;

    if (ARCH_X86)
        ff_lpc_init_x86(s);

    return 0;
}

av_cold void ff_lpc_end(LPCContext *s)
{
    av_freep(&s->windowed_buffer);
}
Commit	Line	Data
	1	/*
	2	* LPC utility code
	3	* Copyright (c) 2006 Justin Ruggles <justin.ruggles@gmail.com>
	4	*
	5	* This file is part of FFmpeg.
	6	*
	7	* FFmpeg is free software; you can redistribute it and/or
	8	* modify it under the terms of the GNU Lesser General Public
	9	* License as published by the Free Software Foundation; either
	10	* version 2.1 of the License, or (at your option) any later version.
	11	*
	12	* FFmpeg is distributed in the hope that it will be useful,
	13	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	14	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
	15	* Lesser General Public License for more details.
	16	*
	17	* You should have received a copy of the GNU Lesser General Public
	18	* License along with FFmpeg; if not, write to the Free Software
	19	* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
	20	*/
	21
	22	#include "libavutil/common.h"
	23	#include "libavutil/lls.h"
	24
	25	#define LPC_USE_DOUBLE
	26	#include "lpc.h"
	27	#include "libavutil/avassert.h"
	28
	29
	30	/**
	31	* Apply Welch window function to audio block
	32	*/
	33	static void lpc_apply_welch_window_c(const int32_t *data, int len,
	34	double *w_data)
	35	{
	36	int i, n2;
	37	double w;
	38	double c;
	39
	40	/* The optimization in commit fa4ed8c does not support odd len.
	41	* If someone wants odd len extend that change. */
	42	av_assert2(!(len & 1));
	43
	44	n2 = (len >> 1);
	45	c = 2.0 / (len - 1.0);
	46
	47	w_data+=n2;
	48	data+=n2;
	49	for(i=0; i<n2; i++) {
	50	w = c - n2 + i;
	51	w = 1.0 - (w * w);
	52	w_data[-i-1] = data[-i-1] * w;
	53	w_data[+i ] = data[+i ] * w;
	54	}
	55	}
	56
	57	/**
	58	* Calculate autocorrelation data from audio samples
	59	* A Welch window function is applied before calculation.
	60	*/
	61	static void lpc_compute_autocorr_c(const double *data, int len, int lag,
	62	double *autoc)
	63	{
	64	int i, j;
	65
	66	for(j=0; j<lag; j+=2){
	67	double sum0 = 1.0, sum1 = 1.0;
	68	for(i=j; i<len; i++){
	69	sum0 += data[i] * data[i-j];
	70	sum1 += data[i] * data[i-j-1];
	71	}
	72	autoc[j ] = sum0;
	73	autoc[j+1] = sum1;
	74	}
	75
	76	if(j==lag){
	77	double sum = 1.0;
	78	for(i=j-1; i<len; i+=2){
	79	sum += data[i ] * data[i-j ]
	80	+ data[i+1] * data[i-j+1];
	81	}
	82	autoc[j] = sum;
	83	}
	84	}
	85
	86	/**
	87	* Quantize LPC coefficients
	88	*/
	89	static void quantize_lpc_coefs(double *lpc_in, int order, int precision,
	90	int32_t lpc_out, int shift, int max_shift, int zero_shift)
	91	{
	92	int i;
	93	double cmax, error;
	94	int32_t qmax;
	95	int sh;
	96
	97	/* define maximum levels */
	98	qmax = (1 << (precision - 1)) - 1;
	99
	100	/* find maximum coefficient value */
	101	cmax = 0.0;
	102	for(i=0; i<order; i++) {
	103	cmax= FFMAX(cmax, fabs(lpc_in[i]));
	104	}
	105
	106	/* if maximum value quantizes to zero, return all zeros */
	107	if(cmax * (1 << max_shift) < 1.0) {
	108	*shift = zero_shift;
	109	memset(lpc_out, 0, sizeof(int32_t) * order);
	110	return;
	111	}
	112
	113	/* calculate level shift which scales max coeff to available bits */
	114	sh = max_shift;
	115	while((cmax * (1 << sh) > qmax) && (sh > 0)) {
	116	sh--;
	117	}
	118
	119	/* since negative shift values are unsupported in decoder, scale down
	120	coefficients instead */
	121	if(sh == 0 && cmax > qmax) {
	122	double scale = ((double)qmax) / cmax;
	123	for(i=0; i<order; i++) {
	124	lpc_in[i] *= scale;
	125	}
	126	}
	127
	128	/* output quantized coefficients and level shift */
	129	error=0;
	130	for(i=0; i<order; i++) {
	131	error -= lpc_in[i] * (1 << sh);
	132	lpc_out[i] = av_clip(lrintf(error), -qmax, qmax);
	133	error -= lpc_out[i];
	134	}
	135	*shift = sh;
	136	}
	137
	138	static int estimate_best_order(double *ref, int min_order, int max_order)
	139	{
	140	int i, est;
	141
	142	est = min_order;
	143	for(i=max_order-1; i>=min_order-1; i--) {
	144	if(ref[i] > 0.10) {
	145	est = i+1;
	146	break;
	147	}
	148	}
	149	return est;
	150	}
	151
	152	int ff_lpc_calc_ref_coefs(LPCContext *s,
	153	const int32_t samples, int order, double ref)
	154	{
	155	double autoc[MAX_LPC_ORDER + 1];
	156
	157	s->lpc_apply_welch_window(samples, s->blocksize, s->windowed_samples);
	158	s->lpc_compute_autocorr(s->windowed_samples, s->blocksize, order, autoc);
	159	compute_ref_coefs(autoc, order, ref, NULL);
	160
	161	return order;
	162	}
	163
	164	/**
	165	* Calculate LPC coefficients for multiple orders
	166	*
	167	* @param lpc_type LPC method for determining coefficients,
	168	* see #FFLPCType for details
	169	*/
	170	int ff_lpc_calc_coefs(LPCContext *s,
	171	const int32_t *samples, int blocksize, int min_order,
	172	int max_order, int precision,
	173	int32_t coefs[][MAX_LPC_ORDER], int *shift,
	174	enum FFLPCType lpc_type, int lpc_passes,
	175	int omethod, int max_shift, int zero_shift)
	176	{
	177	double autoc[MAX_LPC_ORDER+1];
	178	double ref[MAX_LPC_ORDER];
	179	double lpc[MAX_LPC_ORDER][MAX_LPC_ORDER];
	180	int i, j, pass = 0;
	181	int opt_order;
	182
	183	av_assert2(max_order >= MIN_LPC_ORDER && max_order <= MAX_LPC_ORDER &&
	184	lpc_type > FF_LPC_TYPE_FIXED);
	185	av_assert0(lpc_type == FF_LPC_TYPE_CHOLESKY \|\| lpc_type == FF_LPC_TYPE_LEVINSON);
	186
	187	/* reinit LPC context if parameters have changed */
	188	if (blocksize != s->blocksize \|\| max_order != s->max_order \|\|
	189	lpc_type != s->lpc_type) {
	190	ff_lpc_end(s);
	191	ff_lpc_init(s, blocksize, max_order, lpc_type);
	192	}
	193
	194	if(lpc_passes <= 0)
	195	lpc_passes = 2;
	196
	197	if (lpc_type == FF_LPC_TYPE_LEVINSON \|\| (lpc_type == FF_LPC_TYPE_CHOLESKY && lpc_passes > 1)) {
	198	s->lpc_apply_welch_window(samples, blocksize, s->windowed_samples);
	199
	200	s->lpc_compute_autocorr(s->windowed_samples, blocksize, max_order, autoc);
	201
	202	compute_lpc_coefs(autoc, max_order, &lpc[0][0], MAX_LPC_ORDER, 0, 1);
	203
	204	for(i=0; i<max_order; i++)
	205	ref[i] = fabs(lpc[i][i]);
	206
	207	pass++;
	208	}
	209
	210	if (lpc_type == FF_LPC_TYPE_CHOLESKY) {
	211	LLSModel m[2];
	212	LOCAL_ALIGNED(32, double, var, [FFALIGN(MAX_LPC_ORDER+1,4)]);
	213	double av_uninit(weight);
	214	memset(var, 0, FFALIGN(MAX_LPC_ORDER+1,4)sizeof(var));
	215
	216	for(j=0; j<max_order; j++)
	217	m[0].coeff[max_order-1][j] = -lpc[max_order-1][j];
	218
	219	for(; pass<lpc_passes; pass++){
	220	avpriv_init_lls(&m[pass&1], max_order);
	221
	222	weight=0;
	223	for(i=max_order; i<blocksize; i++){
	224	for(j=0; j<=max_order; j++)
	225	var[j]= samples[i-j];
	226
	227	if(pass){
	228	double eval, inv, rinv;
	229	eval= m[pass&1].evaluate_lls(&m[(pass-1)&1], var+1, max_order-1);
	230	eval= (512>>pass) + fabs(eval - var[0]);
	231	inv = 1/eval;
	232	rinv = sqrt(inv);
	233	for(j=0; j<=max_order; j++)
	234	var[j] *= rinv;
	235	weight += inv;
	236	}else
	237	weight++;
	238
	239	m[pass&1].update_lls(&m[pass&1], var);
	240	}
	241	avpriv_solve_lls(&m[pass&1], 0.001, 0);
	242	}
	243
	244	for(i=0; i<max_order; i++){
	245	for(j=0; j<max_order; j++)
	246	lpc[i][j]=-m[(pass-1)&1].coeff[i][j];
	247	ref[i]= sqrt(m[(pass-1)&1].variance[i] / weight) * (blocksize - max_order) / 4000;
	248	}
	249	for(i=max_order-1; i>0; i--)
	250	ref[i] = ref[i-1] - ref[i];
	251	}
	252
	253	opt_order = max_order;
	254
	255	if(omethod == ORDER_METHOD_EST) {
	256	opt_order = estimate_best_order(ref, min_order, max_order);
	257	i = opt_order-1;
	258	quantize_lpc_coefs(lpc[i], i+1, precision, coefs[i], &shift[i], max_shift, zero_shift);
	259	} else {
	260	for(i=min_order-1; i<max_order; i++) {
	261	quantize_lpc_coefs(lpc[i], i+1, precision, coefs[i], &shift[i], max_shift, zero_shift);
	262	}
	263	}
	264
	265	return opt_order;
	266	}
	267
	268	av_cold int ff_lpc_init(LPCContext *s, int blocksize, int max_order,
	269	enum FFLPCType lpc_type)
	270	{
	271	s->blocksize = blocksize;
	272	s->max_order = max_order;
	273	s->lpc_type = lpc_type;
	274
	275	s->windowed_buffer = av_mallocz((blocksize + 2 + FFALIGN(max_order, 4)) *
	276	sizeof(*s->windowed_samples));
	277	if (!s->windowed_buffer)
	278	return AVERROR(ENOMEM);
	279	s->windowed_samples = s->windowed_buffer + FFALIGN(max_order, 4);
	280
	281	s->lpc_apply_welch_window = lpc_apply_welch_window_c;
	282	s->lpc_compute_autocorr = lpc_compute_autocorr_c;
	283
	284	if (ARCH_X86)
	285	ff_lpc_init_x86(s);
	286
	287	return 0;
	288	}
	289
	290	av_cold void ff_lpc_end(LPCContext *s)
	291	{
	292	av_freep(&s->windowed_buffer);
	293	}