[deb_ffmpeg.git] / ffmpeg / libavcodec / mips / aacpsy_mips.h

/*
 * Copyright (c) 2012
 *      MIPS Technologies, Inc., California.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the MIPS Technologies, Inc., nor the names of its
 *    contributors may be used to endorse or promote products derived from
 *    this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE MIPS TECHNOLOGIES, INC. ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE MIPS TECHNOLOGIES, INC. BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 * Author:  Bojan Zivkovic   (bojan@mips.com)
 *
 * AAC encoder psychoacoustic model routines optimized
 * for MIPS floating-point architecture
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * Reference: libavcodec/aacpsy.c
 */

#ifndef AVCODEC_MIPS_AACPSY_MIPS_H
#define AVCODEC_MIPS_AACPSY_MIPS_H

#if HAVE_INLINE_ASM && HAVE_MIPSFPU && ( PSY_LAME_FIR_LEN == 21 )
/**
 * MIPS FPU implementation of calc_thr_3gpp() (reference: libavcodec/aacpsy.c).
 *
 * For every window and every band it accumulates, over the band's
 * coefficients, the energy (sum of squares) and a form factor
 * (sum of sqrt(|coef|)), then fills in energy, thr and nz_lines of the
 * matching AacPsyBand.
 *
 * @param wi         window information; only wi->num_windows is read
 * @param num_bands  number of bands processed per window
 * @param pch        channel whose band[] entries are written; the entry for
 *                   window n, band g is pch->band[n * 16 + g]
 * @param band_sizes number of coefficients in each band (num_bands entries).
 *                   Coefficients are consumed four at a time, so a size that
 *                   is not a multiple of 4 makes the loop read past the end
 *                   of that band.
 * @param coefs      coefficients, laid out band after band and window after
 *                   window; the read position only ever moves forward
 */
static void calc_thr_3gpp_mips(const FFPsyWindowInfo *wi, const int num_bands,
                               AacPsyChannel *pch, const uint8_t *band_sizes,
                               const float *coefs)
{
    int i, w, g;
    int start = 0;   /* index in coefs[] of the first coefficient of the current band */
    for (w = 0; w < wi->num_windows*16; w += 16) {
        for (g = 0; g < num_bands; g++) {
            AacPsyBand *band = &pch->band[w+g];

            float form_factor = 0.0f;
            float Temp;
            band->energy = 0.0f;
            for (i = 0; i < band_sizes[g]; i+=4) {
                float a, b, c, d;
                float ax, bx, cx, dx;
                /* The asm only loads through this pointer, so const is kept. */
                const float *cf = &coefs[start+i];

                /*
                 * Four coefficients per pass:
                 *   a..d   = |cf[0..3]|
                 *   ax..dx = sqrt(a..d)
                 *   energy      += a*a + b*b + c*c + d*d
                 *   form_factor += ax + bx + cx + dx
                 */
                __asm__ volatile (
                    "lwc1   %[a],   0(%[cf])                \n\t"
                    "lwc1   %[b],   4(%[cf])                \n\t"
                    "lwc1   %[c],   8(%[cf])                \n\t"
                    "lwc1   %[d],   12(%[cf])               \n\t"
                    "abs.s  %[a],   %[a]                    \n\t"
                    "abs.s  %[b],   %[b]                    \n\t"
                    "abs.s  %[c],   %[c]                    \n\t"
                    "abs.s  %[d],   %[d]                    \n\t"
                    "sqrt.s %[ax],  %[a]                    \n\t"
                    "sqrt.s %[bx],  %[b]                    \n\t"
                    "sqrt.s %[cx],  %[c]                    \n\t"
                    "sqrt.s %[dx],  %[d]                    \n\t"
                    "madd.s %[e],   %[e],   %[a],   %[a]    \n\t"
                    "madd.s %[e],   %[e],   %[b],   %[b]    \n\t"
                    "madd.s %[e],   %[e],   %[c],   %[c]    \n\t"
                    "madd.s %[e],   %[e],   %[d],   %[d]    \n\t"
                    "add.s  %[f],   %[f],   %[ax]           \n\t"
                    "add.s  %[f],   %[f],   %[bx]           \n\t"
                    "add.s  %[f],   %[f],   %[cx]           \n\t"
                    "add.s  %[f],   %[f],   %[dx]           \n\t"

                    : [a]"=&f"(a), [b]"=&f"(b),
                      [c]"=&f"(c), [d]"=&f"(d),
                      [e]"+f"(band->energy), [f]"+f"(form_factor),
                      [ax]"=&f"(ax), [bx]"=&f"(bx),
                      [cx]"=&f"(cx), [dx]"=&f"(dx)
                    : [cf]"r"(cf)
                    : "memory"
                );
            }

            /*
             * A band with no energy would otherwise compute
             * band_sizes[g] / 0 = +inf, and 0 * sqrt(inf) below would store
             * NaN in nz_lines. Use 0 for such bands instead.
             */
            Temp = band->energy > 0 ? sqrtf((float)band_sizes[g] / band->energy) : 0;
            /* 0.001258925 is approximately 10^-2.9, i.e. about 29 dB below the band energy. */
            band->thr      = band->energy * 0.001258925f;
            /* form_factor * (band size / energy)^(1/4) */
            band->nz_lines = form_factor * sqrtf(Temp);
            start += band_sizes[g];
        }
    }
}

/**
 * MIPS FPU implementation of psy_hp_filter() (reference: libavcodec/aacpsy.c).
 *
 * Produces AAC_BLOCK_SIZE_LONG output samples, four per loop pass.
 * With c0..c4 = psy_fir_coeffs[1], [3], [5], [7], [9], output i is
 *
 *   hpfsmpl[i] = 32768 * ( firbuf[i + 10]
 *                        + c0 * (firbuf[i + 1] + firbuf[i + 20])
 *                        + c1 * (firbuf[i + 3] + firbuf[i + 18])
 *                        + c2 * (firbuf[i + 5] + firbuf[i + 16])
 *                        + c3 * (firbuf[i + 7] + firbuf[i + 14])
 *                        + c4 * (firbuf[i + 9] + firbuf[i + 12]) )
 *
 * Only the odd-indexed coefficients are used; the even-indexed ones are
 * never read (presumably they are zero in the coefficient table - confirm
 * against the caller).
 *
 * @param firbuf         input samples; elements 1 .. AAC_BLOCK_SIZE_LONG + 19
 *                       are read
 * @param hpfsmpl        output buffer, AAC_BLOCK_SIZE_LONG elements written
 * @param psy_fir_coeffs filter coefficients; indices 1, 3, 5, 7 and 9 are read
 */
static void psy_hp_filter_mips(const float *firbuf, float *hpfsmpl, const float * psy_fir_coeffs)
{
    float sum1, sum2, sum3, sum4;   /* accumulators for outputs i, i+1, i+2, i+3 */
    float *fb = (float*)firbuf;     /* read cursor, advanced by the asm; only loaded from */
    float *fb_end = fb + AAC_BLOCK_SIZE_LONG;   /* loop stops when fb reaches this */
    float *hp = hpfsmpl;            /* write cursor, advanced by the asm */

    float coeff0 = psy_fir_coeffs[1];
    float coeff1 = psy_fir_coeffs[3];
    float coeff2 = psy_fir_coeffs[5];
    float coeff3 = psy_fir_coeffs[7];
    float coeff4 = psy_fir_coeffs[9];

    /*
     * Notes on the assembly below:
     *  - "madd.s fd, fr, fs, ft" computes fd = fr + fs * ft.
     *  - $f0-$f11 hold input samples and are reloaded and reused within one
     *    pass; $f12 holds the constant 32768 loaded once before the loop.
     *    All of them are listed as clobbers.
     *  - The end test sits at the bottom of the loop, so the body always
     *    runs at least once.
     *  - Because of ".set noreorder", the "addiu %[hp]" after the "bne" is
     *    in the branch delay slot and executes on every pass, taken or not.
     *  - Loads, multiply-adds and stores are interleaved by hand; the order
     *    matters because sample registers are overwritten while later sums
     *    still need earlier values.
     */
    __asm__ volatile (
        ".set push                                          \n\t"
        ".set noreorder                                     \n\t"

        "li.s   $f12,       32768                           \n\t"
        "1:                                                 \n\t"
        "lwc1   $f0,        40(%[fb])                       \n\t"
        "lwc1   $f1,        4(%[fb])                        \n\t"
        "lwc1   $f2,        80(%[fb])                       \n\t"
        "lwc1   $f3,        44(%[fb])                       \n\t"
        "lwc1   $f4,        8(%[fb])                        \n\t"
        "madd.s %[sum1],    $f0,        $f1,    %[coeff0]   \n\t"
        "lwc1   $f5,        84(%[fb])                       \n\t"
        "lwc1   $f6,        48(%[fb])                       \n\t"
        "madd.s %[sum2],    $f3,        $f4,    %[coeff0]   \n\t"
        "lwc1   $f7,        12(%[fb])                       \n\t"
        "madd.s %[sum1],    %[sum1],    $f2,    %[coeff0]   \n\t"
        "lwc1   $f8,        88(%[fb])                       \n\t"
        "lwc1   $f9,        52(%[fb])                       \n\t"
        "madd.s %[sum2],    %[sum2],    $f5,    %[coeff0]   \n\t"
        "madd.s %[sum3],    $f6,        $f7,    %[coeff0]   \n\t"
        "lwc1   $f10,       16(%[fb])                       \n\t"
        "lwc1   $f11,       92(%[fb])                       \n\t"
        "madd.s %[sum1],    %[sum1],    $f7,    %[coeff1]   \n\t"
        "lwc1   $f1,        72(%[fb])                       \n\t"
        "madd.s %[sum3],    %[sum3],    $f8,    %[coeff0]   \n\t"
        "madd.s %[sum4],    $f9,        $f10,   %[coeff0]   \n\t"
        "madd.s %[sum2],    %[sum2],    $f10,   %[coeff1]   \n\t"
        "madd.s %[sum1],    %[sum1],    $f1,    %[coeff1]   \n\t"
        "lwc1   $f4,        76(%[fb])                       \n\t"
        "lwc1   $f8,        20(%[fb])                       \n\t"
        "madd.s %[sum4],    %[sum4],    $f11,   %[coeff0]   \n\t"
        "lwc1   $f11,       24(%[fb])                       \n\t"
        "madd.s %[sum2],    %[sum2],    $f4,    %[coeff1]   \n\t"
        "madd.s %[sum1],    %[sum1],    $f8,    %[coeff2]   \n\t"
        "madd.s %[sum3],    %[sum3],    $f8,    %[coeff1]   \n\t"
        "madd.s %[sum4],    %[sum4],    $f11,   %[coeff1]   \n\t"
        "lwc1   $f7,        64(%[fb])                       \n\t"
        "madd.s %[sum2],    %[sum2],    $f11,   %[coeff2]   \n\t"
        "lwc1   $f10,       68(%[fb])                       \n\t"
        "madd.s %[sum3],    %[sum3],    $f2,    %[coeff1]   \n\t"
        "madd.s %[sum4],    %[sum4],    $f5,    %[coeff1]   \n\t"
        "madd.s %[sum1],    %[sum1],    $f7,    %[coeff2]   \n\t"
        "madd.s %[sum2],    %[sum2],    $f10,   %[coeff2]   \n\t"
        "lwc1   $f2,        28(%[fb])                       \n\t"
        "lwc1   $f5,        32(%[fb])                       \n\t"
        "lwc1   $f8,        56(%[fb])                       \n\t"
        "lwc1   $f11,       60(%[fb])                       \n\t"
        "madd.s %[sum3],    %[sum3],    $f2,    %[coeff2]   \n\t"
        "madd.s %[sum4],    %[sum4],    $f5,    %[coeff2]   \n\t"
        "madd.s %[sum1],    %[sum1],    $f2,    %[coeff3]   \n\t"
        "madd.s %[sum2],    %[sum2],    $f5,    %[coeff3]   \n\t"
        "madd.s %[sum3],    %[sum3],    $f1,    %[coeff2]   \n\t"
        "madd.s %[sum4],    %[sum4],    $f4,    %[coeff2]   \n\t"
        "madd.s %[sum1],    %[sum1],    $f8,    %[coeff3]   \n\t"
        "madd.s %[sum2],    %[sum2],    $f11,   %[coeff3]   \n\t"
        "lwc1   $f1,        36(%[fb])                       \n\t"
        "addiu  %[fb],      %[fb],      16                  \n\t"
        "madd.s %[sum4],    %[sum4],    $f0,    %[coeff3]   \n\t"
        "madd.s %[sum3],    %[sum3],    $f1,    %[coeff3]   \n\t"
        "madd.s %[sum1],    %[sum1],    $f1,    %[coeff4]   \n\t"
        "madd.s %[sum2],    %[sum2],    $f0,    %[coeff4]   \n\t"
        "madd.s %[sum4],    %[sum4],    $f10,   %[coeff3]   \n\t"
        "madd.s %[sum3],    %[sum3],    $f7,    %[coeff3]   \n\t"
        "madd.s %[sum1],    %[sum1],    $f6,    %[coeff4]   \n\t"
        "madd.s %[sum2],    %[sum2],    $f9,    %[coeff4]   \n\t"
        "madd.s %[sum4],    %[sum4],    $f6,    %[coeff4]   \n\t"
        "madd.s %[sum3],    %[sum3],    $f3,    %[coeff4]   \n\t"
        "mul.s  %[sum1],    %[sum1],    $f12                \n\t"
        "mul.s  %[sum2],    %[sum2],    $f12                \n\t"
        "madd.s %[sum4],    %[sum4],    $f11,   %[coeff4]   \n\t"
        "madd.s %[sum3],    %[sum3],    $f8,    %[coeff4]   \n\t"
        "swc1   %[sum1],    0(%[hp])                        \n\t"
        "swc1   %[sum2],    4(%[hp])                        \n\t"
        "mul.s  %[sum4],    %[sum4],    $f12                \n\t"
        "mul.s  %[sum3],    %[sum3],    $f12                \n\t"
        "swc1   %[sum4],    12(%[hp])                       \n\t"
        "swc1   %[sum3],    8(%[hp])                        \n\t"
        "bne    %[fb],      %[fb_end],  1b                  \n\t"
        " addiu %[hp],      %[hp],      16                  \n\t"

        ".set pop                                           \n\t"

        : [sum1]"=&f"(sum1), [sum2]"=&f"(sum2),
          [sum3]"=&f"(sum3), [sum4]"=&f"(sum4),
          [fb]"+r"(fb), [hp]"+r"(hp)
        : [coeff0]"f"(coeff0), [coeff1]"f"(coeff1),
          [coeff2]"f"(coeff2), [coeff3]"f"(coeff3),
          [coeff4]"f"(coeff4), [fb_end]"r"(fb_end)
        : "$f0", "$f1", "$f2", "$f3", "$f4", "$f5", "$f6",
          "$f7", "$f8", "$f9", "$f10", "$f11", "$f12",
          "memory"
    );
}

/*
 * Redirect the generic function names to the MIPS implementations defined
 * above, so that code using calc_thr_3gpp / psy_hp_filter after this point
 * gets the optimized versions.
 */
#define calc_thr_3gpp calc_thr_3gpp_mips
#define psy_hp_filter psy_hp_filter_mips

#endif /* HAVE_INLINE_ASM && HAVE_MIPSFPU && ( PSY_LAME_FIR_LEN == 21 ) */
#endif /* AVCODEC_MIPS_AACPSY_MIPS_H */
Commit	Line	Data
2ba45a60 DM	1	/*
	2	* Copyright (c) 2012
	3	* MIPS Technologies, Inc., California.
	4	*
	5	* Redistribution and use in source and binary forms, with or without
	6	* modification, are permitted provided that the following conditions
	7	* are met:
	8	* 1. Redistributions of source code must retain the above copyright
	9	* notice, this list of conditions and the following disclaimer.
	10	* 2. Redistributions in binary form must reproduce the above copyright
	11	* notice, this list of conditions and the following disclaimer in the
	12	* documentation and/or other materials provided with the distribution.
	13	* 3. Neither the name of the MIPS Technologies, Inc., nor the names of its
	14	* contributors may be used to endorse or promote products derived from
	15	* this software without specific prior written permission.
	16	*
	17	* THIS SOFTWARE IS PROVIDED BY THE MIPS TECHNOLOGIES, INC. ``AS IS'' AND
	18	* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
	19	* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
	20	* ARE DISCLAIMED. IN NO EVENT SHALL THE MIPS TECHNOLOGIES, INC. BE LIABLE
	21	* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
	22	* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
	23	* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
	24	* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
	25	* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
	26	* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
	27	* SUCH DAMAGE.
	28	*
	29	* Author: Bojan Zivkovic (bojan@mips.com)
	30	*
	31	* AAC encoder psychoacoustic model routines optimized
	32	* for MIPS floating-point architecture
	33	*
	34	* This file is part of FFmpeg.
	35	*
	36	* FFmpeg is free software; you can redistribute it and/or
	37	* modify it under the terms of the GNU Lesser General Public
	38	* License as published by the Free Software Foundation; either
	39	* version 2.1 of the License, or (at your option) any later version.
	40	*
	41	* FFmpeg is distributed in the hope that it will be useful,
	42	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	43	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
	44	* Lesser General Public License for more details.
	45	*
	46	* You should have received a copy of the GNU Lesser General Public
	47	* License along with FFmpeg; if not, write to the Free Software
	48	* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
	49	*/
	50
	51	/**
	52	* @file
	53	* Reference: libavcodec/aacpsy.c
	54	*/
	55
	56	#ifndef AVCODEC_MIPS_AACPSY_MIPS_H
	57	#define AVCODEC_MIPS_AACPSY_MIPS_H
	58
	59	#if HAVE_INLINE_ASM && HAVE_MIPSFPU && ( PSY_LAME_FIR_LEN == 21 )
	60	static void calc_thr_3gpp_mips(const FFPsyWindowInfo *wi, const int num_bands,
	61	AacPsyChannel *pch, const uint8_t *band_sizes,
	62	const float *coefs)
	63	{
	64	int i, w, g;
65	int start = 0;
66	for (w = 0; w < wi->num_windows*16; w += 16) {
67	for (g = 0; g < num_bands; g++) {
68	AacPsyBand *band = &pch->band[w+g];
69
70	float form_factor = 0.0f;
71	float Temp;
72	band->energy = 0.0f;
73	for (i = 0; i < band_sizes[g]; i+=4) {
74	float a, b, c, d;
75	float ax, bx, cx, dx;
76	float *cf = (float *)&coefs[start+i];
77
78	__asm__ volatile (
79	"lwc1 %[a], 0(%[cf]) \n\t"
80	"lwc1 %[b], 4(%[cf]) \n\t"
81	"lwc1 %[c], 8(%[cf]) \n\t"
82	"lwc1 %[d], 12(%[cf]) \n\t"
83	"abs.s %[a], %[a] \n\t"
84	"abs.s %[b], %[b] \n\t"
85	"abs.s %[c], %[c] \n\t"
86	"abs.s %[d], %[d] \n\t"
87	"sqrt.s %[ax], %[a] \n\t"
88	"sqrt.s %[bx], %[b] \n\t"
89	"sqrt.s %[cx], %[c] \n\t"
90	"sqrt.s %[dx], %[d] \n\t"
91	"madd.s %[e], %[e], %[a], %[a] \n\t"
92	"madd.s %[e], %[e], %[b], %[b] \n\t"
93	"madd.s %[e], %[e], %[c], %[c] \n\t"
94	"madd.s %[e], %[e], %[d], %[d] \n\t"
95	"add.s %[f], %[f], %[ax] \n\t"
96	"add.s %[f], %[f], %[bx] \n\t"
97	"add.s %[f], %[f], %[cx] \n\t"
98	"add.s %[f], %[f], %[dx] \n\t"
99
100	: [a]"=&f"(a), [b]"=&f"(b),
101	[c]"=&f"(c), [d]"=&f"(d),
102	[e]"+f"(band->energy), [f]"+f"(form_factor),
103	[ax]"=&f"(ax), [bx]"=&f"(bx),
104	[cx]"=&f"(cx), [dx]"=&f"(dx)
105	: [cf]"r"(cf)
106	: "memory"
107	);
108	}
109
110	Temp = sqrtf((float)band_sizes[g] / band->energy);
111	band->thr = band->energy * 0.001258925f;
112	band->nz_lines = form_factor * sqrtf(Temp);
113	start += band_sizes[g];
114	}
115	}
116	}
117
118	static void psy_hp_filter_mips(const float *firbuf, float *hpfsmpl, const float * psy_fir_coeffs)
119	{
120	float sum1, sum2, sum3, sum4;
121	float *fb = (float*)firbuf;
122	float *fb_end = fb + AAC_BLOCK_SIZE_LONG;
123	float *hp = hpfsmpl;
124
125	float coeff0 = psy_fir_coeffs[1];
126	float coeff1 = psy_fir_coeffs[3];
127	float coeff2 = psy_fir_coeffs[5];
128	float coeff3 = psy_fir_coeffs[7];
129	float coeff4 = psy_fir_coeffs[9];
130
131	__asm__ volatile (
132	".set push \n\t"
133	".set noreorder \n\t"
134
135	"li.s $f12, 32768 \n\t"
136	"1: \n\t"
137	"lwc1 $f0, 40(%[fb]) \n\t"
138	"lwc1 $f1, 4(%[fb]) \n\t"
139	"lwc1 $f2, 80(%[fb]) \n\t"
140	"lwc1 $f3, 44(%[fb]) \n\t"
141	"lwc1 $f4, 8(%[fb]) \n\t"
142	"madd.s %[sum1], $f0, $f1, %[coeff0] \n\t"
143	"lwc1 $f5, 84(%[fb]) \n\t"
144	"lwc1 $f6, 48(%[fb]) \n\t"
145	"madd.s %[sum2], $f3, $f4, %[coeff0] \n\t"
146	"lwc1 $f7, 12(%[fb]) \n\t"
147	"madd.s %[sum1], %[sum1], $f2, %[coeff0] \n\t"
148	"lwc1 $f8, 88(%[fb]) \n\t"
149	"lwc1 $f9, 52(%[fb]) \n\t"
150	"madd.s %[sum2], %[sum2], $f5, %[coeff0] \n\t"
151	"madd.s %[sum3], $f6, $f7, %[coeff0] \n\t"
152	"lwc1 $f10, 16(%[fb]) \n\t"
153	"lwc1 $f11, 92(%[fb]) \n\t"
154	"madd.s %[sum1], %[sum1], $f7, %[coeff1] \n\t"
155	"lwc1 $f1, 72(%[fb]) \n\t"
156	"madd.s %[sum3], %[sum3], $f8, %[coeff0] \n\t"
157	"madd.s %[sum4], $f9, $f10, %[coeff0] \n\t"
158	"madd.s %[sum2], %[sum2], $f10, %[coeff1] \n\t"
159	"madd.s %[sum1], %[sum1], $f1, %[coeff1] \n\t"
160	"lwc1 $f4, 76(%[fb]) \n\t"
161	"lwc1 $f8, 20(%[fb]) \n\t"
162	"madd.s %[sum4], %[sum4], $f11, %[coeff0] \n\t"
163	"lwc1 $f11, 24(%[fb]) \n\t"
164	"madd.s %[sum2], %[sum2], $f4, %[coeff1] \n\t"
165	"madd.s %[sum1], %[sum1], $f8, %[coeff2] \n\t"
166	"madd.s %[sum3], %[sum3], $f8, %[coeff1] \n\t"
167	"madd.s %[sum4], %[sum4], $f11, %[coeff1] \n\t"
168	"lwc1 $f7, 64(%[fb]) \n\t"
169	"madd.s %[sum2], %[sum2], $f11, %[coeff2] \n\t"
170	"lwc1 $f10, 68(%[fb]) \n\t"
171	"madd.s %[sum3], %[sum3], $f2, %[coeff1] \n\t"
172	"madd.s %[sum4], %[sum4], $f5, %[coeff1] \n\t"
173	"madd.s %[sum1], %[sum1], $f7, %[coeff2] \n\t"
174	"madd.s %[sum2], %[sum2], $f10, %[coeff2] \n\t"
175	"lwc1 $f2, 28(%[fb]) \n\t"
176	"lwc1 $f5, 32(%[fb]) \n\t"
177	"lwc1 $f8, 56(%[fb]) \n\t"
178	"lwc1 $f11, 60(%[fb]) \n\t"
179	"madd.s %[sum3], %[sum3], $f2, %[coeff2] \n\t"
180	"madd.s %[sum4], %[sum4], $f5, %[coeff2] \n\t"
181	"madd.s %[sum1], %[sum1], $f2, %[coeff3] \n\t"
182	"madd.s %[sum2], %[sum2], $f5, %[coeff3] \n\t"
183	"madd.s %[sum3], %[sum3], $f1, %[coeff2] \n\t"
184	"madd.s %[sum4], %[sum4], $f4, %[coeff2] \n\t"
185	"madd.s %[sum1], %[sum1], $f8, %[coeff3] \n\t"
186	"madd.s %[sum2], %[sum2], $f11, %[coeff3] \n\t"
187	"lwc1 $f1, 36(%[fb]) \n\t"
188	"addiu %[fb], %[fb], 16 \n\t"
189	"madd.s %[sum4], %[sum4], $f0, %[coeff3] \n\t"
190	"madd.s %[sum3], %[sum3], $f1, %[coeff3] \n\t"
191	"madd.s %[sum1], %[sum1], $f1, %[coeff4] \n\t"
192	"madd.s %[sum2], %[sum2], $f0, %[coeff4] \n\t"
193	"madd.s %[sum4], %[sum4], $f10, %[coeff3] \n\t"
194	"madd.s %[sum3], %[sum3], $f7, %[coeff3] \n\t"
195	"madd.s %[sum1], %[sum1], $f6, %[coeff4] \n\t"
196	"madd.s %[sum2], %[sum2], $f9, %[coeff4] \n\t"
197	"madd.s %[sum4], %[sum4], $f6, %[coeff4] \n\t"
198	"madd.s %[sum3], %[sum3], $f3, %[coeff4] \n\t"
199	"mul.s %[sum1], %[sum1], $f12 \n\t"
200	"mul.s %[sum2], %[sum2], $f12 \n\t"
201	"madd.s %[sum4], %[sum4], $f11, %[coeff4] \n\t"
202	"madd.s %[sum3], %[sum3], $f8, %[coeff4] \n\t"
203	"swc1 %[sum1], 0(%[hp]) \n\t"
204	"swc1 %[sum2], 4(%[hp]) \n\t"
205	"mul.s %[sum4], %[sum4], $f12 \n\t"
206	"mul.s %[sum3], %[sum3], $f12 \n\t"
207	"swc1 %[sum4], 12(%[hp]) \n\t"
208	"swc1 %[sum3], 8(%[hp]) \n\t"
209	"bne %[fb], %[fb_end], 1b \n\t"
210	" addiu %[hp], %[hp], 16 \n\t"
211
212	".set pop \n\t"
213
214	: [sum1]"=&f"(sum1), [sum2]"=&f"(sum2),
215	[sum3]"=&f"(sum3), [sum4]"=&f"(sum4),
216	[fb]"+r"(fb), [hp]"+r"(hp)
217	: [coeff0]"f"(coeff0), [coeff1]"f"(coeff1),
218	[coeff2]"f"(coeff2), [coeff3]"f"(coeff3),
219	[coeff4]"f"(coeff4), [fb_end]"r"(fb_end)
220	: "$f0", "$f1", "$f2", "$f3", "$f4", "$f5", "$f6",
221	"$f7", "$f8", "$f9", "$f10", "$f11", "$f12",
222	"memory"
223	);
224	}
225
226	#define calc_thr_3gpp calc_thr_3gpp_mips
227	#define psy_hp_filter psy_hp_filter_mips
228
229	#endif /* HAVE_INLINE_ASM && HAVE_MIPSFPU */
230	#endif /* AVCODEC_MIPS_AACPSY_MIPS_H */