Commit | Line | Data |
---|---|---|
2ba45a60 DM |
1 | /* |
2 | * audio conversion | |
3 | * Copyright (c) 2006 Michael Niedermayer <michaelni@gmx.at> | |
4 | * | |
5 | * This file is part of FFmpeg. | |
6 | * | |
7 | * FFmpeg is free software; you can redistribute it and/or | |
8 | * modify it under the terms of the GNU Lesser General Public | |
9 | * License as published by the Free Software Foundation; either | |
10 | * version 2.1 of the License, or (at your option) any later version. | |
11 | * | |
12 | * FFmpeg is distributed in the hope that it will be useful, | |
13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
15 | * Lesser General Public License for more details. | |
16 | * | |
17 | * You should have received a copy of the GNU Lesser General Public | |
18 | * License along with FFmpeg; if not, write to the Free Software | |
19 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | |
20 | */ | |
21 | ||
22 | /** | |
23 | * @file | |
24 | * audio conversion | |
25 | * @author Michael Niedermayer <michaelni@gmx.at> | |
26 | */ | |
27 | ||
28 | #include "libavutil/avstring.h" | |
29 | #include "libavutil/avassert.h" | |
30 | #include "libavutil/libm.h" | |
31 | #include "libavutil/samplefmt.h" | |
32 | #include "audioconvert.h" | |
33 | ||
34 | ||
/* Build the identifier of the routine that reads in_fmt samples and writes out_fmt samples. */
#define CONV_FUNC_NAME(out_fmt, in_fmt) conv_ ## in_fmt ## _to_ ## out_fmt
36 | ||
//FIXME rounding ?
/**
 * Define a static conversion routine named CONV_FUNC_NAME(ofmt, ifmt).
 *
 * The generated function stores `expr` (evaluated with `pi` pointing at the
 * current input sample) as an `otype` at `po`, then advances `pi` by `is`
 * bytes and `po` by `os` bytes, repeating until `po` reaches `end`.
 * The first loop is unrolled four times; the second one converts whatever
 * is left over.
 *
 * The unrolled loop is bounded by the distance still left to `end` rather
 * than by a precomputed `end - 3*os` pointer, so that no pointer before the
 * start of the output buffer is ever formed when fewer than three samples
 * are converted.
 */
#define CONV_FUNC(ofmt, otype, ifmt, expr)\
static void CONV_FUNC_NAME(ofmt, ifmt)(uint8_t *po, const uint8_t *pi, int is, int os, uint8_t *end)\
{\
    while(end - po > 3*os){\
        *(otype*)po = expr; pi += is; po += os;\
        *(otype*)po = expr; pi += is; po += os;\
        *(otype*)po = expr; pi += is; po += os;\
        *(otype*)po = expr; pi += is; po += os;\
    }\
    while(po < end){\
        *(otype*)po = expr; pi += is; po += os;\
    }\
}
52 | ||
53 | //FIXME put things below under ifdefs so we do not waste space for cases no codec will need | |
54 | CONV_FUNC(AV_SAMPLE_FMT_U8 , uint8_t, AV_SAMPLE_FMT_U8 , *(const uint8_t*)pi) | |
f6fa7814 DM |
55 | CONV_FUNC(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_U8 , (*(const uint8_t*)pi - 0x80U)<<8) |
56 | CONV_FUNC(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_U8 , (*(const uint8_t*)pi - 0x80U)<<24) | |
2ba45a60 DM |
57 | CONV_FUNC(AV_SAMPLE_FMT_FLT, float , AV_SAMPLE_FMT_U8 , (*(const uint8_t*)pi - 0x80)*(1.0f/ (1<<7))) |
58 | CONV_FUNC(AV_SAMPLE_FMT_DBL, double , AV_SAMPLE_FMT_U8 , (*(const uint8_t*)pi - 0x80)*(1.0 / (1<<7))) | |
59 | CONV_FUNC(AV_SAMPLE_FMT_U8 , uint8_t, AV_SAMPLE_FMT_S16, (*(const int16_t*)pi>>8) + 0x80) | |
60 | CONV_FUNC(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_S16, *(const int16_t*)pi) | |
61 | CONV_FUNC(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_S16, *(const int16_t*)pi<<16) | |
62 | CONV_FUNC(AV_SAMPLE_FMT_FLT, float , AV_SAMPLE_FMT_S16, *(const int16_t*)pi*(1.0f/ (1<<15))) | |
63 | CONV_FUNC(AV_SAMPLE_FMT_DBL, double , AV_SAMPLE_FMT_S16, *(const int16_t*)pi*(1.0 / (1<<15))) | |
64 | CONV_FUNC(AV_SAMPLE_FMT_U8 , uint8_t, AV_SAMPLE_FMT_S32, (*(const int32_t*)pi>>24) + 0x80) | |
65 | CONV_FUNC(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_S32, *(const int32_t*)pi>>16) | |
66 | CONV_FUNC(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_S32, *(const int32_t*)pi) | |
67 | CONV_FUNC(AV_SAMPLE_FMT_FLT, float , AV_SAMPLE_FMT_S32, *(const int32_t*)pi*(1.0f/ (1U<<31))) | |
68 | CONV_FUNC(AV_SAMPLE_FMT_DBL, double , AV_SAMPLE_FMT_S32, *(const int32_t*)pi*(1.0 / (1U<<31))) | |
69 | CONV_FUNC(AV_SAMPLE_FMT_U8 , uint8_t, AV_SAMPLE_FMT_FLT, av_clip_uint8( lrintf(*(const float*)pi * (1<<7)) + 0x80)) | |
70 | CONV_FUNC(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, av_clip_int16( lrintf(*(const float*)pi * (1<<15)))) | |
71 | CONV_FUNC(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, av_clipl_int32(llrintf(*(const float*)pi * (1U<<31)))) | |
72 | CONV_FUNC(AV_SAMPLE_FMT_FLT, float , AV_SAMPLE_FMT_FLT, *(const float*)pi) | |
73 | CONV_FUNC(AV_SAMPLE_FMT_DBL, double , AV_SAMPLE_FMT_FLT, *(const float*)pi) | |
74 | CONV_FUNC(AV_SAMPLE_FMT_U8 , uint8_t, AV_SAMPLE_FMT_DBL, av_clip_uint8( lrint(*(const double*)pi * (1<<7)) + 0x80)) | |
75 | CONV_FUNC(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, av_clip_int16( lrint(*(const double*)pi * (1<<15)))) | |
76 | CONV_FUNC(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, av_clipl_int32(llrint(*(const double*)pi * (1U<<31)))) | |
77 | CONV_FUNC(AV_SAMPLE_FMT_FLT, float , AV_SAMPLE_FMT_DBL, *(const double*)pi) | |
78 | CONV_FUNC(AV_SAMPLE_FMT_DBL, double , AV_SAMPLE_FMT_DBL, *(const double*)pi) | |
79 | ||
/*
 * Designated initializer placing the dst <- src converter in a flat table
 * indexed by dst + AV_SAMPLE_FMT_NB * src.
 */
#define FMT_PAIR_FUNC(dst, src) [(dst) + AV_SAMPLE_FMT_NB*(src)] = CONV_FUNC_NAME(dst, src)
81 | ||
82 | static conv_func_type * const fmt_pair_to_conv_functions[AV_SAMPLE_FMT_NB*AV_SAMPLE_FMT_NB] = { | |
83 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8 , AV_SAMPLE_FMT_U8 ), | |
84 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_U8 ), | |
85 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_U8 ), | |
86 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_U8 ), | |
87 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_U8 ), | |
88 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8 , AV_SAMPLE_FMT_S16), | |
89 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S16), | |
90 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_S16), | |
91 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S16), | |
92 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_S16), | |
93 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8 , AV_SAMPLE_FMT_S32), | |
94 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S32), | |
95 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_S32), | |
96 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S32), | |
97 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_S32), | |
98 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8 , AV_SAMPLE_FMT_FLT), | |
99 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_FLT), | |
100 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_FLT), | |
101 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_FLT), | |
102 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_FLT), | |
103 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8 , AV_SAMPLE_FMT_DBL), | |
104 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_DBL), | |
105 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_DBL), | |
106 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_DBL), | |
107 | FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_DBL), | |
108 | }; | |
109 | ||
/**
 * Copy len 1-byte elements from the first source plane to the first
 * destination plane.
 *
 * @param dst address of the destination plane pointer; only dst[0] is used
 * @param src address of the source plane pointer; only src[0] is used
 * @param len number of 1-byte elements to copy
 */
static void cpy1(uint8_t **dst, const uint8_t **src, int len)
{
    const uint8_t *from = src[0];
    uint8_t       *to   = dst[0];

    memcpy(to, from, len);
}
/**
 * Copy len 2-byte elements from the first source plane to the first
 * destination plane.
 *
 * @param dst address of the destination plane pointer; only dst[0] is used
 * @param src address of the source plane pointer; only src[0] is used
 * @param len number of 2-byte elements to copy
 */
static void cpy2(uint8_t **dst, const uint8_t **src, int len)
{
    const uint8_t *from = src[0];
    uint8_t       *to   = dst[0];

    memcpy(to, from, 2*len);
}
/**
 * Copy len 4-byte elements from the first source plane to the first
 * destination plane.
 *
 * @param dst address of the destination plane pointer; only dst[0] is used
 * @param src address of the source plane pointer; only src[0] is used
 * @param len number of 4-byte elements to copy
 */
static void cpy4(uint8_t **dst, const uint8_t **src, int len)
{
    const uint8_t *from = src[0];
    uint8_t       *to   = dst[0];

    memcpy(to, from, 4*len);
}
/**
 * Copy len 8-byte elements from the first source plane to the first
 * destination plane.
 *
 * @param dst address of the destination plane pointer; only dst[0] is used
 * @param src address of the source plane pointer; only src[0] is used
 * @param len number of 8-byte elements to copy
 */
static void cpy8(uint8_t **dst, const uint8_t **src, int len)
{
    const uint8_t *from = src[0];
    uint8_t       *to   = dst[0];

    memcpy(to, from, 8*len);
}
122 | ||
123 | AudioConvert *swri_audio_convert_alloc(enum AVSampleFormat out_fmt, | |
124 | enum AVSampleFormat in_fmt, | |
125 | int channels, const int *ch_map, | |
126 | int flags) | |
127 | { | |
128 | AudioConvert *ctx; | |
129 | conv_func_type *f = fmt_pair_to_conv_functions[av_get_packed_sample_fmt(out_fmt) + AV_SAMPLE_FMT_NB*av_get_packed_sample_fmt(in_fmt)]; | |
130 | ||
131 | if (!f) | |
132 | return NULL; | |
133 | ctx = av_mallocz(sizeof(*ctx)); | |
134 | if (!ctx) | |
135 | return NULL; | |
136 | ||
137 | if(channels == 1){ | |
138 | in_fmt = av_get_planar_sample_fmt( in_fmt); | |
139 | out_fmt = av_get_planar_sample_fmt(out_fmt); | |
140 | } | |
141 | ||
142 | ctx->channels = channels; | |
143 | ctx->conv_f = f; | |
144 | ctx->ch_map = ch_map; | |
145 | if (in_fmt == AV_SAMPLE_FMT_U8 || in_fmt == AV_SAMPLE_FMT_U8P) | |
146 | memset(ctx->silence, 0x80, sizeof(ctx->silence)); | |
147 | ||
148 | if(out_fmt == in_fmt && !ch_map) { | |
149 | switch(av_get_bytes_per_sample(in_fmt)){ | |
150 | case 1:ctx->simd_f = cpy1; break; | |
151 | case 2:ctx->simd_f = cpy2; break; | |
152 | case 4:ctx->simd_f = cpy4; break; | |
153 | case 8:ctx->simd_f = cpy8; break; | |
154 | } | |
155 | } | |
156 | ||
157 | if(HAVE_YASM && HAVE_MMX) swri_audio_convert_init_x86(ctx, out_fmt, in_fmt, channels); | |
158 | if(ARCH_ARM) swri_audio_convert_init_arm(ctx, out_fmt, in_fmt, channels); | |
159 | if(ARCH_AARCH64) swri_audio_convert_init_aarch64(ctx, out_fmt, in_fmt, channels); | |
160 | ||
161 | return ctx; | |
162 | } | |
163 | ||
164 | void swri_audio_convert_free(AudioConvert **ctx) | |
165 | { | |
166 | av_freep(ctx); | |
167 | } | |
168 | ||
169 | int swri_audio_convert(AudioConvert *ctx, AudioData *out, AudioData *in, int len) | |
170 | { | |
171 | int ch; | |
172 | int off=0; | |
173 | const int os= (out->planar ? 1 :out->ch_count) *out->bps; | |
174 | unsigned misaligned = 0; | |
175 | ||
176 | av_assert0(ctx->channels == out->ch_count); | |
177 | ||
178 | if (ctx->in_simd_align_mask) { | |
179 | int planes = in->planar ? in->ch_count : 1; | |
180 | unsigned m = 0; | |
181 | for (ch = 0; ch < planes; ch++) | |
182 | m |= (intptr_t)in->ch[ch]; | |
183 | misaligned |= m & ctx->in_simd_align_mask; | |
184 | } | |
185 | if (ctx->out_simd_align_mask) { | |
186 | int planes = out->planar ? out->ch_count : 1; | |
187 | unsigned m = 0; | |
188 | for (ch = 0; ch < planes; ch++) | |
189 | m |= (intptr_t)out->ch[ch]; | |
190 | misaligned |= m & ctx->out_simd_align_mask; | |
191 | } | |
192 | ||
193 | //FIXME optimize common cases | |
194 | ||
195 | if(ctx->simd_f && !ctx->ch_map && !misaligned){ | |
196 | off = len&~15; | |
197 | av_assert1(off>=0); | |
198 | av_assert1(off<=len); | |
199 | av_assert2(ctx->channels == SWR_CH_MAX || !in->ch[ctx->channels]); | |
200 | if(off>0){ | |
201 | if(out->planar == in->planar){ | |
202 | int planes = out->planar ? out->ch_count : 1; | |
203 | for(ch=0; ch<planes; ch++){ | |
204 | ctx->simd_f(out->ch+ch, (const uint8_t **)in->ch+ch, off * (out->planar ? 1 :out->ch_count)); | |
205 | } | |
206 | }else{ | |
207 | ctx->simd_f(out->ch, (const uint8_t **)in->ch, off); | |
208 | } | |
209 | } | |
210 | if(off == len) | |
211 | return 0; | |
212 | } | |
213 | ||
214 | for(ch=0; ch<ctx->channels; ch++){ | |
215 | const int ich= ctx->ch_map ? ctx->ch_map[ch] : ch; | |
216 | const int is= ich < 0 ? 0 : (in->planar ? 1 : in->ch_count) * in->bps; | |
217 | const uint8_t *pi= ich < 0 ? ctx->silence : in->ch[ich]; | |
218 | uint8_t *po= out->ch[ch]; | |
219 | uint8_t *end= po + os*len; | |
220 | if(!po) | |
221 | continue; | |
222 | ctx->conv_f(po+off*os, pi+off*is, is, os, end); | |
223 | } | |
224 | return 0; | |
225 | } |