/*
 * Copyright (c) 2006 Michael Niedermayer <michaelni@gmx.at>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * @author Michael Niedermayer <michaelni@gmx.at>
 */
28 #include "libavutil/avstring.h"
29 #include "libavutil/avassert.h"
30 #include "libavutil/libm.h"
31 #include "libavutil/samplefmt.h"
32 #include "audioconvert.h"
/**
 * Build the identifier of the converter that reads src_fmt samples and
 * writes dst_fmt samples, e.g. conv_<src_fmt>_to_<dst_fmt>.
 * The arguments are pasted as tokens; they are not evaluated.
 */
#define CONV_FUNC_NAME(dst_fmt, src_fmt) conv_ ## src_fmt ## _to_ ## dst_fmt

/**
 * Define a static converter function named CONV_FUNC_NAME(ofmt, ifmt).
 *
 * @param ofmt  output format token, used only to build the function name
 * @param otype C type stored through the output pointer for each sample
 * @param ifmt  input format token, used only to build the function name
 * @param expr  expression producing one output sample; it is evaluated once
 *              per sample and is expected to read the current input via `pi`
 *
 * The generated function has the parameters
 *   po  - current output position
 *   pi  - current input position
 *   is  - input stride in bytes, added to pi after every sample
 *   os  - output stride in bytes, added to po after every sample
 *   end - output position at which conversion stops (exclusive)
 *
 * The first loop handles four samples per iteration while at least four
 * remain (po + 3*os is still before end); the second loop handles the tail.
 *
 * NOTE(review): the brace and loop-header lines were absent from the damaged
 * listing this block was restored from - confirm against the upstream file.
 */
#define CONV_FUNC(ofmt, otype, ifmt, expr)\
static void CONV_FUNC_NAME(ofmt, ifmt)(uint8_t *po, const uint8_t *pi, int is, int os, uint8_t *end)\
{\
    uint8_t *end2 = end - 3*os;\
    while(po < end2){\
        *(otype*)po = expr; pi += is; po += os;\
        *(otype*)po = expr; pi += is; po += os;\
        *(otype*)po = expr; pi += is; po += os;\
        *(otype*)po = expr; pi += is; po += os;\
    }\
    while(po < end){\
        *(otype*)po = expr; pi += is; po += os;\
    }\
}
53 //FIXME put things below under ifdefs so we do not waste space for cases no codec will need
54 CONV_FUNC(AV_SAMPLE_FMT_U8
, uint8_t, AV_SAMPLE_FMT_U8
, *(const uint8_t*)pi
)
55 CONV_FUNC(AV_SAMPLE_FMT_S16
, int16_t, AV_SAMPLE_FMT_U8
, (*(const uint8_t*)pi
- 0x80U
)<<8)
56 CONV_FUNC(AV_SAMPLE_FMT_S32
, int32_t, AV_SAMPLE_FMT_U8
, (*(const uint8_t*)pi
- 0x80U
)<<24)
57 CONV_FUNC(AV_SAMPLE_FMT_FLT
, float , AV_SAMPLE_FMT_U8
, (*(const uint8_t*)pi
- 0x80)*(1.0f
/ (1<<7)))
58 CONV_FUNC(AV_SAMPLE_FMT_DBL
, double , AV_SAMPLE_FMT_U8
, (*(const uint8_t*)pi
- 0x80)*(1.0 / (1<<7)))
59 CONV_FUNC(AV_SAMPLE_FMT_U8
, uint8_t, AV_SAMPLE_FMT_S16
, (*(const int16_t*)pi
>>8) + 0x80)
60 CONV_FUNC(AV_SAMPLE_FMT_S16
, int16_t, AV_SAMPLE_FMT_S16
, *(const int16_t*)pi
)
61 CONV_FUNC(AV_SAMPLE_FMT_S32
, int32_t, AV_SAMPLE_FMT_S16
, *(const int16_t*)pi
<<16)
62 CONV_FUNC(AV_SAMPLE_FMT_FLT
, float , AV_SAMPLE_FMT_S16
, *(const int16_t*)pi
*(1.0f
/ (1<<15)))
63 CONV_FUNC(AV_SAMPLE_FMT_DBL
, double , AV_SAMPLE_FMT_S16
, *(const int16_t*)pi
*(1.0 / (1<<15)))
64 CONV_FUNC(AV_SAMPLE_FMT_U8
, uint8_t, AV_SAMPLE_FMT_S32
, (*(const int32_t*)pi
>>24) + 0x80)
65 CONV_FUNC(AV_SAMPLE_FMT_S16
, int16_t, AV_SAMPLE_FMT_S32
, *(const int32_t*)pi
>>16)
66 CONV_FUNC(AV_SAMPLE_FMT_S32
, int32_t, AV_SAMPLE_FMT_S32
, *(const int32_t*)pi
)
67 CONV_FUNC(AV_SAMPLE_FMT_FLT
, float , AV_SAMPLE_FMT_S32
, *(const int32_t*)pi
*(1.0f
/ (1U<<31)))
68 CONV_FUNC(AV_SAMPLE_FMT_DBL
, double , AV_SAMPLE_FMT_S32
, *(const int32_t*)pi
*(1.0 / (1U<<31)))
69 CONV_FUNC(AV_SAMPLE_FMT_U8
, uint8_t, AV_SAMPLE_FMT_FLT
, av_clip_uint8( lrintf(*(const float*)pi
* (1<<7)) + 0x80))
70 CONV_FUNC(AV_SAMPLE_FMT_S16
, int16_t, AV_SAMPLE_FMT_FLT
, av_clip_int16( lrintf(*(const float*)pi
* (1<<15))))
71 CONV_FUNC(AV_SAMPLE_FMT_S32
, int32_t, AV_SAMPLE_FMT_FLT
, av_clipl_int32(llrintf(*(const float*)pi
* (1U<<31))))
72 CONV_FUNC(AV_SAMPLE_FMT_FLT
, float , AV_SAMPLE_FMT_FLT
, *(const float*)pi
)
73 CONV_FUNC(AV_SAMPLE_FMT_DBL
, double , AV_SAMPLE_FMT_FLT
, *(const float*)pi
)
74 CONV_FUNC(AV_SAMPLE_FMT_U8
, uint8_t, AV_SAMPLE_FMT_DBL
, av_clip_uint8( lrint(*(const double*)pi
* (1<<7)) + 0x80))
75 CONV_FUNC(AV_SAMPLE_FMT_S16
, int16_t, AV_SAMPLE_FMT_DBL
, av_clip_int16( lrint(*(const double*)pi
* (1<<15))))
76 CONV_FUNC(AV_SAMPLE_FMT_S32
, int32_t, AV_SAMPLE_FMT_DBL
, av_clipl_int32(llrint(*(const double*)pi
* (1U<<31))))
77 CONV_FUNC(AV_SAMPLE_FMT_FLT
, float , AV_SAMPLE_FMT_DBL
, *(const double*)pi
)
78 CONV_FUNC(AV_SAMPLE_FMT_DBL
, double , AV_SAMPLE_FMT_DBL
, *(const double*)pi
)
80 #define FMT_PAIR_FUNC(out, in) [(out) + AV_SAMPLE_FMT_NB*(in)] = CONV_FUNC_NAME(out, in)
82 static conv_func_type
* const fmt_pair_to_conv_functions
[AV_SAMPLE_FMT_NB
*AV_SAMPLE_FMT_NB
] = {
83 FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8
, AV_SAMPLE_FMT_U8
),
84 FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16
, AV_SAMPLE_FMT_U8
),
85 FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32
, AV_SAMPLE_FMT_U8
),
86 FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT
, AV_SAMPLE_FMT_U8
),
87 FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL
, AV_SAMPLE_FMT_U8
),
88 FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8
, AV_SAMPLE_FMT_S16
),
89 FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16
, AV_SAMPLE_FMT_S16
),
90 FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32
, AV_SAMPLE_FMT_S16
),
91 FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT
, AV_SAMPLE_FMT_S16
),
92 FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL
, AV_SAMPLE_FMT_S16
),
93 FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8
, AV_SAMPLE_FMT_S32
),
94 FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16
, AV_SAMPLE_FMT_S32
),
95 FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32
, AV_SAMPLE_FMT_S32
),
96 FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT
, AV_SAMPLE_FMT_S32
),
97 FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL
, AV_SAMPLE_FMT_S32
),
98 FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8
, AV_SAMPLE_FMT_FLT
),
99 FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16
, AV_SAMPLE_FMT_FLT
),
100 FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32
, AV_SAMPLE_FMT_FLT
),
101 FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT
, AV_SAMPLE_FMT_FLT
),
102 FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL
, AV_SAMPLE_FMT_FLT
),
103 FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8
, AV_SAMPLE_FMT_DBL
),
104 FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16
, AV_SAMPLE_FMT_DBL
),
105 FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32
, AV_SAMPLE_FMT_DBL
),
106 FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT
, AV_SAMPLE_FMT_DBL
),
107 FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL
, AV_SAMPLE_FMT_DBL
),
/**
 * Copy len bytes (len samples of 1 byte each) from the first source plane
 * to the first destination plane.
 *
 * @param dst array of destination plane pointers; only dst[0] is written
 * @param src array of source plane pointers; only src[0] is read
 * @param len number of 1-byte samples to copy
 */
static void cpy1(uint8_t **dst, const uint8_t **src, int len){
    memcpy(*dst, *src, len);
}
/**
 * Copy 2*len bytes (len samples of 2 bytes each) from the first source plane
 * to the first destination plane.
 *
 * @param dst array of destination plane pointers; only dst[0] is written
 * @param src array of source plane pointers; only src[0] is read
 * @param len number of 2-byte samples to copy
 */
static void cpy2(uint8_t **dst, const uint8_t **src, int len){
    memcpy(*dst, *src, 2*len);
}
/**
 * Copy 4*len bytes (len samples of 4 bytes each) from the first source plane
 * to the first destination plane.
 *
 * @param dst array of destination plane pointers; only dst[0] is written
 * @param src array of source plane pointers; only src[0] is read
 * @param len number of 4-byte samples to copy
 */
static void cpy4(uint8_t **dst, const uint8_t **src, int len){
    memcpy(*dst, *src, 4*len);
}
/**
 * Copy 8*len bytes (len samples of 8 bytes each) from the first source plane
 * to the first destination plane.
 *
 * @param dst array of destination plane pointers; only dst[0] is written
 * @param src array of source plane pointers; only src[0] is read
 * @param len number of 8-byte samples to copy
 */
static void cpy8(uint8_t **dst, const uint8_t **src, int len){
    memcpy(*dst, *src, 8*len);
}
/**
 * Allocate and set up an AudioConvert context for converting samples from
 * in_fmt to out_fmt.
 *
 * What the visible code does:
 *  - looks up the generic converter in fmt_pair_to_conv_functions using the
 *    packed variants of both formats;
 *  - zero-allocates the context with av_mallocz();
 *  - stores channels and ch_map in the context;
 *  - fills ctx->silence with 0x80 when the input format is U8 or U8P;
 *  - when input and output formats are equal and no channel map is given,
 *    selects cpy1/cpy2/cpy4/cpy8 as ctx->simd_f according to the sample size;
 *  - calls the x86 / ARM / AArch64 init hooks when the corresponding build
 *    macros are non-zero.
 *
 * NOTE(review): this listing is missing lines (the rest of the parameter
 * list, local declarations, any NULL checks, the condition around the planar
 * switch, closing braces and the return statement) - confirm those against
 * the complete file before relying on this description.
 */
123 AudioConvert
*swri_audio_convert_alloc(enum AVSampleFormat out_fmt
,
124 enum AVSampleFormat in_fmt
,
125 int channels
, const int *ch_map
,
/* Table index is packed(out_fmt) + AV_SAMPLE_FMT_NB * packed(in_fmt). */
129 conv_func_type
*f
= fmt_pair_to_conv_functions
[av_get_packed_sample_fmt(out_fmt
) + AV_SAMPLE_FMT_NB
*av_get_packed_sample_fmt(in_fmt
)];
/* Zero-initialized allocation: fields not assigned below start out as 0/NULL. */
133 ctx
= av_mallocz(sizeof(*ctx
));
/* Both formats are replaced by their planar variants here.
 * NOTE(review): the condition guarding this, if any, is not visible in this listing. */
138 in_fmt
= av_get_planar_sample_fmt( in_fmt
);
139 out_fmt
= av_get_planar_sample_fmt(out_fmt
);
142 ctx
->channels
= channels
;
144 ctx
->ch_map
= ch_map
;
/* For unsigned 8-bit input the silence buffer is filled with 0x80 instead of
 * the zeros left by av_mallocz(). */
145 if (in_fmt
== AV_SAMPLE_FMT_U8
|| in_fmt
== AV_SAMPLE_FMT_U8P
)
146 memset(ctx
->silence
, 0x80, sizeof(ctx
->silence
));
/* Identical formats without channel remapping: a plain copy routine sized by
 * bytes per sample is installed as simd_f. */
148 if(out_fmt
== in_fmt
&& !ch_map
) {
149 switch(av_get_bytes_per_sample(in_fmt
)){
150 case 1:ctx
->simd_f
= cpy1
; break;
151 case 2:ctx
->simd_f
= cpy2
; break;
152 case 4:ctx
->simd_f
= cpy4
; break;
153 case 8:ctx
->simd_f
= cpy8
; break;
/* Architecture-specific init hooks, selected by build configuration macros. */
157 if(HAVE_YASM
&& HAVE_MMX
) swri_audio_convert_init_x86(ctx
, out_fmt
, in_fmt
, channels
);
158 if(ARCH_ARM
) swri_audio_convert_init_arm(ctx
, out_fmt
, in_fmt
, channels
);
159 if(ARCH_AARCH64
) swri_audio_convert_init_aarch64(ctx
, out_fmt
, in_fmt
, channels
);
/**
 * Release an AudioConvert context.
 *
 * @param ctx address of the caller's AudioConvert pointer
 *
 * NOTE(review): only the signature is present in this listing; the function
 * body is missing, so what exactly is freed or reset cannot be confirmed here.
 */
164 void swri_audio_convert_free(AudioConvert
**ctx
)
/**
 * Convert audio samples from `in` to `out` using the routines stored in ctx.
 *
 * @param ctx conversion context; ctx->channels must equal out->ch_count
 * @param out destination buffers
 * @param in  source buffers
 * @param len used as the per-channel sample count when computing the end of
 *            each output channel (po + os*len)
 *
 * Visible flow: plane pointers are checked against the context's alignment
 * masks; if a simd_f routine is set, no channel map is used and nothing is
 * misaligned, simd_f handles the first `off` samples; the generic conv_f
 * routine is then called per channel starting at sample offset `off`.
 *
 * NOTE(review): this listing is missing lines (declarations of ch, off and
 * m, the computation of off, several braces/else branches and the return
 * statements) - confirm against the complete file.
 */
169 int swri_audio_convert(AudioConvert
*ctx
, AudioData
*out
, AudioData
*in
, int len
)
/* Output stride in bytes between consecutive samples of one channel: one
 * sample for planar output, ch_count samples for interleaved output. */
173 const int os
= (out
->planar
? 1 :out
->ch_count
) *out
->bps
;
174 unsigned misaligned
= 0;
176 av_assert0(ctx
->channels
== out
->ch_count
);
/* OR together all input plane addresses and test them against the input
 * alignment mask; any set bit marks the input as misaligned. */
178 if (ctx
->in_simd_align_mask
) {
179 int planes
= in
->planar
? in
->ch_count
: 1;
181 for (ch
= 0; ch
< planes
; ch
++)
182 m
|= (intptr_t)in
->ch
[ch
];
183 misaligned
|= m
& ctx
->in_simd_align_mask
;
/* Same check for the output plane addresses. */
185 if (ctx
->out_simd_align_mask
) {
186 int planes
= out
->planar
? out
->ch_count
: 1;
188 for (ch
= 0; ch
< planes
; ch
++)
189 m
|= (intptr_t)out
->ch
[ch
];
190 misaligned
|= m
& ctx
->out_simd_align_mask
;
193 //FIXME optimize common cases
/* Fast path: only taken with a simd_f routine, no channel remapping and
 * suitably aligned buffers. */
195 if(ctx
->simd_f
&& !ctx
->ch_map
&& !misaligned
){
198 av_assert1(off
<=len
);
199 av_assert2(ctx
->channels
== SWR_CH_MAX
|| !in
->ch
[ctx
->channels
]);
/* Same layout on both sides: run simd_f once per plane; for interleaved data
 * the count is scaled by the channel count. */
201 if(out
->planar
== in
->planar
){
202 int planes
= out
->planar
? out
->ch_count
: 1;
203 for(ch
=0; ch
<planes
; ch
++){
204 ctx
->simd_f(out
->ch
+ch
, (const uint8_t **)in
->ch
+ch
, off
* (out
->planar
? 1 :out
->ch_count
));
/* Otherwise simd_f is called once with the full plane pointer arrays. */
207 ctx
->simd_f(out
->ch
, (const uint8_t **)in
->ch
, off
);
/* Generic path: convert each output channel with conv_f, starting at sample
 * offset `off`. */
214 for(ch
=0; ch
<ctx
->channels
; ch
++){
/* Input channel index: taken from the channel map when present, else identity. */
215 const int ich
= ctx
->ch_map
? ctx
->ch_map
[ch
] : ch
;
/* A negative mapped index selects the silence buffer as input, read with
 * stride 0 so the same bytes are used for every sample. */
216 const int is
= ich
< 0 ? 0 : (in
->planar
? 1 : in
->ch_count
) * in
->bps
;
217 const uint8_t *pi
= ich
< 0 ? ctx
->silence
: in
->ch
[ich
];
218 uint8_t *po
= out
->ch
[ch
];
219 uint8_t *end
= po
+ os
*len
;
222 ctx
->conv_f(po
+off
*os
, pi
+off
*is
, is
, os
, end
);