2 * Lossless video DSP utils
4 * This file is part of FFmpeg.
6 * FFmpeg is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with FFmpeg; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21 #include "../lossless_videodsp.h"
22 #include "libavutil/pixdesc.h"
23 #include "libavutil/x86/cpu.h"
25 void ff_add_int16_mmx(uint16_t *dst
, const uint16_t *src
, unsigned mask
, int w
);
26 void ff_add_int16_sse2(uint16_t *dst
, const uint16_t *src
, unsigned mask
, int w
);
27 void ff_diff_int16_mmx (uint16_t *dst
, const uint16_t *src1
, const uint16_t *src2
, unsigned mask
, int w
);
28 void ff_diff_int16_sse2(uint16_t *dst
, const uint16_t *src1
, const uint16_t *src2
, unsigned mask
, int w
);
29 int ff_add_hfyu_left_pred_int16_ssse3(uint16_t *dst
, const uint16_t *src
, unsigned mask
, int w
, unsigned acc
);
30 int ff_add_hfyu_left_pred_int16_sse4(uint16_t *dst
, const uint16_t *src
, unsigned mask
, int w
, unsigned acc
);
31 void ff_add_hfyu_median_pred_int16_mmxext(uint16_t *dst
, const uint16_t *top
, const uint16_t *diff
, unsigned mask
, int w
, int *left
, int *left_top
);
32 void ff_sub_hfyu_median_pred_int16_mmxext(uint16_t *dst
, const uint16_t *src1
, const uint16_t *src2
, unsigned mask
, int w
, int *left
, int *left_top
);
35 void ff_llviddsp_init_x86(LLVidDSPContext
*c
, AVCodecContext
*avctx
)
37 int cpu_flags
= av_get_cpu_flags();
38 const AVPixFmtDescriptor
*pix_desc
= av_pix_fmt_desc_get(avctx
->pix_fmt
);
40 if (EXTERNAL_MMX(cpu_flags
)) {
41 c
->add_int16
= ff_add_int16_mmx
;
42 c
->diff_int16
= ff_diff_int16_mmx
;
45 if (EXTERNAL_MMXEXT(cpu_flags
) && pix_desc
->comp
[0].depth_minus1
<15) {
46 c
->add_hfyu_median_pred_int16
= ff_add_hfyu_median_pred_int16_mmxext
;
47 c
->sub_hfyu_median_pred_int16
= ff_sub_hfyu_median_pred_int16_mmxext
;
50 if (EXTERNAL_SSE2(cpu_flags
)) {
51 c
->add_int16
= ff_add_int16_sse2
;
52 c
->diff_int16
= ff_diff_int16_sse2
;
55 if (EXTERNAL_SSSE3(cpu_flags
)) {
56 c
->add_hfyu_left_pred_int16
= ff_add_hfyu_left_pred_int16_ssse3
;
59 if (EXTERNAL_SSE4(cpu_flags
)) {
60 c
->add_hfyu_left_pred_int16
= ff_add_hfyu_left_pred_int16_sse4
;