1 /*
2  * This file is part of FFmpeg.
3  *
4  * FFmpeg is free software; you can redistribute it and/or
5  * modify it under the terms of the GNU Lesser General Public
6  * License as published by the Free Software Foundation; either
7  * version 2.1 of the License, or (at your option) any later version.
8  *
9  * FFmpeg is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
12  * Lesser General Public License for more details.
13  *
14  * You should have received a copy of the GNU Lesser General Public
15  * License along with FFmpeg; if not, write to the Free Software
16  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17  */
18 
19 #include "config.h"
20 #include "libavutil/attributes.h"
21 #include "libavutil/cpu.h"
22 #include "libavutil/x86/cpu.h"
23 #include "libavcodec/idctdsp.h"
24 #include "libavcodec/xvididct.h"
25 
26 #include "idctdsp.h"
27 #include "xvididct.h"
28 
29 #if ARCH_X86_32 && HAVE_X86ASM
/**
 * IDCT-and-store wrapper built on the MMX Xvid IDCT.
 *
 * Runs ff_xvid_idct_mmx() on the coefficient block (the helper only receives
 * the block pointer, so its output is left in that same buffer) and then
 * hands the block to ff_put_pixels_clamped_mmx() to write it to dest.
 *
 * @param dest      destination passed through to the store routine
 * @param line_size passed through unchanged; presumably the byte stride
 *                  between destination rows (confirm against idctdsp.h)
 * @param block     coefficient block, modified by the transform
 */
static void xvid_idct_mmx_put(uint8_t *dest, ptrdiff_t line_size,
                              short *block)
{
    /* Transform first, then store the transformed block. */
    ff_xvid_idct_mmx(block);
    ff_put_pixels_clamped_mmx(block, dest, line_size);
}
35 
/**
 * IDCT-and-add wrapper built on the MMX Xvid IDCT.
 *
 * Runs ff_xvid_idct_mmx() on the coefficient block (the helper only receives
 * the block pointer, so its output is left in that same buffer) and then
 * hands the block to ff_add_pixels_clamped_mmx() together with dest.
 *
 * @param dest      destination passed through to the add routine
 * @param line_size passed through unchanged; presumably the byte stride
 *                  between destination rows (confirm against idctdsp.h)
 * @param block     coefficient block, modified by the transform
 */
static void xvid_idct_mmx_add(uint8_t *dest, ptrdiff_t line_size,
                              short *block)
{
    /* Transform first, then combine the transformed block with dest. */
    ff_xvid_idct_mmx(block);
    ff_add_pixels_clamped_mmx(block, dest, line_size);
}
41 
/**
 * IDCT-and-store wrapper built on the MMXEXT Xvid IDCT.
 *
 * Runs ff_xvid_idct_mmxext() on the coefficient block and then writes the
 * result to dest. Only the transform is the MMXEXT variant; the store step
 * reuses the plain MMX routine ff_put_pixels_clamped_mmx().
 *
 * @param dest      destination passed through to the store routine
 * @param line_size passed through unchanged; presumably the byte stride
 *                  between destination rows (confirm against idctdsp.h)
 * @param block     coefficient block, modified by the transform
 */
static void xvid_idct_mmxext_put(uint8_t *dest, ptrdiff_t line_size,
                                 short *block)
{
    /* Transform first, then store the transformed block. */
    ff_xvid_idct_mmxext(block);
    ff_put_pixels_clamped_mmx(block, dest, line_size);
}
47 
/**
 * IDCT-and-add wrapper built on the MMXEXT Xvid IDCT.
 *
 * Runs ff_xvid_idct_mmxext() on the coefficient block and then hands the
 * block to the add routine together with dest. Only the transform is the
 * MMXEXT variant; the add step reuses the plain MMX routine
 * ff_add_pixels_clamped_mmx().
 *
 * @param dest      destination passed through to the add routine
 * @param line_size passed through unchanged; presumably the byte stride
 *                  between destination rows (confirm against idctdsp.h)
 * @param block     coefficient block, modified by the transform
 */
static void xvid_idct_mmxext_add(uint8_t *dest, ptrdiff_t line_size,
                                 short *block)
{
    /* Transform first, then combine the transformed block with dest. */
    ff_xvid_idct_mmxext(block);
    ff_add_pixels_clamped_mmx(block, dest, line_size);
}
53 #endif
54 
ff_xvid_idct_init_x86(IDCTDSPContext * c,AVCodecContext * avctx,unsigned high_bit_depth)55 av_cold void ff_xvid_idct_init_x86(IDCTDSPContext *c, AVCodecContext *avctx,
56                                    unsigned high_bit_depth)
57 {
58 #if HAVE_X86ASM
59     int cpu_flags = av_get_cpu_flags();
60 
61     if (high_bit_depth ||
62         !(avctx->idct_algo == FF_IDCT_AUTO ||
63           avctx->idct_algo == FF_IDCT_XVID))
64         return;
65 
66 #if ARCH_X86_32
67     if (EXTERNAL_MMX(cpu_flags)) {
68         c->idct_put  = xvid_idct_mmx_put;
69         c->idct_add  = xvid_idct_mmx_add;
70         c->idct      = ff_xvid_idct_mmx;
71         c->perm_type = FF_IDCT_PERM_NONE;
72     }
73 
74     if (EXTERNAL_MMXEXT(cpu_flags)) {
75         c->idct_put  = xvid_idct_mmxext_put;
76         c->idct_add  = xvid_idct_mmxext_add;
77         c->idct      = ff_xvid_idct_mmxext;
78         c->perm_type = FF_IDCT_PERM_NONE;
79     }
80 #endif
81 
82     if (EXTERNAL_SSE2(cpu_flags)) {
83         c->idct_put  = ff_xvid_idct_put_sse2;
84         c->idct_add  = ff_xvid_idct_add_sse2;
85         c->idct      = ff_xvid_idct_sse2;
86         c->perm_type = FF_IDCT_PERM_SSE2;
87     }
88 #endif /* HAVE_X86ASM */
89 }
90