FFmpeg
vf_idetdsp_init.c
Go to the documentation of this file.
1 /*
2  * This file is part of FFmpeg.
3  *
4  * FFmpeg is free software; you can redistribute it and/or
5  * modify it under the terms of the GNU Lesser General Public
6  * License as published by the Free Software Foundation; either
7  * version 2.1 of the License, or (at your option) any later version.
8  *
9  * FFmpeg is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12  * Lesser General Public License for more details.
13  *
14  * You should have received a copy of the GNU Lesser General Public
15  * License along with FFmpeg; if not, write to the Free Software
16  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17  */
18 
19 #include "libavutil/attributes.h"
20 #include "libavutil/cpu.h"
21 #include "libavutil/x86/asm.h"
22 #include "libavutil/x86/cpu.h"
23 #include "libavfilter/vf_idetdsp.h"
24 
25 #if HAVE_X86ASM
26 
/*
 * FUNC_MAIN_DECL(KIND, SPAN)
 *
 * Declares the prototype of ff_idet_filter_line_<KIND>() and defines the
 * static wrapper idet_filter_line_<KIND>() around it.
 *
 * The wrapper splits a line of w bytes in two:
 *   - the leading part, whose length is w rounded down to a multiple of SPAN,
 *     is handed to ff_idet_filter_line_<KIND>() (skipped when it is empty);
 *   - the remaining (w & (SPAN - 1)) bytes are handed to
 *     ff_idet_filter_line_c() (skipped when there are none).
 * The wrapper returns the sum of the two partial results.
 *
 * SPAN must be a power of two, because the remainder is taken with a bit
 * mask. It is parenthesized in the expansion so that an expression passed
 * as SPAN cannot change the meaning of the mask.
 */
#define FUNC_MAIN_DECL(KIND, SPAN)                                            \
int ff_idet_filter_line_##KIND(const uint8_t *a, const uint8_t *b,            \
                               const uint8_t *c, int w);                      \
static int idet_filter_line_##KIND(const uint8_t *a, const uint8_t *b,        \
                                   const uint8_t *c, int w) {                 \
    int sum = 0;                                                              \
    const int left_over = w & ((SPAN) - 1);                                   \
    const int w_main    = w - left_over;                                      \
    if (w_main > 0)                                                           \
        sum += ff_idet_filter_line_##KIND(a, b, c, w_main);                   \
    if (left_over > 0)                                                        \
        sum += ff_idet_filter_line_c(a + w_main, b + w_main, c + w_main,      \
                                     left_over);                              \
    return sum;                                                               \
}
42 
43 
/*
 * FUNC_MAIN_DECL_16bit(KIND, SPAN)
 *
 * Declares the prototype of ff_idet_filter_line_16bit_<KIND>() and defines
 * the static wrapper idet_filter_line_16bit_<KIND>() around it.
 *
 * The wrapper splits a line of width w in two:
 *   - the leading part, w rounded down to a multiple of SPAN, is handed to
 *     ff_idet_filter_line_16bit_<KIND>() (skipped when it is empty);
 *   - the remaining (w & (SPAN - 1)) elements are handed to
 *     ff_idet_filter_line_c_16bit() (skipped when there are none).
 * The wrapper returns the sum of the two partial results.
 *
 * a, b and c are byte pointers, so the tail starts at twice the leading
 * width in bytes; this presumably reflects w being counted in 16-bit
 * samples (confirm against the callers).
 *
 * SPAN must be a power of two, because the remainder is taken with a bit
 * mask. It is parenthesized in the expansion so that an expression passed
 * as SPAN cannot change the meaning of the mask.
 */
#define FUNC_MAIN_DECL_16bit(KIND, SPAN)                                      \
int ff_idet_filter_line_16bit_##KIND(const uint8_t *a, const uint8_t *b,      \
                                     const uint8_t *c, int w);                \
static int idet_filter_line_16bit_##KIND(const uint8_t *a, const uint8_t *b,  \
                                         const uint8_t *c, int w) {           \
    int sum = 0;                                                              \
    const int left_over = w & ((SPAN) - 1);                                   \
    const int w_main    = w - left_over;                                      \
    const int offset    = w_main << 1;                                        \
    if (w_main > 0)                                                           \
        sum += ff_idet_filter_line_16bit_##KIND(a, b, c, w_main);             \
    if (left_over > 0) {                                                      \
        sum += ff_idet_filter_line_c_16bit(a + offset, b + offset,            \
                                           c + offset, left_over);            \
    }                                                                         \
    return sum;                                                               \
}
61 
/*
 * Instantiate the 8-bit and 16-bit wrappers for each instruction-set suffix.
 * The second argument is SPAN, the block size used to split a line between
 * the suffix-specific routine and the C fallback. For every suffix the
 * 16-bit SPAN is half of the 8-bit SPAN.
 */
/* sse2: idet_filter_line_sse2() and idet_filter_line_16bit_sse2() */
62 FUNC_MAIN_DECL(sse2, 16)
63 FUNC_MAIN_DECL_16bit(sse2, 8)
64 
/* avx2: idet_filter_line_avx2() and idet_filter_line_16bit_avx2() */
65 FUNC_MAIN_DECL(avx2, 32)
66 FUNC_MAIN_DECL_16bit(avx2, 16)
67 
/* avx512icl: idet_filter_line_avx512icl() and idet_filter_line_16bit_avx512icl() */
68 FUNC_MAIN_DECL(avx512icl, 64)
69 FUNC_MAIN_DECL_16bit(avx512icl, 32)
70 
71 #endif
73 {
74 #if HAVE_X86ASM
75  const int cpu_flags = av_get_cpu_flags();
76 
77  if (EXTERNAL_SSE2(cpu_flags)) {
78  dsp->filter_line = depth > 8 ? idet_filter_line_16bit_sse2 : idet_filter_line_sse2;
79  }
80  if (EXTERNAL_AVX2(cpu_flags)) {
81  dsp->filter_line = depth > 8 ? idet_filter_line_16bit_avx2 : idet_filter_line_avx2;
82  }
84  dsp->filter_line = depth > 8 ? idet_filter_line_16bit_avx512icl : idet_filter_line_avx512icl;
85  }
86 #endif // HAVE_X86ASM
87 }
cpu.h
av_get_cpu_flags
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
Definition: cpu.c:109
cpu_flags
static atomic_int cpu_flags
Definition: cpu.c:56
EXTERNAL_AVX2
#define EXTERNAL_AVX2(flags)
Definition: cpu.h:78
av_cold
#define av_cold
Definition: attributes.h:106
vf_idetdsp.h
IDETDSPContext::filter_line
ff_idet_filter_func filter_line
Definition: vf_idetdsp.h:27
asm.h
cpu.h
attributes.h
EXTERNAL_SSE2
#define EXTERNAL_SSE2(flags)
Definition: cpu.h:59
ff_idet_dsp_init_x86
av_cold void ff_idet_dsp_init_x86(IDETDSPContext *dsp, int depth)
Definition: vf_idetdsp_init.c:72
EXTERNAL_AVX512ICL
#define EXTERNAL_AVX512ICL(flags)
Definition: cpu.h:83
IDETDSPContext
Definition: vf_idetdsp.h:26