FFmpeg
scene_sad_init.c
Go to the documentation of this file.
1 /*
2  * This file is part of FFmpeg.
3  *
4  * FFmpeg is free software; you can redistribute it and/or
5  * modify it under the terms of the GNU Lesser General Public
6  * License as published by the Free Software Foundation; either
7  * version 2.1 of the License, or (at your option) any later version.
8  *
9  * FFmpeg is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12  * Lesser General Public License for more details.
13  *
14  * You should have received a copy of the GNU Lesser General Public
15  * License along with FFmpeg; if not, write to the Free Software
16  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17  */
18 
19 #include "libavutil/cpu.h"
20 #include "libavutil/x86/cpu.h"
21 #include "libavfilter/scene_sad.h"
22 
23 #define SCENE_SAD_FUNC(FUNC_NAME, ASM_FUNC_NAME, MMSIZE) \
24 void ASM_FUNC_NAME(SCENE_SAD_PARAMS); \
25  \
26 static void FUNC_NAME(SCENE_SAD_PARAMS) { \
27  uint64_t sad[MMSIZE / 8] = {0}; \
28  ptrdiff_t awidth = width & ~(MMSIZE - 1); \
29  *sum = 0; \
30  ASM_FUNC_NAME(src1, stride1, src2, stride2, awidth, height, sad); \
31  for (int i = 0; i < MMSIZE / 8; i++) \
32  *sum += sad[i]; \
33  ff_scene_sad_c(src1 + awidth, stride1, \
34  src2 + awidth, stride2, \
35  width - awidth, height, sad); \
36  *sum += sad[0]; \
37 }
38 
39 #define SCENE_SAD16_FUNC(FUNC_NAME, ASM_FUNC_NAME, MMSIZE) \
40 void ASM_FUNC_NAME(SCENE_SAD_PARAMS); \
41  \
42 static void FUNC_NAME(SCENE_SAD_PARAMS) { \
43  uint64_t sad[MMSIZE / 8] = {0}; \
44  ptrdiff_t bytes = (width << 1) & ~(MMSIZE - 1); \
45  *sum = 0; \
46  ASM_FUNC_NAME(src1, stride1, src2, stride2, bytes, height, sad); \
47  for (int i = 0; i < MMSIZE / 8; i++) \
48  *sum += sad[i]; \
49  ff_scene_sad16_c(src1 + bytes, stride1, \
50  src2 + bytes, stride2, \
51  width - (bytes >> 1), height, sad); \
52  *sum += sad[0]; \
53 }
54 
55 #if HAVE_X86ASM
56 SCENE_SAD_FUNC(scene_sad_sse2, ff_scene_sad8_sse2, 16)
57 #if HAVE_AVX2_EXTERNAL
58 SCENE_SAD_FUNC(scene_sad_avx2, ff_scene_sad8_avx2, 32)
59 SCENE_SAD16_FUNC(scene_sad16_avx2, ff_scene_sad16_avx2, 32)
60 #endif
61 #if HAVE_AVX512_EXTERNAL
62 SCENE_SAD_FUNC(scene_sad_avx512, ff_scene_sad8_avx512, 64)
63 SCENE_SAD16_FUNC(scene_sad16_avx512, ff_scene_sad16_avx512, 64)
64 #endif
65 #endif
66 
68 {
69 #if HAVE_X86ASM
71  if (depth <= 8) {
72 #if HAVE_AVX512_EXTERNAL
74  return scene_sad_avx512;
75 #endif
76 #if HAVE_AVX2_EXTERNAL
78  return scene_sad_avx2;
79 #endif
81  return scene_sad_sse2;
82  } else if (depth < 16) { /* this routine is only safe up to 15 bits */
83 #if HAVE_AVX512_EXTERNAL
85  return scene_sad16_avx512;
86 #endif
87 #if HAVE_AVX2_EXTERNAL
89  return scene_sad16_avx2;
90 #endif
91  }
92 #endif
93  return NULL;
94 }
cpu.h
EXTERNAL_AVX2_FAST
#define EXTERNAL_AVX2_FAST(flags)
Definition: cpu.h:79
av_get_cpu_flags
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
Definition: cpu.c:109
ff_scene_sad_get_fn_x86
ff_scene_sad_fn ff_scene_sad_get_fn_x86(int depth)
Definition: scene_sad_init.c:67
cpu_flags
static atomic_int cpu_flags
Definition: cpu.c:56
SCENE_SAD16_FUNC
#define SCENE_SAD16_FUNC(FUNC_NAME, ASM_FUNC_NAME, MMSIZE)
Definition: scene_sad_init.c:39
NULL
#define NULL
Definition: coverity.c:32
SCENE_SAD_FUNC
#define SCENE_SAD_FUNC(FUNC_NAME, ASM_FUNC_NAME, MMSIZE)
Definition: scene_sad_init.c:23
scene_sad.h
cpu.h
ff_scene_sad_fn
void(* ff_scene_sad_fn)(SCENE_SAD_PARAMS)
Definition: scene_sad.h:34
EXTERNAL_SSE2
#define EXTERNAL_SSE2(flags)
Definition: cpu.h:59
EXTERNAL_AVX512
#define EXTERNAL_AVX512(flags)
Definition: cpu.h:82