FFmpeg
aacpsdsp_init.c
Go to the documentation of this file.
1 /*
2  * SIMD optimized MPEG-4 Parametric Stereo decoding functions
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 #include <stddef.h>
22 
23 #include "config.h"
24 
25 #include "libavutil/x86/cpu.h"
26 #include "libavutil/attributes.h"
27 #include "libavcodec/aacpsdsp.h"
28 
29 void ff_ps_add_squares_sse (float *dst, const float (*src)[2], int n);
30 void ff_ps_add_squares_sse3 (float *dst, const float (*src)[2], int n);
31 void ff_ps_mul_pair_single_sse (float (*dst)[2], float (*src0)[2],
32  float *src1, int n);
33 void ff_ps_hybrid_analysis_sse (float (*out)[2], float (*in)[2],
34  const float (*filter)[8][2],
35  ptrdiff_t stride, int n);
36 void ff_ps_hybrid_analysis_fma3(float (*out)[2], float (*in)[2],
37  const float (*filter)[8][2],
38  ptrdiff_t stride, int n);
39 void ff_ps_stereo_interpolate_sse3(float (*l)[2], float (*r)[2],
40  float h[2][4], float h_step[2][4],
41  int len);
42 void ff_ps_stereo_interpolate_ipdopd_sse3(float (*l)[2], float (*r)[2],
43  float h[2][4], float h_step[2][4],
44  int len);
45 void ff_ps_hybrid_synthesis_deint_sse(float out[2][38][64], float (*in)[32][2],
46  int i, int len);
47 void ff_ps_hybrid_synthesis_deint_sse4(float out[2][38][64], float (*in)[32][2],
48  int i, int len);
49 void ff_ps_hybrid_analysis_ileave_sse(float (*out)[32][2], float L[2][38][64],
50  int i, int len);
51 
53 {
55 
56  if (EXTERNAL_SSE(cpu_flags)) {
57  s->add_squares = ff_ps_add_squares_sse;
58  s->mul_pair_single = ff_ps_mul_pair_single_sse;
59  s->hybrid_analysis_ileave = ff_ps_hybrid_analysis_ileave_sse;
60  s->hybrid_synthesis_deint = ff_ps_hybrid_synthesis_deint_sse;
61  s->hybrid_analysis = ff_ps_hybrid_analysis_sse;
62  }
63  if (EXTERNAL_SSE3(cpu_flags)) {
64  s->add_squares = ff_ps_add_squares_sse3;
65  s->stereo_interpolate[0] = ff_ps_stereo_interpolate_sse3;
66  s->stereo_interpolate[1] = ff_ps_stereo_interpolate_ipdopd_sse3;
67  }
68  if (EXTERNAL_SSE4(cpu_flags)) {
69  s->hybrid_synthesis_deint = ff_ps_hybrid_synthesis_deint_sse4;
70  }
71  if (EXTERNAL_FMA3(cpu_flags)) {
72  s->hybrid_analysis = ff_ps_hybrid_analysis_fma3;
73  }
74 }
cpu.h
r
const char * r
Definition: vf_curves.c:127
out
FILE * out
Definition: movenc.c:55
src1
const pixel * src1
Definition: h264pred_template.c:421
filter
void(* filter)(uint8_t *src, int stride, int qscale)
Definition: h263dsp.c:29
av_get_cpu_flags
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
Definition: cpu.c:107
cpu_flags
static atomic_int cpu_flags
Definition: cpu.c:56
ff_ps_hybrid_analysis_sse
void ff_ps_hybrid_analysis_sse(float(*out)[2], float(*in)[2], const float(*filter)[8][2], ptrdiff_t stride, int n)
ff_ps_stereo_interpolate_sse3
void ff_ps_stereo_interpolate_sse3(float(*l)[2], float(*r)[2], float h[2][4], float h_step[2][4], int len)
av_cold
#define av_cold
Definition: attributes.h:90
aacpsdsp.h
ff_ps_hybrid_synthesis_deint_sse
void ff_ps_hybrid_synthesis_deint_sse(float out[2][38][64], float(*in)[32][2], int i, int len)
s
#define s(width, name)
Definition: cbs_vp9.c:198
EXTERNAL_SSE
#define EXTERNAL_SSE(flags)
Definition: cpu.h:58
ff_ps_mul_pair_single_sse
void ff_ps_mul_pair_single_sse(float(*dst)[2], float(*src0)[2], float *src1, int n)
EXTERNAL_SSE3
#define EXTERNAL_SSE3(flags)
Definition: cpu.h:62
ff_psdsp_init_x86
av_cold void ff_psdsp_init_x86(PSDSPContext *s)
Definition: aacpsdsp_init.c:52
dst
uint8_t ptrdiff_t const uint8_t ptrdiff_t int intptr_t intptr_t int int16_t * dst
Definition: dsp.h:83
ff_ps_hybrid_analysis_ileave_sse
void ff_ps_hybrid_analysis_ileave_sse(float(*out)[32][2], float L[2][38][64], int i, int len)
ff_ps_add_squares_sse
void ff_ps_add_squares_sse(float *dst, const float(*src)[2], int n)
attributes.h
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:256
len
int len
Definition: vorbis_enc_data.h:426
ff_ps_hybrid_analysis_fma3
void ff_ps_hybrid_analysis_fma3(float(*out)[2], float(*in)[2], const float(*filter)[8][2], ptrdiff_t stride, int n)
stride
#define stride
Definition: h264pred_template.c:537
EXTERNAL_SSE4
#define EXTERNAL_SSE4(flags)
Definition: cpu.h:68
PSDSPContext
Definition: aacpsdsp.h:32
ff_ps_hybrid_synthesis_deint_sse4
void ff_ps_hybrid_synthesis_deint_sse4(float out[2][38][64], float(*in)[32][2], int i, int len)
L
#define L(x)
Definition: vpx_arith.h:36
src0
const pixel *const src0
Definition: h264pred_template.c:420
h
h
Definition: vp9dsp_template.c:2070
ff_ps_add_squares_sse3
void ff_ps_add_squares_sse3(float *dst, const float(*src)[2], int n)
EXTERNAL_FMA3
#define EXTERNAL_FMA3(flags)
Definition: cpu.h:74
ff_ps_stereo_interpolate_ipdopd_sse3
void ff_ps_stereo_interpolate_ipdopd_sse3(float(*l)[2], float(*r)[2], float h[2][4], float h_step[2][4], int len)
src
#define src
Definition: vp8dsp.c:248