FFmpeg
aacpsdsp_init.c
Go to the documentation of this file.
1 /*
2  * SIMD optimized MPEG-4 Parametric Stereo decoding functions
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 #include <stddef.h>
22 
23 #include "config.h"
24 
25 #include "libavutil/x86/cpu.h"
26 #include "libavutil/attributes.h"
27 #include "libavcodec/aacpsdsp.h"
28 
29 void ff_ps_add_squares_sse (float *dst, const float (*src)[2], int n);
30 void ff_ps_add_squares_sse3 (float *dst, const float (*src)[2], int n);
31 void ff_ps_mul_pair_single_sse (float (*dst)[2], float (*src0)[2],
32  float *src1, int n);
33 void ff_ps_hybrid_analysis_sse (float (*out)[2], float (*in)[2],
34  const float (*filter)[8][2],
35  ptrdiff_t stride, int n);
36 void ff_ps_hybrid_analysis_fma3(float (*out)[2], float (*in)[2],
37  const float (*filter)[8][2],
38  ptrdiff_t stride, int n);
39 void ff_ps_stereo_interpolate_sse3(float (*l)[2], float (*r)[2],
40  float h[2][4], float h_step[2][4],
41  int len);
42 void ff_ps_stereo_interpolate_ipdopd_sse3(float (*l)[2], float (*r)[2],
43  float h[2][4], float h_step[2][4],
44  int len);
45 void ff_ps_hybrid_synthesis_deint_sse(float out[2][38][64], float (*in)[32][2],
46  int i, int len);
47 void ff_ps_hybrid_synthesis_deint_sse4(float out[2][38][64], float (*in)[32][2],
48  int i, int len);
49 void ff_ps_hybrid_analysis_ileave_sse(float (*out)[32][2], float L[2][38][64],
50  int i, int len);
51 
53 {
55 
56  if (EXTERNAL_SSE(cpu_flags)) {
57  s->add_squares = ff_ps_add_squares_sse;
58  s->mul_pair_single = ff_ps_mul_pair_single_sse;
59  s->hybrid_analysis_ileave = ff_ps_hybrid_analysis_ileave_sse;
60  s->hybrid_synthesis_deint = ff_ps_hybrid_synthesis_deint_sse;
61  s->hybrid_analysis = ff_ps_hybrid_analysis_sse;
62  }
63  if (EXTERNAL_SSE3(cpu_flags)) {
64  s->add_squares = ff_ps_add_squares_sse3;
65  s->stereo_interpolate[0] = ff_ps_stereo_interpolate_sse3;
66  s->stereo_interpolate[1] = ff_ps_stereo_interpolate_ipdopd_sse3;
67  }
68  if (EXTERNAL_SSE4(cpu_flags)) {
69  s->hybrid_synthesis_deint = ff_ps_hybrid_synthesis_deint_sse4;
70  }
71  if (EXTERNAL_FMA3(cpu_flags)) {
72  s->hybrid_analysis = ff_ps_hybrid_analysis_fma3;
73  }
74 }
cpu.h
r
const char * r
Definition: vf_curves.c:126
out
FILE * out
Definition: movenc.c:54
src1
const pixel * src1
Definition: h264pred_template.c:421
filter
filter_frame For filters that do not use the this method is called when a frame is pushed to the filter s input It can be called at any time except in a reentrant way If the input frame is enough to produce then the filter should push the output frames on the output link immediately As an exception to the previous rule if the input frame is enough to produce several output frames then the filter needs output only at least one per link The additional frames can be left buffered in the filter
Definition: filter_design.txt:228
av_get_cpu_flags
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
Definition: cpu.c:103
cpu_flags
static atomic_int cpu_flags
Definition: cpu.c:52
ff_ps_hybrid_analysis_sse
void ff_ps_hybrid_analysis_sse(float(*out)[2], float(*in)[2], const float(*filter)[8][2], ptrdiff_t stride, int n)
ff_ps_stereo_interpolate_sse3
void ff_ps_stereo_interpolate_sse3(float(*l)[2], float(*r)[2], float h[2][4], float h_step[2][4], int len)
av_cold
#define av_cold
Definition: attributes.h:90
aacpsdsp.h
ff_ps_hybrid_synthesis_deint_sse
void ff_ps_hybrid_synthesis_deint_sse(float out[2][38][64], float(*in)[32][2], int i, int len)
s
#define s(width, name)
Definition: cbs_vp9.c:256
EXTERNAL_SSE
#define EXTERNAL_SSE(flags)
Definition: cpu.h:58
ff_ps_mul_pair_single_sse
void ff_ps_mul_pair_single_sse(float(*dst)[2], float(*src0)[2], float *src1, int n)
EXTERNAL_SSE3
#define EXTERNAL_SSE3(flags)
Definition: cpu.h:62
ff_psdsp_init_x86
av_cold void ff_psdsp_init_x86(PSDSPContext *s)
Definition: aacpsdsp_init.c:52
ff_ps_hybrid_analysis_ileave_sse
void ff_ps_hybrid_analysis_ileave_sse(float(*out)[32][2], float L[2][38][64], int i, int len)
ff_ps_add_squares_sse
void ff_ps_add_squares_sse(float *dst, const float(*src)[2], int n)
attributes.h
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:269
len
int len
Definition: vorbis_enc_data.h:426
ff_ps_hybrid_analysis_fma3
void ff_ps_hybrid_analysis_fma3(float(*out)[2], float(*in)[2], const float(*filter)[8][2], ptrdiff_t stride, int n)
stride
#define stride
Definition: h264pred_template.c:537
EXTERNAL_SSE4
#define EXTERNAL_SSE4(flags)
Definition: cpu.h:68
PSDSPContext
Definition: aacpsdsp.h:32
ff_ps_hybrid_synthesis_deint_sse4
void ff_ps_hybrid_synthesis_deint_sse4(float out[2][38][64], float(*in)[32][2], int i, int len)
L
#define L(x)
Definition: vpx_arith.h:36
src0
const pixel *const src0
Definition: h264pred_template.c:420
src
INIT_CLIP pixel * src
Definition: h264pred_template.c:418
h
h
Definition: vp9dsp_template.c:2038
ff_ps_add_squares_sse3
void ff_ps_add_squares_sse3(float *dst, const float(*src)[2], int n)
EXTERNAL_FMA3
#define EXTERNAL_FMA3(flags)
Definition: cpu.h:74
ff_ps_stereo_interpolate_ipdopd_sse3
void ff_ps_stereo_interpolate_ipdopd_sse3(float(*l)[2], float(*r)[2], float h[2][4], float h_step[2][4], int len)