FFmpeg
aacpsdsp_init.c
Go to the documentation of this file.
1 /*
2  * SIMD optimized MPEG-4 Parametric Stereo decoding functions
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 #include <stddef.h>
22 
23 #include "config.h"
24 
25 #include "libavutil/x86/cpu.h"
26 #include "libavutil/attributes.h"
27 #include "libavcodec/aacpsdsp.h"
28 
/*
 * Prototypes for the SSE/SSE3/SSE4 Parametric Stereo routines that the x86
 * init function in this file installs into a PSDSPContext. Only the
 * declarations live here; the definitions are provided outside this file
 * (presumably hand-written x86 assembly -- confirm against the build).
 *
 * Parameters declared with array syntax (e.g. "float out[2][38][64]") are
 * adjusted to pointers as usual in C; the extents document the expected
 * layout rather than being enforced by the compiler.
 */
void ff_ps_add_squares_sse (float *dst, const float (*src)[2], int n);
void ff_ps_add_squares_sse3(float *dst, const float (*src)[2], int n);

void ff_ps_mul_pair_single_sse(float (*dst)[2], float (*src0)[2],
                               float *src1, int n);

void ff_ps_hybrid_analysis_sse (float (*out)[2], float (*in)[2],
                                const float (*filter)[8][2],
                                ptrdiff_t stride, int n);
void ff_ps_hybrid_analysis_sse3(float (*out)[2], float (*in)[2],
                                const float (*filter)[8][2],
                                ptrdiff_t stride, int n);

void ff_ps_stereo_interpolate_sse3(float (*l)[2], float (*r)[2],
                                   float h[2][4], float h_step[2][4],
                                   int len);
void ff_ps_stereo_interpolate_ipdopd_sse3(float (*l)[2], float (*r)[2],
                                          float h[2][4], float h_step[2][4],
                                          int len);

void ff_ps_hybrid_synthesis_deint_sse (float out[2][38][64],
                                       float (*in)[32][2],
                                       int i, int len);
void ff_ps_hybrid_synthesis_deint_sse4(float out[2][38][64],
                                       float (*in)[32][2],
                                       int i, int len);

void ff_ps_hybrid_analysis_ileave_sse(float (*out)[32][2],
                                      float L[2][38][64],
                                      int i, int len);
51 
53 {
55 
56  if (EXTERNAL_SSE(cpu_flags)) {
57  s->add_squares = ff_ps_add_squares_sse;
58  s->mul_pair_single = ff_ps_mul_pair_single_sse;
59  s->hybrid_analysis_ileave = ff_ps_hybrid_analysis_ileave_sse;
60  s->hybrid_synthesis_deint = ff_ps_hybrid_synthesis_deint_sse;
61  s->hybrid_analysis = ff_ps_hybrid_analysis_sse;
62  }
63  if (EXTERNAL_SSE3(cpu_flags)) {
64  s->add_squares = ff_ps_add_squares_sse3;
65  s->stereo_interpolate[0] = ff_ps_stereo_interpolate_sse3;
66  s->stereo_interpolate[1] = ff_ps_stereo_interpolate_ipdopd_sse3;
67  s->hybrid_analysis = ff_ps_hybrid_analysis_sse3;
68  }
69  if (EXTERNAL_SSE4(cpu_flags)) {
70  s->hybrid_synthesis_deint = ff_ps_hybrid_synthesis_deint_sse4;
71  }
72 }
ff_ps_hybrid_synthesis_deint_sse
void ff_ps_hybrid_synthesis_deint_sse(float out[2][38][64], float(*in)[32][2], int i, int len)
stride
int stride
Definition: mace.c:144
cpu.h
r
const char * r
Definition: vf_curves.c:116
out
FILE * out
Definition: movenc.c:54
ff_ps_hybrid_analysis_sse3
void ff_ps_hybrid_analysis_sse3(float(*out)[2], float(*in)[2], const float(*filter)[8][2], ptrdiff_t stride, int n)
filter
filter_frame For filters that do not use the this method is called when a frame is pushed to the filter s input It can be called at any time except in a reentrant way If the input frame is enough to produce then the filter should push the output frames on the output link immediately As an exception to the previous rule if the input frame is enough to produce several output frames then the filter needs output only at least one per link The additional frames can be left buffered in the filter
Definition: filter_design.txt:228
av_get_cpu_flags
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
Definition: cpu.c:98
cpu_flags
static atomic_int cpu_flags
Definition: cpu.c:50
av_cold
#define av_cold
Definition: attributes.h:90
aacpsdsp.h
s
#define s(width, name)
Definition: cbs_vp9.c:257
EXTERNAL_SSE
#define EXTERNAL_SSE(flags)
Definition: cpu.h:58
ff_ps_stereo_interpolate_sse3
void ff_ps_stereo_interpolate_sse3(float(*l)[2], float(*r)[2], float h[2][4], float h_step[2][4], int len)
ff_ps_hybrid_analysis_ileave_sse
void ff_ps_hybrid_analysis_ileave_sse(float(*out)[32][2], float L[2][38][64], int i, int len)
EXTERNAL_SSE3
#define EXTERNAL_SSE3(flags)
Definition: cpu.h:62
src
#define src
Definition: vp8dsp.c:255
ff_ps_hybrid_synthesis_deint_sse4
void ff_ps_hybrid_synthesis_deint_sse4(float out[2][38][64], float(*in)[32][2], int i, int len)
ff_psdsp_init_x86
av_cold void ff_psdsp_init_x86(PSDSPContext *s)
Definition: aacpsdsp_init.c:52
attributes.h
src0
#define src0
Definition: h264pred.c:139
src1
#define src1
Definition: h264pred.c:140
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:271
len
int len
Definition: vorbis_enc_data.h:426
ff_ps_add_squares_sse
void ff_ps_add_squares_sse(float *dst, const float(*src)[2], int n)
ff_ps_stereo_interpolate_ipdopd_sse3
void ff_ps_stereo_interpolate_ipdopd_sse3(float(*l)[2], float(*r)[2], float h[2][4], float h_step[2][4], int len)
EXTERNAL_SSE4
#define EXTERNAL_SSE4(flags)
Definition: cpu.h:68
L
#define L(x)
Definition: vp56_arith.h:36
PSDSPContext
Definition: aacpsdsp.h:32
ff_ps_mul_pair_single_sse
void ff_ps_mul_pair_single_sse(float(*dst)[2], float(*src0)[2], float *src1, int n)
ff_ps_add_squares_sse3
void ff_ps_add_squares_sse3(float *dst, const float(*src)[2], int n)
ff_ps_hybrid_analysis_sse
void ff_ps_hybrid_analysis_sse(float(*out)[2], float(*in)[2], const float(*filter)[8][2], ptrdiff_t stride, int n)
h
h
Definition: vp9dsp_template.c:2038