doxygen/2.7/lossless__audiodsp__altivec_8c_source.html

 /*

  * Copyright (c) 2007 Luca Barbato <lu_zero@gentoo.org>

  *

  * This file is part of FFmpeg.

  *

  * FFmpeg is free software; you can redistribute it and/or

  * modify it under the terms of the GNU Lesser General Public

  * License as published by the Free Software Foundation; either

  * version 2.1 of the License, or (at your option) any later version.

  *

  * FFmpeg is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

  * Lesser General Public License for more details.

  *

  * You should have received a copy of the GNU Lesser General Public

  * License along with FFmpeg; if not, write to the Free Software

  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

  */


 #include "config.h"

 #if HAVE_ALTIVEC_H

 #include <altivec.h>

 #endif


 #include "libavutil/attributes.h"

 #include "libavutil/cpu.h"

 #include "libavutil/ppc/cpu.h"

 #include "libavutil/ppc/types_altivec.h"

 #include "libavcodec/lossless_audiodsp.h"


 /*
  * GET_T(tt0, tt1, src, a, b)
  *
  * Fetch the next 16 int16_t values starting at src into the vector pair
  * tt0 (elements 0..7) and tt1 (elements 8..15).
  *
  * Big-endian variant: src may be misaligned, so two aligned vec_ld() loads
  * are merged with vec_perm().  It relies on the caller's scope providing
  *   - align: the permute control vector (not a macro parameter), and
  *   - b:     the aligned vector loaded at offset 0 of src; on exit b holds
  *            the vector at offset 32, i.e. offset 0 of the next 16 values.
  * a is overwritten and only serves as scratch.
  *
  * Little-endian variant: two vec_vsx_ld() loads at byte offsets 0 and 16;
  * a and b are accepted for interface parity and left untouched.
  *
  * The body is wrapped in do { } while (0) so that "GET_T(...);" is a single
  * statement and stays valid inside an unbraced if/else.
  */
 #if HAVE_BIGENDIAN
 #define GET_T(tt0, tt1, src, a, b) do {      \
         a   = vec_ld(16, (src));             \
         tt0 = vec_perm(b, a, align);         \
         b   = vec_ld(32, (src));             \
         tt1 = vec_perm(a, b, align);         \
     } while (0)
 #else
 #define GET_T(tt0, tt1, src, a, b) do {      \
         tt0 = vec_vsx_ld(0,  (src));         \
         tt1 = vec_vsx_ld(16, (src));         \
     } while (0)
 #endif


 #if HAVE_ALTIVEC

 /**
  * AltiVec version of LLAudDSPContext.scalarproduct_and_madd_int16:
  * returns the scalar product of v1 and v2 and updates v1 in place with
  * v1[i] += v3[i] * mul.
  *
  * Each loop iteration consumes 16 int16_t elements (two 8-element vectors)
  * and the loop runs order / 16 times.
  *
  * NOTE(review): the do/while body always runs once and terminates only when
  * the shifted counter reaches zero, so order is presumably required to be a
  * positive multiple of 16 -- confirm against callers.
  * NOTE(review): v1 is accessed through a vec_s16 pointer, which presumably
  * requires it to be 16-byte aligned -- confirm.
  * NOTE(review): on big-endian builds the permute vector is derived from v2
  * only and reused for the v3 loads, so v3 presumably must share v2's
  * misalignment -- confirm.
  *
  * @param v1    vector that is multiplied with v2 and updated in place
  * @param v2    second operand of the scalar product
  * @param v3    vector scaled by mul and added to v1
  * @param order number of int16_t elements to process
  * @param mul   multiplier applied to v3 (replicated into eight 16-bit lanes)
  * @return the accumulated scalar product of v1 and v2
  */
 static int32_t scalarproduct_and_madd_int16_altivec(int16_t *v1,

                                                     const int16_t *v2,

                                                     const int16_t *v3,

                                                     int order, int mul)

 {

     LOAD_ZERO;

     vec_s16 *pv1 = (vec_s16 *) v1;

     /* mul replicated into every 16-bit lane */
     register vec_s16 muls = { mul, mul, mul, mul, mul, mul, mul, mul };

     register vec_s16 t0, t1, i0, i1, i4, i2, i3;

     /* running 32-bit partial sums of the scalar product */
     register vec_s32 res = zero_s32v;

 #if HAVE_BIGENDIAN

     /* permute control vector computed from the address of v2; the
      * big-endian GET_T picks it up by name for both v2 and v3 */
     register vec_u8 align = vec_lvsl(0, v2);

     /* prime the "previous aligned vector" that GET_T carries from one
      * iteration to the next (i2 for v2, i3 for v3) */
     i2 = vec_ld(0, v2);

     i3 = vec_ld(0, v3);

 #endif

     int32_t ires;


     /* convert the element count into a count of 16-element iterations */
     order >>= 4;

     do {

         /* t0/t1 = next 16 values of v2; i1 is only scratch here (and is
          * ignored entirely by the little-endian GET_T) */
         GET_T(t0,t1,v2,i1,i2);

         /* current 16 values of v1; i1 is reused now that GET_T is done */
         i0     = pv1[0];

         i1     = pv1[1];

         /* accumulate the v2 * v1 products into the partial sums */
         res    = vec_msum(t0, i0, res);

         res    = vec_msum(t1, i1, res);

         /* t0/t1 = next 16 values of v3 (i4 scratch, i3 carried) */
         GET_T(t0,t1,v3,i4,i3);

         /* v1 += v3 * mul, written back in place */
         pv1[0] = vec_mladd(t0, muls, i0);

         pv1[1] = vec_mladd(t1, muls, i1);

         pv1   += 2;

         v2    += 16;

         v3    += 16;

     } while (--order);

     /* fold the partial sums into lane 3, then broadcast that lane so the
      * single-element store below writes the total regardless of which lane
      * it picks */
     res = vec_splat(vec_sums(res, zero_s32v), 3);

     vec_ste(res, 0, &ires);


     return ires;

 }

 #endif /* HAVE_ALTIVEC */


 /**
  * Hook the PowerPC implementations into a lossless-audio DSP context.
  *
  * In builds with HAVE_ALTIVEC, the run-time CPU flags are queried and, if
  * PPC_ALTIVEC() accepts them, scalarproduct_and_madd_int16 is pointed at the
  * AltiVec routine. In every other case the context is left unchanged.
  *
  * @param c DSP context whose function pointer may be replaced
  */
 av_cold void ff_llauddsp_init_ppc(LLAudDSPContext *c)
 {
 #if HAVE_ALTIVEC
     const int cpu_flags = av_get_cpu_flags();

     if (PPC_ALTIVEC(cpu_flags))
         c->scalarproduct_and_madd_int16 = scalarproduct_and_madd_int16_altivec;
 #endif /* HAVE_ALTIVEC */
 }

zero_s32v
#define zero_s32v
Definition: types_altivec.h:45

cpu.h

ff_llauddsp_init_ppc
av_cold void ff_llauddsp_init_ppc(LLAudDSPContext *c)
Definition: lossless_audiodsp_altivec.c:85

vec_s32
#define vec_s32
Definition: types_altivec.h:32

attributes.h
Macro definitions for various function/variable attributes.

config.h

av_cold
#define av_cold
Definition: attributes.h:74

t0
#define t0
Definition: regdef.h:28

vec_s16
#define vec_s16
Definition: types_altivec.h:30

LLAudDSPContext
Definition: lossless_audiodsp.h:28

PPC_ALTIVEC
#define PPC_ALTIVEC(flags)
Definition: cpu.h:26

t1
#define t1
Definition: regdef.h:29

LOAD_ZERO
#define LOAD_ZERO
Definition: types_altivec.h:38

lossless_audiodsp.h

int32_t
int32_t
Definition: audio_convert.c:194

align
const AVS_VideoInfo int align
Definition: avisynth_c.h:658

vec_u8
#define vec_u8
Definition: types_altivec.h:27

types_altivec.h

cpu.h

LLAudDSPContext::scalarproduct_and_madd_int16
int32_t(* scalarproduct_and_madd_int16)(int16_t *v1, const int16_t *v2, const int16_t *v3, int len, int mul)
Calculate scalar product of v1 and v2, and v1[i] += v3[i] * mul.
Definition: lossless_audiodsp.h:35

av_get_cpu_flags
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
Definition: cpu.c:76

c
static double c[64]
Definition: vsrc_mptestsrc.c:87

GET_T
#define GET_T(tt0, tt1, src, a, b)
Definition: lossless_audiodsp_altivec.c:40