doxygen/3.1/h264idct__template_8c_source.html

 /*

  * H.264 IDCT

  * Copyright (c) 2004-2011 Michael Niedermayer <michaelni@gmx.at>

  *

  * This file is part of FFmpeg.

  *

  * FFmpeg is free software; you can redistribute it and/or

  * modify it under the terms of the GNU Lesser General Public

  * License as published by the Free Software Foundation; either

  * version 2.1 of the License, or (at your option) any later version.

  *

  * FFmpeg is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

  * Lesser General Public License for more details.

  *

  * You should have received a copy of the GNU Lesser General Public

  * License along with FFmpeg; if not, write to the Free Software

  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

  */


 /**

  * @file

  * H.264 IDCT.

  * @author Michael Niedermayer <michaelni@gmx.at>

  */


 #include "bit_depth_template.c"

 #include "libavutil/common.h"

 #include "h264.h"

 #include "h264idct.h"


 /**
  * Inverse-transform one 4x4 coefficient block and add it to the picture.
  *
  * A rounding bias of 32 is added to block[0], the 16 coefficients are
  * transformed in place (first pass over indices i + 4*k), and the second
  * pass (indices 4*i + k) adds each result, shifted right by 6, to
  * dst[i + k*stride] through av_clip_pixel(). The coefficient block is
  * zeroed before returning.
  *
  * The butterfly sums are evaluated in unsigned arithmetic so that extreme
  * coefficients wrap instead of triggering signed-overflow undefined
  * behaviour; for in-range inputs the results are unchanged.
  *
  * @param _dst   destination samples, accessed as pixel
  * @param _block 16 coefficients, accessed as dctcoef; cleared on return
  * @param stride row distance of _dst; scaled down by the pixel size before
  *               being used as a pixel index
  */
 void FUNCC(ff_h264_idct_add)(uint8_t *_dst, int16_t *_block, int stride)
 {
     int i;
     pixel *dst = (pixel*)_dst;
     dctcoef *block = (dctcoef*)_block;
     stride >>= sizeof(pixel)-1;

     /* rounding term for the final >> 6 */
     block[0] += 1 << 5;

     /* first pass, in place; the >>1 halvings stay signed (arithmetic) */
     for(i=0; i<4; i++){
         const unsigned z0=  block[i + 4*0]     +  (unsigned)block[i + 4*2];
         const unsigned z1=  block[i + 4*0]     -  (unsigned)block[i + 4*2];
         const unsigned z2= (block[i + 4*1]>>1) -  (unsigned)block[i + 4*3];
         const unsigned z3=  block[i + 4*1]     + (unsigned)(block[i + 4*3]>>1);

         block[i + 4*0]= (int)(z0 + z3);
         block[i + 4*1]= (int)(z1 + z2);
         block[i + 4*2]= (int)(z1 - z2);
         block[i + 4*3]= (int)(z0 - z3);
     }

     /* second pass; convert back to int before the arithmetic shift */
     for(i=0; i<4; i++){
         const unsigned z0=  block[0 + 4*i]     +  (unsigned)block[2 + 4*i];
         const unsigned z1=  block[0 + 4*i]     -  (unsigned)block[2 + 4*i];
         const unsigned z2= (block[1 + 4*i]>>1) -  (unsigned)block[3 + 4*i];
         const unsigned z3=  block[1 + 4*i]     + (unsigned)(block[3 + 4*i]>>1);

         dst[i + 0*stride]= av_clip_pixel(dst[i + 0*stride] + ((int)(z0 + z3) >> 6));
         dst[i + 1*stride]= av_clip_pixel(dst[i + 1*stride] + ((int)(z1 + z2) >> 6));
         dst[i + 2*stride]= av_clip_pixel(dst[i + 2*stride] + ((int)(z1 - z2) >> 6));
         dst[i + 3*stride]= av_clip_pixel(dst[i + 3*stride] + ((int)(z0 - z3) >> 6));
     }

     /* leave the coefficient buffer clean for the next block */
     memset(block, 0, 16 * sizeof(dctcoef));
 }


 /**
  * Inverse-transform one 8x8 coefficient block and add it to the picture.
  *
  * A rounding bias of 32 is added to block[0], the 64 coefficients are
  * transformed in place (first pass over indices i + 8*k), and the second
  * pass (indices 8*i + k) adds each result, shifted right by 6, to
  * dst[i + k*stride] through av_clip_pixel(). The coefficient block is
  * zeroed before returning.
  *
  * All additions and subtractions are evaluated in unsigned arithmetic so
  * that extreme coefficients wrap instead of triggering signed-overflow
  * undefined behaviour; the >>1 and >>2 scalings are still applied to signed
  * values. For in-range inputs the results are unchanged.
  *
  * @param _dst   destination samples, accessed as pixel
  * @param _block 64 coefficients, accessed as dctcoef; cleared on return
  * @param stride row distance of _dst; scaled down by the pixel size before
  *               being used as a pixel index
  */
 void FUNCC(ff_h264_idct8_add)(uint8_t *_dst, int16_t *_block, int stride){
     int i;
     pixel *dst = (pixel*)_dst;
     dctcoef *block = (dctcoef*)_block;
     stride >>= sizeof(pixel)-1;

     /* rounding term for the final >> 6 */
     block[0] += 32;

     /* first pass, in place */
     for( i = 0; i < 8; i++ )
     {
         /* even part */
         const unsigned a0 =  block[i+0*8] + (unsigned)block[i+4*8];
         const unsigned a2 =  block[i+0*8] - (unsigned)block[i+4*8];
         const unsigned a4 = (block[i+2*8]>>1) - (unsigned)block[i+6*8];
         const unsigned a6 = (block[i+6*8]>>1) + (unsigned)block[i+2*8];

         const unsigned b0 = a0 + a6;
         const unsigned b2 = a2 + a4;
         const unsigned b4 = a2 - a4;
         const unsigned b6 = a0 - a6;

         /* odd part; kept as int because it is shifted (signed) below */
         const int a1 = (int)(-(unsigned)block[i+3*8] + block[i+5*8] - block[i+7*8] - (block[i+7*8]>>1));
         const int a3 = (int)( (unsigned)block[i+1*8] + block[i+7*8] - block[i+3*8] - (block[i+3*8]>>1));
         const int a5 = (int)(-(unsigned)block[i+1*8] + block[i+7*8] + block[i+5*8] + (block[i+5*8]>>1));
         const int a7 = (int)( (unsigned)block[i+3*8] + block[i+5*8] + block[i+1*8] + (block[i+1*8]>>1));

         const unsigned b1 = (a7>>2) + (unsigned)a1;
         const unsigned b3 = (unsigned)a3 + (a5>>2);
         const unsigned b5 = (a3>>2) - (unsigned)a5;
         const unsigned b7 = (unsigned)a7 - (a1>>2);

         block[i+0*8] = (int)(b0 + b7);
         block[i+7*8] = (int)(b0 - b7);
         block[i+1*8] = (int)(b2 + b5);
         block[i+6*8] = (int)(b2 - b5);
         block[i+2*8] = (int)(b4 + b3);
         block[i+5*8] = (int)(b4 - b3);
         block[i+3*8] = (int)(b6 + b1);
         block[i+4*8] = (int)(b6 - b1);
     }

     /* second pass; results go straight to the destination */
     for( i = 0; i < 8; i++ )
     {
         const unsigned a0 =  block[0+i*8] + (unsigned)block[4+i*8];
         const unsigned a2 =  block[0+i*8] - (unsigned)block[4+i*8];
         const unsigned a4 = (block[2+i*8]>>1) - (unsigned)block[6+i*8];
         const unsigned a6 = (block[6+i*8]>>1) + (unsigned)block[2+i*8];

         const unsigned b0 = a0 + a6;
         const unsigned b2 = a2 + a4;
         const unsigned b4 = a2 - a4;
         const unsigned b6 = a0 - a6;

         const int a1 = (int)(-(unsigned)block[3+i*8] + block[5+i*8] - block[7+i*8] - (block[7+i*8]>>1));
         const int a3 = (int)( (unsigned)block[1+i*8] + block[7+i*8] - block[3+i*8] - (block[3+i*8]>>1));
         const int a5 = (int)(-(unsigned)block[1+i*8] + block[7+i*8] + block[5+i*8] + (block[5+i*8]>>1));
         const int a7 = (int)( (unsigned)block[3+i*8] + block[5+i*8] + block[1+i*8] + (block[1+i*8]>>1));

         const unsigned b1 = (a7>>2) + (unsigned)a1;
         const unsigned b3 = (unsigned)a3 + (a5>>2);
         const unsigned b5 = (a3>>2) - (unsigned)a5;
         const unsigned b7 = (unsigned)a7 - (a1>>2);

         /* convert back to int before the arithmetic shift */
         dst[i + 0*stride] = av_clip_pixel( dst[i + 0*stride] + ((int)(b0 + b7) >> 6) );
         dst[i + 1*stride] = av_clip_pixel( dst[i + 1*stride] + ((int)(b2 + b5) >> 6) );
         dst[i + 2*stride] = av_clip_pixel( dst[i + 2*stride] + ((int)(b4 + b3) >> 6) );
         dst[i + 3*stride] = av_clip_pixel( dst[i + 3*stride] + ((int)(b6 + b1) >> 6) );
         dst[i + 4*stride] = av_clip_pixel( dst[i + 4*stride] + ((int)(b6 - b1) >> 6) );
         dst[i + 5*stride] = av_clip_pixel( dst[i + 5*stride] + ((int)(b4 - b3) >> 6) );
         dst[i + 6*stride] = av_clip_pixel( dst[i + 6*stride] + ((int)(b2 - b5) >> 6) );
         dst[i + 7*stride] = av_clip_pixel( dst[i + 7*stride] + ((int)(b0 - b7) >> 6) );
     }

     /* leave the coefficient buffer clean for the next block */
     memset(block, 0, 64 * sizeof(dctcoef));
 }


 /**
  * Add a DC-only 4x4 block to the picture.
  *
  * Only block[0] is read, so the caller must guarantee that all AC
  * coefficients are 0. The value (block[0] + 32) >> 6 is added to each of the
  * 4x4 destination samples through av_clip_pixel(), and block[0] is reset
  * to 0.
  *
  * @param _dst   destination samples, accessed as pixel
  * @param _block coefficient block, accessed as dctcoef; block[0] is cleared
  * @param stride row distance of _dst; divided by the pixel size before being
  *               used as a pixel index
  */
 void FUNCC(ff_h264_idct_dc_add)(uint8_t *_dst, int16_t *_block, int stride){
     int i, j;
     pixel *dst = (pixel*)_dst;
     dctcoef *block = (dctcoef*)_block;
     int dc = (block[0] + 32) >> 6;
     /* Divide as int: a bare sizeof would convert stride to size_t and turn
      * a negative stride into a huge positive value. */
     stride /= (int)sizeof(pixel);
     block[0] = 0;
     for( j = 0; j < 4; j++ )
     {
         for( i = 0; i < 4; i++ )
             dst[i] = av_clip_pixel( dst[i] + dc );
         dst += stride;
     }
 }


 /**
  * Add a DC-only 8x8 block to the picture.
  *
  * Only block[0] is read. The value (block[0] + 32) >> 6 is added to each of
  * the 8x8 destination samples through av_clip_pixel(), and block[0] is
  * reset to 0.
  *
  * @param _dst   destination samples, accessed as pixel
  * @param _block coefficient block, accessed as dctcoef; block[0] is cleared
  * @param stride row distance of _dst; divided by the pixel size before being
  *               used as a pixel index
  */
 void FUNCC(ff_h264_idct8_dc_add)(uint8_t *_dst, int16_t *_block, int stride){
     int i, j;
     pixel *dst = (pixel*)_dst;
     dctcoef *block = (dctcoef*)_block;
     int dc = (block[0] + 32) >> 6;
     block[0] = 0;
     /* Divide as int: a bare sizeof would convert stride to size_t and turn
      * a negative stride into a huge positive value. */
     stride /= (int)sizeof(pixel);
     for( j = 0; j < 8; j++ )
     {
         for( i = 0; i < 8; i++ )
             dst[i] = av_clip_pixel( dst[i] + dc );
         dst += stride;
     }
 }


 void FUNCC(ff_h264_idct_add16)(uint8_t *dst, const int *block_offset, int16_t *block, int stride, const uint8_t nnzc[15*8]){

     int i;

     for(i=0; i<16; i++){

         int nnz = nnzc[ scan8[i] ];

         if(nnz){

             if(nnz==1 && ((dctcoef*)block)[i*16]) FUNCC(ff_h264_idct_dc_add)(dst + block_offset[i], block + i*16*sizeof(pixel), stride);

             else                                  FUNCC(ff_h264_idct_add   )(dst + block_offset[i], block + i*16*sizeof(pixel), stride);

         }

     }

 }


 void FUNCC(ff_h264_idct_add16intra)(uint8_t *dst, const int *block_offset, int16_t *block, int stride, const uint8_t nnzc[15*8]){

     int i;

     for(i=0; i<16; i++){

         if(nnzc[ scan8[i] ])             FUNCC(ff_h264_idct_add   )(dst + block_offset[i], block + i*16*sizeof(pixel), stride);

         else if(((dctcoef*)block)[i*16]) FUNCC(ff_h264_idct_dc_add)(dst + block_offset[i], block + i*16*sizeof(pixel), stride);

     }

 }


 void FUNCC(ff_h264_idct8_add4)(uint8_t *dst, const int *block_offset, int16_t *block, int stride, const uint8_t nnzc[15*8]){

     int i;

     for(i=0; i<16; i+=4){

         int nnz = nnzc[ scan8[i] ];

         if(nnz){

             if(nnz==1 && ((dctcoef*)block)[i*16]) FUNCC(ff_h264_idct8_dc_add)(dst + block_offset[i], block + i*16*sizeof(pixel), stride);

             else                                  FUNCC(ff_h264_idct8_add   )(dst + block_offset[i], block + i*16*sizeof(pixel), stride);

         }

     }

 }


 void FUNCC(ff_h264_idct_add8)(uint8_t **dest, const int *block_offset, int16_t *block, int stride, const uint8_t nnzc[15*8]){

     int i, j;

     for(j=1; j<3; j++){

         for(i=j*16; i<j*16+4; i++){

             if(nnzc[ scan8[i] ])

                 FUNCC(ff_h264_idct_add   )(dest[j-1] + block_offset[i], block + i*16*sizeof(pixel), stride);

             else if(((dctcoef*)block)[i*16])

                 FUNCC(ff_h264_idct_dc_add)(dest[j-1] + block_offset[i], block + i*16*sizeof(pixel), stride);

         }

     }

 }


 void FUNCC(ff_h264_idct_add8_422)(uint8_t **dest, const int *block_offset, int16_t *block, int stride, const uint8_t nnzc[15*8]){

     int i, j;


     for(j=1; j<3; j++){

         for(i=j*16; i<j*16+4; i++){

             if(nnzc[ scan8[i] ])

                 FUNCC(ff_h264_idct_add   )(dest[j-1] + block_offset[i], block + i*16*sizeof(pixel), stride);

             else if(((dctcoef*)block)[i*16])

                 FUNCC(ff_h264_idct_dc_add)(dest[j-1] + block_offset[i], block + i*16*sizeof(pixel), stride);

         }

     }


     for(j=1; j<3; j++){

         for(i=j*16+4; i<j*16+8; i++){

             if(nnzc[ scan8[i+4] ])

                 FUNCC(ff_h264_idct_add   )(dest[j-1] + block_offset[i+4], block + i*16*sizeof(pixel), stride);

             else if(((dctcoef*)block)[i*16])

                 FUNCC(ff_h264_idct_dc_add)(dest[j-1] + block_offset[i+4], block + i*16*sizeof(pixel), stride);

         }

     }

 }


 /**
  * IDCT transforms the 16 dc values and dequantizes them.
  *
  * The 16 input values are combined by two passes of add/subtract
  * butterflies; each result is multiplied by qmul, rounded with +128 and
  * shifted right by 8, then written to output at index 16*k + x_offset[i]
  * for k in {0, 1, 4, 5}.
  *
  * Sums and the multiplication are evaluated in unsigned arithmetic so that
  * extreme inputs wrap instead of triggering signed-overflow undefined
  * behaviour; for in-range inputs the results are unchanged.
  *
  * @param _output destination coefficients, accessed as dctcoef
  * @param _input  16 source dc values, accessed as dctcoef
  * @param qmul    dequantization multiplier applied before the >> 8
  */
 void FUNCC(ff_h264_luma_dc_dequant_idct)(int16_t *_output, int16_t *_input, int qmul){
     /* distance between output slots; block-scoped instead of a macro */
     enum { dc_stride = 16 };
     int i;
     unsigned temp[16];
     static const uint8_t x_offset[4]={0, 2*dc_stride, 8*dc_stride, 10*dc_stride};
     dctcoef *input = (dctcoef*)_input;
     dctcoef *output = (dctcoef*)_output;

     for(i=0; i<4; i++){
         const unsigned z0= input[4*i+0] + (unsigned)input[4*i+1];
         const unsigned z1= input[4*i+0] - (unsigned)input[4*i+1];
         const unsigned z2= input[4*i+2] - (unsigned)input[4*i+3];
         const unsigned z3= input[4*i+2] + (unsigned)input[4*i+3];

         temp[4*i+0]= z0+z3;
         temp[4*i+1]= z0-z3;
         temp[4*i+2]= z1-z2;
         temp[4*i+3]= z1+z2;
     }

     for(i=0; i<4; i++){
         const int offset= x_offset[i];
         const unsigned z0= temp[4*0+i] + temp[4*2+i];
         const unsigned z1= temp[4*0+i] - temp[4*2+i];
         const unsigned z2= temp[4*1+i] - temp[4*3+i];
         const unsigned z3= temp[4*1+i] + temp[4*3+i];

         /* convert back to int before the arithmetic shift */
         output[dc_stride* 0+offset]= ((int)((z0 + z3)*qmul + 128)) >> 8;
         output[dc_stride* 1+offset]= ((int)((z1 + z2)*qmul + 128)) >> 8;
         output[dc_stride* 4+offset]= ((int)((z1 - z2)*qmul + 128)) >> 8;
         output[dc_stride* 5+offset]= ((int)((z0 - z3)*qmul + 128)) >> 8;
     }
 }


 /**
  * Transform and dequantize eight dc values in place.
  *
  * The values are read from block at index 32*i + 16*k (i = 0..3, k = 0..1),
  * combined by add/subtract butterflies, multiplied by qmul, rounded with
  * +128 and shifted right by 8, then written back to index
  * 32*r + x_offset[i] (r = 0..3).
  *
  * Sums and the multiplication are evaluated in unsigned arithmetic so that
  * extreme inputs wrap instead of triggering signed-overflow undefined
  * behaviour; for in-range inputs the results are unchanged.
  *
  * @param _block coefficient storage, accessed as dctcoef; updated in place
  * @param qmul   dequantization multiplier applied before the >> 8
  */
 void FUNCC(ff_h264_chroma422_dc_dequant_idct)(int16_t *_block, int qmul){
     const int stride= 16*2;
     const int xStride= 16;
     int i;
     unsigned temp[8];
     static const uint8_t x_offset[2]={0, 16};
     dctcoef *block = (dctcoef*)_block;

     for(i=0; i<4; i++){
         temp[2*i+0] = block[stride*i + xStride*0] + (unsigned)block[stride*i + xStride*1];
         temp[2*i+1] = block[stride*i + xStride*0] - (unsigned)block[stride*i + xStride*1];
     }

     for(i=0; i<2; i++){
         const int offset= x_offset[i];
         const unsigned z0= temp[2*0+i] + temp[2*2+i];
         const unsigned z1= temp[2*0+i] - temp[2*2+i];
         const unsigned z2= temp[2*1+i] - temp[2*3+i];
         const unsigned z3= temp[2*1+i] + temp[2*3+i];

         /* convert back to int before the arithmetic shift */
         block[stride*0+offset]= ((int)((z0 + z3)*qmul + 128)) >> 8;
         block[stride*1+offset]= ((int)((z1 + z2)*qmul + 128)) >> 8;
         block[stride*2+offset]= ((int)((z1 - z2)*qmul + 128)) >> 8;
         block[stride*3+offset]= ((int)((z0 - z3)*qmul + 128)) >> 8;
     }
 }


 /**
  * Transform and dequantize four dc values in place.
  *
  * The values at block indices 0, 16, 32 and 48 are combined by a 2x2
  * add/subtract butterfly, multiplied by qmul and shifted right by 7, then
  * written back to the same four positions.
  *
  * Sums and the multiplication are evaluated in unsigned arithmetic so that
  * extreme inputs wrap instead of triggering signed-overflow undefined
  * behaviour; for in-range inputs the results are unchanged.
  *
  * @param _block coefficient storage, accessed as dctcoef; updated in place
  * @param qmul   dequantization multiplier applied before the >> 7
  */
 void FUNCC(ff_h264_chroma_dc_dequant_idct)(int16_t *_block, int qmul){
     const int stride= 16*2;
     const int xStride= 16;
     unsigned a,b,c,d,e;
     dctcoef *block = (dctcoef*)_block;

     a= block[stride*0 + xStride*0];
     b= block[stride*0 + xStride*1];
     c= block[stride*1 + xStride*0];
     d= block[stride*1 + xStride*1];

     e= a-b;
     a= a+b;
     b= c-d;
     c= c+d;

     /* convert back to int before the arithmetic shift */
     block[stride*0 + xStride*0]= ((int)((a+c)*qmul)) >> 7;
     block[stride*0 + xStride*1]= ((int)((e+b)*qmul)) >> 7;
     block[stride*1 + xStride*0]= ((int)((a-c)*qmul)) >> 7;
     block[stride*1 + xStride*1]= ((int)((e-b)*qmul)) >> 7;
 }

temp
else temp
Definition: vf_mcdeint.c:259

a0
#define a0
Definition: regdef.h:46

b
const char * b
Definition: vf_curves.c:109

a1
#define a1
Definition: regdef.h:47

av_clip_pixel
#define av_clip_pixel(a)
Definition: bit_depth_template.c:86

block
static int16_t block[64]
Definition: dct.c:113

ff_h264_idct8_dc_add
void FUNCC() ff_h264_idct8_dc_add(uint8_t *_dst, int16_t *_block, int stride)
Definition: h264idct_template.c:159

a3
#define a3
Definition: regdef.h:49

uint8_t
uint8_t
Definition: audio_convert.c:194

ff_h264_idct8_add
void FUNCC() ff_h264_idct8_add(uint8_t *_dst, int16_t *_block, int stride)
Definition: h264idct_template.c:69

h264.h
H.264 / AVC / MPEG-4 part10 codec.

ff_h264_idct_add16
void FUNCC() ff_h264_idct_add16(uint8_t *dst, const int *block_offset, int16_t *block, int stride, const uint8_t nnzc[15 *8])
Definition: h264idct_template.c:174

h264idct.h

offset
static const uint8_t offset[127][2]
Definition: vf_spp.c:92

scan8
static const uint8_t scan8[16 *3+3]
Definition: h264.h:801

ff_h264_idct_add
void FUNCC() ff_h264_idct_add(uint8_t *_dst, int16_t *_block, int stride)
Definition: h264idct_template.c:33

a2
#define a2
Definition: regdef.h:48

ff_h264_chroma_dc_dequant_idct
void FUNCC() ff_h264_chroma_dc_dequant_idct(int16_t *_block, int qmul)
Definition: h264idct_template.c:304

a5
#define a5
Definition: regdef.h:51

ff_h264_idct8_add4
void FUNCC() ff_h264_idct8_add4(uint8_t *dst, const int *block_offset, int16_t *block, int stride, const uint8_t nnzc[15 *8])
Definition: h264idct_template.c:193

dctcoef
#define dctcoef
Definition: bit_depth_template.c:73

ff_h264_luma_dc_dequant_idct
void FUNCC() ff_h264_luma_dc_dequant_idct(int16_t *_output, int16_t *_input, int qmul)
IDCT transforms the 16 dc values and dequantizes them.
Definition: h264idct_template.c:242

bit_depth_template.c

pixel
uint8_t pixel
Definition: tiny_ssim.c:42

ff_h264_idct_dc_add
void FUNCC() ff_h264_idct_dc_add(uint8_t *_dst, int16_t *_block, int stride)
Definition: h264idct_template.c:144

stride
GLint GLenum GLboolean GLsizei stride
Definition: opengl_enc.c:105

common.h
common internal and external API header

ff_h264_chroma422_dc_dequant_idct
void FUNCC() ff_h264_chroma422_dc_dequant_idct(int16_t *_block, int qmul)
Definition: h264idct_template.c:277

c
static double c[64]
Definition: vsrc_mptestsrc.c:87

ff_h264_idct_add8_422
void FUNCC() ff_h264_idct_add8_422(uint8_t **dest, const int *block_offset, int16_t *block, int stride, const uint8_t nnzc[15 *8])
Definition: h264idct_template.c:216

a4
#define a4
Definition: regdef.h:50

ff_h264_idct_add8
void FUNCC() ff_h264_idct_add8(uint8_t **dest, const int *block_offset, int16_t *block, int stride, const uint8_t nnzc[15 *8])
Definition: h264idct_template.c:204

dc
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(constuint8_t *) pi-0x80)*(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(constuint8_t *) pi-0x80)*(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(constint16_t *) pi >>8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t,*(constint16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t,*(constint16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(constint32_t *) pi >>24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t,*(constint32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t,*(constint32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(constfloat *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(constfloat *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(constfloat *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(constdouble *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(constdouble *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(constdouble *) pi *(1U<< 31))))#defineSET_CONV_FUNC_GROUP(ofmt, ifmt) staticvoidset_generic_function(AudioConvert *ac){}voidff_audio_convert_free(AudioConvert **ac){if(!*ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);}AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enumAVSampleFormatout_fmt, enumAVSampleFormatin_fmt, intchannels, intsample_rate, 
intapply_map){AudioConvert *ac;intin_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) returnNULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method!=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt)>2){ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc){av_free(ac);returnNULL;}returnac;}in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar){ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar?ac->channels:1;}elseif(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;elseac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);returnac;}intff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in){intuse_generic=1;intlen=in->nb_samples;intp;if(ac->dc){av_log(ac->avr, AV_LOG_TRACE,"%dsamples-audio_convert:%sto%s(dithered)\n", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));returnff_convert_dither(ac-> dc
Definition: audio_convert.c:194

stride
#define stride

FUNCC
#define FUNCC(a)
Definition: bit_depth_template.c:93

ff_h264_idct_add16intra
void FUNCC() ff_h264_idct_add16intra(uint8_t *dst, const int *block_offset, int16_t *block, int stride, const uint8_t nnzc[15 *8])
Definition: h264idct_template.c:185

a
a
Definition: h264pred_template.c:468