42 const uint8_t *obmc1= obmc + y*obmc_stride;
43 const uint8_t *obmc2= obmc1+ (obmc_stride>>1);
44 const uint8_t *obmc3= obmc1+ obmc_stride*(obmc_stride>>1);
48 int v= obmc1[x] * block[3][x + y*src_stride]
49 +obmc2[x] * block[2][x + y*src_stride]
50 +obmc3[x] * block[1][x + y*src_stride]
51 +obmc4[x] * block[0][x + y*src_stride];
60 if(v&(~255)) v= ~(v>>31);
61 dst8[x + y*src_stride] =
v;
70 int plane_index,
level, orientation;
72 for(plane_index=0; plane_index<3; plane_index++){
74 for(orientation=level ? 1:0; orientation<4; orientation++){
99 for(i=0; i<
QROOT; i++){
101 v *= pow(2, 1.0 / QROOT);
/*
 * 16x16 lookup table, read in this file as brane[dx + 16*dy].
 * Each byte packs two 4-bit values: the visible code takes the low nibble
 * (& 15) as `r` and the high nibble (>> 4) as `l`, and then uses both as
 * indexes into needs[].
 * NOTE(review): 0xcc appears to be a filler for (dx, dy) combinations that
 * are not expected to be looked up -- confirm against the callers before
 * relying on that.
 */
116 static const uint8_t brane[256]={
117 0x00,0x01,0x01,0x01,0x01,0x01,0x01,0x01,0x11,0x12,0x12,0x12,0x12,0x12,0x12,0x12,
118 0x04,0x05,0xcc,0xcc,0xcc,0xcc,0xcc,0x41,0x15,0x16,0xcc,0xcc,0xcc,0xcc,0xcc,0x52,
119 0x04,0xcc,0x05,0xcc,0xcc,0xcc,0x41,0xcc,0x15,0xcc,0x16,0xcc,0xcc,0xcc,0x52,0xcc,
120 0x04,0xcc,0xcc,0x05,0xcc,0x41,0xcc,0xcc,0x15,0xcc,0xcc,0x16,0xcc,0x52,0xcc,0xcc,
121 0x04,0xcc,0xcc,0xcc,0x41,0xcc,0xcc,0xcc,0x15,0xcc,0xcc,0xcc,0x16,0xcc,0xcc,0xcc,
122 0x04,0xcc,0xcc,0x41,0xcc,0x05,0xcc,0xcc,0x15,0xcc,0xcc,0x52,0xcc,0x16,0xcc,0xcc,
123 0x04,0xcc,0x41,0xcc,0xcc,0xcc,0x05,0xcc,0x15,0xcc,0x52,0xcc,0xcc,0xcc,0x16,0xcc,
124 0x04,0x41,0xcc,0xcc,0xcc,0xcc,0xcc,0x05,0x15,0x52,0xcc,0xcc,0xcc,0xcc,0xcc,0x16,
125 0x44,0x45,0x45,0x45,0x45,0x45,0x45,0x45,0x55,0x56,0x56,0x56,0x56,0x56,0x56,0x56,
126 0x48,0x49,0xcc,0xcc,0xcc,0xcc,0xcc,0x85,0x59,0x5A,0xcc,0xcc,0xcc,0xcc,0xcc,0x96,
127 0x48,0xcc,0x49,0xcc,0xcc,0xcc,0x85,0xcc,0x59,0xcc,0x5A,0xcc,0xcc,0xcc,0x96,0xcc,
128 0x48,0xcc,0xcc,0x49,0xcc,0x85,0xcc,0xcc,0x59,0xcc,0xcc,0x5A,0xcc,0x96,0xcc,0xcc,
129 0x48,0xcc,0xcc,0xcc,0x49,0xcc,0xcc,0xcc,0x59,0xcc,0xcc,0xcc,0x96,0xcc,0xcc,0xcc,
130 0x48,0xcc,0xcc,0x85,0xcc,0x49,0xcc,0xcc,0x59,0xcc,0xcc,0x96,0xcc,0x5A,0xcc,0xcc,
131 0x48,0xcc,0x85,0xcc,0xcc,0xcc,0x49,0xcc,0x59,0xcc,0x96,0xcc,0xcc,0xcc,0x5A,0xcc,
132 0x48,0x85,0xcc,0xcc,0xcc,0xcc,0xcc,0x49,0x59,0x96,0xcc,0xcc,0xcc,0xcc,0xcc,0x5A,
135 static const uint8_t needs[16]={
145 int16_t *tmpI= tmpIt;
149 r= brane[dx + 16*dy]&15;
150 l= brane[dx + 16*dy]>>4;
152 b= needs[l] | needs[
r];
158 for(x=0; x < b_w; x++){
159 int a_1=src[x + HTAPS_MAX/2-4];
160 int a0= src[x + HTAPS_MAX/2-3];
161 int a1= src[x + HTAPS_MAX/2-2];
162 int a2= src[x + HTAPS_MAX/2-1];
163 int a3= src[x + HTAPS_MAX/2+0];
164 int a4= src[x + HTAPS_MAX/2+1];
165 int a5= src[x + HTAPS_MAX/2+2];
166 int a6= src[x + HTAPS_MAX/2+3];
169 am= 20*(a2+
a3) - 5*(a1+a4) + (a0+
a5);
178 if(am&(~255)) am= ~(am>>31);
191 for(y=0; y < b_h; y++){
192 for(x=0; x < b_w+1; x++){
203 am= (20*(a2+
a3) - 5*(a1+a4) + (a0+
a5) + 16)>>5;
207 if(am&(~255)) am= ~(am>>31);
219 for(y=0; y < b_h; y++){
220 for(x=0; x < b_w; x++){
231 am= (20*(a2+
a3) - 5*(a1+a4) + (a0+
a5) + 512)>>10;
234 if(am&(~255)) am= ~(am>>31);
248 hpel[ 6]= tmp2t[1] + 1;
251 hpel[ 9]= hpel[1] + 64;
252 hpel[10]= hpel[8] + 1;
/*
 * Row stride to use for source plane index x: 64 when needs[x] is non-zero,
 * otherwise `stride`. Both `needs` and `stride` are not macro parameters;
 * they are picked up from whatever scope the macro is expanded in.
 * NOTE(review): 64 presumably matches the row pitch of the temporary
 * half-pel buffers (cf. the "+ 64" offsets used when filling hpel[]) --
 * confirm against the buffer declarations.
 */
254 #define MC_STRIDE(x) (needs[x] ? 64 : stride)
257 int dxy = dx / 8 + dy / 8 * 4;
258 const uint8_t *src1 = hpel[dxy ];
259 const uint8_t *src2 = hpel[dxy + 1];
260 const uint8_t *src3 = hpel[dxy + 4];
261 const uint8_t *src4 = hpel[dxy + 5];
268 for(y=0; y < b_h; y++){
269 for(x=0; x < b_w; x++){
270 dst[x]= ((8-dx)*(8-dy)*src1[x] + dx*(8-dy)*src2[x]+
271 (8-dx)* dy *src3[x] + dx* dy *src4[x]+32)>>6;
284 int a= weight[((dx&7) + (8*(dy&7)))];
286 for(y=0; y < b_h; y++){
287 for(x=0; x < b_w; x++){
288 dst[x]= (a*src1[x] + b*src2[x] + 4)>>3;
297 void ff_snow_pred_block(
SnowContext *s,
uint8_t *
dst,
uint8_t *tmp,
int stride,
int sx,
int sy,
int b_w,
int b_h,
BlockNode *
block,
int plane_index,
int w,
int h){
300 const unsigned color = block->
color[plane_index];
301 const unsigned color4 = color*0x01010101;
303 for(y=0; y < b_h; y++){
304 *(uint32_t*)&dst[0 + y*stride]= color4;
305 *(uint32_t*)&dst[4 + y*stride]= color4;
306 *(uint32_t*)&dst[8 + y*stride]= color4;
307 *(uint32_t*)&dst[12+ y*stride]= color4;
308 *(uint32_t*)&dst[16+ y*stride]= color4;
309 *(uint32_t*)&dst[20+ y*stride]= color4;
310 *(uint32_t*)&dst[24+ y*stride]= color4;
311 *(uint32_t*)&dst[28+ y*stride]= color4;
314 for(y=0; y < b_h; y++){
315 *(uint32_t*)&dst[0 + y*stride]= color4;
316 *(uint32_t*)&dst[4 + y*stride]= color4;
317 *(uint32_t*)&dst[8 + y*stride]= color4;
318 *(uint32_t*)&dst[12+ y*stride]= color4;
321 for(y=0; y < b_h; y++){
322 *(uint32_t*)&dst[0 + y*stride]= color4;
323 *(uint32_t*)&dst[4 + y*stride]= color4;
326 for(y=0; y < b_h; y++){
327 *(uint32_t*)&dst[0 + y*stride]= color4;
330 for(y=0; y < b_h; y++){
331 for(x=0; x < b_w; x++){
339 int mx= block->
mx*scale;
340 int my= block->
my*scale;
343 const int tab_index= 3 - (b_w>>2) + (b_w>>4);
358 av_assert2((tab_index>=0 && tab_index<4) || b_w==32);
359 if((dx&3) || (dy&3) || !(b_w == b_h || 2*b_w == b_h || b_w == 2*b_h) || (b_w&(b_w-1)) || !s->
plane[plane_index].
fast_mc )
360 mc_block(&s->
plane[plane_index], dst, src, stride, b_w, b_h, dx, dy);
363 for(y=0; y<b_h; y+=16){
380 #define mca(dx,dy,b_w)\
381 static void mc_block_hpel ## dx ## dy ## b_w(uint8_t *dst, const uint8_t *src, ptrdiff_t stride, int h){\
383 mc_block(NULL, dst, src-(HTAPS_MAX/2-1)-(HTAPS_MAX/2-1)*stride, stride, b_w, b_w, dx, dy);\
409 s->dsp.put_qpel_pixels_tab [0][dy+dx/4]=\
410 s->dsp.put_no_rnd_qpel_pixels_tab[0][dy+dx/4]=\
411 s->h264qpel.put_h264_qpel_pixels_tab[0][dy+dx/4];\
412 s->dsp.put_qpel_pixels_tab [1][dy+dx/4]=\
413 s->dsp.put_no_rnd_qpel_pixels_tab[1][dy+dx/4]=\
414 s->h264qpel.put_h264_qpel_pixels_tab[1][dy+dx/4];
434 s->dsp.put_pixels_tab [0][dy/4+dx/8]=\
435 s->dsp.put_no_rnd_pixels_tab[0][dy/4+dx/8]=\
436 mc_block_hpel ## dx ## dy ## 16;\
437 s->dsp.put_pixels_tab [1][dy/4+dx/8]=\
438 s->dsp.put_no_rnd_pixels_tab[1][dy/4+dx/8]=\
439 mc_block_hpel ## dx ## dy ## 8;
470 int plane_index,
level, orientation;
471 int ret, emu_buf_size;
488 for(plane_index=0; plane_index<3; plane_index++){
500 for(orientation=level ? 1 : 0; orientation<4; orientation++){
506 b->
width = (w + !(orientation&1))>>1;
507 b->
height= (h + !(orientation>1))>>1;
/*
 * Compile-time switch, currently set to 0.
 * NOTE(review): presumably selects whether the precomputed halfpel[][][]
 * planes are used; the code that tests it is not visible here -- confirm at
 * the use sites before changing the value.
 */
539 #define USE_HALFPEL_PLANE 0
560 halfpel[1][p][i]= (20*(src[i] + src[i+1]) - 5*(src[i-1] + src[i+2]) + (src[i-2] + src[i+3]) + 16 )>>5;
567 halfpel[2][p][i]= (20*(src[i] + src[i+ls]) - 5*(src[i-ls] + src[i+2*ls]) + (src[i-2*ls] + src[i+3*ls]) + 16 )>>5;
575 halfpel[3][p][i]= (20*(src[i] + src[i+ls]) - 5*(src[i-ls] + src[i+2*ls]) + (src[i-2*ls] + src[i+3*ls]) + 16 )>>5;
650 int plane_index,
level, orientation, i;
677 for(plane_index=0; plane_index<3; plane_index++){
679 for(orientation=level ? 1 : 0; orientation<4; orientation++){