53 for(plane_index=0; plane_index<3; plane_index++){
153 for (i = 0; i < h; i++) {
154 for (j = 0; j < w; j++) {
158 pix += line_size - w;
170 for (i = 0; i < w; i++) {
171 for (j = 0; j < w; j ++) {
175 pix += line_size - w;
186 return (3*lambda)>>(FF_LAMBDA_SHIFT+1);
207 #define P_TOPRIGHT P[3]
208 #define P_MEDIAN P[4]
210 #define FLAG_QPEL 1 //must be 1
220 int score, score2, iscore, i_len, p_len, block_s, sum, base_bits;
224 const int index= (x + y*w) << rem_depth;
226 int trx= (x+1)<<rem_depth;
227 int try= (y+1)<<rem_depth;
233 const BlockNode *tr = y && trx<w && ((x&1)==0 || level==0) ? &s->
block[index-w+(1<<rem_depth)] : tl;
234 int pl = left->
color[0];
235 int pcb= left->
color[1];
236 int pcr= left->
color[2];
246 int16_t last_mv[3][2];
248 const int shift= 1+qpel;
254 int ref, best_ref, ref_score, ref_mx, ref_my;
258 set_blocks(s, level, x, y, pl, pcb, pcr, 0, 0, 0,
BLOCK_INTRA);
273 last_mv[1][0]= right->
mx;
274 last_mv[1][1]= right->
my;
275 last_mv[2][0]= bottom->
mx;
276 last_mv[2][1]= bottom->
my;
291 c->
xmin = - x*block_w - 16+3;
292 c->
ymin = - y*block_w - 16+3;
336 if(score > ref_score){
349 pc.bytestream= p_buffer;
353 put_rac(&pc, &p_state[4 + s_context], 1);
356 put_symbol(&pc, &p_state[128 + 1024 + 32*ref_context], best_ref, 0);
357 pred_mv(s, &pmx, &pmy, best_ref, left, top, tr);
358 put_symbol(&pc, &p_state[128 + 32*(mx_context + 16*!!best_ref)], mx - pmx, 1);
359 put_symbol(&pc, &p_state[128 + 32*(my_context + 16*!!best_ref)], my - pmy, 1);
360 p_len= pc.bytestream - pc.bytestream_start;
363 block_s= block_w*block_w;
364 sum =
pix_sum(current_data[0], stride, block_w, block_w);
365 l= (sum + block_s/2)/block_s;
366 iscore =
pix_norm1(current_data[0], stride, block_w) - 2*l*sum + l*l*block_s;
371 cb= (sum + block_s/2)/block_s;
374 cr= (sum + block_s/2)/block_s;
381 ic.bytestream= i_buffer;
384 put_rac(&ic, &i_state[4 + s_context], 1);
391 i_len= ic.bytestream - ic.bytestream_start;
394 av_assert1(iscore < 255*255*256 + s->lambda2*10);
400 int varc= iscore >> 8;
401 int vard= score >> 8;
402 if (vard <= 64 || vard < varc)
416 if(score2 < score && score2 < iscore)
421 pred_mv(s, &pmx, &pmy, 0, left, top, tr);
422 memcpy(pbbak, i_buffer, i_len);
426 set_blocks(s, level, x, y, l, cb, cr, pmx, pmy, 0,
BLOCK_INTRA);
430 memcpy(pbbak, p_buffer, p_len);
434 set_blocks(s, level, x, y, pl, pcb, pcr, mx, my, best_ref, 0);
443 const int index= (x + y*w) << rem_depth;
444 int trx= (x+1)<<rem_depth;
449 const BlockNode *tr = y && trx<w && ((x&1)==0 || level==0) ? &s->
block[index-w+(1<<rem_depth)] : tl;
450 int pl = left->
color[0];
451 int pcb= left->
color[1];
452 int pcr= left->
color[2];
460 set_blocks(s, level, x, y, pl, pcb, pcr, 0, 0, 0,
BLOCK_INTRA);
477 pred_mv(s, &pmx, &pmy, 0, left, top, tr);
484 set_blocks(s, level, x, y, b->
color[0], b->
color[1], b->
color[2], pmx, pmy, 0,
BLOCK_INTRA);
486 pred_mv(s, &pmx, &pmy, b->
ref, left, top, tr);
492 set_blocks(s, level, x, y, pl, pcb, pcr, b->
mx, b->
my, b->
ref, 0);
500 const int block_w = plane_index ? block_size>>s->
chroma_h_shift : block_size;
501 const int block_h = plane_index ? block_size>>s->
chroma_v_shift : block_size;
503 const int obmc_stride= plane_index ? (2*block_size)>>s->
chroma_h_shift : 2*block_size;
505 uint8_t *
src= s-> input_picture->data[plane_index];
508 const int w= p->
width;
510 int index= mb_x + mb_y*b_stride;
519 b->
color[plane_index]= 0;
520 memset(dst, 0, obmc_stride*obmc_stride*
sizeof(
IDWTELEM));
523 int mb_x2= mb_x + (i &1) - 1;
524 int mb_y2= mb_y + (i>>1) - 1;
525 int x= block_w*mb_x2 + block_w/2;
526 int y= block_h*mb_y2 + block_h/2;
529 x, y, block_w, block_h, w, h, obmc_stride, ref_stride, obmc_stride, mb_x2, mb_y2, 0, 0, plane_index);
531 for(y2=
FFMAX(y, 0); y2<
FFMIN(h, y+block_h); y2++){
532 for(x2=
FFMAX(x, 0); x2<
FFMIN(w, x+block_w); x2++){
533 int index= x2-(block_w*mb_x - block_w/2) + (y2-(block_h*mb_y - block_h/2))*obmc_stride;
534 int obmc_v= obmc[
index];
536 if(y<0) obmc_v += obmc[index + block_h*obmc_stride];
537 if(x<0) obmc_v += obmc[index + block_w];
538 if(y+block_h>h) obmc_v += obmc[index - block_h*obmc_stride];
539 if(x+block_w>w) obmc_v += obmc[index - block_w];
544 ab += (
src[x2 + y2*ref_stride] - (d>>
FRAC_BITS)) * obmc_v;
545 aa += obmc_v * obmc_v;
557 int index= x + y*b_stride;
561 const BlockNode *tl = y && x ? &s->
block[index-b_stride-1] : left;
562 const BlockNode *tr = y && x+w<b_stride ? &s->
block[index-b_stride+w] : tl;
567 if(x<0 || x>=b_stride || y>=b_height)
583 pred_mv(s, &dmx, &dmy, b->
ref, left, top, tr);
595 const int block_w = plane_index ? block_size>>s->
chroma_h_shift : block_size;
596 const int block_h = plane_index ? block_size>>s->
chroma_v_shift : block_size;
597 const int obmc_stride= plane_index ? (2*block_size)>>s->
chroma_h_shift : 2*block_size;
600 uint8_t *
src= s-> input_picture->data[plane_index];
606 const int w= p->
width;
611 int sx= block_w*mb_x - block_w/2;
612 int sy= block_h*mb_y - block_h/2;
613 int x0=
FFMAX(0,-sx);
614 int y0=
FFMAX(0,-sy);
615 int x1=
FFMIN(block_w*2, w-sx);
616 int y1=
FFMIN(block_h*2, h-sy);
621 ff_snow_pred_block(s, cur, tmp, ref_stride, sx, sy, block_w*2, block_h*2, &s->
block[mb_x + mb_y*b_stride], plane_index, w, h);
623 for(y=y0; y<y1; y++){
624 const uint8_t *obmc1= obmc_edged[
y];
626 uint8_t *cur1 = cur + y*ref_stride;
627 uint8_t *dst1 = dst + sx + (sy+
y)*ref_stride;
628 for(x=x0; x<x1; x++){
629 #if FRAC_BITS >= LOG2_OBMC_MAX
635 if(v&(~255)) v= ~(v>>31);
642 && (mb_x == 0 || mb_x == b_stride-1)
643 && (mb_y == 0 || mb_y == b_height-1)){
653 memcpy(dst + sx+x0 + (sy+y)*ref_stride, cur + x0 + y*ref_stride, x1-x0);
664 distortion =
ff_w97_32_c(&s->
m,
src + sx + sy*ref_stride, dst + sx + sy*ref_stride, ref_stride, 32);
666 distortion =
ff_w53_32_c(&s->
m,
src + sx + sy*ref_stride, dst + sx + sy*ref_stride, ref_stride, 32);
670 int off = sx+16*(i&1) + (sy+16*(i>>1))*ref_stride;
671 distortion += s->
mecc.
me_cmp[0](&s->
m,
src + off, dst + off, ref_stride, 16);
676 distortion = s->
mecc.
me_cmp[0](&s->
m,
src + sx + sy*ref_stride, dst + sx + sy*ref_stride, ref_stride, block_w*2);
685 rate +=
get_block_bits(s, mb_x + (i&1) - (i>>1), mb_y + (i>>1), 1);
687 if(mb_x == b_stride-2)
690 return distortion + rate*penalty_factor;
697 const int block_w = plane_index ? block_size>>s->
chroma_h_shift : block_size;
698 const int block_h = plane_index ? block_size>>s->
chroma_v_shift : block_size;
700 const int obmc_stride= plane_index ? (2*block_size)>>s->
chroma_h_shift : 2*block_size;
703 uint8_t *
src= s-> input_picture->data[plane_index];
708 const int w= p->
width;
717 int mb_x2= mb_x + (i%3) - 1;
718 int mb_y2= mb_y + (i/3) - 1;
719 int x= block_w*mb_x2 + block_w/2;
720 int y= block_h*mb_y2 + block_h/2;
723 x, y, block_w, block_h, w, h, 0, ref_stride, obmc_stride, mb_x2, mb_y2, 1, 1, plane_index);
726 for(y2= y; y2<0; y2++)
727 memcpy(dst + x + y2*ref_stride,
src + x + y2*ref_stride, block_w);
728 for(y2= h; y2<y+block_h; y2++)
729 memcpy(dst + x + y2*ref_stride,
src + x + y2*ref_stride, block_w);
731 for(y2= y; y2<y+block_h; y2++)
732 memcpy(dst + x + y2*ref_stride,
src + x + y2*ref_stride, -x);
735 for(y2= y; y2<y+block_h; y2++)
736 memcpy(dst + w + y2*ref_stride,
src + w + y2*ref_stride, x+block_w - w);
740 distortion += s->
mecc.
me_cmp[block_w==8](&s->
m,
src + x + y*ref_stride, dst + x + y*ref_stride, ref_stride, block_h);
754 for(i=merged?4:0; i<9; i++){
755 static const int dxy[9][2] = {{0,0},{1,0},{0,1},{1,1},{2,0},{2,1},{-1,2},{0,2},{1,2}};
759 return distortion + rate*penalty_factor;
763 const int w= b->
width;
776 int l=0, lt=0, t=0, rt=0;
777 v= src[x + y*stride];
780 t= src[x + (y-1)*stride];
782 lt= src[x - 1 + (y-1)*stride];
785 rt= src[x + 1 + (y-1)*stride];
789 l= src[x - 1 + y*stride];
798 if(px<b->parent->width && py<b->parent->height)
799 p= parent[px + py*2*stride];
803 runs[run_index++]=
run;
811 max_index= run_index;
812 runs[run_index++]=
run;
814 run= runs[run_index++];
817 if(run_index <= max_index)
827 int l=0, lt=0, t=0, rt=0;
828 v= src[x + y*stride];
831 t= src[x + (y-1)*stride];
833 lt= src[x - 1 + (y-1)*stride];
836 rt= src[x + 1 + (y-1)*stride];
840 l= src[x - 1 + y*stride];
849 if(px<b->parent->width && py<b->parent->height)
850 p= parent[px + py*2*stride];
858 run= runs[run_index++];
860 if(run_index <= max_index)
870 int l2= 2*
FFABS(l) + (l<0);
900 block->
color[0] = p[0];
901 block->
color[1] = p[1];
902 block->
color[2] = p[2];
932 return check_block(s, mb_x, mb_y, p, 0, obmc_edged, best_rd);
945 backup[0] = block[0];
946 backup[1] = block[1];
947 backup[2] = block[b_stride];
948 backup[3] = block[b_stride + 1];
964 block[1]= block[b_stride]= block[b_stride+1]= *
block;
975 block[b_stride]= backup[2];
976 block[b_stride+1]= backup[3];
982 int pass, mb_x, mb_y;
985 const int b_stride= b_width;
992 for(mb_y= 0; mb_y<s->
b_height; mb_y++)
993 for(mb_x= 0; mb_x<s->
b_width; mb_x++)
999 for(pass=0; pass<25; pass++){
1002 for(mb_y= 0; mb_y<b_height; mb_y++){
1003 for(mb_x= 0; mb_x<b_width; mb_x++){
1004 int dia_change, i, j, ref;
1005 int best_rd= INT_MAX, ref_rd;
1007 const int index= mb_x + mb_y * b_stride;
1016 BlockNode *brb= mb_x+1<b_width && mb_y+1<b_height ? &s->
block[index+b_stride+1] :
NULL;
1033 for (y = 0; y < b_w * 2; y++)
1036 for(y=0; y<b_w*2; y++)
1037 memset(obmc_edged[y], obmc_edged[y][0] + obmc_edged[y][b_w-1], b_w);
1038 if(mb_x==b_stride-1)
1039 for(y=0; y<b_w*2; y++)
1040 memset(obmc_edged[y]+b_w, obmc_edged[y][b_w] + obmc_edged[y][b_w*2-1], b_w);
1042 for(x=0; x<b_w*2; x++)
1043 obmc_edged[0][x] += obmc_edged[b_w-1][x];
1044 for(y=1; y<b_w; y++)
1045 memcpy(obmc_edged[y], obmc_edged[0], b_w*2);
1047 if(mb_y==b_height-1){
1048 for(x=0; x<b_w*2; x++)
1049 obmc_edged[b_w*2-1][x] += obmc_edged[b_w][x];
1050 for(y=b_w; y<b_w*2-1; y++)
1051 memcpy(obmc_edged[y], obmc_edged[b_w*2-1], b_w*2);
1056 if(mb_x==0 || mb_y==0 || mb_x==b_width-1 || mb_y==b_height-1){
1062 const int sx= block_w*mb_x - block_w/2;
1063 const int sy= block_h*mb_y - block_h/2;
1069 memcpy(dst + sx + y*stride, src + sx + y*stride, block_w*2);
1070 for(y=h; y<sy+block_h*2; y++)
1071 memcpy(dst + sx + y*stride, src + sx + y*stride, block_w*2);
1073 for(y=sy; y<sy+block_h*2; y++)
1074 memcpy(dst + sx + y*stride, src + sx + y*stride, -sx);
1076 if(sx+block_w*2 > w){
1077 for(y=sy; y<sy+block_h*2; y++)
1078 memcpy(dst + w + y*stride, src + w + y*stride, sx+block_w*2 - w);
1084 color[i]=
get_dc(s, mb_x, mb_y, i);
1089 check_block(s, mb_x, mb_y, color0, 1, obmc_edged, &best_rd);
1105 check_block_inter(s, mb_x, mb_y, mvr[-b_stride][0], mvr[-b_stride][1], obmc_edged, &best_rd);
1111 check_block_inter(s, mb_x, mb_y, mvr[b_stride][0], mvr[b_stride][1], obmc_edged, &best_rd);
1119 dia_change |=
check_block_inter(s, mb_x, mb_y, block->
mx+4*(i-j), block->
my+(4*j), obmc_edged, &best_rd);
1120 dia_change |=
check_block_inter(s, mb_x, mb_y, block->
mx-4*(i-j), block->
my-(4*j), obmc_edged, &best_rd);
1121 dia_change |=
check_block_inter(s, mb_x, mb_y, block->
mx+4*(i-j), block->
my-(4*j), obmc_edged, &best_rd);
1122 dia_change |=
check_block_inter(s, mb_x, mb_y, block->
mx-4*(i-j), block->
my+(4*j), obmc_edged, &best_rd);
1128 static const int square[8][2]= {{+1, 0},{-1, 0},{ 0,+1},{ 0,-1},{+1,+1},{-1,-1},{+1,-1},{-1,+1},};
1131 dia_change |=
check_block_inter(s, mb_x, mb_y, block->
mx+square[i][0], block->
my+square[i][1], obmc_edged, &best_rd);
1135 mvr[0][0]= block->
mx;
1136 mvr[0][1]= block->
my;
1137 if(ref_rd > best_rd){
1144 check_block(s, mb_x, mb_y, color, 1, obmc_edged, &best_rd);
1166 for(mb_y= 0; mb_y<b_height; mb_y+=2){
1167 for(mb_x= 0; mb_x<b_width; mb_x+=2){
1169 int best_rd, init_rd;
1170 const int index= mb_x + mb_y * b_stride;
1175 b[2]= b[0]+b_stride;
1190 (b[0]->mx + b[1]->mx + b[2]->mx + b[3]->mx + 2) >> 2,
1191 (b[0]->my + b[1]->my + b[2]->my + b[3]->my + 2) >> 2, 0, &best_rd);
1197 if(init_rd != best_rd)
1228 const int w= b->
width;
1232 int x,
y, thres1, thres2;
1237 dst[x + y*stride]= src[x + y*stride];
1241 bias= bias ? 0 : (3*qmul)>>3;
1248 int i= src[x + y*stride];
1250 if((
unsigned)(i+thres1) > thres2){
1254 dst[x + y*stride]= i;
1259 dst[x + y*stride]= -i;
1262 dst[x + y*stride]= 0;
1268 int i= src[x + y*stride];
1270 if((
unsigned)(i+thres1) > thres2){
1273 i= (i + bias) / qmul;
1274 dst[x + y*stride]= i;
1278 i= (i + bias) / qmul;
1279 dst[x + y*stride]= -i;
1282 dst[x + y*stride]= 0;
1289 const int w= b->
width;
1300 int i= src[x + y*stride];
1302 src[x + y*stride]= -((-i*qmul + qadd)>>(
QEXPSHIFT));
1304 src[x + y*stride]= (( i*qmul + qadd)>>(
QEXPSHIFT));
1311 const int w= b->
width;
1315 for(y=h-1; y>=0; y--){
1316 for(x=w-1; x>=0; x--){
1317 int i= x + y*stride;
1321 if(y && x+1<w) src[i] -=
mid_pred(src[i - 1], src[i - stride], src[i - stride + 1]);
1322 else src[i] -= src[i - 1];
1324 if(y) src[i] -=
mid_pred(src[i - 1], src[i - stride], src[i - 1] + src[i - stride] - src[i - 1 - stride]);
1325 else src[i] -= src[i - 1];
1328 if(y) src[i] -= src[i - stride];
1335 const int w= b->
width;
1341 int i= x + y*stride;
1345 if(y && x+1<w) src[i] +=
mid_pred(src[i - 1], src[i - stride], src[i - stride + 1]);
1346 else src[i] += src[i - 1];
1348 if(y) src[i] +=
mid_pred(src[i - 1], src[i - stride], src[i - 1] + src[i - stride] - src[i - 1 - stride]);
1349 else src[i] += src[i - 1];
1352 if(y) src[i] += src[i - stride];
1359 int plane_index,
level, orientation;
1361 for(plane_index=0; plane_index<
FFMIN(s->
nb_planes, 2); plane_index++){
1363 for(orientation=level ? 1:0; orientation<4; orientation++){
1364 if(orientation==2)
continue;
1375 memset(kstate,
MID_STATE,
sizeof(kstate));
1385 for(plane_index=0; plane_index<2; plane_index++){
1412 for(plane_index=0; plane_index<
FFMIN(s->
nb_planes, 2); plane_index++){
1420 for(plane_index=0; plane_index<
FFMIN(s->
nb_planes, 2); plane_index++){
1424 for(i= p->
htaps/2; i; i--)
1448 for(plane_index=0; plane_index<2; plane_index++){
1474 uint32_t coef_sum= 0;
1475 int level, orientation, delta_qlog;
1478 for(orientation=level ? 1 : 0; orientation<4; orientation++){
1481 const int w= b->
width;
1483 const int stride= b->
stride;
1486 const int qdiv= (1<<16)/qmul;
1491 buf[x+y*stride]= b->
buf[x+y*stride];
1496 coef_sum+= abs(buf[x+y*stride]) * qdiv >> 16;
1502 coef_sum = (uint64_t)coef_sum * coef_sum >> 16;
1517 s->
qlog+= delta_qlog;
1524 int level, orientation, x,
y;
1527 for(orientation=level ? 1 : 0; orientation<4; orientation++){
1536 for(x=0; x<
width; x++){
1542 b->
qlog= (int)(log(352256.0/sqrt(error)) / log(pow(2.0, 1.0/
QROOT))+0.5);
1548 const AVFrame *pict,
int *got_packet)
1555 int level, orientation, plane_index, i,
y,
ret;
1568 for(y=0; y<(height>>vshift); y++)
1573 width >> hshift, height >> vshift,
1631 int block_width = (width +15)>>4;
1632 int block_height= (height+15)>>4;
1641 s->
m. last_picture_ptr= &s->
m. last_picture;
1695 for(plane_index=0; plane_index < s->
nb_planes; plane_index++){
1705 for(plane_index=0; plane_index < s->nb_planes; plane_index++){
1714 if(pict->
data[plane_index])
1752 if (delta_qlog <= INT_MIN)
1765 for(orientation=level ? 1 : 0; orientation<4; orientation++){
1780 for(orientation=level ? 1 : 0; orientation<4; orientation++){
1802 pict->
data[plane_index][y*pict->
linesize[plane_index] + x];
1813 if(pict->
data[plane_index])
1873 #define OFFSET(x) offsetof(SnowContext, x)
1874 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
1877 {
"memc_only",
"Only do ME/MC (I frames -> ref, P frame -> ME+MC).",
OFFSET(memc_only),
AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1,
VE },
1878 {
"no_bitstream",
"Skip final bitstream writeout.",
OFFSET(no_bitstream),
AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1,
VE },
1929 fprintf(stderr,
"Failed to allocate memory\n");
1935 printf(
"testing 5/3 DWT\n");
1937 buffer[0][i] = buffer[1][i] =
av_lfg_get(&prng) % 54321 - 12345;
1943 if(buffer[0][i]!= buffer[1][i]) printf(
"fsck: %6d %12d %7d\n",i, buffer[0][i], buffer[1][i]);
1945 printf(
"testing 9/7 DWT\n");
1948 buffer[0][i] = buffer[1][i] =
av_lfg_get(&prng) % 54321 - 12345;
1954 if(
FFABS(buffer[0][i] - buffer[1][i])>20) printf(
"fsck: %6d %12d %7d\n",i, buffer[0][i], buffer[1][i]);
1957 int level, orientation, x,
y;
1958 int64_t errors[8][4];
1961 memset(errors, 0,
sizeof(errors));
1965 for(orientation=level ? 1 : 0; orientation<4; orientation++){
1972 if(orientation&1) buf+=w;
1973 if(orientation>1) buf+=stride>>1;
1975 memset(buffer[0], 0,
sizeof(
int)*
width*height);
1976 buf[w/2 + h/2*stride]= 256*256;
1979 for(x=0; x<
width; x++){
1980 int64_t d= buffer[0][x + y*
width];
1982 if(
FFABS(width/2-x)<9 &&
FFABS(height/2-y)<9 && level==2) printf(
"%8"PRId64
" ", d);
1984 if(
FFABS(height/2-y)<9 && level==2) printf(
"\n");
1986 error= (int)(sqrt(error)+0.5);
1987 errors[
level][orientation]= error;
1988 if(g) g=
av_gcd(g, error);
1992 printf(
"static int const visual_weight[][4]={\n");
1995 for(orientation=0; orientation<4; orientation++){
1996 printf(
"%8"PRId64
",", errors[level][orientation]/g);
2012 memset(buffer[0], 0,
sizeof(
int)*width*height);
2014 for(x=0; x<
width; x++){
2015 int tab[4]={0,2,3,1};
2016 buffer[0][x+width*
y]= 256*256*tab[(x&1) + 2*(y&1)];
2021 for(x=0; x<
width; x++){
2022 int64_t d= buffer[0][x + y*
width];
2024 if(
FFABS(width/2-x)<9 &&
FFABS(height/2-y)<9) printf(
"%8"PRId64
" ", d);
2026 if(
FFABS(height/2-y)<9) printf(
"\n");