57 memset(score, 0,
sizeof(*score)*score_stride*((p->
height + Q2_STEP-1)/Q2_STEP));
58 for(y=0; y<p->
height; y++){
59 for(x=0; x<p->
width; x++){
60 int sx= (x-xo + step/2) / step / Q2_STEP;
61 int sy= (y-yo + step/2) / step / Q2_STEP;
63 assert(sx>=0 && sy>=0 && sx < score_stride);
65 score[sx + sy*score_stride] += v*
v;
66 assert(score[sx + sy*score_stride] >= 0);
72 int level, orientation;
75 for(orientation=level ? 1 : 0; orientation<4; orientation++){
79 dequantize(s, b, dst, b->
stride);
85 int level, orientation, ys, xs, x, y,
pass;
88 const int score_stride= (width + 10)/Q2_STEP;
89 int best_score[(width + 10)/Q2_STEP * (height + 10)/Q2_STEP];
90 int score[(width + 10)/Q2_STEP * (height + 10)/Q2_STEP];
99 for(orientation=level ? 1 : 0; orientation<4; orientation++){
103 assert(src == b->
buf);
108 for(pass=0; pass<1; pass++){
112 for(orientation=level ? 1 : 0; orientation<4; orientation++){
117 for(ys= 0; ys<Q2_STEP; ys++){
118 for(xs= 0; xs<Q2_STEP; xs++){
119 memcpy(idwt2_buffer, best_dequant, height * stride *
sizeof(
IDWTELEM));
120 dequantize_all(s, p, idwt2_buffer, width, height);
122 find_sse(s, p, best_score, score_stride, idwt2_buffer, s->
spatial_idwt_buffer, level, orientation);
123 memcpy(idwt2_buffer, best_dequant, height * stride *
sizeof(
IDWTELEM));
124 for(y=ys; y<b->
height; y+= Q2_STEP){
125 for(x=xs; x<b->
width; x+= Q2_STEP){
131 dequantize_all(s, p, idwt2_buffer, width, height);
133 find_sse(s, p, score, score_stride, idwt2_buffer, s->
spatial_idwt_buffer, level, orientation);
134 for(y=ys; y<b->
height; y+= Q2_STEP){
135 for(x=xs; x<b->
width; x+= Q2_STEP){
136 int score_idx= x/Q2_STEP + (y/Q2_STEP)*score_stride;
137 if(score[score_idx] <= best_score[score_idx] + threshold){
138 best_score[score_idx]= score[score_idx];
139 if(best_dst[x + y*b->
stride]<0) best_dst[x + y*b->
stride]++;
140 if(best_dst[x + y*b->
stride]>0) best_dst[x + y*b->
stride]--;
155 #if CONFIG_SNOW_ENCODER
159 int plane_index, ret;
162 av_log(avctx,
AV_LOG_ERROR,
"This codec is under development, files encoded with it may not be decodable with future versions!!!\n"
163 "Use vstrict=-2 / -strict -2 to use it anyway.\n");
179 for(plane_index=0; plane_index<3; plane_index++){
/*
 * pix_sum: visits a w x w square of bytes starting at pix.
 *
 * pix       - first byte of the square
 * line_size - distance in bytes between the starts of consecutive rows
 * w         - side length of the square (used for both loop bounds)
 *
 * NOTE(review): the statement that accumulates the pixels and the return
 * statement are not part of this excerpt; presumably the result is the plain
 * sum of the visited bytes (callers divide it by the block area to obtain a
 * mean) -- confirm against the full file.
 */
258 static int pix_sum(uint8_t * pix,
int line_size,
int w)
263 for (i = 0; i < w; i++) {
264 for (j = 0; j < w; j++) {
/* Skip the part of the row that lies outside the w-wide square; this assumes
 * pix has already been advanced by w inside the (elided) inner-loop body. */
268 pix += line_size - w;
/*
 * pix_norm1: visits a w x w square of bytes starting at pix, with the same
 * traversal as pix_sum (two nested loops of w iterations, row stride
 * line_size).
 *
 * NOTE(review): the accumulation and the return are not visible in this
 * excerpt; presumably the result is the sum of squared pixel values (the
 * caller combines it with the mean as norm - 2*l*sum + l*l*area) -- confirm.
 */
274 static int pix_norm1(uint8_t * pix,
int line_size,
int w)
280 for (i = 0; i < w; i++) {
281 for (j = 0; j < w; j ++) {
/* Move to the start of the next row of the square; assumes the elided
 * inner-loop body advanced pix by w. */
285 pix += line_size - w;
293 #define P_TOPRIGHT P[3]
294 #define P_MEDIAN P[4]
296 #define FLAG_QPEL 1 //must be 1
298 static int encode_q_branch(
SnowContext *s,
int level,
int x,
int y){
299 uint8_t p_buffer[1024];
300 uint8_t i_buffer[1024];
306 int score, score2, iscore, i_len, p_len, block_s, sum, base_bits;
310 const int index= (x + y*w) << rem_depth;
312 int trx= (x+1)<<rem_depth;
313 int try= (y+1)<<rem_depth;
319 const BlockNode *tr = y && trx<w && ((x&1)==0 || level==0) ? &s->block[
index-w+(1<<rem_depth)] : tl;
320 int pl = left->
color[0];
321 int pcb= left->color[1];
322 int pcr= left->color[2];
326 const int stride= s->current_picture.linesize[0];
327 const int uvstride= s->current_picture.linesize[1];
328 uint8_t *current_data[3]= { s->input_picture.data[0] + (x + y*
stride)*block_w,
329 s->input_picture.data[1] + (x + y*uvstride)*block_w/2,
330 s->input_picture.data[2] + (x + y*uvstride)*block_w/2};
332 int16_t last_mv[3][2];
334 const int shift= 1+qpel;
336 int ref_context= av_log2(2*left->ref) + av_log2(2*top->ref);
337 int mx_context= av_log2(2*
FFABS(left->mx - top->mx));
338 int my_context= av_log2(2*
FFABS(left->my - top->my));
339 int s_context= 2*left->level + 2*top->level + tl->level + tr->level;
340 int ref, best_ref, ref_score, ref_mx, ref_my;
342 assert(
sizeof(s->block_state) >= 256);
344 set_blocks(s, level, x, y, pl, pcb, pcr, 0, 0, 0,
BLOCK_INTRA);
357 last_mv[0][0]= s->block[
index].mx;
358 last_mv[0][1]= s->block[
index].my;
359 last_mv[1][0]= right->mx;
360 last_mv[1][1]= right->my;
361 last_mv[2][0]= bottom->mx;
362 last_mv[2][1]= bottom->my;
369 assert(c-> stride == stride);
377 c->
xmin = - x*block_w - 16+3;
378 c->
ymin = - y*block_w - 16+3;
379 c->
xmax = - (x+1)*block_w + (w<<(
LOG2_MB_SIZE - s->block_max_depth)) + 16-3;
380 c->
ymax = - (y+1)*block_w + (h<<(
LOG2_MB_SIZE - s->block_max_depth)) + 16-3;
403 for(ref=0; ref<s->ref_frames; ref++){
404 init_ref(c, current_data, s->last_picture[ref].data,
NULL, block_w*x, block_w*y, 0);
409 assert(ref_mx >= c->
xmin);
410 assert(ref_mx <= c->xmax);
411 assert(ref_my >= c->
ymin);
412 assert(ref_my <= c->ymax);
418 s->ref_mvs[ref][
index][0]= ref_mx;
419 s->ref_mvs[ref][
index][1]= ref_my;
420 s->ref_scores[ref][
index]= ref_score;
422 if(score > ref_score){
432 base_bits=
get_rac_count(&s->c) - 8*(s->c.bytestream - s->c.bytestream_start);
435 pc.bytestream= p_buffer;
436 memcpy(p_state, s->block_state,
sizeof(s->block_state));
438 if(level!=s->block_max_depth)
439 put_rac(&pc, &p_state[4 + s_context], 1);
440 put_rac(&pc, &p_state[1 + left->type + top->type], 0);
441 if(s->ref_frames > 1)
442 put_symbol(&pc, &p_state[128 + 1024 + 32*ref_context], best_ref, 0);
443 pred_mv(s, &pmx, &pmy, best_ref, left, top, tr);
444 put_symbol(&pc, &p_state[128 + 32*(mx_context + 16*!!best_ref)], mx - pmx, 1);
445 put_symbol(&pc, &p_state[128 + 32*(my_context + 16*!!best_ref)], my - pmy, 1);
446 p_len= pc.bytestream - pc.bytestream_start;
449 block_s= block_w*block_w;
450 sum = pix_sum(current_data[0], stride, block_w);
451 l= (sum + block_s/2)/block_s;
452 iscore = pix_norm1(current_data[0], stride, block_w) - 2*l*sum + l*l*block_s;
454 block_s= block_w*block_w>>2;
455 sum = pix_sum(current_data[1], uvstride, block_w>>1);
456 cb= (sum + block_s/2)/block_s;
458 sum = pix_sum(current_data[2], uvstride, block_w>>1);
459 cr= (sum + block_s/2)/block_s;
464 ic.bytestream= i_buffer;
465 memcpy(i_state, s->block_state,
sizeof(s->block_state));
466 if(level!=s->block_max_depth)
467 put_rac(&ic, &i_state[4 + s_context], 1);
468 put_rac(&ic, &i_state[1 + left->type + top->type], 1);
472 i_len= ic.bytestream - ic.bytestream_start;
476 assert(iscore < 255*255*256 + s->lambda2*10);
478 assert(l>=0 && l<=255);
479 assert(pl>=0 && pl<=255);
482 int varc= iscore >> 8;
483 int vard= score >> 8;
484 if (vard <= 64 || vard < varc)
490 if(level!=s->block_max_depth){
491 put_rac(&s->c, &s->block_state[4 + s_context], 0);
492 score2 = encode_q_branch(s, level+1, 2*x+0, 2*y+0);
493 score2+= encode_q_branch(s, level+1, 2*x+1, 2*y+0);
494 score2+= encode_q_branch(s, level+1, 2*x+0, 2*y+1);
495 score2+= encode_q_branch(s, level+1, 2*x+1, 2*y+1);
498 if(score2 < score && score2 < iscore)
503 pred_mv(s, &pmx, &pmy, 0, left, top, tr);
504 memcpy(pbbak, i_buffer, i_len);
506 s->c.bytestream_start= pbbak_start;
507 s->c.bytestream= pbbak + i_len;
508 set_blocks(s, level, x, y, l, cb, cr, pmx, pmy, 0,
BLOCK_INTRA);
509 memcpy(s->block_state, i_state,
sizeof(s->block_state));
512 memcpy(pbbak, p_buffer, p_len);
514 s->c.bytestream_start= pbbak_start;
515 s->c.bytestream= pbbak + p_len;
516 set_blocks(s, level, x, y, pl, pcb, pcr, mx, my, best_ref, 0);
517 memcpy(s->block_state, p_state,
sizeof(s->block_state));
522 static void encode_q_branch2(
SnowContext *s,
int level,
int x,
int y){
525 const int index= (x + y*w) << rem_depth;
526 int trx= (x+1)<<rem_depth;
531 const BlockNode *tr = y && trx<w && ((x&1)==0 || level==0) ? &s->block[
index-w+(1<<rem_depth)] : tl;
532 int pl = left->
color[0];
533 int pcb= left->color[1];
534 int pcr= left->color[2];
536 int ref_context= av_log2(2*left->ref) + av_log2(2*top->ref);
537 int mx_context= av_log2(2*
FFABS(left->mx - top->mx)) + 16*!!b->ref;
538 int my_context= av_log2(2*
FFABS(left->my - top->my)) + 16*!!b->ref;
539 int s_context= 2*left->
level + 2*top->level + tl->level + tr->level;
542 set_blocks(s, level, x, y, pl, pcb, pcr, 0, 0, 0,
BLOCK_INTRA);
546 if(level!=s->block_max_depth){
548 put_rac(&s->c, &s->block_state[4 + s_context], 1);
550 put_rac(&s->c, &s->block_state[4 + s_context], 0);
551 encode_q_branch2(s, level+1, 2*x+0, 2*y+0);
552 encode_q_branch2(s, level+1, 2*x+1, 2*y+0);
553 encode_q_branch2(s, level+1, 2*x+0, 2*y+1);
554 encode_q_branch2(s, level+1, 2*x+1, 2*y+1);
559 pred_mv(s, &pmx, &pmy, 0, left, top, tr);
560 put_rac(&s->c, &s->block_state[1 + (left->type&1) + (top->type&1)], 1);
561 put_symbol(&s->c, &s->block_state[32], b->color[0]-pl , 1);
562 put_symbol(&s->c, &s->block_state[64], b->color[1]-pcb, 1);
563 put_symbol(&s->c, &s->block_state[96], b->color[2]-pcr, 1);
564 set_blocks(s, level, x, y, b->color[0], b->color[1], b->color[2], pmx, pmy, 0,
BLOCK_INTRA);
566 pred_mv(s, &pmx, &pmy, b->ref, left, top, tr);
567 put_rac(&s->c, &s->block_state[1 + (left->type&1) + (top->type&1)], 0);
568 if(s->ref_frames > 1)
569 put_symbol(&s->c, &s->block_state[128 + 1024 + 32*ref_context], b->ref, 0);
570 put_symbol(&s->c, &s->block_state[128 + 32*mx_context], b->mx - pmx, 1);
571 put_symbol(&s->c, &s->block_state[128 + 32*my_context], b->my - pmy, 1);
572 set_blocks(s, level, x, y, pl, pcb, pcr, b->mx, b->my, b->ref, 0);
580 const int block_w = plane_index ? block_size/2 : block_size;
582 const int obmc_stride= plane_index ? block_size : 2*block_size;
584 uint8_t *src= s-> input_picture.data[plane_index];
587 const int w= p->
width;
589 int index= mb_x + mb_y*b_stride;
596 b->color[plane_index]= 0;
597 memset(dst, 0, obmc_stride*obmc_stride*
sizeof(
IDWTELEM));
600 int mb_x2= mb_x + (i &1) - 1;
601 int mb_y2= mb_y + (i>>1) - 1;
602 int x= block_w*mb_x2 + block_w/2;
603 int y= block_w*mb_y2 + block_w/2;
606 x, y, block_w, block_w, w, h, obmc_stride, ref_stride, obmc_stride, mb_x2, mb_y2, 0, 0, plane_index);
608 for(y2=
FFMAX(y, 0); y2<
FFMIN(h, y+block_w); y2++){
609 for(x2=
FFMAX(x, 0); x2<
FFMIN(w, x+block_w); x2++){
610 int index= x2-(block_w*mb_x - block_w/2) + (y2-(block_w*mb_y - block_w/2))*obmc_stride;
611 int obmc_v= obmc[
index];
613 if(y<0) obmc_v += obmc[index + block_w*obmc_stride];
614 if(x<0) obmc_v += obmc[index + block_w];
615 if(y+block_w>h) obmc_v += obmc[index - block_w*obmc_stride];
616 if(x+block_w>w) obmc_v += obmc[index - block_w];
621 ab += (src[x2 + y2*ref_stride] - (d>>
FRAC_BITS)) * obmc_v;
622 aa += obmc_v * obmc_v;
/*
 * get_block_bits: rate term for the block at block coordinates (x, y); callers
 * add the result to their running "rate".
 *
 * s - encoder context (block array, prediction state)
 * x - block column; callers may pass -1 or a value >= b_stride
 * y - block row
 * w - offset, in blocks, used to locate the top-right neighbour
 *
 * On the path visible here the result is
 *   2*(1 + av_log2(2*|dmx|) + av_log2(2*|dmy|) + av_log2(2*b->ref)).
 * NOTE(review): dmx/dmy are filled by pred_mv(); the lines between that call
 * and the return are not in this excerpt, so whether they are converted into
 * a difference against the block's own vector cannot be confirmed from here.
 */
631 static inline int get_block_bits(
SnowContext *s,
int x,
int y,
int w){
634 int index= x + y*b_stride;
/* Neighbour selection: fall back to left (for tl) or tl (for tr) when the
 * requested neighbour would lie outside the top row / right edge. */
638 const BlockNode *tl = y && x ? &s->
block[index-b_stride-1] : left;
639 const BlockNode *tr = y && x+w<b_stride ? &s->
block[index-b_stride+w] : tl;
/* NOTE(review): this range check runs only after index, tl and tr have been
 * derived from x and y. For out-of-range coordinates (e.g. x == -1, which the
 * dxy table in get_4block_rd can produce) the addresses above are formed from
 * an out-of-range index even though nothing visible here dereferences them.
 * Moving the check ahead of the pointer setup would avoid that. */
644 if(x<0 || x>=b_stride || y>=b_height)
660 pred_mv(s, &dmx, &dmy, b->
ref, left, top, tr);
663 return 2*(1 + av_log2(2*
FFABS(dmx))
664 + av_log2(2*
FFABS(dmy))
665 + av_log2(2*b->
ref));
669 static int get_block_rd(
SnowContext *s,
int mb_x,
int mb_y,
int plane_index,
const uint8_t *obmc_edged){
672 const int block_w = plane_index ? block_size/2 : block_size;
673 const int obmc_stride= plane_index ? block_size : 2*block_size;
676 uint8_t *src= s-> input_picture.data[plane_index];
682 const int w= p->
width;
687 int sx= block_w*mb_x - block_w/2;
688 int sy= block_w*mb_y - block_w/2;
689 int x0=
FFMAX(0,-sx);
690 int y0=
FFMAX(0,-sy);
691 int x1=
FFMIN(block_w*2, w-sx);
692 int y1=
FFMIN(block_w*2, h-sy);
695 ff_snow_pred_block(s, cur, tmp, ref_stride, sx, sy, block_w*2, block_w*2, &s->
block[mb_x + mb_y*b_stride], plane_index, w, h);
697 for(y=y0; y<y1; y++){
698 const uint8_t *obmc1= obmc_edged + y*obmc_stride;
699 const IDWTELEM *pred1 = pred + y*obmc_stride;
700 uint8_t *cur1 = cur + y*ref_stride;
701 uint8_t *dst1 = dst + sx + (sy+y)*ref_stride;
702 for(x=x0; x<x1; x++){
703 #if FRAC_BITS >= LOG2_OBMC_MAX
709 if(v&(~255)) v= ~(v>>31);
716 && (mb_x == 0 || mb_x == b_stride-1)
717 && (mb_y == 0 || mb_y == b_height-1)){
727 memcpy(dst + sx+x0 + (sy+y)*ref_stride, cur + x0 + y*ref_stride, x1-x0);
738 distortion =
ff_w97_32_c(&s->
m, src + sx + sy*ref_stride, dst + sx + sy*ref_stride, ref_stride, 32);
740 distortion =
ff_w53_32_c(&s->
m, src + sx + sy*ref_stride, dst + sx + sy*ref_stride, ref_stride, 32);
744 int off = sx+16*(i&1) + (sy+16*(i>>1))*ref_stride;
745 distortion += s->
dsp.
me_cmp[0](&s->
m, src +
off, dst +
off, ref_stride, 16);
750 distortion = s->
dsp.
me_cmp[0](&s->
m, src + sx + sy*ref_stride, dst + sx + sy*ref_stride, ref_stride, block_w*2);
759 rate += get_block_bits(s, mb_x + (i&1) - (i>>1), mb_y + (i>>1), 1);
761 if(mb_x == b_stride-2)
762 rate += get_block_bits(s, mb_x + 1, mb_y + 1, 1);
764 return distortion + rate*penalty_factor;
/*
 * get_4block_rd: rate-distortion score around block (mb_x, mb_y) for one
 * plane. Returns distortion + rate*penalty_factor.
 *
 * s           - encoder context
 * mb_x, mb_y  - block coordinates
 * plane_index - 0 uses block_size directly, non-zero planes use block_size/2
 *
 * Only part of the body is present in this excerpt; loop headers and the
 * conditions guarding several statements below are missing.
 */
767 static int get_4block_rd(
SnowContext *s,
int mb_x,
int mb_y,
int plane_index){
771 const int block_w = plane_index ? block_size/2 : block_size;
773 const int obmc_stride= plane_index ? block_size : 2*block_size;
776 uint8_t *src= s-> input_picture.data[plane_index];
781 const int w= p->
width;
/* i%3 and i/3 select a column/row offset in -1..1 (for i in 0..8), i.e. a
 * 3x3 neighbourhood around (mb_x, mb_y); (x, y) is that neighbour's origin
 * shifted by half a block. */
788 int mb_x2= mb_x + (i%3) - 1;
789 int mb_y2= mb_y + (i/3) - 1;
790 int x= block_w*mb_x2 + block_w/2;
791 int y= block_w*mb_y2 + block_w/2;
794 x, y, block_w, block_w, w, h, 0, ref_stride, obmc_stride, mb_x2, mb_y2, 1, 1, plane_index);
/* Copy source pixels into dst for the parts of the block that fall above row
 * 0 or at/below row h, so those positions compare equal in the metric below.
 * NOTE(review): negative y2 addresses memory before the plane origin;
 * presumably both buffers carry edge padding -- confirm. */
797 for(y2= y; y2<0; y2++)
798 memcpy(dst + x + y2*ref_stride, src + x + y2*ref_stride, block_w);
799 for(y2= h; y2<y+block_w; y2++)
800 memcpy(dst + x + y2*ref_stride, src + x + y2*ref_stride, block_w);
/* NOTE(review): the lengths -x and x+block_w - w are valid memcpy sizes only
 * when x < 0 and x+block_w > w respectively; the guarding conditions are not
 * visible in this excerpt. */
802 for(y2= y; y2<y+block_w; y2++)
803 memcpy(dst + x + y2*ref_stride, src + x + y2*ref_stride, -x);
806 for(y2= y; y2<y+block_w; y2++)
807 memcpy(dst + w + y2*ref_stride, src + w + y2*ref_stride, x+block_w - w);
/* The comparison table is indexed by (block_w==8): entry 1 for 8-wide blocks,
 * entry 0 for 16-wide blocks; no other width is supported here. */
810 assert(block_w== 8 || block_w==16);
811 distortion += s->
dsp.
me_cmp[block_w==8](&s->
m, src + x + y*ref_stride, dst + x + y*ref_stride, ref_stride, block_w);
/* Rate: the block itself (with w = 2) plus the neighbours listed in dxy; when
 * merged is non-zero the first four entries (the 2x2 group itself) are
 * skipped. Entry {-1,2} can yield x == -1, which get_block_bits rejects. */
824 rate = get_block_bits(s, mb_x, mb_y, 2);
825 for(i=merged?4:0; i<9; i++){
826 static const int dxy[9][2] = {{0,0},{1,0},{0,1},{1,1},{2,0},{2,1},{-1,2},{0,2},{1,2}};
827 rate += get_block_bits(s, mb_x + dxy[i][0], mb_y + dxy[i][1], 1);
830 return distortion + rate*penalty_factor;
834 const int w= b->
width;
847 int l=0, lt=0,
t=0, rt=0;
851 t= src[x + (y-1)*stride];
853 lt= src[x - 1 + (y-1)*stride];
856 rt= src[x + 1 + (y-1)*stride];
869 if(px<b->parent->width && py<b->parent->height)
870 p= parent[px + py*2*
stride];
874 runs[run_index++]=
run;
882 max_index= run_index;
883 runs[run_index++]=
run;
885 run= runs[run_index++];
888 if(run_index <= max_index)
898 int l=0, lt=0,
t=0, rt=0;
902 t= src[x + (y-1)*stride];
904 lt= src[x - 1 + (y-1)*stride];
907 rt= src[x + 1 + (y-1)*stride];
920 if(px<b->parent->width && py<b->parent->height)
921 p= parent[px + py*2*
stride];
929 run= runs[run_index++];
931 if(run_index <= max_index)
941 int l2= 2*
FFABS(l) + (l<0);
956 return encode_subband_c0run(s, b, src, parent, stride, orientation);
/*
 * check_block: evaluates candidate parameters p for block (mb_x, mb_y).
 *
 * s          - encoder context
 * mb_x, mb_y - block coordinates; asserted non-negative, mb_x < b_stride
 * p          - candidate values. The [3] in the declaration is documentation
 *              only: in C this parameter is a plain int pointer, so the
 *              compiler does not enforce the element count.
 * intra      - non-zero for an intra candidate (usage not visible here)
 * obmc_edged - forwarded unchanged to get_block_rd()
 * best_rd    - in/out best score (update logic not visible here)
 *
 * NOTE(review): the return statement and the code that compares rd with
 * *best_rd are outside this excerpt.
 */
960 static av_always_inline int check_block(
SnowContext *s,
int mb_x,
int mb_y,
int p[3],
int intra,
const uint8_t *obmc_edged,
int *best_rd){
967 assert(mb_x>=0 && mb_y>=0);
968 assert(mb_x<b_stride);
/* Reads three elements of p. NOTE(review): the condition guarding these
 * stores is not visible; presumably they run only when intra is set. That
 * matters because check_block_inter passes a two-element array. */
971 block->
color[0] = p[0];
972 block->
color[1] = p[1];
973 block->
color[2] = p[2];
/* Score the candidate on plane 0. */
987 rd= get_block_rd(s, mb_x, mb_y, 0, obmc_edged);
/*
 * check_block_inter: convenience wrapper around check_block() for a
 * two-value candidate. Packs p0 and p1 into a local array, calls
 * check_block() with intra = 0 and returns its result unchanged.
 *
 * s          - encoder context
 * mb_x, mb_y - block coordinates
 * p0, p1     - candidate values (callers pass a motion vector's x and y)
 * obmc_edged - forwarded to check_block()
 * best_rd    - forwarded to check_block()
 */
1001 static av_always_inline int check_block_inter(
SnowContext *s,
int mb_x,
int mb_y,
int p0,
int p1,
const uint8_t *obmc_edged,
int *best_rd){
/* NOTE(review): check_block() is declared with "int p[3]" and contains a read
 * of p[2]; this array has only two elements. That is safe only if the p[2]
 * read is skipped when intra == 0 -- confirm. Declaring three elements here
 * (third one zero) would remove the hazard and the compiler diagnostics newer
 * toolchains emit for the size mismatch. */
1002 int p[2] = {p0, p1};
1003 return check_block(s, mb_x, mb_y, p, 0, obmc_edged, best_rd);
1009 BlockNode backup[4]= {block[0], block[1], block[b_stride], block[b_stride+1]};
1013 assert(mb_x>=0 && mb_y>=0);
1014 assert(mb_x<b_stride);
1015 assert(((mb_x|mb_y)&1) == 0);
1027 block[1]= block[b_stride]= block[b_stride+1]= *
block;
1029 rd= get_4block_rd(s, mb_x, mb_y, 0);
1036 block[0]= backup[0];
1037 block[1]= backup[1];
1038 block[b_stride]= backup[2];
1039 block[b_stride+1]= backup[3];
1045 int pass, mb_x, mb_y;
1048 const int b_stride= b_width;
1055 for(mb_y= 0; mb_y<s->
b_height; mb_y++)
1056 for(mb_x= 0; mb_x<s->
b_width; mb_x++)
1057 encode_q_branch(s, 0, mb_x, mb_y);
1062 for(pass=0; pass<25; pass++){
1065 for(mb_y= 0; mb_y<b_height; mb_y++){
1066 for(mb_x= 0; mb_x<b_width; mb_x++){
1067 int dia_change, i, j, ref;
1068 int best_rd= INT_MAX, ref_rd;
1070 const int index= mb_x + mb_y * b_stride;
1079 BlockNode *brb= mb_x+1<b_width && mb_y+1<b_height ? &s->
block[index+b_stride+1] :
NULL;
1081 uint8_t obmc_edged[b_w*2][b_w*2];
1098 for(y=0; y<b_w*2; y++)
1099 memset(obmc_edged[y], obmc_edged[y][0] + obmc_edged[y][b_w-1], b_w);
1100 if(mb_x==b_stride-1)
1101 for(y=0; y<b_w*2; y++)
1102 memset(obmc_edged[y]+b_w, obmc_edged[y][b_w] + obmc_edged[y][b_w*2-1], b_w);
1104 for(x=0; x<b_w*2; x++)
1105 obmc_edged[0][x] += obmc_edged[b_w-1][x];
1106 for(y=1; y<b_w; y++)
1107 memcpy(obmc_edged[y], obmc_edged[0], b_w*2);
1109 if(mb_y==b_height-1){
1110 for(x=0; x<b_w*2; x++)
1111 obmc_edged[b_w*2-1][x] += obmc_edged[b_w][x];
1112 for(y=b_w; y<b_w*2-1; y++)
1113 memcpy(obmc_edged[y], obmc_edged[b_w*2-1], b_w*2);
1118 if(mb_x==0 || mb_y==0 || mb_x==b_width-1 || mb_y==b_height-1){
1119 uint8_t *src= s-> input_picture.data[0];
1123 const int sx= block_w*mb_x - block_w/2;
1124 const int sy= block_w*mb_y - block_w/2;
1130 memcpy(dst + sx + y*stride, src + sx + y*stride, block_w*2);
1131 for(y=h; y<sy+block_w*2; y++)
1132 memcpy(dst + sx + y*stride, src + sx + y*stride, block_w*2);
1134 for(y=sy; y<sy+block_w*2; y++)
1135 memcpy(dst + sx + y*stride, src + sx + y*stride, -sx);
1137 if(sx+block_w*2 > w){
1138 for(y=sy; y<sy+block_w*2; y++)
1139 memcpy(dst + w + y*stride, src + w + y*stride, sx+block_w*2 - w);
1145 color[i]=
get_dc(s, mb_x, mb_y, i);
1150 check_block(s, mb_x, mb_y, color0, 1, *obmc_edged, &best_rd);
1152 check_block_inter(s, mb_x, mb_y, block->
mx, block->
my, *obmc_edged, &best_rd);
1163 check_block_inter(s, mb_x, mb_y, mvr[0][0], mvr[0][1], *obmc_edged, &best_rd);
1164 check_block_inter(s, mb_x, mb_y, 0, 0, *obmc_edged, &best_rd);
1166 check_block_inter(s, mb_x, mb_y, mvr[-b_stride][0], mvr[-b_stride][1], *obmc_edged, &best_rd);
1168 check_block_inter(s, mb_x, mb_y, mvr[-1][0], mvr[-1][1], *obmc_edged, &best_rd);
1170 check_block_inter(s, mb_x, mb_y, mvr[1][0], mvr[1][1], *obmc_edged, &best_rd);
1172 check_block_inter(s, mb_x, mb_y, mvr[b_stride][0], mvr[b_stride][1], *obmc_edged, &best_rd);
1180 dia_change |= check_block_inter(s, mb_x, mb_y, block->
mx+4*(i-j), block->
my+(4*j), *obmc_edged, &best_rd);
1181 dia_change |= check_block_inter(s, mb_x, mb_y, block->
mx-4*(i-j), block->
my-(4*j), *obmc_edged, &best_rd);
1182 dia_change |= check_block_inter(s, mb_x, mb_y, block->
mx+4*(i-j), block->
my-(4*j), *obmc_edged, &best_rd);
1183 dia_change |= check_block_inter(s, mb_x, mb_y, block->
mx-4*(i-j), block->
my+(4*j), *obmc_edged, &best_rd);
1189 static const int square[8][2]= {{+1, 0},{-1, 0},{ 0,+1},{ 0,-1},{+1,+1},{-1,-1},{+1,-1},{-1,+1},};
1192 dia_change |= check_block_inter(s, mb_x, mb_y, block->
mx+square[i][0], block->
my+square[i][1], *obmc_edged, &best_rd);
1196 mvr[0][0]= block->
mx;
1197 mvr[0][1]= block->
my;
1198 if(ref_rd > best_rd){
1205 check_block(s, mb_x, mb_y, color, 1, *obmc_edged, &best_rd);
1227 for(mb_y= 0; mb_y<b_height; mb_y+=2){
1228 for(mb_x= 0; mb_x<b_width; mb_x+=2){
1230 int best_rd, init_rd;
1231 const int index= mb_x + mb_y * b_stride;
1236 b[2]= b[0]+b_stride;
1247 init_rd= best_rd= get_4block_rd(s, mb_x, mb_y, 0);
1250 check_4block_inter(s, mb_x, mb_y,
1251 (b[0]->mx + b[1]->mx + b[2]->mx + b[3]->mx + 2) >> 2,
1252 (b[0]->my + b[1]->my + b[2]->my + b[3]->my + 2) >> 2, 0, &best_rd);
1256 check_4block_inter(s, mb_x, mb_y, b[i]->mx, b[i]->my, b[i]->ref, &best_rd);
1258 if(init_rd != best_rd)
/*
 * encode_blocks: top-level block encoding pass. For a block position (x, y)
 * it starts the recursive encoder at level 0, using either encode_q_branch2()
 * or encode_q_branch().
 *
 * s      - encoder context
 * search - mode selector; it is passed as 1 and as 0 from different call
 *          sites in this file
 *
 * NOTE(review): the loops over x/y and the condition that chooses between the
 * two encoders are not part of this excerpt; how search influences that
 * choice cannot be confirmed from here.
 */
1266 static void encode_blocks(
SnowContext *s,
int search){
1281 encode_q_branch2(s, 0, x, y);
1283 encode_q_branch (s, 0, x, y);
1289 const int w= b->
width;
1293 int x,y, thres1, thres2;
1298 dst[x + y*stride]= src[x + y*stride];
1302 bias= bias ? 0 : (3*qmul)>>3;
1309 int i= src[x + y*
stride];
1311 if((
unsigned)(i+thres1) > thres2){
1329 int i= src[x + y*
stride];
1331 if((
unsigned)(i+thres1) > thres2){
1334 i= (i + bias) / qmul;
1339 i= (i + bias) / qmul;
1350 const int w= b->
width;
1361 int i= src[x + y*
stride];
1372 const int w= b->
width;
1376 for(y=h-1; y>=0; y--){
1377 for(x=w-1; x>=0; x--){
1382 if(y && x+1<w) src[i] -=
mid_pred(src[i - 1], src[i - stride], src[i - stride + 1]);
1383 else src[i] -= src[i - 1];
1385 if(y) src[i] -=
mid_pred(src[i - 1], src[i - stride], src[i - 1] + src[i - stride] - src[i - 1 - stride]);
1386 else src[i] -= src[i - 1];
1389 if(y) src[i] -= src[i -
stride];
1396 const int w= b->
width;
1406 if(y && x+1<w) src[i] +=
mid_pred(src[i - 1], src[i - stride], src[i - stride + 1]);
1407 else src[i] += src[i - 1];
1409 if(y) src[i] +=
mid_pred(src[i - 1], src[i - stride], src[i - 1] + src[i - stride] - src[i - 1 - stride]);
1410 else src[i] += src[i - 1];
1413 if(y) src[i] += src[i -
stride];
1420 int plane_index,
level, orientation;
1422 for(plane_index=0; plane_index<2; plane_index++){
1424 for(orientation=level ? 1:0; orientation<4; orientation++){
1425 if(orientation==2)
continue;
1436 memset(kstate,
MID_STATE,
sizeof(kstate));
1446 for(plane_index=0; plane_index<2; plane_index++){
1471 for(plane_index=0; plane_index<2; plane_index++){
1479 for(plane_index=0; plane_index<2; plane_index++){
1483 for(i= p->
htaps/2; i; i--)
1503 static void update_last_header_values(
SnowContext *s){
1507 for(plane_index=0; plane_index<2; plane_index++){
1523 static int qscale2qlog(
int qscale){
1533 uint32_t coef_sum= 0;
1534 int level, orientation, delta_qlog;
1537 for(orientation=level ? 1 : 0; orientation<4; orientation++){
1540 const int w= b->
width;
1542 const int stride= b->
stride;
1545 const int qdiv= (1<<16)/qmul;
1550 buf[x+y*stride]= b->
buf[x+y*stride];
1552 decorrelate(s, b, buf, stride, 1, 0);
1555 coef_sum+= abs(buf[x+y*stride]) * qdiv >> 16;
1560 coef_sum = (uint64_t)coef_sum * coef_sum >> 16;
1561 assert(coef_sum < INT_MAX);
1576 s->
qlog+= delta_qlog;
1581 int width = p->
width;
1583 int level, orientation, x, y;
1586 for(orientation=level ? 1 : 0; orientation<4; orientation++){
1595 for(x=0; x<
width; x++){
1601 b->
qlog= (int)(log(352256.0/sqrt(error)) / log(pow(2.0, 1.0/
QROOT))+0.5);
1612 int level, orientation, plane_index, i, y;
1621 for(y=0; y<(height>>shift); y++)
1661 int block_width = (width +15)>>4;
1662 int block_height= (height+15)>>4;
1671 s->
m. new_picture.f.data[0] = s-> input_picture.data[0];
1672 s->
m. last_picture_ptr= &s->
m. last_picture;
1720 for(plane_index=0; plane_index<3; plane_index++){
1721 calculate_visual_weight(s, &s->
plane[plane_index]);
1727 encode_blocks(s, 1);
1730 for(plane_index=0; plane_index<3; plane_index++){
1739 if(pict->
data[plane_index])
1779 int delta_qlog = ratecontrol_1pass(s, pict);
1780 if (delta_qlog <= INT_MIN)
1788 encode_blocks(s, 0);
1793 for(orientation=level ? 1 : 0; orientation<4; orientation++){
1808 for(orientation=level ? 1 : 0; orientation<4; orientation++){
1830 pict->
data[plane_index][y*pict->
linesize[plane_index] + x];
1841 if(pict->
data[plane_index])
1854 update_last_header_values(s);
1895 #define OFFSET(x) offsetof(SnowContext, x)
1896 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
1898 {
"memc_only",
"Only do ME/MC (I frames -> ref, P frame -> ME+MC).",
OFFSET(memc_only),
AV_OPT_TYPE_INT, { 0 }, 0, 1,
VE },
1902 static const AVClass snowenc_class = {
1918 .priv_class = &snowenc_class,