29 uint32_t av_unused * const score_map= c->score_map;\
30 const int av_unused xmin= c->xmin;\
31 const int av_unused ymin= c->ymin;\
32 const int av_unused xmax= c->xmax;\
33 const int av_unused ymax= c->ymax;\
34 uint8_t *mv_penalty= c->current_mv_penalty;\
35 const int pred_x= c->pred_x;\
36 const int pred_y= c->pred_y;\
38 #define CHECK_HALF_MV(dx, dy, x, y)\
40 const int hx= 2*(x)+(dx);\
41 const int hy= 2*(y)+(dy);\
42 d= cmp_hpel(s, x, y, dx, dy, size, h, ref_index, src_index, cmp_sub, chroma_cmp_sub, flags);\
43 d += (mv_penalty[hx - pred_x] + mv_penalty[hy - pred_y])*penalty_factor;\
44 COPY3_IF_LT(dmin, d, bx, hx, by, hy)\
48 int *mx_ptr,
int *my_ptr,
int dmin,
49 int src_index,
int ref_index,
53 const int mx = *mx_ptr;
54 const int my = *my_ptr;
74 dmin=
cmp(s, mx, my, 0, 0, size, h, ref_index, src_index, cmp_sub, chroma_cmp_sub, flags);
75 if(mx || my || size>0)
79 if (mx > xmin && mx < xmax &&
80 my > ymin && my < ymax) {
92 #if defined(ASSERT_LEVEL) && ASSERT_LEVEL > 1
143 av_assert2(bx >= xmin*2 && bx <= xmax*2 && by >= ymin*2 && by <= ymax*2);
153 int *mx_ptr,
int *my_ptr,
int dmin,
154 int src_index,
int ref_index,
163 int src_index,
int ref_index,
int size,
171 const int mask= 1+2*qpel;
182 d=
cmp(s, mx>>(qpel+1), my>>(qpel+1), mx&mask, my&mask, size, h, ref_index, src_index, cmp_sub, chroma_cmp_sub, flags);
184 if(add_rate && (mx || my || size>0))
191 int ref_index,
int size,
int h,
int add_rate)
193 return get_mb_score(s, mx, my, src_index, ref_index, size, h, add_rate);
196 #define CHECK_QUARTER_MV(dx, dy, x, y)\
198 const int hx= 4*(x)+(dx);\
199 const int hy= 4*(y)+(dy);\
200 d= cmp_qpel(s, x, y, dx, dy, size, h, ref_index, src_index, cmpf, chroma_cmpf, flags);\
201 d += (mv_penalty[hx - pred_x] + mv_penalty[hy - pred_y])*penalty_factor;\
202 COPY3_IF_LT(dmin, d, bx, hx, by, hy)\
206 int *mx_ptr,
int *my_ptr,
int dmin,
207 int src_index,
int ref_index,
211 const int mx = *mx_ptr;
212 const int my = *my_ptr;
216 uint32_t *map= c->
map;
237 dmin=
cmp(s, mx, my, 0, 0, size, h, ref_index, src_index, cmp_sub, chroma_cmp_sub, flags);
238 if(mx || my || size>0)
242 if (mx > xmin && mx < xmax &&
243 my > ymin && my < ymax) {
244 int bx=4*mx, by=4*my;
249 const int l= score_map[(index- 1 )&(
ME_MAP_SIZE-1)];
256 memset(best, 64,
sizeof(
int)*8);
263 for(ny= -3; ny <= 3; ny++){
264 for(nx= -3; nx <= 3; nx++){
266 const int64_t
t2= nx*nx*(tr + tl - 2*
t) + 4*nx*(tr-tl) + 32*
t;
267 const int64_t
c2= nx*nx*( r + l - 2*
c) + 4*nx*( r- l) + 32*
c;
268 const int64_t b2= nx*nx*(br + bl - 2*
b) + 4*nx*(br-bl) + 32*
b;
269 int score= (ny*ny*(b2 + t2 - 2*
c2) + 4*ny*(b2 - t2) + 32*c2 + 512)>>10;
272 if((nx&3)==0 && (ny&3)==0)
continue;
281 memmove(&best[i+1], &best[i],
sizeof(
int)*(7-i));
282 memmove(&best_pos[i+1][0], &best_pos[i][0],
sizeof(
int)*2*(7-i));
284 best_pos[i][0]= nx + 4*mx;
285 best_pos[i][1]= ny + 4*my;
294 const int cx = 4*(r - l);
295 const int cx2= r + l - 2*
c;
296 const int cy = 4*(b -
t);
297 const int cy2= b + t - 2*
c;
303 tl=
cmp(s, mx-1, my-1, 0, 0, size, h, ref_index, src_index, cmpf, chroma_cmpf, flags);
306 cxy= 2*tl + (cx + cy)/4 - (cx2 + cy2) - 2*
c;
312 av_assert2(16*cxy + 16*cy2 + 16*cx2 - 4*cy - 4*cx + 32*c == 32*tl);
314 for(ny= -3; ny <= 3; ny++){
315 for(nx= -3; nx <= 3; nx++){
317 int score= ny*nx*cxy + nx*nx*cx2 + ny*ny*cy2 + nx*cx + ny*cy + 32*
c;
320 if((nx&3)==0 && (ny&3)==0)
continue;
328 memmove(&best[i+1], &best[i],
sizeof(
int)*(7-i));
329 memmove(&best_pos[i+1][0], &best_pos[i][0],
sizeof(
int)*2*(7-i));
331 best_pos[i][0]= nx + 4*mx;
332 best_pos[i][1]= ny + 4*my;
339 for(i=0; i<subpel_quality; i++){
345 av_assert2(bx >= xmin*4 && bx <= xmax*4 && by >= ymin*4 && by <= ymax*4);
358 #define CHECK_MV(x,y)\
360 const unsigned key = ((y)<<ME_MAP_MV_BITS) + (x) + map_generation;\
361 const int index= (((y)<<ME_MAP_SHIFT) + (x))&(ME_MAP_SIZE-1);\
362 av_assert2((x) >= xmin);\
363 av_assert2((x) <= xmax);\
364 av_assert2((y) >= ymin);\
365 av_assert2((y) <= ymax);\
366 if(map[index]!=key){\
367 d= cmp(s, x, y, 0, 0, size, h, ref_index, src_index, cmpf, chroma_cmpf, flags);\
369 score_map[index]= d;\
370 d += (mv_penalty[((x)<<shift)-pred_x] + mv_penalty[((y)<<shift)-pred_y])*penalty_factor;\
371 COPY3_IF_LT(dmin, d, best[0], x, best[1], y)\
375 #define CHECK_CLIPPED_MV(ax,ay)\
379 const int Lx2= FFMAX(xmin, FFMIN(Lx, xmax));\
380 const int Ly2= FFMAX(ymin, FFMIN(Ly, ymax));\
384 #define CHECK_MV_DIR(x,y,new_dir)\
386 const unsigned key = ((y)<<ME_MAP_MV_BITS) + (x) + map_generation;\
387 const int index= (((y)<<ME_MAP_SHIFT) + (x))&(ME_MAP_SIZE-1);\
388 if(map[index]!=key){\
389 d= cmp(s, x, y, 0, 0, size, h, ref_index, src_index, cmpf, chroma_cmpf, flags);\
391 score_map[index]= d;\
392 d += (mv_penalty[((x)<<shift)-pred_x] + mv_penalty[((y)<<shift)-pred_y])*penalty_factor;\
402 #define check(x,y,S,v)\
403 if( (x)<(xmin<<(S)) ) av_log(NULL, AV_LOG_ERROR, "%d %d %d %d %d xmin" #v, xmin, (x), (y), s->mb_x, s->mb_y);\
404 if( (x)>(xmax<<(S)) ) av_log(NULL, AV_LOG_ERROR, "%d %d %d %d %d xmax" #v, xmax, (x), (y), s->mb_x, s->mb_y);\
405 if( (y)<(ymin<<(S)) ) av_log(NULL, AV_LOG_ERROR, "%d %d %d %d %d ymin" #v, ymin, (x), (y), s->mb_x, s->mb_y);\
406 if( (y)>(ymax<<(S)) ) av_log(NULL, AV_LOG_ERROR, "%d %d %d %d %d ymax" #v, ymax, (x), (y), s->mb_x, s->mb_y);\
408 #define LOAD_COMMON2\
409 uint32_t *map= c->map;\
410 const int qpel= flags&FLAG_QPEL;\
411 const int shift= 1+qpel;\
414 int src_index,
int ref_index,
int const penalty_factor,
428 const unsigned key = (best[1]<<
ME_MAP_MV_BITS) + best[0] + map_generation;
431 score_map[
index]=
cmp(s, best[0], best[1], 0, 0, size, h, ref_index, src_index, cmpf, chroma_cmpf, flags);
438 const int dir= next_dir;
439 const int x= best[0];
440 const int y= best[1];
455 int src_index,
int ref_index,
int const penalty_factor,
468 for(dia_size=1; dia_size<=4; dia_size++){
470 const int x= best[0];
471 const int y= best[1];
473 if(dia_size&(dia_size-1))
continue;
475 if( x + dia_size > xmax
476 || x - dia_size < xmin
477 || y + dia_size > ymax
478 || y - dia_size < ymin)
481 for(dir= 0; dir<dia_size; dir+=2){
484 CHECK_MV(x + dir , y + dia_size - dir);
485 CHECK_MV(x + dia_size - dir, y - dir );
486 CHECK_MV(x - dir , y - dia_size + dir);
487 CHECK_MV(x - dia_size + dir, y + dir );
490 if(x!=best[0] || y!=best[1])
497 int src_index,
int ref_index,
int const penalty_factor,
498 int size,
int h,
int flags,
int dia_size)
506 const int dec= dia_size & (dia_size-1);
511 for(;dia_size; dia_size= dec ? dia_size-1 : dia_size>>1){
524 }
while(best[0] != x || best[1] != y);
531 int src_index,
int ref_index,
int const penalty_factor,
541 const int dec= dia_size & (dia_size-1);
542 static const int hex[8][2]={{-2, 0}, {-1,-1}, { 0,-2}, { 1,-1},
543 { 2, 0}, { 1, 1}, { 0, 2}, {-1, 1}};
548 for(; dia_size; dia_size= dec ? dia_size-1 : dia_size>>1){
555 }
while(best[0] != x || best[1] != y);
569 int src_index,
int ref_index,
int const penalty_factor,
577 int x,
y,x2,y2, i, j, d;
578 const int dia_size= c->
dia_size&0xFE;
579 static const int hex[16][2]={{-4,-2}, {-4,-1}, {-4, 0}, {-4, 1}, {-4, 2},
580 { 4,-2}, { 4,-1}, { 4, 0}, { 4, 1}, { 4, 2},
581 {-2, 3}, { 0, 4}, { 2, 3},
582 {-2,-3}, { 0,-4}, { 2,-3},};
589 for(x2=
FFMAX(x-dia_size+1, xmin); x2<=
FFMIN(x+dia_size-1,xmax); x2+=2){
592 for(y2=
FFMAX(y-dia_size/2+1, ymin); y2<=
FFMIN(y+dia_size/2-1,ymax); y2+=2){
598 for(y2=
FFMAX(y-2, ymin); y2<=
FFMIN(y+2,ymax); y2++){
599 for(x2=
FFMAX(x-2, xmin); x2<=
FFMIN(x+2,xmax); x2++){
606 for(j=1; j<=dia_size/4; j++){
612 return hex_search(s, best, dmin, src_index, ref_index, penalty_factor, size, h, flags, 2);
616 int src_index,
int ref_index,
int const penalty_factor,
625 const int dia_size= c->
dia_size&0xFF;
630 for(y=
FFMAX(-dia_size, ymin); y<=
FFMIN(dia_size,ymax); y++){
631 for(x=
FFMAX(-dia_size, xmin); x<=
FFMIN(dia_size,xmax); x++){
650 #define SAB_CHECK_MV(ax,ay)\
652 const unsigned key = ((ay)<<ME_MAP_MV_BITS) + (ax) + map_generation;\
653 const int index= (((ay)<<ME_MAP_SHIFT) + (ax))&(ME_MAP_SIZE-1);\
654 if(map[index]!=key){\
655 d= cmp(s, ax, ay, 0, 0, size, h, ref_index, src_index, cmpf, chroma_cmpf, flags);\
657 score_map[index]= d;\
658 d += (mv_penalty[((ax)<<shift)-pred_x] + mv_penalty[((ay)<<shift)-pred_y])*penalty_factor;\
659 if(d < minima[minima_count-1].height){\
662 while(d >= minima[j].height) j++;\
664 memmove(&minima [j+1], &minima [j], (minima_count - j - 1)*sizeof(Minima));\
666 minima[j].checked= 0;\
667 minima[j].height= d;\
677 #define MAX_SAB_SIZE ME_MAP_SIZE
679 int src_index,
int ref_index,
int const penalty_factor,
700 uint32_t key= map[i];
706 minima[j].
height= score_map[i];
713 if( minima[j].x > xmax || minima[j].x < xmin
714 || minima[j].
y > ymax || minima[j].
y < ymin)
718 if(minima[j].x || minima[j].
y)
726 for(; j<minima_count; j++){
727 minima[j].
height=256*256*256*64;
729 minima[j].
x= minima[j].
y=0;
732 for(i=0; i<minima_count; i++){
733 const int x= minima[i].
x;
734 const int y= minima[i].
y;
737 if(minima[i].
checked)
continue;
739 if( x >= xmax || x <= xmin
740 || y >= ymax || y <= ymin)
751 best[0]= minima[0].
x;
752 best[1]= minima[0].
y;
755 if( best[0] < xmax && best[0] > xmin
756 && best[1] < ymax && best[1] > ymin){
768 int src_index,
int ref_index,
int const penalty_factor,
781 for(dia_size=1; dia_size<=c->
dia_size; dia_size++){
783 const int x= best[0];
784 const int y= best[1];
786 start=
FFMAX(0, y + dia_size - ymax);
787 end =
FFMIN(dia_size, xmax - x + 1);
788 for(dir= start; dir<
end; dir++){
792 CHECK_MV(x + dir , y + dia_size - dir);
795 start=
FFMAX(0, x + dia_size - xmax);
796 end =
FFMIN(dia_size, y - ymin + 1);
797 for(dir= start; dir<
end; dir++){
801 CHECK_MV(x + dia_size - dir, y - dir );
804 start=
FFMAX(0, -y + dia_size + ymin );
805 end =
FFMIN(dia_size, x - xmin + 1);
806 for(dir= start; dir<
end; dir++){
810 CHECK_MV(x - dir , y - dia_size + dir);
813 start=
FFMAX(0, -x + dia_size + xmin );
814 end =
FFMIN(dia_size, ymax - y + 1);
815 for(dir= start; dir<
end; dir++){
819 CHECK_MV(x - dia_size + dir, y + dir );
822 if(x!=best[0] || y!=best[1])
829 int src_index,
int ref_index,
int const penalty_factor,
833 return funny_diamond_search(s, best, dmin, src_index, ref_index, penalty_factor, size, h, flags);
835 return sab_diamond_search(s, best, dmin, src_index, ref_index, penalty_factor, size, h, flags);
837 return small_diamond_search(s, best, dmin, src_index, ref_index, penalty_factor, size, h, flags);
839 return full_search(s, best, dmin, src_index, ref_index, penalty_factor, size, h, flags);
841 return umh_search(s, best, dmin, src_index, ref_index, penalty_factor, size, h, flags);
843 return hex_search(s, best, dmin, src_index, ref_index, penalty_factor, size, h, flags, c->
dia_size&0xFF);
845 return l2s_dia_search(s, best, dmin, src_index, ref_index, penalty_factor, size, h, flags);
847 return var_diamond_search(s, best, dmin, src_index, ref_index, penalty_factor, size, h, flags);
857 int P[10][2],
int src_index,
int ref_index, int16_t (*last_mv)[2],
858 int ref_mv_scale,
int flags,
int size,
int h)
868 unsigned map_generation;
871 const int ref_mv_xy= s->
mb_x + s->
mb_y*ref_mv_stride;
890 dmin=
cmp(s, 0, 0, 0, 0, size, h, ref_index, src_index, cmpf, chroma_cmpf, flags);
891 map[0]= map_generation;
902 (last_mv[ref_mv_xy][1]*ref_mv_scale + (1<<15))>>16)
919 (last_mv[ref_mv_xy][1]*ref_mv_scale + (1<<15))>>16)
927 (last_mv[ref_mv_xy-1][1]*ref_mv_scale + (1<<15))>>16)
929 CHECK_CLIPPED_MV((last_mv[ref_mv_xy-ref_mv_stride][0]*ref_mv_scale + (1<<15))>>16,
930 (last_mv[ref_mv_xy-ref_mv_stride][1]*ref_mv_scale + (1<<15))>>16)
933 (last_mv[ref_mv_xy+1][1]*ref_mv_scale + (1<<15))>>16)
935 CHECK_CLIPPED_MV((last_mv[ref_mv_xy+ref_mv_stride][0]*ref_mv_scale + (1<<15))>>16,
936 (last_mv[ref_mv_xy+ref_mv_stride][1]*ref_mv_scale + (1<<15))>>16)
942 const int xstart=
FFMAX(0, s->
mb_x - count);
943 const int ystart=
FFMAX(0, s->
mb_y - count);
948 for(mb_y=ystart; mb_y<yend; mb_y++){
950 for(mb_x=xstart; mb_x<xend; mb_x++){
951 const int xy= mb_x + 1 + (mb_y + 1)*ref_mv_stride;
952 int mx= (last_mv[xy][0]*ref_mv_scale + (1<<15))>>16;
953 int my= (last_mv[xy][1]*ref_mv_scale + (1<<15))>>16;
955 if(mx>xmax || mx<xmin || my>ymax || my<ymin)
continue;
962 dmin=
diamond_search(s, best, dmin, src_index, ref_index, penalty_factor, size, h, flags);
973 int P[10][2],
int src_index,
int ref_index,
974 int16_t (*last_mv)[2],
int ref_mv_scale,
979 if(c->
flags==0 && h==16 && size==0){
980 return epzs_motion_search_internal(s, mx_ptr, my_ptr, P, src_index, ref_index, last_mv, ref_mv_scale, 0, 0, 16);
984 return epzs_motion_search_internal(s, mx_ptr, my_ptr, P, src_index, ref_index, last_mv, ref_mv_scale, c->
flags, size, h);
989 int *mx_ptr,
int *my_ptr,
int P[10][2],
990 int src_index,
int ref_index, int16_t (*last_mv)[2],
996 unsigned map_generation;
1001 const int ref_mv_xy= s->
mb_x + s->
mb_y *ref_mv_stride;
1018 (last_mv[ref_mv_xy][1]*ref_mv_scale + (1<<15))>>16)
1028 (last_mv[ref_mv_xy][1]*ref_mv_scale + (1<<15))>>16)
1032 (last_mv[ref_mv_xy+1][1]*ref_mv_scale + (1<<15))>>16)
1034 CHECK_CLIPPED_MV((last_mv[ref_mv_xy+ref_mv_stride][0]*ref_mv_scale + (1<<15))>>16,
1035 (last_mv[ref_mv_xy+ref_mv_stride][1]*ref_mv_scale + (1<<15))>>16)
1038 dmin=
diamond_search(s, best, dmin, src_index, ref_index, penalty_factor, size, h, flags);
1048 int *mx_ptr,
int *my_ptr,
int P[10][2],
1049 int src_index,
int ref_index, int16_t (*last_mv)[2],
1055 unsigned map_generation;
1060 const int ref_mv_xy= s->
mb_x + s->
mb_y *ref_mv_stride;
1077 (last_mv[ref_mv_xy][1]*ref_mv_scale + (1<<15))>>16)
1087 (last_mv[ref_mv_xy][1]*ref_mv_scale + (1<<15))>>16)
1091 (last_mv[ref_mv_xy+1][1]*ref_mv_scale + (1<<15))>>16)
1093 CHECK_CLIPPED_MV((last_mv[ref_mv_xy+ref_mv_stride][0]*ref_mv_scale + (1<<15))>>16,
1094 (last_mv[ref_mv_xy+ref_mv_stride][1]*ref_mv_scale + (1<<15))>>16)
1097 dmin=
diamond_search(s, best, dmin, src_index, ref_index, penalty_factor, size, h, flags);