22 #ifndef AVCODEC_SNOW_H
23 #define AVCODEC_SNOW_H
/* QROOT is 2 raised to the power QSHIFT (QSHIFT is defined outside this excerpt). */
38 #define QROOT (1<<QSHIFT)
/*
 * NOTE(review): presumably the qlog value that selects lossless coding --
 * confirm against the users of this macro.
 * The replacement list is a bare negative literal without parentheses.
 */
39 #define LOSSLESS_QLOG -128
/* NOTE(review): presumably the upper bound on reference frames -- confirm against the arrays sized by it. */
41 #define MAX_REF_FRAMES 8
/* Base-2 logarithm of OBMC_MAX. */
43 #define LOG2_OBMC_MAX 8
/*
 * 1 << LOG2_OBMC_MAX, i.e. 256 with the value above.
 * NOTE(review): presumably the total weight the OBMC window entries sum to -- TODO confirm.
 */
44 #define OBMC_MAX (1<<(LOG2_OBMC_MAX))
59 .
color= {128,128,128},
/* Base-2 logarithm of MB_SIZE. */
67 #define LOG2_MB_SIZE 4
/* 1 << LOG2_MB_SIZE, i.e. 16 with the value above. */
68 #define MB_SIZE (1<<LOG2_MB_SIZE)
/* NOTE(review): presumably extra fractional precision bits used on the encoder side -- confirm against its users. */
69 #define ENCODER_EXTRA_BITS 4
/* NOTE(review): presumably the shift applied to the quantizer bias -- confirm against its users. */
157 #define QBIAS_SHIFT 3
/* NOTE(review): presumably the entry count of the motion-estimation cache -- confirm against the array it sizes. */
165 #define ME_CACHE_SIZE 1024
189 low[(*i)+1] = low[((*i)+1)>>1];
195 for (; (*i)>=0; (*i)-=2){
196 low[(*i)+1] = high[(*i)>>1];
197 low[*i] = low[(*i)>>1];
203 dst[i] = src[i] - ((mul * (ref[i] + ref[i + 1]) + add) >>
shift);
206 if((width^lift_high)&1){
207 dst[w] = src[w] - ((mul * 2 * ref[w] + add) >> shift);
213 dst[i] = src[i] + ((ref[i] + ref[(i+1)]+
W_BO + 4 * src[i]) >>
W_BS);
217 dst[w] = src[w] + ((2 * ref[w] +
W_BO + 4 * src[w]) >>
W_BS);
232 int plane_index,
int w,
int h);
236 static inline void snow_set_blocks(
SnowContext *
s,
int level,
int x,
int y,
int l,
int cb,
int cr,
int mx,
int my,
int ref,
int type){
239 const int index= (x + y*w) << rem_depth;
240 const int block_w= 1<<rem_depth;
253 for(j=0; j<block_w; j++){
254 for(i=0; i<block_w; i++){
268 (top ->
mx * scale[top ->
ref] + 128) >>8,
269 (tr ->
mx * scale[tr ->
ref] + 128) >>8);
271 (top ->
my * scale[top ->
ref] + 128) >>8,
272 (tr ->
my * scale[tr ->
ref] + 128) >>8);
286 static av_always_inline void add_yblock(
SnowContext *
s,
int sliced,
slice_buffer *sb,
IDWTELEM *dst,
uint8_t *dst8,
const uint8_t *obmc,
int src_x,
int src_y,
int b_w,
int b_h,
int w,
int h,
int dst_stride,
int src_stride,
int obmc_stride,
int b_x,
int b_y,
int add,
int offset_dst,
int plane_index){
289 const int b_stride= b_width;
303 }
else if(b_x + 1 >= b_width){
310 }
else if(b_y + 1 >= b_height){
318 if(!sliced && !offset_dst)
326 obmc -= src_y*obmc_stride;
328 if(!sliced && !offset_dst)
329 dst -= src_y*dst_stride;
336 if(b_w<=0 || b_h<=0)
return;
340 if(!sliced && offset_dst)
341 dst += src_x + src_y*dst_stride;
342 dst8+= src_x + src_y*src_stride;
345 ptmp= tmp + 3*tmp_step;
348 ff_snow_pred_block(s, block[0], tmp, src_stride, src_x, src_y, b_w, b_h, lt, plane_index, w, h);
355 ff_snow_pred_block(s, block[1], tmp, src_stride, src_x, src_y, b_w, b_h, rt, plane_index, w, h);
365 ff_snow_pred_block(s, block[2], tmp, src_stride, src_x, src_y, b_w, b_h, lb, plane_index, w, h);
376 ff_snow_pred_block(s, block[3], tmp, src_stride, src_x, src_y, b_w, b_h, rb, plane_index, w, h);
379 s->
dwt.
inner_add_yblock(obmc, obmc_stride, block, b_w, b_h, src_x,src_y, src_stride, sb, add, dst8);
381 for(y=0; y<b_h; y++){
383 const uint8_t *obmc1= obmc + y*obmc_stride;
384 const uint8_t *obmc2= obmc1+ (obmc_stride>>1);
385 const uint8_t *obmc3= obmc1+ obmc_stride*(obmc_stride>>1);
387 for(x=0; x<b_w; x++){
388 int v= obmc1[x] * block[3][x + y*src_stride]
389 +obmc2[x] * block[2][x + y*src_stride]
390 +obmc3[x] * block[1][x + y*src_stride]
391 +obmc4[x] * block[0][x + y*src_stride];
398 v += dst[x + y*dst_stride];
400 if(v&(~255)) v= ~(v>>31);
401 dst8[x + y*src_stride] =
v;
403 dst[x + y*dst_stride] -=
v;
416 int block_w = plane_index ? block_size>>s->
chroma_h_shift : block_size;
417 int block_h = plane_index ? block_size>>s->
chroma_v_shift : block_size;
419 const int obmc_stride= plane_index ? (2*block_size)>>s->
chroma_h_shift : 2*block_size;
430 for(y=block_h*mb_y; y<
FFMIN(h,block_h*(mb_y+1)); y++){
434 if(v&(~255)) v= ~(v>>31);
435 dst8[x + y*ref_stride]=
v;
439 for(y=block_h*mb_y; y<
FFMIN(h,block_h*(mb_y+1)); y++){
449 for(mb_x=0; mb_x<=mb_w; mb_x++){
451 block_w*mb_x - block_w/2,
452 block_h*mb_y - block_h/2,
455 w, ref_stride, obmc_stride,
457 add, 1, plane_index);
464 for(mb_y=0; mb_y<=mb_h; mb_y++)
468 static inline void set_blocks(
SnowContext *
s,
int level,
int x,
int y,
int l,
int cb,
int cr,
int mx,
int my,
int ref,
int type){
471 const int index= (x + y*w) << rem_depth;
472 const int block_w= 1<<rem_depth;
473 const int block_h= 1<<rem_depth;
486 for(j=0; j<block_h; j++){
487 for(i=0; i<block_w; i++){
502 c->
src[0][i]= src [i];
503 c->
ref[0][i]= ref [i] + offset[i];
/* Evaluates to 15 - FRAC_BITS (FRAC_BITS is defined outside this excerpt). */
513 #define QEXPSHIFT (7-FRAC_BITS+8) //FIXME try to change this to 0
521 const int el=
FFMIN(e, 10);
532 for(i=e-1; i>=el; i--){
533 put_rac(c, state+22+9, (a>>i)&1);
536 put_rac(c, state+22+i, (a>>i)&1);
540 put_rac(c, state+11 + el, v < 0);
557 for(i=e-1; i>=0; i--){
568 int r= log2>=0 ? 1<<log2 : 1;
581 for(i=log2-1; i>=0; i--){
582 put_rac(c, state+31-i, (v>>i)&1);
588 int r= log2>=0 ? 1<<log2 : 1;
593 while(log2<28 &&
get_rac(c, state+4+log2)){
599 for(i=log2-1; i>=0; i--){
607 const int w= b->
width;
626 if(y && prev_xc->
x == 0){
638 if(prev_xc->
x == x + 1)
644 if(x>>1 > parent_xc->
x){
647 if(x>>1 == parent_xc->
x){
652 int context=
av_log2(3*(l>>1) + (lt>>1) + (
t&~1) + (rt>>1) + (p>>1));
676 if(y) max_run=
FFMIN(run, prev_xc->
x - x - 2);
677 else max_run=
FFMIN(run, w-x-1);
679 max_run=
FFMIN(max_run, 2*parent_xc->
x - x - 1);
693 while(parent_xc->
x != parent->
width+1)
696 prev_parent_xc= parent_xc;
698 parent_xc= prev_parent_xc;