/* Include guard for this header; the matching #endif is outside this excerpt. */
22 #ifndef AVCODEC_SNOW_H
23 #define AVCODEC_SNOW_H
/* QROOT is 2^QSHIFT; QSHIFT itself is defined outside this excerpt. */
37 #define QROOT (1<<QSHIFT)
/* NOTE(review): presumably the qlog value that selects lossless coding - confirm at the use sites. */
38 #define LOSSLESS_QLOG -128
/* NOTE(review): presumably the upper bound on the number of reference frames - confirm at the use sites. */
40 #define MAX_REF_FRAMES 8
/* OBMC_MAX is derived as 2^LOG2_OBMC_MAX, i.e. 256 with the value below. */
42 #define LOG2_OBMC_MAX 8
43 #define OBMC_MAX (1<<(LOG2_OBMC_MAX))
58 .
color= {128,128,128},
/* MB_SIZE is derived as 2^LOG2_MB_SIZE, i.e. 16 with the value below. */
66 #define LOG2_MB_SIZE 4
67 #define MB_SIZE (1<<LOG2_MB_SIZE)
/* NOTE(review): presumably extra precision bits used on the encoder side - not used in this excerpt, confirm. */
68 #define ENCODER_EXTRA_BITS 4
/* NOTE(review): presumably the shift applied to the quantizer bias - not used in this excerpt, confirm. */
155 #define QBIAS_SHIFT 3
/* NOTE(review): presumably the number of entries in the motion-estimation cache - not used in this excerpt, confirm. */
162 #define ME_CACHE_SIZE 1024
186 low[(*i)+1] = low[((*i)+1)>>1];
192 for (; (*i)>=0; (*i)-=2){
193 low[(*i)+1] = high[(*i)>>1];
194 low[*i] = low[(*i)>>1];
200 dst[i] = src[i] - ((mul * (ref[i] + ref[i + 1]) + add) >>
shift);
203 if((width^lift_high)&1){
204 dst[w] = src[w] - ((mul * 2 * ref[w] + add) >> shift);
210 dst[i] = src[i] + ((ref[i] + ref[(i+1)]+
W_BO + 4 * src[i]) >>
W_BS);
214 dst[w] = src[w] + ((2 * ref[w] +
W_BO + 4 * src[w]) >>
W_BS);
229 int plane_index,
int w,
int h);
233 static inline void snow_set_blocks(
SnowContext *s,
int level,
int x,
int y,
int l,
int cb,
int cr,
int mx,
int my,
int ref,
int type){
236 const int index= (x + y*w) << rem_depth;
237 const int block_w= 1<<rem_depth;
250 for(j=0; j<block_w; j++){
251 for(i=0; i<block_w; i++){
265 (top ->
mx * scale[top ->
ref] + 128) >>8,
266 (tr ->
mx * scale[tr ->
ref] + 128) >>8);
268 (top ->
my * scale[top ->
ref] + 128) >>8,
269 (tr ->
my * scale[tr ->
ref] + 128) >>8);
283 static av_always_inline void add_yblock(
SnowContext *s,
int sliced,
slice_buffer *sb,
IDWTELEM *
dst,
uint8_t *dst8,
const uint8_t *obmc,
int src_x,
int src_y,
int b_w,
int b_h,
int w,
int h,
int dst_stride,
int src_stride,
int obmc_stride,
int b_x,
int b_y,
int add,
int offset_dst,
int plane_index){
286 const int b_stride= b_width;
300 }
else if(b_x + 1 >= b_width){
307 }
else if(b_y + 1 >= b_height){
315 if(!sliced && !offset_dst)
318 }
else if(src_x + b_w > w){
322 obmc -= src_y*obmc_stride;
324 if(!sliced && !offset_dst)
325 dst -= src_y*dst_stride;
327 }
else if(src_y + b_h> h){
331 if(b_w<=0 || b_h<=0)
return;
335 if(!sliced && offset_dst)
336 dst += src_x + src_y*dst_stride;
337 dst8+= src_x + src_y*src_stride;
340 ptmp= tmp + 3*tmp_step;
343 ff_snow_pred_block(s, block[0], tmp, src_stride, src_x, src_y, b_w, b_h, lt, plane_index, w, h);
350 ff_snow_pred_block(s, block[1], tmp, src_stride, src_x, src_y, b_w, b_h, rt, plane_index, w, h);
360 ff_snow_pred_block(s, block[2], tmp, src_stride, src_x, src_y, b_w, b_h, lb, plane_index, w, h);
371 ff_snow_pred_block(s, block[3], tmp, src_stride, src_x, src_y, b_w, b_h, rb, plane_index, w, h);
374 s->
dwt.
inner_add_yblock(obmc, obmc_stride, block, b_w, b_h, src_x,src_y, src_stride, sb, add, dst8);
376 for(y=0; y<b_h; y++){
378 const uint8_t *obmc1= obmc + y*obmc_stride;
379 const uint8_t *obmc2= obmc1+ (obmc_stride>>1);
380 const uint8_t *obmc3= obmc1+ obmc_stride*(obmc_stride>>1);
382 for(x=0; x<b_w; x++){
383 int v= obmc1[x] * block[3][x + y*src_stride]
384 +obmc2[x] * block[2][x + y*src_stride]
385 +obmc3[x] * block[1][x + y*src_stride]
386 +obmc4[x] * block[0][x + y*src_stride];
393 v += dst[x + y*dst_stride];
395 if(v&(~255)) v= ~(v>>31);
396 dst8[x + y*src_stride] =
v;
398 dst[x + y*dst_stride] -=
v;
411 int block_w = plane_index ? block_size>>s->
chroma_h_shift : block_size;
412 int block_h = plane_index ? block_size>>s->
chroma_v_shift : block_size;
414 const int obmc_stride= plane_index ? (2*block_size)>>s->
chroma_h_shift : 2*block_size;
425 for(y=block_h*mb_y; y<
FFMIN(h,block_h*(mb_y+1)); y++){
429 if(v&(~255)) v= ~(v>>31);
430 dst8[x + y*ref_stride]=
v;
434 for(y=block_h*mb_y; y<
FFMIN(h,block_h*(mb_y+1)); y++){
444 for(mb_x=0; mb_x<=mb_w; mb_x++){
446 block_w*mb_x - block_w/2,
447 block_h*mb_y - block_h/2,
450 w, ref_stride, obmc_stride,
452 add, 1, plane_index);
459 for(mb_y=0; mb_y<=mb_h; mb_y++)
463 static inline void set_blocks(
SnowContext *s,
int level,
int x,
int y,
int l,
int cb,
int cr,
int mx,
int my,
int ref,
int type){
466 const int index= (x + y*w) << rem_depth;
467 const int block_w= 1<<rem_depth;
468 const int block_h= 1<<rem_depth;
481 for(j=0; j<block_h; j++){
482 for(i=0; i<block_w; i++){
497 c->
src[0][i]= src [i];
498 c->
ref[0][i]= ref [i] + offset[i];
/* QEXPSHIFT evaluates to 15 - FRAC_BITS; FRAC_BITS is defined outside this excerpt. */
508 #define QEXPSHIFT (7-FRAC_BITS+8) //FIXME try to change this to 0
516 const int el=
FFMIN(e, 10);
527 for(i=e-1; i>=el; i--){
528 put_rac(c, state+22+9, (a>>i)&1);
531 put_rac(c, state+22+i, (a>>i)&1);
535 put_rac(c, state+11 + el, v < 0);
552 for(i=e-1; i>=0; i--){
563 int r= log2>=0 ? 1<<log2 : 1;
576 for(i=log2-1; i>=0; i--){
577 put_rac(c, state+31-i, (v>>i)&1);
583 int r= log2>=0 ? 1<<log2 : 1;
588 while(log2<28 &&
get_rac(c, state+4+log2)){
594 for(i=log2-1; i>=0; i--){
602 const int w= b->
width;
621 if(y && prev_xc->
x == 0){
633 if(prev_xc->
x == x + 1)
639 if(x>>1 > parent_xc->
x){
642 if(x>>1 == parent_xc->
x){
647 int context=
av_log2(3*(l>>1) + (lt>>1) + (
t&~1) + (rt>>1) + (p>>1));
671 if(y) max_run=
FFMIN(run, prev_xc->
x - x - 2);
672 else max_run=
FFMIN(run, w-x-1);
674 max_run=
FFMIN(max_run, 2*parent_xc->
x - x - 1);
688 while(parent_xc->
x != parent->
width+1)
691 prev_parent_xc= parent_xc;
693 parent_xc= prev_parent_xc;