3
* VP5 and VP6 compatible video decoder (common features)
5
* Copyright (C) 2006 Aurelien Jacobs <aurel@gnuage.org>
7
* This file is part of FFmpeg.
9
* FFmpeg is free software; you can redistribute it and/or
10
* modify it under the terms of the GNU Lesser General Public
11
* License as published by the Free Software Foundation; either
12
* version 2.1 of the License, or (at your option) any later version.
14
* FFmpeg is distributed in the hope that it will be useful,
15
* but WITHOUT ANY WARRANTY; without even the implied warranty of
16
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17
* Lesser General Public License for more details.
19
* You should have received a copy of the GNU Lesser General Public
20
* License along with FFmpeg; if not, write to the Free Software
21
* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
30
/**
 * Store the quantizer index in the context and derive the DC and AC
 * dequantization factors from it.
 *
 * Each factor is read from its lookup table (vp56_dc_dequant or
 * vp56_ac_dequant) at index `quantizer` and shifted left by two bits,
 * i.e. multiplied by 4. No range check on `quantizer` is visible here.
 *
 * @param s         decoder context to update
 * @param quantizer index into the dequantization tables
 */
void vp56_init_dequant(vp56_context_t *s, int quantizer)
32
s->quantizer = quantizer;
33
s->dequant_dc = vp56_dc_dequant[quantizer] << 2;
34
s->dequant_ac = vp56_ac_dequant[quantizer] << 2;
37
/**
 * Gather motion vector predictor candidates for the macroblock at
 * (row, col) from neighbouring macroblocks that use `ref_frame`.
 *
 * The 12 neighbour offsets come from vp56_candidate_predictor_pos. The
 * two-entry local array `vect` is copied to s->vector_candidate[0..1],
 * and the loop position is stored in s->vector_candidate_pos.
 *
 * NOTE(review): the declarations of nb_pred, pos, offset and mvp, the
 * statements controlled by the three `if` tests below, and the return
 * statement are not visible in this listing -- confirm against the
 * complete file before relying on this description.
 *
 * @param s         decoder context
 * @param row       macroblock row of the current macroblock
 * @param col       macroblock column of the current macroblock
 * @param ref_frame reference frame the candidates must match
 */
static int vp56_get_vectors_predictors(vp56_context_t *s, int row, int col,
38
vp56_frame_t ref_frame)
41
vp56_mv_t vect[2] = {{0,0}, {0,0}};
45
for (pos=0; pos<12; pos++) {
46
/* candidate position = current position + table offset */
mvp.x = col + vp56_candidate_predictor_pos[pos][0];
47
mvp.y = row + vp56_candidate_predictor_pos[pos][1];
48
/* test: candidate lies outside the macroblock grid */
if (mvp.x < 0 || mvp.x >= s->mb_width ||
49
mvp.y < 0 || mvp.y >= s->mb_height)
51
/* row-major index of the candidate in s->macroblocks */
offset = mvp.x + s->mb_width*mvp.y;
53
/* test: candidate's MB type maps to a different reference frame */
if (vp56_reference_frame[s->macroblocks[offset].type] != ref_frame)
55
/* test: candidate's vector equals vect[0] or is the zero vector */
if ((s->macroblocks[offset].mv.x == vect[0].x &&
56
s->macroblocks[offset].mv.y == vect[0].y) ||
57
(s->macroblocks[offset].mv.x == 0 &&
58
s->macroblocks[offset].mv.y == 0))
61
/* store the candidate's vector in the next free predictor slot */
vect[nb_pred++] = s->macroblocks[offset].mv;
66
s->vector_candidate_pos = pos;
69
/* publish both slots; a slot never written keeps its {0,0} initialiser */
s->vector_candidate[0] = vect[0];
70
s->vector_candidate[1] = vect[1];
75
/**
 * Update the macroblock type statistics from the bitstream and rebuild
 * the macroblock type probability model from them.
 *
 * First pass (3 contexts): optionally replaces s->mb_types_stats[ctx]
 * with one of the predefined sets in vp56_pre_def_mb_type_stats, then
 * optionally applies signed deltas to individual entries.
 * Second pass (3 contexts x 10 types): fills s->mb_type_model[ctx][type][0..9]
 * from the statistics.
 *
 * NOTE(review): the declarations of ctx, type, i and p[], the loop that
 * defines `i`, the condition selecting between the two `delta`
 * assignments, and the sums p02, p34, p0234, p17, p56, p89 and p5689 are
 * not visible in this listing -- confirm against the complete file.
 *
 * @param s decoder context; reads from the range coder s->c
 */
static void vp56_parse_mb_type_models(vp56_context_t *s)
77
vp56_range_coder_t *c = &s->c;
80
for (ctx=0; ctx<3; ctx++) {
81
if (vp56_rac_get_prob(c, 174)) {
82
/* 4-bit index selects a predefined statistics set, copied wholesale */
int idx = vp56_rac_gets(c, 4);
83
memcpy(s->mb_types_stats[ctx],vp56_pre_def_mb_type_stats[idx][ctx],
84
sizeof(s->mb_types_stats[ctx]));
86
if (vp56_rac_get_prob(c, 254)) {
87
for (type=0; type<10; type++) {
89
if (vp56_rac_get_prob(c, 205)) {
90
int delta, sign = vp56_rac_get(c);
92
delta = vp56_rac_get_tree(c, vp56_pmbtm_tree,
93
vp56_mb_type_model_model);
95
delta = 4 * vp56_rac_gets(c, 7);
96
/* (delta ^ -sign) + sign is -delta when sign is 1, delta when sign is 0 */
s->mb_types_stats[ctx][type][i] += (delta ^ -sign) + sign;
103
/* compute MB type probability tables based on previous MB type */
104
for (ctx=0; ctx<3; ctx++) {
107
/* per-type weight taken from the second statistic of each type */
for (type=0; type<10; type++)
108
p[type] = 100 * s->mb_types_stats[ctx][type][1];
110
for (type=0; type<10; type++) {
111
int p02, p34, p0234, p17, p56, p89, p5689, p156789;
113
/* conservative MB type probability */
114
s->mb_type_model[ctx][type][0] = 255 - (255 * s->mb_types_stats[ctx][type][0]) / (1 + s->mb_types_stats[ctx][type][0] + s->mb_types_stats[ctx][type][1]);
116
p[type] = 0; /* same MB type => weight is null */
118
/* binary tree parsing probabilities */
126
p156789 = p17 + p5689;
128
/* each entry is 1 + 255 * part / (1 + whole); the added 1 keeps the */
/* divisor non-zero when the summed weights are zero */
s->mb_type_model[ctx][type][1] = 1 + 255 * p0234/(1+p0234+p156789);
129
s->mb_type_model[ctx][type][2] = 1 + 255 * p02 / (1+p0234);
130
s->mb_type_model[ctx][type][3] = 1 + 255 * p17 / (1+p156789);
131
s->mb_type_model[ctx][type][4] = 1 + 255 * p[0] / (1+p02);
132
s->mb_type_model[ctx][type][5] = 1 + 255 * p[3] / (1+p34);
133
s->mb_type_model[ctx][type][6] = 1 + 255 * p[1] / (1+p17);
134
s->mb_type_model[ctx][type][7] = 1 + 255 * p56 / (1+p5689);
135
s->mb_type_model[ctx][type][8] = 1 + 255 * p[5] / (1+p56);
136
s->mb_type_model[ctx][type][9] = 1 + 255 * p[8] / (1+p89);
138
/* restore initial value */
139
p[type] = 100 * s->mb_types_stats[ctx][type][1];
144
/**
 * Decode a macroblock type from the range coder.
 *
 * The probability row is s->mb_type_model[ctx][prev_type]. One binary
 * decision is read with probability mb_type_model[0]; the visible return
 * path decodes the type with the vp56_pmbt_tree tree and the same row.
 *
 * NOTE(review): the statement controlled by the `if` is not visible in
 * this listing -- confirm against the complete file.
 *
 * @param s         decoder context; reads from the range coder s->c
 * @param prev_type macroblock type used to select the model row
 * @param ctx       context index used to select the model table
 * @return the decoded macroblock type
 */
static vp56_mb_t vp56_parse_mb_type(vp56_context_t *s,
145
vp56_mb_t prev_type, int ctx)
147
uint8_t *mb_type_model = s->mb_type_model[ctx][prev_type];
148
vp56_range_coder_t *c = &s->c;
150
if (vp56_rac_get_prob(c, mb_type_model[0]))
153
return vp56_rac_get_tree(c, vp56_pmbt_tree, mb_type_model);
156
/**
 * Decode the motion vectors of a macroblock coded with one vector per
 * luma block.
 *
 * A 2-bit type is read for each of the four luma blocks, then s->mv[0..3]
 * is filled according to that type: zero vector, a vector produced by
 * s->parse_vector_adjustment(), or one of the two entries of
 * s->vector_candidate. s->mv[3] is stored as the macroblock's vector in
 * s->macroblocks, and the chroma vectors s->mv[4] and s->mv[5] are derived
 * from the local `mv`.
 *
 * NOTE(review): the declarations of b and type[], the condition guarding
 * `type[b]++`, the `switch` header and its `break`s, the accumulation of
 * the luma vectors into `mv`, and the `else` between the two chroma
 * computations are not visible in this listing -- confirm against the
 * complete file.
 *
 * @param s   decoder context
 * @param row macroblock row
 * @param col macroblock column
 */
static void vp56_decode_4mv(vp56_context_t *s, int row, int col)
158
vp56_mv_t mv = {0,0};
162
/* parse each block type */
163
for (b=0; b<4; b++) {
164
type[b] = vp56_rac_gets(&s->c, 2);
166
type[b]++; /* only returns 0, 2, 3 or 4 (all INTER_PF) */
170
/* build the vector of each luma block from its type */
for (b=0; b<4; b++) {
172
case VP56_MB_INTER_NOVEC_PF:
173
s->mv[b] = (vp56_mv_t) {0,0};
175
case VP56_MB_INTER_DELTA_PF:
176
s->parse_vector_adjustment(s, &s->mv[b]);
178
case VP56_MB_INTER_V1_PF:
179
s->mv[b] = s->vector_candidate[0];
181
case VP56_MB_INTER_V2_PF:
182
s->mv[b] = s->vector_candidate[1];
189
/* this is the one selected for the whole MB for prediction */
190
s->macroblocks[row * s->mb_width + col].mv = s->mv[3];
192
/* chroma vectors are average luma vectors */
193
/* VP5 uses RSHIFT(.,2); the other visible form uses integer division by 4 */
if (s->avctx->codec->id == CODEC_ID_VP5) {
194
s->mv[4].x = s->mv[5].x = RSHIFT(mv.x,2);
195
s->mv[4].y = s->mv[5].y = RSHIFT(mv.y,2);
197
s->mv[4] = s->mv[5] = (vp56_mv_t) {mv.x/4, mv.y/4};
201
/**
 * Decode the type and motion vector(s) of the macroblock at (row, col).
 *
 * The predictors for the previous frame are gathered first and their
 * result is used as the context for vp56_parse_mb_type(). The decoded
 * type is stored in s->mb_type and in the macroblock's entry of
 * s->macroblocks. The switch then selects the vector source: a candidate
 * predictor, a parsed adjustment in `vect`, or vp56_decode_4mv(). The
 * golden-frame variants re-run the predictor search against
 * VP56_FRAME_GOLDEN before picking a candidate or parsing an adjustment.
 *
 * NOTE(review): the declaration of ctx, the `break`s, the assignments of
 * `mv` in the DELTA cases, the default case, the loop that copies the
 * vector to all blocks, and the return statement are not visible in this
 * listing -- confirm against the complete file.
 *
 * @param s   decoder context
 * @param row macroblock row
 * @param col macroblock column
 */
static vp56_mb_t vp56_decode_mv(vp56_context_t *s, int row, int col)
203
vp56_mv_t *mv, vect = {0,0};
206
ctx = vp56_get_vectors_predictors(s, row, col, VP56_FRAME_PREVIOUS);
207
/* the previously decoded type (s->mb_type) selects the model row */
s->mb_type = vp56_parse_mb_type(s, s->mb_type, ctx);
208
s->macroblocks[row * s->mb_width + col].type = s->mb_type;
210
switch (s->mb_type) {
211
case VP56_MB_INTER_V1_PF:
212
mv = &s->vector_candidate[0];
215
case VP56_MB_INTER_V2_PF:
216
mv = &s->vector_candidate[1];
219
case VP56_MB_INTER_V1_GF:
220
/* recompute the candidates against the golden frame */
vp56_get_vectors_predictors(s, row, col, VP56_FRAME_GOLDEN);
221
mv = &s->vector_candidate[0];
224
case VP56_MB_INTER_V2_GF:
225
vp56_get_vectors_predictors(s, row, col, VP56_FRAME_GOLDEN);
226
mv = &s->vector_candidate[1];
229
case VP56_MB_INTER_DELTA_PF:
230
s->parse_vector_adjustment(s, &vect);
234
case VP56_MB_INTER_DELTA_GF:
235
vp56_get_vectors_predictors(s, row, col, VP56_FRAME_GOLDEN);
236
s->parse_vector_adjustment(s, &vect);
240
case VP56_MB_INTER_4V:
241
vp56_decode_4mv(s, row, col);
249
/* remember the selected vector for this macroblock */
s->macroblocks[row*s->mb_width + col].mv = *mv;
251
/* same vector for all blocks */
258
/**
 * Add the predicted DC value to each of the six blocks of the current
 * macroblock, update the DC predictor state, and dequantize the DC.
 *
 * For each block the prediction looks at the left block (lb) and the
 * above block (ab), and for VP5 also at ab[-1] and ab[1], counting only
 * neighbours whose ref_frame equals `ref_frame`. s->prev_dc for the
 * block's plane and `ref_frame` is also read as a DC value.
 *
 * NOTE(review): the declarations of i, count and dc, the bodies of the
 * left/above tests, the count updates, and the condition under which
 * s->prev_dc is used are not visible in this listing -- confirm against
 * the complete file.
 *
 * @param s         decoder context
 * @param ref_frame reference frame of the current macroblock
 */
static void vp56_add_predictors_dc(vp56_context_t *s, vp56_frame_t ref_frame)
260
/* index of the first scan position in the permuted scan table */
int idx = s->scantable.permutated[0];
263
for (i=0; i<6; i++) {
264
vp56_ref_dc_t *ab = &s->above_blocks[s->above_block_idx[i]];
265
vp56_ref_dc_t *lb = &s->left_block[vp56_b6to4[i]];
269
if (ref_frame == lb->ref_frame) {
273
if (ref_frame == ab->ref_frame) {
277
if (s->avctx->codec->id == CODEC_ID_VP5) {
278
/* VP5 only: fall back on the neighbours of the above block */
if (count < 2 && ref_frame == ab[-1].ref_frame) {
279
dc += ab[-1].dc_coeff;
282
if (count < 2 && ref_frame == ab[1].ref_frame) {
283
dc += ab[1].dc_coeff;
288
dc = s->prev_dc[vp56_b6to3[i]][ref_frame];
292
s->block_coeff[i][idx] += dc;
293
/* the reconstructed (not yet dequantized) DC becomes the new predictor */
s->prev_dc[vp56_b6to3[i]][ref_frame] = s->block_coeff[i][idx];
294
ab->dc_coeff = s->block_coeff[i][idx];
295
ab->ref_frame = ref_frame;
296
lb->dc_coeff = s->block_coeff[i][idx];
297
lb->ref_frame = ref_frame;
298
s->block_coeff[i][idx] *= s->dequant_dc;
302
/**
 * Filter across one block edge, 12 positions long.
 *
 * At each position a correction `v` is computed from the four pixels
 * yuv[-2*pix_inc], yuv[-pix_inc], yuv[0] and yuv[pix_inc]. It is added to
 * the pixel before the edge and subtracted from the pixel at the edge,
 * and both results are clipped with av_clip_uint8().
 *
 * NOTE(review): `t` and `line_inc` are not used on any visible line, and
 * the declarations of i and v are not visible; any adjustment of `v` and
 * the advance of `yuv` between iterations are presumably on lines
 * missing from this listing -- confirm against the complete file.
 *
 * @param s        decoder context
 * @param yuv      pointer to the pixel at the edge
 * @param pix_inc  step between pixels across the edge
 * @param line_inc step along the edge
 * @param t        filter threshold
 */
static void vp56_edge_filter(vp56_context_t *s, uint8_t *yuv,
303
int pix_inc, int line_inc, int t)
305
int pix2_inc = 2 * pix_inc;
308
for (i=0; i<12; i++) {
309
/* +4 before >>3 rounds the division by 8 */
v = (yuv[-pix2_inc] + 3*(yuv[0]-yuv[-pix_inc]) - yuv[pix_inc] + 4) >>3;
311
yuv[-pix_inc] = av_clip_uint8(yuv[-pix_inc] + v);
312
yuv[0] = av_clip_uint8(yuv[0] - v);
317
/**
 * Run the edge filter on a copied source block where the block straddles
 * an edge.
 *
 * The threshold is looked up in vp56_filter_threshold by the current
 * quantizer. When dx is non-zero the edge at column 10-dx is filtered
 * (pixel step 1, line step `stride`). When dy is non-zero the edge at
 * row 10-dy is filtered (pixel step `stride`, line step 1).
 *
 * @param s      decoder context
 * @param yuv    start of the source block
 * @param stride line size of the source block
 * @param dx     horizontal offset; 0 disables the column pass
 * @param dy     vertical offset; 0 disables the row pass
 */
static void vp56_deblock_filter(vp56_context_t *s, uint8_t *yuv,
318
int stride, int dx, int dy)
320
int t = vp56_filter_threshold[s->quantizer];
321
if (dx) vp56_edge_filter(s, yuv + 10-dx , 1, stride, t);
322
if (dy) vp56_edge_filter(s, yuv + stride*(10-dy), stride, 1, t);
325
/**
 * Motion-compensate block `b` of the current macroblock into the current
 * frame.
 *
 * The integer part of the block's vector (dx, dy) selects the source
 * position. The source is read in one of three ways:
 *  - through ff_emulated_edge_mc() into s->edge_emu_buffer when the
 *    12x12 area is not fully inside the plane,
 *  - copied into s->edge_emu_buffer when deblocking is enabled,
 *  - directly from `src` otherwise.
 * Deblocking is applied to the copy when enabled. The prediction is then
 * written to `dst` with s->filter(), a two-source average, or a plain
 * 8-line copy.
 *
 * NOTE(review): the declarations of src_block, src_offset, dx and dy, the
 * adjustment of x and y by dx and dy, the remaining arguments of two dsp
 * calls, the final `else` branch that reads from `src`, and the
 * conditions selecting between s->filter(), put_no_rnd_pixels_l2 and
 * put_pixels_tab are not visible in this listing -- confirm against the
 * complete file.
 *
 * @param s      decoder context
 * @param b      block index within the macroblock (0..5)
 * @param src    plane data of the reference frame
 * @param stride line size of the plane
 * @param x      horizontal position of the block
 * @param y      vertical position of the block
 */
static void vp56_mc(vp56_context_t *s, int b, uint8_t *src,
326
int stride, int x, int y)
328
int plane = vp56_b6to3[b];
329
uint8_t *dst=s->framep[VP56_FRAME_CURRENT]->data[plane]+s->block_offset[b];
332
int overlap_offset = 0;
333
/* mask of the fractional bits of a vector component for this block */
int mask = s->vp56_coord_div[b] - 1;
334
int deblock_filtering = s->deblock_filtering;
338
/* honour the caller's skip_loop_filter setting */
if (s->avctx->skip_loop_filter >= AVDISCARD_ALL ||
339
(s->avctx->skip_loop_filter >= AVDISCARD_NONKEY
340
&& !s->framep[VP56_FRAME_CURRENT]->key_frame))
341
deblock_filtering = 0;
343
/* integer part of the vector */
dx = s->mv[b].x / s->vp56_coord_div[b];
344
dy = s->mv[b].y / s->vp56_coord_div[b];
353
/* source area reaches outside the plane: build it with edge emulation */
if (x<0 || x+12>=s->plane_width[plane] ||
354
y<0 || y+12>=s->plane_height[plane]) {
355
ff_emulated_edge_mc(s->edge_emu_buffer,
356
src + s->block_offset[b] + (dy-2)*stride + (dx-2),
357
stride, 12, 12, x, y,
358
s->plane_width[plane],
359
s->plane_height[plane]);
360
src_block = s->edge_emu_buffer;
361
/* the copy starts 2 pixels left of and 2 lines above the block */
src_offset = 2 + 2*stride;
362
} else if (deblock_filtering) {
363
/* only need a 12x12 block, but there is no such dsp function, */
364
/* so copy a 16x12 block */
365
s->dsp.put_pixels_tab[0][0](s->edge_emu_buffer,
366
src + s->block_offset[b] + (dy-2)*stride + (dx-2),
368
src_block = s->edge_emu_buffer;
369
src_offset = 2 + 2*stride;
372
src_offset = s->block_offset[b] + dy*stride + dx;
375
if (deblock_filtering)
376
vp56_deblock_filter(s, src_block, stride, dx&7, dy&7);
378
/* a fractional component adds one step, in the vector's direction, */
/* to the offset of the second source block */
if (s->mv[b].x & mask)
379
overlap_offset += (s->mv[b].x > 0) ? 1 : -1;
380
if (s->mv[b].y & mask)
381
overlap_offset += (s->mv[b].y > 0) ? stride : -stride;
383
if (overlap_offset) {
385
s->filter(s, dst, src_block, src_offset, src_offset+overlap_offset,
386
stride, s->mv[b], mask, s->filter_selection, b<4);
388
s->dsp.put_no_rnd_pixels_l2[1](dst, src_block+src_offset,
389
src_block+src_offset+overlap_offset,
392
s->dsp.put_pixels_tab[1][0](dst, src_block+src_offset, stride, 8);
396
/**
 * Decode and reconstruct the macroblock at (row, col).
 *
 * The macroblock type is VP56_MB_INTRA on key frames and is decoded with
 * vp56_decode_mv() otherwise. The coefficient buffer is cleared, DC
 * prediction is applied, and the six blocks are reconstructed by type:
 *  - idct_put for the first visible loop,
 *  - copy from the reference frame plus idct_add for the NOVEC types,
 *  - vp56_mc() plus idct_add for the remaining inter types.
 *
 * NOTE(review): the declarations of mb_type, b, plan and off, the `else`
 * before vp56_decode_mv(), the coefficient parsing call, the `switch`
 * header with the case label of the first loop, the `break`s, and the
 * remaining put_pixels_tab arguments are not visible in this listing --
 * confirm against the complete file.
 *
 * NOTE(review): vp56_mc() is given 16*col and 16*row for every block,
 * including the chroma blocks (b = 4, 5). vp56_mc() compares x and y with
 * s->plane_width[plane] and s->plane_height[plane], which
 * vp56_size_changed() sets to half the coded size for planes 1 and 2.
 * Confirm that luma-scale coordinates are intended for chroma.
 *
 * @param s   decoder context
 * @param row macroblock row
 * @param col macroblock column
 */
static void vp56_decode_mb(vp56_context_t *s, int row, int col)
398
AVFrame *frame_current, *frame_ref;
400
vp56_frame_t ref_frame;
403
if (s->framep[VP56_FRAME_CURRENT]->key_frame)
404
mb_type = VP56_MB_INTRA;
406
mb_type = vp56_decode_mv(s, row, col);
407
ref_frame = vp56_reference_frame[mb_type];
409
memset(s->block_coeff, 0, sizeof(s->block_coeff));
413
vp56_add_predictors_dc(s, ref_frame);
415
frame_current = s->framep[VP56_FRAME_CURRENT];
416
frame_ref = s->framep[ref_frame];
420
/* write the inverse transform straight into the current frame */
for (b=0; b<6; b++) {
421
plan = vp56_b6to3[b];
422
s->dsp.idct_put(frame_current->data[plan] + s->block_offset[b],
423
s->stride[plan], s->block_coeff[b]);
427
case VP56_MB_INTER_NOVEC_PF:
428
case VP56_MB_INTER_NOVEC_GF:
429
/* same offset in both frames, then add the residual */
for (b=0; b<6; b++) {
430
plan = vp56_b6to3[b];
431
off = s->block_offset[b];
432
s->dsp.put_pixels_tab[1][0](frame_current->data[plan] + off,
433
frame_ref->data[plan] + off,
435
s->dsp.idct_add(frame_current->data[plan] + off,
436
s->stride[plan], s->block_coeff[b]);
440
case VP56_MB_INTER_DELTA_PF:
441
case VP56_MB_INTER_V1_PF:
442
case VP56_MB_INTER_V2_PF:
443
case VP56_MB_INTER_DELTA_GF:
444
case VP56_MB_INTER_4V:
445
case VP56_MB_INTER_V1_GF:
446
case VP56_MB_INTER_V2_GF:
447
for (b=0; b<6; b++) {
448
/* blocks 1 and 3 are 8 pixels to the right, blocks 2 and 3 are 8 lines down */
int x_off = b==1 || b==3 ? 8 : 0;
449
int y_off = b==2 || b==3 ? 8 : 0;
450
plan = vp56_b6to3[b];
451
vp56_mc(s, b, frame_ref->data[plan], s->stride[plan],
452
16*col+x_off, 16*row+y_off);
453
s->dsp.idct_add(frame_current->data[plan] + s->block_offset[b],
454
s->stride[plan], s->block_coeff[b]);
460
/**
 * Recompute the size-dependent state and reallocate the per-frame
 * buffers after the coded dimensions changed.
 *
 * Sets the plane sizes (planes 1 and 2 are half the coded size), the
 * per-plane strides (line size multiplied by s->flip), and the
 * macroblock grid size (coded size rounded up to a multiple of 16).
 * Grids wider or taller than 1000 macroblocks are reported with
 * "picture too big". s->above_blocks, s->macroblocks and the edge
 * emulation buffer are then (re)allocated.
 *
 * NOTE(review): the declaration of i and its loop, the statements that
 * follow the av_log() call, the condition before the final pointer
 * adjustment, and the return statements are not visible in this listing.
 *
 * NOTE(review): no check of the av_realloc() / av_malloc() results is
 * visible here, and the av_realloc() results are assigned straight over
 * the old pointers -- confirm how allocation failure is handled.
 *
 * @param avctx codec context, used for logging
 * @param s     decoder context to update
 */
static int vp56_size_changed(AVCodecContext *avctx, vp56_context_t *s)
462
int stride = s->framep[VP56_FRAME_CURRENT]->linesize[0];
465
s->plane_width[0] = s->avctx->coded_width;
466
s->plane_width[1] = s->plane_width[2] = s->avctx->coded_width/2;
467
s->plane_height[0] = s->avctx->coded_height;
468
s->plane_height[1] = s->plane_height[2] = s->avctx->coded_height/2;
471
s->stride[i] = s->flip * s->framep[VP56_FRAME_CURRENT]->linesize[i];
473
/* number of 16x16 macroblocks, rounding the size up */
s->mb_width = (s->avctx->coded_width+15) / 16;
474
s->mb_height = (s->avctx->coded_height+15) / 16;
476
if (s->mb_width > 1000 || s->mb_height > 1000) {
477
av_log(avctx, AV_LOG_ERROR, "picture too big\n");
481
/* 4*mb_width+6 entries; vp56_decode_frame() initialises the same count */
s->above_blocks = av_realloc(s->above_blocks,
482
(4*s->mb_width+6) * sizeof(*s->above_blocks));
483
/* one entry per macroblock */
s->macroblocks = av_realloc(s->macroblocks,
484
s->mb_width*s->mb_height*sizeof(*s->macroblocks));
485
/* the edge emulation buffer holds 16 lines of the luma line size */
av_free(s->edge_emu_buffer_alloc);
486
s->edge_emu_buffer_alloc = av_malloc(16*stride);
487
s->edge_emu_buffer = s->edge_emu_buffer_alloc;
489
s->edge_emu_buffer += 15 * stride;
494
/**
 * Decode one frame.
 *
 * Visible steps, in order:
 *  1. parse the frame header through s->parse_header();
 *  2. get a buffer for the current frame, and update size-dependent
 *     state through vp56_size_changed();
 *  3. set the picture type and initialise or parse the probability
 *     models;
 *  4. reset the DC predictors and the above-block row;
 *  5. decode every macroblock row by row, maintaining the block offsets
 *     and above-block indices;
 *  6. rotate the previous / golden / current frame pointers and release
 *     frames that are no longer referenced;
 *  7. copy the decoded frame to `data` and set *data_size.
 *
 * NOTE(review): the declaration of res, every error-return statement, the
 * conditions around header/size handling, the key-frame test selecting
 * between the I and P branches, the flip test selecting between the two
 * mb_row_flip assignments, and the final return are not visible in this
 * listing -- confirm against the complete file.
 *
 * @param avctx     codec context
 * @param data      output; receives a copy of the decoded AVFrame
 * @param data_size output; set to sizeof(AVFrame)
 * @param buf       input bitstream
 * @param buf_size  size of the input bitstream in bytes
 */
int vp56_decode_frame(AVCodecContext *avctx, void *data, int *data_size,
495
uint8_t *buf, int buf_size)
497
vp56_context_t *s = avctx->priv_data;
498
AVFrame *const p = s->framep[VP56_FRAME_CURRENT];
499
int mb_row, mb_col, mb_row_flip, mb_offset = 0;
500
int block, y, uv, stride_y, stride_uv;
501
int golden_frame = 0;
504
res = s->parse_header(s, buf, buf_size, &golden_frame);
509
if (avctx->get_buffer(avctx, p) < 0) {
510
av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n");
515
/* give the buffer back when the size update reports failure */
if (vp56_size_changed(avctx, s)) {
516
avctx->release_buffer(avctx, p);
521
/* I-frame path: default models, every macroblock marked intra */
p->pict_type = FF_I_TYPE;
522
s->default_models_init(s);
523
for (block=0; block<s->mb_height*s->mb_width; block++)
524
s->macroblocks[block].type = VP56_MB_INTRA;
526
/* P-frame path: models are read from the bitstream */
p->pict_type = FF_P_TYPE;
527
vp56_parse_mb_type_models(s);
528
s->parse_vector_models(s);
529
s->mb_type = VP56_MB_INTER_NOVEC_PF;
532
s->parse_coeff_models(s);
534
/* DC predictors start at 0, except planes 1 and 2 of the current frame */
memset(s->prev_dc, 0, sizeof(s->prev_dc));
535
s->prev_dc[1][VP56_FRAME_CURRENT] = 128;
536
s->prev_dc[2][VP56_FRAME_CURRENT] = 128;
538
/* reset the whole above-block row */
for (block=0; block < 4*s->mb_width+6; block++) {
539
s->above_blocks[block].ref_frame = -1;
540
s->above_blocks[block].dc_coeff = 0;
541
s->above_blocks[block].not_null_dc = 0;
543
/* the entries just before the first entry of blocks 4 and 5 get ref_frame 0 */
s->above_blocks[2*s->mb_width + 2].ref_frame = 0;
544
s->above_blocks[3*s->mb_width + 4].ref_frame = 0;
546
stride_y = p->linesize[0];
547
stride_uv = p->linesize[1];
552
/* main macroblocks loop */
553
for (mb_row=0; mb_row<s->mb_height; mb_row++) {
555
mb_row_flip = s->mb_height - mb_row - 1;
557
mb_row_flip = mb_row;
559
/* reset the left-block state at the start of each row */
for (block=0; block<4; block++) {
560
s->left_block[block].ref_frame = -1;
561
s->left_block[block].dc_coeff = 0;
562
s->left_block[block].not_null_dc = 0;
563
memset(s->coeff_ctx[block], 0, 64*sizeof(s->coeff_ctx[block][0]));
565
memset(s->coeff_ctx_last, 24, sizeof(s->coeff_ctx_last));
567
/* above-block indices for the first macroblock of the row */
s->above_block_idx[0] = 1;
568
s->above_block_idx[1] = 2;
569
s->above_block_idx[2] = 1;
570
s->above_block_idx[3] = 2;
571
s->above_block_idx[4] = 2*s->mb_width + 2 + 1;
572
s->above_block_idx[5] = 3*s->mb_width + 4 + 1;
574
/* byte offsets of the six blocks of the first macroblock of the row; */
/* s->frbi and s->srbi name the first- and second-row luma block indices */
s->block_offset[s->frbi] = (mb_row_flip*16 + mb_offset) * stride_y;
575
s->block_offset[s->srbi] = s->block_offset[s->frbi] + 8*stride_y;
576
s->block_offset[1] = s->block_offset[0] + 8;
577
s->block_offset[3] = s->block_offset[2] + 8;
578
s->block_offset[4] = (mb_row_flip*8 + mb_offset) * stride_uv;
579
s->block_offset[5] = s->block_offset[4];
581
for (mb_col=0; mb_col<s->mb_width; mb_col++) {
582
vp56_decode_mb(s, mb_row, mb_col);
584
/* advance to the next macroblock: 2 luma blocks / 16 pixels ... */
for (y=0; y<4; y++) {
585
s->above_block_idx[y] += 2;
586
s->block_offset[y] += 16;
589
/* ... and 1 chroma block / 8 pixels */
for (uv=4; uv<6; uv++) {
590
s->above_block_idx[uv] += 1;
591
s->block_offset[uv] += 8;
596
/* previous frame is also the golden frame: keep it, reuse the spare slot */
if (s->framep[VP56_FRAME_PREVIOUS] == s->framep[VP56_FRAME_GOLDEN])
597
FFSWAP(AVFrame *, s->framep[VP56_FRAME_PREVIOUS],
598
s->framep[VP56_FRAME_UNUSED]);
599
else if (s->framep[VP56_FRAME_PREVIOUS]->data[0])
600
avctx->release_buffer(avctx, s->framep[VP56_FRAME_PREVIOUS]);
601
/* key frames and flagged frames become the new golden frame */
if (p->key_frame || golden_frame) {
602
if (s->framep[VP56_FRAME_GOLDEN]->data[0])
603
avctx->release_buffer(avctx, s->framep[VP56_FRAME_GOLDEN]);
604
s->framep[VP56_FRAME_GOLDEN] = p;
606
/* the frame just decoded becomes the previous frame */
FFSWAP(AVFrame *, s->framep[VP56_FRAME_CURRENT],
607
s->framep[VP56_FRAME_PREVIOUS]);
609
*(AVFrame*)data = *p;
610
*data_size = sizeof(AVFrame);
615
/**
 * Initialise the common VP5/VP6 decoder state.
 *
 * Sets the pixel format to PIX_FMT_YUV420P, selects FF_IDCT_VP3 when the
 * IDCT algorithm is left on FF_IDCT_AUTO, initialises the dsp functions
 * and the scan table, sets the dimensions to 0x0, points the frame slots
 * at s->frames, clears the buffer pointers that vp56_size_changed()
 * allocates, and enables deblock filtering.
 *
 * NOTE(review): the declaration of i and its loop, the assignment of
 * s->avctx, and any use of `flip` are not visible in this listing --
 * confirm against the complete file.
 *
 * @param s     decoder context to initialise
 * @param avctx codec context
 * @param flip  not used on any visible line
 */
void vp56_init(vp56_context_t *s, AVCodecContext *avctx, int flip)
620
avctx->pix_fmt = PIX_FMT_YUV420P;
622
if (s->avctx->idct_algo == FF_IDCT_AUTO)
623
s->avctx->idct_algo = FF_IDCT_VP3;
624
dsputil_init(&s->dsp, s->avctx);
625
ff_init_scantable(s->dsp.idct_permutation, &s->scantable,ff_zigzag_direct);
627
avcodec_set_dimensions(s->avctx, 0, 0);
630
s->framep[i] = &s->frames[i];
631
/* the spare slot starts out aliasing the golden frame */
s->framep[VP56_FRAME_UNUSED] = s->framep[VP56_FRAME_GOLDEN];
632
/* NULL so the first av_free() / av_realloc() on these pointers is valid */
s->edge_emu_buffer_alloc = NULL;
634
s->above_blocks = NULL;
635
s->macroblocks = NULL;
637
s->deblock_filtering = 1;
652
/**
 * Free the decoder's buffers and release the reference frames it still
 * holds.
 *
 * The golden frame is released only when it has data and is not the same
 * frame as the previous one, so a shared frame is released once.
 *
 * NOTE(review): the return statement is not visible in this listing.
 *
 * @param avctx codec context whose priv_data is the decoder context
 */
int vp56_free(AVCodecContext *avctx)
654
vp56_context_t *s = avctx->priv_data;
656
av_free(s->above_blocks);
657
av_free(s->macroblocks);
658
av_free(s->edge_emu_buffer_alloc);
659
if (s->framep[VP56_FRAME_GOLDEN]->data[0]
660
&& (s->framep[VP56_FRAME_PREVIOUS] != s->framep[VP56_FRAME_GOLDEN]))
661
avctx->release_buffer(avctx, s->framep[VP56_FRAME_GOLDEN]);
662
if (s->framep[VP56_FRAME_PREVIOUS]->data[0])
663
avctx->release_buffer(avctx, s->framep[VP56_FRAME_PREVIOUS]);