1 /*
2 * VC3/DNxHD decoder.
3 * Copyright (c) 2007 SmartJog S.A., Baptiste Coudurier <baptiste dot coudurier at smartjog dot com>
4 * Copyright (c) 2011 MirriAd Ltd
5 * Copyright (c) 2015 Christophe Gisquet
6 *
7 * 10 bit support added by MirriAd Ltd, Joseph Artsimovich <joseph@mirriad.com>
8 * Slice multithreading and MB interlaced support added by Christophe Gisquet
9 *
10 * This file is part of FFmpeg.
11 *
12 * FFmpeg is free software; you can redistribute it and/or
13 * modify it under the terms of the GNU Lesser General Public
14 * License as published by the Free Software Foundation; either
15 * version 2.1 of the License, or (at your option) any later version.
16 *
17 * FFmpeg is distributed in the hope that it will be useful,
18 * but WITHOUT ANY WARRANTY; without even the implied warranty of
19 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20 * Lesser General Public License for more details.
21 *
22 * You should have received a copy of the GNU Lesser General Public
23 * License along with FFmpeg; if not, write to the Free Software
24 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
25 */
26
27 #include "libavutil/imgutils.h"
28 #include "libavutil/timer.h"
29 #include "avcodec.h"
30 #include "blockdsp.h"
31 #include "get_bits.h"
32 #include "dnxhddata.h"
33 #include "idctdsp.h"
34 #include "internal.h"
35 #include "profiles.h"
36 #include "thread.h"
37
/**
 * Per-worker decoding state.
 *
 * An array of these, sized by avctx->thread_count, is allocated at init time;
 * dnxhd_decode_row() picks the entry matching the thread number it is given.
 */
typedef struct RowContext {
    /** Coefficient blocks of the macroblock being decoded
     *  (8 are decoded for 4:2:2, 12 for 4:4:4). */
    DECLARE_ALIGNED(32, int16_t, blocks)[12][64];
    int luma_scale[64];   ///< qscale * luma weight, rebuilt when qscale changes
    int chroma_scale[64]; ///< qscale * chroma weight, rebuilt when qscale changes
    GetBitContext gb;     ///< bit reader positioned on the current row's data
    int last_dc[3];       ///< running DC value per component, reset at each row start
    int last_qscale;      ///< qscale the two scale tables were last built for
    int errors;           ///< failed rows counted by this worker; summed and cleared per frame
    /** -1:not set yet  0:off=RGB  1:on=YUV  2:variable */
    int format;
} RowContext;
49
/**
 * Decoder private context (AVCodecContext.priv_data).
 *
 * Most fields are refreshed from the bitstream by dnxhd_decode_header() for
 * every coding unit.
 */
typedef struct DNXHDContext {
    AVCodecContext *avctx;
    RowContext *rows;                   ///< avctx->thread_count per-worker states
    BlockDSPContext bdsp;
    const uint8_t* buf;                 ///< current coding unit data, starting at data_offset
    int buf_size;                       ///< bytes available from buf
    int64_t cid;                        ///< compression id
    unsigned int width, height;
    enum AVPixelFormat pix_fmt;
    unsigned int mb_width, mb_height;
    uint32_t mb_scan_index[512];        ///< per-row byte offsets read from the header, relative to data_offset
    int data_offset;                    // End of mb_scan_index, where macroblocks start
    int cur_field;                      ///< current interlaced field
    VLC ac_vlc, dc_vlc, run_vlc;        ///< tables built by dnxhd_init_vlc() for the current cid
    IDCTDSPContext idsp;
    ScanTable scantable;
    const CIDEntry *cid_table;          ///< table entry matching cid
    int bit_depth;                      // 8, 10, 12 or 0 if not initialized at all.
    int is_444;                         ///< header byte 0x2C, bit 6
    int alpha;                          ///< header byte 0x07, bit 0
    int lla;                            ///< header byte 0x07, bit 1
    int mbaff;                          ///< header byte 0x06, bit 5: per-macroblock interlace flag present
    int act;                            ///< header byte 0x2C, bit 0: adaptive color transform
    /** Coefficient decoder selected by dnxhd_decode_header() from the bit
     *  depth, chroma format and profile. */
    int (*decode_dct_block)(const struct DNXHDContext *ctx,
                            RowContext *row, int n);
} DNXHDContext;
76
/* Bit-width argument given to init_vlc() and GET_VLC() for the AC and run tables. */
#define DNXHD_VLC_BITS 9
/* Bit-width argument given to init_vlc() and GET_VLC() for the DC table. */
#define DNXHD_DC_VLC_BITS 7
79
/*
 * Forward declarations of the coefficient decoders: dnxhd_decode_header()
 * stores one of them in DNXHDContext.decode_dct_block before their
 * definitions appear further down in this file.
 */
static int dnxhd_decode_dct_block_8(const DNXHDContext *ctx,
                                    RowContext *row, int n);
static int dnxhd_decode_dct_block_10(const DNXHDContext *ctx,
                                     RowContext *row, int n);
static int dnxhd_decode_dct_block_10_444(const DNXHDContext *ctx,
                                         RowContext *row, int n);
static int dnxhd_decode_dct_block_12(const DNXHDContext *ctx,
                                     RowContext *row, int n);
static int dnxhd_decode_dct_block_12_444(const DNXHDContext *ctx,
                                         RowContext *row, int n);
90
dnxhd_decode_init(AVCodecContext * avctx)91 static av_cold int dnxhd_decode_init(AVCodecContext *avctx)
92 {
93 DNXHDContext *ctx = avctx->priv_data;
94
95 ctx->avctx = avctx;
96 ctx->cid = -1;
97 if (avctx->colorspace == AVCOL_SPC_UNSPECIFIED) {
98 avctx->colorspace = AVCOL_SPC_BT709;
99 }
100
101 avctx->coded_width = FFALIGN(avctx->width, 16);
102 avctx->coded_height = FFALIGN(avctx->height, 16);
103
104 ctx->rows = av_mallocz_array(avctx->thread_count, sizeof(RowContext));
105 if (!ctx->rows)
106 return AVERROR(ENOMEM);
107
108 return 0;
109 }
110
/**
 * Load the CID table entry and build the AC/DC/run VLC tables for a
 * compression id, unless that id is already the active one.
 *
 * While the tables are being rebuilt ctx->cid is set to -1, so that a failure
 * can never leave the context claiming a cid whose tables have been freed.
 * The per-row cached quantizer scale tables are invalidated as well, since
 * they were computed from the previous cid's weight matrices.
 *
 * @param ctx      decoder context
 * @param cid      compression id read from the frame header
 * @param bitdepth bit depth signalled by the frame header
 * @return 0 on success (or if nothing had to be done),
 *         AVERROR(ENOSYS) for an unknown cid,
 *         AVERROR_INVALIDDATA if the bit depth contradicts the cid,
 *         or the negative value returned by a failing init_vlc()
 */
static int dnxhd_init_vlc(DNXHDContext *ctx, uint32_t cid, int bitdepth)
{
    int index, ret, i;

    if (cid == ctx->cid)
        return 0;

    if ((index = ff_dnxhd_get_cid_table(cid)) < 0) {
        av_log(ctx->avctx, AV_LOG_ERROR, "unsupported cid %"PRIu32"\n", cid);
        return AVERROR(ENOSYS);
    }
    if (ff_dnxhd_cid_table[index].bit_depth != bitdepth &&
        ff_dnxhd_cid_table[index].bit_depth != DNXHD_VARIABLE) {
        av_log(ctx->avctx, AV_LOG_ERROR, "bit depth mismatches %d %d\n", ff_dnxhd_cid_table[index].bit_depth, bitdepth);
        return AVERROR_INVALIDDATA;
    }
    ctx->cid_table = &ff_dnxhd_cid_table[index];
    av_log(ctx->avctx, AV_LOG_VERBOSE, "Profile cid %"PRIu32".\n", cid);

    /* The old tables are about to go away: forget the old cid first so that
     * any failure below forces a full reload on the next header. */
    ctx->cid = -1;

    ff_free_vlc(&ctx->ac_vlc);
    ff_free_vlc(&ctx->dc_vlc);
    ff_free_vlc(&ctx->run_vlc);

    /* luma_scale/chroma_scale are only refreshed when qscale differs from
     * last_qscale; with new weight matrices they must be rebuilt even if
     * the next qscale happens to be the same. qscale is never negative. */
    if (ctx->rows) {
        for (i = 0; i < ctx->avctx->thread_count; i++)
            ctx->rows[i].last_qscale = -1;
    }

    if ((ret = init_vlc(&ctx->ac_vlc, DNXHD_VLC_BITS, 257,
                        ctx->cid_table->ac_bits, 1, 1,
                        ctx->cid_table->ac_codes, 2, 2, 0)) < 0)
        goto fail;
    if ((ret = init_vlc(&ctx->dc_vlc, DNXHD_DC_VLC_BITS, bitdepth > 8 ? 14 : 12,
                        ctx->cid_table->dc_bits, 1, 1,
                        ctx->cid_table->dc_codes, 1, 1, 0)) < 0)
        goto fail;
    if ((ret = init_vlc(&ctx->run_vlc, DNXHD_VLC_BITS, 62,
                        ctx->cid_table->run_bits, 1, 1,
                        ctx->cid_table->run_codes, 2, 2, 0)) < 0)
        goto fail;

    ctx->cid = cid;
    return 0;

fail:
    /* Drop whatever was partially built; ctx->cid is already -1. */
    ff_free_vlc(&ctx->ac_vlc);
    ff_free_vlc(&ctx->dc_vlc);
    ff_free_vlc(&ctx->run_vlc);
    av_log(ctx->avctx, AV_LOG_ERROR, "init_vlc failed\n");
    return ret;
}
146
dnxhd_decode_init_thread_copy(AVCodecContext * avctx)147 static av_cold int dnxhd_decode_init_thread_copy(AVCodecContext *avctx)
148 {
149 DNXHDContext *ctx = avctx->priv_data;
150
151 ctx->avctx = avctx;
152 // make sure VLC tables will be loaded when cid is parsed
153 ctx->cid = -1;
154
155 ctx->rows = av_mallocz_array(avctx->thread_count, sizeof(RowContext));
156 if (!ctx->rows)
157 return AVERROR(ENOMEM);
158
159 return 0;
160 }
161
dnxhd_get_profile(int cid)162 static int dnxhd_get_profile(int cid)
163 {
164 switch(cid) {
165 case 1270:
166 return FF_PROFILE_DNXHR_444;
167 case 1271:
168 return FF_PROFILE_DNXHR_HQX;
169 case 1272:
170 return FF_PROFILE_DNXHR_HQ;
171 case 1273:
172 return FF_PROFILE_DNXHR_SQ;
173 case 1274:
174 return FF_PROFILE_DNXHR_LB;
175 }
176 return FF_PROFILE_DNXHD;
177 }
178
/**
 * Parse and validate the header of one coding unit and update the decoder
 * context accordingly.
 *
 * Fills in the field/interlace state, flags, dimensions, bit depth, cid (and
 * VLC tables via dnxhd_init_vlc()), pixel format, coefficient decoder,
 * macroblock geometry, data offset and the per-row scan index table. Also
 * sets interlaced_frame, top_field_first and colorspace on @p frame.
 *
 * Note that the context is modified progressively, so on an error return it
 * may already hold values from the rejected header.
 *
 * @param ctx         decoder context
 * @param frame       frame whose properties are updated
 * @param buf         start of the coding unit
 * @param buf_size    number of bytes available at buf
 * @param first_field nonzero when parsing the first coding unit of a picture;
 *                    combined with the field bit to derive top_field_first
 * @return 0 on success, a negative AVERROR code otherwise
 */
static int dnxhd_decode_header(DNXHDContext *ctx, AVFrame *frame,
                               const uint8_t *buf, int buf_size,
                               int first_field)
{
    int i, cid, ret;
    int old_bit_depth = ctx->bit_depth, bitdepth;
    uint64_t header_prefix;
    /* All fixed-offset header fields read below lie within the first
     * 0x280 bytes. */
    if (buf_size < 0x280) {
        av_log(ctx->avctx, AV_LOG_ERROR,
               "buffer too small (%d < 640).\n", buf_size);
        return AVERROR_INVALIDDATA;
    }

    header_prefix = ff_dnxhd_parse_header_prefix(buf);
    if (header_prefix == 0) {
        av_log(ctx->avctx, AV_LOG_ERROR,
               "unknown header 0x%02X 0x%02X 0x%02X 0x%02X 0x%02X\n",
               buf[0], buf[1], buf[2], buf[3], buf[4]);
        return AVERROR_INVALIDDATA;
    }
    if (buf[5] & 2) { /* interlaced */
        ctx->cur_field = buf[5] & 1;
        frame->interlaced_frame = 1;
        frame->top_field_first  = first_field ^ ctx->cur_field;
        av_log(ctx->avctx, AV_LOG_DEBUG,
               "interlaced %d, cur field %d\n", buf[5] & 3, ctx->cur_field);
    } else {
        ctx->cur_field = 0;
    }
    ctx->mbaff = (buf[0x6] >> 5) & 1;
    ctx->alpha = buf[0x7] & 1;
    ctx->lla   = (buf[0x7] >> 1) & 1;
    /* Alpha is only reported, not rejected. */
    if (ctx->alpha)
        avpriv_request_sample(ctx->avctx, "alpha");

    ctx->height = AV_RB16(buf + 0x18);
    ctx->width  = AV_RB16(buf + 0x1a);

    /* Top three bits of byte 0x21 select the sample bit depth. */
    switch(buf[0x21] >> 5) {
    case 1: bitdepth = 8; break;
    case 2: bitdepth = 10; break;
    case 3: bitdepth = 12; break;
    default:
        av_log(ctx->avctx, AV_LOG_ERROR,
               "Unknown bitdepth indicator (%d)\n", buf[0x21] >> 5);
        return AVERROR_INVALIDDATA;
    }

    cid = AV_RB32(buf + 0x28);

    ctx->avctx->profile = dnxhd_get_profile(cid);

    /* Also sets ctx->cid_table, which the checks below rely on. */
    if ((ret = dnxhd_init_vlc(ctx, cid, bitdepth)) < 0)
        return ret;
    if (ctx->mbaff && ctx->cid_table->cid != 1260)
        av_log(ctx->avctx, AV_LOG_WARNING,
               "Adaptive MB interlace flag in an unsupported profile.\n");

    switch ((buf[0x2C] >> 1) & 3) {
    case 0: frame->colorspace = AVCOL_SPC_BT709;       break;
    case 1: frame->colorspace = AVCOL_SPC_BT2020_NCL;  break;
    case 2: frame->colorspace = AVCOL_SPC_BT2020_CL;   break;
    case 3: frame->colorspace = AVCOL_SPC_UNSPECIFIED; break;
    }

    ctx->act = buf[0x2C] & 1;
    if (ctx->act && ctx->cid_table->cid != 1256 && ctx->cid_table->cid != 1270)
        av_log(ctx->avctx, AV_LOG_WARNING,
               "Adaptive color transform in an unsupported profile.\n");

    /* Choose pixel format and coefficient decoder from chroma format,
     * bit depth and (for 10-bit 4:2:2) the profile. */
    ctx->is_444 = (buf[0x2C] >> 6) & 1;
    if (ctx->is_444) {
        if (bitdepth == 8) {
            avpriv_request_sample(ctx->avctx, "4:4:4 8 bits");
            return AVERROR_INVALIDDATA;
        } else if (bitdepth == 10) {
            ctx->decode_dct_block = dnxhd_decode_dct_block_10_444;
            ctx->pix_fmt = ctx->act ? AV_PIX_FMT_YUV444P10
                                    : AV_PIX_FMT_GBRP10;
        } else {
            ctx->decode_dct_block = dnxhd_decode_dct_block_12_444;
            ctx->pix_fmt = ctx->act ? AV_PIX_FMT_YUV444P12
                                    : AV_PIX_FMT_GBRP12;
        }
    } else if (bitdepth == 12) {
        ctx->decode_dct_block = dnxhd_decode_dct_block_12;
        ctx->pix_fmt = AV_PIX_FMT_YUV422P12;
    } else if (bitdepth == 10) {
        if (ctx->avctx->profile == FF_PROFILE_DNXHR_HQX)
            ctx->decode_dct_block = dnxhd_decode_dct_block_10_444;
        else
            ctx->decode_dct_block = dnxhd_decode_dct_block_10;
        ctx->pix_fmt = AV_PIX_FMT_YUV422P10;
    } else {
        ctx->decode_dct_block = dnxhd_decode_dct_block_8;
        ctx->pix_fmt = AV_PIX_FMT_YUV422P;
    }

    /* The DSP contexts are (re)initialized only when the bit depth changes;
     * this includes the very first header, where the old depth is 0. */
    ctx->avctx->bits_per_raw_sample = ctx->bit_depth = bitdepth;
    if (ctx->bit_depth != old_bit_depth) {
        ff_blockdsp_init(&ctx->bdsp, ctx->avctx);
        ff_idctdsp_init(&ctx->idsp, ctx->avctx);
        ff_init_scantable(ctx->idsp.idct_permutation, &ctx->scantable,
                          ff_zigzag_direct);
    }

    // make sure profile size constraints are respected
    // DNx100 allows 1920->1440 and 1280->960 subsampling
    if (ctx->width != ctx->cid_table->width &&
        ctx->cid_table->width != DNXHD_VARIABLE) {
        av_reduce(&ctx->avctx->sample_aspect_ratio.num,
                  &ctx->avctx->sample_aspect_ratio.den,
                  ctx->width, ctx->cid_table->width, 255);
        ctx->width = ctx->cid_table->width;
    }

    if (buf_size < ctx->cid_table->coding_unit_size) {
        av_log(ctx->avctx, AV_LOG_ERROR, "incorrect frame size (%d < %u).\n",
               buf_size, ctx->cid_table->coding_unit_size);
        return AVERROR_INVALIDDATA;
    }

    ctx->mb_width  = (ctx->width + 15)>> 4;
    ctx->mb_height = AV_RB16(buf + 0x16c);

    /* If the header height matches the macroblock row count of a single
     * field, double it to obtain the full-frame height. */
    if ((ctx->height + 15) >> 4 == ctx->mb_height && frame->interlaced_frame)
        ctx->height <<= 1;

    av_log(ctx->avctx, AV_LOG_VERBOSE, "%dx%d, 4:%s %d bits, MBAFF=%d ACT=%d\n",
           ctx->width, ctx->height, ctx->is_444 ? "4:4" : "2:2",
           ctx->bit_depth, ctx->mbaff, ctx->act);

    // Newer format supports variable mb_scan_index sizes
    if (ctx->mb_height > 68 && ff_dnxhd_check_header_prefix_hr(header_prefix)) {
        ctx->data_offset = 0x170 + (ctx->mb_height << 2);
    } else {
        if (ctx->mb_height > 68) {
            av_log(ctx->avctx, AV_LOG_ERROR,
                   "mb height too big: %d\n", ctx->mb_height);
            return AVERROR_INVALIDDATA;
        }
        ctx->data_offset = 0x280;
    }
    /* The rows of all fields together must fit in the picture height. */
    if ((ctx->mb_height << frame->interlaced_frame) > (ctx->height + 15) >> 4) {
        av_log(ctx->avctx, AV_LOG_ERROR,
                "mb height too big: %d\n", ctx->mb_height);
        return AVERROR_INVALIDDATA;
    }

    if (buf_size < ctx->data_offset) {
        av_log(ctx->avctx, AV_LOG_ERROR,
               "buffer too small (%d < %d).\n", buf_size, ctx->data_offset);
        return AVERROR_INVALIDDATA;
    }

    if (ctx->mb_height > FF_ARRAY_ELEMS(ctx->mb_scan_index)) {
        av_log(ctx->avctx, AV_LOG_ERROR,
               "mb_height too big (%d > %"SIZE_SPECIFIER").\n", ctx->mb_height, FF_ARRAY_ELEMS(ctx->mb_scan_index));
        return AVERROR_INVALIDDATA;
    }

    /* Read one 32-bit offset per macroblock row, starting at 0x170, and
     * reject any that points past the end of the payload. */
    for (i = 0; i < ctx->mb_height; i++) {
        ctx->mb_scan_index[i] = AV_RB32(buf + 0x170 + (i << 2));
        ff_dlog(ctx->avctx, "mb scan index %d, pos %d: %"PRIu32"\n",
                i, 0x170 + (i << 2), ctx->mb_scan_index[i]);
        if (buf_size - ctx->data_offset < ctx->mb_scan_index[i]) {
            av_log(ctx->avctx, AV_LOG_ERROR,
                   "invalid mb scan index (%"PRIu32" vs %u).\n",
                   ctx->mb_scan_index[i], buf_size - ctx->data_offset);
            return AVERROR_INVALIDDATA;
        }
    }

    return 0;
}
354
/**
 * Decode the coefficients of one 8x8 block into row->blocks[n].
 *
 * Shared implementation behind the bit-depth specific wrappers, which pass
 * constant values for the last four parameters.
 *
 * @param ctx         decoder context (VLC tables, cid table, scan table)
 * @param row         per-worker state: bit reader, DC predictors, scale tables
 * @param n           block index within the macroblock; also selects the
 *                    component and thus the scale/weight tables
 * @param index_bits  number of extra bits read for a level when flag bit 0 is set
 * @param level_bias  rounding bias added before the final shift (see below)
 * @param level_shift right shift applied to the scaled level
 * @param dc_shift    left shift (as a multiplication) applied to the DC delta
 * @return 0 on success, the negative DC VLC result if that lookup fails,
 *         or -1 if the coefficient index runs past 63
 */
static av_always_inline int dnxhd_decode_dct_block(const DNXHDContext *ctx,
                                                   RowContext *row,
                                                   int n,
                                                   int index_bits,
                                                   int level_bias,
                                                   int level_shift,
                                                   int dc_shift)
{
    int i, j, index1, index2, len, flags;
    int level, component, sign;
    const int *scale;
    const uint8_t *weight_matrix;
    const uint8_t *ac_info = ctx->cid_table->ac_info;
    int16_t *block = row->blocks[n];
    const int eob_index     = ctx->cid_table->eob_index;
    int ret = 0;
    OPEN_READER(bs, &row->gb);

    ctx->bdsp.clear_block(block);

    /* Map the block index to a component:
     * 4:2:2 -> blocks with bit 1 set are chroma (2,6 -> 1; 3,7 -> 2),
     *          the rest are luma;
     * 4:4:4 -> block pairs cycle through components 0, 1, 2. */
    if (!ctx->is_444) {
        if (n & 2) {
            component     = 1 + (n & 1);
            scale = row->chroma_scale;
            weight_matrix = ctx->cid_table->chroma_weight;
        } else {
            component     = 0;
            scale = row->luma_scale;
            weight_matrix = ctx->cid_table->luma_weight;
        }
    } else {
        component = (n >> 1) % 3;
        if (component) {
            scale = row->chroma_scale;
            weight_matrix = ctx->cid_table->chroma_weight;
        } else {
            scale = row->luma_scale;
            weight_matrix = ctx->cid_table->luma_weight;
        }
    }

    /* DC: the VLC yields the bit length of the delta that follows. */
    UPDATE_CACHE(bs, &row->gb);
    GET_VLC(len, bs, &row->gb, ctx->dc_vlc.table, DNXHD_DC_VLC_BITS, 1);
    if (len < 0) {
        ret = len;
        goto error;
    }
    if (len) {
        /* Turn the next len bits into a signed delta and accumulate it
         * into the component's running DC value. */
        level = GET_CACHE(bs, &row->gb);
        LAST_SKIP_BITS(bs, &row->gb, len);
        sign  = ~level >> 31;
        level = (NEG_USR32(sign ^ level, len) ^ sign) - sign;
        row->last_dc[component] += level * (1 << dc_shift);
    }
    block[0] = row->last_dc[component];

    i = 0;

    /* AC: loop until the end-of-block code is decoded. */
    UPDATE_CACHE(bs, &row->gb);
    GET_VLC(index1, bs, &row->gb, ctx->ac_vlc.table,
            DNXHD_VLC_BITS, 2);

    while (index1 != eob_index) {
        /* ac_info holds a (base level, flags) pair per AC code. */
        level = ac_info[2*index1+0];
        flags = ac_info[2*index1+1];

        /* SHOW_SBITS of one bit gives 0 or -1, used below as a sign mask. */
        sign = SHOW_SBITS(bs, &row->gb, 1);
        SKIP_BITS(bs, &row->gb, 1);

        /* Flag bit 0: extra high-order level bits follow. */
        if (flags & 1) {
            level += SHOW_UBITS(bs, &row->gb, index_bits) << 7;
            SKIP_BITS(bs, &row->gb, index_bits);
        }

        /* Flag bit 1: a run code follows; skip that many coefficients. */
        if (flags & 2) {
            UPDATE_CACHE(bs, &row->gb);
            GET_VLC(index2, bs, &row->gb, ctx->run_vlc.table,
                    DNXHD_VLC_BITS, 2);
            i += ctx->cid_table->run[index2];
        }

        if (++i > 63) {
            av_log(ctx->avctx, AV_LOG_ERROR, "ac tex damaged %d, %d\n", n, i);
            ret = -1;
            break;
        }

        /* Dequantize with rounding; the bias is skipped only when
         * level_bias >= 32 and the weight equals the bias. */
        j     = ctx->scantable.permutated[i];
        level *= scale[i];
        level += scale[i] >> 1;
        if (level_bias < 32 || weight_matrix[i] != level_bias)
            level += level_bias; // 1<<(level_shift-1)
        level >>= level_shift;

        /* Apply the sign mask (negates when sign == -1). */
        block[j] = (level ^ sign) - sign;

        UPDATE_CACHE(bs, &row->gb);
        GET_VLC(index1, bs, &row->gb, ctx->ac_vlc.table,
                DNXHD_VLC_BITS, 2);
    }
error:
    /* Always write the reader position back, also on the error paths. */
    CLOSE_READER(bs, &row->gb);
    return ret;
}
459
/** Coefficient decoder used for 8-bit streams. */
static int dnxhd_decode_dct_block_8(const DNXHDContext *ctx,
                                    RowContext *row, int n)
{
    enum { INDEX_BITS = 4, LEVEL_BIAS = 32, LEVEL_SHIFT = 6, DC_SHIFT = 0 };

    return dnxhd_decode_dct_block(ctx, row, n,
                                  INDEX_BITS, LEVEL_BIAS, LEVEL_SHIFT, DC_SHIFT);
}
465
/** Coefficient decoder used for 10-bit 4:2:2 streams outside the DNxHR HQX profile. */
static int dnxhd_decode_dct_block_10(const DNXHDContext *ctx,
                                     RowContext *row, int n)
{
    enum { INDEX_BITS = 6, LEVEL_BIAS = 8, LEVEL_SHIFT = 4, DC_SHIFT = 0 };

    return dnxhd_decode_dct_block(ctx, row, n,
                                  INDEX_BITS, LEVEL_BIAS, LEVEL_SHIFT, DC_SHIFT);
}
471
/** Coefficient decoder used for 10-bit 4:4:4 streams and for 10-bit DNxHR HQX. */
static int dnxhd_decode_dct_block_10_444(const DNXHDContext *ctx,
                                         RowContext *row, int n)
{
    enum { INDEX_BITS = 6, LEVEL_BIAS = 32, LEVEL_SHIFT = 6, DC_SHIFT = 0 };

    return dnxhd_decode_dct_block(ctx, row, n,
                                  INDEX_BITS, LEVEL_BIAS, LEVEL_SHIFT, DC_SHIFT);
}
477
/** Coefficient decoder used for 12-bit 4:2:2 streams. */
static int dnxhd_decode_dct_block_12(const DNXHDContext *ctx,
                                     RowContext *row, int n)
{
    enum { INDEX_BITS = 6, LEVEL_BIAS = 8, LEVEL_SHIFT = 4, DC_SHIFT = 2 };

    return dnxhd_decode_dct_block(ctx, row, n,
                                  INDEX_BITS, LEVEL_BIAS, LEVEL_SHIFT, DC_SHIFT);
}
483
/** Coefficient decoder used for 12-bit 4:4:4 streams. */
static int dnxhd_decode_dct_block_12_444(const DNXHDContext *ctx,
                                         RowContext *row, int n)
{
    enum { INDEX_BITS = 6, LEVEL_BIAS = 32, LEVEL_SHIFT = 4, DC_SHIFT = 2 };

    return dnxhd_decode_dct_block(ctx, row, n,
                                  INDEX_BITS, LEVEL_BIAS, LEVEL_SHIFT, DC_SHIFT);
}
489
/**
 * Decode one macroblock from the row's bitstream and write its pixels into
 * the frame.
 *
 * Reads the macroblock header (optional interlace flag, qscale, ACT flag),
 * refreshes the row's scale tables when qscale changed, decodes 8 (4:2:2) or
 * 12 (4:4:4) coefficient blocks and runs the inverse DCT straight into the
 * destination planes.
 *
 * @param ctx   decoder context
 * @param row   per-worker state holding the bit reader and block storage
 * @param frame destination frame
 * @param x     macroblock column
 * @param y     macroblock row
 * @return 0 on success, AVERROR_INVALIDDATA if any block fails to decode
 */
static int dnxhd_decode_macroblock(const DNXHDContext *ctx, RowContext *row,
                                   AVFrame *frame, int x, int y)
{
    /* Adds one to the shift of horizontal byte offsets for >= 10-bit formats. */
    int shift1 = ctx->bit_depth >= 10;
    int dct_linesize_luma   = frame->linesize[0];
    int dct_linesize_chroma = frame->linesize[1];
    uint8_t *dest_y, *dest_u, *dest_v;
    int dct_y_offset, dct_x_offset;
    int qscale, i, act;
    int interlaced_mb = 0;

    /* With MBAFF the first of the 11 header bits is the per-macroblock
     * interlace flag, leaving 10 bits of qscale. */
    if (ctx->mbaff) {
        interlaced_mb = get_bits1(&row->gb);
        qscale = get_bits(&row->gb, 10);
    } else {
        qscale = get_bits(&row->gb, 11);
    }
    act = get_bits1(&row->gb);
    if (act) {
        if (!ctx->act) {
            /* Warn only once per process; the flag is shared by all
             * decoder instances and threads. */
            static int act_warned;
            if (!act_warned) {
                act_warned = 1;
                av_log(ctx->avctx, AV_LOG_ERROR,
                       "ACT flag set, in violation of frame header.\n");
            }
        } else if (row->format == -1) {
            row->format = act;
        } else if (row->format != act) {
            row->format = 2; // Variable
        }
    }

    /* Scale tables are cached per row context and rebuilt only when the
     * quantizer scale differs from the previous macroblock's. */
    if (qscale != row->last_qscale) {
        for (i = 0; i < 64; i++) {
            row->luma_scale[i]   = qscale * ctx->cid_table->luma_weight[i];
            row->chroma_scale[i] = qscale * ctx->cid_table->chroma_weight[i];
        }
        row->last_qscale = qscale;
    }

    for (i = 0; i < 8 + 4 * ctx->is_444; i++) {
        if (ctx->decode_dct_block(ctx, row, i) < 0)
            return AVERROR_INVALIDDATA;
    }

    /* Fields are interleaved line by line: double the stride. */
    if (frame->interlaced_frame) {
        dct_linesize_luma   <<= 1;
        dct_linesize_chroma <<= 1;
    }

    dest_y = frame->data[0] + ((y * dct_linesize_luma)   << 4) + (x << (4 + shift1));
    dest_u = frame->data[1] + ((y * dct_linesize_chroma) << 4) + (x << (3 + shift1 + ctx->is_444));
    dest_v = frame->data[2] + ((y * dct_linesize_chroma) << 4) + (x << (3 + shift1 + ctx->is_444));

    /* The second field starts one line further down. */
    if (frame->interlaced_frame && ctx->cur_field) {
        dest_y += frame->linesize[0];
        dest_u += frame->linesize[1];
        dest_v += frame->linesize[2];
    }
    /* An interlaced macroblock doubles the stride once more and places its
     * lower blocks one picture line below instead of eight block lines. */
    if (interlaced_mb) {
        dct_linesize_luma   <<= 1;
        dct_linesize_chroma <<= 1;
    }

    dct_y_offset = interlaced_mb ? frame->linesize[0] : (dct_linesize_luma << 3);
    dct_x_offset = 8 << shift1;
    if (!ctx->is_444) {
        /* 4:2:2 block layout: Y = 0,1,4,5  U = 2,6  V = 3,7 */
        ctx->idsp.idct_put(dest_y,                               dct_linesize_luma, row->blocks[0]);
        ctx->idsp.idct_put(dest_y + dct_x_offset,                dct_linesize_luma, row->blocks[1]);
        ctx->idsp.idct_put(dest_y + dct_y_offset,                dct_linesize_luma, row->blocks[4]);
        ctx->idsp.idct_put(dest_y + dct_y_offset + dct_x_offset, dct_linesize_luma, row->blocks[5]);

        if (!(ctx->avctx->flags & AV_CODEC_FLAG_GRAY)) {
            dct_y_offset = interlaced_mb ? frame->linesize[1] : (dct_linesize_chroma << 3);
            ctx->idsp.idct_put(dest_u,                dct_linesize_chroma, row->blocks[2]);
            ctx->idsp.idct_put(dest_v,                dct_linesize_chroma, row->blocks[3]);
            ctx->idsp.idct_put(dest_u + dct_y_offset, dct_linesize_chroma, row->blocks[6]);
            ctx->idsp.idct_put(dest_v + dct_y_offset, dct_linesize_chroma, row->blocks[7]);
        }
    } else {
        /* 4:4:4 block layout: Y = 0,1,6,7  U = 2,3,8,9  V = 4,5,10,11 */
        ctx->idsp.idct_put(dest_y,                               dct_linesize_luma, row->blocks[0]);
        ctx->idsp.idct_put(dest_y + dct_x_offset,                dct_linesize_luma, row->blocks[1]);
        ctx->idsp.idct_put(dest_y + dct_y_offset,                dct_linesize_luma, row->blocks[6]);
        ctx->idsp.idct_put(dest_y + dct_y_offset + dct_x_offset, dct_linesize_luma, row->blocks[7]);

        if (!(ctx->avctx->flags & AV_CODEC_FLAG_GRAY)) {
            dct_y_offset = interlaced_mb ? frame->linesize[1] : (dct_linesize_chroma << 3);
            ctx->idsp.idct_put(dest_u,                               dct_linesize_chroma, row->blocks[2]);
            ctx->idsp.idct_put(dest_u + dct_x_offset,                dct_linesize_chroma, row->blocks[3]);
            ctx->idsp.idct_put(dest_u + dct_y_offset,                dct_linesize_chroma, row->blocks[8]);
            ctx->idsp.idct_put(dest_u + dct_y_offset + dct_x_offset, dct_linesize_chroma, row->blocks[9]);
            ctx->idsp.idct_put(dest_v,                               dct_linesize_chroma, row->blocks[4]);
            ctx->idsp.idct_put(dest_v + dct_x_offset,                dct_linesize_chroma, row->blocks[5]);
            ctx->idsp.idct_put(dest_v + dct_y_offset,                dct_linesize_chroma, row->blocks[10]);
            ctx->idsp.idct_put(dest_v + dct_y_offset + dct_x_offset, dct_linesize_chroma, row->blocks[11]);
        }
    }

    return 0;
}
591
/**
 * Worker callback run through avctx->execute2(): decode one macroblock row.
 *
 * Resets the DC predictors, points the worker's bit reader at the row's data
 * (located through mb_scan_index) and decodes every macroblock of the row.
 * Any failure increments the worker's error counter.
 *
 * @param avctx    codec context
 * @param data     destination frame (passed through as an opaque pointer)
 * @param rownb    macroblock row to decode
 * @param threadnb index of the RowContext to use
 * @return 0 on success, a negative error code otherwise
 */
static int dnxhd_decode_row(AVCodecContext *avctx, void *data,
                            int rownb, int threadnb)
{
    const DNXHDContext *ctx = avctx->priv_data;
    RowContext *row         = &ctx->rows[threadnb];
    uint32_t row_start      = ctx->mb_scan_index[rownb];
    int status, mb_x, c;

    /* for levels +2^(bitdepth-1) */
    for (c = 0; c < 3; c++)
        row->last_dc[c] = 1 << (ctx->bit_depth + 2);

    status = init_get_bits8(&row->gb, ctx->buf + row_start,
                            ctx->buf_size - row_start);

    /* Stop at the first macroblock that fails (or skip the loop entirely
     * if the bit reader could not be set up). */
    for (mb_x = 0; status >= 0 && mb_x < ctx->mb_width; mb_x++)
        status = dnxhd_decode_macroblock(ctx, row, data, mb_x, rownb);

    if (status < 0) {
        row->errors++;
        return status;
    }

    return 0;
}
620
/**
 * Decode callback: decode one packet into one picture.
 *
 * Parses the coding unit header, (re)configures the codec context, obtains a
 * frame buffer for the first field and decodes all macroblock rows through
 * avctx->execute2(). If the picture is flagged interlaced after the first
 * coding unit, the second one (coding_unit_size bytes further) is decoded
 * into the same frame.
 *
 * @param avctx     codec context
 * @param data      output AVFrame
 * @param got_frame set to 1 when a picture was produced
 * @param avpkt     input packet
 * @return the packet size on success, a negative AVERROR code on failure
 */
static int dnxhd_decode_frame(AVCodecContext *avctx, void *data,
                              int *got_frame, AVPacket *avpkt)
{
    const uint8_t *buf = avpkt->data;
    int buf_size = avpkt->size;
    DNXHDContext *ctx = avctx->priv_data;
    ThreadFrame frame = { .f = data };
    AVFrame *picture = data;
    int first_field = 1;
    int ret, i;

    ff_dlog(avctx, "frame size %d\n", buf_size);

    /* Forget the ACT state seen by each worker in the previous picture. */
    for (i = 0; i < avctx->thread_count; i++)
        ctx->rows[i].format = -1;

decode_coding_unit:
    if ((ret = dnxhd_decode_header(ctx, picture, buf, buf_size, first_field)) < 0)
        return ret;

    /* A change of size or pixel format makes this coding unit be treated
     * as a first field, so that a buffer is requested below. */
    if ((avctx->width || avctx->height) &&
        (ctx->width != avctx->width || ctx->height != avctx->height)) {
        av_log(avctx, AV_LOG_WARNING, "frame size changed: %dx%d -> %ux%u\n",
               avctx->width, avctx->height, ctx->width, ctx->height);
        first_field = 1;
    }
    if (avctx->pix_fmt != AV_PIX_FMT_NONE && avctx->pix_fmt != ctx->pix_fmt) {
        av_log(avctx, AV_LOG_WARNING, "pix_fmt changed: %s -> %s\n",
               av_get_pix_fmt_name(avctx->pix_fmt), av_get_pix_fmt_name(ctx->pix_fmt));
        first_field = 1;
    }

    avctx->pix_fmt = ctx->pix_fmt;
    ret = ff_set_dimensions(avctx, ctx->width, ctx->height);
    if (ret < 0)
        return ret;

    if (first_field) {
        if ((ret = ff_thread_get_buffer(avctx, &frame, 0)) < 0)
            return ret;
        picture->pict_type = AV_PICTURE_TYPE_I;
        picture->key_frame = 1;
    }

    /* Row offsets in mb_scan_index are relative to the end of the header.
     * The return value of execute2() is not used; failures are collected
     * through the per-worker error counters summed below. */
    ctx->buf_size = buf_size - ctx->data_offset;
    ctx->buf = buf + ctx->data_offset;
    avctx->execute2(avctx, dnxhd_decode_row, picture, NULL, ctx->mb_height);

    /* Interlaced picture: move on to the second coding unit. */
    if (first_field && picture->interlaced_frame) {
        buf      += ctx->cid_table->coding_unit_size;
        buf_size -= ctx->cid_table->coding_unit_size;
        first_field = 0;
        goto decode_coding_unit;
    }

    /* Sum and clear the per-worker error counters. */
    ret = 0;
    for (i = 0; i < avctx->thread_count; i++) {
        ret += ctx->rows[i].errors;
        ctx->rows[i].errors = 0;
    }

    if (ctx->act) {
        /* Warn only once per process. */
        static int act_warned;
        /* Merge the ACT state seen by the workers: any disagreement between
         * workers that ran makes the picture "variable". */
        int format = ctx->rows[0].format;
        for (i = 1; i < avctx->thread_count; i++) {
            if (ctx->rows[i].format != format &&
                ctx->rows[i].format != -1 /* not run */) {
                format = 2;
                break;
            }
        }
        switch (format) {
        case -1:
        case 2:
            if (!act_warned) {
                act_warned = 1;
                av_log(ctx->avctx, AV_LOG_ERROR,
                       "Unsupported: variable ACT flag.\n");
            }
            break;
        case 0:
            ctx->pix_fmt = ctx->bit_depth==10
                         ? AV_PIX_FMT_GBRP10 : AV_PIX_FMT_GBRP12;
            break;
        case 1:
            ctx->pix_fmt = ctx->bit_depth==10
                         ? AV_PIX_FMT_YUV444P10 : AV_PIX_FMT_YUV444P12;
            break;
        }
    }
    avctx->pix_fmt = ctx->pix_fmt;
    if (ret) {
        av_log(ctx->avctx, AV_LOG_ERROR, "%d lines with errors\n", ret);
        return AVERROR_INVALIDDATA;
    }

    *got_frame = 1;
    return avpkt->size;
}
720
dnxhd_decode_close(AVCodecContext * avctx)721 static av_cold int dnxhd_decode_close(AVCodecContext *avctx)
722 {
723 DNXHDContext *ctx = avctx->priv_data;
724
725 ff_free_vlc(&ctx->ac_vlc);
726 ff_free_vlc(&ctx->dc_vlc);
727 ff_free_vlc(&ctx->run_vlc);
728
729 av_freep(&ctx->rows);
730
731 return 0;
732 }
733
/*
 * Codec registration entry for the VC3/DNxHD decoder. It advertises direct
 * rendering plus both frame- and slice-level threading; the thread-copy
 * initializer is only wired in when threading support is compiled in.
 */
AVCodec ff_dnxhd_decoder = {
    .name           = "dnxhd",
    .long_name      = NULL_IF_CONFIG_SMALL("VC3/DNxHD"),
    .type           = AVMEDIA_TYPE_VIDEO,
    .id             = AV_CODEC_ID_DNXHD,
    .priv_data_size = sizeof(DNXHDContext),
    .init           = dnxhd_decode_init,
    .close          = dnxhd_decode_close,
    .decode         = dnxhd_decode_frame,
    .capabilities   = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS |
                      AV_CODEC_CAP_SLICE_THREADS,
    .init_thread_copy = ONLY_IF_THREADS_ENABLED(dnxhd_decode_init_thread_copy),
    .profiles       = NULL_IF_CONFIG_SMALL(ff_dnxhd_profiles),
};
748