1 /*
2 * VC3/DNxHD decoder.
3 * Copyright (c) 2007 SmartJog S.A., Baptiste Coudurier <baptiste dot coudurier at smartjog dot com>
4 * Copyright (c) 2011 MirriAd Ltd
5 * Copyright (c) 2015 Christophe Gisquet
6 *
7 * 10 bit support added by MirriAd Ltd, Joseph Artsimovich <joseph@mirriad.com>
8 * Slice multithreading and MB interlaced support added by Christophe Gisquet
9 *
10 * This file is part of FFmpeg.
11 *
12 * FFmpeg is free software; you can redistribute it and/or
13 * modify it under the terms of the GNU Lesser General Public
14 * License as published by the Free Software Foundation; either
15 * version 2.1 of the License, or (at your option) any later version.
16 *
17 * FFmpeg is distributed in the hope that it will be useful,
18 * but WITHOUT ANY WARRANTY; without even the implied warranty of
19 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20 * Lesser General Public License for more details.
21 *
22 * You should have received a copy of the GNU Lesser General Public
23 * License along with FFmpeg; if not, write to the Free Software
24 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
25 */
26
27 #include "libavutil/imgutils.h"
28 #include "libavutil/timer.h"
29 #include "avcodec.h"
30 #include "blockdsp.h"
31 #define UNCHECKED_BITSTREAM_READER 1
32 #include "get_bits.h"
33 #include "dnxhddata.h"
34 #include "idctdsp.h"
35 #include "internal.h"
36 #include "profiles.h"
37 #include "thread.h"
38
39 typedef struct RowContext {
40 DECLARE_ALIGNED(16, int16_t, blocks)[12][64];
41 int luma_scale[64];
42 int chroma_scale[64];
43 GetBitContext gb;
44 int last_dc[3];
45 int last_qscale;
46 int errors;
47 /** -1:not set yet 0:off=RGB 1:on=YUV 2:variable */
48 int format;
49 } RowContext;
50
51 typedef struct DNXHDContext {
52 AVCodecContext *avctx;
53 RowContext *rows;
54 BlockDSPContext bdsp;
55 const uint8_t* buf;
56 int buf_size;
57 int64_t cid; ///< compression id
58 unsigned int width, height;
59 enum AVPixelFormat pix_fmt;
60 unsigned int mb_width, mb_height;
61 uint32_t mb_scan_index[512];
62 int data_offset; // End of mb_scan_index, where macroblocks start
63 int cur_field; ///< current interlaced field
64 VLC ac_vlc, dc_vlc, run_vlc;
65 IDCTDSPContext idsp;
66 ScanTable scantable;
67 const CIDEntry *cid_table;
68 int bit_depth; // 8, 10, 12 or 0 if not initialized at all.
69 int is_444;
70 int alpha;
71 int lla;
72 int mbaff;
73 int act;
74 int (*decode_dct_block)(const struct DNXHDContext *ctx,
75 RowContext *row, int n);
76 } DNXHDContext;
77
78 #define DNXHD_VLC_BITS 9
79 #define DNXHD_DC_VLC_BITS 7
80
81 static int dnxhd_decode_dct_block_8(const DNXHDContext *ctx,
82 RowContext *row, int n);
83 static int dnxhd_decode_dct_block_10(const DNXHDContext *ctx,
84 RowContext *row, int n);
85 static int dnxhd_decode_dct_block_10_444(const DNXHDContext *ctx,
86 RowContext *row, int n);
87 static int dnxhd_decode_dct_block_12(const DNXHDContext *ctx,
88 RowContext *row, int n);
89 static int dnxhd_decode_dct_block_12_444(const DNXHDContext *ctx,
90 RowContext *row, int n);
91
dnxhd_decode_init(AVCodecContext * avctx)92 static av_cold int dnxhd_decode_init(AVCodecContext *avctx)
93 {
94 DNXHDContext *ctx = avctx->priv_data;
95
96 ctx->avctx = avctx;
97 ctx->cid = -1;
98 if (avctx->colorspace == AVCOL_SPC_UNSPECIFIED) {
99 avctx->colorspace = AVCOL_SPC_BT709;
100 }
101
102 avctx->coded_width = FFALIGN(avctx->width, 16);
103 avctx->coded_height = FFALIGN(avctx->height, 16);
104
105 ctx->rows = av_mallocz_array(avctx->thread_count, sizeof(RowContext));
106 if (!ctx->rows)
107 return AVERROR(ENOMEM);
108
109 return 0;
110 }
111
/**
 * Make sure the AC, DC and run VLC tables match a compression id.
 *
 * Nothing happens when @p cid is the id the tables were last built for.
 * Otherwise the profile is looked up, its bit depth is checked against
 * @p bitdepth (unless the profile declares DNXHD_VARIABLE), the old tables
 * are released and new ones are built.
 *
 * The cached cid is invalidated before the old tables are freed and only
 * set again after all three tables were built, so a failed rebuild can
 * never leave freed or partially built tables marked as valid.
 *
 * @param ctx      decoder context
 * @param cid      compression id read from the frame header
 * @param bitdepth bit depth announced by the frame header
 * @return 0 on success, AVERROR(ENOSYS) for an unknown cid,
 *         AVERROR_INVALIDDATA on a bit depth mismatch, or the negative
 *         error code returned by init_vlc()
 */
static int dnxhd_init_vlc(DNXHDContext *ctx, uint32_t cid, int bitdepth)
{
    int index, ret;

    if (cid == ctx->cid)
        return 0;

    if ((index = ff_dnxhd_get_cid_table(cid)) < 0) {
        av_log(ctx->avctx, AV_LOG_ERROR, "unsupported cid %"PRIu32"\n", cid);
        return AVERROR(ENOSYS);
    }
    if (ff_dnxhd_cid_table[index].bit_depth != bitdepth &&
        ff_dnxhd_cid_table[index].bit_depth != DNXHD_VARIABLE) {
        av_log(ctx->avctx, AV_LOG_ERROR, "bit depth mismatches %d %d\n", ff_dnxhd_cid_table[index].bit_depth, bitdepth);
        return AVERROR_INVALIDDATA;
    }

    /* The tables are about to be torn down: forget which cid they were for. */
    ctx->cid       = -1;
    ctx->cid_table = &ff_dnxhd_cid_table[index];
    av_log(ctx->avctx, AV_LOG_VERBOSE, "Profile cid %"PRIu32".\n", cid);

    ff_free_vlc(&ctx->ac_vlc);
    ff_free_vlc(&ctx->dc_vlc);
    ff_free_vlc(&ctx->run_vlc);

    ret = init_vlc(&ctx->ac_vlc, DNXHD_VLC_BITS, 257,
                   ctx->cid_table->ac_bits, 1, 1,
                   ctx->cid_table->ac_codes, 2, 2, 0);
    if (ret < 0)
        goto fail;

    ret = init_vlc(&ctx->dc_vlc, DNXHD_DC_VLC_BITS, bitdepth > 8 ? 14 : 12,
                   ctx->cid_table->dc_bits, 1, 1,
                   ctx->cid_table->dc_codes, 1, 1, 0);
    if (ret < 0)
        goto fail;

    ret = init_vlc(&ctx->run_vlc, DNXHD_VLC_BITS, 62,
                   ctx->cid_table->run_bits, 1, 1,
                   ctx->cid_table->run_codes, 2, 2, 0);
    if (ret < 0)
        goto fail;

    ctx->cid = cid;
    return 0;

fail:
    /* Drop whatever was built; ctx->cid stays -1 so the next header retries. */
    ff_free_vlc(&ctx->ac_vlc);
    ff_free_vlc(&ctx->dc_vlc);
    ff_free_vlc(&ctx->run_vlc);
    av_log(ctx->avctx, AV_LOG_ERROR, "init_vlc failed\n");
    return ret;
}
147
dnxhd_decode_init_thread_copy(AVCodecContext * avctx)148 static av_cold int dnxhd_decode_init_thread_copy(AVCodecContext *avctx)
149 {
150 DNXHDContext *ctx = avctx->priv_data;
151
152 ctx->avctx = avctx;
153 // make sure VLC tables will be loaded when cid is parsed
154 ctx->cid = -1;
155
156 ctx->rows = av_mallocz_array(avctx->thread_count, sizeof(RowContext));
157 if (!ctx->rows)
158 return AVERROR(ENOMEM);
159
160 return 0;
161 }
162
dnxhd_get_profile(int cid)163 static int dnxhd_get_profile(int cid)
164 {
165 switch(cid) {
166 case 1270:
167 return FF_PROFILE_DNXHR_444;
168 case 1271:
169 return FF_PROFILE_DNXHR_HQX;
170 case 1272:
171 return FF_PROFILE_DNXHR_HQ;
172 case 1273:
173 return FF_PROFILE_DNXHR_SQ;
174 case 1274:
175 return FF_PROFILE_DNXHR_LB;
176 }
177 return FF_PROFILE_DNXHD;
178 }
179
/**
 * Parse the header of one coding unit and update the decoder context.
 *
 * Fields read (byte offsets into @p buf):
 *  - 0x05: bit 1 = interlaced, bit 0 = field of this coding unit
 *  - 0x06: bit 5 = per-macroblock interlace flag present (mbaff)
 *  - 0x07: bit 0 = alpha, bit 1 = lla
 *  - 0x18 / 0x1a: height / width (16 bit big endian)
 *  - 0x21: top three bits = bit depth indicator (1: 8, 2: 10, 3: 12)
 *  - 0x28: compression id (32 bit big endian)
 *  - 0x2C: low three bits = act, bit 6 = 4:4:4
 *  - 0x16c: number of macroblock rows (16 bit big endian)
 *  - 0x170: one 32 bit big endian scan index per macroblock row
 *
 * Besides the context, the function sets interlaced_frame and
 * top_field_first on @p frame, and profile, bits_per_raw_sample and
 * (when the profile mandates a different width) sample_aspect_ratio on
 * the codec context.
 *
 * @param ctx         decoder context
 * @param frame       frame the coding unit will be decoded into
 * @param buf         start of the coding unit
 * @param buf_size    bytes available at @p buf
 * @param first_field non-zero for the first coding unit of a packet
 * @return 0 on success, a negative AVERROR code otherwise
 */
static int dnxhd_decode_header(DNXHDContext *ctx, AVFrame *frame,
                               const uint8_t *buf, int buf_size,
                               int first_field)
{
    int i, cid, ret;
    int old_bit_depth = ctx->bit_depth, bitdepth;
    uint64_t header_prefix;

    if (buf_size < 0x280) {
        av_log(ctx->avctx, AV_LOG_ERROR,
               "buffer too small (%d < 640).\n", buf_size);
        return AVERROR_INVALIDDATA;
    }

    header_prefix = ff_dnxhd_parse_header_prefix(buf);
    if (header_prefix == 0) {
        av_log(ctx->avctx, AV_LOG_ERROR,
               "unknown header 0x%02X 0x%02X 0x%02X 0x%02X 0x%02X\n",
               buf[0], buf[1], buf[2], buf[3], buf[4]);
        return AVERROR_INVALIDDATA;
    }
    if (buf[5] & 2) { /* interlaced */
        /* The second coding unit always holds the opposite field of the
         * first one. Do not trust its own flag: a stream that labels both
         * units as the same field would otherwise write the same lines
         * twice and leave the other field untouched. */
        ctx->cur_field = first_field ? buf[5] & 1 : !ctx->cur_field;
        frame->interlaced_frame = 1;
        frame->top_field_first  = first_field ^ ctx->cur_field;
        av_log(ctx->avctx, AV_LOG_DEBUG,
               "interlaced %d, cur field %d\n", buf[5] & 3, ctx->cur_field);
    } else {
        ctx->cur_field = 0;
    }
    ctx->mbaff = (buf[0x6] >> 5) & 1;
    ctx->alpha =  buf[0x7]       & 1;
    ctx->lla   = (buf[0x7] >> 1) & 1;
    if (ctx->alpha)
        avpriv_request_sample(ctx->avctx, "alpha");

    ctx->height = AV_RB16(buf + 0x18);
    ctx->width  = AV_RB16(buf + 0x1a);

    switch(buf[0x21] >> 5) {
    case 1: bitdepth = 8; break;
    case 2: bitdepth = 10; break;
    case 3: bitdepth = 12; break;
    default:
        av_log(ctx->avctx, AV_LOG_ERROR,
               "Unknown bitdepth indicator (%d)\n", buf[0x21] >> 5);
        return AVERROR_INVALIDDATA;
    }

    cid = AV_RB32(buf + 0x28);

    ctx->avctx->profile = dnxhd_get_profile(cid);

    if ((ret = dnxhd_init_vlc(ctx, cid, bitdepth)) < 0)
        return ret;
    if (ctx->mbaff && ctx->cid_table->cid != 1260)
        av_log(ctx->avctx, AV_LOG_WARNING,
               "Adaptive MB interlace flag in an unsupported profile.\n");

    ctx->act = buf[0x2C] & 7;
    if (ctx->act && ctx->cid_table->cid != 1256 && ctx->cid_table->cid != 1270)
        av_log(ctx->avctx, AV_LOG_WARNING,
               "Adaptive color transform in an unsupported profile.\n");

    /* Pick the block decoder and output pixel format. */
    ctx->is_444 = (buf[0x2C] >> 6) & 1;
    if (ctx->is_444) {
        if (bitdepth == 8) {
            avpriv_request_sample(ctx->avctx, "4:4:4 8 bits");
            return AVERROR_INVALIDDATA;
        } else if (bitdepth == 10) {
            ctx->decode_dct_block = dnxhd_decode_dct_block_10_444;
            ctx->pix_fmt = ctx->act ? AV_PIX_FMT_YUV444P10
                                    : AV_PIX_FMT_GBRP10;
        } else {
            ctx->decode_dct_block = dnxhd_decode_dct_block_12_444;
            ctx->pix_fmt = ctx->act ? AV_PIX_FMT_YUV444P12
                                    : AV_PIX_FMT_GBRP12;
        }
    } else if (bitdepth == 12) {
        ctx->decode_dct_block = dnxhd_decode_dct_block_12;
        ctx->pix_fmt = AV_PIX_FMT_YUV422P12;
    } else if (bitdepth == 10) {
        if (ctx->avctx->profile == FF_PROFILE_DNXHR_HQX)
            ctx->decode_dct_block = dnxhd_decode_dct_block_10_444;
        else
            ctx->decode_dct_block = dnxhd_decode_dct_block_10;
        ctx->pix_fmt = AV_PIX_FMT_YUV422P10;
    } else {
        ctx->decode_dct_block = dnxhd_decode_dct_block_8;
        ctx->pix_fmt = AV_PIX_FMT_YUV422P;
    }

    /* The DSP function tables depend on the bit depth. */
    ctx->avctx->bits_per_raw_sample = ctx->bit_depth = bitdepth;
    if (ctx->bit_depth != old_bit_depth) {
        ff_blockdsp_init(&ctx->bdsp, ctx->avctx);
        ff_idctdsp_init(&ctx->idsp, ctx->avctx);
        ff_init_scantable(ctx->idsp.idct_permutation, &ctx->scantable,
                          ff_zigzag_direct);
    }

    // make sure profile size constraints are respected
    // DNx100 allows 1920->1440 and 1280->960 subsampling
    if (ctx->width != ctx->cid_table->width &&
        ctx->cid_table->width != DNXHD_VARIABLE) {
        av_reduce(&ctx->avctx->sample_aspect_ratio.num,
                  &ctx->avctx->sample_aspect_ratio.den,
                  ctx->width, ctx->cid_table->width, 255);
        ctx->width = ctx->cid_table->width;
    }

    if (buf_size < ctx->cid_table->coding_unit_size) {
        av_log(ctx->avctx, AV_LOG_ERROR, "incorrect frame size (%d < %u).\n",
               buf_size, ctx->cid_table->coding_unit_size);
        return AVERROR_INVALIDDATA;
    }

    ctx->mb_width  = (ctx->width + 15)>> 4;
    ctx->mb_height = AV_RB16(buf + 0x16c);

    /* The header height describes a single field when it matches the
     * number of macroblock rows of this coding unit. */
    if ((ctx->height + 15) >> 4 == ctx->mb_height && frame->interlaced_frame)
        ctx->height <<= 1;

    av_log(ctx->avctx, AV_LOG_VERBOSE, "%ux%u, 4:%s %d bits, MBAFF=%d ACT=%d\n",
           ctx->width, ctx->height, ctx->is_444 ? "4:4" : "2:2",
           ctx->bit_depth, ctx->mbaff, ctx->act);

    // Newer format supports variable mb_scan_index sizes
    if (ctx->mb_height > 68 && ff_dnxhd_check_header_prefix_hr(header_prefix)) {
        ctx->data_offset = 0x170 + (ctx->mb_height << 2);
    } else {
        if (ctx->mb_height > 68) {
            av_log(ctx->avctx, AV_LOG_ERROR,
                   "mb height too big: %u\n", ctx->mb_height);
            return AVERROR_INVALIDDATA;
        }
        ctx->data_offset = 0x280;
    }
    if ((ctx->mb_height << frame->interlaced_frame) > (ctx->height + 15) >> 4) {
        av_log(ctx->avctx, AV_LOG_ERROR,
                "mb height too big: %u\n", ctx->mb_height);
        return AVERROR_INVALIDDATA;
    }

    if (buf_size < ctx->data_offset) {
        av_log(ctx->avctx, AV_LOG_ERROR,
               "buffer too small (%d < %d).\n", buf_size, ctx->data_offset);
        return AVERROR_INVALIDDATA;
    }

    if (ctx->mb_height > FF_ARRAY_ELEMS(ctx->mb_scan_index)) {
        av_log(ctx->avctx, AV_LOG_ERROR,
               "mb_height too big (%u > %"SIZE_SPECIFIER").\n", ctx->mb_height, FF_ARRAY_ELEMS(ctx->mb_scan_index));
        return AVERROR_INVALIDDATA;
    }

    /* Every row offset must point inside the macroblock data. */
    for (i = 0; i < ctx->mb_height; i++) {
        ctx->mb_scan_index[i] = AV_RB32(buf + 0x170 + (i << 2));
        ff_dlog(ctx->avctx, "mb scan index %d, pos %d: %"PRIu32"\n",
                i, 0x170 + (i << 2), ctx->mb_scan_index[i]);
        if (buf_size - ctx->data_offset < ctx->mb_scan_index[i]) {
            av_log(ctx->avctx, AV_LOG_ERROR,
                   "invalid mb scan index (%"PRIu32" vs %u).\n",
                   ctx->mb_scan_index[i],
                   (unsigned)(buf_size - ctx->data_offset));
            return AVERROR_INVALIDDATA;
        }
    }

    return 0;
}
348
dnxhd_decode_dct_block(const DNXHDContext * ctx,RowContext * row,int n,int index_bits,int level_bias,int level_shift,int dc_shift)349 static av_always_inline int dnxhd_decode_dct_block(const DNXHDContext *ctx,
350 RowContext *row,
351 int n,
352 int index_bits,
353 int level_bias,
354 int level_shift,
355 int dc_shift)
356 {
357 int i, j, index1, index2, len, flags;
358 int level, component, sign;
359 const int *scale;
360 const uint8_t *weight_matrix;
361 const uint8_t *ac_info = ctx->cid_table->ac_info;
362 int16_t *block = row->blocks[n];
363 const int eob_index = ctx->cid_table->eob_index;
364 int ret = 0;
365 OPEN_READER(bs, &row->gb);
366
367 ctx->bdsp.clear_block(block);
368
369 if (!ctx->is_444) {
370 if (n & 2) {
371 component = 1 + (n & 1);
372 scale = row->chroma_scale;
373 weight_matrix = ctx->cid_table->chroma_weight;
374 } else {
375 component = 0;
376 scale = row->luma_scale;
377 weight_matrix = ctx->cid_table->luma_weight;
378 }
379 } else {
380 component = (n >> 1) % 3;
381 if (component) {
382 scale = row->chroma_scale;
383 weight_matrix = ctx->cid_table->chroma_weight;
384 } else {
385 scale = row->luma_scale;
386 weight_matrix = ctx->cid_table->luma_weight;
387 }
388 }
389
390 UPDATE_CACHE(bs, &row->gb);
391 GET_VLC(len, bs, &row->gb, ctx->dc_vlc.table, DNXHD_DC_VLC_BITS, 1);
392 if (len < 0) {
393 ret = len;
394 goto error;
395 }
396 if (len) {
397 level = GET_CACHE(bs, &row->gb);
398 LAST_SKIP_BITS(bs, &row->gb, len);
399 sign = ~level >> 31;
400 level = (NEG_USR32(sign ^ level, len) ^ sign) - sign;
401 row->last_dc[component] += level * (1 << dc_shift);
402 }
403 block[0] = row->last_dc[component];
404
405 i = 0;
406
407 UPDATE_CACHE(bs, &row->gb);
408 GET_VLC(index1, bs, &row->gb, ctx->ac_vlc.table,
409 DNXHD_VLC_BITS, 2);
410
411 while (index1 != eob_index) {
412 level = ac_info[2*index1+0];
413 flags = ac_info[2*index1+1];
414
415 sign = SHOW_SBITS(bs, &row->gb, 1);
416 SKIP_BITS(bs, &row->gb, 1);
417
418 if (flags & 1) {
419 level += SHOW_UBITS(bs, &row->gb, index_bits) << 7;
420 SKIP_BITS(bs, &row->gb, index_bits);
421 }
422
423 if (flags & 2) {
424 UPDATE_CACHE(bs, &row->gb);
425 GET_VLC(index2, bs, &row->gb, ctx->run_vlc.table,
426 DNXHD_VLC_BITS, 2);
427 i += ctx->cid_table->run[index2];
428 }
429
430 if (++i > 63) {
431 av_log(ctx->avctx, AV_LOG_ERROR, "ac tex damaged %d, %d\n", n, i);
432 ret = -1;
433 break;
434 }
435
436 j = ctx->scantable.permutated[i];
437 level *= scale[i];
438 level += scale[i] >> 1;
439 if (level_bias < 32 || weight_matrix[i] != level_bias)
440 level += level_bias; // 1<<(level_shift-1)
441 level >>= level_shift;
442
443 block[j] = (level ^ sign) - sign;
444
445 UPDATE_CACHE(bs, &row->gb);
446 GET_VLC(index1, bs, &row->gb, ctx->ac_vlc.table,
447 DNXHD_VLC_BITS, 2);
448 }
449 error:
450 CLOSE_READER(bs, &row->gb);
451 return ret;
452 }
453
/** Block decoder selected by the header parser for 8 bit 4:2:2 content. */
static int dnxhd_decode_dct_block_8(const DNXHDContext *ctx,
                                    RowContext *row, int n)
{
    const int index_bits  = 4;
    const int level_bias  = 32;
    const int level_shift = 6;
    const int dc_shift    = 0;

    return dnxhd_decode_dct_block(ctx, row, n, index_bits, level_bias,
                                  level_shift, dc_shift);
}
459
/** Block decoder selected by the header parser for 10 bit 4:2:2 content. */
static int dnxhd_decode_dct_block_10(const DNXHDContext *ctx,
                                     RowContext *row, int n)
{
    const int index_bits  = 6;
    const int level_bias  = 8;
    const int level_shift = 4;
    const int dc_shift    = 0;

    return dnxhd_decode_dct_block(ctx, row, n, index_bits, level_bias,
                                  level_shift, dc_shift);
}
465
/**
 * Block decoder selected by the header parser for 10 bit 4:4:4 content
 * and for the 10 bit DNxHR HQX profile.
 */
static int dnxhd_decode_dct_block_10_444(const DNXHDContext *ctx,
                                         RowContext *row, int n)
{
    const int index_bits  = 6;
    const int level_bias  = 32;
    const int level_shift = 6;
    const int dc_shift    = 0;

    return dnxhd_decode_dct_block(ctx, row, n, index_bits, level_bias,
                                  level_shift, dc_shift);
}
471
/** Block decoder selected by the header parser for 12 bit 4:2:2 content. */
static int dnxhd_decode_dct_block_12(const DNXHDContext *ctx,
                                     RowContext *row, int n)
{
    const int index_bits  = 6;
    const int level_bias  = 8;
    const int level_shift = 4;
    const int dc_shift    = 2;

    return dnxhd_decode_dct_block(ctx, row, n, index_bits, level_bias,
                                  level_shift, dc_shift);
}
477
/** Block decoder selected by the header parser for 12 bit 4:4:4 content. */
static int dnxhd_decode_dct_block_12_444(const DNXHDContext *ctx,
                                         RowContext *row, int n)
{
    const int index_bits  = 6;
    const int level_bias  = 32;
    const int level_shift = 4;
    const int dc_shift    = 2;

    return dnxhd_decode_dct_block(ctx, row, n, index_bits, level_bias,
                                  level_shift, dc_shift);
}
483
/**
 * Decode one macroblock from the row bit reader and write it to the frame.
 *
 * Reads the macroblock header (optional interlace bit, qscale, ACT bit),
 * refreshes the row's scale tables when qscale changed, decodes 8 blocks
 * (12 for 4:4:4) and runs idct_put on each of them. Chroma output is
 * skipped when AV_CODEC_FLAG_GRAY is set.
 *
 * @param ctx   decoder context
 * @param row   row context of the calling thread
 * @param frame destination frame
 * @param x     macroblock column
 * @param y     macroblock row
 * @return 0 on success, AVERROR_INVALIDDATA if a block fails to decode
 */
static int dnxhd_decode_macroblock(const DNXHDContext *ctx, RowContext *row,
                                   AVFrame *frame, int x, int y)
{
    const int hi_depth  = ctx->bit_depth >= 10; /* two bytes per sample */
    const int nb_blocks = 8 + 4 * ctx->is_444;
    const int luma_low  = ctx->is_444 ? 6 : 4;  /* first block of the lower luma pair */
    int stride_y = frame->linesize[0];
    int stride_c = frame->linesize[1];
    uint8_t *dest_y, *dest_u, *dest_v;
    int down, right;
    int chroma_col;
    int qscale, act, i;
    int interlaced_mb = 0;

    /* Macroblock header. */
    if (ctx->mbaff) {
        interlaced_mb = get_bits1(&row->gb);
        qscale        = get_bits(&row->gb, 10);
    } else {
        qscale = get_bits(&row->gb, 11);
    }
    act = get_bits1(&row->gb);
    if (act) {
        if (ctx->act) {
            if (row->format == -1)
                row->format = act;
            else if (row->format != act)
                row->format = 2; // Variable
        } else {
            static int act_warned;
            if (!act_warned) {
                act_warned = 1;
                av_log(ctx->avctx, AV_LOG_ERROR,
                       "ACT flag set, in violation of frame header.\n");
            }
        }
    }

    /* The scale tables only depend on qscale; rebuild them on change. */
    if (qscale != row->last_qscale) {
        for (i = 0; i < 64; i++) {
            row->luma_scale[i]   = qscale * ctx->cid_table->luma_weight[i];
            row->chroma_scale[i] = qscale * ctx->cid_table->chroma_weight[i];
        }
        row->last_qscale = qscale;
    }

    for (i = 0; i < nb_blocks; i++) {
        if (ctx->decode_dct_block(ctx, row, i) < 0)
            return AVERROR_INVALIDDATA;
    }

    /* Fields are interleaved line by line in the frame. */
    if (frame->interlaced_frame) {
        stride_y <<= 1;
        stride_c <<= 1;
    }

    chroma_col = x << (3 + hi_depth + ctx->is_444);
    dest_y = frame->data[0] + ((y * stride_y) << 4) + (x << (4 + hi_depth));
    dest_u = frame->data[1] + ((y * stride_c) << 4) + chroma_col;
    dest_v = frame->data[2] + ((y * stride_c) << 4) + chroma_col;

    if (frame->interlaced_frame && ctx->cur_field) {
        dest_y += frame->linesize[0];
        dest_u += frame->linesize[1];
        dest_v += frame->linesize[2];
    }
    if (interlaced_mb) {
        stride_y <<= 1;
        stride_c <<= 1;
    }

    right = 8 << hi_depth;

    /* Luma: upper pair is blocks 0/1, lower pair depends on the sampling. */
    down = interlaced_mb ? frame->linesize[0] : (stride_y << 3);
    ctx->idsp.idct_put(dest_y,                stride_y, row->blocks[0]);
    ctx->idsp.idct_put(dest_y + right,        stride_y, row->blocks[1]);
    ctx->idsp.idct_put(dest_y + down,         stride_y, row->blocks[luma_low]);
    ctx->idsp.idct_put(dest_y + down + right, stride_y, row->blocks[luma_low + 1]);

    if (ctx->avctx->flags & AV_CODEC_FLAG_GRAY)
        return 0;

    down = interlaced_mb ? frame->linesize[1] : (stride_c << 3);
    if (!ctx->is_444) {
        /* 4:2:2: one block column per chroma plane */
        ctx->idsp.idct_put(dest_u,        stride_c, row->blocks[2]);
        ctx->idsp.idct_put(dest_v,        stride_c, row->blocks[3]);
        ctx->idsp.idct_put(dest_u + down, stride_c, row->blocks[6]);
        ctx->idsp.idct_put(dest_v + down, stride_c, row->blocks[7]);
    } else {
        /* 4:4:4: each chroma plane has the same 2x2 layout as luma */
        ctx->idsp.idct_put(dest_u,                stride_c, row->blocks[2]);
        ctx->idsp.idct_put(dest_u + right,        stride_c, row->blocks[3]);
        ctx->idsp.idct_put(dest_u + down,         stride_c, row->blocks[8]);
        ctx->idsp.idct_put(dest_u + down + right, stride_c, row->blocks[9]);
        ctx->idsp.idct_put(dest_v,                stride_c, row->blocks[4]);
        ctx->idsp.idct_put(dest_v + right,        stride_c, row->blocks[5]);
        ctx->idsp.idct_put(dest_v + down,         stride_c, row->blocks[10]);
        ctx->idsp.idct_put(dest_v + down + right, stride_c, row->blocks[11]);
    }

    return 0;
}
585
/**
 * execute2() job: decode one row of macroblocks.
 *
 * Resets the DC values, positions the thread's bit reader at the row's
 * scan index and decodes mb_width macroblocks. Any failure, including a
 * bit reader that cannot be set up, is counted in the row context's
 * error counter.
 *
 * @param avctx    codec context
 * @param data     destination AVFrame
 * @param rownb    macroblock row to decode
 * @param threadnb index of the row context to use
 * @return 0 on success, a negative AVERROR code otherwise
 */
static int dnxhd_decode_row(AVCodecContext *avctx, void *data,
                            int rownb, int threadnb)
{
    const DNXHDContext *ctx = avctx->priv_data;
    uint32_t offset = ctx->mb_scan_index[rownb];
    RowContext *row = ctx->rows + threadnb;
    int x, ret;

    row->last_dc[0] =
    row->last_dc[1] =
    row->last_dc[2] = 1 << (ctx->bit_depth + 2); // for levels +2^(bitdepth-1)

    /* init_get_bits8() takes a byte count and rejects sizes whose bit
     * count would not fit, instead of silently wrapping in a "<< 3". */
    ret = init_get_bits8(&row->gb, ctx->buf + offset, ctx->buf_size - offset);
    if (ret < 0) {
        row->errors++;
        return ret;
    }

    for (x = 0; x < ctx->mb_width; x++) {
        ret = dnxhd_decode_macroblock(ctx, row, data, x, rownb);
        if (ret < 0) {
            row->errors++;
            return ret;
        }
    }

    return 0;
}
610
/**
 * Decode callback: decode one packet into one frame.
 *
 * A packet holds one coding unit, or two for interlaced content (one per
 * field). For each unit the header is parsed, the codec context's pixel
 * format and dimensions are updated, a buffer is requested for the first
 * unit (or again if size or format changed), and all macroblock rows are
 * decoded through execute2(). Afterwards the per-row error counters are
 * summed and, for ACT streams, the pixel format is derived from the ACT
 * flags seen in the macroblocks.
 *
 * @param avctx     codec context
 * @param data      AVFrame to fill
 * @param got_frame set to 1 when a frame was produced
 * @param avpkt     input packet
 * @return avpkt->size on success, a negative AVERROR code otherwise
 */
static int dnxhd_decode_frame(AVCodecContext *avctx, void *data,
                              int *got_frame, AVPacket *avpkt)
{
    const uint8_t *buf = avpkt->data;
    int buf_size = avpkt->size;
    DNXHDContext *ctx = avctx->priv_data;
    ThreadFrame frame = { .f = data };
    AVFrame *picture = data;
    int first_field = 1;
    int ret, i;

    ff_dlog(avctx, "frame size %d\n", buf_size);

    /* Start every packet from a clean slate. Clearing the error counters
     * here matters: a previous call may have bailed out early (e.g. on a
     * bad second-field header) after rows had already failed, and those
     * stale counts must not be charged to this packet. */
    for (i = 0; i < avctx->thread_count; i++) {
        ctx->rows[i].format = -1;
        ctx->rows[i].errors = 0;
    }

decode_coding_unit:
    if ((ret = dnxhd_decode_header(ctx, picture, buf, buf_size, first_field)) < 0)
        return ret;

    if ((avctx->width || avctx->height) &&
        (ctx->width != avctx->width || ctx->height != avctx->height)) {
        av_log(avctx, AV_LOG_WARNING, "frame size changed: %dx%d -> %ux%u\n",
               avctx->width, avctx->height, ctx->width, ctx->height);
        first_field = 1;
    }
    if (avctx->pix_fmt != AV_PIX_FMT_NONE && avctx->pix_fmt != ctx->pix_fmt) {
        av_log(avctx, AV_LOG_WARNING, "pix_fmt changed: %s -> %s\n",
               av_get_pix_fmt_name(avctx->pix_fmt), av_get_pix_fmt_name(ctx->pix_fmt));
        first_field = 1;
    }

    avctx->pix_fmt = ctx->pix_fmt;
    ret = ff_set_dimensions(avctx, ctx->width, ctx->height);
    if (ret < 0)
        return ret;

    if (first_field) {
        if ((ret = ff_thread_get_buffer(avctx, &frame, 0)) < 0)
            return ret;
        picture->pict_type = AV_PICTURE_TYPE_I;
        picture->key_frame = 1;
    }

    /* Row offsets in mb_scan_index are relative to the macroblock data. */
    ctx->buf_size = buf_size - ctx->data_offset;
    ctx->buf = buf + ctx->data_offset;
    avctx->execute2(avctx, dnxhd_decode_row, picture, NULL, ctx->mb_height);

    /* Interlaced: the second field follows as its own coding unit. */
    if (first_field && picture->interlaced_frame) {
        buf      += ctx->cid_table->coding_unit_size;
        buf_size -= ctx->cid_table->coding_unit_size;
        first_field = 0;
        goto decode_coding_unit;
    }

    ret = 0;
    for (i = 0; i < avctx->thread_count; i++)
        ret += ctx->rows[i].errors;

    if (ctx->act) {
        static int act_warned;
        int format = ctx->rows[0].format;
        for (i = 1; i < avctx->thread_count; i++) {
            if (ctx->rows[i].format != format &&
                ctx->rows[i].format != -1 /* not run */) {
                format = 2;
                break;
            }
        }
        switch (format) {
        case -1:
        case 2:
            if (!act_warned) {
                act_warned = 1;
                av_log(ctx->avctx, AV_LOG_ERROR,
                       "Unsupported: variable ACT flag.\n");
            }
            break;
        case 0:
            ctx->pix_fmt = ctx->bit_depth==10
                           ? AV_PIX_FMT_GBRP10 : AV_PIX_FMT_GBRP12;
            break;
        case 1:
            ctx->pix_fmt = ctx->bit_depth==10
                           ? AV_PIX_FMT_YUV444P10 : AV_PIX_FMT_YUV444P12;
            break;
        }
    }
    avctx->pix_fmt = ctx->pix_fmt;
    if (ret) {
        av_log(ctx->avctx, AV_LOG_ERROR, "%d lines with errors\n", ret);
        return AVERROR_INVALIDDATA;
    }

    *got_frame = 1;
    return avpkt->size;
}
710
dnxhd_decode_close(AVCodecContext * avctx)711 static av_cold int dnxhd_decode_close(AVCodecContext *avctx)
712 {
713 DNXHDContext *ctx = avctx->priv_data;
714
715 ff_free_vlc(&ctx->ac_vlc);
716 ff_free_vlc(&ctx->dc_vlc);
717 ff_free_vlc(&ctx->run_vlc);
718
719 av_freep(&ctx->rows);
720
721 return 0;
722 }
723
724 AVCodec ff_dnxhd_decoder = {
725 .name = "dnxhd",
726 .long_name = NULL_IF_CONFIG_SMALL("VC3/DNxHD"),
727 .type = AVMEDIA_TYPE_VIDEO,
728 .id = AV_CODEC_ID_DNXHD,
729 .priv_data_size = sizeof(DNXHDContext),
730 .init = dnxhd_decode_init,
731 .close = dnxhd_decode_close,
732 .decode = dnxhd_decode_frame,
733 .capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS |
734 AV_CODEC_CAP_SLICE_THREADS,
735 .init_thread_copy = ONLY_IF_THREADS_ENABLED(dnxhd_decode_init_thread_copy),
736 .profiles = NULL_IF_CONFIG_SMALL(ff_dnxhd_profiles),
737 };
738