xref: /third_party/ffmpeg/libavcodec/dnxhddec.c (revision cabdff1a)
/*
 * VC3/DNxHD decoder.
 * Copyright (c) 2007 SmartJog S.A., Baptiste Coudurier <baptiste dot coudurier at smartjog dot com>
 * Copyright (c) 2011 MirriAd Ltd
 * Copyright (c) 2015 Christophe Gisquet
 *
 * 10 bit support added by MirriAd Ltd, Joseph Artsimovich <joseph@mirriad.com>
 * Slice multithreading and MB interlaced support added by Christophe Gisquet
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
26
27#include "libavutil/imgutils.h"
28#include "libavutil/mem_internal.h"
29
30#include "avcodec.h"
31#include "blockdsp.h"
32#include "codec_internal.h"
33#define  UNCHECKED_BITSTREAM_READER 1
34#include "get_bits.h"
35#include "dnxhddata.h"
36#include "idctdsp.h"
37#include "internal.h"
38#include "profiles.h"
39#include "thread.h"
40
41typedef struct RowContext {
42    DECLARE_ALIGNED(32, int16_t, blocks)[12][64];
43    int luma_scale[64];
44    int chroma_scale[64];
45    GetBitContext gb;
46    int last_dc[3];
47    int last_qscale;
48    int errors;
49    /** -1:not set yet  0:off=RGB  1:on=YUV  2:variable */
50    int format;
51} RowContext;
52
53typedef struct DNXHDContext {
54    AVCodecContext *avctx;
55    RowContext *rows;
56    BlockDSPContext bdsp;
57    const uint8_t* buf;
58    int buf_size;
59    int64_t cid;                        ///< compression id
60    unsigned int width, height;
61    enum AVPixelFormat pix_fmt;
62    unsigned int mb_width, mb_height;
63    uint32_t mb_scan_index[512];
64    int data_offset;                    // End of mb_scan_index, where macroblocks start
65    int cur_field;                      ///< current interlaced field
66    VLC ac_vlc, dc_vlc, run_vlc;
67    IDCTDSPContext idsp;
68    ScanTable scantable;
69    const CIDEntry *cid_table;
70    int bit_depth; // 8, 10, 12 or 0 if not initialized at all.
71    int is_444;
72    int alpha;
73    int lla;
74    int mbaff;
75    int act;
76    int (*decode_dct_block)(const struct DNXHDContext *ctx,
77                            RowContext *row, int n);
78} DNXHDContext;
79
80#define DNXHD_VLC_BITS 9
81#define DNXHD_DC_VLC_BITS 7
82
83static int dnxhd_decode_dct_block_8(const DNXHDContext *ctx,
84                                    RowContext *row, int n);
85static int dnxhd_decode_dct_block_10(const DNXHDContext *ctx,
86                                     RowContext *row, int n);
87static int dnxhd_decode_dct_block_10_444(const DNXHDContext *ctx,
88                                         RowContext *row, int n);
89static int dnxhd_decode_dct_block_12(const DNXHDContext *ctx,
90                                     RowContext *row, int n);
91static int dnxhd_decode_dct_block_12_444(const DNXHDContext *ctx,
92                                         RowContext *row, int n);
93
94static av_cold int dnxhd_decode_init(AVCodecContext *avctx)
95{
96    DNXHDContext *ctx = avctx->priv_data;
97
98    ctx->avctx = avctx;
99    ctx->cid = -1;
100    if (avctx->colorspace == AVCOL_SPC_UNSPECIFIED) {
101        avctx->colorspace = AVCOL_SPC_BT709;
102    }
103
104    avctx->coded_width  = FFALIGN(avctx->width,  16);
105    avctx->coded_height = FFALIGN(avctx->height, 16);
106
107    ctx->rows = av_calloc(avctx->thread_count, sizeof(*ctx->rows));
108    if (!ctx->rows)
109        return AVERROR(ENOMEM);
110
111    return 0;
112}
113
114static int dnxhd_init_vlc(DNXHDContext *ctx, uint32_t cid, int bitdepth)
115{
116    int ret;
117    if (cid != ctx->cid) {
118        const CIDEntry *cid_table = ff_dnxhd_get_cid_table(cid);
119
120        if (!cid_table) {
121            av_log(ctx->avctx, AV_LOG_ERROR, "unsupported cid %"PRIu32"\n", cid);
122            return AVERROR(ENOSYS);
123        }
124        if (cid_table->bit_depth != bitdepth &&
125            cid_table->bit_depth != DNXHD_VARIABLE) {
126            av_log(ctx->avctx, AV_LOG_ERROR, "bit depth mismatches %d %d\n",
127                   cid_table->bit_depth, bitdepth);
128            return AVERROR_INVALIDDATA;
129        }
130        ctx->cid_table = cid_table;
131        av_log(ctx->avctx, AV_LOG_VERBOSE, "Profile cid %"PRIu32".\n", cid);
132
133        ff_free_vlc(&ctx->ac_vlc);
134        ff_free_vlc(&ctx->dc_vlc);
135        ff_free_vlc(&ctx->run_vlc);
136
137        if ((ret = init_vlc(&ctx->ac_vlc, DNXHD_VLC_BITS, 257,
138                 ctx->cid_table->ac_bits, 1, 1,
139                 ctx->cid_table->ac_codes, 2, 2, 0)) < 0)
140            goto out;
141        if ((ret = init_vlc(&ctx->dc_vlc, DNXHD_DC_VLC_BITS, bitdepth > 8 ? 14 : 12,
142                 ctx->cid_table->dc_bits, 1, 1,
143                 ctx->cid_table->dc_codes, 1, 1, 0)) < 0)
144            goto out;
145        if ((ret = init_vlc(&ctx->run_vlc, DNXHD_VLC_BITS, 62,
146                 ctx->cid_table->run_bits, 1, 1,
147                 ctx->cid_table->run_codes, 2, 2, 0)) < 0)
148            goto out;
149
150        ctx->cid = cid;
151    }
152    ret = 0;
153out:
154    if (ret < 0)
155        av_log(ctx->avctx, AV_LOG_ERROR, "init_vlc failed\n");
156    return ret;
157}
158
159static int dnxhd_get_profile(int cid)
160{
161    switch(cid) {
162    case 1270:
163        return FF_PROFILE_DNXHR_444;
164    case 1271:
165        return FF_PROFILE_DNXHR_HQX;
166    case 1272:
167        return FF_PROFILE_DNXHR_HQ;
168    case 1273:
169        return FF_PROFILE_DNXHR_SQ;
170    case 1274:
171        return FF_PROFILE_DNXHR_LB;
172    }
173    return FF_PROFILE_DNXHD;
174}
175
176static int dnxhd_decode_header(DNXHDContext *ctx, AVFrame *frame,
177                               const uint8_t *buf, int buf_size,
178                               int first_field)
179{
180    int i, cid, ret;
181    int old_bit_depth = ctx->bit_depth, bitdepth;
182    uint64_t header_prefix;
183    if (buf_size < 0x280) {
184        av_log(ctx->avctx, AV_LOG_ERROR,
185               "buffer too small (%d < 640).\n", buf_size);
186        return AVERROR_INVALIDDATA;
187    }
188
189    header_prefix = ff_dnxhd_parse_header_prefix(buf);
190    if (header_prefix == 0) {
191        av_log(ctx->avctx, AV_LOG_ERROR,
192               "unknown header 0x%02X 0x%02X 0x%02X 0x%02X 0x%02X\n",
193               buf[0], buf[1], buf[2], buf[3], buf[4]);
194        return AVERROR_INVALIDDATA;
195    }
196    if (buf[5] & 2) { /* interlaced */
197        ctx->cur_field = first_field ? buf[5] & 1 : !ctx->cur_field;
198        frame->interlaced_frame = 1;
199        frame->top_field_first  = first_field ^ ctx->cur_field;
200        av_log(ctx->avctx, AV_LOG_DEBUG,
201               "interlaced %d, cur field %d\n", buf[5] & 3, ctx->cur_field);
202    } else {
203        ctx->cur_field = 0;
204    }
205    ctx->mbaff = (buf[0x6] >> 5) & 1;
206    ctx->alpha = buf[0x7] & 1;
207    ctx->lla   = (buf[0x7] >> 1) & 1;
208    if (ctx->alpha)
209        avpriv_request_sample(ctx->avctx, "alpha");
210
211    ctx->height = AV_RB16(buf + 0x18);
212    ctx->width  = AV_RB16(buf + 0x1a);
213
214    switch(buf[0x21] >> 5) {
215    case 1: bitdepth = 8; break;
216    case 2: bitdepth = 10; break;
217    case 3: bitdepth = 12; break;
218    default:
219        av_log(ctx->avctx, AV_LOG_ERROR,
220               "Unknown bitdepth indicator (%d)\n", buf[0x21] >> 5);
221        return AVERROR_INVALIDDATA;
222    }
223
224    cid = AV_RB32(buf + 0x28);
225
226    ctx->avctx->profile = dnxhd_get_profile(cid);
227
228    if ((ret = dnxhd_init_vlc(ctx, cid, bitdepth)) < 0)
229        return ret;
230    if (ctx->mbaff && ctx->cid_table->cid != 1260)
231        av_log(ctx->avctx, AV_LOG_WARNING,
232               "Adaptive MB interlace flag in an unsupported profile.\n");
233
234    switch ((buf[0x2C] >> 1) & 3) {
235    case 0: frame->colorspace = AVCOL_SPC_BT709;       break;
236    case 1: frame->colorspace = AVCOL_SPC_BT2020_NCL;  break;
237    case 2: frame->colorspace = AVCOL_SPC_BT2020_CL;   break;
238    case 3: frame->colorspace = AVCOL_SPC_UNSPECIFIED; break;
239    }
240
241    ctx->act = buf[0x2C] & 1;
242    if (ctx->act && ctx->cid_table->cid != 1256 && ctx->cid_table->cid != 1270)
243        av_log(ctx->avctx, AV_LOG_WARNING,
244               "Adaptive color transform in an unsupported profile.\n");
245
246    ctx->is_444 = (buf[0x2C] >> 6) & 1;
247    if (ctx->is_444) {
248        if (bitdepth == 8) {
249            avpriv_request_sample(ctx->avctx, "4:4:4 8 bits");
250            return AVERROR_INVALIDDATA;
251        } else if (bitdepth == 10) {
252            ctx->decode_dct_block = dnxhd_decode_dct_block_10_444;
253            ctx->pix_fmt = ctx->act ? AV_PIX_FMT_YUV444P10
254                                    : AV_PIX_FMT_GBRP10;
255        } else {
256            ctx->decode_dct_block = dnxhd_decode_dct_block_12_444;
257            ctx->pix_fmt = ctx->act ? AV_PIX_FMT_YUV444P12
258                                    : AV_PIX_FMT_GBRP12;
259        }
260    } else if (bitdepth == 12) {
261        ctx->decode_dct_block = dnxhd_decode_dct_block_12;
262        ctx->pix_fmt = AV_PIX_FMT_YUV422P12;
263    } else if (bitdepth == 10) {
264        if (ctx->avctx->profile == FF_PROFILE_DNXHR_HQX)
265            ctx->decode_dct_block = dnxhd_decode_dct_block_10_444;
266        else
267            ctx->decode_dct_block = dnxhd_decode_dct_block_10;
268        ctx->pix_fmt = AV_PIX_FMT_YUV422P10;
269    } else {
270        ctx->decode_dct_block = dnxhd_decode_dct_block_8;
271        ctx->pix_fmt = AV_PIX_FMT_YUV422P;
272    }
273
274    ctx->avctx->bits_per_raw_sample = ctx->bit_depth = bitdepth;
275    if (ctx->bit_depth != old_bit_depth) {
276        ff_blockdsp_init(&ctx->bdsp, ctx->avctx);
277        ff_idctdsp_init(&ctx->idsp, ctx->avctx);
278        ff_init_scantable(ctx->idsp.idct_permutation, &ctx->scantable,
279                          ff_zigzag_direct);
280    }
281
282    // make sure profile size constraints are respected
283    // DNx100 allows 1920->1440 and 1280->960 subsampling
284    if (ctx->width != ctx->cid_table->width &&
285        ctx->cid_table->width != DNXHD_VARIABLE) {
286        av_reduce(&ctx->avctx->sample_aspect_ratio.num,
287                  &ctx->avctx->sample_aspect_ratio.den,
288                  ctx->width, ctx->cid_table->width, 255);
289        ctx->width = ctx->cid_table->width;
290    }
291
292    if (buf_size < ctx->cid_table->coding_unit_size) {
293        av_log(ctx->avctx, AV_LOG_ERROR, "incorrect frame size (%d < %u).\n",
294               buf_size, ctx->cid_table->coding_unit_size);
295        return AVERROR_INVALIDDATA;
296    }
297
298    ctx->mb_width  = (ctx->width + 15)>> 4;
299    ctx->mb_height = AV_RB16(buf + 0x16c);
300
301    if ((ctx->height + 15) >> 4 == ctx->mb_height && frame->interlaced_frame)
302        ctx->height <<= 1;
303
304    av_log(ctx->avctx, AV_LOG_VERBOSE, "%dx%d, 4:%s %d bits, MBAFF=%d ACT=%d\n",
305           ctx->width, ctx->height, ctx->is_444 ? "4:4" : "2:2",
306           ctx->bit_depth, ctx->mbaff, ctx->act);
307
308    // Newer format supports variable mb_scan_index sizes
309    if (ctx->mb_height > 68 && ff_dnxhd_check_header_prefix_hr(header_prefix)) {
310        ctx->data_offset = 0x170 + (ctx->mb_height << 2);
311    } else {
312        if (ctx->mb_height > 68) {
313            av_log(ctx->avctx, AV_LOG_ERROR,
314                   "mb height too big: %d\n", ctx->mb_height);
315            return AVERROR_INVALIDDATA;
316        }
317        ctx->data_offset = 0x280;
318    }
319    if ((ctx->mb_height << frame->interlaced_frame) > (ctx->height + 15) >> 4) {
320        av_log(ctx->avctx, AV_LOG_ERROR,
321                "mb height too big: %d\n", ctx->mb_height);
322        return AVERROR_INVALIDDATA;
323    }
324
325    if (buf_size < ctx->data_offset) {
326        av_log(ctx->avctx, AV_LOG_ERROR,
327               "buffer too small (%d < %d).\n", buf_size, ctx->data_offset);
328        return AVERROR_INVALIDDATA;
329    }
330
331    if (ctx->mb_height > FF_ARRAY_ELEMS(ctx->mb_scan_index)) {
332        av_log(ctx->avctx, AV_LOG_ERROR,
333               "mb_height too big (%d > %"SIZE_SPECIFIER").\n", ctx->mb_height, FF_ARRAY_ELEMS(ctx->mb_scan_index));
334        return AVERROR_INVALIDDATA;
335    }
336
337    for (i = 0; i < ctx->mb_height; i++) {
338        ctx->mb_scan_index[i] = AV_RB32(buf + 0x170 + (i << 2));
339        ff_dlog(ctx->avctx, "mb scan index %d, pos %d: %"PRIu32"\n",
340                i, 0x170 + (i << 2), ctx->mb_scan_index[i]);
341        if (buf_size - ctx->data_offset < ctx->mb_scan_index[i]) {
342            av_log(ctx->avctx, AV_LOG_ERROR,
343                   "invalid mb scan index (%"PRIu32" vs %u).\n",
344                   ctx->mb_scan_index[i], buf_size - ctx->data_offset);
345            return AVERROR_INVALIDDATA;
346        }
347    }
348
349    return 0;
350}
351
352static av_always_inline int dnxhd_decode_dct_block(const DNXHDContext *ctx,
353                                                   RowContext *row,
354                                                   int n,
355                                                   int index_bits,
356                                                   int level_bias,
357                                                   int level_shift,
358                                                   int dc_shift)
359{
360    int i, j, index1, index2, len, flags;
361    int level, component, sign;
362    const int *scale;
363    const uint8_t *weight_matrix;
364    const uint8_t *ac_info = ctx->cid_table->ac_info;
365    int16_t *block = row->blocks[n];
366    const int eob_index     = ctx->cid_table->eob_index;
367    int ret = 0;
368    OPEN_READER(bs, &row->gb);
369
370    ctx->bdsp.clear_block(block);
371
372    if (!ctx->is_444) {
373        if (n & 2) {
374            component     = 1 + (n & 1);
375            scale = row->chroma_scale;
376            weight_matrix = ctx->cid_table->chroma_weight;
377        } else {
378            component     = 0;
379            scale = row->luma_scale;
380            weight_matrix = ctx->cid_table->luma_weight;
381        }
382    } else {
383        component = (n >> 1) % 3;
384        if (component) {
385            scale = row->chroma_scale;
386            weight_matrix = ctx->cid_table->chroma_weight;
387        } else {
388            scale = row->luma_scale;
389            weight_matrix = ctx->cid_table->luma_weight;
390        }
391    }
392
393    UPDATE_CACHE(bs, &row->gb);
394    GET_VLC(len, bs, &row->gb, ctx->dc_vlc.table, DNXHD_DC_VLC_BITS, 1);
395    if (len < 0) {
396        ret = len;
397        goto error;
398    }
399    if (len) {
400        level = GET_CACHE(bs, &row->gb);
401        LAST_SKIP_BITS(bs, &row->gb, len);
402        sign  = ~level >> 31;
403        level = (NEG_USR32(sign ^ level, len) ^ sign) - sign;
404        row->last_dc[component] += level * (1 << dc_shift);
405    }
406    block[0] = row->last_dc[component];
407
408    i = 0;
409
410    UPDATE_CACHE(bs, &row->gb);
411    GET_VLC(index1, bs, &row->gb, ctx->ac_vlc.table,
412            DNXHD_VLC_BITS, 2);
413
414    while (index1 != eob_index) {
415        level = ac_info[2*index1+0];
416        flags = ac_info[2*index1+1];
417
418        sign = SHOW_SBITS(bs, &row->gb, 1);
419        SKIP_BITS(bs, &row->gb, 1);
420
421        if (flags & 1) {
422            level += SHOW_UBITS(bs, &row->gb, index_bits) << 7;
423            SKIP_BITS(bs, &row->gb, index_bits);
424        }
425
426        if (flags & 2) {
427            UPDATE_CACHE(bs, &row->gb);
428            GET_VLC(index2, bs, &row->gb, ctx->run_vlc.table,
429                    DNXHD_VLC_BITS, 2);
430            i += ctx->cid_table->run[index2];
431        }
432
433        if (++i > 63) {
434            av_log(ctx->avctx, AV_LOG_ERROR, "ac tex damaged %d, %d\n", n, i);
435            ret = -1;
436            break;
437        }
438
439        j     = ctx->scantable.permutated[i];
440        level *= scale[i];
441        level += scale[i] >> 1;
442        if (level_bias < 32 || weight_matrix[i] != level_bias)
443            level += level_bias; // 1<<(level_shift-1)
444        level >>= level_shift;
445
446        block[j] = (level ^ sign) - sign;
447
448        UPDATE_CACHE(bs, &row->gb);
449        GET_VLC(index1, bs, &row->gb, ctx->ac_vlc.table,
450                DNXHD_VLC_BITS, 2);
451    }
452error:
453    CLOSE_READER(bs, &row->gb);
454    return ret;
455}
456
457static int dnxhd_decode_dct_block_8(const DNXHDContext *ctx,
458                                    RowContext *row, int n)
459{
460    return dnxhd_decode_dct_block(ctx, row, n, 4, 32, 6, 0);
461}
462
463static int dnxhd_decode_dct_block_10(const DNXHDContext *ctx,
464                                     RowContext *row, int n)
465{
466    return dnxhd_decode_dct_block(ctx, row, n, 6, 8, 4, 0);
467}
468
469static int dnxhd_decode_dct_block_10_444(const DNXHDContext *ctx,
470                                         RowContext *row, int n)
471{
472    return dnxhd_decode_dct_block(ctx, row, n, 6, 32, 6, 0);
473}
474
475static int dnxhd_decode_dct_block_12(const DNXHDContext *ctx,
476                                     RowContext *row, int n)
477{
478    return dnxhd_decode_dct_block(ctx, row, n, 6, 8, 4, 2);
479}
480
481static int dnxhd_decode_dct_block_12_444(const DNXHDContext *ctx,
482                                         RowContext *row, int n)
483{
484    return dnxhd_decode_dct_block(ctx, row, n, 6, 32, 4, 2);
485}
486
487static int dnxhd_decode_macroblock(const DNXHDContext *ctx, RowContext *row,
488                                   AVFrame *frame, int x, int y)
489{
490    int shift1 = ctx->bit_depth >= 10;
491    int dct_linesize_luma   = frame->linesize[0];
492    int dct_linesize_chroma = frame->linesize[1];
493    uint8_t *dest_y, *dest_u, *dest_v;
494    int dct_y_offset, dct_x_offset;
495    int qscale, i, act;
496    int interlaced_mb = 0;
497
498    if (ctx->mbaff) {
499        interlaced_mb = get_bits1(&row->gb);
500        qscale = get_bits(&row->gb, 10);
501    } else {
502        qscale = get_bits(&row->gb, 11);
503    }
504    act = get_bits1(&row->gb);
505    if (act) {
506        if (!ctx->act) {
507            static int act_warned;
508            if (!act_warned) {
509                act_warned = 1;
510                av_log(ctx->avctx, AV_LOG_ERROR,
511                       "ACT flag set, in violation of frame header.\n");
512            }
513        } else if (row->format == -1) {
514            row->format = act;
515        } else if (row->format != act) {
516            row->format = 2; // Variable
517        }
518    }
519
520    if (qscale != row->last_qscale) {
521        for (i = 0; i < 64; i++) {
522            row->luma_scale[i]   = qscale * ctx->cid_table->luma_weight[i];
523            row->chroma_scale[i] = qscale * ctx->cid_table->chroma_weight[i];
524        }
525        row->last_qscale = qscale;
526    }
527
528    for (i = 0; i < 8 + 4 * ctx->is_444; i++) {
529        if (ctx->decode_dct_block(ctx, row, i) < 0)
530            return AVERROR_INVALIDDATA;
531    }
532
533    if (frame->interlaced_frame) {
534        dct_linesize_luma   <<= 1;
535        dct_linesize_chroma <<= 1;
536    }
537
538    dest_y = frame->data[0] + ((y * dct_linesize_luma)   << 4) + (x << (4 + shift1));
539    dest_u = frame->data[1] + ((y * dct_linesize_chroma) << 4) + (x << (3 + shift1 + ctx->is_444));
540    dest_v = frame->data[2] + ((y * dct_linesize_chroma) << 4) + (x << (3 + shift1 + ctx->is_444));
541
542    if (frame->interlaced_frame && ctx->cur_field) {
543        dest_y += frame->linesize[0];
544        dest_u += frame->linesize[1];
545        dest_v += frame->linesize[2];
546    }
547    if (interlaced_mb) {
548        dct_linesize_luma   <<= 1;
549        dct_linesize_chroma <<= 1;
550    }
551
552    dct_y_offset = interlaced_mb ? frame->linesize[0] : (dct_linesize_luma << 3);
553    dct_x_offset = 8 << shift1;
554    if (!ctx->is_444) {
555        ctx->idsp.idct_put(dest_y,                               dct_linesize_luma, row->blocks[0]);
556        ctx->idsp.idct_put(dest_y + dct_x_offset,                dct_linesize_luma, row->blocks[1]);
557        ctx->idsp.idct_put(dest_y + dct_y_offset,                dct_linesize_luma, row->blocks[4]);
558        ctx->idsp.idct_put(dest_y + dct_y_offset + dct_x_offset, dct_linesize_luma, row->blocks[5]);
559
560        if (!(ctx->avctx->flags & AV_CODEC_FLAG_GRAY)) {
561            dct_y_offset = interlaced_mb ? frame->linesize[1] : (dct_linesize_chroma << 3);
562            ctx->idsp.idct_put(dest_u,                dct_linesize_chroma, row->blocks[2]);
563            ctx->idsp.idct_put(dest_v,                dct_linesize_chroma, row->blocks[3]);
564            ctx->idsp.idct_put(dest_u + dct_y_offset, dct_linesize_chroma, row->blocks[6]);
565            ctx->idsp.idct_put(dest_v + dct_y_offset, dct_linesize_chroma, row->blocks[7]);
566        }
567    } else {
568        ctx->idsp.idct_put(dest_y,                               dct_linesize_luma, row->blocks[0]);
569        ctx->idsp.idct_put(dest_y + dct_x_offset,                dct_linesize_luma, row->blocks[1]);
570        ctx->idsp.idct_put(dest_y + dct_y_offset,                dct_linesize_luma, row->blocks[6]);
571        ctx->idsp.idct_put(dest_y + dct_y_offset + dct_x_offset, dct_linesize_luma, row->blocks[7]);
572
573        if (!(ctx->avctx->flags & AV_CODEC_FLAG_GRAY)) {
574            dct_y_offset = interlaced_mb ? frame->linesize[1] : (dct_linesize_chroma << 3);
575            ctx->idsp.idct_put(dest_u,                               dct_linesize_chroma, row->blocks[2]);
576            ctx->idsp.idct_put(dest_u + dct_x_offset,                dct_linesize_chroma, row->blocks[3]);
577            ctx->idsp.idct_put(dest_u + dct_y_offset,                dct_linesize_chroma, row->blocks[8]);
578            ctx->idsp.idct_put(dest_u + dct_y_offset + dct_x_offset, dct_linesize_chroma, row->blocks[9]);
579            ctx->idsp.idct_put(dest_v,                               dct_linesize_chroma, row->blocks[4]);
580            ctx->idsp.idct_put(dest_v + dct_x_offset,                dct_linesize_chroma, row->blocks[5]);
581            ctx->idsp.idct_put(dest_v + dct_y_offset,                dct_linesize_chroma, row->blocks[10]);
582            ctx->idsp.idct_put(dest_v + dct_y_offset + dct_x_offset, dct_linesize_chroma, row->blocks[11]);
583        }
584    }
585
586    return 0;
587}
588
589static int dnxhd_decode_row(AVCodecContext *avctx, void *data,
590                            int rownb, int threadnb)
591{
592    const DNXHDContext *ctx = avctx->priv_data;
593    uint32_t offset = ctx->mb_scan_index[rownb];
594    RowContext *row = ctx->rows + threadnb;
595    int x, ret;
596
597    row->last_dc[0] =
598    row->last_dc[1] =
599    row->last_dc[2] = 1 << (ctx->bit_depth + 2); // for levels +2^(bitdepth-1)
600    ret = init_get_bits8(&row->gb, ctx->buf + offset, ctx->buf_size - offset);
601    if (ret < 0) {
602        row->errors++;
603        return ret;
604    }
605    for (x = 0; x < ctx->mb_width; x++) {
606        int ret = dnxhd_decode_macroblock(ctx, row, data, x, rownb);
607        if (ret < 0) {
608            row->errors++;
609            return ret;
610        }
611    }
612
613    return 0;
614}
615
616static int dnxhd_decode_frame(AVCodecContext *avctx, AVFrame *picture,
617                              int *got_frame, AVPacket *avpkt)
618{
619    const uint8_t *buf = avpkt->data;
620    int buf_size = avpkt->size;
621    DNXHDContext *ctx = avctx->priv_data;
622    int first_field = 1;
623    int ret, i;
624
625    ff_dlog(avctx, "frame size %d\n", buf_size);
626
627    for (i = 0; i < avctx->thread_count; i++)
628        ctx->rows[i].format = -1;
629
630decode_coding_unit:
631    if ((ret = dnxhd_decode_header(ctx, picture, buf, buf_size, first_field)) < 0)
632        return ret;
633
634    if ((avctx->width || avctx->height) &&
635        (ctx->width != avctx->width || ctx->height != avctx->height)) {
636        av_log(avctx, AV_LOG_WARNING, "frame size changed: %dx%d -> %ux%u\n",
637               avctx->width, avctx->height, ctx->width, ctx->height);
638        first_field = 1;
639    }
640    if (avctx->pix_fmt != AV_PIX_FMT_NONE && avctx->pix_fmt != ctx->pix_fmt) {
641        av_log(avctx, AV_LOG_WARNING, "pix_fmt changed: %s -> %s\n",
642               av_get_pix_fmt_name(avctx->pix_fmt), av_get_pix_fmt_name(ctx->pix_fmt));
643        first_field = 1;
644    }
645
646    avctx->pix_fmt = ctx->pix_fmt;
647    ret = ff_set_dimensions(avctx, ctx->width, ctx->height);
648    if (ret < 0)
649        return ret;
650
651    if (first_field) {
652        if ((ret = ff_thread_get_buffer(avctx, picture, 0)) < 0)
653            return ret;
654        picture->pict_type = AV_PICTURE_TYPE_I;
655        picture->key_frame = 1;
656    }
657
658    ctx->buf_size = buf_size - ctx->data_offset;
659    ctx->buf = buf + ctx->data_offset;
660    avctx->execute2(avctx, dnxhd_decode_row, picture, NULL, ctx->mb_height);
661
662    if (first_field && picture->interlaced_frame) {
663        buf      += ctx->cid_table->coding_unit_size;
664        buf_size -= ctx->cid_table->coding_unit_size;
665        first_field = 0;
666        goto decode_coding_unit;
667    }
668
669    ret = 0;
670    for (i = 0; i < avctx->thread_count; i++) {
671        ret += ctx->rows[i].errors;
672        ctx->rows[i].errors = 0;
673    }
674
675    if (ctx->act) {
676        static int act_warned;
677        int format = ctx->rows[0].format;
678        for (i = 1; i < avctx->thread_count; i++) {
679            if (ctx->rows[i].format != format &&
680                ctx->rows[i].format != -1 /* not run */) {
681                format = 2;
682                break;
683            }
684        }
685        switch (format) {
686        case -1:
687        case 2:
688            if (!act_warned) {
689                act_warned = 1;
690                av_log(ctx->avctx, AV_LOG_ERROR,
691                       "Unsupported: variable ACT flag.\n");
692            }
693            break;
694        case 0:
695            ctx->pix_fmt = ctx->bit_depth==10
696                         ? AV_PIX_FMT_GBRP10 : AV_PIX_FMT_GBRP12;
697            break;
698        case 1:
699            ctx->pix_fmt = ctx->bit_depth==10
700                         ? AV_PIX_FMT_YUV444P10 : AV_PIX_FMT_YUV444P12;
701            break;
702        }
703    }
704    avctx->pix_fmt = ctx->pix_fmt;
705    if (ret) {
706        av_log(ctx->avctx, AV_LOG_ERROR, "%d lines with errors\n", ret);
707        return AVERROR_INVALIDDATA;
708    }
709
710    *got_frame = 1;
711    return avpkt->size;
712}
713
714static av_cold int dnxhd_decode_close(AVCodecContext *avctx)
715{
716    DNXHDContext *ctx = avctx->priv_data;
717
718    ff_free_vlc(&ctx->ac_vlc);
719    ff_free_vlc(&ctx->dc_vlc);
720    ff_free_vlc(&ctx->run_vlc);
721
722    av_freep(&ctx->rows);
723
724    return 0;
725}
726
727const FFCodec ff_dnxhd_decoder = {
728    .p.name         = "dnxhd",
729    .p.long_name    = NULL_IF_CONFIG_SMALL("VC3/DNxHD"),
730    .p.type         = AVMEDIA_TYPE_VIDEO,
731    .p.id           = AV_CODEC_ID_DNXHD,
732    .priv_data_size = sizeof(DNXHDContext),
733    .init           = dnxhd_decode_init,
734    .close          = dnxhd_decode_close,
735    FF_CODEC_DECODE_CB(dnxhd_decode_frame),
736    .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS |
737                      AV_CODEC_CAP_SLICE_THREADS,
738    .p.profiles     = NULL_IF_CONFIG_SMALL(ff_dnxhd_profiles),
739    .caps_internal  = FF_CODEC_CAP_INIT_THREADSAFE,
740};
741