1/*
2 * Copyright (c) 2010-2011 Maxim Poliakovski
3 * Copyright (c) 2010-2011 Elvis Presley
4 *
5 * This file is part of FFmpeg.
6 *
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
11 *
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15 * Lesser General Public License for more details.
16 *
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20 */
21
22/**
23 * @file
24 * Known FOURCCs: 'apch' (HQ), 'apcn' (SD), 'apcs' (LT), 'apco' (Proxy), 'ap4h' (4444), 'ap4x' (4444 XQ)
25 */
26
27//#define DEBUG
28
29#define LONG_BITSTREAM_READER
30
31#include "config_components.h"
32
33#include "libavutil/internal.h"
34#include "libavutil/mem_internal.h"
35
36#include "avcodec.h"
37#include "codec_internal.h"
38#include "get_bits.h"
39#include "hwconfig.h"
40#include "idctdsp.h"
41#include "internal.h"
42#include "profiles.h"
43#include "simple_idct.h"
44#include "proresdec.h"
45#include "proresdata.h"
46#include "thread.h"
47
48static void permute(uint8_t *dst, const uint8_t *src, const uint8_t permutation[64])
49{
50    int i;
51    for (i = 0; i < 64; i++)
52        dst[i] = permutation[src[i]];
53}
54
55#define ALPHA_SHIFT_16_TO_10(alpha_val) (alpha_val >> 6)
56#define ALPHA_SHIFT_8_TO_10(alpha_val)  ((alpha_val << 2) | (alpha_val >> 6))
57#define ALPHA_SHIFT_16_TO_12(alpha_val) (alpha_val >> 4)
58#define ALPHA_SHIFT_8_TO_12(alpha_val)  ((alpha_val << 4) | (alpha_val >> 4))
59
60static void inline unpack_alpha(GetBitContext *gb, uint16_t *dst, int num_coeffs,
61                                const int num_bits, const int decode_precision) {
62    const int mask = (1 << num_bits) - 1;
63    int i, idx, val, alpha_val;
64
65    idx       = 0;
66    alpha_val = mask;
67    do {
68        do {
69            if (get_bits1(gb)) {
70                val = get_bits(gb, num_bits);
71            } else {
72                int sign;
73                val  = get_bits(gb, num_bits == 16 ? 7 : 4);
74                sign = val & 1;
75                val  = (val + 2) >> 1;
76                if (sign)
77                    val = -val;
78            }
79            alpha_val = (alpha_val + val) & mask;
80            if (num_bits == 16) {
81                if (decode_precision == 10) {
82                    dst[idx++] = ALPHA_SHIFT_16_TO_10(alpha_val);
83                } else { /* 12b */
84                    dst[idx++] = ALPHA_SHIFT_16_TO_12(alpha_val);
85                }
86            } else {
87                if (decode_precision == 10) {
88                    dst[idx++] = ALPHA_SHIFT_8_TO_10(alpha_val);
89                } else { /* 12b */
90                    dst[idx++] = ALPHA_SHIFT_8_TO_12(alpha_val);
91                }
92            }
93            if (idx >= num_coeffs)
94                break;
95        } while (get_bits_left(gb)>0 && get_bits1(gb));
96        val = get_bits(gb, 4);
97        if (!val)
98            val = get_bits(gb, 11);
99        if (idx + val > num_coeffs)
100            val = num_coeffs - idx;
101        if (num_bits == 16) {
102            for (i = 0; i < val; i++) {
103                if (decode_precision == 10) {
104                    dst[idx++] = ALPHA_SHIFT_16_TO_10(alpha_val);
105                } else { /* 12b */
106                    dst[idx++] = ALPHA_SHIFT_16_TO_12(alpha_val);
107                }
108            }
109        } else {
110            for (i = 0; i < val; i++) {
111                if (decode_precision == 10) {
112                    dst[idx++] = ALPHA_SHIFT_8_TO_10(alpha_val);
113                } else { /* 12b */
114                    dst[idx++] = ALPHA_SHIFT_8_TO_12(alpha_val);
115                }
116            }
117        }
118    } while (idx < num_coeffs);
119}
120
121static void unpack_alpha_10(GetBitContext *gb, uint16_t *dst, int num_coeffs,
122                            const int num_bits)
123{
124    if (num_bits == 16) {
125        unpack_alpha(gb, dst, num_coeffs, 16, 10);
126    } else { /* 8 bits alpha */
127        unpack_alpha(gb, dst, num_coeffs, 8, 10);
128    }
129}
130
131static void unpack_alpha_12(GetBitContext *gb, uint16_t *dst, int num_coeffs,
132                            const int num_bits)
133{
134    if (num_bits == 16) {
135        unpack_alpha(gb, dst, num_coeffs, 16, 12);
136    } else { /* 8 bits alpha */
137        unpack_alpha(gb, dst, num_coeffs, 8, 12);
138    }
139}
140
141static av_cold int decode_init(AVCodecContext *avctx)
142{
143    int ret = 0;
144    ProresContext *ctx = avctx->priv_data;
145    uint8_t idct_permutation[64];
146
147    avctx->bits_per_raw_sample = 10;
148
149    switch (avctx->codec_tag) {
150    case MKTAG('a','p','c','o'):
151        avctx->profile = FF_PROFILE_PRORES_PROXY;
152        break;
153    case MKTAG('a','p','c','s'):
154        avctx->profile = FF_PROFILE_PRORES_LT;
155        break;
156    case MKTAG('a','p','c','n'):
157        avctx->profile = FF_PROFILE_PRORES_STANDARD;
158        break;
159    case MKTAG('a','p','c','h'):
160        avctx->profile = FF_PROFILE_PRORES_HQ;
161        break;
162    case MKTAG('a','p','4','h'):
163        avctx->profile = FF_PROFILE_PRORES_4444;
164        avctx->bits_per_raw_sample = 12;
165        break;
166    case MKTAG('a','p','4','x'):
167        avctx->profile = FF_PROFILE_PRORES_XQ;
168        avctx->bits_per_raw_sample = 12;
169        break;
170    default:
171        avctx->profile = FF_PROFILE_UNKNOWN;
172        av_log(avctx, AV_LOG_WARNING, "Unknown prores profile %d\n", avctx->codec_tag);
173    }
174
175    if (avctx->bits_per_raw_sample == 10) {
176        av_log(avctx, AV_LOG_DEBUG, "Auto bitdepth precision. Use 10b decoding based on codec tag.\n");
177    } else { /* 12b */
178        av_log(avctx, AV_LOG_DEBUG, "Auto bitdepth precision. Use 12b decoding based on codec tag.\n");
179    }
180
181    ff_blockdsp_init(&ctx->bdsp, avctx);
182    ret = ff_proresdsp_init(&ctx->prodsp, avctx);
183    if (ret < 0) {
184        av_log(avctx, AV_LOG_ERROR, "Fail to init proresdsp for bits per raw sample %d\n", avctx->bits_per_raw_sample);
185        return ret;
186    }
187
188    ff_init_scantable_permutation(idct_permutation,
189                                  ctx->prodsp.idct_permutation_type);
190
191    permute(ctx->progressive_scan, ff_prores_progressive_scan, idct_permutation);
192    permute(ctx->interlaced_scan, ff_prores_interlaced_scan, idct_permutation);
193
194    ctx->pix_fmt = AV_PIX_FMT_NONE;
195
196    if (avctx->bits_per_raw_sample == 10){
197        ctx->unpack_alpha = unpack_alpha_10;
198    } else if (avctx->bits_per_raw_sample == 12){
199        ctx->unpack_alpha = unpack_alpha_12;
200    } else {
201        av_log(avctx, AV_LOG_ERROR, "Fail to set unpack_alpha for bits per raw sample %d\n", avctx->bits_per_raw_sample);
202        return AVERROR_BUG;
203    }
204    return ret;
205}
206
207static int decode_frame_header(ProresContext *ctx, const uint8_t *buf,
208                               const int data_size, AVCodecContext *avctx)
209{
210    int hdr_size, width, height, flags;
211    int version;
212    const uint8_t *ptr;
213    enum AVPixelFormat pix_fmt;
214
215    hdr_size = AV_RB16(buf);
216    ff_dlog(avctx, "header size %d\n", hdr_size);
217    if (hdr_size > data_size) {
218        av_log(avctx, AV_LOG_ERROR, "error, wrong header size\n");
219        return AVERROR_INVALIDDATA;
220    }
221
222    version = AV_RB16(buf + 2);
223    ff_dlog(avctx, "%.4s version %d\n", buf+4, version);
224    if (version > 1) {
225        av_log(avctx, AV_LOG_ERROR, "unsupported version: %d\n", version);
226        return AVERROR_PATCHWELCOME;
227    }
228
229    width  = AV_RB16(buf + 8);
230    height = AV_RB16(buf + 10);
231
232    if (width != avctx->width || height != avctx->height) {
233        int ret;
234
235        av_log(avctx, AV_LOG_WARNING, "picture resolution change: %dx%d -> %dx%d\n",
236               avctx->width, avctx->height, width, height);
237        if ((ret = ff_set_dimensions(avctx, width, height)) < 0)
238            return ret;
239    }
240
241    ctx->frame_type = (buf[12] >> 2) & 3;
242    ctx->alpha_info = buf[17] & 0xf;
243
244    if (ctx->alpha_info > 2) {
245        av_log(avctx, AV_LOG_ERROR, "Invalid alpha mode %d\n", ctx->alpha_info);
246        return AVERROR_INVALIDDATA;
247    }
248    if (avctx->skip_alpha) ctx->alpha_info = 0;
249
250    ff_dlog(avctx, "frame type %d\n", ctx->frame_type);
251
252    if (ctx->frame_type == 0) {
253        ctx->scan = ctx->progressive_scan; // permuted
254    } else {
255        ctx->scan = ctx->interlaced_scan; // permuted
256        ctx->frame->interlaced_frame = 1;
257        ctx->frame->top_field_first = ctx->frame_type == 1;
258    }
259
260    if (ctx->alpha_info) {
261        if (avctx->bits_per_raw_sample == 10) {
262            pix_fmt = (buf[12] & 0xC0) == 0xC0 ? AV_PIX_FMT_YUVA444P10 : AV_PIX_FMT_YUVA422P10;
263        } else { /* 12b */
264            pix_fmt = (buf[12] & 0xC0) == 0xC0 ? AV_PIX_FMT_YUVA444P12 : AV_PIX_FMT_YUVA422P12;
265        }
266    } else {
267        if (avctx->bits_per_raw_sample == 10) {
268            pix_fmt = (buf[12] & 0xC0) == 0xC0 ? AV_PIX_FMT_YUV444P10 : AV_PIX_FMT_YUV422P10;
269        } else { /* 12b */
270            pix_fmt = (buf[12] & 0xC0) == 0xC0 ? AV_PIX_FMT_YUV444P12 : AV_PIX_FMT_YUV422P12;
271        }
272    }
273
274    if (pix_fmt != ctx->pix_fmt) {
275#define HWACCEL_MAX (CONFIG_PRORES_VIDEOTOOLBOX_HWACCEL)
276        enum AVPixelFormat pix_fmts[HWACCEL_MAX + 2], *fmtp = pix_fmts;
277        int ret;
278
279        ctx->pix_fmt = pix_fmt;
280
281#if CONFIG_PRORES_VIDEOTOOLBOX_HWACCEL
282        *fmtp++ = AV_PIX_FMT_VIDEOTOOLBOX;
283#endif
284        *fmtp++ = ctx->pix_fmt;
285        *fmtp = AV_PIX_FMT_NONE;
286
287        if ((ret = ff_thread_get_format(avctx, pix_fmts)) < 0)
288            return ret;
289
290        avctx->pix_fmt = ret;
291    }
292
293    avctx->color_primaries = buf[14];
294    avctx->color_trc       = buf[15];
295    avctx->colorspace      = buf[16];
296    avctx->color_range     = AVCOL_RANGE_MPEG;
297
298    ptr   = buf + 20;
299    flags = buf[19];
300    ff_dlog(avctx, "flags %x\n", flags);
301
302    if (flags & 2) {
303        if(buf + data_size - ptr < 64) {
304            av_log(avctx, AV_LOG_ERROR, "Header truncated\n");
305            return AVERROR_INVALIDDATA;
306        }
307        permute(ctx->qmat_luma, ctx->prodsp.idct_permutation, ptr);
308        ptr += 64;
309    } else {
310        memset(ctx->qmat_luma, 4, 64);
311    }
312
313    if (flags & 1) {
314        if(buf + data_size - ptr < 64) {
315            av_log(avctx, AV_LOG_ERROR, "Header truncated\n");
316            return AVERROR_INVALIDDATA;
317        }
318        permute(ctx->qmat_chroma, ctx->prodsp.idct_permutation, ptr);
319    } else {
320        memcpy(ctx->qmat_chroma, ctx->qmat_luma, 64);
321    }
322
323    return hdr_size;
324}
325
326static int decode_picture_header(AVCodecContext *avctx, const uint8_t *buf, const int buf_size)
327{
328    ProresContext *ctx = avctx->priv_data;
329    int i, hdr_size, slice_count;
330    unsigned pic_data_size;
331    int log2_slice_mb_width, log2_slice_mb_height;
332    int slice_mb_count, mb_x, mb_y;
333    const uint8_t *data_ptr, *index_ptr;
334
335    hdr_size = buf[0] >> 3;
336    if (hdr_size < 8 || hdr_size > buf_size) {
337        av_log(avctx, AV_LOG_ERROR, "error, wrong picture header size\n");
338        return AVERROR_INVALIDDATA;
339    }
340
341    pic_data_size = AV_RB32(buf + 1);
342    if (pic_data_size > buf_size) {
343        av_log(avctx, AV_LOG_ERROR, "error, wrong picture data size\n");
344        return AVERROR_INVALIDDATA;
345    }
346
347    log2_slice_mb_width  = buf[7] >> 4;
348    log2_slice_mb_height = buf[7] & 0xF;
349    if (log2_slice_mb_width > 3 || log2_slice_mb_height) {
350        av_log(avctx, AV_LOG_ERROR, "unsupported slice resolution: %dx%d\n",
351               1 << log2_slice_mb_width, 1 << log2_slice_mb_height);
352        return AVERROR_INVALIDDATA;
353    }
354
355    ctx->mb_width  = (avctx->width  + 15) >> 4;
356    if (ctx->frame_type)
357        ctx->mb_height = (avctx->height + 31) >> 5;
358    else
359        ctx->mb_height = (avctx->height + 15) >> 4;
360
361    // QT ignores the written value
362    // slice_count = AV_RB16(buf + 5);
363    slice_count = ctx->mb_height * ((ctx->mb_width >> log2_slice_mb_width) +
364                                    av_popcount(ctx->mb_width & (1 << log2_slice_mb_width) - 1));
365
366    if (ctx->slice_count != slice_count || !ctx->slices) {
367        av_freep(&ctx->slices);
368        ctx->slice_count = 0;
369        ctx->slices = av_calloc(slice_count, sizeof(*ctx->slices));
370        if (!ctx->slices)
371            return AVERROR(ENOMEM);
372        ctx->slice_count = slice_count;
373    }
374
375    if (!slice_count)
376        return AVERROR(EINVAL);
377
378    if (hdr_size + slice_count*2 > buf_size) {
379        av_log(avctx, AV_LOG_ERROR, "error, wrong slice count\n");
380        return AVERROR_INVALIDDATA;
381    }
382
383    // parse slice information
384    index_ptr = buf + hdr_size;
385    data_ptr  = index_ptr + slice_count*2;
386
387    slice_mb_count = 1 << log2_slice_mb_width;
388    mb_x = 0;
389    mb_y = 0;
390
391    for (i = 0; i < slice_count; i++) {
392        SliceContext *slice = &ctx->slices[i];
393
394        slice->data = data_ptr;
395        data_ptr += AV_RB16(index_ptr + i*2);
396
397        while (ctx->mb_width - mb_x < slice_mb_count)
398            slice_mb_count >>= 1;
399
400        slice->mb_x = mb_x;
401        slice->mb_y = mb_y;
402        slice->mb_count = slice_mb_count;
403        slice->data_size = data_ptr - slice->data;
404
405        if (slice->data_size < 6) {
406            av_log(avctx, AV_LOG_ERROR, "error, wrong slice data size\n");
407            return AVERROR_INVALIDDATA;
408        }
409
410        mb_x += slice_mb_count;
411        if (mb_x == ctx->mb_width) {
412            slice_mb_count = 1 << log2_slice_mb_width;
413            mb_x = 0;
414            mb_y++;
415        }
416        if (data_ptr > buf + buf_size) {
417            av_log(avctx, AV_LOG_ERROR, "error, slice out of bounds\n");
418            return AVERROR_INVALIDDATA;
419        }
420    }
421
422    if (mb_x || mb_y != ctx->mb_height) {
423        av_log(avctx, AV_LOG_ERROR, "error wrong mb count y %d h %d\n",
424               mb_y, ctx->mb_height);
425        return AVERROR_INVALIDDATA;
426    }
427
428    return pic_data_size;
429}
430
431#define DECODE_CODEWORD(val, codebook, SKIP)                            \
432    do {                                                                \
433        unsigned int rice_order, exp_order, switch_bits;                \
434        unsigned int q, buf, bits;                                      \
435                                                                        \
436        UPDATE_CACHE(re, gb);                                           \
437        buf = GET_CACHE(re, gb);                                        \
438                                                                        \
439        /* number of bits to switch between rice and exp golomb */      \
440        switch_bits =  codebook & 3;                                    \
441        rice_order  =  codebook >> 5;                                   \
442        exp_order   = (codebook >> 2) & 7;                              \
443                                                                        \
444        q = 31 - av_log2(buf);                                          \
445                                                                        \
446        if (q > switch_bits) { /* exp golomb */                         \
447            bits = exp_order - switch_bits + (q<<1);                    \
448            if (bits > FFMIN(MIN_CACHE_BITS, 31))                       \
449                return AVERROR_INVALIDDATA;                             \
450            val = SHOW_UBITS(re, gb, bits) - (1 << exp_order) +         \
451                ((switch_bits + 1) << rice_order);                      \
452            SKIP(re, gb, bits);                                         \
453        } else if (rice_order) {                                        \
454            SKIP_BITS(re, gb, q+1);                                     \
455            val = (q << rice_order) + SHOW_UBITS(re, gb, rice_order);   \
456            SKIP(re, gb, rice_order);                                   \
457        } else {                                                        \
458            val = q;                                                    \
459            SKIP(re, gb, q+1);                                          \
460        }                                                               \
461    } while (0)
462
463#define TOSIGNED(x) (((x) >> 1) ^ (-((x) & 1)))
464
465#define FIRST_DC_CB 0xB8
466
467static const uint8_t dc_codebook[7] = { 0x04, 0x28, 0x28, 0x4D, 0x4D, 0x70, 0x70};
468
469static av_always_inline int decode_dc_coeffs(GetBitContext *gb, int16_t *out,
470                                              int blocks_per_slice)
471{
472    int16_t prev_dc;
473    int code, i, sign;
474
475    OPEN_READER(re, gb);
476
477    DECODE_CODEWORD(code, FIRST_DC_CB, LAST_SKIP_BITS);
478    prev_dc = TOSIGNED(code);
479    out[0] = prev_dc;
480
481    out += 64; // dc coeff for the next block
482
483    code = 5;
484    sign = 0;
485    for (i = 1; i < blocks_per_slice; i++, out += 64) {
486        DECODE_CODEWORD(code, dc_codebook[FFMIN(code, 6U)], LAST_SKIP_BITS);
487        if(code) sign ^= -(code & 1);
488        else     sign  = 0;
489        prev_dc += (((code + 1) >> 1) ^ sign) - sign;
490        out[0] = prev_dc;
491    }
492    CLOSE_READER(re, gb);
493    return 0;
494}
495
496// adaptive codebook switching lut according to previous run/level values
497static const uint8_t run_to_cb[16] = { 0x06, 0x06, 0x05, 0x05, 0x04, 0x29, 0x29, 0x29, 0x29, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x4C };
498static const uint8_t lev_to_cb[10] = { 0x04, 0x0A, 0x05, 0x06, 0x04, 0x28, 0x28, 0x28, 0x28, 0x4C };
499
500static av_always_inline int decode_ac_coeffs(AVCodecContext *avctx, GetBitContext *gb,
501                                             int16_t *out, int blocks_per_slice)
502{
503    ProresContext *ctx = avctx->priv_data;
504    int block_mask, sign;
505    unsigned pos, run, level;
506    int max_coeffs, i, bits_left;
507    int log2_block_count = av_log2(blocks_per_slice);
508
509    OPEN_READER(re, gb);
510    UPDATE_CACHE(re, gb);                                           \
511    run   = 4;
512    level = 2;
513
514    max_coeffs = 64 << log2_block_count;
515    block_mask = blocks_per_slice - 1;
516
517    for (pos = block_mask;;) {
518        bits_left = gb->size_in_bits - re_index;
519        if (!bits_left || (bits_left < 32 && !SHOW_UBITS(re, gb, bits_left)))
520            break;
521
522        DECODE_CODEWORD(run, run_to_cb[FFMIN(run,  15)], LAST_SKIP_BITS);
523        pos += run + 1;
524        if (pos >= max_coeffs) {
525            av_log(avctx, AV_LOG_ERROR, "ac tex damaged %d, %d\n", pos, max_coeffs);
526            return AVERROR_INVALIDDATA;
527        }
528
529        DECODE_CODEWORD(level, lev_to_cb[FFMIN(level, 9)], SKIP_BITS);
530        level += 1;
531
532        i = pos >> log2_block_count;
533
534        sign = SHOW_SBITS(re, gb, 1);
535        SKIP_BITS(re, gb, 1);
536        out[((pos & block_mask) << 6) + ctx->scan[i]] = ((level ^ sign) - sign);
537    }
538
539    CLOSE_READER(re, gb);
540    return 0;
541}
542
543static int decode_slice_luma(AVCodecContext *avctx, SliceContext *slice,
544                             uint16_t *dst, int dst_stride,
545                             const uint8_t *buf, unsigned buf_size,
546                             const int16_t *qmat)
547{
548    ProresContext *ctx = avctx->priv_data;
549    LOCAL_ALIGNED_32(int16_t, blocks, [8*4*64]);
550    int16_t *block;
551    GetBitContext gb;
552    int i, blocks_per_slice = slice->mb_count<<2;
553    int ret;
554
555    for (i = 0; i < blocks_per_slice; i++)
556        ctx->bdsp.clear_block(blocks+(i<<6));
557
558    init_get_bits(&gb, buf, buf_size << 3);
559
560    if ((ret = decode_dc_coeffs(&gb, blocks, blocks_per_slice)) < 0)
561        return ret;
562    if ((ret = decode_ac_coeffs(avctx, &gb, blocks, blocks_per_slice)) < 0)
563        return ret;
564
565    block = blocks;
566    for (i = 0; i < slice->mb_count; i++) {
567        ctx->prodsp.idct_put(dst, dst_stride, block+(0<<6), qmat);
568        ctx->prodsp.idct_put(dst             +8, dst_stride, block+(1<<6), qmat);
569        ctx->prodsp.idct_put(dst+4*dst_stride  , dst_stride, block+(2<<6), qmat);
570        ctx->prodsp.idct_put(dst+4*dst_stride+8, dst_stride, block+(3<<6), qmat);
571        block += 4*64;
572        dst += 16;
573    }
574    return 0;
575}
576
577static int decode_slice_chroma(AVCodecContext *avctx, SliceContext *slice,
578                               uint16_t *dst, int dst_stride,
579                               const uint8_t *buf, unsigned buf_size,
580                               const int16_t *qmat, int log2_blocks_per_mb)
581{
582    ProresContext *ctx = avctx->priv_data;
583    LOCAL_ALIGNED_32(int16_t, blocks, [8*4*64]);
584    int16_t *block;
585    GetBitContext gb;
586    int i, j, blocks_per_slice = slice->mb_count << log2_blocks_per_mb;
587    int ret;
588
589    for (i = 0; i < blocks_per_slice; i++)
590        ctx->bdsp.clear_block(blocks+(i<<6));
591
592    init_get_bits(&gb, buf, buf_size << 3);
593
594    if ((ret = decode_dc_coeffs(&gb, blocks, blocks_per_slice)) < 0)
595        return ret;
596    if ((ret = decode_ac_coeffs(avctx, &gb, blocks, blocks_per_slice)) < 0)
597        return ret;
598
599    block = blocks;
600    for (i = 0; i < slice->mb_count; i++) {
601        for (j = 0; j < log2_blocks_per_mb; j++) {
602            ctx->prodsp.idct_put(dst,              dst_stride, block+(0<<6), qmat);
603            ctx->prodsp.idct_put(dst+4*dst_stride, dst_stride, block+(1<<6), qmat);
604            block += 2*64;
605            dst += 8;
606        }
607    }
608    return 0;
609}
610
611/**
612 * Decode alpha slice plane.
613 */
614static void decode_slice_alpha(ProresContext *ctx,
615                               uint16_t *dst, int dst_stride,
616                               const uint8_t *buf, int buf_size,
617                               int blocks_per_slice)
618{
619    GetBitContext gb;
620    int i;
621    LOCAL_ALIGNED_32(int16_t, blocks, [8*4*64]);
622    int16_t *block;
623
624    for (i = 0; i < blocks_per_slice<<2; i++)
625        ctx->bdsp.clear_block(blocks+(i<<6));
626
627    init_get_bits(&gb, buf, buf_size << 3);
628
629    if (ctx->alpha_info == 2) {
630        ctx->unpack_alpha(&gb, blocks, blocks_per_slice * 4 * 64, 16);
631    } else {
632        ctx->unpack_alpha(&gb, blocks, blocks_per_slice * 4 * 64, 8);
633    }
634
635    block = blocks;
636
637    for (i = 0; i < 16; i++) {
638        memcpy(dst, block, 16 * blocks_per_slice * sizeof(*dst));
639        dst   += dst_stride >> 1;
640        block += 16 * blocks_per_slice;
641    }
642}
643
644static int decode_slice_thread(AVCodecContext *avctx, void *arg, int jobnr, int threadnr)
645{
646    ProresContext *ctx = avctx->priv_data;
647    SliceContext *slice = &ctx->slices[jobnr];
648    const uint8_t *buf = slice->data;
649    AVFrame *pic = ctx->frame;
650    int i, hdr_size, qscale, log2_chroma_blocks_per_mb;
651    int luma_stride, chroma_stride;
652    int y_data_size, u_data_size, v_data_size, a_data_size, offset;
653    uint8_t *dest_y, *dest_u, *dest_v;
654    LOCAL_ALIGNED_16(int16_t, qmat_luma_scaled,  [64]);
655    LOCAL_ALIGNED_16(int16_t, qmat_chroma_scaled,[64]);
656    int mb_x_shift;
657    int ret;
658    uint16_t val_no_chroma;
659
660    slice->ret = -1;
661    //av_log(avctx, AV_LOG_INFO, "slice %d mb width %d mb x %d y %d\n",
662    //       jobnr, slice->mb_count, slice->mb_x, slice->mb_y);
663
664    // slice header
665    hdr_size = buf[0] >> 3;
666    qscale = av_clip(buf[1], 1, 224);
667    qscale = qscale > 128 ? qscale - 96 << 2: qscale;
668    y_data_size = AV_RB16(buf + 2);
669    u_data_size = AV_RB16(buf + 4);
670    v_data_size = slice->data_size - y_data_size - u_data_size - hdr_size;
671    if (hdr_size > 7) v_data_size = AV_RB16(buf + 6);
672    a_data_size = slice->data_size - y_data_size - u_data_size -
673                  v_data_size - hdr_size;
674
675    if (y_data_size < 0 || u_data_size < 0 || v_data_size < 0
676        || hdr_size+y_data_size+u_data_size+v_data_size > slice->data_size){
677        av_log(avctx, AV_LOG_ERROR, "invalid plane data size\n");
678        return AVERROR_INVALIDDATA;
679    }
680
681    buf += hdr_size;
682
683    for (i = 0; i < 64; i++) {
684        qmat_luma_scaled  [i] = ctx->qmat_luma  [i] * qscale;
685        qmat_chroma_scaled[i] = ctx->qmat_chroma[i] * qscale;
686    }
687
688    if (ctx->frame_type == 0) {
689        luma_stride   = pic->linesize[0];
690        chroma_stride = pic->linesize[1];
691    } else {
692        luma_stride   = pic->linesize[0] << 1;
693        chroma_stride = pic->linesize[1] << 1;
694    }
695
696    if (avctx->pix_fmt == AV_PIX_FMT_YUV444P10 || avctx->pix_fmt == AV_PIX_FMT_YUVA444P10 ||
697        avctx->pix_fmt == AV_PIX_FMT_YUV444P12 || avctx->pix_fmt == AV_PIX_FMT_YUVA444P12) {
698        mb_x_shift = 5;
699        log2_chroma_blocks_per_mb = 2;
700    } else {
701        mb_x_shift = 4;
702        log2_chroma_blocks_per_mb = 1;
703    }
704
705    offset = (slice->mb_y << 4) * luma_stride + (slice->mb_x << 5);
706    dest_y = pic->data[0] + offset;
707    dest_u = pic->data[1] + (slice->mb_y << 4) * chroma_stride + (slice->mb_x << mb_x_shift);
708    dest_v = pic->data[2] + (slice->mb_y << 4) * chroma_stride + (slice->mb_x << mb_x_shift);
709
710    if (ctx->frame_type && ctx->first_field ^ ctx->frame->top_field_first) {
711        dest_y += pic->linesize[0];
712        dest_u += pic->linesize[1];
713        dest_v += pic->linesize[2];
714        offset += pic->linesize[3];
715    }
716
717    ret = decode_slice_luma(avctx, slice, (uint16_t*)dest_y, luma_stride,
718                            buf, y_data_size, qmat_luma_scaled);
719    if (ret < 0)
720        return ret;
721
722    if (!(avctx->flags & AV_CODEC_FLAG_GRAY) && (u_data_size + v_data_size) > 0) {
723        ret = decode_slice_chroma(avctx, slice, (uint16_t*)dest_u, chroma_stride,
724                                  buf + y_data_size, u_data_size,
725                                  qmat_chroma_scaled, log2_chroma_blocks_per_mb);
726        if (ret < 0)
727            return ret;
728
729        ret = decode_slice_chroma(avctx, slice, (uint16_t*)dest_v, chroma_stride,
730                                  buf + y_data_size + u_data_size, v_data_size,
731                                  qmat_chroma_scaled, log2_chroma_blocks_per_mb);
732        if (ret < 0)
733            return ret;
734    }
735    else {
736        size_t mb_max_x = slice->mb_count << (mb_x_shift - 1);
737        size_t i, j;
738        if (avctx->bits_per_raw_sample == 10) {
739            val_no_chroma = 511;
740        } else { /* 12b */
741            val_no_chroma = 511 * 4;
742        }
743        for (i = 0; i < 16; ++i)
744            for (j = 0; j < mb_max_x; ++j) {
745                *(uint16_t*)(dest_u + (i * chroma_stride) + (j << 1)) = val_no_chroma;
746                *(uint16_t*)(dest_v + (i * chroma_stride) + (j << 1)) = val_no_chroma;
747            }
748    }
749
750    /* decode alpha plane if available */
751    if (ctx->alpha_info && pic->data[3] && a_data_size) {
752        uint8_t *dest_a = pic->data[3] + offset;
753        decode_slice_alpha(ctx, (uint16_t*)dest_a, luma_stride,
754                           buf + y_data_size + u_data_size + v_data_size,
755                           a_data_size, slice->mb_count);
756    }
757
758    slice->ret = 0;
759    return 0;
760}
761
762static int decode_picture(AVCodecContext *avctx)
763{
764    ProresContext *ctx = avctx->priv_data;
765    int i;
766    int error = 0;
767
768    avctx->execute2(avctx, decode_slice_thread, NULL, NULL, ctx->slice_count);
769
770    for (i = 0; i < ctx->slice_count; i++)
771        error += ctx->slices[i].ret < 0;
772
773    if (error)
774        ctx->frame->decode_error_flags = FF_DECODE_ERROR_INVALID_BITSTREAM;
775    if (error < ctx->slice_count)
776        return 0;
777
778    return ctx->slices[0].ret;
779}
780
781static int decode_frame(AVCodecContext *avctx, AVFrame *frame,
782                        int *got_frame, AVPacket *avpkt)
783{
784    ProresContext *ctx = avctx->priv_data;
785    const uint8_t *buf = avpkt->data;
786    int buf_size = avpkt->size;
787    int frame_hdr_size, pic_size, ret;
788
789    if (buf_size < 28 || AV_RL32(buf + 4) != AV_RL32("icpf")) {
790        av_log(avctx, AV_LOG_ERROR, "invalid frame header\n");
791        return AVERROR_INVALIDDATA;
792    }
793
794    ctx->frame = frame;
795    ctx->frame->pict_type = AV_PICTURE_TYPE_I;
796    ctx->frame->key_frame = 1;
797    ctx->first_field = 1;
798
799    buf += 8;
800    buf_size -= 8;
801
802    frame_hdr_size = decode_frame_header(ctx, buf, buf_size, avctx);
803    if (frame_hdr_size < 0)
804        return frame_hdr_size;
805
806    buf += frame_hdr_size;
807    buf_size -= frame_hdr_size;
808
809    if ((ret = ff_thread_get_buffer(avctx, frame, 0)) < 0)
810        return ret;
811    ff_thread_finish_setup(avctx);
812
813    if (avctx->hwaccel) {
814        ret = avctx->hwaccel->start_frame(avctx, NULL, 0);
815        if (ret < 0)
816            return ret;
817        ret = avctx->hwaccel->decode_slice(avctx, avpkt->data, avpkt->size);
818        if (ret < 0)
819            return ret;
820        ret = avctx->hwaccel->end_frame(avctx);
821        if (ret < 0)
822            return ret;
823        goto finish;
824    }
825
826 decode_picture:
827    pic_size = decode_picture_header(avctx, buf, buf_size);
828    if (pic_size < 0) {
829        av_log(avctx, AV_LOG_ERROR, "error decoding picture header\n");
830        return pic_size;
831    }
832
833    if ((ret = decode_picture(avctx)) < 0) {
834        av_log(avctx, AV_LOG_ERROR, "error decoding picture\n");
835        return ret;
836    }
837
838    buf += pic_size;
839    buf_size -= pic_size;
840
841    if (ctx->frame_type && buf_size > 0 && ctx->first_field) {
842        ctx->first_field = 0;
843        goto decode_picture;
844    }
845
846finish:
847    *got_frame      = 1;
848
849    return avpkt->size;
850}
851
852static av_cold int decode_close(AVCodecContext *avctx)
853{
854    ProresContext *ctx = avctx->priv_data;
855
856    av_freep(&ctx->slices);
857
858    return 0;
859}
860
861#if HAVE_THREADS
862static int update_thread_context(AVCodecContext *dst, const AVCodecContext *src)
863{
864    ProresContext *csrc = src->priv_data;
865    ProresContext *cdst = dst->priv_data;
866
867    cdst->pix_fmt = csrc->pix_fmt;
868
869    return 0;
870}
871#endif
872
873const FFCodec ff_prores_decoder = {
874    .p.name         = "prores",
875    .p.long_name    = NULL_IF_CONFIG_SMALL("Apple ProRes (iCodec Pro)"),
876    .p.type         = AVMEDIA_TYPE_VIDEO,
877    .p.id           = AV_CODEC_ID_PRORES,
878    .priv_data_size = sizeof(ProresContext),
879    .init           = decode_init,
880    .close          = decode_close,
881    FF_CODEC_DECODE_CB(decode_frame),
882    .update_thread_context = ONLY_IF_THREADS_ENABLED(update_thread_context),
883    .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_SLICE_THREADS | AV_CODEC_CAP_FRAME_THREADS,
884    .p.profiles     = NULL_IF_CONFIG_SMALL(ff_prores_profiles),
885    .caps_internal  = FF_CODEC_CAP_INIT_THREADSAFE,
886    .hw_configs     = (const AVCodecHWConfigInternal *const []) {
887#if CONFIG_PRORES_VIDEOTOOLBOX_HWACCEL
888        HWACCEL_VIDEOTOOLBOX(prores),
889#endif
890        NULL
891    },
892};
893