[deb_ffmpeg.git] / ffmpeg / libavcodec / proresenc_anatoliy.c

/*
 * Apple ProRes encoder
 *
 * Copyright (c) 2011 Anatoliy Wasserman
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * Apple ProRes encoder (Anatoliy Wasserman version)
 * Known FOURCCs: 'apch' (HQ), 'apcn' (SD), 'apcs' (LT), 'apco' (Proxy)
 */

#include "avcodec.h"
#include "dct.h"
#include "internal.h"
#include "put_bits.h"
#include "bytestream.h"
#include "fdctdsp.h"

#define DEFAULT_SLICE_MB_WIDTH 8

#define FF_PROFILE_PRORES_PROXY     0
#define FF_PROFILE_PRORES_LT        1
#define FF_PROFILE_PRORES_STANDARD  2
#define FF_PROFILE_PRORES_HQ        3

/* Profiles offered by the encoder. prores_encode_init() indexes this table
 * directly with avctx->profile and stores the entry's name as the codec
 * tag, so entries must stay in profile-id order. */
static const AVProfile profiles[] = {
    { FF_PROFILE_PRORES_PROXY,    "apco"},
    { FF_PROFILE_PRORES_LT,       "apcs"},
    { FF_PROFILE_PRORES_STANDARD, "apcn"},
    { FF_PROFILE_PRORES_HQ,       "apch"},
    { FF_PROFILE_UNKNOWN }
};

/* Per-profile tuning tables, indexed by profile id (PROXY, LT, STANDARD, HQ). */

/* Quantiser a picture starts with; also the lowest value rate control uses. */
static const int qp_start_table[4] = { 4, 1, 1, 1 };
/* Highest quantiser rate control may raise a slice to. */
static const int qp_end_table[4]   = { 8, 9, 6, 6 };
/* Rate target: encode_slice() aims at (mb_count * value) >> 2 bits per slice. */
static const int bitrate_table[4]  = { 1000, 2100, 3500, 5400 };

/* Order in which encode_ac_coeffs() visits the 64 coefficient positions of
 * an 8x8 block. Entry 0 is skipped there because the DC coefficient is
 * coded separately. */
static const uint8_t progressive_scan[64] = {
     0,  1,  8,  9,  2,  3, 10, 11,
    16, 17, 24, 25, 18, 19, 26, 27,
     4,  5, 12, 20, 13,  6,  7, 14,
    21, 28, 29, 22, 15, 23, 30, 31,
    32, 33, 40, 48, 41, 34, 35, 42,
    49, 56, 57, 50, 43, 36, 37, 44,
    51, 58, 59, 52, 45, 38, 39, 46,
    53, 60, 61, 54, 47, 55, 62, 63
};

/* Base luma quantisation matrices, one per profile (indexed by profile id).
 * The selected matrix is copied verbatim into every frame header and is
 * multiplied by 1..16 in prores_encode_init() to build the per-quantiser
 * tables. */
static const uint8_t QMAT_LUMA[4][64] = {
    {
         4,  7,  9, 11, 13, 14, 15, 63,
         7,  7, 11, 12, 14, 15, 63, 63,
         9, 11, 13, 14, 15, 63, 63, 63,
        11, 11, 13, 14, 63, 63, 63, 63,
        11, 13, 14, 63, 63, 63, 63, 63,
        13, 14, 63, 63, 63, 63, 63, 63,
        13, 63, 63, 63, 63, 63, 63, 63,
        63, 63, 63, 63, 63, 63, 63, 63
    }, {
         4,  5,  6,  7,  9, 11, 13, 15,
         5,  5,  7,  8, 11, 13, 15, 17,
         6,  7,  9, 11, 13, 15, 15, 17,
         7,  7,  9, 11, 13, 15, 17, 19,
         7,  9, 11, 13, 14, 16, 19, 23,
         9, 11, 13, 14, 16, 19, 23, 29,
         9, 11, 13, 15, 17, 21, 28, 35,
        11, 13, 16, 17, 21, 28, 35, 41
    }, {
         4,  4,  5,  5,  6,  7,  7,  9,
         4,  4,  5,  6,  7,  7,  9,  9,
         5,  5,  6,  7,  7,  9,  9, 10,
         5,  5,  6,  7,  7,  9,  9, 10,
         5,  6,  7,  7,  8,  9, 10, 12,
         6,  7,  7,  8,  9, 10, 12, 15,
         6,  7,  7,  9, 10, 11, 14, 17,
         7,  7,  9, 10, 11, 14, 17, 21
    }, {
         4,  4,  4,  4,  4,  4,  4,  4,
         4,  4,  4,  4,  4,  4,  4,  4,
         4,  4,  4,  4,  4,  4,  4,  4,
         4,  4,  4,  4,  4,  4,  4,  5,
         4,  4,  4,  4,  4,  4,  5,  5,
         4,  4,  4,  4,  4,  5,  5,  6,
         4,  4,  4,  4,  5,  5,  6,  7,
         4,  4,  4,  4,  5,  6,  7,  7
    }
};

/* Base chroma quantisation matrices, one per profile (indexed by profile
 * id). The selected matrix is copied verbatim into every frame header after
 * the luma matrix and is multiplied by 1..16 in prores_encode_init() to
 * build the per-quantiser tables. */
static const uint8_t QMAT_CHROMA[4][64] = {
    {
         4,  7,  9, 11, 13, 14, 63, 63,
         7,  7, 11, 12, 14, 63, 63, 63,
         9, 11, 13, 14, 63, 63, 63, 63,
        11, 11, 13, 14, 63, 63, 63, 63,
        11, 13, 14, 63, 63, 63, 63, 63,
        13, 14, 63, 63, 63, 63, 63, 63,
        13, 63, 63, 63, 63, 63, 63, 63,
        63, 63, 63, 63, 63, 63, 63, 63
    }, {
         4,  5,  6,  7,  9, 11, 13, 15,
         5,  5,  7,  8, 11, 13, 15, 17,
         6,  7,  9, 11, 13, 15, 15, 17,
         7,  7,  9, 11, 13, 15, 17, 19,
         7,  9, 11, 13, 14, 16, 19, 23,
         9, 11, 13, 14, 16, 19, 23, 29,
         9, 11, 13, 15, 17, 21, 28, 35,
        11, 13, 16, 17, 21, 28, 35, 41
    }, {
         4,  4,  5,  5,  6,  7,  7,  9,
         4,  4,  5,  6,  7,  7,  9,  9,
         5,  5,  6,  7,  7,  9,  9, 10,
         5,  5,  6,  7,  7,  9,  9, 10,
         5,  6,  7,  7,  8,  9, 10, 12,
         6,  7,  7,  8,  9, 10, 12, 15,
         6,  7,  7,  9, 10, 11, 14, 17,
         7,  7,  9, 10, 11, 14, 17, 21
    }, {
         4,  4,  4,  4,  4,  4,  4,  4,
         4,  4,  4,  4,  4,  4,  4,  4,
         4,  4,  4,  4,  4,  4,  4,  4,
         4,  4,  4,  4,  4,  4,  4,  5,
         4,  4,  4,  4,  4,  4,  5,  5,
         4,  4,  4,  4,  4,  5,  5,  6,
         4,  4,  4,  4,  5,  5,  6,  7,
         4,  4,  4,  4,  5,  6,  7,  7
    }
};


/* Private encoder state, stored in AVCodecContext.priv_data. */
typedef struct {
    /* DCT function table set up by ff_fdctdsp_init() in prores_encode_init(). */
    FDCTDSPContext fdsp;
    /* Scratch planes used for slices that touch a picture edge that is not
     * a multiple of 16. fill_y owns the single allocation; fill_u and fill_v
     * point into it. Left unset when both dimensions are multiples of 16. */
    uint8_t* fill_y;
    uint8_t* fill_u;
    uint8_t* fill_v;

    /* Base matrices of the active profile multiplied by 1..16; row qp - 1
     * is the table used for quantiser value qp. */
    int qmat_luma[16][64];
    int qmat_chroma[16][64];
} ProresContext;

/**
 * Write one value with the hybrid Rice / exp-Golomb code selected by a
 * codebook descriptor.
 *
 * Descriptor layout: bits 0-1 are switch_bits, bits 2-4 the exp-Golomb
 * order, the bits above that the Rice order. Values below
 * (switch_bits + 1) << rice_order are Rice coded, all others exp-Golomb
 * coded.
 *
 * @param pb       bit writer receiving the code
 * @param val      value to encode (compared as unsigned against the
 *                 switch threshold)
 * @param codebook codebook descriptor
 */
static void encode_codeword(PutBitContext *pb, int val, int codebook)
{
    const unsigned int sw_bits   = codebook & 3;
    const unsigned int rice_ord  = codebook >> 5;
    const unsigned int exp_ord   = (codebook >> 2) & 7;
    const unsigned int threshold = ((sw_bits + 1) << rice_ord);

    if (val >= threshold) {
        /* exp-Golomb: zero prefix, then the value including its top bit */
        unsigned int msb, prefix_len;

        val -= threshold;
        val += (1 << exp_ord);
        msb        = av_log2(val);
        prefix_len = msb - exp_ord + sw_bits + 1;
        put_bits(pb, prefix_len, 0);
        put_bits(pb, msb + 1, val);
        return;
    }

    /* Rice: unary quotient, stop bit, then rice_ord remainder bits.
     * With rice_ord == 0 the quotient is val itself and no remainder
     * is written. */
    put_bits(pb, (val >> rice_ord), 0);
    put_bits(pb, 1, 1);
    if (rice_ord) {
        const unsigned int low_mask = (1 << rice_ord) - 1;
        put_bits(pb, rice_ord, val & low_mask);
    }
}

/* Quantise: divide val by entry ind of the quantisation matrix qmat. */
#define QSCALE(qmat,ind,val) ((val) / ((qmat)[ind]))
/* Fold a signed value into a non-negative code: 0, -1, 1, -2, ... map to
 * 0, 1, 2, 3, ... (relies on val >> 31 yielding 0 or -1). */
#define TO_GOLOMB(val) (((val) << 1) ^ ((val) >> 31))
/* 0 when the sign mask of val equals sign (itself 0 or -1), -1 otherwise. */
#define DIFF_SIGN(val, sign) (((val) >> 31) ^ (sign))
/* 1 when val is negative, 0 otherwise. */
#define IS_NEGATIVE(val) ((((val) >> 31) ^ -1) + 1)
/* 0 for val == 0, otherwise 2 * val + sign. */
#define TO_GOLOMB2(val,sign) ((val)==0 ? 0 : ((val) << 1) + (sign))

/** Return the magnitude (absolute value) of val. */
static av_always_inline int get_level(int val)
{
    return val < 0 ? -val : val;
}

/* Codebook descriptor used for the first DC coefficient of a slice. */
#define FIRST_DC_CB 0xB8

/* Codebook descriptors for the remaining DC differences; encode_dc_coeffs()
 * selects one with the previously written code, clamped to 6. */
static const uint8_t dc_codebook[7] = { 0x04, 0x28, 0x28, 0x4D, 0x4D, 0x70, 0x70};

/**
 * Write the DC coefficients of all blocks in a slice.
 *
 * The first DC is coded directly; every following one is coded as the
 * difference to its predecessor, with the codebook chosen from the
 * previously written code. 16384 is subtracted from each DC before it is
 * quantised.
 *
 * @param pb               bit writer
 * @param in               coefficients, 64 per block, DC at offset 0
 * @param blocks_per_slice number of blocks in in
 * @param qmat             scaled quantisation matrix (entry 0 is used)
 */
static void encode_dc_coeffs(PutBitContext *pb, int16_t *in,
        int blocks_per_slice, int *qmat)
{
    int last_dc   = QSCALE(qmat, 0, in[0] - 16384);
    int last_code = 5;
    int last_sign = 0;
    int blk;

    encode_codeword(pb, TO_GOLOMB(last_dc), FIRST_DC_CB);

    for (blk = 1; blk < blocks_per_slice; blk++) {
        const int dc   = QSCALE(qmat, 0, in[blk * 64] - 16384);
        const int diff = dc - last_dc;
        /* the low bit of the code tells whether the sign flipped
         * relative to the previous difference */
        const int flip = DIFF_SIGN(diff, last_sign);
        const int cw   = TO_GOLOMB2(get_level(diff), flip);

        encode_codeword(pb, cw, dc_codebook[FFMIN(last_code, 6)]);

        last_code = cw;
        last_sign = diff >> 31;
        last_dc   = dc;
    }
}

/* Codebook descriptors for zero-run lengths; encode_ac_coeffs() indexes the
 * table with the previous run, clamped to 15. */
static const uint8_t run_to_cb[16] = { 0x06, 0x06, 0x05, 0x05, 0x04, 0x29,
        0x29, 0x29, 0x29, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x4C };
/* Codebook descriptors for coefficient levels; encode_ac_coeffs() indexes
 * the table with the previous level, clamped to 9. */
static const uint8_t lev_to_cb[10] = { 0x04, 0x0A, 0x05, 0x06, 0x04, 0x28,
        0x28, 0x28, 0x28, 0x4C };

/**
 * Write the AC coefficients of all blocks in a slice.
 *
 * Coefficients are visited position by position in progressive_scan order,
 * and for each position across every block of the slice. Each non-zero
 * quantised value is written as (zero run, level - 1, sign bit); the
 * codebooks adapt to the previous run and level. Trailing zeros are not
 * written.
 *
 * @param avctx            codec context (not used here)
 * @param pb               bit writer
 * @param in               coefficients, 64 per block
 * @param blocks_per_slice number of blocks in in
 * @param qmat             scaled quantisation matrix
 */
static void encode_ac_coeffs(AVCodecContext *avctx, PutBitContext *pb,
        int16_t *in, int blocks_per_slice, int *qmat)
{
    int last_run   = 4;
    int last_level = 2;
    int zero_run   = 0;
    int pos, blk;

    for (pos = 1; pos < 64; pos++) {
        const int coef = progressive_scan[pos];

        for (blk = 0; blk < blocks_per_slice; blk++) {
            const int q = QSCALE(qmat, coef, in[blk * 64 + coef]);
            int magnitude;

            if (!q) {
                zero_run++;
                continue;
            }

            encode_codeword(pb, zero_run, run_to_cb[FFMIN(last_run, 15)]);
            last_run = zero_run;
            zero_run = 0;

            magnitude = get_level(q);
            encode_codeword(pb, magnitude - 1,
                            lev_to_cb[FFMIN(last_level, 9)]);
            last_level = magnitude;

            put_bits(pb, 1, IS_NEGATIVE(q));
        }
    }
}

/**
 * Copy an 8x8 block of 16-bit samples into a contiguous coefficient block.
 *
 * @param pixels first byte of the block's top-left sample
 * @param stride distance in bytes between consecutive source rows
 * @param block  destination, 64 values stored row after row
 */
static void get(uint8_t *pixels, int stride, int16_t* block)
{
    int row;

    for (row = 0; row < 8; row++) {
        const uint8_t *src_row = pixels + row * stride;
        int16_t       *dst_row = block  + row * 8;

        /* one row is 16 bytes: move it as two 64-bit words */
        AV_WN64(dst_row,     AV_RN64(src_row));
        AV_WN64(dst_row + 4, AV_RN64(src_row + 8));
    }
}

/**
 * Load one 8x8 block of samples with get() and transform it in place with
 * the fdct function of fdsp.
 *
 * @param fdsp   DCT function table
 * @param pixels first byte of the block's top-left sample
 * @param stride distance in bytes between consecutive source rows
 * @param block  receives the 64 transformed values
 */
static void fdct_get(FDCTDSPContext *fdsp, uint8_t *pixels, int stride, int16_t* block)
{
    get(pixels, stride, block);
    fdsp->fdct(block);
}

/**
 * Transform and entropy-code one plane of a slice.
 *
 * Every macroblock contributes four 8x8 blocks for luma or two for chroma.
 * The transformed coefficients are gathered in a local array and then
 * written as DC codes followed by AC codes.
 *
 * @param avctx      codec context; its private data supplies the DCT
 * @param mb_count   macroblocks in the slice; the local coefficient array
 *                   has room for DEFAULT_SLICE_MB_WIDTH of them
 * @param src        first byte of the slice within this plane
 * @param src_stride distance in bytes between sample rows of src
 * @param buf        output buffer
 * @param buf_size   number of bytes available in buf
 * @param qmat       scaled quantisation matrix for this plane
 * @param chroma     0 for luma, 1 for chroma
 * @return number of bytes written to buf
 */
static int encode_slice_plane(AVCodecContext *avctx, int mb_count,
        uint8_t *src, int src_stride, uint8_t *buf, unsigned buf_size,
        int *qmat, int chroma)
{
    ProresContext* ctx = avctx->priv_data;
    FDCTDSPContext *fdsp = &ctx->fdsp;
    DECLARE_ALIGNED(16, int16_t, blocks)[DEFAULT_SLICE_MB_WIDTH << 8], *block;
    int i, blocks_per_slice;
    PutBitContext pb;

    block = blocks;
    for (i = 0; i < mb_count; i++) {
        /* Luma block order: top-left, top-right, bottom-left, bottom-right.
         * Chroma has only one block column: top, bottom. */
        fdct_get(fdsp, src,                  src_stride, block + (0 << 6));
        fdct_get(fdsp, src + 8 * src_stride, src_stride, block + ((2 - chroma) << 6));
        if (!chroma) {
            /* 16 bytes further right = 8 samples of 16 bits */
            fdct_get(fdsp, src + 16,                  src_stride, block + (1 << 6));
            fdct_get(fdsp, src + 16 + 8 * src_stride, src_stride, block + (3 << 6));
        }

        /* 256 coefficients / 32 bytes per luma macroblock, half for chroma */
        block += (256 >> chroma);
        src   += (32  >> chroma);
    }

    blocks_per_slice = mb_count << (2 - chroma);
    /* init_put_bits() takes the buffer size in bytes, not in bits; passing
     * a bit count would overstate the writable space eightfold. */
    init_put_bits(&pb, buf, buf_size);

    encode_dc_coeffs(&pb, blocks, blocks_per_slice, qmat);
    encode_ac_coeffs(avctx, &pb, blocks, blocks_per_slice, qmat);

    flush_put_bits(&pb);
    return put_bits_ptr(&pb) - pb.buf;
}

/**
 * Encode the planes of one slice back to back into buf.
 *
 * Luma is always written. The two chroma planes follow unless
 * CODEC_FLAG_GRAY is set, in which case *u_data_size and *v_data_size are
 * left as the caller initialised them.
 *
 * @param qp quantiser value; row qp - 1 of the scaled matrices is used
 * @return sum of *y_data_size, *u_data_size and *v_data_size
 */
static av_always_inline unsigned encode_slice_data(AVCodecContext *avctx,
        uint8_t *dest_y, uint8_t *dest_u, uint8_t *dest_v, int luma_stride,
        int chroma_stride, unsigned mb_count, uint8_t *buf, unsigned data_size,
        unsigned* y_data_size, unsigned* u_data_size, unsigned* v_data_size,
        int qp)
{
    ProresContext* ctx = avctx->priv_data;
    const int gray_only = avctx->flags & CODEC_FLAG_GRAY;

    *y_data_size = encode_slice_plane(avctx, mb_count, dest_y, luma_stride,
                                      buf, data_size,
                                      ctx->qmat_luma[qp - 1], 0);

    if (!gray_only) {
        int *chroma_qmat = ctx->qmat_chroma[qp - 1];

        /* each plane starts where the previous one ended */
        buf       += *y_data_size;
        data_size -= *y_data_size;
        *u_data_size = encode_slice_plane(avctx, mb_count, dest_u,
                                          chroma_stride, buf, data_size,
                                          chroma_qmat, 1);

        buf       += *u_data_size;
        data_size -= *u_data_size;
        *v_data_size = encode_slice_plane(avctx, mb_count, dest_v,
                                          chroma_stride, buf, data_size,
                                          chroma_qmat, 1);
    }

    return *y_data_size + *u_data_size + *v_data_size;
}

/**
 * Copy a rectangle of 16-bit samples into a packed buffer, padding it to
 * the requested size by repeating the last available column and row.
 *
 * @param src        top-left sample of the source plane
 * @param x          column of the rectangle within the plane, in samples
 * @param y          row of the rectangle within the plane
 * @param stride     source row pitch in bytes
 * @param width      width of the source plane in samples
 * @param height     height of the source plane in rows
 * @param dst        destination, rows stored back to back
 * @param dst_width  destination row length in samples
 * @param dst_height number of destination rows
 */
static void subimage_with_fill(uint16_t *src, unsigned x, unsigned y,
        unsigned stride, unsigned width, unsigned height, uint16_t *dst,
        unsigned dst_width, unsigned dst_height)
{
    const int copy_w   = FFMIN(width - x, dst_width);
    const int copy_h   = FFMIN(height - y, dst_height);
    const int src_step = stride >> 1;   /* bytes -> 16-bit samples */
    uint16_t *bottom;
    int row, col;

    src += y * src_step + x;

    /* rows that exist in the source: copy, then stretch the last sample */
    for (row = 0; row < copy_h; row++) {
        uint16_t edge;

        for (col = 0; col < copy_w; col++)
            dst[col] = src[col];

        edge = dst[col - 1];
        while (col < dst_width) {
            dst[col] = edge;
            col++;
        }

        src += src_step;
        dst += dst_width;
    }

    /* rows below the source: repeat the last row written above */
    bottom = dst - dst_width;
    while (row < dst_height) {
        for (col = 0; col < dst_width; col++)
            dst[col] = bottom[col];
        dst += dst_width;
        row++;
    }
}

/**
 * Encode one slice, including its 6-byte header.
 *
 * Slices that reach past the picture edge (unsafe != 0) are first copied
 * into the padded scratch planes and encoded once with the current
 * quantiser. All other slices are encoded straight from the frame, and the
 * quantiser is then stepped up or down, within the profile's limits, until
 * the slice size falls inside the target window or a limit is reached.
 *
 * @param mb_x      first macroblock column of the slice
 * @param mb_y      macroblock row of the slice
 * @param mb_count  macroblocks in the slice
 * @param buf       output buffer for header and data
 * @param data_size bytes available in buf
 * @param unsafe    non-zero when the slice overlaps the right or bottom
 *                  picture edge
 * @param qp        in: starting quantiser; out: quantiser finally used
 * @return total bytes written (header plus plane data)
 */
static int encode_slice(AVCodecContext *avctx, const AVFrame *pic, int mb_x,
        int mb_y, unsigned mb_count, uint8_t *buf, unsigned data_size,
        int unsafe, int *qp)
{
    ProresContext* ctx = avctx->priv_data;
    const int hdr_size      = 6;
    const int luma_stride   = pic->linesize[0];
    const int chroma_stride = pic->linesize[1];
    uint8_t *payload        = buf + hdr_size;
    const unsigned payload_size = data_size - hdr_size;
    unsigned y_data_size = 0, u_data_size = 0, v_data_size = 0;

    if (unsafe) {
        /* build padded copies of the three planes, then encode those */
        subimage_with_fill((uint16_t *) pic->data[0], mb_x << 4, mb_y << 4,
                luma_stride, avctx->width, avctx->height,
                (uint16_t *) ctx->fill_y, mb_count << 4, 16);
        subimage_with_fill((uint16_t *) pic->data[1], mb_x << 3, mb_y << 4,
                chroma_stride, avctx->width >> 1, avctx->height,
                (uint16_t *) ctx->fill_u, mb_count << 3, 16);
        subimage_with_fill((uint16_t *) pic->data[2], mb_x << 3, mb_y << 4,
                chroma_stride, avctx->width >> 1, avctx->height,
                (uint16_t *) ctx->fill_v, mb_count << 3, 16);

        /* scratch rows are packed: 32 bytes (luma) / 16 bytes (chroma)
         * per macroblock */
        encode_slice_data(avctx, ctx->fill_y, ctx->fill_u, ctx->fill_v,
                mb_count << 5, mb_count << 4, mb_count, payload,
                payload_size, &y_data_size, &u_data_size, &v_data_size,
                *qp);
    } else {
        const int qp_min     = qp_start_table[avctx->profile];
        const int qp_max     = qp_end_table[avctx->profile];
        const int tgt_bits   = (mb_count * bitrate_table[avctx->profile]) >> 2;
        /* window of one eighth around the target, converted to bytes */
        const int low_bytes  = (tgt_bits - (tgt_bits >> 3)) >> 3;
        const int high_bytes = (tgt_bits + (tgt_bits >> 3)) >> 3;
        uint8_t *dest_y = pic->data[0] + (mb_y << 4) * luma_stride   + (mb_x << 5);
        uint8_t *dest_u = pic->data[1] + (mb_y << 4) * chroma_stride + (mb_x << 4);
        uint8_t *dest_v = pic->data[2] + (mb_y << 4) * chroma_stride + (mb_x << 4);
        int step = 0;
        int slice_size;

        slice_size = encode_slice_data(avctx, dest_y, dest_u, dest_v,
                luma_stride, chroma_stride, mb_count, payload,
                payload_size, &y_data_size, &u_data_size, &v_data_size,
                *qp);

        /* decide once in which direction, if any, the quantiser moves */
        if (slice_size > high_bytes && *qp < qp_max)
            step = 1;
        else if (slice_size < low_bytes && *qp > qp_min)
            step = -1;

        while (step) {
            int keep_going;

            *qp += step;
            slice_size = encode_slice_data(avctx, dest_y, dest_u, dest_v,
                    luma_stride, chroma_stride, mb_count, payload,
                    payload_size, &y_data_size, &u_data_size,
                    &v_data_size, *qp);

            if (step > 0)
                keep_going = slice_size > high_bytes && *qp < qp_max;
            else
                keep_going = slice_size < low_bytes && *qp > qp_min;
            if (!keep_going)
                break;
        }
    }

    /* slice header: header size in bits, quantiser, Y size, U size */
    buf[0] = hdr_size << 3;
    buf[1] = *qp;
    AV_WB16(buf + 2, y_data_size);
    AV_WB16(buf + 4, u_data_size);

    return hdr_size + y_data_size + u_data_size + v_data_size;
}

/**
 * Encode a whole picture: 8-byte picture header, slice size table, then
 * the slices themselves.
 *
 * Each macroblock row is split into slices of DEFAULT_SLICE_MB_WIDTH
 * macroblocks; the remainder of a row is covered by slices whose width is
 * halved until it fits. The quantiser chosen for one slice is the starting
 * point for the next.
 *
 * @param avctx    codec context
 * @param pic      source frame
 * @param buf      output buffer
 * @param buf_size bytes available in buf
 * @return number of bytes written to buf
 */
static int prores_encode_picture(AVCodecContext *avctx, const AVFrame *pic,
        uint8_t *buf, const int buf_size)
{
    int mb_width = (avctx->width + 15) >> 4;
    int mb_height = (avctx->height + 15) >> 4;
    int hdr_size, sl_size, i;
    int mb_y, sl_data_size, qp;
    int unsafe_bot, unsafe_right;
    uint8_t *sl_data, *sl_data_sizes;
    int slice_per_line = 0, rem = mb_width;
    int sl_table_size;

    /* count the slices of one row: as many full-width slices as fit, then
     * one slice per remaining power-of-two width */
    for (i = av_log2(DEFAULT_SLICE_MB_WIDTH); i >= 0; --i) {
        slice_per_line += rem >> i;
        rem &= (1 << i) - 1;
    }

    qp = qp_start_table[avctx->profile];
    hdr_size = 8;
    /* two bytes of size information per slice precede the slice data */
    sl_table_size = slice_per_line * mb_height * 2;
    sl_data_sizes = buf + hdr_size;
    sl_data = sl_data_sizes + sl_table_size;
    /* space left for slice data excludes the header and the size table */
    sl_data_size = buf_size - hdr_size - sl_table_size;
    for (mb_y = 0; mb_y < mb_height; mb_y++) {
        int mb_x = 0;
        int slice_mb_count = DEFAULT_SLICE_MB_WIDTH;
        while (mb_x < mb_width) {
            /* shrink the slice until it fits into what is left of the row */
            while (mb_width - mb_x < slice_mb_count)
                slice_mb_count >>= 1;

            /* slices overlapping a partial macroblock need padded input */
            unsafe_bot = (avctx->height & 0xf) && (mb_y == mb_height - 1);
            unsafe_right = (avctx->width & 0xf) && (mb_x + slice_mb_count == mb_width);

            sl_size = encode_slice(avctx, pic, mb_x, mb_y, slice_mb_count,
                    sl_data, sl_data_size, unsafe_bot || unsafe_right, &qp);

            bytestream_put_be16(&sl_data_sizes, sl_size);
            sl_data           += sl_size;
            sl_data_size      -= sl_size;
            mb_x              += slice_mb_count;
        }
    }

    /* picture header: header size in bits, picture size, slice count,
     * log2 of the slice width in the high nibble */
    buf[0] = hdr_size << 3;
    AV_WB32(buf + 1, sl_data - buf);
    AV_WB16(buf + 5, slice_per_line * mb_height);
    buf[7] = av_log2(DEFAULT_SLICE_MB_WIDTH) << 4;

    return sl_data - buf;
}

/**
 * encode2 callback: produce one packet holding a complete frame.
 *
 * Packet layout: 32-bit big-endian frame size, "icpf", the 148-byte frame
 * header (which ends with the luma and chroma quantisation matrices), then
 * the picture written by prores_encode_picture().
 *
 * @return 0 on success, a negative error code if the packet cannot be
 *         allocated
 */
static int prores_encode_frame(AVCodecContext *avctx, AVPacket *pkt,
                               const AVFrame *pict, int *got_packet)
{
    /* bytes 8..15 of the frame header; the first one encodes
     * {10}(422){00}{00}(frame){11}.
     * NOTE(review): meaning of the remaining bytes is not visible in this
     * file - confirm against the frame header layout before changing. */
    static const uint8_t frame_props[8] = { 0x83, 0, 2, 2, 6, 32, 0, 3 };
    const int header_size = 148;
    const int prefix_size = header_size + 8; /* size field + "icpf" + header */
    int frame_size = FFALIGN(avctx->width, 16) * FFALIGN(avctx->height, 16)*16 + 500 + FF_MIN_BUFFER_SIZE; //FIXME choose tighter limit
    uint8_t *wr;
    int pic_size, total_size, ret;

    ret = ff_alloc_packet2(avctx, pkt, frame_size + FF_MIN_BUFFER_SIZE);
    if (ret < 0)
        return ret;

    /* the picture is encoded first because the frame size is written
     * in front of it */
    wr = pkt->data;
    pic_size   = prores_encode_picture(avctx, pict, wr + prefix_size,
                                       pkt->size - prefix_size);
    total_size = pic_size + 8 + header_size;

    bytestream_put_be32(&wr, total_size);
    bytestream_put_buffer(&wr, "icpf", 4);

    bytestream_put_be16(&wr, header_size);
    bytestream_put_be16(&wr, 0);
    bytestream_put_buffer(&wr, "fmpg", 4);
    bytestream_put_be16(&wr, avctx->width);
    bytestream_put_be16(&wr, avctx->height);
    bytestream_put_buffer(&wr, frame_props, 8);

    bytestream_put_buffer(&wr, QMAT_LUMA[avctx->profile],   64);
    bytestream_put_buffer(&wr, QMAT_CHROMA[avctx->profile], 64);

    pkt->flags |= AV_PKT_FLAG_KEY;
    pkt->size   = total_size;
    *got_packet = 1;

    return 0;
}

/**
 * Multiply a 64-entry quantisation matrix by a constant.
 *
 * @param src   base matrix
 * @param dst   receives src[k] * scale for k = 0..63
 * @param scale multiplier
 */
static void scale_mat(const uint8_t* src, int* dst, int scale)
{
    const uint8_t *const end = src + 64;

    while (src < end)
        *dst++ = *src++ * scale;
}

/**
 * Encoder init callback.
 *
 * Validates pixel format, dimensions and profile, allocates the padding
 * scratch planes when a dimension is not a multiple of 16, initialises the
 * DCT, sets the codec tag from the profile and precomputes the quantisation
 * matrices for quantiser values 1..16.
 *
 * All validation happens before the first allocation, and a failed frame
 * allocation releases the scratch planes, so no error path leaves memory
 * behind.
 *
 * @return 0 on success, a negative value on error
 */
static av_cold int prores_encode_init(AVCodecContext *avctx)
{
    int i;
    ProresContext* ctx = avctx->priv_data;

    if (avctx->pix_fmt != AV_PIX_FMT_YUV422P10) {
        av_log(avctx, AV_LOG_ERROR, "need YUV422P10\n");
        return -1;
    }
    avctx->bits_per_raw_sample = 10;

    if (avctx->width & 0x1) {
        av_log(avctx, AV_LOG_ERROR,
                "frame width needs to be multiple of 2\n");
        return -1;
    }

    if (avctx->width > 65534 || avctx->height > 65535) {
        av_log(avctx, AV_LOG_ERROR,
                "The maximum dimensions are 65534x65535\n");
        return AVERROR(EINVAL);
    }

    /* Resolve the profile before anything is allocated, so that rejecting
     * it cannot leak the scratch planes. */
    if (avctx->profile == FF_PROFILE_UNKNOWN) {
        avctx->profile = FF_PROFILE_PRORES_STANDARD;
        av_log(avctx, AV_LOG_INFO,
                "encoding with ProRes standard (apcn) profile\n");

    } else if (avctx->profile < FF_PROFILE_PRORES_PROXY
            || avctx->profile > FF_PROFILE_PRORES_HQ) {
        av_log(
                avctx,
                AV_LOG_ERROR,
                "unknown profile %d, use [0 - apco, 1 - apcs, 2 - apcn (default), 3 - apch]\n",
                avctx->profile);
        return -1;
    }

    if ((avctx->height & 0xf) || (avctx->width & 0xf)) {
        /* One allocation for all three scratch planes of a full-width
         * slice: half of it for luma, a quarter for each chroma plane. */
        ctx->fill_y = av_malloc(4 * (DEFAULT_SLICE_MB_WIDTH << 8));
        if (!ctx->fill_y)
            return AVERROR(ENOMEM);
        ctx->fill_u = ctx->fill_y + (DEFAULT_SLICE_MB_WIDTH << 9);
        ctx->fill_v = ctx->fill_u + (DEFAULT_SLICE_MB_WIDTH << 8);
    }

    ff_fdctdsp_init(&ctx->fdsp, avctx);

    avctx->codec_tag = AV_RL32((const uint8_t*)profiles[avctx->profile].name);

    /* row i - 1 holds the base matrix multiplied by quantiser value i */
    for (i = 1; i <= 16; i++) {
        scale_mat(QMAT_LUMA[avctx->profile]  , ctx->qmat_luma[i - 1]  , i);
        scale_mat(QMAT_CHROMA[avctx->profile], ctx->qmat_chroma[i - 1], i);
    }

    avctx->coded_frame = av_frame_alloc();
    if (!avctx->coded_frame) {
        /* undo the scratch allocation; fill_u/fill_v pointed into it */
        av_freep(&ctx->fill_y);
        ctx->fill_u = NULL;
        ctx->fill_v = NULL;
        return AVERROR(ENOMEM);
    }
    avctx->coded_frame->key_frame = 1;
    avctx->coded_frame->pict_type = AV_PICTURE_TYPE_I;

    return 0;
}

/**
 * Encoder close callback: release everything prores_encode_init() set up.
 *
 * @return always 0
 */
static av_cold int prores_encode_close(AVCodecContext *avctx)
{
    ProresContext* ctx = avctx->priv_data;

    /* coded_frame comes from av_frame_alloc(), so it is released with the
     * matching av_frame_free(), which also resets the pointer. */
    av_frame_free(&avctx->coded_frame);

    /* fill_u and fill_v point into the fill_y allocation */
    av_freep(&ctx->fill_y);
    ctx->fill_u = NULL;
    ctx->fill_v = NULL;

    return 0;
}

/* Encoder descriptor registered under the name "prores_aw". It uses the
 * same callbacks, pixel format list and profile table as ff_prores_encoder
 * and differs from it only in the name. */
AVCodec ff_prores_aw_encoder = {
    .name           = "prores_aw",
    .long_name      = NULL_IF_CONFIG_SMALL("Apple ProRes"),
    .type           = AVMEDIA_TYPE_VIDEO,
    .id             = AV_CODEC_ID_PRORES,
    .priv_data_size = sizeof(ProresContext),
    .init           = prores_encode_init,
    .close          = prores_encode_close,
    .encode2        = prores_encode_frame,
    .pix_fmts       = (const enum AVPixelFormat[]){AV_PIX_FMT_YUV422P10, AV_PIX_FMT_NONE},
    .capabilities   = CODEC_CAP_FRAME_THREADS | CODEC_CAP_INTRA_ONLY,
    .profiles       = profiles
};

/* Encoder descriptor registered under the name "prores". It uses the same
 * callbacks, pixel format list and profile table as ff_prores_aw_encoder
 * and differs from it only in the name. */
AVCodec ff_prores_encoder = {
    .name           = "prores",
    .long_name      = NULL_IF_CONFIG_SMALL("Apple ProRes"),
    .type           = AVMEDIA_TYPE_VIDEO,
    .id             = AV_CODEC_ID_PRORES,
    .priv_data_size = sizeof(ProresContext),
    .init           = prores_encode_init,
    .close          = prores_encode_close,
    .encode2        = prores_encode_frame,
    .pix_fmts       = (const enum AVPixelFormat[]){AV_PIX_FMT_YUV422P10, AV_PIX_FMT_NONE},
    .capabilities   = CODEC_CAP_FRAME_THREADS | CODEC_CAP_INTRA_ONLY,
    .profiles       = profiles
};
Commit	Line	Data
	1	/*
	2	* Apple ProRes encoder
	3	*
	4	* Copyright (c) 2011 Anatoliy Wasserman
	5	*
	6	* This file is part of FFmpeg.
	7	*
	8	* FFmpeg is free software; you can redistribute it and/or
	9	* modify it under the terms of the GNU Lesser General Public
	10	* License as published by the Free Software Foundation; either
	11	* version 2.1 of the License, or (at your option) any later version.
	12	*
	13	* FFmpeg is distributed in the hope that it will be useful,
	14	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	15	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
	16	* Lesser General Public License for more details.
	17	*
	18	* You should have received a copy of the GNU Lesser General Public
	19	* License along with FFmpeg; if not, write to the Free Software
	20	* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
	21	*/
	22
	23	/**
	24	* @file
	25	* Apple ProRes encoder (Anatoliy Wasserman version)
	26	* Known FOURCCs: 'apch' (HQ), 'apcn' (SD), 'apcs' (LT), 'acpo' (Proxy)
	27	*/
	28
	29	#include "avcodec.h"
	30	#include "dct.h"
	31	#include "internal.h"
	32	#include "put_bits.h"
	33	#include "bytestream.h"
	34	#include "fdctdsp.h"
	35
	36	#define DEFAULT_SLICE_MB_WIDTH 8
	37
	38	#define FF_PROFILE_PRORES_PROXY 0
	39	#define FF_PROFILE_PRORES_LT 1
	40	#define FF_PROFILE_PRORES_STANDARD 2
	41	#define FF_PROFILE_PRORES_HQ 3
	42
	43	static const AVProfile profiles[] = {
	44	{ FF_PROFILE_PRORES_PROXY, "apco"},
	45	{ FF_PROFILE_PRORES_LT, "apcs"},
	46	{ FF_PROFILE_PRORES_STANDARD, "apcn"},
	47	{ FF_PROFILE_PRORES_HQ, "apch"},
	48	{ FF_PROFILE_UNKNOWN }
	49	};
	50
	51	static const int qp_start_table[4] = { 4, 1, 1, 1 };
	52	static const int qp_end_table[4] = { 8, 9, 6, 6 };
	53	static const int bitrate_table[5] = { 1000, 2100, 3500, 5400 };
	54
	55	static const uint8_t progressive_scan[64] = {
	56	0, 1, 8, 9, 2, 3, 10, 11,
	57	16, 17, 24, 25, 18, 19, 26, 27,
	58	4, 5, 12, 20, 13, 6, 7, 14,
	59	21, 28, 29, 22, 15, 23, 30, 31,
	60	32, 33, 40, 48, 41, 34, 35, 42,
	61	49, 56, 57, 50, 43, 36, 37, 44,
	62	51, 58, 59, 52, 45, 38, 39, 46,
	63	53, 60, 61, 54, 47, 55, 62, 63
	64	};
	65
	66	static const uint8_t QMAT_LUMA[4][64] = {
	67	{
	68	4, 7, 9, 11, 13, 14, 15, 63,
	69	7, 7, 11, 12, 14, 15, 63, 63,
	70	9, 11, 13, 14, 15, 63, 63, 63,
	71	11, 11, 13, 14, 63, 63, 63, 63,
	72	11, 13, 14, 63, 63, 63, 63, 63,
	73	13, 14, 63, 63, 63, 63, 63, 63,
	74	13, 63, 63, 63, 63, 63, 63, 63,
	75	63, 63, 63, 63, 63, 63, 63, 63
	76	}, {
	77	4, 5, 6, 7, 9, 11, 13, 15,
	78	5, 5, 7, 8, 11, 13, 15, 17,
	79	6, 7, 9, 11, 13, 15, 15, 17,
	80	7, 7, 9, 11, 13, 15, 17, 19,
	81	7, 9, 11, 13, 14, 16, 19, 23,
	82	9, 11, 13, 14, 16, 19, 23, 29,
	83	9, 11, 13, 15, 17, 21, 28, 35,
	84	11, 13, 16, 17, 21, 28, 35, 41
	85	}, {
	86	4, 4, 5, 5, 6, 7, 7, 9,
	87	4, 4, 5, 6, 7, 7, 9, 9,
	88	5, 5, 6, 7, 7, 9, 9, 10,
	89	5, 5, 6, 7, 7, 9, 9, 10,
	90	5, 6, 7, 7, 8, 9, 10, 12,
	91	6, 7, 7, 8, 9, 10, 12, 15,
	92	6, 7, 7, 9, 10, 11, 14, 17,
	93	7, 7, 9, 10, 11, 14, 17, 21
	94	}, {
	95	4, 4, 4, 4, 4, 4, 4, 4,
	96	4, 4, 4, 4, 4, 4, 4, 4,
	97	4, 4, 4, 4, 4, 4, 4, 4,
	98	4, 4, 4, 4, 4, 4, 4, 5,
	99	4, 4, 4, 4, 4, 4, 5, 5,
	100	4, 4, 4, 4, 4, 5, 5, 6,
	101	4, 4, 4, 4, 5, 5, 6, 7,
	102	4, 4, 4, 4, 5, 6, 7, 7
	103	}
	104	};
	105
	106	static const uint8_t QMAT_CHROMA[4][64] = {
	107	{
	108	4, 7, 9, 11, 13, 14, 63, 63,
	109	7, 7, 11, 12, 14, 63, 63, 63,
	110	9, 11, 13, 14, 63, 63, 63, 63,
	111	11, 11, 13, 14, 63, 63, 63, 63,
	112	11, 13, 14, 63, 63, 63, 63, 63,
	113	13, 14, 63, 63, 63, 63, 63, 63,
	114	13, 63, 63, 63, 63, 63, 63, 63,
	115	63, 63, 63, 63, 63, 63, 63, 63
	116	}, {
	117	4, 5, 6, 7, 9, 11, 13, 15,
	118	5, 5, 7, 8, 11, 13, 15, 17,
	119	6, 7, 9, 11, 13, 15, 15, 17,
	120	7, 7, 9, 11, 13, 15, 17, 19,
	121	7, 9, 11, 13, 14, 16, 19, 23,
	122	9, 11, 13, 14, 16, 19, 23, 29,
	123	9, 11, 13, 15, 17, 21, 28, 35,
	124	11, 13, 16, 17, 21, 28, 35, 41
	125	}, {
	126	4, 4, 5, 5, 6, 7, 7, 9,
	127	4, 4, 5, 6, 7, 7, 9, 9,
	128	5, 5, 6, 7, 7, 9, 9, 10,
	129	5, 5, 6, 7, 7, 9, 9, 10,
	130	5, 6, 7, 7, 8, 9, 10, 12,
	131	6, 7, 7, 8, 9, 10, 12, 15,
	132	6, 7, 7, 9, 10, 11, 14, 17,
	133	7, 7, 9, 10, 11, 14, 17, 21
	134	}, {
	135	4, 4, 4, 4, 4, 4, 4, 4,
	136	4, 4, 4, 4, 4, 4, 4, 4,
	137	4, 4, 4, 4, 4, 4, 4, 4,
	138	4, 4, 4, 4, 4, 4, 4, 5,
	139	4, 4, 4, 4, 4, 4, 5, 5,
	140	4, 4, 4, 4, 4, 5, 5, 6,
	141	4, 4, 4, 4, 5, 5, 6, 7,
	142	4, 4, 4, 4, 5, 6, 7, 7
	143	}
	144	};
	145
	146
	147	typedef struct {
	148	FDCTDSPContext fdsp;
	149	uint8_t* fill_y;
	150	uint8_t* fill_u;
	151	uint8_t* fill_v;
	152
	153	int qmat_luma[16][64];
	154	int qmat_chroma[16][64];
	155	} ProresContext;
	156
	157	static void encode_codeword(PutBitContext *pb, int val, int codebook)
	158	{
	159	unsigned int rice_order, exp_order, switch_bits, first_exp, exp, zeros,
	160	mask;
	161
	162	/* number of bits to switch between rice and exp golomb */
	163	switch_bits = codebook & 3;
	164	rice_order = codebook >> 5;
	165	exp_order = (codebook >> 2) & 7;
	166
	167	first_exp = ((switch_bits + 1) << rice_order);
	168
	169	if (val >= first_exp) { /* exp golomb */
	170	val -= first_exp;
	171	val += (1 << exp_order);
	172	exp = av_log2(val);
	173	zeros = exp - exp_order + switch_bits + 1;
	174	put_bits(pb, zeros, 0);
	175	put_bits(pb, exp + 1, val);
	176	} else if (rice_order) {
	177	mask = (1 << rice_order) - 1;
	178	put_bits(pb, (val >> rice_order), 0);
	179	put_bits(pb, 1, 1);
	180	put_bits(pb, rice_order, val & mask);
	181	} else {
	182	put_bits(pb, val, 0);
	183	put_bits(pb, 1, 1);
	184	}
	185	}
	186
	187	#define QSCALE(qmat,ind,val) ((val) / ((qmat)[ind]))
	188	#define TO_GOLOMB(val) (((val) << 1) ^ ((val) >> 31))
	189	#define DIFF_SIGN(val, sign) (((val) >> 31) ^ (sign))
	190	#define IS_NEGATIVE(val) ((((val) >> 31) ^ -1) + 1)
	191	#define TO_GOLOMB2(val,sign) ((val)==0 ? 0 : ((val) << 1) + (sign))
	192
	193	static av_always_inline int get_level(int val)
	194	{
	195	int sign = (val >> 31);
	196	return (val ^ sign) - sign;
	197	}
	198
	199	#define FIRST_DC_CB 0xB8
	200
	201	static const uint8_t dc_codebook[7] = { 0x04, 0x28, 0x28, 0x4D, 0x4D, 0x70, 0x70};
	202
	203	static void encode_dc_coeffs(PutBitContext pb, int16_t in,
	204	int blocks_per_slice, int *qmat)
	205	{
	206	int prev_dc, code;
	207	int i, sign, idx;
	208	int new_dc, delta, diff_sign, new_code;
	209
	210	prev_dc = QSCALE(qmat, 0, in[0] - 16384);
	211	code = TO_GOLOMB(prev_dc);
	212	encode_codeword(pb, code, FIRST_DC_CB);
	213
	214	code = 5; sign = 0; idx = 64;
	215	for (i = 1; i < blocks_per_slice; i++, idx += 64) {
	216	new_dc = QSCALE(qmat, 0, in[idx] - 16384);
	217	delta = new_dc - prev_dc;
	218	diff_sign = DIFF_SIGN(delta, sign);
	219	new_code = TO_GOLOMB2(get_level(delta), diff_sign);
	220
	221	encode_codeword(pb, new_code, dc_codebook[FFMIN(code, 6)]);
	222
	223	code = new_code;
	224	sign = delta >> 31;
	225	prev_dc = new_dc;
	226	}
	227	}
	228
	229	static const uint8_t run_to_cb[16] = { 0x06, 0x06, 0x05, 0x05, 0x04, 0x29,
	230	0x29, 0x29, 0x29, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x4C };
	231	static const uint8_t lev_to_cb[10] = { 0x04, 0x0A, 0x05, 0x06, 0x04, 0x28,
	232	0x28, 0x28, 0x28, 0x4C };
	233
	234	static void encode_ac_coeffs(AVCodecContext avctx, PutBitContext pb,
	235	int16_t in, int blocks_per_slice, int qmat)
	236	{
	237	int prev_run = 4;
	238	int prev_level = 2;
	239
	240	int run = 0, level, code, i, j;
	241	for (i = 1; i < 64; i++) {
	242	int indp = progressive_scan[i];
	243	for (j = 0; j < blocks_per_slice; j++) {
	244	int val = QSCALE(qmat, indp, in[(j << 6) + indp]);
	245	if (val) {
	246	encode_codeword(pb, run, run_to_cb[FFMIN(prev_run, 15)]);
	247
	248	prev_run = run;
	249	run = 0;
	250	level = get_level(val);
	251	code = level - 1;
	252
	253	encode_codeword(pb, code, lev_to_cb[FFMIN(prev_level, 9)]);
	254
	255	prev_level = level;
	256
	257	put_bits(pb, 1, IS_NEGATIVE(val));
	258	} else {
	259	++run;
	260	}
	261	}
	262	}
	263	}
	264
	265	static void get(uint8_t pixels, int stride, int16_t block)
	266	{
	267	int i;
	268
	269	for (i = 0; i < 8; i++) {
	270	AV_WN64(block, AV_RN64(pixels));
	271	AV_WN64(block+4, AV_RN64(pixels+8));
	272	pixels += stride;
	273	block += 8;
	274	}
	275	}
	276
	277	static void fdct_get(FDCTDSPContext fdsp, uint8_t pixels, int stride, int16_t* block)
	278	{
	279	get(pixels, stride, block);
	280	fdsp->fdct(block);
	281	}
	282
	283	static int encode_slice_plane(AVCodecContext *avctx, int mb_count,
	284	uint8_t src, int src_stride, uint8_t buf, unsigned buf_size,
	285	int *qmat, int chroma)
	286	{
	287	ProresContext* ctx = avctx->priv_data;
	288	FDCTDSPContext *fdsp = &ctx->fdsp;
	289	DECLARE_ALIGNED(16, int16_t, blocks)[DEFAULT_SLICE_MB_WIDTH << 8], *block;
	290	int i, blocks_per_slice;
	291	PutBitContext pb;
	292
	293	block = blocks;
	294	for (i = 0; i < mb_count; i++) {
	295	fdct_get(fdsp, src, src_stride, block + (0 << 6));
	296	fdct_get(fdsp, src + 8 * src_stride, src_stride, block + ((2 - chroma) << 6));
	297	if (!chroma) {
	298	fdct_get(fdsp, src + 16, src_stride, block + (1 << 6));
	299	fdct_get(fdsp, src + 16 + 8 * src_stride, src_stride, block + (3 << 6));
	300	}
	301
	302	block += (256 >> chroma);
	303	src += (32 >> chroma);
	304	}
	305
	306	blocks_per_slice = mb_count << (2 - chroma);
	307	init_put_bits(&pb, buf, buf_size << 3);
	308
	309	encode_dc_coeffs(&pb, blocks, blocks_per_slice, qmat);
	310	encode_ac_coeffs(avctx, &pb, blocks, blocks_per_slice, qmat);
	311
	312	flush_put_bits(&pb);
	313	return put_bits_ptr(&pb) - pb.buf;
	314	}
	315
	316	static av_always_inline unsigned encode_slice_data(AVCodecContext *avctx,
	317	uint8_t dest_y, uint8_t dest_u, uint8_t *dest_v, int luma_stride,
	318	int chroma_stride, unsigned mb_count, uint8_t *buf, unsigned data_size,
	319	unsigned* y_data_size, unsigned* u_data_size, unsigned* v_data_size,
	320	int qp)
	321	{
	322	ProresContext* ctx = avctx->priv_data;
	323
	324	*y_data_size = encode_slice_plane(avctx, mb_count, dest_y, luma_stride,
	325	buf, data_size, ctx->qmat_luma[qp - 1], 0);
	326
	327	if (!(avctx->flags & CODEC_FLAG_GRAY)) {
	328	*u_data_size = encode_slice_plane(avctx, mb_count, dest_u,
	329	chroma_stride, buf + y_data_size, data_size - y_data_size,
	330	ctx->qmat_chroma[qp - 1], 1);
	331
	332	*v_data_size = encode_slice_plane(avctx, mb_count, dest_v,
	333	chroma_stride, buf + y_data_size + u_data_size,
	334	data_size - y_data_size - u_data_size,
	335	ctx->qmat_chroma[qp - 1], 1);
	336	}
	337
	338	return y_data_size + u_data_size + *v_data_size;
	339	}
	340
	/**
	 * Copy a dst_width x dst_height window of 16-bit samples starting at (x, y)
	 * from src into the tightly packed buffer dst, padding by edge replication.
	 *
	 * Where the window extends past the right edge of the source, the last
	 * copied sample of each row is repeated; where it extends past the bottom
	 * edge, the last written row is repeated.
	 *
	 * @param src        top-left sample of the source plane
	 * @param x          horizontal window origin, in samples
	 * @param y          vertical window origin, in rows
	 * @param stride     source row stride in bytes (halved to step in samples)
	 * @param width      source plane width, in samples
	 * @param height     source plane height, in rows
	 * @param dst        destination buffer of dst_width * dst_height samples
	 * @param dst_width  destination width, in samples
	 * @param dst_height destination height, in rows
	 *
	 * An origin outside the plane is clamped to the last column/row so that the
	 * nearest edge sample is replicated; nothing is written if the source or
	 * the destination has a zero dimension.
	 */
	static void subimage_with_fill(uint16_t *src, unsigned x, unsigned y,
	        unsigned stride, unsigned width, unsigned height, uint16_t *dst,
	        unsigned dst_width, unsigned dst_height)
	{
	    unsigned src_stride = stride >> 1;
	    unsigned box_width, box_height, i, j;
	    uint16_t last_pix, *last_line;

	    if (!width || !height || !dst_width || !dst_height)
	        return;

	    /* Keep the window origin inside the plane: an empty box would make the
	     * fill code below read dst[-1] and the row before dst. */
	    if (x >= width)
	        x = width - 1;
	    if (y >= height)
	        y = height - 1;

	    box_width  = width  - x < dst_width  ? width  - x : dst_width;
	    box_height = height - y < dst_height ? height - y : dst_height;

	    /* size_t arithmetic so the offset cannot wrap at 32 bits. */
	    src += (size_t)y * src_stride + x;
	    for (i = 0; i < box_height; i++) {
	        for (j = 0; j < box_width; j++)
	            dst[j] = src[j];
	        /* Pad to the right with the last valid sample of this row. */
	        last_pix = dst[j - 1];
	        for (; j < dst_width; j++)
	            dst[j] = last_pix;
	        src += src_stride;
	        dst += dst_width;
	    }

	    /* Pad downwards by repeating the last row that was written. */
	    last_line = dst - dst_width;
	    for (; i < dst_height; i++) {
	        for (j = 0; j < dst_width; j++)
	            dst[j] = last_line[j];
	        dst += dst_width;
	    }
	}
	370
	371	static int encode_slice(AVCodecContext avctx, const AVFrame pic, int mb_x,
	372	int mb_y, unsigned mb_count, uint8_t *buf, unsigned data_size,
	373	int unsafe, int *qp)
	374	{
	375	int luma_stride, chroma_stride;
	376	int hdr_size = 6, slice_size;
	377	uint8_t dest_y, dest_u, *dest_v;
	378	unsigned y_data_size = 0, u_data_size = 0, v_data_size = 0;
	379	ProresContext* ctx = avctx->priv_data;
	380	int tgt_bits = (mb_count * bitrate_table[avctx->profile]) >> 2;
	381	int low_bytes = (tgt_bits - (tgt_bits >> 3)) >> 3; // 12% bitrate fluctuation
	382	int high_bytes = (tgt_bits + (tgt_bits >> 3)) >> 3;
	383
	384	luma_stride = pic->linesize[0];
	385	chroma_stride = pic->linesize[1];
	386
	387	dest_y = pic->data[0] + (mb_y << 4) * luma_stride + (mb_x << 5);
	388	dest_u = pic->data[1] + (mb_y << 4) * chroma_stride + (mb_x << 4);
	389	dest_v = pic->data[2] + (mb_y << 4) * chroma_stride + (mb_x << 4);
	390
	391	if (unsafe) {
	392
	393	subimage_with_fill((uint16_t *) pic->data[0], mb_x << 4, mb_y << 4,
	394	luma_stride, avctx->width, avctx->height,
	395	(uint16_t *) ctx->fill_y, mb_count << 4, 16);
	396	subimage_with_fill((uint16_t *) pic->data[1], mb_x << 3, mb_y << 4,
	397	chroma_stride, avctx->width >> 1, avctx->height,
	398	(uint16_t *) ctx->fill_u, mb_count << 3, 16);
	399	subimage_with_fill((uint16_t *) pic->data[2], mb_x << 3, mb_y << 4,
	400	chroma_stride, avctx->width >> 1, avctx->height,
	401	(uint16_t *) ctx->fill_v, mb_count << 3, 16);
	402
	403	encode_slice_data(avctx, ctx->fill_y, ctx->fill_u, ctx->fill_v,
	404	mb_count << 5, mb_count << 4, mb_count, buf + hdr_size,
	405	data_size - hdr_size, &y_data_size, &u_data_size, &v_data_size,
	406	*qp);
	407	} else {
	408	slice_size = encode_slice_data(avctx, dest_y, dest_u, dest_v,
	409	luma_stride, chroma_stride, mb_count, buf + hdr_size,
	410	data_size - hdr_size, &y_data_size, &u_data_size, &v_data_size,
	411	*qp);
	412
	413	if (slice_size > high_bytes && *qp < qp_end_table[avctx->profile]) {
	414	do {
	415	*qp += 1;
	416	slice_size = encode_slice_data(avctx, dest_y, dest_u, dest_v,
	417	luma_stride, chroma_stride, mb_count, buf + hdr_size,
	418	data_size - hdr_size, &y_data_size, &u_data_size,
	419	&v_data_size, *qp);
	420	} while (slice_size > high_bytes && *qp < qp_end_table[avctx->profile]);
	421	} else if (slice_size < low_bytes && *qp
	422	> qp_start_table[avctx->profile]) {
	423	do {
	424	*qp -= 1;
	425	slice_size = encode_slice_data(avctx, dest_y, dest_u, dest_v,
	426	luma_stride, chroma_stride, mb_count, buf + hdr_size,
	427	data_size - hdr_size, &y_data_size, &u_data_size,
	428	&v_data_size, *qp);
	429	} while (slice_size < low_bytes && *qp > qp_start_table[avctx->profile]);
	430	}
	431	}
	432
	433	buf[0] = hdr_size << 3;
	434	buf[1] = *qp;
	435	AV_WB16(buf + 2, y_data_size);
	436	AV_WB16(buf + 4, u_data_size);
	437
	438	return hdr_size + y_data_size + u_data_size + v_data_size;
	439	}
	440
	441	static int prores_encode_picture(AVCodecContext avctx, const AVFrame pic,
	442	uint8_t *buf, const int buf_size)
	443	{
	444	int mb_width = (avctx->width + 15) >> 4;
	445	int mb_height = (avctx->height + 15) >> 4;
	446	int hdr_size, sl_size, i;
	447	int mb_y, sl_data_size, qp;
	448	int unsafe_bot, unsafe_right;
	449	uint8_t sl_data, sl_data_sizes;
	450	int slice_per_line = 0, rem = mb_width;
	451
	452	for (i = av_log2(DEFAULT_SLICE_MB_WIDTH); i >= 0; --i) {
	453	slice_per_line += rem >> i;
	454	rem &= (1 << i) - 1;
	455	}
	456
	457	qp = qp_start_table[avctx->profile];
	458	hdr_size = 8; sl_data_size = buf_size - hdr_size;
	459	sl_data_sizes = buf + hdr_size;
	460	sl_data = sl_data_sizes + (slice_per_line * mb_height * 2);
	461	for (mb_y = 0; mb_y < mb_height; mb_y++) {
	462	int mb_x = 0;
	463	int slice_mb_count = DEFAULT_SLICE_MB_WIDTH;
	464	while (mb_x < mb_width) {
	465	while (mb_width - mb_x < slice_mb_count)
	466	slice_mb_count >>= 1;
	467
	468	unsafe_bot = (avctx->height & 0xf) && (mb_y == mb_height - 1);
	469	unsafe_right = (avctx->width & 0xf) && (mb_x + slice_mb_count == mb_width);
	470
	471	sl_size = encode_slice(avctx, pic, mb_x, mb_y, slice_mb_count,
	472	sl_data, sl_data_size, unsafe_bot \|\| unsafe_right, &qp);
	473
	474	bytestream_put_be16(&sl_data_sizes, sl_size);
	475	sl_data += sl_size;
	476	sl_data_size -= sl_size;
	477	mb_x += slice_mb_count;
	478	}
	479	}
	480
	481	buf[0] = hdr_size << 3;
	482	AV_WB32(buf + 1, sl_data - buf);
	483	AV_WB16(buf + 5, slice_per_line * mb_height);
	484	buf[7] = av_log2(DEFAULT_SLICE_MB_WIDTH) << 4;
	485
	486	return sl_data - buf;
	487	}
	488
	489	static int prores_encode_frame(AVCodecContext avctx, AVPacket pkt,
	490	const AVFrame pict, int got_packet)
	491	{
	492	int header_size = 148;
	493	uint8_t *buf;
	494	int pic_size, ret;
	495	int frame_size = FFALIGN(avctx->width, 16) * FFALIGN(avctx->height, 16)*16 + 500 + FF_MIN_BUFFER_SIZE; //FIXME choose tighter limit
	496
	497
	498	if ((ret = ff_alloc_packet2(avctx, pkt, frame_size + FF_MIN_BUFFER_SIZE)) < 0)
	499	return ret;
	500
	501	buf = pkt->data;
	502	pic_size = prores_encode_picture(avctx, pict, buf + header_size + 8,
	503	pkt->size - header_size - 8);
	504
	505	bytestream_put_be32(&buf, pic_size + 8 + header_size);
	506	bytestream_put_buffer(&buf, "icpf", 4);
	507
	508	bytestream_put_be16(&buf, header_size);
	509	bytestream_put_be16(&buf, 0);
	510	bytestream_put_buffer(&buf, "fmpg", 4);
	511	bytestream_put_be16(&buf, avctx->width);
	512	bytestream_put_be16(&buf, avctx->height);
	513	*buf++ = 0x83; // {10}(422){00}{00}(frame){11}
	514	*buf++ = 0;
	515	*buf++ = 2;
	516	*buf++ = 2;
	517	*buf++ = 6;
	518	*buf++ = 32;
	519	*buf++ = 0;
	520	*buf++ = 3;
	521
	522	bytestream_put_buffer(&buf, QMAT_LUMA[avctx->profile], 64);
	523	bytestream_put_buffer(&buf, QMAT_CHROMA[avctx->profile], 64);
	524
	525	pkt->flags \|= AV_PKT_FLAG_KEY;
	526	pkt->size = pic_size + 8 + header_size;
	527	*got_packet = 1;
	528
	529	return 0;
	530	}
	531
	/* Store each of the 64 entries of src, multiplied by scale, into dst. */
	static void scale_mat(const uint8_t* src, int* dst, int scale)
	{
	    const uint8_t *const end = src + 64;

	    while (src < end)
	        *dst++ = *src++ * scale;
	}
	538
	539	static av_cold int prores_encode_init(AVCodecContext *avctx)
	540	{
	541	int i;
	542	ProresContext* ctx = avctx->priv_data;
	543
	544	if (avctx->pix_fmt != AV_PIX_FMT_YUV422P10) {
	545	av_log(avctx, AV_LOG_ERROR, "need YUV422P10\n");
	546	return -1;
	547	}
	548	avctx->bits_per_raw_sample = 10;
	549
	550	if (avctx->width & 0x1) {
	551	av_log(avctx, AV_LOG_ERROR,
	552	"frame width needs to be multiple of 2\n");
	553	return -1;
	554	}
	555
	556	if (avctx->width > 65534 \|\| avctx->height > 65535) {
	557	av_log(avctx, AV_LOG_ERROR,
	558	"The maximum dimensions are 65534x65535\n");
	559	return AVERROR(EINVAL);
	560	}
	561
	562	if ((avctx->height & 0xf) \|\| (avctx->width & 0xf)) {
	563	ctx->fill_y = av_malloc(4 * (DEFAULT_SLICE_MB_WIDTH << 8));
	564	if (!ctx->fill_y)
	565	return AVERROR(ENOMEM);
	566	ctx->fill_u = ctx->fill_y + (DEFAULT_SLICE_MB_WIDTH << 9);
	567	ctx->fill_v = ctx->fill_u + (DEFAULT_SLICE_MB_WIDTH << 8);
	568	}
	569
	570	if (avctx->profile == FF_PROFILE_UNKNOWN) {
	571	avctx->profile = FF_PROFILE_PRORES_STANDARD;
	572	av_log(avctx, AV_LOG_INFO,
	573	"encoding with ProRes standard (apcn) profile\n");
	574
	575	} else if (avctx->profile < FF_PROFILE_PRORES_PROXY
	576	\|\| avctx->profile > FF_PROFILE_PRORES_HQ) {
	577	av_log(
	578	avctx,
	579	AV_LOG_ERROR,
	580	"unknown profile %d, use [0 - apco, 1 - apcs, 2 - apcn (default), 3 - apch]\n",
	581	avctx->profile);
	582	return -1;
	583	}
	584
	585	ff_fdctdsp_init(&ctx->fdsp, avctx);
	586
	587	avctx->codec_tag = AV_RL32((const uint8_t*)profiles[avctx->profile].name);
	588
	589	for (i = 1; i <= 16; i++) {
	590	scale_mat(QMAT_LUMA[avctx->profile] , ctx->qmat_luma[i - 1] , i);
	591	scale_mat(QMAT_CHROMA[avctx->profile], ctx->qmat_chroma[i - 1], i);
	592	}
	593
	594	avctx->coded_frame = av_frame_alloc();
	595	avctx->coded_frame->key_frame = 1;
	596	avctx->coded_frame->pict_type = AV_PICTURE_TYPE_I;
	597
	598	return 0;
	599	}
	600
	601	static av_cold int prores_encode_close(AVCodecContext *avctx)
	602	{
	603	ProresContext* ctx = avctx->priv_data;
	604	av_freep(&avctx->coded_frame);
	605	av_freep(&ctx->fill_y);
	606
	607	return 0;
	608	}
	609
	610	AVCodec ff_prores_aw_encoder = {
	611	.name = "prores_aw",
	612	.long_name = NULL_IF_CONFIG_SMALL("Apple ProRes"),
	613	.type = AVMEDIA_TYPE_VIDEO,
	614	.id = AV_CODEC_ID_PRORES,
	615	.priv_data_size = sizeof(ProresContext),
	616	.init = prores_encode_init,
	617	.close = prores_encode_close,
	618	.encode2 = prores_encode_frame,
	619	.pix_fmts = (const enum AVPixelFormat[]){AV_PIX_FMT_YUV422P10, AV_PIX_FMT_NONE},
	620	.capabilities = CODEC_CAP_FRAME_THREADS \| CODEC_CAP_INTRA_ONLY,
	621	.profiles = profiles
	622	};
	623
	624	AVCodec ff_prores_encoder = {
	625	.name = "prores",
	626	.long_name = NULL_IF_CONFIG_SMALL("Apple ProRes"),
	627	.type = AVMEDIA_TYPE_VIDEO,
	628	.id = AV_CODEC_ID_PRORES,
	629	.priv_data_size = sizeof(ProresContext),
	630	.init = prores_encode_init,
	631	.close = prores_encode_close,
	632	.encode2 = prores_encode_frame,
	633	.pix_fmts = (const enum AVPixelFormat[]){AV_PIX_FMT_YUV422P10, AV_PIX_FMT_NONE},
	634	.capabilities = CODEC_CAP_FRAME_THREADS \| CODEC_CAP_INTRA_ONLY,
	635	.profiles = profiles
	636	};