libavcodec/magicyuv.c
77f9c4b7
 /*
  * MagicYUV decoder
  * Copyright (c) 2016 Paul B Mahol
  *
  * This file is part of FFmpeg.
  *
  * FFmpeg is free software; you can redistribute it and/or
  * modify it under the terms of the GNU Lesser General Public
  * License as published by the Free Software Foundation; either
  * version 2.1 of the License, or (at your option) any later version.
  *
  * FFmpeg is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Lesser General Public License for more details.
  *
  * You should have received a copy of the GNU Lesser General Public
  * License along with FFmpeg; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  */
 
 #include <stdlib.h>
 #include <string.h>
 
c3e2e842
 #include "libavutil/pixdesc.h"
77f9c4b7
 #include "libavutil/qsort.h"
d78fd2fa
 
77f9c4b7
 #include "avcodec.h"
 #include "bytestream.h"
 #include "get_bits.h"
 #include "huffyuvdsp.h"
 #include "internal.h"
6d09d6ed
 #include "lossless_videodsp.h"
77f9c4b7
 #include "thread.h"
 
 /* Location of one slice's bitstream inside the packet. */
 typedef struct Slice {
     uint32_t start; // byte offset of the slice data from the start of the packet
     uint32_t size;  // length of the slice data in bytes
 } Slice;
 
 /* Spatial prediction modes; the value is read from the second byte of every
  * slice. */
 typedef enum Prediction {
     LEFT = 1, // samples are reconstructed with the add_left_pred DSP routines
     GRADIENT, // left + top - top-left
     MEDIAN,   // median of left, top and left + top - top-left
 } Prediction;
 
 /* One symbol of a Huffman table, used while sorting symbols by code length. */
 typedef struct HuffEntry {
6d09d6ed
     uint16_t sym;  // symbol value
77f9c4b7
     uint8_t  len;  // code length in bits
     uint32_t code; // not referenced by the table builders in this file
 } HuffEntry;
 
d78fd2fa
 /* Decoder state stored in AVCodecContext.priv_data. The header-derived
  * fields are rewritten by magy_decode_frame() for every packet. */
 typedef struct MagicYUVContext {
     AVFrame          *p;              // frame being decoded; read by the slice workers
6d09d6ed
     int               max;            // number of sample values, 1 << bps
0281d5ec
     int               bps;            // bits per sample: 8, 10 or 12
d78fd2fa
     int               slice_height;   // slice height in full-resolution rows, from the header
     int               nb_slices;      // slices per plane: ceil(coded_height / slice_height)
     int               planes;         // number of encoded planes in bitstream
     int               decorrelate;    // set for GBR(A) formats: slice decoders add plane 1 into planes 0 and 2
12461636
     int               color_matrix;   // video color matrix
     int               flags;          // header flags byte: 2 = interlaced, 4 = JPEG (full) colour range
d78fd2fa
     int               interlaced;     // video is interlaced
     uint8_t          *buf;            // pointer to AVPacket->data
     int               hshift[4];      // per-plane horizontal right shift; only entries 1 and 2 are written
     int               vshift[4];      // per-plane vertical right shift; only entries 1 and 2 are written
     Slice            *slices[4];      // slice bitstream positions for each plane
     unsigned int      slices_size[4]; // allocated byte size of each slices[] array (av_fast_malloc bookkeeping)
0281d5ec
     uint8_t           len[4][4096];   // table of code lengths for each plane
d78fd2fa
     VLC               vlc[4];         // VLC for each plane
6d09d6ed
     // Table builder matching the current bit depth (huff_build, huff_build10 or huff_build12).
     int (*huff_build)(VLC *vlc, uint8_t *len);
     // Slice worker matching the current bit depth; j is the slice index.
     int (*magy_decode_slice)(AVCodecContext *avctx, void *tdata,
                              int j, int threadnr);
     LLVidDSPContext   llviddsp;       // lossless video DSP routines, set up in magy_decode_init()
d78fd2fa
 } MagicYUVContext;
 
 static int huff_cmp_len(const void *a, const void *b)
77f9c4b7
 {
     const HuffEntry *aa = a, *bb = b;
     return (aa->len - bb->len) * 256 + aa->sym - bb->sym;
 }
 
6d09d6ed
 /**
  * Sort comparator for the 10-bit tables: orders HuffEntry items by code
  * length first and by symbol value second.
  *
  * The length difference is scaled by the symbol count (1024) so that it
  * always outweighs the symbol difference.
  */
 static int huff_cmp_len10(const void *a, const void *b)
 {
     const HuffEntry *lhs = a;
     const HuffEntry *rhs = b;
     const int len_delta  = lhs->len - rhs->len;
     const int sym_delta  = lhs->sym - rhs->sym;
 
     return len_delta * 1024 + sym_delta;
 }
 
0281d5ec
 /**
  * Sort comparator for the 12-bit tables: orders HuffEntry items by code
  * length first and by symbol value second.
  *
  * The length difference is scaled by the symbol count (4096) so that it
  * always outweighs the symbol difference.
  */
 static int huff_cmp_len12(const void *a, const void *b)
 {
     const HuffEntry *lhs = a;
     const HuffEntry *rhs = b;
     const int len_delta  = lhs->len - rhs->len;
     const int sym_delta  = lhs->sym - rhs->sym;
 
     return len_delta * 4096 + sym_delta;
 }
 
6d09d6ed
 /**
  * Build the VLC of one 10-bit plane from its 1024 code lengths.
  *
  * @param vlc VLC to initialise; its previous table is freed before the new
  *            one is built
  * @param len code length of each of the 1024 symbols; every length must be
  *            in the range 1..32
  * @return the result of ff_init_vlc_sparse(), or AVERROR_INVALIDDATA when a
  *         code length is out of range
  */
 static int huff_build10(VLC *vlc, uint8_t *len)
 {
     HuffEntry entries[1024];
     uint32_t codes[1024];
     uint8_t bits[1024];
     uint16_t syms[1024];
     uint32_t next_code = 1;
     int n;
 
     /* Table position n carries symbol 1023 - n. */
     for (n = 0; n < 1024; n++) {
         const uint8_t length = len[n];
 
         if (length == 0 || length > 32)
             return AVERROR_INVALIDDATA;
 
         entries[n].sym = 1023 - n;
         entries[n].len = length;
     }
     AV_QSORT(entries, 1024, HuffEntry, huff_cmp_len10);
 
     /* Walk the sorted entries from last to first; the 32-bit accumulator
      * advances by 2^(32 - length) after every entry. */
     n = 1024;
     while (n-- > 0) {
         const int length = entries[n].len;
 
         codes[n]   = next_code >> (32 - length);
         bits[n]    = length;
         syms[n]    = entries[n].sym;
         next_code += 0x80000000u >> (length - 1);
     }
 
     ff_free_vlc(vlc);
     /* Lookup width: length of the last sorted entry, capped at 12 bits. */
     return ff_init_vlc_sparse(vlc, FFMIN(entries[1023].len, 12), 1024,
                               bits,  sizeof(*bits),  sizeof(*bits),
                               codes, sizeof(*codes), sizeof(*codes),
                               syms,  sizeof(*syms),  sizeof(*syms), 0);
 }
 
0281d5ec
 /**
  * Build the VLC of one 12-bit plane from its 4096 code lengths.
  *
  * @param vlc VLC to initialise; its previous table is freed before the new
  *            one is built
  * @param len code length of each of the 4096 symbols; every length must be
  *            in the range 1..32
  * @return the result of ff_init_vlc_sparse(), or AVERROR_INVALIDDATA when a
  *         code length is out of range
  */
 static int huff_build12(VLC *vlc, uint8_t *len)
 {
     HuffEntry entries[4096];
     uint32_t codes[4096];
     uint8_t bits[4096];
     uint16_t syms[4096];
     uint32_t next_code = 1;
     int n;
 
     /* Table position n carries symbol 4095 - n. */
     for (n = 0; n < 4096; n++) {
         const uint8_t length = len[n];
 
         if (length == 0 || length > 32)
             return AVERROR_INVALIDDATA;
 
         entries[n].sym = 4095 - n;
         entries[n].len = length;
     }
     AV_QSORT(entries, 4096, HuffEntry, huff_cmp_len12);
 
     /* Walk the sorted entries from last to first; the 32-bit accumulator
      * advances by 2^(32 - length) after every entry. */
     n = 4096;
     while (n-- > 0) {
         const int length = entries[n].len;
 
         codes[n]   = next_code >> (32 - length);
         bits[n]    = length;
         syms[n]    = entries[n].sym;
         next_code += 0x80000000u >> (length - 1);
     }
 
     ff_free_vlc(vlc);
     /* Lookup width: length of the last sorted entry, capped at 14 bits. */
     return ff_init_vlc_sparse(vlc, FFMIN(entries[4095].len, 14), 4096,
                               bits,  sizeof(*bits),  sizeof(*bits),
                               codes, sizeof(*codes), sizeof(*codes),
                               syms,  sizeof(*syms),  sizeof(*syms), 0);
 }
 
d78fd2fa
 /**
  * Build the VLC of one 8-bit plane from its 256 code lengths.
  *
  * @param vlc VLC to initialise; its previous table is freed before the new
  *            one is built
  * @param len code length of each of the 256 symbols; every length must be
  *            in the range 1..32
  * @return the result of ff_init_vlc_sparse(), or AVERROR_INVALIDDATA when a
  *         code length is out of range
  */
 static int huff_build(VLC *vlc, uint8_t *len)
 {
     HuffEntry entries[256];
     uint32_t codes[256];
     uint8_t bits[256];
     uint8_t syms[256];
     uint32_t next_code = 1;
     int n;
 
     /* Table position n carries symbol 255 - n. */
     for (n = 0; n < 256; n++) {
         const uint8_t length = len[n];
 
         if (length == 0 || length > 32)
             return AVERROR_INVALIDDATA;
 
         entries[n].sym = 255 - n;
         entries[n].len = length;
     }
     AV_QSORT(entries, 256, HuffEntry, huff_cmp_len);
 
     /* Walk the sorted entries from last to first; the 32-bit accumulator
      * advances by 2^(32 - length) after every entry. */
     n = 256;
     while (n-- > 0) {
         const int length = entries[n].len;
 
         codes[n]   = next_code >> (32 - length);
         bits[n]    = length;
         syms[n]    = entries[n].sym;
         next_code += 0x80000000u >> (length - 1);
     }
 
     ff_free_vlc(vlc);
     /* Lookup width: length of the last sorted entry, capped at 12 bits. */
     return ff_init_vlc_sparse(vlc, FFMIN(entries[255].len, 12), 256,
                               bits,  sizeof(*bits),  sizeof(*bits),
                               codes, sizeof(*codes), sizeof(*codes),
                               syms,  sizeof(*syms),  sizeof(*syms), 0);
 }
 
0281d5ec
 /**
  * Undo median prediction on one row of 16-bit samples.
  *
  * Each output sample is the median of (left, top, left + top - top-left)
  * plus the residual, masked with max.
  *
  * @param dst      reconstructed row (may be the same buffer as diff)
  * @param src1     row used as the "top" neighbours
  * @param diff     residuals for this row
  * @param w        number of samples in the row
  * @param left     in: left neighbour of the first sample; out: last
  *                 reconstructed sample
  * @param left_top in: top-left neighbour of the first sample; out: last
  *                 sample read from src1
  * @param max      bit mask applied to every reconstructed sample
  */
 static void magicyuv_median_pred16(uint16_t *dst, const uint16_t *src1,
                                    const uint16_t *diff, intptr_t w,
                                    int *left, int *left_top, int max)
 {
     uint16_t cur  = *left;
     uint16_t diag = *left_top;
     int x;
 
     for (x = 0; x < w; x++) {
         const uint16_t above = src1[x];
 
         cur    = mid_pred(cur, above, (cur + above - diag)) + diff[x];
         cur   &= max;
         diag   = above;
         dst[x] = cur;
     }
 
     *left     = cur;
     *left_top = diag;
 }
 
 /**
  * Decode slice j of every plane for the formats stored as 16-bit samples
  * (bps > 8), then undo the per-slice prediction and, for the GBR formats,
  * the plane decorrelation.
  *
  * Matches the signature expected by AVCodecContext.execute2().
  *
  * @param avctx    codec context; priv_data is the MagicYUVContext
  * @param tdata    unused
  * @param j        slice index
  * @param threadnr unused
  * @return 0 on success, a negative AVERROR code when a slice is truncated
  *         or contains an invalid code
  */
 static int magy_decode_slice10(AVCodecContext *avctx, void *tdata,
                                int j, int threadnr)
 {
     MagicYUVContext *s = avctx->priv_data;
     int interlaced = s->interlaced;
     const int bps = s->bps;
     const int max = s->max - 1;   /* largest sample value, also used as bit mask */
     AVFrame *p = s->p;
     int i, k, x;
     GetBitContext gb;
     uint16_t *dst;
 
     for (i = 0; i < s->planes; i++) {
         int left, lefttop, top;
         /* Rows in this slice (the last slice may be shorter), plane width
          * and nominal slice height, all scaled by the plane's subsampling. */
         int height = AV_CEIL_RSHIFT(FFMIN(s->slice_height, avctx->coded_height - j * s->slice_height), s->vshift[i]);
         int width = AV_CEIL_RSHIFT(avctx->coded_width, s->hshift[i]);
         int sheight = AV_CEIL_RSHIFT(s->slice_height, s->vshift[i]);
         /* Strides in samples. fake_stride reaches the previous row of the
          * same field when the video is interlaced. */
         ptrdiff_t fake_stride = (p->linesize[i] / 2) * (1 + interlaced);
         ptrdiff_t stride = p->linesize[i] / 2;
         int flags, pred;
         int ret = init_get_bits8(&gb, s->buf + s->slices[i][j].start,
                                  s->slices[i][j].size);
 
         if (ret < 0)
             return ret;
 
         /* Two-byte slice header: flags, then the prediction mode. */
         flags = get_bits(&gb, 8);
         pred  = get_bits(&gb, 8);
 
         dst = (uint16_t *)p->data[i] + j * sheight * stride;
         if (flags & 1) {
             /* Raw slice: bps bits per sample. The required size is computed
              * in 64 bits because bps * width * height can exceed INT_MAX
              * for large frames at 10 or 12 bits. */
             if (get_bits_left(&gb) < (int64_t)bps * width * height)
                 return AVERROR_INVALIDDATA;
             for (k = 0; k < height; k++) {
                 for (x = 0; x < width; x++)
                     dst[x] = get_bits(&gb, bps);
 
                 dst += stride;
             }
         } else {
             /* Huffman-coded slice. */
             for (k = 0; k < height; k++) {
                 for (x = 0; x < width; x++) {
                     int pix;
                     if (get_bits_left(&gb) <= 0)
                         return AVERROR_INVALIDDATA;
 
                     pix = get_vlc2(&gb, s->vlc[i].table, s->vlc[i].bits, 3);
                     if (pix < 0)
                         return AVERROR_INVALIDDATA;
 
                     /* Symbols are stored inverted (see huff_build*). */
                     dst[x] = max - pix;
                 }
                 dst += stride;
             }
         }
 
         /* Undo the prediction in place. In every mode the first row (the
          * first two rows when interlaced) uses left prediction only. */
         switch (pred) {
         case LEFT:
             dst = (uint16_t *)p->data[i] + j * sheight * stride;
             s->llviddsp.add_left_pred_int16(dst, dst, max, width, 0);
             dst += stride;
             if (interlaced) {
                 s->llviddsp.add_left_pred_int16(dst, dst, max, width, 0);
                 dst += stride;
             }
             for (k = 1 + interlaced; k < height; k++) {
                 /* Later rows are seeded with the first sample of the row above. */
                 s->llviddsp.add_left_pred_int16(dst, dst, max, width, dst[-fake_stride]);
                 dst += stride;
             }
             break;
         case GRADIENT:
             dst = (uint16_t *)p->data[i] + j * sheight * stride;
             s->llviddsp.add_left_pred_int16(dst, dst, max, width, 0);
             dst += stride;
             if (interlaced) {
                 s->llviddsp.add_left_pred_int16(dst, dst, max, width, 0);
                 dst += stride;
             }
             for (k = 1 + interlaced; k < height; k++) {
                 /* First sample has no left neighbour: predict from top only. */
                 top = dst[-fake_stride];
                 left = top + dst[0];
                 dst[0] = left & max;
                 for (x = 1; x < width; x++) {
                     top = dst[x - fake_stride];
                     lefttop = dst[x - (fake_stride + 1)];
                     left += top - lefttop + dst[x];
                     dst[x] = left & max;
                 }
                 dst += stride;
             }
             break;
         case MEDIAN:
             dst = (uint16_t *)p->data[i] + j * sheight * stride;
             s->llviddsp.add_left_pred_int16(dst, dst, max, width, 0);
             dst += stride;
             if (interlaced) {
                 s->llviddsp.add_left_pred_int16(dst, dst, max, width, 0);
                 dst += stride;
             }
             lefttop = left = dst[0];
             for (k = 1 + interlaced; k < height; k++) {
                 magicyuv_median_pred16(dst, dst - fake_stride, dst, width, &left, &lefttop, max);
                 /* Re-seed both neighbours from the row just reconstructed. */
                 lefttop = left = dst[0];
                 dst += stride;
             }
             break;
         default:
             /* Unknown mode: the samples are left as decoded. */
             avpriv_request_sample(avctx, "Unknown prediction: %d", pred);
         }
     }
 
     if (s->decorrelate) {
         /* Add plane 1 into planes 0 and 2 for every row of this slice. */
         int height = FFMIN(s->slice_height, avctx->coded_height - j * s->slice_height);
         int width = avctx->coded_width;
         uint16_t *r = (uint16_t *)p->data[0] + j * s->slice_height * p->linesize[0] / 2;
         uint16_t *g = (uint16_t *)p->data[1] + j * s->slice_height * p->linesize[1] / 2;
         uint16_t *b = (uint16_t *)p->data[2] + j * s->slice_height * p->linesize[2] / 2;
 
         for (i = 0; i < height; i++) {
             for (k = 0; k < width; k++) {
                 b[k] = (b[k] + g[k]) & max;
                 r[k] = (r[k] + g[k]) & max;
             }
             /* Advance every pointer by the stride of the plane it points
              * into (r -> plane 0, g -> plane 1, b -> plane 2). */
             r += p->linesize[0] / 2;
             g += p->linesize[1] / 2;
             b += p->linesize[2] / 2;
         }
     }
 
     return 0;
 }
 
d78fd2fa
 /**
  * Decode slice j of every plane for the 8-bit formats, then undo the
  * per-slice prediction and, when s->decorrelate is set, the plane
  * decorrelation.
  *
  * Matches the signature expected by AVCodecContext.execute2().
  *
  * @param avctx    codec context; priv_data is the MagicYUVContext
  * @param tdata    unused
  * @param j        slice index
  * @param threadnr unused
  * @return 0 on success, a negative AVERROR code when a slice is truncated
  *         or contains an invalid code
  */
 static int magy_decode_slice(AVCodecContext *avctx, void *tdata,
                              int j, int threadnr)
77f9c4b7
 {
     MagicYUVContext *s = avctx->priv_data;
     int interlaced = s->interlaced;
     AVFrame *p = s->p;
c76cf303
     int i, k, x, min_width;
d78fd2fa
     GetBitContext gb;
77f9c4b7
     uint8_t *dst;
 
     for (i = 0; i < s->planes; i++) {
d78fd2fa
         int left, lefttop, top;
77f9c4b7
         /* Rows in this slice (the last slice may be shorter), plane width
          * and nominal slice height, all scaled by the plane's subsampling. */
         int height = AV_CEIL_RSHIFT(FFMIN(s->slice_height, avctx->coded_height - j * s->slice_height), s->vshift[i]);
         int width = AV_CEIL_RSHIFT(avctx->coded_width, s->hshift[i]);
         int sheight = AV_CEIL_RSHIFT(s->slice_height, s->vshift[i]);
d78fd2fa
         /* fake_stride reaches the previous row of the same field when the
          * video is interlaced. */
         ptrdiff_t fake_stride = p->linesize[i] * (1 + interlaced);
         ptrdiff_t stride = p->linesize[i];
a3c2a9c7
         int flags, pred;
d78fd2fa
         int ret = init_get_bits8(&gb, s->buf + s->slices[i][j].start,
                                  s->slices[i][j].size);
77f9c4b7
 
d78fd2fa
         if (ret < 0)
77f9c4b7
             return ret;
 
d78fd2fa
         /* Two-byte slice header: flags, then the prediction mode. */
         flags = get_bits(&gb, 8);
         pred  = get_bits(&gb, 8);
a3c2a9c7
 
77f9c4b7
         dst = p->data[i] + j * sheight * stride;
a3c2a9c7
         if (flags & 1) {
7719b8cc
             /* Raw slice: 8 bits per sample; reject it if it is too short. */
             if (get_bits_left(&gb) < 8* width * height)
                 return AVERROR_INVALIDDATA;
a3c2a9c7
             for (k = 0; k < height; k++) {
d78fd2fa
                 for (x = 0; x < width; x++)
                     dst[x] = get_bits(&gb, 8);
 
a3c2a9c7
                 dst += stride;
             }
         } else {
             /* Huffman-coded slice. */
             for (k = 0; k < height; k++) {
                 for (x = 0; x < width; x++) {
                     int pix;
d78fd2fa
                     if (get_bits_left(&gb) <= 0)
a3c2a9c7
                         return AVERROR_INVALIDDATA;
d78fd2fa
 
                     pix = get_vlc2(&gb, s->vlc[i].table, s->vlc[i].bits, 3);
                     if (pix < 0)
a3c2a9c7
                         return AVERROR_INVALIDDATA;
d78fd2fa
 
a3c2a9c7
                     /* Symbols are stored inverted (see huff_build). */
                     dst[x] = 255 - pix;
77f9c4b7
                 }
a3c2a9c7
                 dst += stride;
77f9c4b7
             }
         }
 
d78fd2fa
         /* Undo the prediction in place. In every mode the first row (the
          * first two rows when interlaced) uses left prediction only. */
         switch (pred) {
         case LEFT:
77f9c4b7
             dst = p->data[i] + j * sheight * stride;
5ac1dd8e
             s->llviddsp.add_left_pred(dst, dst, width, 0);
77f9c4b7
             dst += stride;
             if (interlaced) {
5ac1dd8e
                 s->llviddsp.add_left_pred(dst, dst, width, 0);
77f9c4b7
                 dst += stride;
             }
             for (k = 1 + interlaced; k < height; k++) {
5ac1dd8e
                 /* Later rows are seeded with the first sample of the row above. */
                 s->llviddsp.add_left_pred(dst, dst, width, dst[-fake_stride]);
77f9c4b7
                 dst += stride;
             }
d78fd2fa
             break;
         case GRADIENT:
77f9c4b7
             dst = p->data[i] + j * sheight * stride;
5ac1dd8e
             s->llviddsp.add_left_pred(dst, dst, width, 0);
77f9c4b7
             dst += stride;
             if (interlaced) {
5ac1dd8e
                 s->llviddsp.add_left_pred(dst, dst, width, 0);
77f9c4b7
                 dst += stride;
             }
c76cf303
             /* The first (up to) 32 samples of a row are handled in C, the
              * remainder is handed to the DSP routine. */
             min_width = FFMIN(width, 32);
77f9c4b7
             for (k = 1 + interlaced; k < height; k++) {
                 /* First sample has no left neighbour: predict from top only. */
                 top = dst[-fake_stride];
                 left = top + dst[0];
                 dst[0] = left;
c76cf303
                 for (x = 1; x < min_width; x++) { /* dsp need aligned 32 */
77f9c4b7
                     top = dst[x - fake_stride];
                     lefttop = dst[x - (fake_stride + 1)];
                     left += top - lefttop + dst[x];
                     dst[x] = left;
                 }
c76cf303
                 if (width > 32)
                     s->llviddsp.add_gradient_pred(dst + 32, fake_stride, width - 32);
77f9c4b7
                 dst += stride;
             }
d78fd2fa
             break;
         case MEDIAN:
77f9c4b7
             dst = p->data[i] + j * sheight * stride;
5ac1dd8e
             s->llviddsp.add_left_pred(dst, dst, width, 0);
77f9c4b7
             dst += stride;
             if (interlaced) {
5ac1dd8e
                 s->llviddsp.add_left_pred(dst, dst, width, 0);
77f9c4b7
                 dst += stride;
             }
7da25488
             lefttop = left = dst[0];
77f9c4b7
             for (k = 1 + interlaced; k < height; k++) {
5ac1dd8e
                 s->llviddsp.add_median_pred(dst, dst - fake_stride,
d78fd2fa
                                              dst, width, &left, &lefttop);
77f9c4b7
                 /* Re-seed both neighbours from the row just processed. */
                 lefttop = left = dst[0];
                 dst += stride;
             }
d78fd2fa
             break;
         default:
             /* Unknown mode: the samples are left as decoded. */
             avpriv_request_sample(avctx, "Unknown prediction: %d", pred);
77f9c4b7
         }
     }
 
     if (s->decorrelate) {
         /* Combine plane 1 into planes 0 and 2 for every row of this slice
          * (add_bytes(dst, src, w) presumably adds src into dst; confirm
          * against lossless_videodsp). */
         int height = FFMIN(s->slice_height, avctx->coded_height - j * s->slice_height);
         int width = avctx->coded_width;
         uint8_t *b = p->data[0] + j * s->slice_height * p->linesize[0];
         uint8_t *g = p->data[1] + j * s->slice_height * p->linesize[1];
         uint8_t *r = p->data[2] + j * s->slice_height * p->linesize[2];
 
         for (i = 0; i < height; i++) {
5ac1dd8e
             s->llviddsp.add_bytes(b, g, width);
             s->llviddsp.add_bytes(r, g, width);
77f9c4b7
             b += p->linesize[0];
             g += p->linesize[1];
             r += p->linesize[2];
         }
     }
 
     return 0;
 }
 
6d09d6ed
 /**
  * Read the run-length coded code-length tables of all planes and build one
  * VLC per plane.
  *
  * Every record is a 1-bit flag, a 7-bit code length and, when the flag is
  * set, an 8-bit value; the run length is that value plus one (one when the
  * flag is clear). A plane's table is complete once exactly max lengths have
  * been read.
  *
  * @param avctx codec context; priv_data is the MagicYUVContext
  * @param gbit  bit reader positioned on the first table record
  * @param max   number of symbols per plane
  * @return 0 on success, AVERROR_INVALIDDATA when a run overshoots the
  *         table, a VLC cannot be built, or the data ends before all planes
  *         have a table
  */
 static int build_huffman(AVCodecContext *avctx, GetBitContext *gbit, int max)
 {
     MagicYUVContext *s = avctx->priv_data;
     int plane = 0;
     int pos   = 0;
 
     memset(s->len, 0, sizeof(s->len));
     while (get_bits_left(gbit) >= 8) {
         const int has_run  = get_bits(gbit, 1);
         const int code_len = get_bits(gbit, 7);
         const int run      = get_bitsz(gbit, has_run * 8) + 1;
         /* Clamp the fill so an overlong run never writes past the table. */
         const int fill_end = FFMIN(pos + run, max);
         int idx;
 
         for (idx = pos; idx < fill_end; idx++)
             s->len[plane][idx] = code_len;
 
         pos += run;
         if (pos > max) {
             av_log(avctx, AV_LOG_ERROR, "Invalid Huffman codes\n");
             return AVERROR_INVALIDDATA;
         }
         if (pos < max)
             continue;
 
         /* The table of this plane is complete. */
         pos = 0;
         if (s->huff_build(&s->vlc[plane], s->len[plane])) {
             av_log(avctx, AV_LOG_ERROR, "Cannot build Huffman codes\n");
             return AVERROR_INVALIDDATA;
         }
         plane++;
         if (plane == s->planes)
             break;
     }
 
     if (plane != s->planes) {
         av_log(avctx, AV_LOG_ERROR, "Huffman tables too short\n");
         return AVERROR_INVALIDDATA;
     }
 
     return 0;
 }
 
d78fd2fa
 /**
  * Decode one MagicYUV packet into a frame.
  *
  * Parses the packet header, records the slice positions of every plane,
  * builds the Huffman tables, then runs the slice decoder over all slices
  * through avctx->execute2().
  *
  * @param avctx     codec context; priv_data is the MagicYUVContext
  * @param data      output AVFrame
  * @param got_frame set to 1 once the frame has been produced
  * @param avpkt     input packet
  * @return avpkt->size on success, a negative AVERROR code on failure
  */
 static int magy_decode_frame(AVCodecContext *avctx, void *data,
                              int *got_frame, AVPacket *avpkt)
77f9c4b7
 {
     MagicYUVContext *s = avctx->priv_data;
     ThreadFrame frame = { .f = data };
     AVFrame *p = data;
d78fd2fa
     GetByteContext gbyte;
     GetBitContext gbit;
     uint32_t first_offset, offset, next_offset, header_size, slice_width;
     int width, height, format, version, table_size;
6d09d6ed
     int ret, i, j;
77f9c4b7
 
d78fd2fa
     /* The packet starts with the 'MAGY' tag. */
     bytestream2_init(&gbyte, avpkt->data, avpkt->size);
     if (bytestream2_get_le32(&gbyte) != MKTAG('M', 'A', 'G', 'Y'))
77f9c4b7
         return AVERROR_INVALIDDATA;
 
d78fd2fa
     /* Slice offsets read further down are relative to header_size. */
     header_size = bytestream2_get_le32(&gbyte);
     if (header_size < 32 || header_size >= avpkt->size) {
         av_log(avctx, AV_LOG_ERROR,
                "header or packet too small %"PRIu32"\n", header_size);
77f9c4b7
         return AVERROR_INVALIDDATA;
d78fd2fa
     }
77f9c4b7
 
d78fd2fa
     /* Only bitstream version 7 is handled. */
     version = bytestream2_get_byte(&gbyte);
77f9c4b7
     if (version != 7) {
d78fd2fa
         avpriv_request_sample(avctx, "Version %d", version);
77f9c4b7
         return AVERROR_PATCHWELCOME;
     }
 
d78fd2fa
     /* Defaults: no chroma subsampling, no decorrelation, 8 bits. */
     s->hshift[1] =
     s->vshift[1] =
     s->hshift[2] =
     s->vshift[2] = 0;
77f9c4b7
     s->decorrelate = 0;
0281d5ec
     s->bps = 8;
77f9c4b7
 
d78fd2fa
     /* The format byte selects the pixel format, the subsampling shifts,
      * the bit depth and whether the planes are decorrelated. */
     format = bytestream2_get_byte(&gbyte);
77f9c4b7
     switch (format) {
     case 0x65:
         avctx->pix_fmt = AV_PIX_FMT_GBRP;
         s->decorrelate = 1;
         break;
     case 0x66:
         avctx->pix_fmt = AV_PIX_FMT_GBRAP;
         s->decorrelate = 1;
         break;
     case 0x67:
         avctx->pix_fmt = AV_PIX_FMT_YUV444P;
         break;
     case 0x68:
         avctx->pix_fmt = AV_PIX_FMT_YUV422P;
d78fd2fa
         s->hshift[1] =
         s->hshift[2] = 1;
77f9c4b7
         break;
     case 0x69:
         avctx->pix_fmt = AV_PIX_FMT_YUV420P;
d78fd2fa
         s->hshift[1] =
         s->vshift[1] =
         s->hshift[2] =
         s->vshift[2] = 1;
77f9c4b7
         break;
     case 0x6a:
         avctx->pix_fmt = AV_PIX_FMT_YUVA444P;
         break;
     case 0x6b:
         avctx->pix_fmt = AV_PIX_FMT_GRAY8;
         break;
6d09d6ed
     case 0x6c:
         avctx->pix_fmt = AV_PIX_FMT_YUV422P10;
         s->hshift[1] =
         s->hshift[2] = 1;
0281d5ec
         s->bps = 10;
6d09d6ed
         break;
2601eef8
     case 0x76:
         avctx->pix_fmt = AV_PIX_FMT_YUV444P10;
         s->bps = 10;
         break;
6d09d6ed
     case 0x6d:
         avctx->pix_fmt = AV_PIX_FMT_GBRP10;
         s->decorrelate = 1;
0281d5ec
         s->bps = 10;
6d09d6ed
         break;
     case 0x6e:
         avctx->pix_fmt = AV_PIX_FMT_GBRAP10;
         s->decorrelate = 1;
0281d5ec
         s->bps = 10;
         break;
     case 0x6f:
         avctx->pix_fmt = AV_PIX_FMT_GBRP12;
         s->decorrelate = 1;
         s->bps = 12;
         break;
     case 0x70:
         avctx->pix_fmt = AV_PIX_FMT_GBRAP12;
         s->decorrelate = 1;
         s->bps = 12;
6d09d6ed
         break;
     case 0x73:
         avctx->pix_fmt = AV_PIX_FMT_GRAY10;
0281d5ec
         s->bps = 10;
6d09d6ed
         break;
77f9c4b7
     default:
d78fd2fa
         avpriv_request_sample(avctx, "Format 0x%X", format);
77f9c4b7
         return AVERROR_PATCHWELCOME;
     }
6d18b62d
     /* Pick the slice decoder and table builder that match the bit depth;
      * the 16-bit slice decoder serves both 10 and 12 bits. */
     s->max = 1 << s->bps;
     s->magy_decode_slice = s->bps == 8 ? magy_decode_slice : magy_decode_slice10;
     if ( s->bps == 8)
         s->huff_build = huff_build;
     else
         s->huff_build = s->bps == 10 ? huff_build10 : huff_build12;
d78fd2fa
     s->planes = av_pix_fmt_count_planes(avctx->pix_fmt);
77f9c4b7
 
12461636
     /* One skipped byte, then the colour matrix and the flags byte
      * (flag value 2 marks interlaced video). */
     bytestream2_skip(&gbyte, 1);
     s->color_matrix = bytestream2_get_byte(&gbyte);
     s->flags        = bytestream2_get_byte(&gbyte);
     s->interlaced   = !!(s->flags & 2);
d78fd2fa
     bytestream2_skip(&gbyte, 3);
77f9c4b7
 
d78fd2fa
     width  = bytestream2_get_le32(&gbyte);
     height = bytestream2_get_le32(&gbyte);
     ret = ff_set_dimensions(avctx, width, height);
     if (ret < 0)
8a135a55
         return ret;
 
d78fd2fa
     /* Slices must span the full picture width. */
     slice_width = bytestream2_get_le32(&gbyte);
77f9c4b7
     if (slice_width != avctx->coded_width) {
d78fd2fa
         avpriv_request_sample(avctx, "Slice width %"PRIu32, slice_width);
77f9c4b7
         return AVERROR_PATCHWELCOME;
     }
d78fd2fa
     s->slice_height = bytestream2_get_le32(&gbyte);
c3e2e842
     /* The upper bound keeps coded_height + slice_height (used for the
      * slice count below) within int range. */
     if (s->slice_height <= 0 || s->slice_height > INT_MAX - avctx->coded_height) {
d78fd2fa
         av_log(avctx, AV_LOG_ERROR,
                "invalid slice height: %d\n", s->slice_height);
77f9c4b7
         return AVERROR_INVALIDDATA;
     }
 
d78fd2fa
     bytestream2_skip(&gbyte, 4);
77f9c4b7
 
     /* Number of slices per plane, rounding up for a partial last slice. */
     s->nb_slices = (avctx->coded_height + s->slice_height - 1) / s->slice_height;
     if (s->nb_slices > INT_MAX / sizeof(Slice)) {
d78fd2fa
         av_log(avctx, AV_LOG_ERROR,
                "invalid number of slices: %d\n", s->nb_slices);
77f9c4b7
         return AVERROR_INVALIDDATA;
     }
 
f8a0e9f9
     /* Interlaced slices need at least two rows in every plane, including
      * the partial last slice, because the first two rows are predicted
      * separately by the slice decoders. */
     if (s->interlaced) {
         if ((s->slice_height >> s->vshift[1]) < 2) {
             av_log(avctx, AV_LOG_ERROR, "impossible slice height\n");
             return AVERROR_INVALIDDATA;
         }
         if ((avctx->coded_height % s->slice_height) && ((avctx->coded_height % s->slice_height) >> s->vshift[1]) < 2) {
             av_log(avctx, AV_LOG_ERROR, "impossible height\n");
             return AVERROR_INVALIDDATA;
         }
     }
 
77f9c4b7
     /* Slice offset table: nb_slices 32-bit offsets per plane, each
      * relative to header_size and strictly increasing within a plane. */
     for (i = 0; i < s->planes; i++) {
         av_fast_malloc(&s->slices[i], &s->slices_size[i], s->nb_slices * sizeof(Slice));
         if (!s->slices[i])
             return AVERROR(ENOMEM);
 
d78fd2fa
         offset = bytestream2_get_le32(&gbyte);
77f9c4b7
         if (offset >= avpkt->size - header_size)
             return AVERROR_INVALIDDATA;
 
         if (i == 0)
             first_offset = offset;
 
         for (j = 0; j < s->nb_slices - 1; j++) {
             s->slices[i][j].start = offset + header_size;
 
d78fd2fa
             next_offset = bytestream2_get_le32(&gbyte);
             if (next_offset <= offset || next_offset >= avpkt->size - header_size)
77f9c4b7
                 return AVERROR_INVALIDDATA;
d78fd2fa
 
             s->slices[i][j].size = next_offset - offset;
             offset = next_offset;
77f9c4b7
         }
 
         /* The last slice of a plane extends to the end of the packet. */
         s->slices[i][j].start = offset + header_size;
e8a236ad
         s->slices[i][j].size  = avpkt->size - s->slices[i][j].start;
77f9c4b7
     }
 
d78fd2fa
     /* The stored plane count must match the pixel format. */
     if (bytestream2_get_byte(&gbyte) != s->planes)
77f9c4b7
         return AVERROR_INVALIDDATA;
 
d78fd2fa
     /* One byte per slice and plane is skipped here; its meaning is not
      * visible in this file. */
     bytestream2_skip(&gbyte, s->nb_slices * s->planes);
77f9c4b7
 
d78fd2fa
     /* The Huffman tables fill the bytes between the current position and
      * the first slice of plane 0. */
     table_size = header_size + first_offset - bytestream2_tell(&gbyte);
77f9c4b7
     if (table_size < 2)
         return AVERROR_INVALIDDATA;
 
d78fd2fa
     ret = init_get_bits8(&gbit, avpkt->data + bytestream2_tell(&gbyte), table_size);
     if (ret < 0)
77f9c4b7
         return ret;
 
6d09d6ed
     ret = build_huffman(avctx, &gbit, s->max);
     if (ret < 0)
         return ret;
77f9c4b7
 
     /* Every frame is marked as an intra key frame. */
     p->pict_type = AV_PICTURE_TYPE_I;
     p->key_frame = 1;
 
     if ((ret = ff_thread_get_buffer(avctx, &frame, 0)) < 0)
         return ret;
 
     /* Publish the packet and frame to the slice workers, then decode all
      * slices. NOTE(review): the workers' return values are not collected
      * here, so a failing slice does not fail the frame. */
     s->buf = avpkt->data;
     s->p = p;
6d09d6ed
     avctx->execute2(avctx, s->magy_decode_slice, NULL, NULL, s->nb_slices);
77f9c4b7
 
6d09d6ed
     /* For the GBR(A) formats the first two planes are exchanged after
      * decoding; the other formats get colour-space metadata instead. */
     if (avctx->pix_fmt == AV_PIX_FMT_GBRP   ||
         avctx->pix_fmt == AV_PIX_FMT_GBRAP  ||
         avctx->pix_fmt == AV_PIX_FMT_GBRP10 ||
0281d5ec
         avctx->pix_fmt == AV_PIX_FMT_GBRAP10||
         avctx->pix_fmt == AV_PIX_FMT_GBRAP12||
         avctx->pix_fmt == AV_PIX_FMT_GBRP12) {
77f9c4b7
         FFSWAP(uint8_t*, p->data[0], p->data[1]);
         FFSWAP(int, p->linesize[0], p->linesize[1]);
12461636
     } else {
         switch (s->color_matrix) {
         case 1:
             p->colorspace = AVCOL_SPC_BT470BG;
             break;
         case 2:
             p->colorspace = AVCOL_SPC_BT709;
             break;
         }
         /* Flag value 4 selects JPEG (full) range, otherwise MPEG range. */
         p->color_range = (s->flags & 4) ? AVCOL_RANGE_JPEG : AVCOL_RANGE_MPEG;
77f9c4b7
     }
 
     *got_frame = 1;
 
     return avpkt->size;
 }
 
d78fd2fa
 /**
  * Decoder init callback: sets up the lossless video DSP context.
  *
  * @param avctx codec context; priv_data is the MagicYUVContext
  * @return always 0
  */
 static av_cold int magy_decode_init(AVCodecContext *avctx)
 {
     MagicYUVContext *ctx = avctx->priv_data;
 
     ff_llviddsp_init(&ctx->llviddsp);
 
     return 0;
 }
 
 /**
  * Decoder close callback: releases the per-plane slice tables and VLCs.
  *
  * @param avctx codec context; priv_data is the MagicYUVContext
  * @return always 0
  */
 static av_cold int magy_decode_end(AVCodecContext *avctx)
 {
     MagicYUVContext * const ctx = avctx->priv_data;
     int plane = 0;
 
     while (plane < FF_ARRAY_ELEMS(ctx->slices)) {
         av_freep(&ctx->slices[plane]);
         ctx->slices_size[plane] = 0;
         ff_free_vlc(&ctx->vlc[plane]);
         plane++;
     }
 
     return 0;
 }
 
 /* Codec registration entry for the MagicYUV video decoder. */
 AVCodec ff_magicyuv_decoder = {
     .name             = "magicyuv",
d78fd2fa
     .long_name        = NULL_IF_CONFIG_SMALL("MagicYUV video"),
77f9c4b7
     .type             = AVMEDIA_TYPE_VIDEO,
     .id               = AV_CODEC_ID_MAGICYUV,
     .priv_data_size   = sizeof(MagicYUVContext),
d78fd2fa
     .init             = magy_decode_init,
     .close            = magy_decode_end,
     .decode           = magy_decode_frame,
     /* Direct rendering plus both frame- and slice-level threading. */
     .capabilities     = AV_CODEC_CAP_DR1 |
                         AV_CODEC_CAP_FRAME_THREADS |
                         AV_CODEC_CAP_SLICE_THREADS,
     .caps_internal    = FF_CODEC_CAP_INIT_THREADSAFE,
77f9c4b7
 };