libavcodec/v210enc.c
ca0bb1c4
 /*
  * V210 encoder
  *
  * Copyright (C) 2009 Michael Niedermayer <michaelni@gmx.at>
  * Copyright (c) 2009 Baptiste Coudurier <baptiste dot coudurier at gmail dot com>
  *
  * This file is part of FFmpeg.
  *
  * FFmpeg is free software; you can redistribute it and/or
  * modify it under the terms of the GNU Lesser General Public
  * License as published by the Free Software Foundation; either
  * version 2.1 of the License, or (at your option) any later version.
  *
  * FFmpeg is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Lesser General Public License for more details.
  *
  * You should have received a copy of the GNU Lesser General Public
  * License along with FFmpeg; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  */
 
 #include "avcodec.h"
dc25d79f
 #include "bytestream.h"
ab3a410c
 #include "internal.h"
36091742
 #include "v210enc.h"
 
 /* Clamp a sample to [4, 1019]; used on the 10-bit input path before packing. */
 #define CLIP(v)  av_clip((v), 4, 1019)
 /* Clamp a sample to [1, 254]; used on the 8-bit input path before packing. */
 #define CLIP8(v) av_clip((v), 1, 254)
 
 /*
  * Pack three samples into one 32-bit word and store it at dst.
  *
  * Each of a, b and c is a pointer variable; it is dereferenced and
  * post-incremented exactly once. The clamped samples land in bits 0-9,
  * 10-19 and 20-29 respectively. The expansion site must provide a `val`
  * accumulator and a byte pointer `dst`; dst is advanced by 4 after the
  * AV_WL32() store.
  */
 #define WRITE_PIXELS(a, b, c)           \
     do {                                \
         val  = CLIP(*a++);              \
         val |= CLIP(*b++) << 10;        \
         val |= CLIP(*c++) << 20;        \
         AV_WL32(dst, val);              \
         dst += 4;                       \
     } while (0)
 
 /*
  * 8-bit counterpart of WRITE_PIXELS.
  *
  * Each clamped 8-bit sample is shifted two bits higher than its 10-bit
  * slot would start (shifts of 2, 12 and 22), so it fills the upper eight
  * bits of that slot. As with WRITE_PIXELS, a, b and c are pointer variables
  * that get post-incremented once, and `val` / `dst` must exist at the
  * expansion site; dst is advanced by 4 after the AV_WL32() store.
  */
 #define WRITE_PIXELS8(a, b, c)          \
     do {                                \
         val  = CLIP8(*a++) << 2;        \
         val |= CLIP8(*b++) << 12;       \
         val |= CLIP8(*c++) << 22;       \
         AV_WL32(dst, val);              \
         dst += 4;                       \
     } while (0)
 
 /**
  * C reference packer for 8-bit planar input.
  *
  * Consumes the input in chunks of 12 luma samples (plus 6 samples from each
  * chroma plane) and emits eight 32-bit words (32 bytes) per chunk. Any
  * remainder of fewer than 12 pixels is left untouched for the caller.
  *
  * @param y     luma samples
  * @param u     first chroma plane samples
  * @param v     second chroma plane samples
  * @param dst   output buffer; 32 bytes are written per 12-pixel chunk
  * @param width number of luma samples available
  */
 static void v210_planar_pack_8_c(const uint8_t *y, const uint8_t *u,
                                  const uint8_t *v, uint8_t *dst,
                                  ptrdiff_t width)
 {
     uint32_t val;
     ptrdiff_t left = width;
 
     /* two 6-pixel groups per pass, unrolled to match the assembly */
     while (left >= 12) {
         /* first group of six pixels */
         WRITE_PIXELS8(u, y, v);
         WRITE_PIXELS8(y, u, y);
         WRITE_PIXELS8(v, y, u);
         WRITE_PIXELS8(y, v, y);
 
         /* second group of six pixels */
         WRITE_PIXELS8(u, y, v);
         WRITE_PIXELS8(y, u, y);
         WRITE_PIXELS8(v, y, u);
         WRITE_PIXELS8(y, v, y);
 
         left -= 12;
     }
 }
 
 /**
  * C reference packer for planar input stored in 16-bit containers.
  *
  * Consumes the input in groups of 6 luma samples (plus 3 samples from each
  * chroma plane) and emits four 32-bit words (16 bytes) per group. Any
  * remainder of fewer than 6 pixels is left untouched for the caller.
  *
  * @param y     luma samples
  * @param u     first chroma plane samples
  * @param v     second chroma plane samples
  * @param dst   output buffer; 16 bytes are written per 6-pixel group
  * @param width number of luma samples available
  */
 static void v210_planar_pack_10_c(const uint16_t *y, const uint16_t *u,
                                   const uint16_t *v, uint8_t *dst,
                                   ptrdiff_t width)
 {
     uint32_t val;
     ptrdiff_t left = width;
 
     while (left >= 6) {
         WRITE_PIXELS(u, y, v);
         WRITE_PIXELS(y, u, y);
         WRITE_PIXELS(v, y, u);
         WRITE_PIXELS(y, v, y);
 
         left -= 6;
     }
 }
ca0bb1c4
 
3cdda78d
 /**
  * Fill in the line-packing callbacks of a V210EncContext.
  *
  * The C reference packers are installed with a sample factor of 1, i.e. the
  * encoder hands them widths that are multiples of 12 (8-bit) or 6 (10-bit)
  * pixels. When ARCH_X86 is set, ff_v210enc_init_x86() is called afterwards
  * on the same context (presumably to substitute optimized packers; its
  * definition is not part of this file).
  *
  * @param s context to initialize
  */
 av_cold void ff_v210enc_init(V210EncContext *s)
 {
     /* 8-bit input path */
     s->pack_line_8      = v210_planar_pack_8_c;
     s->sample_factor_8  = 1;
 
     /* 10-bit input path */
     s->pack_line_10     = v210_planar_pack_10_c;
     s->sample_factor_10 = 1;
 
     if (ARCH_X86) {
         ff_v210enc_init_x86(s);
     }
 }
 
ca0bb1c4
 /**
  * Encoder init callback.
  *
  * Rejects odd widths, installs the line packers and fills in the coded
  * sample size and bitrate estimate on the codec context.
  *
  * @param avctx codec context; priv_data is used as a V210EncContext
  * @return 0 on success, AVERROR(EINVAL) if the width is odd
  */
 static av_cold int encode_init(AVCodecContext *avctx)
 {
     V210EncContext *ctx = avctx->priv_data;
 
     if (avctx->width % 2) {
         av_log(avctx, AV_LOG_ERROR, "v210 needs even width\n");
         return AVERROR(EINVAL);
     }
 
 #if FF_API_CODED_FRAME
 FF_DISABLE_DEPRECATION_WARNINGS
     avctx->coded_frame->pict_type = AV_PICTURE_TYPE_I;
 FF_ENABLE_DEPRECATION_WARNINGS
 #endif
 
     ff_v210enc_init(ctx);
 
     avctx->bits_per_coded_sample = 20;
     /* three 10-bit samples occupy one 32-bit word: 32 / 30 == 16 / 15 */
     avctx->bit_rate = ff_guess_coded_bitrate(avctx) * 16 / 15;
 
     return 0;
 }
 
ab3a410c
 /**
  * Encode one picture into a v210 packet.
  *
  * Every output row occupies `stride` bytes, derived from the width rounded
  * up to a multiple of 48 pixels. For each row, the bulk of the pixels goes
  * through the context's pack_line_8 / pack_line_10 callback; what the
  * callback cannot take (because of its sample factor) is packed here in
  * 6-pixel groups, followed by a 2- or 4-pixel tail, and the rest of the row
  * is zero-filled.
  *
  * Only AV_PIX_FMT_YUV422P10 and AV_PIX_FMT_YUV422P are handled. For any other
  * pic->format nothing is written into the packet payload, yet the function
  * still reports success.
  *
  * @param avctx      codec context; priv_data is used as a V210EncContext
  * @param pkt        output packet, allocated via ff_alloc_packet2()
  * @param pic        input picture
  * @param got_packet set to 1 on success
  * @return 0 on success, or the negative value returned by ff_alloc_packet2()
  */
 static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,
                         const AVFrame *pic, int *got_packet)
 {
     V210EncContext *s = avctx->priv_data;
     const int aligned_width = ((avctx->width + 47) / 48) * 48;
     const int stride        = aligned_width * 8 / 3;
     /* bytes between the last packed word of a row and the next row */
     const int line_padding  = stride - ((avctx->width * 8 + 11) / 12) * 4;
     uint8_t *dst;
     int row, x, tail, ret;
 
     ret = ff_alloc_packet2(avctx, pkt, avctx->height * stride, avctx->height * stride);
     if (ret < 0) {
         av_log(avctx, AV_LOG_ERROR, "Error getting output packet.\n");
         return ret;
     }
     dst = pkt->data;
 
     if (pic->format == AV_PIX_FMT_YUV422P10) {
         const uint16_t *luma = (const uint16_t *)pic->data[0];
         const uint16_t *cb   = (const uint16_t *)pic->data[1];
         const uint16_t *cr   = (const uint16_t *)pic->data[2];
 
         /* the line packer only takes whole blocks of block_px pixels */
         const int block_px  = 6 * s->sample_factor_10;
         const int blocks    = avctx->width / block_px;
         const int packed_px = blocks * block_px;
 
         for (row = 0; row < avctx->height; row++) {
             uint32_t val;
 
             s->pack_line_10(luma, cb, cr, dst, packed_px);
 
             luma += packed_px;
             cb   += packed_px >> 1;
             cr   += packed_px >> 1;
             dst  += blocks * 16 * s->sample_factor_10;
 
             /* whole 6-pixel groups the line packer did not cover */
             for (x = packed_px; x < avctx->width - 5; x += 6) {
                 WRITE_PIXELS(cb, luma, cr);
                 WRITE_PIXELS(luma, cb, luma);
                 WRITE_PIXELS(cr, luma, cb);
                 WRITE_PIXELS(luma, cr, luma);
             }
 
             /* partial group at the end of the row */
             tail = avctx->width - x;
             if (tail > 1) {
                 WRITE_PIXELS(cb, luma, cr);
 
                 val = CLIP(*luma++);
                 if (tail == 2) {
                     /* two pixels left: the second luma sample stands alone */
                     AV_WL32(dst, val);
                     dst += 4;
                 } else if (tail > 3) {
                     /* four pixels left: finish the word, then add one more */
                     val |= CLIP(*cb++)   << 10;
                     val |= CLIP(*luma++) << 20;
                     AV_WL32(dst, val);
                     dst += 4;
 
                     val  = CLIP(*cr++);
                     val |= CLIP(*luma++) << 10;
                     AV_WL32(dst, val);
                     dst += 4;
                 }
             }
 
             memset(dst, 0, line_padding);
             dst += line_padding;
 
             /* linesize is in bytes, the plane pointers count 16-bit samples */
             luma += pic->linesize[0] / 2 - avctx->width;
             cb   += pic->linesize[1] / 2 - avctx->width / 2;
             cr   += pic->linesize[2] / 2 - avctx->width / 2;
         }
     } else if (pic->format == AV_PIX_FMT_YUV422P) {
         const uint8_t *luma = pic->data[0];
         const uint8_t *cb   = pic->data[1];
         const uint8_t *cr   = pic->data[2];
 
         /* the line packer only takes whole blocks of block_px pixels */
         const int block_px  = 12 * s->sample_factor_8;
         const int blocks    = avctx->width / block_px;
         const int packed_px = blocks * block_px;
 
         for (row = 0; row < avctx->height; row++) {
             uint32_t val;
 
             s->pack_line_8(luma, cb, cr, dst, packed_px);
 
             luma += packed_px;
             cb   += packed_px >> 1;
             cr   += packed_px >> 1;
             dst  += blocks * 32 * s->sample_factor_8;
 
             /* whole 6-pixel groups the line packer did not cover */
             for (x = packed_px; x < avctx->width - 5; x += 6) {
                 WRITE_PIXELS8(cb, luma, cr);
                 WRITE_PIXELS8(luma, cb, luma);
                 WRITE_PIXELS8(cr, luma, cb);
                 WRITE_PIXELS8(luma, cr, luma);
             }
 
             /* partial group at the end of the row */
             tail = avctx->width - x;
             if (tail > 1) {
                 WRITE_PIXELS8(cb, luma, cr);
 
                 val = CLIP8(*luma++) << 2;
                 if (tail == 2) {
                     /* two pixels left: the second luma sample stands alone */
                     AV_WL32(dst, val);
                     dst += 4;
                 } else if (tail > 3) {
                     /* four pixels left: finish the word, then add one more */
                     val |= CLIP8(*cb++)   << 12;
                     val |= CLIP8(*luma++) << 22;
                     AV_WL32(dst, val);
                     dst += 4;
 
                     val  = CLIP8(*cr++)   << 2;
                     val |= CLIP8(*luma++) << 12;
                     AV_WL32(dst, val);
                     dst += 4;
                 }
             }
 
             memset(dst, 0, line_padding);
             dst += line_padding;
 
             luma += pic->linesize[0] - avctx->width;
             cb   += pic->linesize[1] - avctx->width / 2;
             cr   += pic->linesize[2] - avctx->width / 2;
         }
     }
 
     pkt->flags |= AV_PKT_FLAG_KEY;
     *got_packet = 1;
     return 0;
 }
 
e7e2df27
 AVCodec ff_v210_encoder = {
ec6402b7
     .name           = "v210",
b2bed932
     .long_name      = NULL_IF_CONFIG_SMALL("Uncompressed 4:2:2 10-bit"),
ec6402b7
     .type           = AVMEDIA_TYPE_VIDEO,
36ef5369
     .id             = AV_CODEC_ID_V210,
36091742
     .priv_data_size = sizeof(V210EncContext),
ec6402b7
     .init           = encode_init,
ab3a410c
     .encode2        = encode_frame,
36091742
     .pix_fmts       = (const enum AVPixelFormat[]){ AV_PIX_FMT_YUV422P10, AV_PIX_FMT_YUV422P, AV_PIX_FMT_NONE },
ca0bb1c4
 };