GitList

Browse code

Merge remote-tracking branch 'qatar/master'

* qatar/master:
rtmp: Add support for SWFVerification
api-example: use new video encoding API.
x86: avcodec: Appropriately name files containing only init functions
mpegvideo_mmx_template: drop some commented-out cruft
libavresample: add mix level normalization option
w32pthreads: Add missing #includes to make header compile standalone
rtmp: Gracefully ignore _checkbw errors by tracking them
rtmp: Do not send _checkbw calls as notifications
prores: interlaced ProRes encoding

Conflicts:
doc/examples/decoding_encoding.c
libavcodec/proresenc_kostya.c
libavcodec/w32pthreads.h
libavcodec/x86/Makefile
libavformat/version.h

Merged-by: Michael Niedermayer <michaelni@gmx.at>

Michael Niedermayer authored on 2012/08/15 22:41:01
Showing 20 changed files

doc/examples/decoding_encoding.c index 6295001..919ee48 100644
doc/protocols.texi index 3a82c7f..be19239 100644
libavcodec/proresenc_kostya.c index 440f254..d69892d 100644
libavcodec/w32pthreads.h index fbc183a..c4bbb9a 100644
libavcodec/x86/Makefile index e01454a..0ad3457 100644
libavcodec/x86/ac3dsp_init.c index 0000000..cf1d7db
libavcodec/x86/ac3dsp_mmx.c index cf1d7db..0000000
libavcodec/x86/fft.c index 852c6b8..0000000
libavcodec/x86/fft_init.c index 0000000..852c6b8
libavcodec/x86/fmtconvert_init.c index 0000000..361ac85
libavcodec/x86/fmtconvert_mmx.c index 361ac85..0000000
libavcodec/x86/h264dsp_init.c index 0000000..ea71515
libavcodec/x86/h264dsp_mmx.c index ea71515..0000000
libavcodec/x86/mpegvideo_mmx_template.c index 82e4ffa..d538a39 100644
libavformat/rtmp.h index bdac6fd..7c9bb6d 100644
libavformat/rtmpproto.c index 4f57cb8..e3bcf3d 100644
libavformat/version.h index 99a8ddf..f68805c 100644
libavresample/audio_mix.c index e8ab2e3..f948c82 100644
libavresample/internal.h index 7b7648f..006b6fd 100644
libavresample/options.c index 02e1f86..e7e0c27 100644

@@ -31,10 +31,10 @@
                      #include <math.h>
                     -#include <libavutil/imgutils.h>
                      #include <libavutil/opt.h>
                      #include <libavcodec/avcodec.h>
                      #include <libavutil/audioconvert.h>
                     +#include <libavutil/imgutils.h>
                      #include <libavutil/mathematics.h>
                      #include <libavutil/samplefmt.h>
@@ -315,11 +315,11 @@ static void video_encode_example(const char *filename, int codec_id)
                      {
                          AVCodec *codec;
                          AVCodecContext *c= NULL;
                     -    int i, out_size, x, y, outbuf_size;
                     +    int i, ret, x, y, got_output;
                          FILE *f;
                          AVFrame *picture;
                     -    uint8_t *outbuf;
                     -    int had_output=0;
                     +    AVPacket pkt;
                     +    uint8_t endcode[] = { 0, 0, 1, 0xb7 };
                          printf("Encode video file %s\n", filename);
@@ -359,17 +359,25 @@ static void video_encode_example(const char *filename, int codec_id)
                              exit(1);
                          }
                     -    /* alloc image and output buffer */
                     -    outbuf_size = 100000 + 12*c->width*c->height;
                     -    outbuf = malloc(outbuf_size);
                     -
                          /* the image can be allocated by any means and av_image_alloc() is
                           * just the most convenient way if av_malloc() is to be used */
                     -    av_image_alloc(picture->data, picture->linesize,
                     -                   c->width, c->height, c->pix_fmt, 1);
                     +    ret = av_image_alloc(picture->data, picture->linesize, c->width, c->height,
                     +                         c->pix_fmt, 32);
                     +    if (ret < 0) {
                     +        fprintf(stderr, "could not alloc raw picture buffer\n");
                     +        exit(1);
                     +    }
                     +
                     +    picture->format = c->pix_fmt;
                     +    picture->width  = c->width;
                     +    picture->height = c->height;
                          /* encode 1 second of video */
                          for(i=0;i<25;i++) {
                     +        av_init_packet(&pkt);
                     +        pkt.data = NULL;    // packet data will be allocated by the encoder
                     +        pkt.size = 0;
                     +
                              fflush(stdout);
                              /* prepare a dummy image */
                              /* Y */
@@ -387,35 +395,46 @@ static void video_encode_example(const char *filename, int codec_id)
                                  }
                              }
                     +        picture->pts = i;
                     +
                              /* encode the image */
                     -        out_size = avcodec_encode_video(c, outbuf, outbuf_size, picture);
                     -        had_output |= out_size;
                     -        printf("encoding frame %3d (size=%5d)\n", i, out_size);
                     -        fwrite(outbuf, 1, out_size, f);
                     +        ret = avcodec_encode_video2(c, &pkt, picture, &got_output);
                     +        if (ret < 0) {
                     +            fprintf(stderr, "error encoding frame\n");
                     +            exit(1);
                     +        }
                     +
                     +        if (got_output) {
                     +            printf("encoding frame %3d (size=%5d)\n", i, pkt.size);
                     +            fwrite(pkt.data, 1, pkt.size, f);
                     +            av_free_packet(&pkt);
                     +        }
                          }
                          /* get the delayed frames */
                     -    for(; out_size || !had_output; i++) {
                     +    for (got_output = 1; got_output; i++) {
                              fflush(stdout);
                     -        out_size = avcodec_encode_video(c, outbuf, outbuf_size, NULL);
                     -        had_output |= out_size;
                     -        printf("write frame %3d (size=%5d)\n", i, out_size);
                     -        fwrite(outbuf, 1, out_size, f);
                     +        ret = avcodec_encode_video2(c, &pkt, NULL, &got_output);
                     +        if (ret < 0) {
                     +            fprintf(stderr, "error encoding frame\n");
                     +            exit(1);
                     +        }
                     +
                     +        if (got_output) {
                     +            printf("write frame %3d (size=%5d)\n", i, pkt.size);
                     +            fwrite(pkt.data, 1, pkt.size, f);
                     +            av_free_packet(&pkt);
                     +        }
                          }
                          /* add sequence end code to have a real mpeg file */
                     -    outbuf[0] = 0x00;
                     -    outbuf[1] = 0x00;
                     -    outbuf[2] = 0x01;
                     -    outbuf[3] = 0xb7;
                     -    fwrite(outbuf, 1, 4, f);
                     +    fwrite(endcode, 1, sizeof(endcode), f);
                          fclose(f);
                     -    free(outbuf);
                          avcodec_close(c);
                          av_free(c);
                     -    av_free(picture->data[0]);
                     +    av_freep(&picture->data[0]);
                          av_free(picture);
                          printf("\n");
                      }

@@ -272,6 +272,12 @@ Name of live stream to subscribe to. By default no value will be sent.
                      It is only sent if the option is specified or if rtmp_live
                      is set to live.
                     +@item rtmp_swfhash
                     +SHA256 hash of the decompressed SWF file (32 bytes).
                     +
                     +@item rtmp_swfsize
                     +Size of the decompressed SWF file, required for SWFVerification.
                     +
                      @item rtmp_swfurl
                      URL of the SWF player for the media. By default no value will be sent.

@@ -406,10 +406,15 @@ static int encode_slice(AVCodecContext *avctx, const AVFrame *pic,
                          int total_size = 0;
                          const uint16_t *src;
                          int slice_width_factor = av_log2(mbs_per_slice);
                     -    int num_cblocks, pwidth, linesize, line_offset;
                     +    int num_cblocks, pwidth, linesize, line_add;
                          int plane_factor, is_chroma;
                          uint16_t *qmat;
                     +    if (ctx->pictures_per_frame == 1)
                     +        line_add = 0;
                     +    else
                     +        line_add = ctx->cur_picture_idx ^ !pic->top_field_first;
                     +
                          if (ctx->force_quant) {
                              qmat = ctx->quants[0];
                          } else if (quant < MAX_STORED_Q) {
@@ -437,15 +442,14 @@ static int encode_slice(AVCodecContext *avctx, const AVFrame *pic,
                                  pwidth      = avctx->width >> 1;
                              }
                     -        line_offset = ((ctx->cur_picture_idx ^ !pic->top_field_first) &
                     -                       (ctx->pictures_per_frame - 1)) * pic->linesize[i];
                              linesize = pic->linesize[i] * ctx->pictures_per_frame;
                     -        src = (const uint16_t*)(pic->data[i] + yp * linesize + line_offset) + xp;
                     +        src = (const uint16_t*)(pic->data[i] + yp * linesize +
                     +                                line_add * pic->linesize[i]) + xp;
                              get_slice_data(ctx, src, linesize, xp, yp,
                                             pwidth, avctx->height / ctx->pictures_per_frame,
                     -                       ctx->blocks[0], ctx->emu_buf, mbs_per_slice,
                     -                       num_cblocks, is_chroma);
                     +                       ctx->blocks[0], ctx->emu_buf,
                     +                       mbs_per_slice, num_cblocks, is_chroma);
                              sizes[i] = encode_slice_plane(ctx, pb, src, linesize,
                                                            mbs_per_slice, ctx->blocks[0],
                                                            num_cblocks, plane_factor,
@@ -579,8 +583,12 @@ static int find_slice_quant(AVCodecContext *avctx, const AVFrame *pic,
                          int slice_bits[TRELLIS_WIDTH], slice_score[TRELLIS_WIDTH];
                          int overquant;
                          uint16_t *qmat;
                     -    int linesize[4], line_offset;
                     +    int linesize[4], line_add;
                     +    if (ctx->pictures_per_frame == 1)
                     +        line_add = 0;
                     +    else
                     +        line_add = ctx->cur_picture_idx ^ !pic->top_field_first;
                          mbs = x + mbs_per_slice;
                          for (i = 0; i < ctx->num_planes; i++) {
@@ -600,15 +608,14 @@ static int find_slice_quant(AVCodecContext *avctx, const AVFrame *pic,
                                  pwidth         = avctx->width >> 1;
                              }
                     -        line_offset = ((ctx->cur_picture_idx ^ !pic->top_field_first) &
                     -                       (ctx->pictures_per_frame - 1)) * pic->linesize[i];
                              linesize[i] = pic->linesize[i] * ctx->pictures_per_frame;
                     -        src = (const uint16_t*)(pic->data[i] + yp * linesize[i] + line_offset) + xp;
                     +        src = (const uint16_t*)(pic->data[i] + yp * linesize[i] +
                     +                                line_add * pic->linesize[i]) + xp;
                              get_slice_data(ctx, src, linesize[i], xp, yp,
                                             pwidth, avctx->height / ctx->pictures_per_frame,
                     -                       td->blocks[i], td->emu_buf, mbs_per_slice,
                     -                       num_cblocks[i], is_chroma[i]);
                     +                       td->blocks[i], td->emu_buf,
                     +                       mbs_per_slice, num_cblocks[i], is_chroma[i]);
                          }
                          for (q = min_quant; q < max_quant + 2; q++) {
@@ -767,9 +774,8 @@ static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,
                          bytestream_put_be16  (&buf, avctx->height);
                          frame_flags = ctx->chroma_factor << 6;
                     -    if (avctx->flags & CODEC_FLAG_INTERLACED_DCT) {
                     +    if (avctx->flags & CODEC_FLAG_INTERLACED_DCT)
                              frame_flags |= pic->top_field_first ? 0x04 : 0x08;
                     -    }
                          bytestream_put_byte  (&buf, frame_flags);
                          bytestream_put_byte  (&buf, 0);             // reserved
@@ -791,7 +797,9 @@ static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,
                          }
                          bytestream_put_be16  (&tmp, buf - orig_buf); // write back frame header size
                     -    for (ctx->cur_picture_idx = 0; ctx->cur_picture_idx < ctx->pictures_per_frame; ++ctx->cur_picture_idx) {
                     +    for (ctx->cur_picture_idx = 0;
                     +         ctx->cur_picture_idx < ctx->pictures_per_frame;
                     +         ctx->cur_picture_idx++) {
                              // picture header
                              picture_size_pos = buf + 1;
                              bytestream_put_byte  (&buf, 0x40);          // picture header size (in bits)
@@ -845,7 +853,6 @@ static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,
                          frame_size = buf - orig_buf;
                          bytestream_put_be32(&orig_buf, frame_size);
                     -
                          pkt->size   = frame_size;
                          pkt->flags |= AV_PKT_FLAG_KEY;
                          *got_packet = 1;
@@ -927,7 +934,8 @@ static av_cold int encode_init(AVCodecContext *avctx)
                          if (!ctx->force_quant) {
                              if (!ctx->bits_per_mb) {
                                  for (i = 0; i < NUM_MB_LIMITS - 1; i++)
                     -                if (prores_mb_limits[i] >= ctx->mb_width * ctx->mb_height * ctx->pictures_per_frame)
                     +                if (prores_mb_limits[i] >= ctx->mb_width * ctx->mb_height *
                     +                                           ctx->pictures_per_frame)
                                          break;
                                  ctx->bits_per_mb   = ctx->profile_info->br_tab[i];
                              } else if (ctx->bits_per_mb < 128) {
@@ -991,12 +999,15 @@ static av_cold int encode_init(AVCodecContext *avctx)
                          ctx->frame_size_upper_bound = ctx->pictures_per_frame *
                                                        ctx->slices_per_picture *
                                                        (2 + 2 * ctx->num_planes +
                     -                                   (mps * ctx->bits_per_mb) / 8) + 200;
                     +                                   (mps * ctx->bits_per_mb) / 8)
                     +                                  + 200;
                          avctx->codec_tag   = ctx->profile_info->tag;
                     -    av_log(avctx, AV_LOG_DEBUG, "profile %d, %d slices/pic, %d pics/frame, %d bits per MB\n",
                     -           ctx->profile, ctx->slices_per_picture, ctx->pictures_per_frame, ctx->bits_per_mb);
                     +    av_log(avctx, AV_LOG_DEBUG,
                     +           "profile %d, %d slices, interlacing: %s, %d bits per MB\n",
                     +           ctx->profile, ctx->slices_per_picture * ctx->pictures_per_frame,
                     +           interlaced ? "yes" : "no", ctx->bits_per_mb);
                          av_log(avctx, AV_LOG_DEBUG, "frame size upper bound: %d\n",
                                 ctx->frame_size_upper_bound);

@@ -40,6 +40,8 @@
                      #include <process.h>
                      #include "libavutil/common.h"
                     +#include "libavutil/internal.h"
                     +#include "libavutil/mem.h"
                      typedef struct {
                          void *handle;

@@ -5,7 +5,7 @@ OBJS-$(CONFIG_XMM_CLOBBER_TEST)        += x86/w64xmmtest.o
                      MMX-OBJS                               += x86/dsputil_mmx.o             \
                                                                x86/fdct_mmx.o                \
                     -                                          x86/fmtconvert_mmx.o          \
                     +                                          x86/fmtconvert_init.o         \
                                                                x86/idct_mmx_xvid.o           \
                                                                x86/idct_sse2_xvid.o          \
                                                                x86/motion_est_mmx.o          \
@@ -13,15 +13,15 @@ MMX-OBJS                               += x86/dsputil_mmx.o             \
                                                                x86/simple_idct_mmx.o         \
                      MMX-OBJS-$(CONFIG_AAC_DECODER)         += x86/sbrdsp_init.o
                     -MMX-OBJS-$(CONFIG_AC3DSP)              += x86/ac3dsp_mmx.o
                     +MMX-OBJS-$(CONFIG_AC3DSP)              += x86/ac3dsp_init.o
                      MMX-OBJS-$(CONFIG_CAVS_DECODER)        += x86/cavsdsp_mmx.o
                      MMX-OBJS-$(CONFIG_DNXHD_ENCODER)       += x86/dnxhd_mmx.o
                      MMX-OBJS-$(CONFIG_DWT)                 += x86/snowdsp_mmx.o \
                                                                x86/dwt.o
                      MMX-OBJS-$(CONFIG_ENCODERS)            += x86/dsputilenc_mmx.o
                     -MMX-OBJS-$(CONFIG_FFT)                 += x86/fft.o
                     +MMX-OBJS-$(CONFIG_FFT)                 += x86/fft_init.o
                      MMX-OBJS-$(CONFIG_GPL)                 += x86/idct_mmx.o
                     -MMX-OBJS-$(CONFIG_H264DSP)             += x86/h264dsp_mmx.o
                     +MMX-OBJS-$(CONFIG_H264DSP)             += x86/h264dsp_init.o
                      MMX-OBJS-$(CONFIG_H264PRED)            += x86/h264_intrapred_init.o
                      MMX-OBJS-$(CONFIG_LPC)                 += x86/lpc_mmx.o
                      MMX-OBJS-$(CONFIG_MPEGAUDIODSP)        += x86/mpegaudiodec_mmx.o

                     new file mode 100644
@@ -0,0 +1,93 @@
                     +/*
                     + * x86-optimized AC-3 DSP utils
                     + * Copyright (c) 2011 Justin Ruggles
                     + *
                     + * This file is part of FFmpeg.
                     + *
                     + * FFmpeg is free software; you can redistribute it and/or
                     + * modify it under the terms of the GNU Lesser General Public
                     + * License as published by the Free Software Foundation; either
                     + * version 2.1 of the License, or (at your option) any later version.
                     + *
                     + * FFmpeg is distributed in the hope that it will be useful,
                     + * but WITHOUT ANY WARRANTY; without even the implied warranty of
                     + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
                     + * Lesser General Public License for more details.
                     + *
                     + * You should have received a copy of the GNU Lesser General Public
                     + * License along with FFmpeg; if not, write to the Free Software
                     + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
                     + */
                     +
                     +#include "libavutil/x86/asm.h"
                     +#include "dsputil_mmx.h"
                     +#include "libavcodec/ac3dsp.h"
                     +
                     +extern void ff_ac3_exponent_min_mmx   (uint8_t *exp, int num_reuse_blocks, int nb_coefs);
                     +extern void ff_ac3_exponent_min_mmxext(uint8_t *exp, int num_reuse_blocks, int nb_coefs);
                     +extern void ff_ac3_exponent_min_sse2  (uint8_t *exp, int num_reuse_blocks, int nb_coefs);
                     +
                     +extern int ff_ac3_max_msb_abs_int16_mmx  (const int16_t *src, int len);
                     +extern int ff_ac3_max_msb_abs_int16_mmx2 (const int16_t *src, int len);
                     +extern int ff_ac3_max_msb_abs_int16_sse2 (const int16_t *src, int len);
                     +extern int ff_ac3_max_msb_abs_int16_ssse3(const int16_t *src, int len);
                     +
                     +extern void ff_ac3_lshift_int16_mmx (int16_t *src, unsigned int len, unsigned int shift);
                     +extern void ff_ac3_lshift_int16_sse2(int16_t *src, unsigned int len, unsigned int shift);
                     +
                     +extern void ff_ac3_rshift_int32_mmx (int32_t *src, unsigned int len, unsigned int shift);
                     +extern void ff_ac3_rshift_int32_sse2(int32_t *src, unsigned int len, unsigned int shift);
                     +
                     +extern void ff_float_to_fixed24_3dnow(int32_t *dst, const float *src, unsigned int len);
                     +extern void ff_float_to_fixed24_sse  (int32_t *dst, const float *src, unsigned int len);
                     +extern void ff_float_to_fixed24_sse2 (int32_t *dst, const float *src, unsigned int len);
                     +
                     +extern int ff_ac3_compute_mantissa_size_sse2(uint16_t mant_cnt[6][16]);
                     +
                     +extern void ff_ac3_extract_exponents_3dnow(uint8_t *exp, int32_t *coef, int nb_coefs);
                     +extern void ff_ac3_extract_exponents_sse2 (uint8_t *exp, int32_t *coef, int nb_coefs);
                     +extern void ff_ac3_extract_exponents_ssse3(uint8_t *exp, int32_t *coef, int nb_coefs);
                     +
                     +av_cold void ff_ac3dsp_init_x86(AC3DSPContext *c, int bit_exact)
                     +{
                     +#if HAVE_YASM
                     +    int mm_flags = av_get_cpu_flags();
                     +
                     +    if (mm_flags & AV_CPU_FLAG_MMX) {
                     +        c->ac3_exponent_min = ff_ac3_exponent_min_mmx;
                     +        c->ac3_max_msb_abs_int16 = ff_ac3_max_msb_abs_int16_mmx;
                     +        c->ac3_lshift_int16 = ff_ac3_lshift_int16_mmx;
                     +        c->ac3_rshift_int32 = ff_ac3_rshift_int32_mmx;
                     +    }
                     +    if (mm_flags & AV_CPU_FLAG_3DNOW && HAVE_AMD3DNOW) {
                     +        c->extract_exponents = ff_ac3_extract_exponents_3dnow;
                     +        if (!bit_exact) {
                     +            c->float_to_fixed24 = ff_float_to_fixed24_3dnow;
                     +        }
                     +    }
                     +    if (mm_flags & AV_CPU_FLAG_MMXEXT && HAVE_MMXEXT) {
                     +        c->ac3_exponent_min = ff_ac3_exponent_min_mmxext;
                     +        c->ac3_max_msb_abs_int16 = ff_ac3_max_msb_abs_int16_mmx2;
                     +    }
                     +    if (mm_flags & AV_CPU_FLAG_SSE && HAVE_SSE) {
                     +        c->float_to_fixed24 = ff_float_to_fixed24_sse;
                     +    }
                     +    if (mm_flags & AV_CPU_FLAG_SSE2 && HAVE_SSE) {
                     +        c->ac3_exponent_min = ff_ac3_exponent_min_sse2;
                     +        c->ac3_max_msb_abs_int16 = ff_ac3_max_msb_abs_int16_sse2;
                     +        c->float_to_fixed24 = ff_float_to_fixed24_sse2;
                     +        c->compute_mantissa_size = ff_ac3_compute_mantissa_size_sse2;
                     +        c->extract_exponents = ff_ac3_extract_exponents_sse2;
                     +        if (!(mm_flags & AV_CPU_FLAG_SSE2SLOW)) {
                     +            c->ac3_lshift_int16 = ff_ac3_lshift_int16_sse2;
                     +            c->ac3_rshift_int32 = ff_ac3_rshift_int32_sse2;
                     +        }
                     +    }
                     +    if (mm_flags & AV_CPU_FLAG_SSSE3 && HAVE_SSSE3) {
                     +        c->ac3_max_msb_abs_int16 = ff_ac3_max_msb_abs_int16_ssse3;
                     +        if (!(mm_flags & AV_CPU_FLAG_ATOM)) {
                     +            c->extract_exponents = ff_ac3_extract_exponents_ssse3;
                     +        }
                     +    }
                     +#endif
                     +}

                     deleted file mode 100644
@@ -1,72 +0,0 @@
                     -/*
                     - * This file is part of FFmpeg.
                     - *
                     - * FFmpeg is free software; you can redistribute it and/or
                     - * modify it under the terms of the GNU Lesser General Public
                     - * License as published by the Free Software Foundation; either
                     - * version 2.1 of the License, or (at your option) any later version.
                     - *
                     - * FFmpeg is distributed in the hope that it will be useful,
                     - * but WITHOUT ANY WARRANTY; without even the implied warranty of
                     - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
                     - * Lesser General Public License for more details.
                     - *
                     - * You should have received a copy of the GNU Lesser General Public
                     - * License along with FFmpeg; if not, write to the Free Software
                     - * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
                     - */
                     -
                     -#include "libavutil/cpu.h"
                     -#include "libavcodec/dsputil.h"
                     -#include "libavcodec/dct.h"
                     -#include "fft.h"
                     -
                     -av_cold void ff_fft_init_mmx(FFTContext *s)
                     -{
                     -#if HAVE_YASM
                     -    int has_vectors = av_get_cpu_flags();
                     -#if ARCH_X86_32
                     -    if (has_vectors & AV_CPU_FLAG_3DNOW && HAVE_AMD3DNOW) {
                     -        /* 3DNow! for K6-2/3 */
                     -        s->imdct_calc = ff_imdct_calc_3dnow;
                     -        s->imdct_half = ff_imdct_half_3dnow;
                     -        s->fft_calc   = ff_fft_calc_3dnow;
                     -    }
                     -    if (has_vectors & AV_CPU_FLAG_3DNOWEXT && HAVE_AMD3DNOWEXT) {
                     -        /* 3DNowEx for K7 */
                     -        s->imdct_calc = ff_imdct_calc_3dnowext;
                     -        s->imdct_half = ff_imdct_half_3dnowext;
                     -        s->fft_calc   = ff_fft_calc_3dnowext;
                     -    }
                     -#endif
                     -    if (has_vectors & AV_CPU_FLAG_SSE && HAVE_SSE) {
                     -        /* SSE for P3/P4/K8 */
                     -        s->imdct_calc  = ff_imdct_calc_sse;
                     -        s->imdct_half  = ff_imdct_half_sse;
                     -        s->fft_permute = ff_fft_permute_sse;
                     -        s->fft_calc    = ff_fft_calc_sse;
                     -        s->fft_permutation = FF_FFT_PERM_SWAP_LSBS;
                     -    }
                     -    if (has_vectors & AV_CPU_FLAG_AVX && HAVE_AVX && s->nbits >= 5) {
                     -        /* AVX for SB */
                     -        s->imdct_half      = ff_imdct_half_avx;
                     -        s->fft_calc        = ff_fft_calc_avx;
                     -        s->fft_permutation = FF_FFT_PERM_AVX;
                     -    }
                     -#endif
                     -}
                     -
                     -#if CONFIG_DCT
                     -av_cold void ff_dct_init_mmx(DCTContext *s)
                     -{
                     -#if HAVE_YASM
                     -    int has_vectors = av_get_cpu_flags();
                     -    if (has_vectors & AV_CPU_FLAG_SSE && HAVE_SSE)
                     -        s->dct32 = ff_dct32_float_sse;
                     -    if (has_vectors & AV_CPU_FLAG_SSE2 && HAVE_SSE)
                     -        s->dct32 = ff_dct32_float_sse2;
                     -    if (has_vectors & AV_CPU_FLAG_AVX && HAVE_AVX)
                     -        s->dct32 = ff_dct32_float_avx;
                     -#endif
                     -}
                     -#endif

                     new file mode 100644
@@ -0,0 +1,147 @@
                     +/*
                     + * Format Conversion Utils
                     + * Copyright (c) 2000, 2001 Fabrice Bellard
                     + * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at>
                     + *
                     + * This file is part of FFmpeg.
                     + *
                     + * FFmpeg is free software; you can redistribute it and/or
                     + * modify it under the terms of the GNU Lesser General Public
                     + * License as published by the Free Software Foundation; either
                     + * version 2.1 of the License, or (at your option) any later version.
                     + *
                     + * FFmpeg is distributed in the hope that it will be useful,
                     + * but WITHOUT ANY WARRANTY; without even the implied warranty of
                     + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
                     + * Lesser General Public License for more details.
                     + *
                     + * You should have received a copy of the GNU Lesser General Public
                     + * License along with FFmpeg; if not, write to the Free Software
                     + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
                     + *
                     + * MMX optimization by Nick Kurshev <nickols_k@mail.ru>
                     + */
+                    +
                     +#include "libavutil/cpu.h"
                     +#include "libavutil/x86/asm.h"
                     +#include "libavcodec/fmtconvert.h"
                     +#include "libavcodec/dsputil.h"
+                    +
                     +#if HAVE_YASM
+                    +
                     +void ff_int32_to_float_fmul_scalar_sse (float *dst, const int *src, float mul, int len);
                     +void ff_int32_to_float_fmul_scalar_sse2(float *dst, const int *src, float mul, int len);
+                    +
                     +void ff_float_to_int16_3dnow(int16_t *dst, const float *src, long len);
                     +void ff_float_to_int16_sse  (int16_t *dst, const float *src, long len);
                     +void ff_float_to_int16_sse2 (int16_t *dst, const float *src, long len);
+                    +
                     +void ff_float_to_int16_step_3dnow(int16_t *dst, const float *src, long len, long step);
                     +void ff_float_to_int16_step_sse  (int16_t *dst, const float *src, long len, long step);
                     +void ff_float_to_int16_step_sse2 (int16_t *dst, const float *src, long len, long step);
+                    +
                     +void ff_float_to_int16_interleave2_3dnow(int16_t *dst, const float **src, long len);
                     +void ff_float_to_int16_interleave2_sse  (int16_t *dst, const float **src, long len);
                     +void ff_float_to_int16_interleave2_sse2 (int16_t *dst, const float **src, long len);
+                    +
                     +void ff_float_to_int16_interleave6_sse(int16_t *dst, const float **src, int len);
                     +void ff_float_to_int16_interleave6_3dnow(int16_t *dst, const float **src, int len);
                     +void ff_float_to_int16_interleave6_3dnowext(int16_t *dst, const float **src, int len);
+                    +
                     +#define ff_float_to_int16_interleave6_sse2 ff_float_to_int16_interleave6_sse
+                    +
                     +#define FLOAT_TO_INT16_INTERLEAVE(cpu) \
                     +/* gcc pessimizes register allocation if this is in the same function as float_to_int16_interleave_sse2*/\
                     +static av_noinline void float_to_int16_interleave_misc_##cpu(int16_t *dst, const float **src, long len, int channels){\
                     +    int c;\
                     +    for(c=0; c<channels; c++){\
                     +        ff_float_to_int16_step_##cpu(dst+c, src[c], len, channels);\
                     +    }\
                     +}\
                     +\
                     +static void float_to_int16_interleave_##cpu(int16_t *dst, const float **src, long len, int channels){\
                     +    if(channels==1)\
                     +        ff_float_to_int16_##cpu(dst, src[0], len);\
                     +    else if(channels==2){\
                     +        ff_float_to_int16_interleave2_##cpu(dst, src, len);\
                     +    }else if(channels==6){\
                     +        ff_float_to_int16_interleave6_##cpu(dst, src, len);\
                     +    }else\
                     +        float_to_int16_interleave_misc_##cpu(dst, src, len, channels);\
                     +}
+                    +
                     +FLOAT_TO_INT16_INTERLEAVE(3dnow)
                     +FLOAT_TO_INT16_INTERLEAVE(sse)
                     +FLOAT_TO_INT16_INTERLEAVE(sse2)
+                    +
                     +static void float_to_int16_interleave_3dnowext(int16_t *dst, const float **src,
                     +                                               long len, int channels)
                     +{
                     +    if(channels==6)
                     +        ff_float_to_int16_interleave6_3dnowext(dst, src, len);
                     +    else
                     +        float_to_int16_interleave_3dnow(dst, src, len, channels);
                     +}
+                    +
                     +void ff_float_interleave2_mmx(float *dst, const float **src, unsigned int len);
                     +void ff_float_interleave2_sse(float *dst, const float **src, unsigned int len);
+                    +
                     +void ff_float_interleave6_mmx(float *dst, const float **src, unsigned int len);
                     +void ff_float_interleave6_sse(float *dst, const float **src, unsigned int len);
+                    +
                     +static void float_interleave_mmx(float *dst, const float **src,
                     +                                 unsigned int len, int channels)
                     +{
                     +    if (channels == 2) {
                     +        ff_float_interleave2_mmx(dst, src, len);
                     +    } else if (channels == 6)
                     +        ff_float_interleave6_mmx(dst, src, len);
                     +    else
                     +        ff_float_interleave_c(dst, src, len, channels);
                     +}
+                    +
                     +static void float_interleave_sse(float *dst, const float **src,
                     +                                 unsigned int len, int channels)
                     +{
                     +    if (channels == 2) {
                     +        ff_float_interleave2_sse(dst, src, len);
                     +    } else if (channels == 6)
                     +        ff_float_interleave6_sse(dst, src, len);
                     +    else
                     +        ff_float_interleave_c(dst, src, len, channels);
                     +}
                     +#endif
+                    +
                     +void ff_fmt_convert_init_x86(FmtConvertContext *c, AVCodecContext *avctx)
                     +{
                     +#if HAVE_YASM
                     +    int mm_flags = av_get_cpu_flags();
+                    +
                     +    if (mm_flags & AV_CPU_FLAG_MMX) {
                     +        c->float_interleave = float_interleave_mmx;
+                    +
                     +        if (HAVE_AMD3DNOW && mm_flags & AV_CPU_FLAG_3DNOW) {
                     +            if(!(avctx->flags & CODEC_FLAG_BITEXACT)){
                     +                c->float_to_int16 = ff_float_to_int16_3dnow;
                     +                c->float_to_int16_interleave = float_to_int16_interleave_3dnow;
                     +            }
                     +        }
                     +        if (HAVE_AMD3DNOWEXT && mm_flags & AV_CPU_FLAG_3DNOWEXT) {
                     +            if(!(avctx->flags & CODEC_FLAG_BITEXACT)){
                     +                c->float_to_int16_interleave = float_to_int16_interleave_3dnowext;
                     +            }
                     +        }
                     +        if (HAVE_SSE && mm_flags & AV_CPU_FLAG_SSE) {
                     +            c->int32_to_float_fmul_scalar = ff_int32_to_float_fmul_scalar_sse;
                     +            c->float_to_int16 = ff_float_to_int16_sse;
                     +            c->float_to_int16_interleave = float_to_int16_interleave_sse;
                     +            c->float_interleave = float_interleave_sse;
                     +        }
                     +        if (HAVE_SSE && mm_flags & AV_CPU_FLAG_SSE2) {
                     +            c->int32_to_float_fmul_scalar = ff_int32_to_float_fmul_scalar_sse2;
                     +            c->float_to_int16 = ff_float_to_int16_sse2;
                     +            c->float_to_int16_interleave = float_to_int16_interleave_sse2;
                     +        }
                     +    }
                     +#endif
                     +}

                     new file mode 100644
@@ -0,0 +1,385 @@
                     +/*
                     + * Copyright (c) 2004-2005 Michael Niedermayer, Loren Merritt
                     + *
                     + * This file is part of FFmpeg.
                     + *
                     + * FFmpeg is free software; you can redistribute it and/or
                     + * modify it under the terms of the GNU Lesser General Public
                     + * License as published by the Free Software Foundation; either
                     + * version 2.1 of the License, or (at your option) any later version.
                     + *
                     + * FFmpeg is distributed in the hope that it will be useful,
                     + * but WITHOUT ANY WARRANTY; without even the implied warranty of
                     + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
                     + * Lesser General Public License for more details.
                     + *
                     + * You should have received a copy of the GNU Lesser General Public
                     + * License along with FFmpeg; if not, write to the Free Software
                     + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
                     + */
+                    +
                     +#include "libavutil/cpu.h"
                     +#include "libavutil/x86/asm.h"
                     +#include "libavcodec/h264dsp.h"
                     +#include "dsputil_mmx.h"
+                    +
                     +/***********************************/
                     +/* IDCT */
                     +#define IDCT_ADD_FUNC(NUM, DEPTH, OPT)                                  \
                     +void ff_h264_idct ## NUM ## _add_ ## DEPTH ## _ ## OPT(uint8_t *dst,    \
                     +                                                       int16_t *block,  \
                     +                                                       int stride);
+                    +
                     +IDCT_ADD_FUNC(, 8, mmx)
                     +IDCT_ADD_FUNC(, 10, sse2)
                     +IDCT_ADD_FUNC(_dc, 8, mmx2)
                     +IDCT_ADD_FUNC(_dc, 10, mmx2)
                     +IDCT_ADD_FUNC(8_dc, 8, mmx2)
                     +IDCT_ADD_FUNC(8_dc, 10, sse2)
                     +IDCT_ADD_FUNC(8, 8, mmx)
                     +IDCT_ADD_FUNC(8, 8, sse2)
                     +IDCT_ADD_FUNC(8, 10, sse2)
                     +#if HAVE_AVX
                     +IDCT_ADD_FUNC(, 10, avx)
                     +IDCT_ADD_FUNC(8_dc, 10, avx)
                     +IDCT_ADD_FUNC(8, 10, avx)
                     +#endif
+                    +
+                    +
                     +#define IDCT_ADD_REP_FUNC(NUM, REP, DEPTH, OPT)                         \
                     +void ff_h264_idct ## NUM ## _add ## REP ## _ ## DEPTH ## _ ## OPT       \
                     +    (uint8_t *dst, const int *block_offset,                             \
                     +     DCTELEM *block, int stride, const uint8_t nnzc[6 * 8]);
+                    +
                     +IDCT_ADD_REP_FUNC(8, 4, 8, mmx)
                     +IDCT_ADD_REP_FUNC(8, 4, 8, mmx2)
                     +IDCT_ADD_REP_FUNC(8, 4, 8, sse2)
                     +IDCT_ADD_REP_FUNC(8, 4, 10, sse2)
                     +IDCT_ADD_REP_FUNC(8, 4, 10, avx)
                     +IDCT_ADD_REP_FUNC(, 16, 8, mmx)
                     +IDCT_ADD_REP_FUNC(, 16, 8, mmx2)
                     +IDCT_ADD_REP_FUNC(, 16, 8, sse2)
                     +IDCT_ADD_REP_FUNC(, 16, 10, sse2)
                     +IDCT_ADD_REP_FUNC(, 16intra, 8, mmx)
                     +IDCT_ADD_REP_FUNC(, 16intra, 8, mmx2)
                     +IDCT_ADD_REP_FUNC(, 16intra, 8, sse2)
                     +IDCT_ADD_REP_FUNC(, 16intra, 10, sse2)
                     +#if HAVE_AVX
                     +IDCT_ADD_REP_FUNC(, 16, 10, avx)
                     +IDCT_ADD_REP_FUNC(, 16intra, 10, avx)
                     +#endif
+                    +
+                    +
                     +#define IDCT_ADD_REP_FUNC2(NUM, REP, DEPTH, OPT)                      \
                     +void ff_h264_idct ## NUM ## _add ## REP ## _ ## DEPTH ## _ ## OPT     \
                     +    (uint8_t **dst, const int *block_offset,                          \
                     +     DCTELEM *block, int stride, const uint8_t nnzc[6 * 8]);
+                    +
                     +IDCT_ADD_REP_FUNC2(, 8, 8, mmx)
                     +IDCT_ADD_REP_FUNC2(, 8, 8, mmx2)
                     +IDCT_ADD_REP_FUNC2(, 8, 8, sse2)
                     +IDCT_ADD_REP_FUNC2(, 8, 10, sse2)
                     +#if HAVE_AVX
                     +IDCT_ADD_REP_FUNC2(, 8, 10, avx)
                     +#endif
+                    +
                     +void ff_h264_luma_dc_dequant_idct_mmx(DCTELEM *output, DCTELEM *input, int qmul);
                     +void ff_h264_luma_dc_dequant_idct_sse2(DCTELEM *output, DCTELEM *input, int qmul);
+                    +
                     +/***********************************/
                     +/* deblocking */
+                    +
                     +void ff_h264_loop_filter_strength_mmx2(int16_t bS[2][4][4], uint8_t nnz[40],
                     +                                       int8_t ref[2][40], int16_t mv[2][40][2],
                     +                                       int bidir, int edges, int step,
                     +                                       int mask_mv0, int mask_mv1, int field);
+                    +
                     +#define LF_FUNC(DIR, TYPE, DEPTH, OPT)                                        \
                     +void ff_deblock_ ## DIR ## _ ## TYPE ## _ ## DEPTH ## _ ## OPT(uint8_t *pix,  \
                     +                                                               int stride,    \
                     +                                                               int alpha,     \
                     +                                                               int beta,      \
                     +                                                               int8_t *tc0);
                     +#define LF_IFUNC(DIR, TYPE, DEPTH, OPT) \
                     +void ff_deblock_ ## DIR ## _ ## TYPE ## _ ## DEPTH ## _ ## OPT(uint8_t *pix,  \
                     +                                                               int stride,    \
                     +                                                               int alpha,     \
                     +                                                               int beta);
+                    +
                     +#define LF_FUNCS(type, depth)                   \
                     +LF_FUNC(h,  chroma,       depth, mmx2)          \
                     +LF_IFUNC(h, chroma_intra, depth, mmx2)          \
                     +LF_FUNC(v,  chroma,       depth, mmx2)          \
                     +LF_IFUNC(v, chroma_intra, depth, mmx2)          \
                     +LF_FUNC(h,  luma,         depth, mmx2)          \
                     +LF_IFUNC(h, luma_intra,   depth, mmx2)          \
                     +LF_FUNC(h,  luma,         depth, sse2)          \
                     +LF_IFUNC(h, luma_intra,   depth, sse2)          \
                     +LF_FUNC(v,  luma,         depth, sse2)          \
                     +LF_IFUNC(v, luma_intra,   depth, sse2)          \
                     +LF_FUNC(h,  chroma,       depth, sse2)          \
                     +LF_IFUNC(h, chroma_intra, depth, sse2)          \
                     +LF_FUNC(v,  chroma,       depth, sse2)          \
                     +LF_IFUNC(v, chroma_intra, depth, sse2)          \
                     +LF_FUNC(h,  luma,         depth, avx)           \
                     +LF_IFUNC(h, luma_intra,   depth, avx)           \
                     +LF_FUNC(v,  luma,         depth, avx)           \
                     +LF_IFUNC(v, luma_intra,   depth, avx)           \
                     +LF_FUNC(h,  chroma,       depth, avx)           \
                     +LF_IFUNC(h, chroma_intra, depth, avx)           \
                     +LF_FUNC(v,  chroma,       depth, avx)           \
                     +LF_IFUNC(v, chroma_intra, depth, avx)
+                    +
                     +LF_FUNCS(uint8_t,   8)
                     +LF_FUNCS(uint16_t, 10)
+                    +
                     +#if ARCH_X86_32 && HAVE_YASM
                     +LF_FUNC(v8, luma, 8, mmx2)
                     +static void ff_deblock_v_luma_8_mmx2(uint8_t *pix, int stride, int alpha,
                     +                                     int beta, int8_t *tc0)
                     +{
                     +    if ((tc0[0] & tc0[1]) >= 0)
                     +        ff_deblock_v8_luma_8_mmx2(pix + 0, stride, alpha, beta, tc0);
                     +    if ((tc0[2] & tc0[3]) >= 0)
                     +        ff_deblock_v8_luma_8_mmx2(pix + 8, stride, alpha, beta, tc0 + 2);
                     +}
+                    +
                     +LF_IFUNC(v8, luma_intra, 8, mmx2)
                     +static void ff_deblock_v_luma_intra_8_mmx2(uint8_t *pix, int stride,
                     +                                           int alpha, int beta)
                     +{
                     +    ff_deblock_v8_luma_intra_8_mmx2(pix + 0, stride, alpha, beta);
                     +    ff_deblock_v8_luma_intra_8_mmx2(pix + 8, stride, alpha, beta);
                     +}
                     +#endif /* ARCH_X86_32 */
+                    +
                     +LF_FUNC(v,  luma,       10, mmx2)
                     +LF_IFUNC(v, luma_intra, 10, mmx2)
+                    +
                     +/***********************************/
                     +/* weighted prediction */
+                    +
                     +#define H264_WEIGHT(W, OPT)                                             \
                     +void ff_h264_weight_ ## W ## _ ## OPT(uint8_t *dst, int stride,         \
                     +                                      int height, int log2_denom,       \
                     +                                      int weight, int offset);
+                    +
                     +#define H264_BIWEIGHT(W, OPT)                                           \
                     +void ff_h264_biweight_ ## W ## _ ## OPT(uint8_t *dst, uint8_t *src,     \
                     +                                        int stride, int height,         \
                     +                                        int log2_denom, int weightd,    \
                     +                                        int weights, int offset);
+                    +
                     +#define H264_BIWEIGHT_MMX(W)                    \
                     +    H264_WEIGHT(W, mmx2)                        \
                     +    H264_BIWEIGHT(W, mmx2)
+                    +
                     +#define H264_BIWEIGHT_MMX_SSE(W)                \
                     +    H264_BIWEIGHT_MMX(W)                        \
                     +    H264_WEIGHT(W, sse2)                        \
                     +    H264_BIWEIGHT(W, sse2)                      \
                     +    H264_BIWEIGHT(W, ssse3)
+                    +
                     +H264_BIWEIGHT_MMX_SSE(16)
                     +H264_BIWEIGHT_MMX_SSE(8)
                     +H264_BIWEIGHT_MMX(4)
+                    +
                     +#define H264_WEIGHT_10(W, DEPTH, OPT)                                   \
                     +void ff_h264_weight_ ## W ## _ ## DEPTH ## _ ## OPT(uint8_t *dst,       \
                     +                                                    int stride,         \
                     +                                                    int height,         \
                     +                                                    int log2_denom,     \
                     +                                                    int weight,         \
                     +                                                    int offset);
+                    +
                     +#define H264_BIWEIGHT_10(W, DEPTH, OPT)                                 \
                     +void ff_h264_biweight_ ## W ## _ ## DEPTH ## _ ## OPT(uint8_t *dst,     \
                     +                                                      uint8_t *src,     \
                     +                                                      int stride,       \
                     +                                                      int height,       \
                     +                                                      int log2_denom,   \
                     +                                                      int weightd,      \
                     +                                                      int weights,      \
                     +                                                      int offset);
+                    +
                     +#define H264_BIWEIGHT_10_SSE(W, DEPTH)          \
                     +    H264_WEIGHT_10(W, DEPTH, sse2)              \
                     +    H264_WEIGHT_10(W, DEPTH, sse4)              \
                     +    H264_BIWEIGHT_10(W, DEPTH, sse2)            \
                     +    H264_BIWEIGHT_10(W, DEPTH, sse4)
+                    +
                     +H264_BIWEIGHT_10_SSE(16, 10)
                     +H264_BIWEIGHT_10_SSE(8,  10)
                     +H264_BIWEIGHT_10_SSE(4,  10)
+                    +
                     +void ff_h264dsp_init_x86(H264DSPContext *c, const int bit_depth,
                     +                         const int chroma_format_idc)
                     +{
                     +#if HAVE_YASM
                     +    int mm_flags = av_get_cpu_flags();
+                    +
                     +    if (chroma_format_idc == 1 && mm_flags & AV_CPU_FLAG_MMXEXT)
                     +        c->h264_loop_filter_strength = ff_h264_loop_filter_strength_mmx2;
+                    +
                     +    if (bit_depth == 8) {
                     +        if (mm_flags & AV_CPU_FLAG_MMX) {
                     +            c->h264_idct_dc_add   =
                     +            c->h264_idct_add      = ff_h264_idct_add_8_mmx;
                     +            c->h264_idct8_dc_add  =
                     +            c->h264_idct8_add     = ff_h264_idct8_add_8_mmx;
+                    +
                     +            c->h264_idct_add16 = ff_h264_idct_add16_8_mmx;
                     +            c->h264_idct8_add4 = ff_h264_idct8_add4_8_mmx;
                     +            if (chroma_format_idc == 1)
                     +                c->h264_idct_add8 = ff_h264_idct_add8_8_mmx;
                     +            c->h264_idct_add16intra = ff_h264_idct_add16intra_8_mmx;
                     +            if (mm_flags & AV_CPU_FLAG_CMOV)
                     +                c->h264_luma_dc_dequant_idct = ff_h264_luma_dc_dequant_idct_mmx;
+                    +
                     +            if (mm_flags & AV_CPU_FLAG_MMXEXT) {
                     +                c->h264_idct_dc_add  = ff_h264_idct_dc_add_8_mmx2;
                     +                c->h264_idct8_dc_add = ff_h264_idct8_dc_add_8_mmx2;
                     +                c->h264_idct_add16   = ff_h264_idct_add16_8_mmx2;
                     +                c->h264_idct8_add4   = ff_h264_idct8_add4_8_mmx2;
                     +                if (chroma_format_idc == 1)
                     +                    c->h264_idct_add8 = ff_h264_idct_add8_8_mmx2;
                     +                c->h264_idct_add16intra = ff_h264_idct_add16intra_8_mmx2;
+                    +
                     +                c->h264_v_loop_filter_chroma       = ff_deblock_v_chroma_8_mmx2;
                     +                c->h264_v_loop_filter_chroma_intra = ff_deblock_v_chroma_intra_8_mmx2;
                     +                if (chroma_format_idc == 1) {
                     +                    c->h264_h_loop_filter_chroma       = ff_deblock_h_chroma_8_mmx2;
                     +                    c->h264_h_loop_filter_chroma_intra = ff_deblock_h_chroma_intra_8_mmx2;
                     +                }
                     +#if ARCH_X86_32
                     +                c->h264_v_loop_filter_luma       = ff_deblock_v_luma_8_mmx2;
                     +                c->h264_h_loop_filter_luma       = ff_deblock_h_luma_8_mmx2;
                     +                c->h264_v_loop_filter_luma_intra = ff_deblock_v_luma_intra_8_mmx2;
                     +                c->h264_h_loop_filter_luma_intra = ff_deblock_h_luma_intra_8_mmx2;
                     +#endif /* ARCH_X86_32 */
                     +                c->weight_h264_pixels_tab[0] = ff_h264_weight_16_mmx2;
                     +                c->weight_h264_pixels_tab[1] = ff_h264_weight_8_mmx2;
                     +                c->weight_h264_pixels_tab[2] = ff_h264_weight_4_mmx2;
+                    +
                     +                c->biweight_h264_pixels_tab[0] = ff_h264_biweight_16_mmx2;
                     +                c->biweight_h264_pixels_tab[1] = ff_h264_biweight_8_mmx2;
                     +                c->biweight_h264_pixels_tab[2] = ff_h264_biweight_4_mmx2;
+                    +
                     +                if (mm_flags & AV_CPU_FLAG_SSE2) {
                     +                    c->h264_idct8_add  = ff_h264_idct8_add_8_sse2;
+                    +
                     +                    c->h264_idct_add16 = ff_h264_idct_add16_8_sse2;
                     +                    c->h264_idct8_add4 = ff_h264_idct8_add4_8_sse2;
                     +                    if (chroma_format_idc == 1)
                     +                        c->h264_idct_add8 = ff_h264_idct_add8_8_sse2;
                     +                    c->h264_idct_add16intra      = ff_h264_idct_add16intra_8_sse2;
                     +                    c->h264_luma_dc_dequant_idct = ff_h264_luma_dc_dequant_idct_sse2;
+                    +
                     +                    c->weight_h264_pixels_tab[0] = ff_h264_weight_16_sse2;
                     +                    c->weight_h264_pixels_tab[1] = ff_h264_weight_8_sse2;
+                    +
                     +                    c->biweight_h264_pixels_tab[0] = ff_h264_biweight_16_sse2;
                     +                    c->biweight_h264_pixels_tab[1] = ff_h264_biweight_8_sse2;
+                    +
                     +#if HAVE_ALIGNED_STACK
                     +                    c->h264_v_loop_filter_luma       = ff_deblock_v_luma_8_sse2;
                     +                    c->h264_h_loop_filter_luma       = ff_deblock_h_luma_8_sse2;
                     +                    c->h264_v_loop_filter_luma_intra = ff_deblock_v_luma_intra_8_sse2;
                     +                    c->h264_h_loop_filter_luma_intra = ff_deblock_h_luma_intra_8_sse2;
                     +#endif /* HAVE_ALIGNED_STACK */
                     +                }
                     +                if (mm_flags & AV_CPU_FLAG_SSSE3) {
                     +                    c->biweight_h264_pixels_tab[0] = ff_h264_biweight_16_ssse3;
                     +                    c->biweight_h264_pixels_tab[1] = ff_h264_biweight_8_ssse3;
                     +                }
                     +                if (HAVE_AVX && mm_flags & AV_CPU_FLAG_AVX) {
                     +#if HAVE_ALIGNED_STACK
                     +                    c->h264_v_loop_filter_luma       = ff_deblock_v_luma_8_avx;
                     +                    c->h264_h_loop_filter_luma       = ff_deblock_h_luma_8_avx;
                     +                    c->h264_v_loop_filter_luma_intra = ff_deblock_v_luma_intra_8_avx;
                     +                    c->h264_h_loop_filter_luma_intra = ff_deblock_h_luma_intra_8_avx;
                     +#endif /* HAVE_ALIGNED_STACK */
                     +                }
                     +            }
                     +        }
                     +    } else if (bit_depth == 10) {
                     +        if (mm_flags & AV_CPU_FLAG_MMX) {
                     +            if (mm_flags & AV_CPU_FLAG_MMXEXT) {
                     +#if ARCH_X86_32
                     +                c->h264_v_loop_filter_chroma       = ff_deblock_v_chroma_10_mmx2;
                     +                c->h264_v_loop_filter_chroma_intra = ff_deblock_v_chroma_intra_10_mmx2;
                     +                c->h264_v_loop_filter_luma         = ff_deblock_v_luma_10_mmx2;
                     +                c->h264_h_loop_filter_luma         = ff_deblock_h_luma_10_mmx2;
                     +                c->h264_v_loop_filter_luma_intra   = ff_deblock_v_luma_intra_10_mmx2;
                     +                c->h264_h_loop_filter_luma_intra   = ff_deblock_h_luma_intra_10_mmx2;
                     +#endif /* ARCH_X86_32 */
                     +                c->h264_idct_dc_add = ff_h264_idct_dc_add_10_mmx2;
                     +                if (mm_flags & AV_CPU_FLAG_SSE2) {
                     +                    c->h264_idct_add     = ff_h264_idct_add_10_sse2;
                     +                    c->h264_idct8_dc_add = ff_h264_idct8_dc_add_10_sse2;
+                    +
                     +                    c->h264_idct_add16 = ff_h264_idct_add16_10_sse2;
                     +                    if (chroma_format_idc == 1)
                     +                        c->h264_idct_add8 = ff_h264_idct_add8_10_sse2;
                     +                    c->h264_idct_add16intra = ff_h264_idct_add16intra_10_sse2;
                     +#if HAVE_ALIGNED_STACK
                     +                    c->h264_idct8_add  = ff_h264_idct8_add_10_sse2;
                     +                    c->h264_idct8_add4 = ff_h264_idct8_add4_10_sse2;
                     +#endif /* HAVE_ALIGNED_STACK */
+                    +
                     +                    c->weight_h264_pixels_tab[0] = ff_h264_weight_16_10_sse2;
                     +                    c->weight_h264_pixels_tab[1] = ff_h264_weight_8_10_sse2;
                     +                    c->weight_h264_pixels_tab[2] = ff_h264_weight_4_10_sse2;
+                    +
                     +                    c->biweight_h264_pixels_tab[0] = ff_h264_biweight_16_10_sse2;
                     +                    c->biweight_h264_pixels_tab[1] = ff_h264_biweight_8_10_sse2;
                     +                    c->biweight_h264_pixels_tab[2] = ff_h264_biweight_4_10_sse2;
+                    +
                     +                    c->h264_v_loop_filter_chroma       = ff_deblock_v_chroma_10_sse2;
                     +                    c->h264_v_loop_filter_chroma_intra = ff_deblock_v_chroma_intra_10_sse2;
                     +#if HAVE_ALIGNED_STACK
                     +                    c->h264_v_loop_filter_luma       = ff_deblock_v_luma_10_sse2;
                     +                    c->h264_h_loop_filter_luma       = ff_deblock_h_luma_10_sse2;
                     +                    c->h264_v_loop_filter_luma_intra = ff_deblock_v_luma_intra_10_sse2;
                     +                    c->h264_h_loop_filter_luma_intra = ff_deblock_h_luma_intra_10_sse2;
                     +#endif /* HAVE_ALIGNED_STACK */
                     +                }
                     +                if (mm_flags & AV_CPU_FLAG_SSE4) {
                     +                    c->weight_h264_pixels_tab[0] = ff_h264_weight_16_10_sse4;
                     +                    c->weight_h264_pixels_tab[1] = ff_h264_weight_8_10_sse4;
                     +                    c->weight_h264_pixels_tab[2] = ff_h264_weight_4_10_sse4;
+                    +
                     +                    c->biweight_h264_pixels_tab[0] = ff_h264_biweight_16_10_sse4;
                     +                    c->biweight_h264_pixels_tab[1] = ff_h264_biweight_8_10_sse4;
                     +                    c->biweight_h264_pixels_tab[2] = ff_h264_biweight_4_10_sse4;
                     +                }
                     +#if HAVE_AVX
                     +                if (mm_flags & AV_CPU_FLAG_AVX) {
                     +                    c->h264_idct_dc_add  =
                     +                    c->h264_idct_add     = ff_h264_idct_add_10_avx;
                     +                    c->h264_idct8_dc_add = ff_h264_idct8_dc_add_10_avx;
+                    +
                     +                    c->h264_idct_add16 = ff_h264_idct_add16_10_avx;
                     +                    if (chroma_format_idc == 1)
                     +                        c->h264_idct_add8 = ff_h264_idct_add8_10_avx;
                     +                    c->h264_idct_add16intra = ff_h264_idct_add16intra_10_avx;
                     +#if HAVE_ALIGNED_STACK
                     +                    c->h264_idct8_add  = ff_h264_idct8_add_10_avx;
                     +                    c->h264_idct8_add4 = ff_h264_idct8_add4_10_avx;
                     +#endif /* HAVE_ALIGNED_STACK */
+                    +
                     +                    c->h264_v_loop_filter_chroma       = ff_deblock_v_chroma_10_avx;
                     +                    c->h264_v_loop_filter_chroma_intra = ff_deblock_v_chroma_intra_10_avx;
                     +#if HAVE_ALIGNED_STACK
                     +                    c->h264_v_loop_filter_luma         = ff_deblock_v_luma_10_avx;
                     +                    c->h264_h_loop_filter_luma         = ff_deblock_h_luma_10_avx;
                     +                    c->h264_v_loop_filter_luma_intra   = ff_deblock_v_luma_intra_10_avx;
                     +                    c->h264_h_loop_filter_luma_intra   = ff_deblock_h_luma_intra_10_avx;
                     +#endif /* HAVE_ALIGNED_STACK */
                     +                }
                     +#endif /* HAVE_AVX */
                     +            }
                     +        }
                     +    }
                     +#endif /* HAVE_YASM */
                     +}

@@ -360,13 +360,5 @@ static int RENAME(dct_quantize)(MpegEncContext *s,
                              block[0x3E] = temp_block[0x3E]; block[0x3F] = temp_block[0x3F];
+                         }
                          end:
                     -/*
                     -    for(i=0; i<last_non_zero_p1; i++)
                     -    {
                     -       int j= zigzag_direct_noperm[i];
                     -       block[block_permute_op(j)]= temp_block[j];
                     -    }
                     -*/
+                    -
                          return last_non_zero_p1 - 1;
+                     }

@@ -33,15 +33,6 @@
                      #define HMAC_OPAD_VAL 0x5C
                      /**
                     - * A non-zero transaction id requires the server to send back
                     - * a _result or _error response.
                     - * Setting it to 0 marks the message as a notification not
                     - * requiring feedback.
                     - */
+                    -
                     -#define RTMP_NOTIFICATION 0
+                    -
                     -/**
                       * emulated Flash client version - 9.0.124.2 on Linux
                       * @{
                       */

@@ -91,7 +91,11 @@ typedef struct RTMPContext {
                          int           nb_invokes;                 ///< keeps track of invoke messages
                          char*         tcurl;                      ///< url of the target stream
                          char*         flashver;                   ///< version of the flash plugin
                     +    char*         swfhash;                    ///< SHA256 hash of the decompressed SWF file (32 bytes)
                     +    int           swfhash_len;                ///< length of the SHA256 hash
                     +    int           swfsize;                    ///< size of the decompressed SWF file
                          char*         swfurl;                     ///< url of the swf player
                     +    char          swfverification[42];        ///< hash of the SWF verification
                          char*         pageurl;                    ///< url of the web page
                          char*         subscribe;                  ///< name of live stream to subscribe
                          int           server_bw;                  ///< server bandwidth
@@ -593,6 +597,27 @@ static int gen_pong(URLContext *s, RTMPContext *rt, RTMPPacket *ppkt)
+                     }
                      /**
                     + * Generate SWF verification message and send it to the server.
                     + */
                     +static int gen_swf_verification(URLContext *s, RTMPContext *rt)
                     +{
                     +    RTMPPacket pkt;
                     +    uint8_t *p;
                     +    int ret;
+                    +
                     +    av_log(s, AV_LOG_DEBUG, "Sending SWF verification...\n");
                     +    if ((ret = ff_rtmp_packet_create(&pkt, RTMP_NETWORK_CHANNEL, RTMP_PT_PING,
                     +                                     0, 44)) < 0) /* 44 = 2 (be16 written below) + 42 (bytes copied below) */
                     +        return ret; /* packet creation failed: pass the error code to the caller */
+                    +
                     +    p = pkt.data;
                     +    bytestream_put_be16(&p, 27); /* 16-bit big-endian 27; handle_ping calls this function for t == 26, so 27 is presumably the matching reply type -- confirm against the RTMP spec */
                     +    memcpy(p, rt->swfverification, 42); /* copy the 42-byte rt->swfverification buffer; p presumably points past the 2-byte field since bytestream_put_be16 took &p */
+                    +
                     +    return rtmp_send_packet(rt, &pkt, 0); /* returns whatever rtmp_send_packet reports */
                     +}
+                    +
                     +/**
                       * Generate server bandwidth message and send it to the server.
                       */
                      static int gen_server_bw(URLContext *s, RTMPContext *rt)
@@ -626,10 +651,10 @@ static int gen_check_bw(URLContext *s, RTMPContext *rt)
                          p = pkt.data;
                          ff_amf_write_string(&p, "_checkbw");
                     -    ff_amf_write_number(&p, RTMP_NOTIFICATION);
                     +    ff_amf_write_number(&p, ++rt->nb_invokes);
                          ff_amf_write_null(&p);
                     -    return rtmp_send_packet(rt, &pkt, 0);
                     +    return rtmp_send_packet(rt, &pkt, 1);
+                     }
                      /**
@@ -776,6 +801,30 @@ static int rtmp_validate_digest(uint8_t *buf, int off)
                          return 0;
+                     }
                     +static int rtmp_calc_swf_verification(URLContext *s, RTMPContext *rt,
                     +                                      uint8_t *buf)
                     +{ /* Fill rt->swfverification; returns 0 on success, AVERROR(EINVAL) on a bad hash length, or the negative result of ff_rtmp_calc_digest */
                     +    uint8_t *p;
                     +    int ret;
+                    +
                     +    if (rt->swfhash_len != 32) { /* only a 32-byte hash is accepted */
                     +        av_log(s, AV_LOG_ERROR,
                     +               "Hash of the decompressed SWF file is not 32 bytes long.\n");
                     +        return AVERROR(EINVAL);
                     +    }
+                    +
                     +    p = &rt->swfverification[0]; /* NOTE(review): swfverification is declared char[42] while p is uint8_t * -- may raise a pointer-sign warning; confirm */
                     +    bytestream_put_byte(&p, 1); /* two leading bytes, both with value 1 */
                     +    bytestream_put_byte(&p, 1);
                     +    bytestream_put_be32(&p, rt->swfsize); /* swfsize is written twice, back to back, as 32-bit big-endian */
                     +    bytestream_put_be32(&p, rt->swfsize);
+                    +
                     +    if ((ret = ff_rtmp_calc_digest(rt->swfhash, 32, 0, buf, 32, p)) < 0) /* digest of the 32-byte swfhash using the 32 bytes at buf, output at p; presumably 32 bytes long so 1+1+4+4+32 fills the 42-byte buffer -- confirm */
                     +        return ret;
+                    +
                     +    return 0;
                     +}
+                    +
                      /**
                       * Perform handshake with the server by means of exchanging pseudorandom data
                       * signed with HMAC-SHA2 digest.
@@ -866,6 +915,14 @@ static int rtmp_handshake(URLContext *s, RTMPContext *rt)
+                                 }
+                             }
                     +        /* Generate SWFVerification token (SHA256 HMAC hash of decompressed SWF,
                     +         * the key being the last 32 bytes of the server handshake). */
                     +        if (rt->swfsize) {
                     +            if ((ret = rtmp_calc_swf_verification(s, rt, serverdata + 1 +
                     +                                                  RTMP_HANDSHAKE_PACKET_SIZE - 32)) < 0)
                     +                return ret;
                     +        }
+                    +
                              ret = ff_rtmp_calc_digest(tosend + 1 + client_pos, 32, 0,
                                                        rtmp_server_key, sizeof(rtmp_server_key),
                                                        digest);
@@ -1001,6 +1058,13 @@ static int handle_ping(URLContext *s, RTMPPacket *pkt)
                          if (t == 6) {
                              if ((ret = gen_pong(s, rt, pkt)) < 0)
                                  return ret;
                     +    } else if (t == 26) {
                     +        if (rt->swfsize) {
                     +            if ((ret = gen_swf_verification(s, rt)) < 0)
                     +                return ret;
                     +        } else {
                     +            av_log(s, AV_LOG_WARNING, "Ignoring SWFVerification request.\n");
                     +        }
+                         }
                          return 0;
@@ -1055,15 +1119,27 @@ static int handle_server_bw(URLContext *s, RTMPPacket *pkt)
                      static int handle_invoke_error(URLContext *s, RTMPPacket *pkt)
+                     { /* Log the "description" field of a server error; errors for a tracked "_checkbw" call are logged as warnings and yield 0, other described errors yield -1 */
                          const uint8_t *data_end = pkt->data + pkt->data_size;
                     +    char *tracked_method = NULL;
                     +    int level = AV_LOG_ERROR;
                          uint8_t tmpstr[256];
                     +    int ret;
+                    +
                     +    if ((ret = find_tracked_method(s, pkt, 9, &tracked_method)) < 0) /* offset 9 matches the pkt->data + 9 used for the field lookup below */
                     +        return ret;
                          if (!ff_amf_get_field_value(pkt->data + 9, data_end,
                                                      "description", tmpstr, sizeof(tmpstr))) {
                     -        av_log(s, AV_LOG_ERROR, "Server error: %s\n", tmpstr);
                     -        return -1;
                     +        if (tracked_method && !strcmp(tracked_method, "_checkbw")) {
                     +            /* Ignore _checkbw errors: log them as a warning and report success. */
                     +            level = AV_LOG_WARNING;
                     +            ret = 0;
                     +        } else
                     +            ret = -1; /* any other described server error is reported as a failure */
                     +        av_log(s, level, "Server error: %s\n", tmpstr);
+                         }
                     -    return 0;
                     +    av_free(tracked_method); /* released on every path past the lookup; presumably find_tracked_method allocates it -- confirm */
                     +    return ret; /* if the description branch was not taken, ret is still the non-negative value from find_tracked_method */
+                     }
                      static int handle_invoke_result(URLContext *s, RTMPPacket *pkt)
@@ -1705,6 +1781,8 @@ static const AVOption rtmp_options[] = {
                          {"rtmp_pageurl", "URL of the web page in which the media was embedded. By default no value will be sent.", OFFSET(pageurl), AV_OPT_TYPE_STRING, {.str = NULL }, 0, 0, DEC},
                          {"rtmp_playpath", "Stream identifier to play or to publish", OFFSET(playpath), AV_OPT_TYPE_STRING, {.str = NULL }, 0, 0, DEC|ENC},
                          {"rtmp_subscribe", "Name of live stream to subscribe to. Defaults to rtmp_playpath.", OFFSET(subscribe), AV_OPT_TYPE_STRING, {.str = NULL }, 0, 0, DEC},
                     +    {"rtmp_swfhash", "SHA256 hash of the decompressed SWF file (32 bytes).", OFFSET(swfhash), AV_OPT_TYPE_BINARY, .flags = DEC},
                     +    {"rtmp_swfsize", "Size of the decompressed SWF file, required for SWFVerification.", OFFSET(swfsize), AV_OPT_TYPE_INT, {0}, 0, INT_MAX, DEC},
                          {"rtmp_swfurl", "URL of the SWF player. By default no value will be sent", OFFSET(swfurl), AV_OPT_TYPE_STRING, {.str = NULL }, 0, 0, DEC|ENC},
                          {"rtmp_tcurl", "URL of the target stream. Defaults to proto://host[:port]/app.", OFFSET(tcurl), AV_OPT_TYPE_STRING, {.str = NULL }, 0, 0, DEC|ENC},
                          { NULL },

@@ -31,7 +31,7 @@
                      #define LIBAVFORMAT_VERSION_MAJOR 54
                      #define LIBAVFORMAT_VERSION_MINOR 23
                     -#define LIBAVFORMAT_VERSION_MICRO 100
                     +#define LIBAVFORMAT_VERSION_MICRO 101
                      #define LIBAVFORMAT_VERSION_INT AV_VERSION_INT(LIBAVFORMAT_VERSION_MAJOR, \
                                                                     LIBAVFORMAT_VERSION_MINOR, \

@@ -335,7 +335,9 @@ int ff_audio_mix_init(AVAudioResampleContext *avr)
                                                            avr->out_channel_layout,
                                                            avr->center_mix_level,
                                                            avr->surround_mix_level,
                     -                                      avr->lfe_mix_level, 1, matrix_dbl,
                     +                                      avr->lfe_mix_level,
                     +                                      avr->normalize_mix_level,
                     +                                      matrix_dbl,
                                                            avr->in_channels,
                                                            avr->matrix_encoding);
                              if (ret < 0) {

@@ -45,6 +45,7 @@ struct AVAudioResampleContext {
                          double center_mix_level;                    /**< center mix level       */
                          double surround_mix_level;                  /**< surround mix level     */
                          double lfe_mix_level;                       /**< lfe mix level          */
                     +    int normalize_mix_level;                    /**< enable mix level normalization */
                          int force_resampling;                       /**< force resampling       */
                          int filter_size;                            /**< length of each FIR filter in the resampling filterbank relative to the cutoff frequency */
                          int phase_shift;                            /**< log2 of the number of entries in the resampling polyphase filterbank */

@@ -47,6 +47,7 @@ static const AVOption options[] = {
                          { "center_mix_level",       "Center Mix Level",         OFFSET(center_mix_level),       AV_OPT_TYPE_DOUBLE, { M_SQRT1_2             }, -32.0,                32.0,                   PARAM },
                          { "surround_mix_level",     "Surround Mix Level",       OFFSET(surround_mix_level),     AV_OPT_TYPE_DOUBLE, { M_SQRT1_2             }, -32.0,                32.0,                   PARAM },
                          { "lfe_mix_level",          "LFE Mix Level",            OFFSET(lfe_mix_level),          AV_OPT_TYPE_DOUBLE, { 0.0                   }, -32.0,                32.0,                   PARAM },
                     +    { "normalize_mix_level",    "Normalize Mix Level",      OFFSET(normalize_mix_level),    AV_OPT_TYPE_INT,    { 1                     }, 0,                    1,                      PARAM },
                          { "force_resampling",       "Force Resampling",         OFFSET(force_resampling),       AV_OPT_TYPE_INT,    { 0                     }, 0,                    1,                      PARAM },
                          { "filter_size",            "Resampling Filter Size",   OFFSET(filter_size),            AV_OPT_TYPE_INT,    { 16                    }, 0,                    32, /* ??? */           PARAM },
                          { "phase_shift",            "Resampling Phase Shift",   OFFSET(phase_shift),            AV_OPT_TYPE_INT,    { 10                    }, 0,                    30, /* ??? */           PARAM },