Browse code

lavfi: USPP Filter

Previous version reviewed by: Stefano Sabatini <stefasab@gmail.com>
Signed-off-by: Michael Niedermayer <michaelni@gmx.at>

Arwa Arif authored on 2014/12/07 22:26:46
Showing 5 changed files
... ...
@@ -2622,6 +2622,7 @@ vidstabtransform_filter_deps="libvidstab"
2622 2622
 pixfmts_super2xsai_test_deps="super2xsai_filter"
2623 2623
 tinterlace_merge_test_deps="tinterlace_filter"
2624 2624
 tinterlace_pad_test_deps="tinterlace_filter"
2625
+uspp_filter_deps="gpl avcodec"
2625 2626
 zmq_filter_deps="libzmq"
2626 2627
 zoompan_filter_deps="swscale"
2627 2628
 
... ...
@@ -8935,6 +8935,31 @@ unsharp=7:7:-2:7:7:-2
8935 8935
 @end example
8936 8936
 @end itemize
8937 8937
 
8938
+@section uspp
8939
+
8940
+Apply ultra slow/simple postprocessing filter that compresses and decompresses
8941
+the image at several (or - in the case of @option{quality} level @code{8} - all)
8942
+shifts and averages the results.
8943
+
8944
+The way this differs from the behavior of spp is that uspp actually encodes &
8945
+decodes each case with libavcodec Snow, whereas spp uses a simplified intra-only 8x8
8946
+DCT similar to MJPEG.
8947
+
8948
+The filter accepts the following options:
8949
+
8950
+@table @option
8951
+@item quality
8952
+Set quality. This option defines the number of levels for averaging. It accepts
8953
+an integer in the range 0-8. If set to @code{0}, the filter will have no
8954
+effect. A value of @code{8} means the highest quality. For each increment of
8955
+that value the speed drops by a factor of approximately 2.  Default value is
8956
+@code{3}.
8957
+
8958
+@item qp
8959
+Force a constant quantization parameter. If not set, the filter will use the QP
8960
+from the video stream (if available).
8961
+@end table
8962
+
8938 8963
 @anchor{vidstabdetect}
8939 8964
 @section vidstabdetect
8940 8965
 
... ...
@@ -193,6 +193,7 @@ OBJS-$(CONFIG_TINTERLACE_FILTER)             += vf_tinterlace.o
193 193
 OBJS-$(CONFIG_TRANSPOSE_FILTER)              += vf_transpose.o
194 194
 OBJS-$(CONFIG_TRIM_FILTER)                   += trim.o
195 195
 OBJS-$(CONFIG_UNSHARP_FILTER)                += vf_unsharp.o
196
+OBJS-$(CONFIG_USPP_FILTER)                   += vf_uspp.o
196 197
 OBJS-$(CONFIG_VFLIP_FILTER)                  += vf_vflip.o
197 198
 OBJS-$(CONFIG_VIDSTABDETECT_FILTER)          += vidstabutils.o vf_vidstabdetect.o
198 199
 OBJS-$(CONFIG_VIDSTABTRANSFORM_FILTER)       += vidstabutils.o vf_vidstabtransform.o
... ...
@@ -208,6 +208,7 @@ void avfilter_register_all(void)
208 208
     REGISTER_FILTER(TRANSPOSE,      transpose,      vf);
209 209
     REGISTER_FILTER(TRIM,           trim,           vf);
210 210
     REGISTER_FILTER(UNSHARP,        unsharp,        vf);
211
+    REGISTER_FILTER(USPP,           uspp,           vf);
211 212
     REGISTER_FILTER(VFLIP,          vflip,          vf);
212 213
     REGISTER_FILTER(VIDSTABDETECT,  vidstabdetect,  vf);
213 214
     REGISTER_FILTER(VIDSTABTRANSFORM, vidstabtransform, vf);
214 215
new file mode 100644
... ...
@@ -0,0 +1,490 @@
0
+/*
1
+ * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
2
+ * Copyright (c) 2014 Arwa Arif <arwaarif1994@gmail.com>
3
+ *
4
+ * This file is part of FFmpeg.
5
+ *
6
+ * FFmpeg is free software; you can redistribute it and/or modify
7
+ * it under the terms of the GNU General Public License as published by
8
+ * the Free Software Foundation; either version 2 of the License, or
9
+ * (at your option) any later version.
10
+ *
11
+ * FFmpeg is distributed in the hope that it will be useful,
12
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
13
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14
+ * GNU General Public License for more details.
15
+ *
16
+ * You should have received a copy of the GNU General Public License along
17
+ * with FFmpeg; if not, write to the Free Software Foundation, Inc.,
18
+ * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
19
+ */
20
+
21
+/**
22
+ * @file
23
+ * Ultra Slow/Simple Post-processing filter.
24
+ *
25
+ * Originally written by Michael Niedermayer for the MPlayer project, and
26
+ * ported by Arwa Arif for FFmpeg.
27
+ */
28
+
29
+#include "libavutil/avassert.h"
30
+#include "libavutil/imgutils.h"
31
+#include "libavutil/opt.h"
32
+#include "libavutil/pixdesc.h"
33
+#include "internal.h"
34
+#include "libavcodec/avcodec.h"
35
+#include "avfilter.h"
36
+
37
+#define MAX_LEVEL 8 /* quality levels */
38
+#define BLOCK 16
39
+
40
+typedef struct {
41
+    const AVClass *av_class;
42
+    int log2_count;                         ///< "quality" option; 1 << log2_count shifts are encoded and averaged
43
+    int qp;                                 ///< "qp" option; a non-zero value forces a constant quantizer
44
+    int qscale_type;                        ///< QP scale type filled in by av_frame_get_qp_table()
45
+    int temp_stride[3];                     ///< per-plane stride used for both src[] and temp[]
46
+    uint8_t *src[3];                        ///< per-plane copy of the input surrounded by a mirrored border
47
+    int16_t *temp[3];                       ///< per-plane accumulators summing the coded frames of all shifts
48
+    int outbuf_size;                        ///< size of outbuf in bytes
49
+    uint8_t *outbuf;                        ///< buffer given to the encoder as packet data
50
+    AVCodecContext *avctx_enc[BLOCK*BLOCK]; ///< one encoder context per shift; 1 << log2_count are opened
51
+    AVFrame *frame;                         ///< frame passed to the encoder; its data pointers aim into src[]
52
+    AVFrame *frame_dec;                     ///< set to the encoder's coded_frame after each encode
53
+    uint8_t *non_b_qp_table;                ///< copy of the QP table of the last non-B frame
54
+    int non_b_qp_alloc_size;                ///< number of entries allocated for non_b_qp_table
55
+    int use_bframe_qp;                      ///< "use_bframe_qp" option; when 0 the saved non-B QP table is used
56
+
57
+} USPPContext;
58
+
59
+#define OFFSET(x) offsetof(USPPContext, x)
60
+#define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM
61
+static const AVOption uspp_options[] = {
62
+    { "quality" , "set quality" , OFFSET(log2_count) , AV_OPT_TYPE_INT , {.i64 = 3} , 0 , MAX_LEVEL , FLAGS },
63
+    { "qp" , "force a constant quantizer parameter" , OFFSET(qp) , AV_OPT_TYPE_INT , {.i64 = 0} , 0 , 63 , FLAGS },
64
+    { "use_bframe_qp" , "use B-frames' QP" , OFFSET(use_bframe_qp) , AV_OPT_TYPE_INT , {.i64 = 0} , 0 , 1 , FLAGS },
65
+    { NULL }
66
+};
67
+
68
+static const AVClass uspp_class = {
69
+    .class_name       = "uspp",
70
+    .item_name        = av_default_item_name,
71
+    .option           = uspp_options,
72
+    .version          = LIBAVUTIL_VERSION_INT,
73
+    .category         = AV_CLASS_CATEGORY_FILTER,
74
+};
75
+
76
+//===========================================================================//
77
+DECLARE_ALIGNED(8, static const uint8_t, dither)[8][8] = {
78
+    {  0*4,  48*4,  12*4,  60*4,   3*4,  51*4,  15*4,  63*4, },
79
+    { 32*4,  16*4,  44*4,  28*4,  35*4,  19*4,  47*4,  31*4, },
80
+    {  8*4,  56*4,   4*4,  52*4,  11*4,  59*4,   7*4,  55*4, },
81
+    { 40*4,  24*4,  36*4,  20*4,  43*4,  27*4,  39*4,  23*4, },
82
+    {  2*4,  50*4,  14*4,  62*4,   1*4,  49*4,  13*4,  61*4, },
83
+    { 34*4,  18*4,  46*4,  30*4,  33*4,  17*4,  45*4,  29*4, },
84
+    { 10*4,  58*4,   6*4,  54*4,   9*4,  57*4,   5*4,  53*4, },
85
+    { 42*4,  26*4,  38*4,  22*4,  41*4,  25*4,  37*4,  21*4, },
86
+};
87
+
88
+static const uint8_t offset[511][2]= {
89
+    { 0, 0},
90
+    { 0, 0}, { 8, 8},                                                              // quality 1
91
+    { 0, 0}, { 4, 4}, {12, 8}, { 8,12},                                            // quality 2
92
+    { 0, 0}, {10, 2}, { 4, 4}, {14, 6}, { 8, 8}, { 2,10}, {12,12}, { 6,14},        // quality 3
93
+
94
+    { 0, 0}, {10, 2}, { 4, 4}, {14, 6}, { 8, 8}, { 2,10}, {12,12}, { 6,14},
95
+    { 5, 1}, {15, 3}, { 9, 5}, { 3, 7}, {13, 9}, { 7,11}, { 1,13}, {11,15},        // quality 4
96
+
97
+    { 0, 0}, { 8, 0}, { 0, 8}, { 8, 8}, { 5, 1}, {13, 1}, { 5, 9}, {13, 9},
98
+    { 2, 2}, {10, 2}, { 2,10}, {10,10}, { 7, 3}, {15, 3}, { 7,11}, {15,11},
99
+    { 4, 4}, {12, 4}, { 4,12}, {12,12}, { 1, 5}, { 9, 5}, { 1,13}, { 9,13},
100
+    { 6, 6}, {14, 6}, { 6,14}, {14,14}, { 3, 7}, {11, 7}, { 3,15}, {11,15},        // quality 5
101
+
102
+    { 0, 0}, { 8, 0}, { 0, 8}, { 8, 8}, { 4, 0}, {12, 0}, { 4, 8}, {12, 8},
103
+    { 1, 1}, { 9, 1}, { 1, 9}, { 9, 9}, { 5, 1}, {13, 1}, { 5, 9}, {13, 9},
104
+    { 3, 2}, {11, 2}, { 3,10}, {11,10}, { 7, 2}, {15, 2}, { 7,10}, {15,10},
105
+    { 2, 3}, {10, 3}, { 2,11}, {10,11}, { 6, 3}, {14, 3}, { 6,11}, {14,11},
106
+    { 0, 4}, { 8, 4}, { 0,12}, { 8,12}, { 4, 4}, {12, 4}, { 4,12}, {12,12},
107
+    { 1, 5}, { 9, 5}, { 1,13}, { 9,13}, { 5, 5}, {13, 5}, { 5,13}, {13,13},
108
+    { 3, 6}, {11, 6}, { 3,14}, {11,14}, { 7, 6}, {15, 6}, { 7,14}, {15,14},
109
+    { 2, 7}, {10, 7}, { 2,15}, {10,15}, { 6, 7}, {14, 7}, { 6,15}, {14,15},        // quality 6
110
+
111
+    { 0, 0}, { 8, 0}, { 0, 8}, { 8, 8}, { 0, 2}, { 8, 2}, { 0,10}, { 8,10},
112
+    { 0, 4}, { 8, 4}, { 0,12}, { 8,12}, { 0, 6}, { 8, 6}, { 0,14}, { 8,14},
113
+    { 1, 1}, { 9, 1}, { 1, 9}, { 9, 9}, { 1, 3}, { 9, 3}, { 1,11}, { 9,11},
114
+    { 1, 5}, { 9, 5}, { 1,13}, { 9,13}, { 1, 7}, { 9, 7}, { 1,15}, { 9,15},
115
+    { 2, 0}, {10, 0}, { 2, 8}, {10, 8}, { 2, 2}, {10, 2}, { 2,10}, {10,10},
116
+    { 2, 4}, {10, 4}, { 2,12}, {10,12}, { 2, 6}, {10, 6}, { 2,14}, {10,14},
117
+    { 3, 1}, {11, 1}, { 3, 9}, {11, 9}, { 3, 3}, {11, 3}, { 3,11}, {11,11},
118
+    { 3, 5}, {11, 5}, { 3,13}, {11,13}, { 3, 7}, {11, 7}, { 3,15}, {11,15},
119
+    { 4, 0}, {12, 0}, { 4, 8}, {12, 8}, { 4, 2}, {12, 2}, { 4,10}, {12,10},
120
+    { 4, 4}, {12, 4}, { 4,12}, {12,12}, { 4, 6}, {12, 6}, { 4,14}, {12,14},
121
+    { 5, 1}, {13, 1}, { 5, 9}, {13, 9}, { 5, 3}, {13, 3}, { 5,11}, {13,11},
122
+    { 5, 5}, {13, 5}, { 5,13}, {13,13}, { 5, 7}, {13, 7}, { 5,15}, {13,15},
123
+    { 6, 0}, {14, 0}, { 6, 8}, {14, 8}, { 6, 2}, {14, 2}, { 6,10}, {14,10},
124
+    { 6, 4}, {14, 4}, { 6,12}, {14,12}, { 6, 6}, {14, 6}, { 6,14}, {14,14},
125
+    { 7, 1}, {15, 1}, { 7, 9}, {15, 9}, { 7, 3}, {15, 3}, { 7,11}, {15,11},
126
+    { 7, 5}, {15, 5}, { 7,13}, {15,13}, { 7, 7}, {15, 7}, { 7,15}, {15,15},        // quality 7
127
+
128
+    { 0, 0}, { 8, 0}, { 0, 8}, { 8, 8}, { 4, 4}, {12, 4}, { 4,12}, {12,12},
129
+    { 0, 4}, { 8, 4}, { 0,12}, { 8,12}, { 4, 0}, {12, 0}, { 4, 8}, {12, 8},
130
+    { 2, 2}, {10, 2}, { 2,10}, {10,10}, { 6, 6}, {14, 6}, { 6,14}, {14,14},
131
+    { 2, 6}, {10, 6}, { 2,14}, {10,14}, { 6, 2}, {14, 2}, { 6,10}, {14,10},
132
+    { 0, 2}, { 8, 2}, { 0,10}, { 8,10}, { 4, 6}, {12, 6}, { 4,14}, {12,14},
133
+    { 0, 6}, { 8, 6}, { 0,14}, { 8,14}, { 4, 2}, {12, 2}, { 4,10}, {12,10},
134
+    { 2, 0}, {10, 0}, { 2, 8}, {10, 8}, { 6, 4}, {14, 4}, { 6,12}, {14,12},
135
+    { 2, 4}, {10, 4}, { 2,12}, {10,12}, { 6, 0}, {14, 0}, { 6, 8}, {14, 8},
136
+    { 1, 1}, { 9, 1}, { 1, 9}, { 9, 9}, { 5, 5}, {13, 5}, { 5,13}, {13,13},
137
+    { 1, 5}, { 9, 5}, { 1,13}, { 9,13}, { 5, 1}, {13, 1}, { 5, 9}, {13, 9},
138
+    { 3, 3}, {11, 3}, { 3,11}, {11,11}, { 7, 7}, {15, 7}, { 7,15}, {15,15},
139
+    { 3, 7}, {11, 7}, { 3,15}, {11,15}, { 7, 3}, {15, 3}, { 7,11}, {15,11},
140
+    { 1, 3}, { 9, 3}, { 1,11}, { 9,11}, { 5, 7}, {13, 7}, { 5,15}, {13,15},
141
+    { 1, 7}, { 9, 7}, { 1,15}, { 9,15}, { 5, 3}, {13, 3}, { 5,11}, {13,11},        // quality 8 (label covers all 256 entries from the blank line above to the end of the table)
142
+    { 3, 1}, {11, 1}, { 3, 9}, {11, 9}, { 7, 5}, {15, 5}, { 7,13}, {15,13},
143
+    { 3, 5}, {11, 5}, { 3,13}, {11,13}, { 7, 1}, {15, 1}, { 7, 9}, {15, 9},
144
+    { 0, 1}, { 8, 1}, { 0, 9}, { 8, 9}, { 4, 5}, {12, 5}, { 4,13}, {12,13},
145
+    { 0, 5}, { 8, 5}, { 0,13}, { 8,13}, { 4, 1}, {12, 1}, { 4, 9}, {12, 9},
146
+    { 2, 3}, {10, 3}, { 2,11}, {10,11}, { 6, 7}, {14, 7}, { 6,15}, {14,15},
147
+    { 2, 7}, {10, 7}, { 2,15}, {10,15}, { 6, 3}, {14, 3}, { 6,11}, {14,11},
148
+    { 0, 3}, { 8, 3}, { 0,11}, { 8,11}, { 4, 7}, {12, 7}, { 4,15}, {12,15},
149
+    { 0, 7}, { 8, 7}, { 0,15}, { 8,15}, { 4, 3}, {12, 3}, { 4,11}, {12,11},
150
+    { 2, 1}, {10, 1}, { 2, 9}, {10, 9}, { 6, 5}, {14, 5}, { 6,13}, {14,13},
151
+    { 2, 5}, {10, 5}, { 2,13}, {10,13}, { 6, 1}, {14, 1}, { 6, 9}, {14, 9},
152
+    { 1, 0}, { 9, 0}, { 1, 8}, { 9, 8}, { 5, 4}, {13, 4}, { 5,12}, {13,12},
153
+    { 1, 4}, { 9, 4}, { 1,12}, { 9,12}, { 5, 0}, {13, 0}, { 5, 8}, {13, 8},
154
+    { 3, 2}, {11, 2}, { 3,10}, {11,10}, { 7, 6}, {15, 6}, { 7,14}, {15,14},
155
+    { 3, 6}, {11, 6}, { 3,14}, {11,14}, { 7, 2}, {15, 2}, { 7,10}, {15,10},
156
+    { 1, 2}, { 9, 2}, { 1,10}, { 9,10}, { 5, 6}, {13, 6}, { 5,14}, {13,14},
157
+    { 1, 6}, { 9, 6}, { 1,14}, { 9,14}, { 5, 2}, {13, 2}, { 5,10}, {13,10},
158
+    { 3, 0}, {11, 0}, { 3, 8}, {11, 8}, { 7, 4}, {15, 4}, { 7,12}, {15,12},
159
+    { 3, 4}, {11, 4}, { 3,12}, {11,12}, { 7, 0}, {15, 0}, { 7, 8}, {15, 8},
160
+};
161
+
162
+static void store_slice_c(uint8_t *dst, int16_t *src,
163
+                         int dst_stride, int src_stride,
164
+                         int width, int height, int log2_scale )
165
+{
166
+    int y, x;
167
+    /* dst = ((src << log2_scale) + dither) >> 8 for every sample; both strides are counted in elements. */
168
+#define STORE(pos) do {                                                                   \
169
+    temp = ((src[x + y * src_stride + (pos)] << log2_scale) + d[(pos)]) >> 8;             \
170
+    if (temp & 0x100) temp = ~(temp >> 31); /* bit 8 set: store 255, or 0 if negative */  \
171
+    dst[x + y * dst_stride + (pos)] = temp;                                               \
172
+} while (0)
173
+
174
+    for (y = 0 ; y < height ; y++) {
175
+        const uint8_t *d = dither[y&7]; /* one row of the 8x8 dither matrix per output line */
176
+        for (x = 0 ; x < width ; x += 8) { /* always stores a full group of 8 columns, even past width */
177
+            int temp;
178
+            STORE(0);
179
+            STORE(1);
180
+            STORE(2);
181
+            STORE(3);
182
+            STORE(4);
183
+            STORE(5);
184
+            STORE(6);
185
+            STORE(7);
186
+        }
187
+    }
188
+}
189
+
190
+static inline int norm_qscale(int qscale, int type) /* rescale qscale according to its QP type; unlisted types pass through */
191
+{
192
+    if (type == FF_QSCALE_TYPE_MPEG2)
193
+        return qscale >> 1;
194
+    if (type == FF_QSCALE_TYPE_H264)
195
+        return qscale >> 2;
196
+    if (type == FF_QSCALE_TYPE_VP56)
197
+        return (63 - qscale + 2) >> 2;
198
+    return qscale; /* FF_QSCALE_TYPE_MPEG1 and anything else: unchanged */
199
+}
200
+
201
+static void filter(USPPContext *p, uint8_t *dst[3], uint8_t *src[3],
202
+                 int dst_stride[3], int src_stride[3], int width,
203
+                 int height, uint8_t *qp_store, int qp_stride)
204
+{ /* Pad each plane into p->src, encode it at every shift, sum the coded frames in p->temp, store to dst. qp_stride is not used. */
205
+    int x, y, i, j;
206
+    const int count = 1<<p->log2_count; // number of shifts to encode and average
207
+    for (i = 0 ; i < 3 ; i++) {
208
+        int is_chroma = !!i;
209
+        int w = width  >> is_chroma; // chroma planes are treated as half width and half height
210
+        int h = height >> is_chroma;
211
+        int stride = p->temp_stride[i];
212
+        int block = BLOCK >> is_chroma; // border size for this plane
213
+
214
+        if (!src[i] || !dst[i])
215
+            continue;
216
+        for (y = 0 ; y < h ; y++) {
217
+            int index = block + block * stride + y * stride; // start of row y, inside the border
218
+            memcpy( p->src[i] + index , src[i] + y * src_stride[i] , w );
219
+            for (x = 0 ; x < block ; x++) { // mirror the row into the left and right borders
220
+                p->src[i][index     - x - 1]= p->src[i][index +     x    ];
221
+                p->src[i][index + w + x    ]= p->src[i][index + w - x - 1];
222
+            }
223
+        }
224
+        for (y = 0 ; y < block ; y++){ // mirror whole rows into the top and bottom borders
225
+            memcpy(p->src[i] + (  block-1-y) * stride , p->src[i] + (  y+block  ) * stride , stride);
226
+            memcpy(p->src[i] + (h+block  +y) * stride , p->src[i] + (h-y+block-1) * stride , stride);
227
+        }
228
+
229
+        p->frame->linesize[i] = stride;
230
+        memset(p->temp[i] , 0 , (h + 2 * block) * stride * sizeof(int16_t)); // reset the accumulators
231
+    }
232
+
233
+    if (p->qp)
234
+        p->frame->quality = p->qp * FF_QP2LAMBDA;
235
+    else
236
+        p->frame->quality = norm_qscale(qp_store[0] , p->qscale_type) * FF_QP2LAMBDA; // only the first QP entry is used
237
+//    init per MB qscale stuff FIXME
238
+    p->frame->height = height;
239
+    p->frame->width  = width;
240
+
241
+    for (i = 0 ; i < count ; i++) {
242
+        const int x1 = offset[i+count-1][0]; // the shifts for this quality start at table index count-1
243
+        const int y1 = offset[i+count-1][1];
244
+        int offset; // NOTE: shadows the file-scope offset[] table from here to the end of the loop body
245
+        AVPacket pkt;
246
+        int got_pkt_ptr;
247
+
248
+        av_init_packet(&pkt);
249
+        pkt.data = p->outbuf;
250
+        pkt.size = p->outbuf_size;
251
+
252
+        p->frame->data[0] = p->src[0] + x1   + y1   * p->frame->linesize[0];
253
+        p->frame->data[1] = p->src[1] + x1/2 + y1/2 * p->frame->linesize[1];
254
+        p->frame->data[2] = p->src[2] + x1/2 + y1/2 * p->frame->linesize[2];
255
+        p->frame->format  = p->avctx_enc[i]->pix_fmt;
256
+
257
+        avcodec_encode_video2(p->avctx_enc[i] , &pkt , p->frame , &got_pkt_ptr); // NOTE(review): return value is not checked
258
+        p->frame_dec = p->avctx_enc[i]->coded_frame;
259
+
260
+        offset = (BLOCK-x1) + (BLOCK-y1) * p->frame_dec->linesize[0]; // undo the shift and skip the border
261
+
262
+        for (y = 0 ; y < height ; y++)
263
+            for (x = 0 ; x < width ; x++)
264
+                p->temp[0][ x + y * p->temp_stride[0] ] += p->frame_dec->data[0][ x + y * p->frame_dec->linesize[0] + offset ];
265
+
266
+        offset = (BLOCK/2-x1/2) + (BLOCK/2-y1/2) * p->frame_dec->linesize[1]; // reused for plane 2: assumes linesize[2] == linesize[1]
267
+
268
+        for (y = 0 ; y < height/2 ; y++) {
269
+            for (x = 0; x < width/2 ; x++) {
270
+                p->temp[1][ x + y * p->temp_stride[1] ] += p->frame_dec->data[1][ x + y * p->frame_dec->linesize[1] + offset ];
271
+                p->temp[2][ x + y * p->temp_stride[2] ] += p->frame_dec->data[2][ x + y * p->frame_dec->linesize[2] + offset ];
272
+            }
273
+        }
274
+    }
275
+
276
+    for (j = 0 ; j < 3 ; j++) {
277
+        int is_chroma = !!j;
278
+        if (!dst[j])
279
+            continue;
280
+        store_slice_c(dst[j] , p->temp[j] , dst_stride[j] , p->temp_stride[j] ,
281
+             width >> is_chroma , height >> is_chroma , 8-p->log2_count); // shift of 8-log2_count turns the sum of count samples into average << 8
282
+    }
283
+}
284
+
285
+static int query_formats(AVFilterContext *ctx)
286
+{
287
+    /* Offer 4:2:0 only: filter() halves both chroma dimensions and config_input()
288
+     * opens every encoder as AV_PIX_FMT_YUV420P, so other layouts are mishandled. */
289
+    static const enum AVPixelFormat pix_fmts[] = {
290
+        AV_PIX_FMT_YUV420P, AV_PIX_FMT_YUVJ420P, AV_PIX_FMT_NONE
291
+    };
292
+    AVFilterFormats *fmts_list = ff_make_format_list(pix_fmts);
293
+    if (!fmts_list) /* list allocation failed */
294
+        return AVERROR(ENOMEM);
295
+    ff_set_common_formats(ctx, fmts_list);
296
+    return 0;
297
+}
298
+
299
+static int config_input(AVFilterLink *inlink)
300
+{
301
+    /* Allocate the QP table, the per-plane work buffers and one Snow encoder per shift. */
302
+    AVFilterContext *ctx = inlink->dst;
303
+    USPPContext *uspp = ctx->priv;
304
+    const int height = inlink->h;
305
+    const int width  = inlink->w;
306
+    int i;
307
+
308
+    AVCodec *enc = avcodec_find_encoder(AV_CODEC_ID_SNOW);
309
+
310
+    if (!enc) {
311
+        av_log(ctx, AV_LOG_ERROR, "SNOW encoder not found.\n");
312
+        return AVERROR(EINVAL);
313
+    }
314
+
315
+    if (!uspp->use_bframe_qp) {
316
+        /* we are assuming here the qp blocks will not be smaller than 16x16 */
317
+        uspp->non_b_qp_alloc_size = FF_CEIL_RSHIFT(width, 4) * FF_CEIL_RSHIFT(height, 4);
318
+        uspp->non_b_qp_table = av_calloc(uspp->non_b_qp_alloc_size, sizeof(*uspp->non_b_qp_table));
319
+
320
+        if (!uspp->non_b_qp_table)
321
+            return AVERROR(ENOMEM);
322
+    }
323
+
324
+    for (i = 0 ; i < 3; i++) {
325
+        int is_chroma = !!i;
326
+        int w = ((width  + 4 * BLOCK-1) & (~(2 * BLOCK-1))) >> is_chroma;
327
+        int h = ((height + 4 * BLOCK-1) & (~(2 * BLOCK-1))) >> is_chroma;
328
+        /* padded size: leaves room for the mirrored border filter() writes around the plane */
329
+        uspp->temp_stride[i] = w;
330
+        if (!(uspp->temp[i] = av_malloc(uspp->temp_stride[i] * h * sizeof(int16_t))))
331
+            return AVERROR(ENOMEM);
332
+        if (!(uspp->src [i] = av_malloc(uspp->temp_stride[i] * h * sizeof(uint8_t))))
333
+            return AVERROR(ENOMEM);
334
+    }
335
+
336
+    for (i = 0 ; i < (1<<uspp->log2_count) ; i++) {
337
+        AVCodecContext *avctx_enc;
338
+        AVDictionary *opts = NULL;
339
+        int ret;
340
+
341
+        if (!(uspp->avctx_enc[i] = avcodec_alloc_context3(NULL)))
342
+            return AVERROR(ENOMEM);
343
+
344
+        avctx_enc = uspp->avctx_enc[i];
345
+        avctx_enc->width = width + BLOCK;   /* the encoded picture includes BLOCK extra columns and rows */
346
+        avctx_enc->height = height + BLOCK;
347
+        avctx_enc->time_base = (AVRational){1,25};  // meaningless
348
+        avctx_enc->gop_size = 300;
349
+        avctx_enc->max_b_frames = 0;
350
+        avctx_enc->pix_fmt = AV_PIX_FMT_YUV420P;
351
+        avctx_enc->flags = CODEC_FLAG_QSCALE | CODEC_FLAG_LOW_DELAY;
352
+        avctx_enc->strict_std_compliance = FF_COMPLIANCE_EXPERIMENTAL;
353
+        avctx_enc->global_quality = 123;
354
+        av_dict_set(&opts, "no_bitstream", "1", 0);
355
+        ret = avcodec_open2(avctx_enc, enc, &opts);
356
+        av_dict_free(&opts); /* freed before the error check so a failed open does not leak the dictionary */
357
+        if (ret < 0)
358
+            return ret;
359
+        av_assert0(avctx_enc->codec);
360
+    }
361
+
362
+    uspp->outbuf_size = (width + BLOCK) * (height + BLOCK) * 10;
363
+    if (!(uspp->frame = av_frame_alloc()))
364
+        return AVERROR(ENOMEM);
365
+    if (!(uspp->outbuf = av_malloc(uspp->outbuf_size)))
366
+        return AVERROR(ENOMEM);
367
+
368
+    return 0;
369
+}
370
+
371
+static int filter_frame(AVFilterLink *inlink, AVFrame *in)
372
+{ /* Pick the QP source for this frame, run filter() on it when possible, and pass the result downstream. */
373
+    AVFilterContext *ctx = inlink->dst;
374
+    USPPContext *uspp = ctx->priv;
375
+    AVFilterLink *outlink = ctx->outputs[0];
376
+    AVFrame *out = in; // filter in place unless a separate output buffer is needed below
377
+
378
+    int qp_stride = 0;
379
+    uint8_t *qp_table = NULL;
380
+
381
+    /* if we are not in a constant user quantizer mode and we don't want to use
382
+     * the quantizers from the B-frames (B-frames often have a higher QP), we
383
+     * need to save the qp table from the last non B-frame; this is what the
384
+     * following code block does */
385
+    if (!uspp->qp) {
386
+        qp_table = av_frame_get_qp_table(in, &qp_stride, &uspp->qscale_type);
387
+
388
+        if (qp_table && !uspp->use_bframe_qp && in->pict_type != AV_PICTURE_TYPE_B) {
389
+            int w, h;
390
+
391
+            /* if the qp stride is not set, it means the QP are only defined on
392
+             * a line basis */
393
+            if (!qp_stride) {
394
+                w = FF_CEIL_RSHIFT(inlink->w, 4);
395
+                h = 1;
396
+            } else {
397
+                w = FF_CEIL_RSHIFT(qp_stride, 4);
398
+                h = FF_CEIL_RSHIFT(inlink->h, 4);
399
+            }
400
+            av_assert0(w * h <= uspp->non_b_qp_alloc_size); // the table was sized in config_input()
401
+            memcpy(uspp->non_b_qp_table , qp_table , w * h);
402
+        }
403
+    }
404
+
405
+    if (uspp->log2_count && !ctx->is_disabled) { // quality 0 or timeline-disabled: frame passes through unchanged
406
+        if (!uspp->use_bframe_qp && uspp->non_b_qp_table)
407
+            qp_table = uspp->non_b_qp_table; // use the saved non-B table instead of this frame's own
408
+
409
+        if (qp_table || uspp->qp) { // with neither a QP table nor a forced qp the frame is not filtered
410
+
411
+            /* get a new frame if in-place is not possible or if the dimensions
412
+             * are not multiple of 8 */
413
+            if (!av_frame_is_writable(in) || (inlink->w & 7) || (inlink->h & 7)) {
414
+                const int aligned_w = FFALIGN(inlink->w, 8);
415
+                const int aligned_h = FFALIGN(inlink->h, 8);
416
+
417
+                out = ff_get_video_buffer(outlink, aligned_w, aligned_h);
418
+                if (!out) {
419
+                    av_frame_free(&in);
420
+                    return AVERROR(ENOMEM);
421
+                }
422
+                av_frame_copy_props(out, in);
423
+                out->width  = in->width; // the buffer was allocated with aligned size; report the real size
424
+                out->height = in->height;
425
+            }
426
+
427
+            filter(uspp , out->data , in->data , out->linesize , in->linesize , inlink->w , inlink->h , qp_table , qp_stride);
428
+        }
429
+    }
430
+
431
+    if (in != out) { // a separate output frame was allocated: copy plane 3 if present and drop the input
432
+        if (in->data[3])
433
+            av_image_copy_plane(out->data[3], out->linesize[3],
434
+                                in ->data[3], in ->linesize[3],
435
+                                inlink->w, inlink->h);
436
+        av_frame_free(&in);
437
+    }
438
+    return ff_filter_frame(outlink, out);
439
+}
440
+
441
+static av_cold void uninit(AVFilterContext *ctx)
442
+{ /* Free the buffers, encoder contexts and frame allocated by config_input(). */
443
+    USPPContext *uspp = ctx->priv;
444
+    int i;
445
+
446
+    for (i = 0 ; i < 3 ; i++) {
447
+        av_freep(&uspp->temp[i]);
448
+        av_freep(&uspp->src[i]);
449
+    }
450
+
451
+    for (i = 0 ; i < (1 << uspp->log2_count) ; i++) { // same count of contexts as config_input() opens
452
+        avcodec_close(uspp->avctx_enc[i]);
453
+        av_freep(&uspp->avctx_enc[i]);
454
+    }
455
+
456
+    av_freep(&uspp->non_b_qp_table);
457
+    av_freep(&uspp->outbuf);
458
+    av_frame_free(&uspp->frame); // frame_dec is not freed here; it only aliases an encoder's coded_frame
459
+}
460
+
461
+static const AVFilterPad uspp_inputs[] = {
462
+    {
463
+        .name         = "default",
464
+        .type         = AVMEDIA_TYPE_VIDEO,
465
+        .config_props = config_input,
466
+        .filter_frame = filter_frame,
467
+    },
468
+    { NULL }
469
+};
470
+
471
+static const AVFilterPad uspp_outputs[] = {
472
+    {
473
+        .name = "default",
474
+        .type = AVMEDIA_TYPE_VIDEO,
475
+    },
476
+    { NULL }
477
+};
478
+
479
+AVFilter ff_vf_uspp = {
480
+    .name            = "uspp",
481
+    .description     = NULL_IF_CONFIG_SMALL("Apply Ultra Simple / Slow Post-processing filter."),
482
+    .priv_size       = sizeof(USPPContext),
483
+    .uninit          = uninit,
484
+    .query_formats   = query_formats,
485
+    .inputs          = uspp_inputs,
486
+    .outputs         = uspp_outputs,
487
+    .priv_class      = &uspp_class,
488
+    .flags           = AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL,
489
+};