GitList

libavfilter/vf_thumbnail.c

/*
 * Copyright (c) 2011 Smartjog S.A.S, Clément Bœsch <clement.boesch@smartjog.com>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * Potential thumbnail lookup filter to reduce the risk of an inappropriate
 * selection (such as a black frame) we could get with an absolute seek.
 *
 * Simplified version of algorithm by Vadim Zaliva <lord@crocodile.org>.
 * @see http://notbrainsurgery.livejournal.com/29773.html
 */
386dc9a3	#include "libavutil/opt.h"
15a2a29b	#include "avfilter.h"
c9e183b4	#include "internal.h"
15a2a29b	#define HIST_SIZE (3*256) struct thumb_frame {
a05a44e2	AVFrame *buf; ///< cached frame
15a2a29b	int histogram[HIST_SIZE]; ///< RGB color distribution histogram of the frame };
ed93ed5e	typedef struct ThumbContext {
386dc9a3	const AVClass *class;
15a2a29b	int n; ///< current frame int n_frames; ///< number of frames for analysis struct thumb_frame *frames; ///< the n_frames frames
a95a3879	AVRational tb; ///< copy of the input timebase to ease access
15a2a29b	} ThumbContext;
386dc9a3	#define OFFSET(x) offsetof(ThumbContext, x) #define FLAGS AV_OPT_FLAG_VIDEO_PARAM\|AV_OPT_FLAG_FILTERING_PARAM static const AVOption thumbnail_options[] = { { "n", "set the frames batch size", OFFSET(n_frames), AV_OPT_TYPE_INT, {.i64=100}, 2, INT_MAX, FLAGS }, { NULL } }; AVFILTER_DEFINE_CLASS(thumbnail);
fd6228e6	static av_cold int init(AVFilterContext *ctx)
15a2a29b	{
b45ff138	ThumbContext *s = ctx->priv;
15a2a29b
b45ff138	s->frames = av_calloc(s->n_frames, sizeof(*s->frames)); if (!s->frames) {
15a2a29b	av_log(ctx, AV_LOG_ERROR, "Allocation failure, try to lower the number of frames\n"); return AVERROR(ENOMEM); }
b45ff138	av_log(ctx, AV_LOG_VERBOSE, "batch size: %d frames\n", s->n_frames);
15a2a29b	return 0; } /** * @brief Compute Sum-square deviation to estimate "closeness". * @param hist color distribution histogram * @param median average color distribution histogram * @return sum of squared errors / static double frame_sum_square_err(const int hist, const double median) { int i; double err, sum_sq_err = 0; for (i = 0; i < HIST_SIZE; i++) { err = median[i] - (double)hist[i]; sum_sq_err += errerr; } return sum_sq_err; }
/**
 * Pick the cached frame whose histogram is closest to the batch average.
 *
 * Every histogram of the batch is zeroed, every cached frame except the
 * selected one is freed, and the frame counter is reset to 0. The selected
 * frame is detached from the cache (its slot is set to NULL) and returned.
 *
 * Must only be called with s->n > 0, since the average divides by s->n.
 *
 * @param ctx filter context whose private data is a ThumbContext
 * @return the selected frame
 */
static AVFrame *get_best_frame(AVFilterContext *ctx)
{
    AVFrame *picref;
    ThumbContext *s = ctx->priv;
    int i, j, best_frame_idx = 0;
    int nb_frames = s->n;
    double avg_hist[HIST_SIZE] = {0}, sq_err, min_sq_err = -1;

    // average histogram of the N frames
    for (j = 0; j < FF_ARRAY_ELEMS(avg_hist); j++) {
        for (i = 0; i < nb_frames; i++)
            avg_hist[j] += (double)s->frames[i].histogram[j];
        avg_hist[j] /= nb_frames;
    }

    // find the frame closer to the average using the sum of squared errors
    for (i = 0; i < nb_frames; i++) {
        sq_err = frame_sum_square_err(s->frames[i].histogram, avg_hist);
        if (i == 0 || sq_err < min_sq_err)
            best_frame_idx = i, min_sq_err = sq_err;
    }

    // free and reset everything (except the best frame buffer)
    for (i = 0; i < nb_frames; i++) {
        memset(s->frames[i].histogram, 0, sizeof(s->frames[i].histogram));
        if (i != best_frame_idx)
            av_frame_free(&s->frames[i].buf);
    }
    s->n = 0;

    // raise the chosen one
    picref = s->frames[best_frame_idx].buf;
    av_log(ctx, AV_LOG_INFO, "frame id #%d (pts_time=%f) selected "
           "from a set of %d images\n", best_frame_idx,
           picref->pts * av_q2d(s->tb), nb_frames);
    s->frames[best_frame_idx].buf = NULL;

    return picref;
}

/**
 * Cache an incoming frame and accumulate its histogram; once n_frames frames
 * have been cached, send the best one of the batch to the output.
 *
 * @param inlink input link the frame arrived on
 * @param frame  incoming frame, stored in the cache
 * @return 0 while the batch is still filling, otherwise the result of
 *         ff_filter_frame()
 */
static int filter_frame(AVFilterLink *inlink, AVFrame *frame)
{
    int i, j;
    AVFilterContext *ctx  = inlink->dst;
    ThumbContext *s       = ctx->priv;
    AVFilterLink *outlink = ctx->outputs[0];
    int *hist = s->frames[s->n].histogram;
    const uint8_t *p = frame->data[0];

    // keep a reference of each frame
    s->frames[s->n].buf = frame;

    // update current frame RGB histogram
    // (3 bytes per pixel; each byte position has its own bank of 256 bins)
    for (j = 0; j < inlink->h; j++) {
        for (i = 0; i < inlink->w; i++) {
            hist[0*256 + p[i*3    ]]++;
            hist[1*256 + p[i*3 + 1]]++;
            hist[2*256 + p[i*3 + 2]]++;
        }
        p += frame->linesize[0];
    }

    // no selection until the buffer of N frames is filled up
    s->n++;
    if (s->n < s->n_frames)
        return 0;

    return ff_filter_frame(outlink, get_best_frame(ctx));
}

/**
 * Free the frames still held in the cache, then the cache itself.
 */
static av_cold void uninit(AVFilterContext *ctx)
{
    int i;
    ThumbContext *s = ctx->priv;

    // s->frames stays NULL if the allocation in init() failed; check it
    // before indexing so that uninit is safe in that state as well.
    for (i = 0; i < s->n_frames && s->frames && s->frames[i].buf; i++)
        av_frame_free(&s->frames[i].buf);
    av_freep(&s->frames);
}

/**
 * Request a frame from the input; when the input reports EOF while frames
 * are still cached, output the best frame of the partial batch first.
 *
 * @return 0 on success, a negative error code (including AVERROR_EOF)
 *         otherwise
 */
static int request_frame(AVFilterLink *link)
{
    AVFilterContext *ctx = link->src;
    ThumbContext *s = ctx->priv;
    int ret = ff_request_frame(ctx->inputs[0]);

    if (ret == AVERROR_EOF && s->n) {
        ret = ff_filter_frame(link, get_best_frame(ctx));
        if (ret < 0)
            return ret;
        // the pending batch was flushed; still report end of stream
        ret = AVERROR_EOF;
    }
    if (ret < 0)
        return ret;
    return 0;
}
/**
 * Store a copy of the input link time base in the filter context.
 *
 * @param inlink input link being configured
 * @return always 0
 */
static int config_props(AVFilterLink *inlink)
{
    AVFilterContext *ctx = inlink->dst;
    ThumbContext *s = ctx->priv;

    s->tb = inlink->time_base;
    return 0;
}
15a2a29b	static int query_formats(AVFilterContext *ctx) {
ac627b3d	static const enum AVPixelFormat pix_fmts[] = { AV_PIX_FMT_RGB24, AV_PIX_FMT_BGR24, AV_PIX_FMT_NONE
15a2a29b	};
a0854c08	AVFilterFormats *fmts_list = ff_make_format_list(pix_fmts); if (!fmts_list) return AVERROR(ENOMEM); return ff_set_common_formats(ctx, fmts_list);
15a2a29b	}
2d9d4440	static const AVFilterPad thumbnail_inputs[] = { {
b211607b	.name = "default", .type = AVMEDIA_TYPE_VIDEO, .config_props = config_props, .filter_frame = filter_frame,
2d9d4440	}, { NULL } }; static const AVFilterPad thumbnail_outputs[] = { { .name = "default", .type = AVMEDIA_TYPE_VIDEO, .request_frame = request_frame, }, { NULL } };
325f6e0a	AVFilter ff_vf_thumbnail = {
15a2a29b	.name = "thumbnail", .description = NULL_IF_CONFIG_SMALL("Select the most representative frame in a given sequence of consecutive frames."), .priv_size = sizeof(ThumbContext), .init = init, .uninit = uninit, .query_formats = query_formats,
2d9d4440	.inputs = thumbnail_inputs, .outputs = thumbnail_outputs,
386dc9a3	.priv_class = &thumbnail_class,
15a2a29b	};