pmhd: ffmpeg/libavfilter/vf_thumbnail.c annotate

annotate ffmpeg/libavfilter/vf_thumbnail.c @ 13:844d341cf643 tip

Back up before ISMIR

author	Yading Song <yading.song@eecs.qmul.ac.uk>
date	Thu, 31 Oct 2013 13:17:06 +0000
parents	f445c3017523
children

rev	line source
yading@11	1 /*
yading@11	2 * Copyright (c) 2011 Smartjog S.A.S, Clément Bœsch <clement.boesch@smartjog.com>
yading@11	3 *
yading@11	4 * This file is part of FFmpeg.
yading@11	5 *
yading@11	6 * FFmpeg is free software; you can redistribute it and/or
yading@11	7 * modify it under the terms of the GNU Lesser General Public
yading@11	8 * License as published by the Free Software Foundation; either
yading@11	9 * version 2.1 of the License, or (at your option) any later version.
yading@11	10 *
yading@11	11 * FFmpeg is distributed in the hope that it will be useful,
yading@11	12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
yading@11	13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
yading@11	14 * Lesser General Public License for more details.
yading@11	15 *
yading@11	16 * You should have received a copy of the GNU Lesser General Public
yading@11	17 * License along with FFmpeg; if not, write to the Free Software
yading@11	18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
yading@11	19 */
yading@11	20
yading@11	21 /**
yading@11	22 * @file
yading@11	23 * Potential thumbnail lookup filter to reduce the risk of an inappropriate
yading@11	24 * selection (such as a black frame) we could get with an absolute seek.
yading@11	25 *
yading@11	26 * Simplified version of algorithm by Vadim Zaliva <lord@crocodile.org>.
yading@11	27 * @see http://notbrainsurgery.livejournal.com/29773.html
yading@11	28 */
yading@11	29
yading@11	30 #include "libavutil/opt.h"
yading@11	31 #include "avfilter.h"
yading@11	32 #include "internal.h"
yading@11	33
yading@11	34 #define HIST_SIZE (3*256)
yading@11	35
yading@11	36 struct thumb_frame {
yading@11	37 AVFrame *buf; ///< cached frame
yading@11	38 int histogram[HIST_SIZE]; ///< RGB color distribution histogram of the frame
yading@11	39 };
yading@11	40
yading@11	41 typedef struct {
yading@11	42 const AVClass *class;
yading@11	43 int n; ///< current frame
yading@11	44 int n_frames; ///< number of frames for analysis
yading@11	45 struct thumb_frame *frames; ///< the n_frames frames
yading@11	46 AVRational tb; ///< copy of the input timebase to ease access
yading@11	47 } ThumbContext;
yading@11	48
/* Byte offset of a ThumbContext member, as needed by the AVOption table. */
#define OFFSET(x) offsetof(ThumbContext, x)
/*
 * Flags applied to the filter's options. The expansion is parenthesised so
 * the macro stays a single operand when combined with operators that bind
 * tighter than '|'.
 */
#define FLAGS (AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_FILTERING_PARAM)
yading@11	51
yading@11	52 static const AVOption thumbnail_options[] = {
yading@11	53 { "n", "set the frames batch size", OFFSET(n_frames), AV_OPT_TYPE_INT, {.i64=100}, 2, INT_MAX, FLAGS },
yading@11	54 { NULL }
yading@11	55 };
yading@11	56
yading@11	57 AVFILTER_DEFINE_CLASS(thumbnail);
yading@11	58
yading@11	59 static av_cold int init(AVFilterContext *ctx)
yading@11	60 {
yading@11	61 ThumbContext *thumb = ctx->priv;
yading@11	62
yading@11	63 thumb->frames = av_calloc(thumb->n_frames, sizeof(*thumb->frames));
yading@11	64 if (!thumb->frames) {
yading@11	65 av_log(ctx, AV_LOG_ERROR,
yading@11	66 "Allocation failure, try to lower the number of frames\n");
yading@11	67 return AVERROR(ENOMEM);
yading@11	68 }
yading@11	69 av_log(ctx, AV_LOG_VERBOSE, "batch size: %d frames\n", thumb->n_frames);
yading@11	70 return 0;
yading@11	71 }
yading@11	72
yading@11	73 /**
yading@11	74 * @brief Compute Sum-square deviation to estimate "closeness".
yading@11	75 * @param hist color distribution histogram
yading@11	76 * @param median average color distribution histogram
yading@11	77 * @return sum of squared errors
yading@11	78 */
yading@11	79 static double frame_sum_square_err(const int hist, const double median)
yading@11	80 {
yading@11	81 int i;
yading@11	82 double err, sum_sq_err = 0;
yading@11	83
yading@11	84 for (i = 0; i < HIST_SIZE; i++) {
yading@11	85 err = median[i] - (double)hist[i];
yading@11	86 sum_sq_err += err*err;
yading@11	87 }
yading@11	88 return sum_sq_err;
yading@11	89 }
yading@11	90
yading@11	91 static AVFrame get_best_frame(AVFilterContext ctx)
yading@11	92 {
yading@11	93 AVFrame *picref;
yading@11	94 ThumbContext *thumb = ctx->priv;
yading@11	95 int i, j, best_frame_idx = 0;
yading@11	96 int nb_frames = thumb->n;
yading@11	97 double avg_hist[HIST_SIZE] = {0}, sq_err, min_sq_err = -1;
yading@11	98
yading@11	99 // average histogram of the N frames
yading@11	100 for (j = 0; j < FF_ARRAY_ELEMS(avg_hist); j++) {
yading@11	101 for (i = 0; i < nb_frames; i++)
yading@11	102 avg_hist[j] += (double)thumb->frames[i].histogram[j];
yading@11	103 avg_hist[j] /= nb_frames;
yading@11	104 }
yading@11	105
yading@11	106 // find the frame closer to the average using the sum of squared errors
yading@11	107 for (i = 0; i < nb_frames; i++) {
yading@11	108 sq_err = frame_sum_square_err(thumb->frames[i].histogram, avg_hist);
yading@11	109 if (i == 0 \|\| sq_err < min_sq_err)
yading@11	110 best_frame_idx = i, min_sq_err = sq_err;
yading@11	111 }
yading@11	112
yading@11	113 // free and reset everything (except the best frame buffer)
yading@11	114 for (i = 0; i < nb_frames; i++) {
yading@11	115 memset(thumb->frames[i].histogram, 0, sizeof(thumb->frames[i].histogram));
yading@11	116 if (i != best_frame_idx)
yading@11	117 av_frame_free(&thumb->frames[i].buf);
yading@11	118 }
yading@11	119 thumb->n = 0;
yading@11	120
yading@11	121 // raise the chosen one
yading@11	122 picref = thumb->frames[best_frame_idx].buf;
yading@11	123 av_log(ctx, AV_LOG_INFO, "frame id #%d (pts_time=%f) selected "
yading@11	124 "from a set of %d images\n", best_frame_idx,
yading@11	125 picref->pts * av_q2d(thumb->tb), nb_frames);
yading@11	126 thumb->frames[best_frame_idx].buf = NULL;
yading@11	127
yading@11	128 return picref;
yading@11	129 }
yading@11	130
yading@11	131 static int filter_frame(AVFilterLink inlink, AVFrame frame)
yading@11	132 {
yading@11	133 int i, j;
yading@11	134 AVFilterContext *ctx = inlink->dst;
yading@11	135 ThumbContext *thumb = ctx->priv;
yading@11	136 AVFilterLink *outlink = ctx->outputs[0];
yading@11	137 int *hist = thumb->frames[thumb->n].histogram;
yading@11	138 const uint8_t *p = frame->data[0];
yading@11	139
yading@11	140 // keep a reference of each frame
yading@11	141 thumb->frames[thumb->n].buf = frame;
yading@11	142
yading@11	143 // update current frame RGB histogram
yading@11	144 for (j = 0; j < inlink->h; j++) {
yading@11	145 for (i = 0; i < inlink->w; i++) {
yading@11	146 hist[0256 + p[i3 ]]++;
yading@11	147 hist[1256 + p[i3 + 1]]++;
yading@11	148 hist[2256 + p[i3 + 2]]++;
yading@11	149 }
yading@11	150 p += frame->linesize[0];
yading@11	151 }
yading@11	152
yading@11	153 // no selection until the buffer of N frames is filled up
yading@11	154 thumb->n++;
yading@11	155 if (thumb->n < thumb->n_frames)
yading@11	156 return 0;
yading@11	157
yading@11	158 return ff_filter_frame(outlink, get_best_frame(ctx));
yading@11	159 }
yading@11	160
yading@11	161 static av_cold void uninit(AVFilterContext *ctx)
yading@11	162 {
yading@11	163 int i;
yading@11	164 ThumbContext *thumb = ctx->priv;
yading@11	165 for (i = 0; i < thumb->n_frames && thumb->frames[i].buf; i++)
yading@11	166 av_frame_free(&thumb->frames[i].buf);
yading@11	167 av_freep(&thumb->frames);
yading@11	168 }
yading@11	169
yading@11	170 static int request_frame(AVFilterLink *link)
yading@11	171 {
yading@11	172 AVFilterContext *ctx = link->src;
yading@11	173 ThumbContext *thumb = ctx->priv;
yading@11	174
yading@11	175 /* loop until a frame thumbnail is available (when a frame is queued,
yading@11	176 * thumb->n is reset to zero) */
yading@11	177 do {
yading@11	178 int ret = ff_request_frame(ctx->inputs[0]);
yading@11	179 if (ret == AVERROR_EOF && thumb->n) {
yading@11	180 ret = ff_filter_frame(link, get_best_frame(ctx));
yading@11	181 if (ret < 0)
yading@11	182 return ret;
yading@11	183 ret = AVERROR_EOF;
yading@11	184 }
yading@11	185 if (ret < 0)
yading@11	186 return ret;
yading@11	187 } while (thumb->n);
yading@11	188 return 0;
yading@11	189 }
yading@11	190
yading@11	191 static int config_props(AVFilterLink *inlink)
yading@11	192 {
yading@11	193 AVFilterContext *ctx = inlink->dst;
yading@11	194 ThumbContext *thumb = ctx->priv;
yading@11	195
yading@11	196 thumb->tb = inlink->time_base;
yading@11	197 return 0;
yading@11	198 }
yading@11	199
yading@11	200 static int query_formats(AVFilterContext *ctx)
yading@11	201 {
yading@11	202 static const enum AVPixelFormat pix_fmts[] = {
yading@11	203 AV_PIX_FMT_RGB24, AV_PIX_FMT_BGR24,
yading@11	204 AV_PIX_FMT_NONE
yading@11	205 };
yading@11	206 ff_set_common_formats(ctx, ff_make_format_list(pix_fmts));
yading@11	207 return 0;
yading@11	208 }
yading@11	209
yading@11	210 static const AVFilterPad thumbnail_inputs[] = {
yading@11	211 {
yading@11	212 .name = "default",
yading@11	213 .type = AVMEDIA_TYPE_VIDEO,
yading@11	214 .config_props = config_props,
yading@11	215 .get_video_buffer = ff_null_get_video_buffer,
yading@11	216 .filter_frame = filter_frame,
yading@11	217 },
yading@11	218 { NULL }
yading@11	219 };
yading@11	220
yading@11	221 static const AVFilterPad thumbnail_outputs[] = {
yading@11	222 {
yading@11	223 .name = "default",
yading@11	224 .type = AVMEDIA_TYPE_VIDEO,
yading@11	225 .request_frame = request_frame,
yading@11	226 },
yading@11	227 { NULL }
yading@11	228 };
yading@11	229
yading@11	230 AVFilter avfilter_vf_thumbnail = {
yading@11	231 .name = "thumbnail",
yading@11	232 .description = NULL_IF_CONFIG_SMALL("Select the most representative frame in a given sequence of consecutive frames."),
yading@11	233 .priv_size = sizeof(ThumbContext),
yading@11	234 .init = init,
yading@11	235 .uninit = uninit,
yading@11	236 .query_formats = query_formats,
yading@11	237 .inputs = thumbnail_inputs,
yading@11	238 .outputs = thumbnail_outputs,
yading@11	239 .priv_class = &thumbnail_class,
yading@11	240 };

Mercurial > hg > pmhd

annotate ffmpeg/libavfilter/vf_thumbnail.c @ 13:844d341cf643 tip