annotate ffmpeg/libavfilter/vf_decimate.c @ 13:844d341cf643 tip

Back up before ISMIR
author Yading Song <yading.song@eecs.qmul.ac.uk>
date Thu, 31 Oct 2013 13:17:06 +0000
parents 6840f77b83aa
children
rev   line source
yading@10 1 /*
yading@10 2 * Copyright (c) 2012 Fredrik Mellbin
yading@10 3 * Copyright (c) 2013 Clément Bœsch
yading@10 4 *
yading@10 5 * This file is part of FFmpeg.
yading@10 6 *
yading@10 7 * FFmpeg is free software; you can redistribute it and/or
yading@10 8 * modify it under the terms of the GNU Lesser General Public
yading@10 9 * License as published by the Free Software Foundation; either
yading@10 10 * version 2.1 of the License, or (at your option) any later version.
yading@10 11 *
yading@10 12 * FFmpeg is distributed in the hope that it will be useful,
yading@10 13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
yading@10 14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
yading@10 15 * Lesser General Public License for more details.
yading@10 16 *
yading@10 17 * You should have received a copy of the GNU Lesser General Public
yading@10 18 * License along with FFmpeg; if not, write to the Free Software
yading@10 19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
yading@10 20 */
yading@10 21
yading@10 22 #include "libavutil/opt.h"
yading@10 23 #include "libavutil/pixdesc.h"
yading@10 24 #include "libavutil/timestamp.h"
yading@10 25 #include "avfilter.h"
yading@10 26 #include "internal.h"
yading@10 27
/** Indices of the filter's input pads. */
enum {
    INPUT_MAIN     = 0, ///< stream the difference metrics are computed on
    INPUT_CLEANSRC = 1, ///< optional clean source stream (only with ppsrc=1)
};
yading@10 30
yading@10 31 struct qitem {
yading@10 32 AVFrame *frame;
yading@10 33 int64_t maxbdiff;
yading@10 34 int64_t totdiff;
yading@10 35 };
yading@10 36
yading@10 37 typedef struct {
yading@10 38 const AVClass *class;
yading@10 39 struct qitem *queue; ///< window of cycle frames and the associated data diff
yading@10 40 int fid; ///< current frame id in the queue
yading@10 41 int filled; ///< 1 if the queue is filled, 0 otherwise
yading@10 42 AVFrame *last; ///< last frame from the previous queue
yading@10 43 int64_t frame_count; ///< output frame counter
yading@10 44 AVFrame **clean_src; ///< frame queue for the clean source
yading@10 45 int got_frame[2]; ///< frame request flag for each input stream
yading@10 46 double ts_unit; ///< timestamp units for the output frames
yading@10 47 uint32_t eof; ///< bitmask for end of stream
yading@10 48 int hsub, vsub; ///< chroma subsampling values
yading@10 49 int depth;
yading@10 50 int nxblocks, nyblocks;
yading@10 51 int bdiffsize;
yading@10 52 int64_t *bdiffs;
yading@10 53
yading@10 54 /* options */
yading@10 55 int cycle;
yading@10 56 double dupthresh_flt;
yading@10 57 double scthresh_flt;
yading@10 58 int64_t dupthresh;
yading@10 59 int64_t scthresh;
yading@10 60 int blockx, blocky;
yading@10 61 int ppsrc;
yading@10 62 int chroma;
yading@10 63 } DecimateContext;
yading@10 64
yading@10 65 #define OFFSET(x) offsetof(DecimateContext, x)
yading@10 66 #define FLAGS AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_FILTERING_PARAM
yading@10 67
yading@10 68 static const AVOption decimate_options[] = {
yading@10 69 { "cycle", "set the number of frame from which one will be dropped", OFFSET(cycle), AV_OPT_TYPE_INT, {.i64 = 5}, 2, 25, FLAGS },
yading@10 70 { "dupthresh", "set duplicate threshold", OFFSET(dupthresh_flt), AV_OPT_TYPE_DOUBLE, {.dbl = 1.1}, 0, 100, FLAGS },
yading@10 71 { "scthresh", "set scene change threshold", OFFSET(scthresh_flt), AV_OPT_TYPE_DOUBLE, {.dbl = 15.0}, 0, 100, FLAGS },
yading@10 72 { "blockx", "set the size of the x-axis blocks used during metric calculations", OFFSET(blockx), AV_OPT_TYPE_INT, {.i64 = 32}, 4, 1<<9, FLAGS },
yading@10 73 { "blocky", "set the size of the y-axis blocks used during metric calculations", OFFSET(blocky), AV_OPT_TYPE_INT, {.i64 = 32}, 4, 1<<9, FLAGS },
yading@10 74 { "ppsrc", "mark main input as a pre-processed input and activate clean source input stream", OFFSET(ppsrc), AV_OPT_TYPE_INT, {.i64=0}, 0, 1, FLAGS },
yading@10 75 { "chroma", "set whether or not chroma is considered in the metric calculations", OFFSET(chroma), AV_OPT_TYPE_INT, {.i64=1}, 0, 1, FLAGS },
yading@10 76 { NULL }
yading@10 77 };
yading@10 78
yading@10 79 AVFILTER_DEFINE_CLASS(decimate);
yading@10 80
yading@10 81 static void calc_diffs(const DecimateContext *dm, struct qitem *q,
yading@10 82 const AVFrame *f1, const AVFrame *f2)
yading@10 83 {
yading@10 84 int64_t maxdiff = -1;
yading@10 85 int64_t *bdiffs = dm->bdiffs;
yading@10 86 int plane, i, j;
yading@10 87
yading@10 88 memset(bdiffs, 0, dm->bdiffsize * sizeof(*bdiffs));
yading@10 89
yading@10 90 for (plane = 0; plane < (dm->chroma ? 3 : 1); plane++) {
yading@10 91 int x, y, xl;
yading@10 92 const int linesize1 = f1->linesize[plane];
yading@10 93 const int linesize2 = f2->linesize[plane];
yading@10 94 const uint8_t *f1p = f1->data[plane];
yading@10 95 const uint8_t *f2p = f2->data[plane];
yading@10 96 int width = plane ? f1->width >> dm->hsub : f1->width;
yading@10 97 int height = plane ? f1->height >> dm->vsub : f1->height;
yading@10 98 int hblockx = dm->blockx / 2;
yading@10 99 int hblocky = dm->blocky / 2;
yading@10 100
yading@10 101 if (plane) {
yading@10 102 hblockx >>= dm->hsub;
yading@10 103 hblocky >>= dm->vsub;
yading@10 104 }
yading@10 105
yading@10 106 for (y = 0; y < height; y++) {
yading@10 107 int ydest = y / hblocky;
yading@10 108 int xdest = 0;
yading@10 109
yading@10 110 #define CALC_DIFF(nbits) do { \
yading@10 111 for (x = 0; x < width; x += hblockx) { \
yading@10 112 int64_t acc = 0; \
yading@10 113 int m = FFMIN(width, x + hblockx); \
yading@10 114 for (xl = x; xl < m; xl++) \
yading@10 115 acc += abs(((const uint##nbits##_t *)f1p)[xl] - \
yading@10 116 ((const uint##nbits##_t *)f2p)[xl]); \
yading@10 117 bdiffs[ydest * dm->nxblocks + xdest] += acc; \
yading@10 118 xdest++; \
yading@10 119 } \
yading@10 120 } while (0)
yading@10 121 if (dm->depth == 8) CALC_DIFF(8);
yading@10 122 else CALC_DIFF(16);
yading@10 123
yading@10 124 f1p += linesize1;
yading@10 125 f2p += linesize2;
yading@10 126 }
yading@10 127 }
yading@10 128
yading@10 129 for (i = 0; i < dm->nyblocks - 1; i++) {
yading@10 130 for (j = 0; j < dm->nxblocks - 1; j++) {
yading@10 131 int64_t tmp = bdiffs[ i * dm->nxblocks + j ]
yading@10 132 + bdiffs[ i * dm->nxblocks + j + 1]
yading@10 133 + bdiffs[(i + 1) * dm->nxblocks + j ]
yading@10 134 + bdiffs[(i + 1) * dm->nxblocks + j + 1];
yading@10 135 if (tmp > maxdiff)
yading@10 136 maxdiff = tmp;
yading@10 137 }
yading@10 138 }
yading@10 139
yading@10 140 q->totdiff = 0;
yading@10 141 for (i = 0; i < dm->bdiffsize; i++)
yading@10 142 q->totdiff += bdiffs[i];
yading@10 143 q->maxbdiff = maxdiff;
yading@10 144 }
yading@10 145
yading@10 146 static int filter_frame(AVFilterLink *inlink, AVFrame *in)
yading@10 147 {
yading@10 148 int scpos = -1, duppos = -1;
yading@10 149 int drop = INT_MIN, i, lowest = 0, ret;
yading@10 150 AVFilterContext *ctx = inlink->dst;
yading@10 151 AVFilterLink *outlink = ctx->outputs[0];
yading@10 152 DecimateContext *dm = ctx->priv;
yading@10 153 AVFrame *prv;
yading@10 154
yading@10 155 /* update frames queue(s) */
yading@10 156 if (FF_INLINK_IDX(inlink) == INPUT_MAIN) {
yading@10 157 dm->queue[dm->fid].frame = in;
yading@10 158 dm->got_frame[INPUT_MAIN] = 1;
yading@10 159 } else {
yading@10 160 dm->clean_src[dm->fid] = in;
yading@10 161 dm->got_frame[INPUT_CLEANSRC] = 1;
yading@10 162 }
yading@10 163 if (!dm->got_frame[INPUT_MAIN] || (dm->ppsrc && !dm->got_frame[INPUT_CLEANSRC]))
yading@10 164 return 0;
yading@10 165 dm->got_frame[INPUT_MAIN] = dm->got_frame[INPUT_CLEANSRC] = 0;
yading@10 166
yading@10 167 if (in) {
yading@10 168 /* update frame metrics */
yading@10 169 prv = dm->fid ? dm->queue[dm->fid - 1].frame : dm->last;
yading@10 170 if (!prv)
yading@10 171 prv = in;
yading@10 172 calc_diffs(dm, &dm->queue[dm->fid], prv, in);
yading@10 173 if (++dm->fid != dm->cycle)
yading@10 174 return 0;
yading@10 175 av_frame_free(&dm->last);
yading@10 176 dm->last = av_frame_clone(in);
yading@10 177 dm->fid = 0;
yading@10 178
yading@10 179 /* we have a complete cycle, select the frame to drop */
yading@10 180 lowest = 0;
yading@10 181 for (i = 0; i < dm->cycle; i++) {
yading@10 182 if (dm->queue[i].totdiff > dm->scthresh)
yading@10 183 scpos = i;
yading@10 184 if (dm->queue[i].maxbdiff < dm->queue[lowest].maxbdiff)
yading@10 185 lowest = i;
yading@10 186 }
yading@10 187 if (dm->queue[lowest].maxbdiff < dm->dupthresh)
yading@10 188 duppos = lowest;
yading@10 189 drop = scpos >= 0 && duppos < 0 ? scpos : lowest;
yading@10 190 }
yading@10 191
yading@10 192 /* metrics debug */
yading@10 193 if (av_log_get_level() >= AV_LOG_DEBUG) {
yading@10 194 av_log(ctx, AV_LOG_DEBUG, "1/%d frame drop:\n", dm->cycle);
yading@10 195 for (i = 0; i < dm->cycle && dm->queue[i].frame; i++) {
yading@10 196 av_log(ctx, AV_LOG_DEBUG," #%d: totdiff=%08"PRIx64" maxbdiff=%08"PRIx64"%s%s%s%s\n",
yading@10 197 i + 1, dm->queue[i].totdiff, dm->queue[i].maxbdiff,
yading@10 198 i == scpos ? " sc" : "",
yading@10 199 i == duppos ? " dup" : "",
yading@10 200 i == lowest ? " lowest" : "",
yading@10 201 i == drop ? " [DROP]" : "");
yading@10 202 }
yading@10 203 }
yading@10 204
yading@10 205 /* push all frames except the drop */
yading@10 206 ret = 0;
yading@10 207 for (i = 0; i < dm->cycle && dm->queue[i].frame; i++) {
yading@10 208 if (i == drop) {
yading@10 209 if (dm->ppsrc)
yading@10 210 av_frame_free(&dm->clean_src[i]);
yading@10 211 av_frame_free(&dm->queue[i].frame);
yading@10 212 } else {
yading@10 213 AVFrame *frame = dm->queue[i].frame;
yading@10 214 if (dm->ppsrc) {
yading@10 215 av_frame_free(&frame);
yading@10 216 frame = dm->clean_src[i];
yading@10 217 }
yading@10 218 frame->pts = dm->frame_count++ * dm->ts_unit;
yading@10 219 ret = ff_filter_frame(outlink, frame);
yading@10 220 if (ret < 0)
yading@10 221 break;
yading@10 222 }
yading@10 223 }
yading@10 224
yading@10 225 return ret;
yading@10 226 }
yading@10 227
yading@10 228 static int config_input(AVFilterLink *inlink)
yading@10 229 {
yading@10 230 int max_value;
yading@10 231 AVFilterContext *ctx = inlink->dst;
yading@10 232 DecimateContext *dm = ctx->priv;
yading@10 233 const AVPixFmtDescriptor *pix_desc = av_pix_fmt_desc_get(inlink->format);
yading@10 234 const int w = inlink->w;
yading@10 235 const int h = inlink->h;
yading@10 236
yading@10 237 dm->hsub = pix_desc->log2_chroma_w;
yading@10 238 dm->vsub = pix_desc->log2_chroma_h;
yading@10 239 dm->depth = pix_desc->comp[0].depth_minus1 + 1;
yading@10 240 max_value = (1 << dm->depth) - 1;
yading@10 241 dm->scthresh = (int64_t)(((int64_t)max_value * w * h * dm->scthresh_flt) / 100);
yading@10 242 dm->dupthresh = (int64_t)(((int64_t)max_value * dm->blockx * dm->blocky * dm->dupthresh_flt) / 100);
yading@10 243 dm->nxblocks = (w + dm->blockx/2 - 1) / (dm->blockx/2);
yading@10 244 dm->nyblocks = (h + dm->blocky/2 - 1) / (dm->blocky/2);
yading@10 245 dm->bdiffsize = dm->nxblocks * dm->nyblocks;
yading@10 246 dm->bdiffs = av_malloc(dm->bdiffsize * sizeof(*dm->bdiffs));
yading@10 247 dm->queue = av_calloc(dm->cycle, sizeof(*dm->queue));
yading@10 248
yading@10 249 if (!dm->bdiffs || !dm->queue)
yading@10 250 return AVERROR(ENOMEM);
yading@10 251
yading@10 252 if (dm->ppsrc) {
yading@10 253 dm->clean_src = av_calloc(dm->cycle, sizeof(*dm->clean_src));
yading@10 254 if (!dm->clean_src)
yading@10 255 return AVERROR(ENOMEM);
yading@10 256 }
yading@10 257
yading@10 258 return 0;
yading@10 259 }
yading@10 260
yading@10 261 static av_cold int decimate_init(AVFilterContext *ctx)
yading@10 262 {
yading@10 263 const DecimateContext *dm = ctx->priv;
yading@10 264 AVFilterPad pad = {
yading@10 265 .name = av_strdup("main"),
yading@10 266 .type = AVMEDIA_TYPE_VIDEO,
yading@10 267 .filter_frame = filter_frame,
yading@10 268 .config_props = config_input,
yading@10 269 };
yading@10 270
yading@10 271 if (!pad.name)
yading@10 272 return AVERROR(ENOMEM);
yading@10 273 ff_insert_inpad(ctx, INPUT_MAIN, &pad);
yading@10 274
yading@10 275 if (dm->ppsrc) {
yading@10 276 pad.name = av_strdup("clean_src");
yading@10 277 pad.config_props = NULL;
yading@10 278 if (!pad.name)
yading@10 279 return AVERROR(ENOMEM);
yading@10 280 ff_insert_inpad(ctx, INPUT_CLEANSRC, &pad);
yading@10 281 }
yading@10 282
yading@10 283 if ((dm->blockx & (dm->blockx - 1)) ||
yading@10 284 (dm->blocky & (dm->blocky - 1))) {
yading@10 285 av_log(ctx, AV_LOG_ERROR, "blockx and blocky settings must be power of two\n");
yading@10 286 return AVERROR(EINVAL);
yading@10 287 }
yading@10 288
yading@10 289 return 0;
yading@10 290 }
yading@10 291
yading@10 292 static av_cold void decimate_uninit(AVFilterContext *ctx)
yading@10 293 {
yading@10 294 int i;
yading@10 295 DecimateContext *dm = ctx->priv;
yading@10 296
yading@10 297 av_frame_free(&dm->last);
yading@10 298 av_freep(&dm->bdiffs);
yading@10 299 av_freep(&dm->queue);
yading@10 300 av_freep(&dm->clean_src);
yading@10 301 for (i = 0; i < ctx->nb_inputs; i++)
yading@10 302 av_freep(&ctx->input_pads[i].name);
yading@10 303 }
yading@10 304
yading@10 305 static int request_inlink(AVFilterContext *ctx, int lid)
yading@10 306 {
yading@10 307 int ret = 0;
yading@10 308 DecimateContext *dm = ctx->priv;
yading@10 309
yading@10 310 if (!dm->got_frame[lid]) {
yading@10 311 AVFilterLink *inlink = ctx->inputs[lid];
yading@10 312 ret = ff_request_frame(inlink);
yading@10 313 if (ret == AVERROR_EOF) { // flushing
yading@10 314 dm->eof |= 1 << lid;
yading@10 315 ret = filter_frame(inlink, NULL);
yading@10 316 }
yading@10 317 }
yading@10 318 return ret;
yading@10 319 }
yading@10 320
yading@10 321 static int request_frame(AVFilterLink *outlink)
yading@10 322 {
yading@10 323 int ret;
yading@10 324 AVFilterContext *ctx = outlink->src;
yading@10 325 DecimateContext *dm = ctx->priv;
yading@10 326 const uint32_t eof_mask = 1<<INPUT_MAIN | dm->ppsrc<<INPUT_CLEANSRC;
yading@10 327
yading@10 328 if ((dm->eof & eof_mask) == eof_mask) // flush done?
yading@10 329 return AVERROR_EOF;
yading@10 330 if ((ret = request_inlink(ctx, INPUT_MAIN)) < 0)
yading@10 331 return ret;
yading@10 332 if (dm->ppsrc && (ret = request_inlink(ctx, INPUT_CLEANSRC)) < 0)
yading@10 333 return ret;
yading@10 334 return 0;
yading@10 335 }
yading@10 336
yading@10 337 static int query_formats(AVFilterContext *ctx)
yading@10 338 {
yading@10 339 static const enum AVPixelFormat pix_fmts[] = {
yading@10 340 #define PF_NOALPHA(suf) AV_PIX_FMT_YUV420##suf, AV_PIX_FMT_YUV422##suf, AV_PIX_FMT_YUV444##suf
yading@10 341 #define PF_ALPHA(suf) AV_PIX_FMT_YUVA420##suf, AV_PIX_FMT_YUVA422##suf, AV_PIX_FMT_YUVA444##suf
yading@10 342 #define PF(suf) PF_NOALPHA(suf), PF_ALPHA(suf)
yading@10 343 PF(P), PF(P9), PF(P10), PF_NOALPHA(P12), PF_NOALPHA(P14), PF(P16),
yading@10 344 AV_PIX_FMT_YUV411P, AV_PIX_FMT_YUV410P,
yading@10 345 AV_PIX_FMT_GRAY8,
yading@10 346 AV_PIX_FMT_NONE
yading@10 347 };
yading@10 348 ff_set_common_formats(ctx, ff_make_format_list(pix_fmts));
yading@10 349 return 0;
yading@10 350 }
yading@10 351
yading@10 352 static int config_output(AVFilterLink *outlink)
yading@10 353 {
yading@10 354 AVFilterContext *ctx = outlink->src;
yading@10 355 DecimateContext *dm = ctx->priv;
yading@10 356 const AVFilterLink *inlink =
yading@10 357 ctx->inputs[dm->ppsrc ? INPUT_CLEANSRC : INPUT_MAIN];
yading@10 358 AVRational fps = inlink->frame_rate;
yading@10 359
yading@10 360 if (!fps.num || !fps.den) {
yading@10 361 av_log(ctx, AV_LOG_ERROR, "The input needs a constant frame rate; "
yading@10 362 "current rate of %d/%d is invalid\n", fps.num, fps.den);
yading@10 363 return AVERROR(EINVAL);
yading@10 364 }
yading@10 365 fps = av_mul_q(fps, (AVRational){dm->cycle - 1, dm->cycle});
yading@10 366 av_log(ctx, AV_LOG_VERBOSE, "FPS: %d/%d -> %d/%d\n",
yading@10 367 inlink->frame_rate.num, inlink->frame_rate.den, fps.num, fps.den);
yading@10 368 outlink->flags |= FF_LINK_FLAG_REQUEST_LOOP;
yading@10 369 outlink->time_base = inlink->time_base;
yading@10 370 outlink->frame_rate = fps;
yading@10 371 outlink->sample_aspect_ratio = inlink->sample_aspect_ratio;
yading@10 372 outlink->w = inlink->w;
yading@10 373 outlink->h = inlink->h;
yading@10 374 dm->ts_unit = av_q2d(av_inv_q(av_mul_q(fps, outlink->time_base)));
yading@10 375 return 0;
yading@10 376 }
yading@10 377
yading@10 378 static const AVFilterPad decimate_outputs[] = {
yading@10 379 {
yading@10 380 .name = "default",
yading@10 381 .type = AVMEDIA_TYPE_VIDEO,
yading@10 382 .request_frame = request_frame,
yading@10 383 .config_props = config_output,
yading@10 384 },
yading@10 385 { NULL }
yading@10 386 };
yading@10 387
yading@10 388 AVFilter avfilter_vf_decimate = {
yading@10 389 .name = "decimate",
yading@10 390 .description = NULL_IF_CONFIG_SMALL("Decimate frames (post field matching filter)."),
yading@10 391 .init = decimate_init,
yading@10 392 .uninit = decimate_uninit,
yading@10 393 .priv_size = sizeof(DecimateContext),
yading@10 394 .query_formats = query_formats,
yading@10 395 .outputs = decimate_outputs,
yading@10 396 .priv_class = &decimate_class,
yading@10 397 .flags = AVFILTER_FLAG_DYNAMIC_INPUTS,
yading@10 398 };