annotate ffmpeg/libavfilter/libmpcodecs/pullup.c @ 13:844d341cf643 tip

Back up before ISMIR
author Yading Song <yading.song@eecs.qmul.ac.uk>
date Thu, 31 Oct 2013 13:17:06 +0000
parents 6840f77b83aa
children
rev   line source
yading@10 1 /*
yading@10 2 * This file is part of MPlayer.
yading@10 3 *
yading@10 4 * MPlayer is free software; you can redistribute it and/or modify
yading@10 5 * it under the terms of the GNU General Public License as published by
yading@10 6 * the Free Software Foundation; either version 2 of the License, or
yading@10 7 * (at your option) any later version.
yading@10 8 *
yading@10 9 * MPlayer is distributed in the hope that it will be useful,
yading@10 10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
yading@10 11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
yading@10 12 * GNU General Public License for more details.
yading@10 13 *
yading@10 14 * You should have received a copy of the GNU General Public License along
yading@10 15 * with MPlayer; if not, write to the Free Software Foundation, Inc.,
yading@10 16 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
yading@10 17 */
yading@10 18
yading@10 19 #include <stdio.h>
yading@10 20 #include <stdlib.h>
yading@10 21 #include <string.h>
yading@10 22
yading@10 23 #include "libavutil/x86/asm.h"
yading@10 24 #include "config.h"
yading@10 25 #include "pullup.h"
yading@10 26
yading@10 27
yading@10 28
yading@10 29 #if ARCH_X86
yading@10 30 #if HAVE_MMX
yading@10 31 static int diff_y_mmx(unsigned char *a, unsigned char *b, int s)
yading@10 32 {
yading@10 33 int ret;
yading@10 34 __asm__ volatile (
yading@10 35 "movl $4, %%ecx \n\t"
yading@10 36 "pxor %%mm4, %%mm4 \n\t"
yading@10 37 "pxor %%mm7, %%mm7 \n\t"
yading@10 38
yading@10 39 "1: \n\t"
yading@10 40
yading@10 41 "movq (%%"REG_S"), %%mm0 \n\t"
yading@10 42 "movq (%%"REG_S"), %%mm2 \n\t"
yading@10 43 "add %%"REG_a", %%"REG_S" \n\t"
yading@10 44 "movq (%%"REG_D"), %%mm1 \n\t"
yading@10 45 "add %%"REG_a", %%"REG_D" \n\t"
yading@10 46 "psubusb %%mm1, %%mm2 \n\t"
yading@10 47 "psubusb %%mm0, %%mm1 \n\t"
yading@10 48 "movq %%mm2, %%mm0 \n\t"
yading@10 49 "movq %%mm1, %%mm3 \n\t"
yading@10 50 "punpcklbw %%mm7, %%mm0 \n\t"
yading@10 51 "punpcklbw %%mm7, %%mm1 \n\t"
yading@10 52 "punpckhbw %%mm7, %%mm2 \n\t"
yading@10 53 "punpckhbw %%mm7, %%mm3 \n\t"
yading@10 54 "paddw %%mm0, %%mm4 \n\t"
yading@10 55 "paddw %%mm1, %%mm4 \n\t"
yading@10 56 "paddw %%mm2, %%mm4 \n\t"
yading@10 57 "paddw %%mm3, %%mm4 \n\t"
yading@10 58
yading@10 59 "decl %%ecx \n\t"
yading@10 60 "jnz 1b \n\t"
yading@10 61
yading@10 62 "movq %%mm4, %%mm3 \n\t"
yading@10 63 "punpcklwd %%mm7, %%mm4 \n\t"
yading@10 64 "punpckhwd %%mm7, %%mm3 \n\t"
yading@10 65 "paddd %%mm4, %%mm3 \n\t"
yading@10 66 "movd %%mm3, %%eax \n\t"
yading@10 67 "psrlq $32, %%mm3 \n\t"
yading@10 68 "movd %%mm3, %%edx \n\t"
yading@10 69 "addl %%edx, %%eax \n\t"
yading@10 70 "emms \n\t"
yading@10 71 : "=a" (ret)
yading@10 72 : "S" (a), "D" (b), "a" (s)
yading@10 73 : "%ecx", "%edx"
yading@10 74 );
yading@10 75 return ret;
yading@10 76 }
yading@10 77
yading@10 78 static int licomb_y_mmx(unsigned char *a, unsigned char *b, int s)
yading@10 79 {
yading@10 80 int ret;
yading@10 81 __asm__ volatile (
yading@10 82 "movl $4, %%ecx \n\t"
yading@10 83 "pxor %%mm6, %%mm6 \n\t"
yading@10 84 "pxor %%mm7, %%mm7 \n\t"
yading@10 85 "sub %%"REG_a", %%"REG_D" \n\t"
yading@10 86
yading@10 87 "2: \n\t"
yading@10 88
yading@10 89 "movq (%%"REG_D"), %%mm0 \n\t"
yading@10 90 "movq (%%"REG_D"), %%mm1 \n\t"
yading@10 91 "punpcklbw %%mm7, %%mm0 \n\t"
yading@10 92 "movq (%%"REG_D",%%"REG_a"), %%mm2 \n\t"
yading@10 93 "punpcklbw %%mm7, %%mm1 \n\t"
yading@10 94 "punpcklbw %%mm7, %%mm2 \n\t"
yading@10 95 "paddw %%mm0, %%mm0 \n\t"
yading@10 96 "paddw %%mm2, %%mm1 \n\t"
yading@10 97 "movq %%mm0, %%mm2 \n\t"
yading@10 98 "psubusw %%mm1, %%mm0 \n\t"
yading@10 99 "psubusw %%mm2, %%mm1 \n\t"
yading@10 100 "paddw %%mm0, %%mm6 \n\t"
yading@10 101 "paddw %%mm1, %%mm6 \n\t"
yading@10 102
yading@10 103 "movq (%%"REG_S"), %%mm0 \n\t"
yading@10 104 "movq (%%"REG_D"), %%mm1 \n\t"
yading@10 105 "punpckhbw %%mm7, %%mm0 \n\t"
yading@10 106 "movq (%%"REG_D",%%"REG_a"), %%mm2 \n\t"
yading@10 107 "punpckhbw %%mm7, %%mm1 \n\t"
yading@10 108 "punpckhbw %%mm7, %%mm2 \n\t"
yading@10 109 "paddw %%mm0, %%mm0 \n\t"
yading@10 110 "paddw %%mm2, %%mm1 \n\t"
yading@10 111 "movq %%mm0, %%mm2 \n\t"
yading@10 112 "psubusw %%mm1, %%mm0 \n\t"
yading@10 113 "psubusw %%mm2, %%mm1 \n\t"
yading@10 114 "paddw %%mm0, %%mm6 \n\t"
yading@10 115 "paddw %%mm1, %%mm6 \n\t"
yading@10 116
yading@10 117 "movq (%%"REG_D",%%"REG_a"), %%mm0 \n\t"
yading@10 118 "movq (%%"REG_S"), %%mm1 \n\t"
yading@10 119 "punpcklbw %%mm7, %%mm0 \n\t"
yading@10 120 "movq (%%"REG_S",%%"REG_a"), %%mm2 \n\t"
yading@10 121 "punpcklbw %%mm7, %%mm1 \n\t"
yading@10 122 "punpcklbw %%mm7, %%mm2 \n\t"
yading@10 123 "paddw %%mm0, %%mm0 \n\t"
yading@10 124 "paddw %%mm2, %%mm1 \n\t"
yading@10 125 "movq %%mm0, %%mm2 \n\t"
yading@10 126 "psubusw %%mm1, %%mm0 \n\t"
yading@10 127 "psubusw %%mm2, %%mm1 \n\t"
yading@10 128 "paddw %%mm0, %%mm6 \n\t"
yading@10 129 "paddw %%mm1, %%mm6 \n\t"
yading@10 130
yading@10 131 "movq (%%"REG_D",%%"REG_a"), %%mm0 \n\t"
yading@10 132 "movq (%%"REG_S"), %%mm1 \n\t"
yading@10 133 "punpckhbw %%mm7, %%mm0 \n\t"
yading@10 134 "movq (%%"REG_S",%%"REG_a"), %%mm2 \n\t"
yading@10 135 "punpckhbw %%mm7, %%mm1 \n\t"
yading@10 136 "punpckhbw %%mm7, %%mm2 \n\t"
yading@10 137 "paddw %%mm0, %%mm0 \n\t"
yading@10 138 "paddw %%mm2, %%mm1 \n\t"
yading@10 139 "movq %%mm0, %%mm2 \n\t"
yading@10 140 "psubusw %%mm1, %%mm0 \n\t"
yading@10 141 "psubusw %%mm2, %%mm1 \n\t"
yading@10 142 "paddw %%mm0, %%mm6 \n\t"
yading@10 143 "paddw %%mm1, %%mm6 \n\t"
yading@10 144
yading@10 145 "add %%"REG_a", %%"REG_S" \n\t"
yading@10 146 "add %%"REG_a", %%"REG_D" \n\t"
yading@10 147 "decl %%ecx \n\t"
yading@10 148 "jnz 2b \n\t"
yading@10 149
yading@10 150 "movq %%mm6, %%mm5 \n\t"
yading@10 151 "punpcklwd %%mm7, %%mm6 \n\t"
yading@10 152 "punpckhwd %%mm7, %%mm5 \n\t"
yading@10 153 "paddd %%mm6, %%mm5 \n\t"
yading@10 154 "movd %%mm5, %%eax \n\t"
yading@10 155 "psrlq $32, %%mm5 \n\t"
yading@10 156 "movd %%mm5, %%edx \n\t"
yading@10 157 "addl %%edx, %%eax \n\t"
yading@10 158
yading@10 159 "emms \n\t"
yading@10 160 : "=a" (ret)
yading@10 161 : "S" (a), "D" (b), "a" (s)
yading@10 162 : "%ecx", "%edx"
yading@10 163 );
yading@10 164 return ret;
yading@10 165 }
yading@10 166
yading@10 167 static int var_y_mmx(unsigned char *a, unsigned char *b, int s)
yading@10 168 {
yading@10 169 int ret;
yading@10 170 __asm__ volatile (
yading@10 171 "movl $3, %%ecx \n\t"
yading@10 172 "pxor %%mm4, %%mm4 \n\t"
yading@10 173 "pxor %%mm7, %%mm7 \n\t"
yading@10 174
yading@10 175 "1: \n\t"
yading@10 176
yading@10 177 "movq (%%"REG_S"), %%mm0 \n\t"
yading@10 178 "movq (%%"REG_S"), %%mm2 \n\t"
yading@10 179 "movq (%%"REG_S",%%"REG_a"), %%mm1 \n\t"
yading@10 180 "add %%"REG_a", %%"REG_S" \n\t"
yading@10 181 "psubusb %%mm1, %%mm2 \n\t"
yading@10 182 "psubusb %%mm0, %%mm1 \n\t"
yading@10 183 "movq %%mm2, %%mm0 \n\t"
yading@10 184 "movq %%mm1, %%mm3 \n\t"
yading@10 185 "punpcklbw %%mm7, %%mm0 \n\t"
yading@10 186 "punpcklbw %%mm7, %%mm1 \n\t"
yading@10 187 "punpckhbw %%mm7, %%mm2 \n\t"
yading@10 188 "punpckhbw %%mm7, %%mm3 \n\t"
yading@10 189 "paddw %%mm0, %%mm4 \n\t"
yading@10 190 "paddw %%mm1, %%mm4 \n\t"
yading@10 191 "paddw %%mm2, %%mm4 \n\t"
yading@10 192 "paddw %%mm3, %%mm4 \n\t"
yading@10 193
yading@10 194 "decl %%ecx \n\t"
yading@10 195 "jnz 1b \n\t"
yading@10 196
yading@10 197 "movq %%mm4, %%mm3 \n\t"
yading@10 198 "punpcklwd %%mm7, %%mm4 \n\t"
yading@10 199 "punpckhwd %%mm7, %%mm3 \n\t"
yading@10 200 "paddd %%mm4, %%mm3 \n\t"
yading@10 201 "movd %%mm3, %%eax \n\t"
yading@10 202 "psrlq $32, %%mm3 \n\t"
yading@10 203 "movd %%mm3, %%edx \n\t"
yading@10 204 "addl %%edx, %%eax \n\t"
yading@10 205 "emms \n\t"
yading@10 206 : "=a" (ret)
yading@10 207 : "S" (a), "a" (s)
yading@10 208 : "%ecx", "%edx"
yading@10 209 );
yading@10 210 return 4*ret;
yading@10 211 }
yading@10 212 #endif
yading@10 213 #endif
yading@10 214
/*
 * Absolute value of an int expression.
 * Written as a comparison so it does not depend on int being 32 bits wide
 * or on right-shifting negative values being arithmetic.
 * Note: the argument is evaluated more than once; pass side-effect-free
 * expressions only.
 */
#define ABS(a) ((a) < 0 ? -(a) : (a))
yading@10 216
/*
 * Sum of absolute differences between two blocks of 8 bytes x 4 rows.
 *
 * a, b: first byte of each block.
 * s:    distance in bytes between consecutive rows.
 */
static int diff_y(unsigned char *a, unsigned char *b, int s)
{
    int total = 0;
    int row, col;

    for (row = 0; row < 4; row++) {
        const unsigned char *pa = a + row * s;
        const unsigned char *pb = b + row * s;

        for (col = 0; col < 8; col++) {
            int d = pa[col] - pb[col];
            total += d < 0 ? -d : d;
        }
    }
    return total;
}
yading@10 226
/*
 * Comb metric over a block of 8 bytes x 4 rows: for every sample, adds
 *     |2*a[j] - b[j-s] - b[j]| + |2*b[j] - a[j] - a[j+s]|.
 *
 * a, b: first byte of each block; the row before b and the row after the
 *       last row of a are read as well.
 * s:    distance in bytes between consecutive rows.
 */
static int licomb_y(unsigned char *a, unsigned char *b, int s)
{
    int acc = 0;
    int row, col;

    for (row = 0; row < 4; row++, a += s, b += s) {
        for (col = 0; col < 8; col++) {
            int da = (a[col] << 1) - b[col - s] - b[col];
            int db = (b[col] << 1) - a[col] - a[col + s];

            acc += (da < 0 ? -da : da) + (db < 0 ? -db : db);
        }
    }
    return acc;
}
yading@10 238
yading@10 239 #if 0
/*
 * Alternative comb metric (currently compiled out) over a block of
 * 8 bytes x 4 rows: adds |a[j] - 3*b[j-s] + 3*a[j+s] - b[j]| per sample.
 *
 * a, b: first byte of each block; s: distance in bytes between rows.
 */
static int qpcomb_y(unsigned char *a, unsigned char *b, int s)
{
    int acc = 0;
    int row, col;

    for (row = 0; row < 4; row++, a += s, b += s) {
        for (col = 0; col < 8; col++) {
            int d = a[col] - 3*b[col - s] + 3*a[col + s] - b[col];

            acc += d < 0 ? -d : d;
        }
    }
    return acc;
}
yading@10 250
/*
 * Debug helper (currently compiled out): runs both the C and the MMX comb
 * metric on the same input, reports any mismatch on stdout and returns the
 * MMX result.
 */
static int licomb_y_test(unsigned char *a, unsigned char *b, int s)
{
    const int ref = licomb_y(a, b, s);
    const int simd = licomb_y_mmx(a, b, s);

    if (ref != simd)
        printf("%d != %d\n", ref, simd);
    return simd;
}
yading@10 258 #endif
yading@10 259
/*
 * Vertical activity of an 8-byte-wide block: sum of absolute differences
 * between each of the first 3 rows and the row below it, times 4 so the
 * result is on the same scale as the comb metric.
 *
 * a: first byte of the block.
 * b: not read (present so the signature matches the other metrics).
 * s: distance in bytes between consecutive rows.
 */
static int var_y(unsigned char *a, unsigned char *b, int s)
{
    int sum = 0;
    int row, col;

    (void)b;
    for (row = 0; row < 3; row++) {
        const unsigned char *cur = a + row * s;

        for (col = 0; col < 8; col++) {
            int d = cur[col] - cur[col + s];
            sum += d < 0 ? -d : d;
        }
    }
    return 4 * sum; /* match comb scaling */
}
yading@10 271
yading@10 272
yading@10 273
yading@10 274
yading@10 275
yading@10 276
yading@10 277
yading@10 278
yading@10 279
yading@10 280 static void alloc_buffer(struct pullup_context *c, struct pullup_buffer *b)
yading@10 281 {
yading@10 282 int i;
yading@10 283 if (b->planes) return;
yading@10 284 b->planes = calloc(c->nplanes, sizeof(unsigned char *));
yading@10 285 for (i = 0; i < c->nplanes; i++) {
yading@10 286 b->planes[i] = malloc(c->h[i]*c->stride[i]);
yading@10 287 /* Deal with idiotic 128=0 for chroma: */
yading@10 288 memset(b->planes[i], c->background[i], c->h[i]*c->stride[i]);
yading@10 289 }
yading@10 290 }
yading@10 291
yading@10 292 struct pullup_buffer *ff_pullup_lock_buffer(struct pullup_buffer *b, int parity)
yading@10 293 {
yading@10 294 if (!b) return 0;
yading@10 295 if ((parity+1) & 1) b->lock[0]++;
yading@10 296 if ((parity+1) & 2) b->lock[1]++;
yading@10 297 return b;
yading@10 298 }
yading@10 299
yading@10 300 void ff_pullup_release_buffer(struct pullup_buffer *b, int parity)
yading@10 301 {
yading@10 302 if (!b) return;
yading@10 303 if ((parity+1) & 1) b->lock[0]--;
yading@10 304 if ((parity+1) & 2) b->lock[1]--;
yading@10 305 }
yading@10 306
yading@10 307 struct pullup_buffer *ff_pullup_get_buffer(struct pullup_context *c, int parity)
yading@10 308 {
yading@10 309 int i;
yading@10 310
yading@10 311 /* Try first to get the sister buffer for the previous field */
yading@10 312 if (parity < 2 && c->last && parity != c->last->parity
yading@10 313 && !c->last->buffer->lock[parity]) {
yading@10 314 alloc_buffer(c, c->last->buffer);
yading@10 315 return ff_pullup_lock_buffer(c->last->buffer, parity);
yading@10 316 }
yading@10 317
yading@10 318 /* Prefer a buffer with both fields open */
yading@10 319 for (i = 0; i < c->nbuffers; i++) {
yading@10 320 if (c->buffers[i].lock[0]) continue;
yading@10 321 if (c->buffers[i].lock[1]) continue;
yading@10 322 alloc_buffer(c, &c->buffers[i]);
yading@10 323 return ff_pullup_lock_buffer(&c->buffers[i], parity);
yading@10 324 }
yading@10 325
yading@10 326 if (parity == 2) return 0;
yading@10 327
yading@10 328 /* Search for any half-free buffer */
yading@10 329 for (i = 0; i < c->nbuffers; i++) {
yading@10 330 if (((parity+1) & 1) && c->buffers[i].lock[0]) continue;
yading@10 331 if (((parity+1) & 2) && c->buffers[i].lock[1]) continue;
yading@10 332 alloc_buffer(c, &c->buffers[i]);
yading@10 333 return ff_pullup_lock_buffer(&c->buffers[i], parity);
yading@10 334 }
yading@10 335
yading@10 336 return 0;
yading@10 337 }
yading@10 338
yading@10 339
yading@10 340
yading@10 341
yading@10 342
yading@10 343
yading@10 344 static void compute_metric(struct pullup_context *c,
yading@10 345 struct pullup_field *fa, int pa,
yading@10 346 struct pullup_field *fb, int pb,
yading@10 347 int (*func)(unsigned char *, unsigned char *, int), int *dest)
yading@10 348 {
yading@10 349 unsigned char *a, *b;
yading@10 350 int x, y;
yading@10 351 int mp = c->metric_plane;
yading@10 352 int xstep = c->bpp[mp];
yading@10 353 int ystep = c->stride[mp]<<3;
yading@10 354 int s = c->stride[mp]<<1; /* field stride */
yading@10 355 int w = c->metric_w*xstep;
yading@10 356
yading@10 357 if (!fa->buffer || !fb->buffer) return;
yading@10 358
yading@10 359 /* Shortcut for duplicate fields (e.g. from RFF flag) */
yading@10 360 if (fa->buffer == fb->buffer && pa == pb) {
yading@10 361 memset(dest, 0, c->metric_len * sizeof(int));
yading@10 362 return;
yading@10 363 }
yading@10 364
yading@10 365 a = fa->buffer->planes[mp] + pa * c->stride[mp] + c->metric_offset;
yading@10 366 b = fb->buffer->planes[mp] + pb * c->stride[mp] + c->metric_offset;
yading@10 367
yading@10 368 for (y = c->metric_h; y; y--) {
yading@10 369 for (x = 0; x < w; x += xstep) {
yading@10 370 *dest++ = func(a + x, b + x, s);
yading@10 371 }
yading@10 372 a += ystep; b += ystep;
yading@10 373 }
yading@10 374 }
yading@10 375
yading@10 376
yading@10 377
yading@10 378
yading@10 379
yading@10 380 static void alloc_metrics(struct pullup_context *c, struct pullup_field *f)
yading@10 381 {
yading@10 382 f->diffs = calloc(c->metric_len, sizeof(int));
yading@10 383 f->comb = calloc(c->metric_len, sizeof(int));
yading@10 384 f->var = calloc(c->metric_len, sizeof(int));
yading@10 385 /* add more metrics here as needed */
yading@10 386 }
yading@10 387
yading@10 388 static struct pullup_field *make_field_queue(struct pullup_context *c, int len)
yading@10 389 {
yading@10 390 struct pullup_field *head, *f;
yading@10 391 f = head = calloc(1, sizeof(struct pullup_field));
yading@10 392 alloc_metrics(c, f);
yading@10 393 for (; len > 0; len--) {
yading@10 394 f->next = calloc(1, sizeof(struct pullup_field));
yading@10 395 f->next->prev = f;
yading@10 396 f = f->next;
yading@10 397 alloc_metrics(c, f);
yading@10 398 }
yading@10 399 f->next = head;
yading@10 400 head->prev = f;
yading@10 401 return head;
yading@10 402 }
yading@10 403
yading@10 404 static void check_field_queue(struct pullup_context *c)
yading@10 405 {
yading@10 406 if (c->head->next == c->first) {
yading@10 407 struct pullup_field *f = calloc(1, sizeof(struct pullup_field));
yading@10 408 alloc_metrics(c, f);
yading@10 409 f->prev = c->head;
yading@10 410 f->next = c->first;
yading@10 411 c->head->next = f;
yading@10 412 c->first->prev = f;
yading@10 413 }
yading@10 414 }
yading@10 415
yading@10 416 void ff_pullup_submit_field(struct pullup_context *c, struct pullup_buffer *b, int parity)
yading@10 417 {
yading@10 418 struct pullup_field *f;
yading@10 419
yading@10 420 /* Grow the circular list if needed */
yading@10 421 check_field_queue(c);
yading@10 422
yading@10 423 /* Cannot have two fields of same parity in a row; drop the new one */
yading@10 424 if (c->last && c->last->parity == parity) return;
yading@10 425
yading@10 426 f = c->head;
yading@10 427 f->parity = parity;
yading@10 428 f->buffer = ff_pullup_lock_buffer(b, parity);
yading@10 429 f->flags = 0;
yading@10 430 f->breaks = 0;
yading@10 431 f->affinity = 0;
yading@10 432
yading@10 433 compute_metric(c, f, parity, f->prev->prev, parity, c->diff, f->diffs);
yading@10 434 compute_metric(c, parity?f->prev:f, 0, parity?f:f->prev, 1, c->comb, f->comb);
yading@10 435 compute_metric(c, f, parity, f, -1, c->var, f->var);
yading@10 436
yading@10 437 /* Advance the circular list */
yading@10 438 if (!c->first) c->first = c->head;
yading@10 439 c->last = c->head;
yading@10 440 c->head = c->head->next;
yading@10 441 }
yading@10 442
yading@10 443 void ff_pullup_flush_fields(struct pullup_context *c)
yading@10 444 {
yading@10 445 struct pullup_field *f;
yading@10 446
yading@10 447 for (f = c->first; f && f != c->head; f = f->next) {
yading@10 448 ff_pullup_release_buffer(f->buffer, f->parity);
yading@10 449 f->buffer = 0;
yading@10 450 }
yading@10 451 c->first = c->last = 0;
yading@10 452 }
yading@10 453
yading@10 454
yading@10 455
yading@10 456
yading@10 457
yading@10 458
yading@10 459
yading@10 460
/* Bits of a field's `flags`: which analysis results were already computed. */
#define F_HAVE_BREAKS   (1 << 0)
#define F_HAVE_AFFINITY (1 << 1)

/* Bits of a field's `breaks`: a break on the left / right side of the field. */
#define BREAK_LEFT  (1 << 0)
#define BREAK_RIGHT (1 << 1)
yading@10 467
yading@10 468
yading@10 469
yading@10 470
yading@10 471 static int queue_length(struct pullup_field *begin, struct pullup_field *end)
yading@10 472 {
yading@10 473 int count = 1;
yading@10 474 struct pullup_field *f;
yading@10 475
yading@10 476 if (!begin || !end) return 0;
yading@10 477 for (f = begin; f != end; f = f->next) count++;
yading@10 478 return count;
yading@10 479 }
yading@10 480
yading@10 481 static int find_first_break(struct pullup_field *f, int max)
yading@10 482 {
yading@10 483 int i;
yading@10 484 for (i = 0; i < max; i++) {
yading@10 485 if (f->breaks & BREAK_RIGHT || f->next->breaks & BREAK_LEFT)
yading@10 486 return i+1;
yading@10 487 f = f->next;
yading@10 488 }
yading@10 489 return 0;
yading@10 490 }
yading@10 491
yading@10 492 static void compute_breaks(struct pullup_context *c, struct pullup_field *f0)
yading@10 493 {
yading@10 494 int i;
yading@10 495 struct pullup_field *f1 = f0->next;
yading@10 496 struct pullup_field *f2 = f1->next;
yading@10 497 struct pullup_field *f3 = f2->next;
yading@10 498 int l, max_l=0, max_r=0;
yading@10 499 //struct pullup_field *ff;
yading@10 500 //for (i=0, ff=c->first; ff != f0; i++, ff=ff->next);
yading@10 501
yading@10 502 if (f0->flags & F_HAVE_BREAKS) return;
yading@10 503 //printf("\n%d: ", i);
yading@10 504 f0->flags |= F_HAVE_BREAKS;
yading@10 505
yading@10 506 /* Special case when fields are 100% identical */
yading@10 507 if (f0->buffer == f2->buffer && f1->buffer != f3->buffer) {
yading@10 508 f2->breaks |= BREAK_RIGHT;
yading@10 509 return;
yading@10 510 }
yading@10 511 if (f0->buffer != f2->buffer && f1->buffer == f3->buffer) {
yading@10 512 f1->breaks |= BREAK_LEFT;
yading@10 513 return;
yading@10 514 }
yading@10 515
yading@10 516 for (i = 0; i < c->metric_len; i++) {
yading@10 517 l = f2->diffs[i] - f3->diffs[i];
yading@10 518 if (l > max_l) max_l = l;
yading@10 519 if (-l > max_r) max_r = -l;
yading@10 520 }
yading@10 521 /* Don't get tripped up when differences are mostly quant error */
yading@10 522 //printf("%d %d\n", max_l, max_r);
yading@10 523 if (max_l + max_r < 128) return;
yading@10 524 if (max_l > 4*max_r) f1->breaks |= BREAK_LEFT;
yading@10 525 if (max_r > 4*max_l) f2->breaks |= BREAK_RIGHT;
yading@10 526 }
yading@10 527
yading@10 528 static void compute_affinity(struct pullup_context *c, struct pullup_field *f)
yading@10 529 {
yading@10 530 int i;
yading@10 531 int max_l=0, max_r=0, l;
yading@10 532 if (f->flags & F_HAVE_AFFINITY) return;
yading@10 533 f->flags |= F_HAVE_AFFINITY;
yading@10 534 if (f->buffer == f->next->next->buffer) {
yading@10 535 f->affinity = 1;
yading@10 536 f->next->affinity = 0;
yading@10 537 f->next->next->affinity = -1;
yading@10 538 f->next->flags |= F_HAVE_AFFINITY;
yading@10 539 f->next->next->flags |= F_HAVE_AFFINITY;
yading@10 540 return;
yading@10 541 }
yading@10 542 if (1) {
yading@10 543 for (i = 0; i < c->metric_len; i++) {
yading@10 544 int lv = f->prev->var[i];
yading@10 545 int rv = f->next->var[i];
yading@10 546 int v = f->var[i];
yading@10 547 int lc = f->comb[i] - (v+lv) + ABS(v-lv);
yading@10 548 int rc = f->next->comb[i] - (v+rv) + ABS(v-rv);
yading@10 549 lc = lc>0 ? lc : 0;
yading@10 550 rc = rc>0 ? rc : 0;
yading@10 551 l = lc - rc;
yading@10 552 if (l > max_l) max_l = l;
yading@10 553 if (-l > max_r) max_r = -l;
yading@10 554 }
yading@10 555 if (max_l + max_r < 64) return;
yading@10 556 if (max_r > 6*max_l) f->affinity = -1;
yading@10 557 else if (max_l > 6*max_r) f->affinity = 1;
yading@10 558 } else {
yading@10 559 for (i = 0; i < c->metric_len; i++) {
yading@10 560 l = f->comb[i] - f->next->comb[i];
yading@10 561 if (l > max_l) max_l = l;
yading@10 562 if (-l > max_r) max_r = -l;
yading@10 563 }
yading@10 564 if (max_l + max_r < 64) return;
yading@10 565 if (max_r > 2*max_l) f->affinity = -1;
yading@10 566 else if (max_l > 2*max_r) f->affinity = 1;
yading@10 567 }
yading@10 568 }
yading@10 569
yading@10 570 static void foo(struct pullup_context *c)
yading@10 571 {
yading@10 572 struct pullup_field *f = c->first;
yading@10 573 int i, n = queue_length(f, c->last);
yading@10 574 for (i = 0; i < n-1; i++) {
yading@10 575 if (i < n-3) compute_breaks(c, f);
yading@10 576 compute_affinity(c, f);
yading@10 577 f = f->next;
yading@10 578 }
yading@10 579 }
yading@10 580
yading@10 581 static int decide_frame_length(struct pullup_context *c)
yading@10 582 {
yading@10 583 struct pullup_field *f0 = c->first;
yading@10 584 struct pullup_field *f1 = f0->next;
yading@10 585 struct pullup_field *f2 = f1->next;
yading@10 586 int l;
yading@10 587
yading@10 588 if (queue_length(c->first, c->last) < 4) return 0;
yading@10 589 foo(c);
yading@10 590
yading@10 591 if (f0->affinity == -1) return 1;
yading@10 592
yading@10 593 l = find_first_break(f0, 3);
yading@10 594 if (l == 1 && c->strict_breaks < 0) l = 0;
yading@10 595
yading@10 596 switch (l) {
yading@10 597 case 1:
yading@10 598 if (c->strict_breaks < 1 && f0->affinity == 1 && f1->affinity == -1)
yading@10 599 return 2;
yading@10 600 else return 1;
yading@10 601 case 2:
yading@10 602 /* FIXME: strictly speaking, f0->prev is no longer valid... :) */
yading@10 603 if (c->strict_pairs
yading@10 604 && (f0->prev->breaks & BREAK_RIGHT) && (f2->breaks & BREAK_LEFT)
yading@10 605 && (f0->affinity != 1 || f1->affinity != -1) )
yading@10 606 return 1;
yading@10 607 if (f1->affinity == 1) return 1;
yading@10 608 else return 2;
yading@10 609 case 3:
yading@10 610 if (f2->affinity == 1) return 2;
yading@10 611 else return 3;
yading@10 612 default:
yading@10 613 /* 9 possibilities covered before switch */
yading@10 614 if (f1->affinity == 1) return 1; /* covers 6 */
yading@10 615 else if (f1->affinity == -1) return 2; /* covers 6 */
yading@10 616 else if (f2->affinity == -1) { /* covers 2 */
yading@10 617 if (f0->affinity == 1) return 3;
yading@10 618 else return 1;
yading@10 619 }
yading@10 620 else return 2; /* the remaining 6 */
yading@10 621 }
yading@10 622 }
yading@10 623
yading@10 624
yading@10 625 static void print_aff_and_breaks(struct pullup_context *c, struct pullup_field *f)
yading@10 626 {
yading@10 627 int i;
yading@10 628 struct pullup_field *f0 = f;
yading@10 629 const char aff_l[] = "+..", aff_r[] = "..+";
yading@10 630 printf("\naffinity: ");
yading@10 631 for (i = 0; i < 4; i++) {
yading@10 632 printf("%c%d%c", aff_l[1+f->affinity], i, aff_r[1+f->affinity]);
yading@10 633 f = f->next;
yading@10 634 }
yading@10 635 f = f0;
yading@10 636 printf("\nbreaks: ");
yading@10 637 for (i=0; i<4; i++) {
yading@10 638 printf("%c%d%c", f->breaks & BREAK_LEFT ? '|' : '.', i, f->breaks & BREAK_RIGHT ? '|' : '.');
yading@10 639 f = f->next;
yading@10 640 }
yading@10 641 printf("\n");
yading@10 642 }
yading@10 643
yading@10 644
yading@10 645
yading@10 646
yading@10 647
yading@10 648 struct pullup_frame *ff_pullup_get_frame(struct pullup_context *c)
yading@10 649 {
yading@10 650 int i;
yading@10 651 struct pullup_frame *fr = c->frame;
yading@10 652 int n = decide_frame_length(c);
yading@10 653 int aff = c->first->next->affinity;
yading@10 654
yading@10 655 if (!n) return 0;
yading@10 656 if (fr->lock) return 0;
yading@10 657
yading@10 658 if (c->verbose) {
yading@10 659 print_aff_and_breaks(c, c->first);
yading@10 660 printf("duration: %d \n", n);
yading@10 661 }
yading@10 662
yading@10 663 fr->lock++;
yading@10 664 fr->length = n;
yading@10 665 fr->parity = c->first->parity;
yading@10 666 fr->buffer = 0;
yading@10 667 for (i = 0; i < n; i++) {
yading@10 668 /* We cheat and steal the buffer without release+relock */
yading@10 669 fr->ifields[i] = c->first->buffer;
yading@10 670 c->first->buffer = 0;
yading@10 671 c->first = c->first->next;
yading@10 672 }
yading@10 673
yading@10 674 if (n == 1) {
yading@10 675 fr->ofields[fr->parity] = fr->ifields[0];
yading@10 676 fr->ofields[fr->parity^1] = 0;
yading@10 677 } else if (n == 2) {
yading@10 678 fr->ofields[fr->parity] = fr->ifields[0];
yading@10 679 fr->ofields[fr->parity^1] = fr->ifields[1];
yading@10 680 } else if (n == 3) {
yading@10 681 if (aff == 0)
yading@10 682 aff = (fr->ifields[0] == fr->ifields[1]) ? -1 : 1;
yading@10 683 /* else if (c->verbose) printf("forced aff: %d \n", aff); */
yading@10 684 fr->ofields[fr->parity] = fr->ifields[1+aff];
yading@10 685 fr->ofields[fr->parity^1] = fr->ifields[1];
yading@10 686 }
yading@10 687 ff_pullup_lock_buffer(fr->ofields[0], 0);
yading@10 688 ff_pullup_lock_buffer(fr->ofields[1], 1);
yading@10 689
yading@10 690 if (fr->ofields[0] == fr->ofields[1]) {
yading@10 691 fr->buffer = fr->ofields[0];
yading@10 692 ff_pullup_lock_buffer(fr->buffer, 2);
yading@10 693 return fr;
yading@10 694 }
yading@10 695 return fr;
yading@10 696 }
yading@10 697
yading@10 698 static void copy_field(struct pullup_context *c, struct pullup_buffer *dest,
yading@10 699 struct pullup_buffer *src, int parity)
yading@10 700 {
yading@10 701 int i, j;
yading@10 702 unsigned char *d, *s;
yading@10 703 for (i = 0; i < c->nplanes; i++) {
yading@10 704 s = src->planes[i] + parity*c->stride[i];
yading@10 705 d = dest->planes[i] + parity*c->stride[i];
yading@10 706 for (j = c->h[i]>>1; j; j--) {
yading@10 707 memcpy(d, s, c->stride[i]);
yading@10 708 s += c->stride[i]<<1;
yading@10 709 d += c->stride[i]<<1;
yading@10 710 }
yading@10 711 }
yading@10 712 }
yading@10 713
yading@10 714 void ff_pullup_pack_frame(struct pullup_context *c, struct pullup_frame *fr)
yading@10 715 {
yading@10 716 int i;
yading@10 717 if (fr->buffer) return;
yading@10 718 if (fr->length < 2) return; /* FIXME: deal with this */
yading@10 719 for (i = 0; i < 2; i++)
yading@10 720 {
yading@10 721 if (fr->ofields[i]->lock[i^1]) continue;
yading@10 722 fr->buffer = fr->ofields[i];
yading@10 723 ff_pullup_lock_buffer(fr->buffer, 2);
yading@10 724 copy_field(c, fr->buffer, fr->ofields[i^1], i^1);
yading@10 725 return;
yading@10 726 }
yading@10 727 fr->buffer = ff_pullup_get_buffer(c, 2);
yading@10 728 copy_field(c, fr->buffer, fr->ofields[0], 0);
yading@10 729 copy_field(c, fr->buffer, fr->ofields[1], 1);
yading@10 730 }
yading@10 731
yading@10 732 void ff_pullup_release_frame(struct pullup_frame *fr)
yading@10 733 {
yading@10 734 int i;
yading@10 735 for (i = 0; i < fr->length; i++)
yading@10 736 ff_pullup_release_buffer(fr->ifields[i], fr->parity ^ (i&1));
yading@10 737 ff_pullup_release_buffer(fr->ofields[0], 0);
yading@10 738 ff_pullup_release_buffer(fr->ofields[1], 1);
yading@10 739 if (fr->buffer) ff_pullup_release_buffer(fr->buffer, 2);
yading@10 740 fr->lock--;
yading@10 741 }
yading@10 742
yading@10 743
yading@10 744
yading@10 745
yading@10 746
yading@10 747
yading@10 748 struct pullup_context *ff_pullup_alloc_context(void)
yading@10 749 {
yading@10 750 struct pullup_context *c;
yading@10 751
yading@10 752 c = calloc(1, sizeof(struct pullup_context));
yading@10 753
yading@10 754 return c;
yading@10 755 }
yading@10 756
yading@10 757 void ff_pullup_preinit_context(struct pullup_context *c)
yading@10 758 {
yading@10 759 c->bpp = calloc(c->nplanes, sizeof(int));
yading@10 760 c->w = calloc(c->nplanes, sizeof(int));
yading@10 761 c->h = calloc(c->nplanes, sizeof(int));
yading@10 762 c->stride = calloc(c->nplanes, sizeof(int));
yading@10 763 c->background = calloc(c->nplanes, sizeof(int));
yading@10 764 }
yading@10 765
yading@10 766 void ff_pullup_init_context(struct pullup_context *c)
yading@10 767 {
yading@10 768 int mp = c->metric_plane;
yading@10 769 if (c->nbuffers < 10) c->nbuffers = 10;
yading@10 770 c->buffers = calloc(c->nbuffers, sizeof (struct pullup_buffer));
yading@10 771
yading@10 772 c->metric_w = (c->w[mp] - ((c->junk_left + c->junk_right) << 3)) >> 3;
yading@10 773 c->metric_h = (c->h[mp] - ((c->junk_top + c->junk_bottom) << 1)) >> 3;
yading@10 774 c->metric_offset = c->junk_left*c->bpp[mp] + (c->junk_top<<1)*c->stride[mp];
yading@10 775 c->metric_len = c->metric_w * c->metric_h;
yading@10 776
yading@10 777 c->head = make_field_queue(c, 8);
yading@10 778
yading@10 779 c->frame = calloc(1, sizeof (struct pullup_frame));
yading@10 780 c->frame->ifields = calloc(3, sizeof (struct pullup_buffer *));
yading@10 781
yading@10 782 switch(c->format) {
yading@10 783 case PULLUP_FMT_Y:
yading@10 784 c->diff = diff_y;
yading@10 785 c->comb = licomb_y;
yading@10 786 c->var = var_y;
yading@10 787 #if ARCH_X86
yading@10 788 #if HAVE_MMX
yading@10 789 if (c->cpu & PULLUP_CPU_MMX) {
yading@10 790 c->diff = diff_y_mmx;
yading@10 791 c->comb = licomb_y_mmx;
yading@10 792 c->var = var_y_mmx;
yading@10 793 }
yading@10 794 #endif
yading@10 795 #endif
yading@10 796 /* c->comb = qpcomb_y; */
yading@10 797 break;
yading@10 798 #if 0
yading@10 799 case PULLUP_FMT_YUY2:
yading@10 800 c->diff = diff_yuy2;
yading@10 801 break;
yading@10 802 case PULLUP_FMT_RGB32:
yading@10 803 c->diff = diff_rgb32;
yading@10 804 break;
yading@10 805 #endif
yading@10 806 }
yading@10 807 }
yading@10 808
yading@10 809 void ff_pullup_free_context(struct pullup_context *c)
yading@10 810 {
yading@10 811 struct pullup_field *f;
yading@10 812 free(c->buffers);
yading@10 813 f = c->head;
yading@10 814 do {
yading@10 815 if (!f) break;
yading@10 816 free(f->diffs);
yading@10 817 free(f->comb);
yading@10 818 f = f->next;
yading@10 819 free(f->prev);
yading@10 820 } while (f != c->head);
yading@10 821 free(c->frame);
yading@10 822 free(c);
yading@10 823 }