yading@10
|
1 /*
|
yading@10
|
2 * This file is part of MPlayer.
|
yading@10
|
3 *
|
yading@10
|
4 * MPlayer is free software; you can redistribute it and/or modify
|
yading@10
|
5 * it under the terms of the GNU General Public License as published by
|
yading@10
|
6 * the Free Software Foundation; either version 2 of the License, or
|
yading@10
|
7 * (at your option) any later version.
|
yading@10
|
8 *
|
yading@10
|
9 * MPlayer is distributed in the hope that it will be useful,
|
yading@10
|
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
|
yading@10
|
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
yading@10
|
12 * GNU General Public License for more details.
|
yading@10
|
13 *
|
yading@10
|
14 * You should have received a copy of the GNU General Public License along
|
yading@10
|
15 * with MPlayer; if not, write to the Free Software Foundation, Inc.,
|
yading@10
|
16 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
yading@10
|
17 */
|
yading@10
|
18
|
yading@10
|
19 #include <stdio.h>
|
yading@10
|
20 #include <stdlib.h>
|
yading@10
|
21 #include <string.h>
|
yading@10
|
22
|
yading@10
|
23 #include "libavutil/x86/asm.h"
|
yading@10
|
24 #include "config.h"
|
yading@10
|
25 #include "pullup.h"
|
yading@10
|
26
|
yading@10
|
27
|
yading@10
|
28
|
yading@10
|
29 #if ARCH_X86
|
yading@10
|
30 #if HAVE_MMX
|
yading@10
|
31 static int diff_y_mmx(unsigned char *a, unsigned char *b, int s)
|
yading@10
|
32 {
|
yading@10
|
33 int ret;
|
yading@10
|
34 __asm__ volatile (
|
yading@10
|
35 "movl $4, %%ecx \n\t"
|
yading@10
|
36 "pxor %%mm4, %%mm4 \n\t"
|
yading@10
|
37 "pxor %%mm7, %%mm7 \n\t"
|
yading@10
|
38
|
yading@10
|
39 "1: \n\t"
|
yading@10
|
40
|
yading@10
|
41 "movq (%%"REG_S"), %%mm0 \n\t"
|
yading@10
|
42 "movq (%%"REG_S"), %%mm2 \n\t"
|
yading@10
|
43 "add %%"REG_a", %%"REG_S" \n\t"
|
yading@10
|
44 "movq (%%"REG_D"), %%mm1 \n\t"
|
yading@10
|
45 "add %%"REG_a", %%"REG_D" \n\t"
|
yading@10
|
46 "psubusb %%mm1, %%mm2 \n\t"
|
yading@10
|
47 "psubusb %%mm0, %%mm1 \n\t"
|
yading@10
|
48 "movq %%mm2, %%mm0 \n\t"
|
yading@10
|
49 "movq %%mm1, %%mm3 \n\t"
|
yading@10
|
50 "punpcklbw %%mm7, %%mm0 \n\t"
|
yading@10
|
51 "punpcklbw %%mm7, %%mm1 \n\t"
|
yading@10
|
52 "punpckhbw %%mm7, %%mm2 \n\t"
|
yading@10
|
53 "punpckhbw %%mm7, %%mm3 \n\t"
|
yading@10
|
54 "paddw %%mm0, %%mm4 \n\t"
|
yading@10
|
55 "paddw %%mm1, %%mm4 \n\t"
|
yading@10
|
56 "paddw %%mm2, %%mm4 \n\t"
|
yading@10
|
57 "paddw %%mm3, %%mm4 \n\t"
|
yading@10
|
58
|
yading@10
|
59 "decl %%ecx \n\t"
|
yading@10
|
60 "jnz 1b \n\t"
|
yading@10
|
61
|
yading@10
|
62 "movq %%mm4, %%mm3 \n\t"
|
yading@10
|
63 "punpcklwd %%mm7, %%mm4 \n\t"
|
yading@10
|
64 "punpckhwd %%mm7, %%mm3 \n\t"
|
yading@10
|
65 "paddd %%mm4, %%mm3 \n\t"
|
yading@10
|
66 "movd %%mm3, %%eax \n\t"
|
yading@10
|
67 "psrlq $32, %%mm3 \n\t"
|
yading@10
|
68 "movd %%mm3, %%edx \n\t"
|
yading@10
|
69 "addl %%edx, %%eax \n\t"
|
yading@10
|
70 "emms \n\t"
|
yading@10
|
71 : "=a" (ret)
|
yading@10
|
72 : "S" (a), "D" (b), "a" (s)
|
yading@10
|
73 : "%ecx", "%edx"
|
yading@10
|
74 );
|
yading@10
|
75 return ret;
|
yading@10
|
76 }
|
yading@10
|
77
|
yading@10
|
78 static int licomb_y_mmx(unsigned char *a, unsigned char *b, int s)
|
yading@10
|
79 {
|
yading@10
|
80 int ret;
|
yading@10
|
81 __asm__ volatile (
|
yading@10
|
82 "movl $4, %%ecx \n\t"
|
yading@10
|
83 "pxor %%mm6, %%mm6 \n\t"
|
yading@10
|
84 "pxor %%mm7, %%mm7 \n\t"
|
yading@10
|
85 "sub %%"REG_a", %%"REG_D" \n\t"
|
yading@10
|
86
|
yading@10
|
87 "2: \n\t"
|
yading@10
|
88
|
yading@10
|
89 "movq (%%"REG_D"), %%mm0 \n\t"
|
yading@10
|
90 "movq (%%"REG_D"), %%mm1 \n\t"
|
yading@10
|
91 "punpcklbw %%mm7, %%mm0 \n\t"
|
yading@10
|
92 "movq (%%"REG_D",%%"REG_a"), %%mm2 \n\t"
|
yading@10
|
93 "punpcklbw %%mm7, %%mm1 \n\t"
|
yading@10
|
94 "punpcklbw %%mm7, %%mm2 \n\t"
|
yading@10
|
95 "paddw %%mm0, %%mm0 \n\t"
|
yading@10
|
96 "paddw %%mm2, %%mm1 \n\t"
|
yading@10
|
97 "movq %%mm0, %%mm2 \n\t"
|
yading@10
|
98 "psubusw %%mm1, %%mm0 \n\t"
|
yading@10
|
99 "psubusw %%mm2, %%mm1 \n\t"
|
yading@10
|
100 "paddw %%mm0, %%mm6 \n\t"
|
yading@10
|
101 "paddw %%mm1, %%mm6 \n\t"
|
yading@10
|
102
|
yading@10
|
103 "movq (%%"REG_S"), %%mm0 \n\t"
|
yading@10
|
104 "movq (%%"REG_D"), %%mm1 \n\t"
|
yading@10
|
105 "punpckhbw %%mm7, %%mm0 \n\t"
|
yading@10
|
106 "movq (%%"REG_D",%%"REG_a"), %%mm2 \n\t"
|
yading@10
|
107 "punpckhbw %%mm7, %%mm1 \n\t"
|
yading@10
|
108 "punpckhbw %%mm7, %%mm2 \n\t"
|
yading@10
|
109 "paddw %%mm0, %%mm0 \n\t"
|
yading@10
|
110 "paddw %%mm2, %%mm1 \n\t"
|
yading@10
|
111 "movq %%mm0, %%mm2 \n\t"
|
yading@10
|
112 "psubusw %%mm1, %%mm0 \n\t"
|
yading@10
|
113 "psubusw %%mm2, %%mm1 \n\t"
|
yading@10
|
114 "paddw %%mm0, %%mm6 \n\t"
|
yading@10
|
115 "paddw %%mm1, %%mm6 \n\t"
|
yading@10
|
116
|
yading@10
|
117 "movq (%%"REG_D",%%"REG_a"), %%mm0 \n\t"
|
yading@10
|
118 "movq (%%"REG_S"), %%mm1 \n\t"
|
yading@10
|
119 "punpcklbw %%mm7, %%mm0 \n\t"
|
yading@10
|
120 "movq (%%"REG_S",%%"REG_a"), %%mm2 \n\t"
|
yading@10
|
121 "punpcklbw %%mm7, %%mm1 \n\t"
|
yading@10
|
122 "punpcklbw %%mm7, %%mm2 \n\t"
|
yading@10
|
123 "paddw %%mm0, %%mm0 \n\t"
|
yading@10
|
124 "paddw %%mm2, %%mm1 \n\t"
|
yading@10
|
125 "movq %%mm0, %%mm2 \n\t"
|
yading@10
|
126 "psubusw %%mm1, %%mm0 \n\t"
|
yading@10
|
127 "psubusw %%mm2, %%mm1 \n\t"
|
yading@10
|
128 "paddw %%mm0, %%mm6 \n\t"
|
yading@10
|
129 "paddw %%mm1, %%mm6 \n\t"
|
yading@10
|
130
|
yading@10
|
131 "movq (%%"REG_D",%%"REG_a"), %%mm0 \n\t"
|
yading@10
|
132 "movq (%%"REG_S"), %%mm1 \n\t"
|
yading@10
|
133 "punpckhbw %%mm7, %%mm0 \n\t"
|
yading@10
|
134 "movq (%%"REG_S",%%"REG_a"), %%mm2 \n\t"
|
yading@10
|
135 "punpckhbw %%mm7, %%mm1 \n\t"
|
yading@10
|
136 "punpckhbw %%mm7, %%mm2 \n\t"
|
yading@10
|
137 "paddw %%mm0, %%mm0 \n\t"
|
yading@10
|
138 "paddw %%mm2, %%mm1 \n\t"
|
yading@10
|
139 "movq %%mm0, %%mm2 \n\t"
|
yading@10
|
140 "psubusw %%mm1, %%mm0 \n\t"
|
yading@10
|
141 "psubusw %%mm2, %%mm1 \n\t"
|
yading@10
|
142 "paddw %%mm0, %%mm6 \n\t"
|
yading@10
|
143 "paddw %%mm1, %%mm6 \n\t"
|
yading@10
|
144
|
yading@10
|
145 "add %%"REG_a", %%"REG_S" \n\t"
|
yading@10
|
146 "add %%"REG_a", %%"REG_D" \n\t"
|
yading@10
|
147 "decl %%ecx \n\t"
|
yading@10
|
148 "jnz 2b \n\t"
|
yading@10
|
149
|
yading@10
|
150 "movq %%mm6, %%mm5 \n\t"
|
yading@10
|
151 "punpcklwd %%mm7, %%mm6 \n\t"
|
yading@10
|
152 "punpckhwd %%mm7, %%mm5 \n\t"
|
yading@10
|
153 "paddd %%mm6, %%mm5 \n\t"
|
yading@10
|
154 "movd %%mm5, %%eax \n\t"
|
yading@10
|
155 "psrlq $32, %%mm5 \n\t"
|
yading@10
|
156 "movd %%mm5, %%edx \n\t"
|
yading@10
|
157 "addl %%edx, %%eax \n\t"
|
yading@10
|
158
|
yading@10
|
159 "emms \n\t"
|
yading@10
|
160 : "=a" (ret)
|
yading@10
|
161 : "S" (a), "D" (b), "a" (s)
|
yading@10
|
162 : "%ecx", "%edx"
|
yading@10
|
163 );
|
yading@10
|
164 return ret;
|
yading@10
|
165 }
|
yading@10
|
166
|
yading@10
|
167 static int var_y_mmx(unsigned char *a, unsigned char *b, int s)
|
yading@10
|
168 {
|
yading@10
|
169 int ret;
|
yading@10
|
170 __asm__ volatile (
|
yading@10
|
171 "movl $3, %%ecx \n\t"
|
yading@10
|
172 "pxor %%mm4, %%mm4 \n\t"
|
yading@10
|
173 "pxor %%mm7, %%mm7 \n\t"
|
yading@10
|
174
|
yading@10
|
175 "1: \n\t"
|
yading@10
|
176
|
yading@10
|
177 "movq (%%"REG_S"), %%mm0 \n\t"
|
yading@10
|
178 "movq (%%"REG_S"), %%mm2 \n\t"
|
yading@10
|
179 "movq (%%"REG_S",%%"REG_a"), %%mm1 \n\t"
|
yading@10
|
180 "add %%"REG_a", %%"REG_S" \n\t"
|
yading@10
|
181 "psubusb %%mm1, %%mm2 \n\t"
|
yading@10
|
182 "psubusb %%mm0, %%mm1 \n\t"
|
yading@10
|
183 "movq %%mm2, %%mm0 \n\t"
|
yading@10
|
184 "movq %%mm1, %%mm3 \n\t"
|
yading@10
|
185 "punpcklbw %%mm7, %%mm0 \n\t"
|
yading@10
|
186 "punpcklbw %%mm7, %%mm1 \n\t"
|
yading@10
|
187 "punpckhbw %%mm7, %%mm2 \n\t"
|
yading@10
|
188 "punpckhbw %%mm7, %%mm3 \n\t"
|
yading@10
|
189 "paddw %%mm0, %%mm4 \n\t"
|
yading@10
|
190 "paddw %%mm1, %%mm4 \n\t"
|
yading@10
|
191 "paddw %%mm2, %%mm4 \n\t"
|
yading@10
|
192 "paddw %%mm3, %%mm4 \n\t"
|
yading@10
|
193
|
yading@10
|
194 "decl %%ecx \n\t"
|
yading@10
|
195 "jnz 1b \n\t"
|
yading@10
|
196
|
yading@10
|
197 "movq %%mm4, %%mm3 \n\t"
|
yading@10
|
198 "punpcklwd %%mm7, %%mm4 \n\t"
|
yading@10
|
199 "punpckhwd %%mm7, %%mm3 \n\t"
|
yading@10
|
200 "paddd %%mm4, %%mm3 \n\t"
|
yading@10
|
201 "movd %%mm3, %%eax \n\t"
|
yading@10
|
202 "psrlq $32, %%mm3 \n\t"
|
yading@10
|
203 "movd %%mm3, %%edx \n\t"
|
yading@10
|
204 "addl %%edx, %%eax \n\t"
|
yading@10
|
205 "emms \n\t"
|
yading@10
|
206 : "=a" (ret)
|
yading@10
|
207 : "S" (a), "a" (s)
|
yading@10
|
208 : "%ecx", "%edx"
|
yading@10
|
209 );
|
yading@10
|
210 return 4*ret;
|
yading@10
|
211 }
|
yading@10
|
212 #endif
|
yading@10
|
213 #endif
|
yading@10
|
214
|
yading@10
|
/* Absolute value of an int expression. The argument is evaluated more than
 * once, so it must be free of side effects. Written as a comparison so it
 * does not depend on the width of int or on how negative values shift. */
#define ABS(a) ((a) < 0 ? -(a) : (a))
|
yading@10
|
216
|
yading@10
|
/**
 * Sum of absolute byte differences between two blocks that are 8 bytes wide
 * and 4 rows tall.
 *
 * @param a  first row of the block in the first image
 * @param b  first row of the block in the second image
 * @param s  distance in bytes between consecutive rows
 * @return   sum of |a - b| over the 32 byte pairs
 */
static int diff_y(unsigned char *a, unsigned char *b, int s)
{
    int row, col, sum = 0;

    for (row = 0; row < 4; row++) {
        for (col = 0; col < 8; col++) {
            int d = a[col] - b[col];
            sum += d < 0 ? -d : d;
        }
        a += s;
        b += s;
    }
    return sum;
}
|
yading@10
|
226
|
yading@10
|
/**
 * Comb metric over a block 8 bytes wide and 4 rows tall.
 *
 * For every pixel it accumulates
 *   |2*a[j] - b[j-s] - b[j]|  +  |2*b[j] - a[j] - a[j+s]|
 * so it reads one row above b and one row below the last row of a.
 *
 * @param a  first row of the block in one field
 * @param b  first row of the block in the other field
 * @param s  distance in bytes between consecutive rows of a field
 * @return   accumulated comb metric
 */
static int licomb_y(unsigned char *a, unsigned char *b, int s)
{
    int row, col, sum = 0;

    for (row = 0; row < 4; row++) {
        for (col = 0; col < 8; col++) {
            int above = 2 * a[col] - b[col - s] - b[col];
            int below = 2 * b[col] - a[col] - a[col + s];

            sum += (above < 0 ? -above : above)
                 + (below < 0 ? -below : below);
        }
        a += s;
        b += s;
    }
    return sum;
}
|
yading@10
|
238
|
yading@10
|
#if 0
/* Disabled experiments; nothing in this region is compiled. */

/* Alternative comb metric: weights a[j], b[j-s], a[j+s], b[j] by 1, -3, 3, -1
 * and sums the absolute value over an 8x4 block. */
static int qpcomb_y(unsigned char *a, unsigned char *b, int s)
{
    int row, col, sum = 0;

    for (row = 0; row < 4; row++) {
        for (col = 0; col < 8; col++)
            sum += ABS(a[col] - 3*b[col-s] + 3*a[col+s] - b[col]);
        a += s;
        b += s;
    }
    return sum;
}

/* Runs the C and MMX comb metrics on the same block, reports any mismatch on
 * stdout and returns the MMX result. */
static int licomb_y_test(unsigned char *a, unsigned char *b, int s)
{
    const int ref = licomb_y(a,b,s);
    const int mmx = licomb_y_mmx(a,b,s);

    if (ref != mmx)
        printf("%d != %d\n", ref, mmx);
    return mmx;
}
#endif
|
yading@10
|
259
|
yading@10
|
/**
 * Vertical variation inside one field block: sums |a[j] - a[j+s]| over
 * 8 columns and 3 consecutive row pairs.
 *
 * @param a  first row of the block
 * @param b  unused; present so the function matches the metric signature
 * @param s  distance in bytes between consecutive rows
 * @return   4 * the sum, so the scale matches the comb metric
 */
static int var_y(unsigned char *a, unsigned char *b, int s)
{
    int pair, col, sum = 0;

    (void)b;
    for (pair = 0; pair < 3; pair++) {
        const unsigned char *next = a + s;

        for (col = 0; col < 8; col++) {
            int d = a[col] - next[col];
            sum += d < 0 ? -d : d;
        }
        a += s;
    }
    return 4 * sum; /* match comb scaling */
}
|
yading@10
|
271
|
yading@10
|
272
|
yading@10
|
273
|
yading@10
|
274
|
yading@10
|
275
|
yading@10
|
276
|
yading@10
|
277
|
yading@10
|
278
|
yading@10
|
279
|
yading@10
|
280 static void alloc_buffer(struct pullup_context *c, struct pullup_buffer *b)
|
yading@10
|
281 {
|
yading@10
|
282 int i;
|
yading@10
|
283 if (b->planes) return;
|
yading@10
|
284 b->planes = calloc(c->nplanes, sizeof(unsigned char *));
|
yading@10
|
285 for (i = 0; i < c->nplanes; i++) {
|
yading@10
|
286 b->planes[i] = malloc(c->h[i]*c->stride[i]);
|
yading@10
|
287 /* Deal with idiotic 128=0 for chroma: */
|
yading@10
|
288 memset(b->planes[i], c->background[i], c->h[i]*c->stride[i]);
|
yading@10
|
289 }
|
yading@10
|
290 }
|
yading@10
|
291
|
yading@10
|
292 struct pullup_buffer *ff_pullup_lock_buffer(struct pullup_buffer *b, int parity)
|
yading@10
|
293 {
|
yading@10
|
294 if (!b) return 0;
|
yading@10
|
295 if ((parity+1) & 1) b->lock[0]++;
|
yading@10
|
296 if ((parity+1) & 2) b->lock[1]++;
|
yading@10
|
297 return b;
|
yading@10
|
298 }
|
yading@10
|
299
|
yading@10
|
300 void ff_pullup_release_buffer(struct pullup_buffer *b, int parity)
|
yading@10
|
301 {
|
yading@10
|
302 if (!b) return;
|
yading@10
|
303 if ((parity+1) & 1) b->lock[0]--;
|
yading@10
|
304 if ((parity+1) & 2) b->lock[1]--;
|
yading@10
|
305 }
|
yading@10
|
306
|
yading@10
|
307 struct pullup_buffer *ff_pullup_get_buffer(struct pullup_context *c, int parity)
|
yading@10
|
308 {
|
yading@10
|
309 int i;
|
yading@10
|
310
|
yading@10
|
311 /* Try first to get the sister buffer for the previous field */
|
yading@10
|
312 if (parity < 2 && c->last && parity != c->last->parity
|
yading@10
|
313 && !c->last->buffer->lock[parity]) {
|
yading@10
|
314 alloc_buffer(c, c->last->buffer);
|
yading@10
|
315 return ff_pullup_lock_buffer(c->last->buffer, parity);
|
yading@10
|
316 }
|
yading@10
|
317
|
yading@10
|
318 /* Prefer a buffer with both fields open */
|
yading@10
|
319 for (i = 0; i < c->nbuffers; i++) {
|
yading@10
|
320 if (c->buffers[i].lock[0]) continue;
|
yading@10
|
321 if (c->buffers[i].lock[1]) continue;
|
yading@10
|
322 alloc_buffer(c, &c->buffers[i]);
|
yading@10
|
323 return ff_pullup_lock_buffer(&c->buffers[i], parity);
|
yading@10
|
324 }
|
yading@10
|
325
|
yading@10
|
326 if (parity == 2) return 0;
|
yading@10
|
327
|
yading@10
|
328 /* Search for any half-free buffer */
|
yading@10
|
329 for (i = 0; i < c->nbuffers; i++) {
|
yading@10
|
330 if (((parity+1) & 1) && c->buffers[i].lock[0]) continue;
|
yading@10
|
331 if (((parity+1) & 2) && c->buffers[i].lock[1]) continue;
|
yading@10
|
332 alloc_buffer(c, &c->buffers[i]);
|
yading@10
|
333 return ff_pullup_lock_buffer(&c->buffers[i], parity);
|
yading@10
|
334 }
|
yading@10
|
335
|
yading@10
|
336 return 0;
|
yading@10
|
337 }
|
yading@10
|
338
|
yading@10
|
339
|
yading@10
|
340
|
yading@10
|
341
|
yading@10
|
342
|
yading@10
|
343
|
yading@10
|
344 static void compute_metric(struct pullup_context *c,
|
yading@10
|
345 struct pullup_field *fa, int pa,
|
yading@10
|
346 struct pullup_field *fb, int pb,
|
yading@10
|
347 int (*func)(unsigned char *, unsigned char *, int), int *dest)
|
yading@10
|
348 {
|
yading@10
|
349 unsigned char *a, *b;
|
yading@10
|
350 int x, y;
|
yading@10
|
351 int mp = c->metric_plane;
|
yading@10
|
352 int xstep = c->bpp[mp];
|
yading@10
|
353 int ystep = c->stride[mp]<<3;
|
yading@10
|
354 int s = c->stride[mp]<<1; /* field stride */
|
yading@10
|
355 int w = c->metric_w*xstep;
|
yading@10
|
356
|
yading@10
|
357 if (!fa->buffer || !fb->buffer) return;
|
yading@10
|
358
|
yading@10
|
359 /* Shortcut for duplicate fields (e.g. from RFF flag) */
|
yading@10
|
360 if (fa->buffer == fb->buffer && pa == pb) {
|
yading@10
|
361 memset(dest, 0, c->metric_len * sizeof(int));
|
yading@10
|
362 return;
|
yading@10
|
363 }
|
yading@10
|
364
|
yading@10
|
365 a = fa->buffer->planes[mp] + pa * c->stride[mp] + c->metric_offset;
|
yading@10
|
366 b = fb->buffer->planes[mp] + pb * c->stride[mp] + c->metric_offset;
|
yading@10
|
367
|
yading@10
|
368 for (y = c->metric_h; y; y--) {
|
yading@10
|
369 for (x = 0; x < w; x += xstep) {
|
yading@10
|
370 *dest++ = func(a + x, b + x, s);
|
yading@10
|
371 }
|
yading@10
|
372 a += ystep; b += ystep;
|
yading@10
|
373 }
|
yading@10
|
374 }
|
yading@10
|
375
|
yading@10
|
376
|
yading@10
|
377
|
yading@10
|
378
|
yading@10
|
379
|
yading@10
|
380 static void alloc_metrics(struct pullup_context *c, struct pullup_field *f)
|
yading@10
|
381 {
|
yading@10
|
382 f->diffs = calloc(c->metric_len, sizeof(int));
|
yading@10
|
383 f->comb = calloc(c->metric_len, sizeof(int));
|
yading@10
|
384 f->var = calloc(c->metric_len, sizeof(int));
|
yading@10
|
385 /* add more metrics here as needed */
|
yading@10
|
386 }
|
yading@10
|
387
|
yading@10
|
388 static struct pullup_field *make_field_queue(struct pullup_context *c, int len)
|
yading@10
|
389 {
|
yading@10
|
390 struct pullup_field *head, *f;
|
yading@10
|
391 f = head = calloc(1, sizeof(struct pullup_field));
|
yading@10
|
392 alloc_metrics(c, f);
|
yading@10
|
393 for (; len > 0; len--) {
|
yading@10
|
394 f->next = calloc(1, sizeof(struct pullup_field));
|
yading@10
|
395 f->next->prev = f;
|
yading@10
|
396 f = f->next;
|
yading@10
|
397 alloc_metrics(c, f);
|
yading@10
|
398 }
|
yading@10
|
399 f->next = head;
|
yading@10
|
400 head->prev = f;
|
yading@10
|
401 return head;
|
yading@10
|
402 }
|
yading@10
|
403
|
yading@10
|
404 static void check_field_queue(struct pullup_context *c)
|
yading@10
|
405 {
|
yading@10
|
406 if (c->head->next == c->first) {
|
yading@10
|
407 struct pullup_field *f = calloc(1, sizeof(struct pullup_field));
|
yading@10
|
408 alloc_metrics(c, f);
|
yading@10
|
409 f->prev = c->head;
|
yading@10
|
410 f->next = c->first;
|
yading@10
|
411 c->head->next = f;
|
yading@10
|
412 c->first->prev = f;
|
yading@10
|
413 }
|
yading@10
|
414 }
|
yading@10
|
415
|
yading@10
|
416 void ff_pullup_submit_field(struct pullup_context *c, struct pullup_buffer *b, int parity)
|
yading@10
|
417 {
|
yading@10
|
418 struct pullup_field *f;
|
yading@10
|
419
|
yading@10
|
420 /* Grow the circular list if needed */
|
yading@10
|
421 check_field_queue(c);
|
yading@10
|
422
|
yading@10
|
423 /* Cannot have two fields of same parity in a row; drop the new one */
|
yading@10
|
424 if (c->last && c->last->parity == parity) return;
|
yading@10
|
425
|
yading@10
|
426 f = c->head;
|
yading@10
|
427 f->parity = parity;
|
yading@10
|
428 f->buffer = ff_pullup_lock_buffer(b, parity);
|
yading@10
|
429 f->flags = 0;
|
yading@10
|
430 f->breaks = 0;
|
yading@10
|
431 f->affinity = 0;
|
yading@10
|
432
|
yading@10
|
433 compute_metric(c, f, parity, f->prev->prev, parity, c->diff, f->diffs);
|
yading@10
|
434 compute_metric(c, parity?f->prev:f, 0, parity?f:f->prev, 1, c->comb, f->comb);
|
yading@10
|
435 compute_metric(c, f, parity, f, -1, c->var, f->var);
|
yading@10
|
436
|
yading@10
|
437 /* Advance the circular list */
|
yading@10
|
438 if (!c->first) c->first = c->head;
|
yading@10
|
439 c->last = c->head;
|
yading@10
|
440 c->head = c->head->next;
|
yading@10
|
441 }
|
yading@10
|
442
|
yading@10
|
443 void ff_pullup_flush_fields(struct pullup_context *c)
|
yading@10
|
444 {
|
yading@10
|
445 struct pullup_field *f;
|
yading@10
|
446
|
yading@10
|
447 for (f = c->first; f && f != c->head; f = f->next) {
|
yading@10
|
448 ff_pullup_release_buffer(f->buffer, f->parity);
|
yading@10
|
449 f->buffer = 0;
|
yading@10
|
450 }
|
yading@10
|
451 c->first = c->last = 0;
|
yading@10
|
452 }
|
yading@10
|
453
|
yading@10
|
454
|
yading@10
|
455
|
yading@10
|
456
|
yading@10
|
457
|
yading@10
|
458
|
yading@10
|
459
|
yading@10
|
460
|
yading@10
|
/* Bits of pullup_field.flags: which analysis results are already cached. */
enum {
    F_HAVE_BREAKS   = 1,
    F_HAVE_AFFINITY = 2
};

/* Bits of pullup_field.breaks: a break on the left or right side of a field. */
enum {
    BREAK_LEFT  = 1,
    BREAK_RIGHT = 2
};
|
yading@10
|
467
|
yading@10
|
468
|
yading@10
|
469
|
yading@10
|
470
|
yading@10
|
471 static int queue_length(struct pullup_field *begin, struct pullup_field *end)
|
yading@10
|
472 {
|
yading@10
|
473 int count = 1;
|
yading@10
|
474 struct pullup_field *f;
|
yading@10
|
475
|
yading@10
|
476 if (!begin || !end) return 0;
|
yading@10
|
477 for (f = begin; f != end; f = f->next) count++;
|
yading@10
|
478 return count;
|
yading@10
|
479 }
|
yading@10
|
480
|
yading@10
|
481 static int find_first_break(struct pullup_field *f, int max)
|
yading@10
|
482 {
|
yading@10
|
483 int i;
|
yading@10
|
484 for (i = 0; i < max; i++) {
|
yading@10
|
485 if (f->breaks & BREAK_RIGHT || f->next->breaks & BREAK_LEFT)
|
yading@10
|
486 return i+1;
|
yading@10
|
487 f = f->next;
|
yading@10
|
488 }
|
yading@10
|
489 return 0;
|
yading@10
|
490 }
|
yading@10
|
491
|
yading@10
|
492 static void compute_breaks(struct pullup_context *c, struct pullup_field *f0)
|
yading@10
|
493 {
|
yading@10
|
494 int i;
|
yading@10
|
495 struct pullup_field *f1 = f0->next;
|
yading@10
|
496 struct pullup_field *f2 = f1->next;
|
yading@10
|
497 struct pullup_field *f3 = f2->next;
|
yading@10
|
498 int l, max_l=0, max_r=0;
|
yading@10
|
499 //struct pullup_field *ff;
|
yading@10
|
500 //for (i=0, ff=c->first; ff != f0; i++, ff=ff->next);
|
yading@10
|
501
|
yading@10
|
502 if (f0->flags & F_HAVE_BREAKS) return;
|
yading@10
|
503 //printf("\n%d: ", i);
|
yading@10
|
504 f0->flags |= F_HAVE_BREAKS;
|
yading@10
|
505
|
yading@10
|
506 /* Special case when fields are 100% identical */
|
yading@10
|
507 if (f0->buffer == f2->buffer && f1->buffer != f3->buffer) {
|
yading@10
|
508 f2->breaks |= BREAK_RIGHT;
|
yading@10
|
509 return;
|
yading@10
|
510 }
|
yading@10
|
511 if (f0->buffer != f2->buffer && f1->buffer == f3->buffer) {
|
yading@10
|
512 f1->breaks |= BREAK_LEFT;
|
yading@10
|
513 return;
|
yading@10
|
514 }
|
yading@10
|
515
|
yading@10
|
516 for (i = 0; i < c->metric_len; i++) {
|
yading@10
|
517 l = f2->diffs[i] - f3->diffs[i];
|
yading@10
|
518 if (l > max_l) max_l = l;
|
yading@10
|
519 if (-l > max_r) max_r = -l;
|
yading@10
|
520 }
|
yading@10
|
521 /* Don't get tripped up when differences are mostly quant error */
|
yading@10
|
522 //printf("%d %d\n", max_l, max_r);
|
yading@10
|
523 if (max_l + max_r < 128) return;
|
yading@10
|
524 if (max_l > 4*max_r) f1->breaks |= BREAK_LEFT;
|
yading@10
|
525 if (max_r > 4*max_l) f2->breaks |= BREAK_RIGHT;
|
yading@10
|
526 }
|
yading@10
|
527
|
yading@10
|
528 static void compute_affinity(struct pullup_context *c, struct pullup_field *f)
|
yading@10
|
529 {
|
yading@10
|
530 int i;
|
yading@10
|
531 int max_l=0, max_r=0, l;
|
yading@10
|
532 if (f->flags & F_HAVE_AFFINITY) return;
|
yading@10
|
533 f->flags |= F_HAVE_AFFINITY;
|
yading@10
|
534 if (f->buffer == f->next->next->buffer) {
|
yading@10
|
535 f->affinity = 1;
|
yading@10
|
536 f->next->affinity = 0;
|
yading@10
|
537 f->next->next->affinity = -1;
|
yading@10
|
538 f->next->flags |= F_HAVE_AFFINITY;
|
yading@10
|
539 f->next->next->flags |= F_HAVE_AFFINITY;
|
yading@10
|
540 return;
|
yading@10
|
541 }
|
yading@10
|
542 if (1) {
|
yading@10
|
543 for (i = 0; i < c->metric_len; i++) {
|
yading@10
|
544 int lv = f->prev->var[i];
|
yading@10
|
545 int rv = f->next->var[i];
|
yading@10
|
546 int v = f->var[i];
|
yading@10
|
547 int lc = f->comb[i] - (v+lv) + ABS(v-lv);
|
yading@10
|
548 int rc = f->next->comb[i] - (v+rv) + ABS(v-rv);
|
yading@10
|
549 lc = lc>0 ? lc : 0;
|
yading@10
|
550 rc = rc>0 ? rc : 0;
|
yading@10
|
551 l = lc - rc;
|
yading@10
|
552 if (l > max_l) max_l = l;
|
yading@10
|
553 if (-l > max_r) max_r = -l;
|
yading@10
|
554 }
|
yading@10
|
555 if (max_l + max_r < 64) return;
|
yading@10
|
556 if (max_r > 6*max_l) f->affinity = -1;
|
yading@10
|
557 else if (max_l > 6*max_r) f->affinity = 1;
|
yading@10
|
558 } else {
|
yading@10
|
559 for (i = 0; i < c->metric_len; i++) {
|
yading@10
|
560 l = f->comb[i] - f->next->comb[i];
|
yading@10
|
561 if (l > max_l) max_l = l;
|
yading@10
|
562 if (-l > max_r) max_r = -l;
|
yading@10
|
563 }
|
yading@10
|
564 if (max_l + max_r < 64) return;
|
yading@10
|
565 if (max_r > 2*max_l) f->affinity = -1;
|
yading@10
|
566 else if (max_l > 2*max_r) f->affinity = 1;
|
yading@10
|
567 }
|
yading@10
|
568 }
|
yading@10
|
569
|
yading@10
|
570 static void foo(struct pullup_context *c)
|
yading@10
|
571 {
|
yading@10
|
572 struct pullup_field *f = c->first;
|
yading@10
|
573 int i, n = queue_length(f, c->last);
|
yading@10
|
574 for (i = 0; i < n-1; i++) {
|
yading@10
|
575 if (i < n-3) compute_breaks(c, f);
|
yading@10
|
576 compute_affinity(c, f);
|
yading@10
|
577 f = f->next;
|
yading@10
|
578 }
|
yading@10
|
579 }
|
yading@10
|
580
|
yading@10
|
581 static int decide_frame_length(struct pullup_context *c)
|
yading@10
|
582 {
|
yading@10
|
583 struct pullup_field *f0 = c->first;
|
yading@10
|
584 struct pullup_field *f1 = f0->next;
|
yading@10
|
585 struct pullup_field *f2 = f1->next;
|
yading@10
|
586 int l;
|
yading@10
|
587
|
yading@10
|
588 if (queue_length(c->first, c->last) < 4) return 0;
|
yading@10
|
589 foo(c);
|
yading@10
|
590
|
yading@10
|
591 if (f0->affinity == -1) return 1;
|
yading@10
|
592
|
yading@10
|
593 l = find_first_break(f0, 3);
|
yading@10
|
594 if (l == 1 && c->strict_breaks < 0) l = 0;
|
yading@10
|
595
|
yading@10
|
596 switch (l) {
|
yading@10
|
597 case 1:
|
yading@10
|
598 if (c->strict_breaks < 1 && f0->affinity == 1 && f1->affinity == -1)
|
yading@10
|
599 return 2;
|
yading@10
|
600 else return 1;
|
yading@10
|
601 case 2:
|
yading@10
|
602 /* FIXME: strictly speaking, f0->prev is no longer valid... :) */
|
yading@10
|
603 if (c->strict_pairs
|
yading@10
|
604 && (f0->prev->breaks & BREAK_RIGHT) && (f2->breaks & BREAK_LEFT)
|
yading@10
|
605 && (f0->affinity != 1 || f1->affinity != -1) )
|
yading@10
|
606 return 1;
|
yading@10
|
607 if (f1->affinity == 1) return 1;
|
yading@10
|
608 else return 2;
|
yading@10
|
609 case 3:
|
yading@10
|
610 if (f2->affinity == 1) return 2;
|
yading@10
|
611 else return 3;
|
yading@10
|
612 default:
|
yading@10
|
613 /* 9 possibilities covered before switch */
|
yading@10
|
614 if (f1->affinity == 1) return 1; /* covers 6 */
|
yading@10
|
615 else if (f1->affinity == -1) return 2; /* covers 6 */
|
yading@10
|
616 else if (f2->affinity == -1) { /* covers 2 */
|
yading@10
|
617 if (f0->affinity == 1) return 3;
|
yading@10
|
618 else return 1;
|
yading@10
|
619 }
|
yading@10
|
620 else return 2; /* the remaining 6 */
|
yading@10
|
621 }
|
yading@10
|
622 }
|
yading@10
|
623
|
yading@10
|
624
|
yading@10
|
625 static void print_aff_and_breaks(struct pullup_context *c, struct pullup_field *f)
|
yading@10
|
626 {
|
yading@10
|
627 int i;
|
yading@10
|
628 struct pullup_field *f0 = f;
|
yading@10
|
629 const char aff_l[] = "+..", aff_r[] = "..+";
|
yading@10
|
630 printf("\naffinity: ");
|
yading@10
|
631 for (i = 0; i < 4; i++) {
|
yading@10
|
632 printf("%c%d%c", aff_l[1+f->affinity], i, aff_r[1+f->affinity]);
|
yading@10
|
633 f = f->next;
|
yading@10
|
634 }
|
yading@10
|
635 f = f0;
|
yading@10
|
636 printf("\nbreaks: ");
|
yading@10
|
637 for (i=0; i<4; i++) {
|
yading@10
|
638 printf("%c%d%c", f->breaks & BREAK_LEFT ? '|' : '.', i, f->breaks & BREAK_RIGHT ? '|' : '.');
|
yading@10
|
639 f = f->next;
|
yading@10
|
640 }
|
yading@10
|
641 printf("\n");
|
yading@10
|
642 }
|
yading@10
|
643
|
yading@10
|
644
|
yading@10
|
645
|
yading@10
|
646
|
yading@10
|
647
|
yading@10
|
648 struct pullup_frame *ff_pullup_get_frame(struct pullup_context *c)
|
yading@10
|
649 {
|
yading@10
|
650 int i;
|
yading@10
|
651 struct pullup_frame *fr = c->frame;
|
yading@10
|
652 int n = decide_frame_length(c);
|
yading@10
|
653 int aff = c->first->next->affinity;
|
yading@10
|
654
|
yading@10
|
655 if (!n) return 0;
|
yading@10
|
656 if (fr->lock) return 0;
|
yading@10
|
657
|
yading@10
|
658 if (c->verbose) {
|
yading@10
|
659 print_aff_and_breaks(c, c->first);
|
yading@10
|
660 printf("duration: %d \n", n);
|
yading@10
|
661 }
|
yading@10
|
662
|
yading@10
|
663 fr->lock++;
|
yading@10
|
664 fr->length = n;
|
yading@10
|
665 fr->parity = c->first->parity;
|
yading@10
|
666 fr->buffer = 0;
|
yading@10
|
667 for (i = 0; i < n; i++) {
|
yading@10
|
668 /* We cheat and steal the buffer without release+relock */
|
yading@10
|
669 fr->ifields[i] = c->first->buffer;
|
yading@10
|
670 c->first->buffer = 0;
|
yading@10
|
671 c->first = c->first->next;
|
yading@10
|
672 }
|
yading@10
|
673
|
yading@10
|
674 if (n == 1) {
|
yading@10
|
675 fr->ofields[fr->parity] = fr->ifields[0];
|
yading@10
|
676 fr->ofields[fr->parity^1] = 0;
|
yading@10
|
677 } else if (n == 2) {
|
yading@10
|
678 fr->ofields[fr->parity] = fr->ifields[0];
|
yading@10
|
679 fr->ofields[fr->parity^1] = fr->ifields[1];
|
yading@10
|
680 } else if (n == 3) {
|
yading@10
|
681 if (aff == 0)
|
yading@10
|
682 aff = (fr->ifields[0] == fr->ifields[1]) ? -1 : 1;
|
yading@10
|
683 /* else if (c->verbose) printf("forced aff: %d \n", aff); */
|
yading@10
|
684 fr->ofields[fr->parity] = fr->ifields[1+aff];
|
yading@10
|
685 fr->ofields[fr->parity^1] = fr->ifields[1];
|
yading@10
|
686 }
|
yading@10
|
687 ff_pullup_lock_buffer(fr->ofields[0], 0);
|
yading@10
|
688 ff_pullup_lock_buffer(fr->ofields[1], 1);
|
yading@10
|
689
|
yading@10
|
690 if (fr->ofields[0] == fr->ofields[1]) {
|
yading@10
|
691 fr->buffer = fr->ofields[0];
|
yading@10
|
692 ff_pullup_lock_buffer(fr->buffer, 2);
|
yading@10
|
693 return fr;
|
yading@10
|
694 }
|
yading@10
|
695 return fr;
|
yading@10
|
696 }
|
yading@10
|
697
|
yading@10
|
698 static void copy_field(struct pullup_context *c, struct pullup_buffer *dest,
|
yading@10
|
699 struct pullup_buffer *src, int parity)
|
yading@10
|
700 {
|
yading@10
|
701 int i, j;
|
yading@10
|
702 unsigned char *d, *s;
|
yading@10
|
703 for (i = 0; i < c->nplanes; i++) {
|
yading@10
|
704 s = src->planes[i] + parity*c->stride[i];
|
yading@10
|
705 d = dest->planes[i] + parity*c->stride[i];
|
yading@10
|
706 for (j = c->h[i]>>1; j; j--) {
|
yading@10
|
707 memcpy(d, s, c->stride[i]);
|
yading@10
|
708 s += c->stride[i]<<1;
|
yading@10
|
709 d += c->stride[i]<<1;
|
yading@10
|
710 }
|
yading@10
|
711 }
|
yading@10
|
712 }
|
yading@10
|
713
|
yading@10
|
714 void ff_pullup_pack_frame(struct pullup_context *c, struct pullup_frame *fr)
|
yading@10
|
715 {
|
yading@10
|
716 int i;
|
yading@10
|
717 if (fr->buffer) return;
|
yading@10
|
718 if (fr->length < 2) return; /* FIXME: deal with this */
|
yading@10
|
719 for (i = 0; i < 2; i++)
|
yading@10
|
720 {
|
yading@10
|
721 if (fr->ofields[i]->lock[i^1]) continue;
|
yading@10
|
722 fr->buffer = fr->ofields[i];
|
yading@10
|
723 ff_pullup_lock_buffer(fr->buffer, 2);
|
yading@10
|
724 copy_field(c, fr->buffer, fr->ofields[i^1], i^1);
|
yading@10
|
725 return;
|
yading@10
|
726 }
|
yading@10
|
727 fr->buffer = ff_pullup_get_buffer(c, 2);
|
yading@10
|
728 copy_field(c, fr->buffer, fr->ofields[0], 0);
|
yading@10
|
729 copy_field(c, fr->buffer, fr->ofields[1], 1);
|
yading@10
|
730 }
|
yading@10
|
731
|
yading@10
|
732 void ff_pullup_release_frame(struct pullup_frame *fr)
|
yading@10
|
733 {
|
yading@10
|
734 int i;
|
yading@10
|
735 for (i = 0; i < fr->length; i++)
|
yading@10
|
736 ff_pullup_release_buffer(fr->ifields[i], fr->parity ^ (i&1));
|
yading@10
|
737 ff_pullup_release_buffer(fr->ofields[0], 0);
|
yading@10
|
738 ff_pullup_release_buffer(fr->ofields[1], 1);
|
yading@10
|
739 if (fr->buffer) ff_pullup_release_buffer(fr->buffer, 2);
|
yading@10
|
740 fr->lock--;
|
yading@10
|
741 }
|
yading@10
|
742
|
yading@10
|
743
|
yading@10
|
744
|
yading@10
|
745
|
yading@10
|
746
|
yading@10
|
747
|
yading@10
|
748 struct pullup_context *ff_pullup_alloc_context(void)
|
yading@10
|
749 {
|
yading@10
|
750 struct pullup_context *c;
|
yading@10
|
751
|
yading@10
|
752 c = calloc(1, sizeof(struct pullup_context));
|
yading@10
|
753
|
yading@10
|
754 return c;
|
yading@10
|
755 }
|
yading@10
|
756
|
yading@10
|
757 void ff_pullup_preinit_context(struct pullup_context *c)
|
yading@10
|
758 {
|
yading@10
|
759 c->bpp = calloc(c->nplanes, sizeof(int));
|
yading@10
|
760 c->w = calloc(c->nplanes, sizeof(int));
|
yading@10
|
761 c->h = calloc(c->nplanes, sizeof(int));
|
yading@10
|
762 c->stride = calloc(c->nplanes, sizeof(int));
|
yading@10
|
763 c->background = calloc(c->nplanes, sizeof(int));
|
yading@10
|
764 }
|
yading@10
|
765
|
yading@10
|
766 void ff_pullup_init_context(struct pullup_context *c)
|
yading@10
|
767 {
|
yading@10
|
768 int mp = c->metric_plane;
|
yading@10
|
769 if (c->nbuffers < 10) c->nbuffers = 10;
|
yading@10
|
770 c->buffers = calloc(c->nbuffers, sizeof (struct pullup_buffer));
|
yading@10
|
771
|
yading@10
|
772 c->metric_w = (c->w[mp] - ((c->junk_left + c->junk_right) << 3)) >> 3;
|
yading@10
|
773 c->metric_h = (c->h[mp] - ((c->junk_top + c->junk_bottom) << 1)) >> 3;
|
yading@10
|
774 c->metric_offset = c->junk_left*c->bpp[mp] + (c->junk_top<<1)*c->stride[mp];
|
yading@10
|
775 c->metric_len = c->metric_w * c->metric_h;
|
yading@10
|
776
|
yading@10
|
777 c->head = make_field_queue(c, 8);
|
yading@10
|
778
|
yading@10
|
779 c->frame = calloc(1, sizeof (struct pullup_frame));
|
yading@10
|
780 c->frame->ifields = calloc(3, sizeof (struct pullup_buffer *));
|
yading@10
|
781
|
yading@10
|
782 switch(c->format) {
|
yading@10
|
783 case PULLUP_FMT_Y:
|
yading@10
|
784 c->diff = diff_y;
|
yading@10
|
785 c->comb = licomb_y;
|
yading@10
|
786 c->var = var_y;
|
yading@10
|
787 #if ARCH_X86
|
yading@10
|
788 #if HAVE_MMX
|
yading@10
|
789 if (c->cpu & PULLUP_CPU_MMX) {
|
yading@10
|
790 c->diff = diff_y_mmx;
|
yading@10
|
791 c->comb = licomb_y_mmx;
|
yading@10
|
792 c->var = var_y_mmx;
|
yading@10
|
793 }
|
yading@10
|
794 #endif
|
yading@10
|
795 #endif
|
yading@10
|
796 /* c->comb = qpcomb_y; */
|
yading@10
|
797 break;
|
yading@10
|
798 #if 0
|
yading@10
|
799 case PULLUP_FMT_YUY2:
|
yading@10
|
800 c->diff = diff_yuy2;
|
yading@10
|
801 break;
|
yading@10
|
802 case PULLUP_FMT_RGB32:
|
yading@10
|
803 c->diff = diff_rgb32;
|
yading@10
|
804 break;
|
yading@10
|
805 #endif
|
yading@10
|
806 }
|
yading@10
|
807 }
|
yading@10
|
808
|
yading@10
|
809 void ff_pullup_free_context(struct pullup_context *c)
|
yading@10
|
810 {
|
yading@10
|
811 struct pullup_field *f;
|
yading@10
|
812 free(c->buffers);
|
yading@10
|
813 f = c->head;
|
yading@10
|
814 do {
|
yading@10
|
815 if (!f) break;
|
yading@10
|
816 free(f->diffs);
|
yading@10
|
817 free(f->comb);
|
yading@10
|
818 f = f->next;
|
yading@10
|
819 free(f->prev);
|
yading@10
|
820 } while (f != c->head);
|
yading@10
|
821 free(c->frame);
|
yading@10
|
822 free(c);
|
yading@10
|
823 }
|