yading@10
|
1 /*
|
yading@10
|
2 * H.26L/H.264/AVC/JVT/14496-10/... encoder/decoder
|
yading@10
|
3 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
|
yading@10
|
4 *
|
yading@10
|
5 * This file is part of FFmpeg.
|
yading@10
|
6 *
|
yading@10
|
7 * FFmpeg is free software; you can redistribute it and/or
|
yading@10
|
8 * modify it under the terms of the GNU Lesser General Public
|
yading@10
|
9 * License as published by the Free Software Foundation; either
|
yading@10
|
10 * version 2.1 of the License, or (at your option) any later version.
|
yading@10
|
11 *
|
yading@10
|
12 * FFmpeg is distributed in the hope that it will be useful,
|
yading@10
|
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
|
yading@10
|
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
yading@10
|
15 * Lesser General Public License for more details.
|
yading@10
|
16 *
|
yading@10
|
17 * You should have received a copy of the GNU Lesser General Public
|
yading@10
|
18 * License along with FFmpeg; if not, write to the Free Software
|
yading@10
|
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
yading@10
|
20 */
|
yading@10
|
21
|
yading@10
|
22 /**
|
yading@10
|
23 * @file
|
yading@10
|
24 * H.264 / AVC / MPEG4 part10 prediction functions.
|
yading@10
|
25 * @author Michael Niedermayer <michaelni@gmx.at>
|
yading@10
|
26 */
|
yading@10
|
27
|
yading@10
|
28 #include "libavutil/avassert.h"
|
yading@10
|
29 #include "dsputil.h"
|
yading@10
|
30 #include "h264pred.h"
|
yading@10
|
31 #include "avcodec.h" // for AV_CODEC_ID_*
|
yading@10
|
32
|
yading@10
|
33 #define BIT_DEPTH 8
|
yading@10
|
34 #include "h264pred_template.c"
|
yading@10
|
35 #undef BIT_DEPTH
|
yading@10
|
36
|
yading@10
|
37 #define BIT_DEPTH 9
|
yading@10
|
38 #include "h264pred_template.c"
|
yading@10
|
39 #undef BIT_DEPTH
|
yading@10
|
40
|
yading@10
|
41 #define BIT_DEPTH 10
|
yading@10
|
42 #include "h264pred_template.c"
|
yading@10
|
43 #undef BIT_DEPTH
|
yading@10
|
44
|
yading@10
|
45 #define BIT_DEPTH 12
|
yading@10
|
46 #include "h264pred_template.c"
|
yading@10
|
47 #undef BIT_DEPTH
|
yading@10
|
48
|
yading@10
|
49 #define BIT_DEPTH 14
|
yading@10
|
50 #include "h264pred_template.c"
|
yading@10
|
51 #undef BIT_DEPTH
|
yading@10
|
52
|
yading@10
|
53 static void pred4x4_vertical_vp8_c(uint8_t *src, const uint8_t *topright,
|
yading@10
|
54 ptrdiff_t stride)
|
yading@10
|
55 {
|
yading@10
|
56 const unsigned lt = src[-1-1*stride];
|
yading@10
|
57 LOAD_TOP_EDGE
|
yading@10
|
58 LOAD_TOP_RIGHT_EDGE
|
yading@10
|
59 uint32_t v = PACK_4U8((lt + 2*t0 + t1 + 2) >> 2,
|
yading@10
|
60 (t0 + 2*t1 + t2 + 2) >> 2,
|
yading@10
|
61 (t1 + 2*t2 + t3 + 2) >> 2,
|
yading@10
|
62 (t2 + 2*t3 + t4 + 2) >> 2);
|
yading@10
|
63
|
yading@10
|
64 AV_WN32A(src+0*stride, v);
|
yading@10
|
65 AV_WN32A(src+1*stride, v);
|
yading@10
|
66 AV_WN32A(src+2*stride, v);
|
yading@10
|
67 AV_WN32A(src+3*stride, v);
|
yading@10
|
68 }
|
yading@10
|
69
|
yading@10
|
70 static void pred4x4_horizontal_vp8_c(uint8_t *src, const uint8_t *topright,
|
yading@10
|
71 ptrdiff_t stride)
|
yading@10
|
72 {
|
yading@10
|
73 const unsigned lt = src[-1-1*stride];
|
yading@10
|
74 LOAD_LEFT_EDGE
|
yading@10
|
75
|
yading@10
|
76 AV_WN32A(src+0*stride, ((lt + 2*l0 + l1 + 2) >> 2)*0x01010101);
|
yading@10
|
77 AV_WN32A(src+1*stride, ((l0 + 2*l1 + l2 + 2) >> 2)*0x01010101);
|
yading@10
|
78 AV_WN32A(src+2*stride, ((l1 + 2*l2 + l3 + 2) >> 2)*0x01010101);
|
yading@10
|
79 AV_WN32A(src+3*stride, ((l2 + 2*l3 + l3 + 2) >> 2)*0x01010101);
|
yading@10
|
80 }
|
yading@10
|
81
|
yading@10
|
82 static void pred4x4_down_left_svq3_c(uint8_t *src, const uint8_t *topright,
|
yading@10
|
83 ptrdiff_t stride)
|
yading@10
|
84 {
|
yading@10
|
85 LOAD_TOP_EDGE
|
yading@10
|
86 LOAD_LEFT_EDGE
|
yading@10
|
87
|
yading@10
|
88 src[0+0*stride]=(l1 + t1)>>1;
|
yading@10
|
89 src[1+0*stride]=
|
yading@10
|
90 src[0+1*stride]=(l2 + t2)>>1;
|
yading@10
|
91 src[2+0*stride]=
|
yading@10
|
92 src[1+1*stride]=
|
yading@10
|
93 src[0+2*stride]=
|
yading@10
|
94 src[3+0*stride]=
|
yading@10
|
95 src[2+1*stride]=
|
yading@10
|
96 src[1+2*stride]=
|
yading@10
|
97 src[0+3*stride]=
|
yading@10
|
98 src[3+1*stride]=
|
yading@10
|
99 src[2+2*stride]=
|
yading@10
|
100 src[1+3*stride]=
|
yading@10
|
101 src[3+2*stride]=
|
yading@10
|
102 src[2+3*stride]=
|
yading@10
|
103 src[3+3*stride]=(l3 + t3)>>1;
|
yading@10
|
104 }
|
yading@10
|
105
|
yading@10
|
106 static void pred4x4_down_left_rv40_c(uint8_t *src, const uint8_t *topright,
|
yading@10
|
107 ptrdiff_t stride)
|
yading@10
|
108 {
|
yading@10
|
109 LOAD_TOP_EDGE
|
yading@10
|
110 LOAD_TOP_RIGHT_EDGE
|
yading@10
|
111 LOAD_LEFT_EDGE
|
yading@10
|
112 LOAD_DOWN_LEFT_EDGE
|
yading@10
|
113
|
yading@10
|
114 src[0+0*stride]=(t0 + t2 + 2*t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
|
yading@10
|
115 src[1+0*stride]=
|
yading@10
|
116 src[0+1*stride]=(t1 + t3 + 2*t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
|
yading@10
|
117 src[2+0*stride]=
|
yading@10
|
118 src[1+1*stride]=
|
yading@10
|
119 src[0+2*stride]=(t2 + t4 + 2*t3 + 2 + l2 + l4 + 2*l3 + 2)>>3;
|
yading@10
|
120 src[3+0*stride]=
|
yading@10
|
121 src[2+1*stride]=
|
yading@10
|
122 src[1+2*stride]=
|
yading@10
|
123 src[0+3*stride]=(t3 + t5 + 2*t4 + 2 + l3 + l5 + 2*l4 + 2)>>3;
|
yading@10
|
124 src[3+1*stride]=
|
yading@10
|
125 src[2+2*stride]=
|
yading@10
|
126 src[1+3*stride]=(t4 + t6 + 2*t5 + 2 + l4 + l6 + 2*l5 + 2)>>3;
|
yading@10
|
127 src[3+2*stride]=
|
yading@10
|
128 src[2+3*stride]=(t5 + t7 + 2*t6 + 2 + l5 + l7 + 2*l6 + 2)>>3;
|
yading@10
|
129 src[3+3*stride]=(t6 + t7 + 1 + l6 + l7 + 1)>>2;
|
yading@10
|
130 }
|
yading@10
|
131
|
yading@10
|
132 static void pred4x4_down_left_rv40_nodown_c(uint8_t *src,
|
yading@10
|
133 const uint8_t *topright,
|
yading@10
|
134 ptrdiff_t stride)
|
yading@10
|
135 {
|
yading@10
|
136 LOAD_TOP_EDGE
|
yading@10
|
137 LOAD_TOP_RIGHT_EDGE
|
yading@10
|
138 LOAD_LEFT_EDGE
|
yading@10
|
139
|
yading@10
|
140 src[0+0*stride]=(t0 + t2 + 2*t1 + 2 + l0 + l2 + 2*l1 + 2)>>3;
|
yading@10
|
141 src[1+0*stride]=
|
yading@10
|
142 src[0+1*stride]=(t1 + t3 + 2*t2 + 2 + l1 + l3 + 2*l2 + 2)>>3;
|
yading@10
|
143 src[2+0*stride]=
|
yading@10
|
144 src[1+1*stride]=
|
yading@10
|
145 src[0+2*stride]=(t2 + t4 + 2*t3 + 2 + l2 + 3*l3 + 2)>>3;
|
yading@10
|
146 src[3+0*stride]=
|
yading@10
|
147 src[2+1*stride]=
|
yading@10
|
148 src[1+2*stride]=
|
yading@10
|
149 src[0+3*stride]=(t3 + t5 + 2*t4 + 2 + l3*4 + 2)>>3;
|
yading@10
|
150 src[3+1*stride]=
|
yading@10
|
151 src[2+2*stride]=
|
yading@10
|
152 src[1+3*stride]=(t4 + t6 + 2*t5 + 2 + l3*4 + 2)>>3;
|
yading@10
|
153 src[3+2*stride]=
|
yading@10
|
154 src[2+3*stride]=(t5 + t7 + 2*t6 + 2 + l3*4 + 2)>>3;
|
yading@10
|
155 src[3+3*stride]=(t6 + t7 + 1 + 2*l3 + 1)>>2;
|
yading@10
|
156 }
|
yading@10
|
157
|
yading@10
|
158 static void pred4x4_vertical_left_rv40(uint8_t *src, const uint8_t *topright,
|
yading@10
|
159 ptrdiff_t stride,
|
yading@10
|
160 const int l0, const int l1, const int l2,
|
yading@10
|
161 const int l3, const int l4)
|
yading@10
|
162 {
|
yading@10
|
163 LOAD_TOP_EDGE
|
yading@10
|
164 LOAD_TOP_RIGHT_EDGE
|
yading@10
|
165
|
yading@10
|
166 src[0+0*stride]=(2*t0 + 2*t1 + l1 + 2*l2 + l3 + 4)>>3;
|
yading@10
|
167 src[1+0*stride]=
|
yading@10
|
168 src[0+2*stride]=(t1 + t2 + 1)>>1;
|
yading@10
|
169 src[2+0*stride]=
|
yading@10
|
170 src[1+2*stride]=(t2 + t3 + 1)>>1;
|
yading@10
|
171 src[3+0*stride]=
|
yading@10
|
172 src[2+2*stride]=(t3 + t4+ 1)>>1;
|
yading@10
|
173 src[3+2*stride]=(t4 + t5+ 1)>>1;
|
yading@10
|
174 src[0+1*stride]=(t0 + 2*t1 + t2 + l2 + 2*l3 + l4 + 4)>>3;
|
yading@10
|
175 src[1+1*stride]=
|
yading@10
|
176 src[0+3*stride]=(t1 + 2*t2 + t3 + 2)>>2;
|
yading@10
|
177 src[2+1*stride]=
|
yading@10
|
178 src[1+3*stride]=(t2 + 2*t3 + t4 + 2)>>2;
|
yading@10
|
179 src[3+1*stride]=
|
yading@10
|
180 src[2+3*stride]=(t3 + 2*t4 + t5 + 2)>>2;
|
yading@10
|
181 src[3+3*stride]=(t4 + 2*t5 + t6 + 2)>>2;
|
yading@10
|
182 }
|
yading@10
|
183
|
yading@10
|
184 static void pred4x4_vertical_left_rv40_c(uint8_t *src, const uint8_t *topright,
|
yading@10
|
185 ptrdiff_t stride)
|
yading@10
|
186 {
|
yading@10
|
187 LOAD_LEFT_EDGE
|
yading@10
|
188 LOAD_DOWN_LEFT_EDGE
|
yading@10
|
189
|
yading@10
|
190 pred4x4_vertical_left_rv40(src, topright, stride, l0, l1, l2, l3, l4);
|
yading@10
|
191 }
|
yading@10
|
192
|
yading@10
|
193 static void pred4x4_vertical_left_rv40_nodown_c(uint8_t *src,
|
yading@10
|
194 const uint8_t *topright,
|
yading@10
|
195 ptrdiff_t stride)
|
yading@10
|
196 {
|
yading@10
|
197 LOAD_LEFT_EDGE
|
yading@10
|
198
|
yading@10
|
199 pred4x4_vertical_left_rv40(src, topright, stride, l0, l1, l2, l3, l3);
|
yading@10
|
200 }
|
yading@10
|
201
|
yading@10
|
202 static void pred4x4_vertical_left_vp8_c(uint8_t *src, const uint8_t *topright,
|
yading@10
|
203 ptrdiff_t stride)
|
yading@10
|
204 {
|
yading@10
|
205 LOAD_TOP_EDGE
|
yading@10
|
206 LOAD_TOP_RIGHT_EDGE
|
yading@10
|
207
|
yading@10
|
208 src[0+0*stride]=(t0 + t1 + 1)>>1;
|
yading@10
|
209 src[1+0*stride]=
|
yading@10
|
210 src[0+2*stride]=(t1 + t2 + 1)>>1;
|
yading@10
|
211 src[2+0*stride]=
|
yading@10
|
212 src[1+2*stride]=(t2 + t3 + 1)>>1;
|
yading@10
|
213 src[3+0*stride]=
|
yading@10
|
214 src[2+2*stride]=(t3 + t4 + 1)>>1;
|
yading@10
|
215 src[0+1*stride]=(t0 + 2*t1 + t2 + 2)>>2;
|
yading@10
|
216 src[1+1*stride]=
|
yading@10
|
217 src[0+3*stride]=(t1 + 2*t2 + t3 + 2)>>2;
|
yading@10
|
218 src[2+1*stride]=
|
yading@10
|
219 src[1+3*stride]=(t2 + 2*t3 + t4 + 2)>>2;
|
yading@10
|
220 src[3+1*stride]=
|
yading@10
|
221 src[2+3*stride]=(t3 + 2*t4 + t5 + 2)>>2;
|
yading@10
|
222 src[3+2*stride]=(t4 + 2*t5 + t6 + 2)>>2;
|
yading@10
|
223 src[3+3*stride]=(t5 + 2*t6 + t7 + 2)>>2;
|
yading@10
|
224 }
|
yading@10
|
225
|
yading@10
|
226 static void pred4x4_horizontal_up_rv40_c(uint8_t *src, const uint8_t *topright,
|
yading@10
|
227 ptrdiff_t stride)
|
yading@10
|
228 {
|
yading@10
|
229 LOAD_LEFT_EDGE
|
yading@10
|
230 LOAD_DOWN_LEFT_EDGE
|
yading@10
|
231 LOAD_TOP_EDGE
|
yading@10
|
232 LOAD_TOP_RIGHT_EDGE
|
yading@10
|
233
|
yading@10
|
234 src[0+0*stride]=(t1 + 2*t2 + t3 + 2*l0 + 2*l1 + 4)>>3;
|
yading@10
|
235 src[1+0*stride]=(t2 + 2*t3 + t4 + l0 + 2*l1 + l2 + 4)>>3;
|
yading@10
|
236 src[2+0*stride]=
|
yading@10
|
237 src[0+1*stride]=(t3 + 2*t4 + t5 + 2*l1 + 2*l2 + 4)>>3;
|
yading@10
|
238 src[3+0*stride]=
|
yading@10
|
239 src[1+1*stride]=(t4 + 2*t5 + t6 + l1 + 2*l2 + l3 + 4)>>3;
|
yading@10
|
240 src[2+1*stride]=
|
yading@10
|
241 src[0+2*stride]=(t5 + 2*t6 + t7 + 2*l2 + 2*l3 + 4)>>3;
|
yading@10
|
242 src[3+1*stride]=
|
yading@10
|
243 src[1+2*stride]=(t6 + 3*t7 + l2 + 3*l3 + 4)>>3;
|
yading@10
|
244 src[3+2*stride]=
|
yading@10
|
245 src[1+3*stride]=(l3 + 2*l4 + l5 + 2)>>2;
|
yading@10
|
246 src[0+3*stride]=
|
yading@10
|
247 src[2+2*stride]=(t6 + t7 + l3 + l4 + 2)>>2;
|
yading@10
|
248 src[2+3*stride]=(l4 + l5 + 1)>>1;
|
yading@10
|
249 src[3+3*stride]=(l4 + 2*l5 + l6 + 2)>>2;
|
yading@10
|
250 }
|
yading@10
|
251
|
yading@10
|
252 static void pred4x4_horizontal_up_rv40_nodown_c(uint8_t *src,
|
yading@10
|
253 const uint8_t *topright,
|
yading@10
|
254 ptrdiff_t stride)
|
yading@10
|
255 {
|
yading@10
|
256 LOAD_LEFT_EDGE
|
yading@10
|
257 LOAD_TOP_EDGE
|
yading@10
|
258 LOAD_TOP_RIGHT_EDGE
|
yading@10
|
259
|
yading@10
|
260 src[0+0*stride]=(t1 + 2*t2 + t3 + 2*l0 + 2*l1 + 4)>>3;
|
yading@10
|
261 src[1+0*stride]=(t2 + 2*t3 + t4 + l0 + 2*l1 + l2 + 4)>>3;
|
yading@10
|
262 src[2+0*stride]=
|
yading@10
|
263 src[0+1*stride]=(t3 + 2*t4 + t5 + 2*l1 + 2*l2 + 4)>>3;
|
yading@10
|
264 src[3+0*stride]=
|
yading@10
|
265 src[1+1*stride]=(t4 + 2*t5 + t6 + l1 + 2*l2 + l3 + 4)>>3;
|
yading@10
|
266 src[2+1*stride]=
|
yading@10
|
267 src[0+2*stride]=(t5 + 2*t6 + t7 + 2*l2 + 2*l3 + 4)>>3;
|
yading@10
|
268 src[3+1*stride]=
|
yading@10
|
269 src[1+2*stride]=(t6 + 3*t7 + l2 + 3*l3 + 4)>>3;
|
yading@10
|
270 src[3+2*stride]=
|
yading@10
|
271 src[1+3*stride]=l3;
|
yading@10
|
272 src[0+3*stride]=
|
yading@10
|
273 src[2+2*stride]=(t6 + t7 + 2*l3 + 2)>>2;
|
yading@10
|
274 src[2+3*stride]=
|
yading@10
|
275 src[3+3*stride]=l3;
|
yading@10
|
276 }
|
yading@10
|
277
|
yading@10
|
278 static void pred4x4_tm_vp8_c(uint8_t *src, const uint8_t *topright,
|
yading@10
|
279 ptrdiff_t stride)
|
yading@10
|
280 {
|
yading@10
|
281 const uint8_t *cm = ff_cropTbl + MAX_NEG_CROP - src[-1-stride];
|
yading@10
|
282 uint8_t *top = src-stride;
|
yading@10
|
283 int y;
|
yading@10
|
284
|
yading@10
|
285 for (y = 0; y < 4; y++) {
|
yading@10
|
286 const uint8_t *cm_in = cm + src[-1];
|
yading@10
|
287 src[0] = cm_in[top[0]];
|
yading@10
|
288 src[1] = cm_in[top[1]];
|
yading@10
|
289 src[2] = cm_in[top[2]];
|
yading@10
|
290 src[3] = cm_in[top[3]];
|
yading@10
|
291 src += stride;
|
yading@10
|
292 }
|
yading@10
|
293 }
|
yading@10
|
294
|
yading@10
|
/**
 * SVQ3 16x16 plane prediction: delegates to pred16x16_plane_compat_8_c()
 * with the two trailing flag arguments set to (1, 0).
 *
 * NOTE(review): the callee is defined outside this file section; the
 * meaning of its two flags (presumably "SVQ3 mode" and "RV40 mode") should
 * be confirmed at its definition.
 *
 * @param src    first pixel of the 16x16 block to fill
 * @param stride offset between two consecutive rows of src
 */
static void
pred16x16_plane_svq3_c(uint8_t *src, ptrdiff_t stride)
{
    pred16x16_plane_compat_8_c(src, stride,
                               1,
                               0);
}
|
yading@10
|
299
|
yading@10
|
/**
 * RV40 16x16 plane prediction: delegates to pred16x16_plane_compat_8_c()
 * with the two trailing flag arguments set to (0, 1).
 *
 * NOTE(review): the callee is defined outside this file section; the
 * meaning of its two flags (presumably "SVQ3 mode" and "RV40 mode") should
 * be confirmed at its definition.
 *
 * @param src    first pixel of the 16x16 block to fill
 * @param stride offset between two consecutive rows of src
 */
static void
pred16x16_plane_rv40_c(uint8_t *src, ptrdiff_t stride)
{
    pred16x16_plane_compat_8_c(src, stride,
                               0,
                               1);
}
|
yading@10
|
304
|
yading@10
|
305 static void pred16x16_tm_vp8_c(uint8_t *src, ptrdiff_t stride)
|
yading@10
|
306 {
|
yading@10
|
307 const uint8_t *cm = ff_cropTbl + MAX_NEG_CROP - src[-1-stride];
|
yading@10
|
308 uint8_t *top = src-stride;
|
yading@10
|
309 int y;
|
yading@10
|
310
|
yading@10
|
311 for (y = 0; y < 16; y++) {
|
yading@10
|
312 const uint8_t *cm_in = cm + src[-1];
|
yading@10
|
313 src[0] = cm_in[top[0]];
|
yading@10
|
314 src[1] = cm_in[top[1]];
|
yading@10
|
315 src[2] = cm_in[top[2]];
|
yading@10
|
316 src[3] = cm_in[top[3]];
|
yading@10
|
317 src[4] = cm_in[top[4]];
|
yading@10
|
318 src[5] = cm_in[top[5]];
|
yading@10
|
319 src[6] = cm_in[top[6]];
|
yading@10
|
320 src[7] = cm_in[top[7]];
|
yading@10
|
321 src[8] = cm_in[top[8]];
|
yading@10
|
322 src[9] = cm_in[top[9]];
|
yading@10
|
323 src[10] = cm_in[top[10]];
|
yading@10
|
324 src[11] = cm_in[top[11]];
|
yading@10
|
325 src[12] = cm_in[top[12]];
|
yading@10
|
326 src[13] = cm_in[top[13]];
|
yading@10
|
327 src[14] = cm_in[top[14]];
|
yading@10
|
328 src[15] = cm_in[top[15]];
|
yading@10
|
329 src += stride;
|
yading@10
|
330 }
|
yading@10
|
331 }
|
yading@10
|
332
|
yading@10
|
/**
 * RV40 8x8 DC prediction from the left neighbours only.
 *
 * Fills the whole 8x8 block with the rounded mean of the eight samples in
 * the column immediately left of the block.
 *
 * Rows are written byte by byte, so neither src nor stride needs any
 * particular alignment and the uint8_t buffer is never accessed through a
 * wider lvalue type.
 *
 * @param src    first pixel of the 8x8 block to fill
 * @param stride offset between two consecutive rows of src
 */
static void pred8x8_left_dc_rv40_c(uint8_t *src, ptrdiff_t stride)
{
    unsigned sum = 0;
    uint8_t dc;
    int x, y;

    for (y = 0; y < 8; y++)
        sum += src[-1 + y*stride];
    /* At most 8*255 + 4, so the rounded mean always fits in a byte. */
    dc = (sum + 4) >> 3;

    for (y = 0; y < 8; y++) {
        uint8_t *const row = src + y*stride;

        for (x = 0; x < 8; x++)
            row[x] = dc;
    }
}
|
yading@10
|
348
|
yading@10
|
/**
 * RV40 8x8 DC prediction from the top neighbours only.
 *
 * Fills the whole 8x8 block with the rounded mean of the eight samples in
 * the row immediately above the block.
 *
 * Rows are written byte by byte, so neither src nor stride needs any
 * particular alignment and the uint8_t buffer is never accessed through a
 * wider lvalue type.
 *
 * @param src    first pixel of the 8x8 block to fill
 * @param stride offset between two consecutive rows of src
 */
static void pred8x8_top_dc_rv40_c(uint8_t *src, ptrdiff_t stride)
{
    unsigned sum = 0;
    uint8_t dc;
    int x, y;

    for (x = 0; x < 8; x++)
        sum += src[x - stride];
    /* At most 8*255 + 4, so the rounded mean always fits in a byte. */
    dc = (sum + 4) >> 3;

    for (y = 0; y < 8; y++) {
        uint8_t *const row = src + y*stride;

        for (x = 0; x < 8; x++)
            row[x] = dc;
    }
}
|
yading@10
|
364
|
yading@10
|
/**
 * RV40 8x8 DC prediction from both the top and the left neighbours.
 *
 * Fills the whole 8x8 block with the rounded mean of the sixteen samples
 * formed by the row immediately above and the column immediately left of
 * the block.
 *
 * Rows are written byte by byte, so neither src nor stride needs any
 * particular alignment and the uint8_t buffer is never accessed through a
 * wider lvalue type.
 *
 * @param src    first pixel of the 8x8 block to fill
 * @param stride offset between two consecutive rows of src
 */
static void pred8x8_dc_rv40_c(uint8_t *src, ptrdiff_t stride)
{
    unsigned sum = 0;
    uint8_t dc;
    int i, x, y;

    for (i = 0; i < 8; i++)
        sum += src[-1 + i*stride] + src[i - stride];
    /* At most 16*255 + 8, so the rounded mean always fits in a byte. */
    dc = (sum + 8) >> 4;

    for (y = 0; y < 8; y++) {
        uint8_t *const row = src + y*stride;

        for (x = 0; x < 8; x++)
            row[x] = dc;
    }
}
|
yading@10
|
386
|
yading@10
|
387 static void pred8x8_tm_vp8_c(uint8_t *src, ptrdiff_t stride)
|
yading@10
|
388 {
|
yading@10
|
389 const uint8_t *cm = ff_cropTbl + MAX_NEG_CROP - src[-1-stride];
|
yading@10
|
390 uint8_t *top = src-stride;
|
yading@10
|
391 int y;
|
yading@10
|
392
|
yading@10
|
393 for (y = 0; y < 8; y++) {
|
yading@10
|
394 const uint8_t *cm_in = cm + src[-1];
|
yading@10
|
395 src[0] = cm_in[top[0]];
|
yading@10
|
396 src[1] = cm_in[top[1]];
|
yading@10
|
397 src[2] = cm_in[top[2]];
|
yading@10
|
398 src[3] = cm_in[top[3]];
|
yading@10
|
399 src[4] = cm_in[top[4]];
|
yading@10
|
400 src[5] = cm_in[top[5]];
|
yading@10
|
401 src[6] = cm_in[top[6]];
|
yading@10
|
402 src[7] = cm_in[top[7]];
|
yading@10
|
403 src += stride;
|
yading@10
|
404 }
|
yading@10
|
405 }
|
yading@10
|
406
|
yading@10
|
407 /**
|
yading@10
|
408 * Set the intra prediction function pointers.
|
yading@10
|
409 */
|
yading@10
|
410 void ff_h264_pred_init(H264PredContext *h, int codec_id, const int bit_depth,
|
yading@10
|
411 int chroma_format_idc)
|
yading@10
|
412 {
|
yading@10
|
413 #undef FUNC
|
yading@10
|
414 #undef FUNCC
|
yading@10
|
415 #define FUNC(a, depth) a ## _ ## depth
|
yading@10
|
416 #define FUNCC(a, depth) a ## _ ## depth ## _c
|
yading@10
|
417 #define FUNCD(a) a ## _c
|
yading@10
|
418
|
yading@10
|
419 #define H264_PRED(depth) \
|
yading@10
|
420 if(codec_id != AV_CODEC_ID_RV40){\
|
yading@10
|
421 if(codec_id == AV_CODEC_ID_VP8) {\
|
yading@10
|
422 h->pred4x4[VERT_PRED ]= FUNCD(pred4x4_vertical_vp8);\
|
yading@10
|
423 h->pred4x4[HOR_PRED ]= FUNCD(pred4x4_horizontal_vp8);\
|
yading@10
|
424 } else {\
|
yading@10
|
425 h->pred4x4[VERT_PRED ]= FUNCC(pred4x4_vertical , depth);\
|
yading@10
|
426 h->pred4x4[HOR_PRED ]= FUNCC(pred4x4_horizontal , depth);\
|
yading@10
|
427 }\
|
yading@10
|
428 h->pred4x4[DC_PRED ]= FUNCC(pred4x4_dc , depth);\
|
yading@10
|
429 if(codec_id == AV_CODEC_ID_SVQ3)\
|
yading@10
|
430 h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCD(pred4x4_down_left_svq3);\
|
yading@10
|
431 else\
|
yading@10
|
432 h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred4x4_down_left , depth);\
|
yading@10
|
433 h->pred4x4[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred4x4_down_right , depth);\
|
yading@10
|
434 h->pred4x4[VERT_RIGHT_PRED ]= FUNCC(pred4x4_vertical_right , depth);\
|
yading@10
|
435 h->pred4x4[HOR_DOWN_PRED ]= FUNCC(pred4x4_horizontal_down , depth);\
|
yading@10
|
436 if (codec_id == AV_CODEC_ID_VP8) {\
|
yading@10
|
437 h->pred4x4[VERT_LEFT_PRED ]= FUNCD(pred4x4_vertical_left_vp8);\
|
yading@10
|
438 } else\
|
yading@10
|
439 h->pred4x4[VERT_LEFT_PRED ]= FUNCC(pred4x4_vertical_left , depth);\
|
yading@10
|
440 h->pred4x4[HOR_UP_PRED ]= FUNCC(pred4x4_horizontal_up , depth);\
|
yading@10
|
441 if(codec_id != AV_CODEC_ID_VP8) {\
|
yading@10
|
442 h->pred4x4[LEFT_DC_PRED ]= FUNCC(pred4x4_left_dc , depth);\
|
yading@10
|
443 h->pred4x4[TOP_DC_PRED ]= FUNCC(pred4x4_top_dc , depth);\
|
yading@10
|
444 h->pred4x4[DC_128_PRED ]= FUNCC(pred4x4_128_dc , depth);\
|
yading@10
|
445 } else {\
|
yading@10
|
446 h->pred4x4[TM_VP8_PRED ]= FUNCD(pred4x4_tm_vp8);\
|
yading@10
|
447 h->pred4x4[DC_127_PRED ]= FUNCC(pred4x4_127_dc , depth);\
|
yading@10
|
448 h->pred4x4[DC_129_PRED ]= FUNCC(pred4x4_129_dc , depth);\
|
yading@10
|
449 h->pred4x4[VERT_VP8_PRED ]= FUNCC(pred4x4_vertical , depth);\
|
yading@10
|
450 h->pred4x4[HOR_VP8_PRED ]= FUNCC(pred4x4_horizontal , depth);\
|
yading@10
|
451 }\
|
yading@10
|
452 }else{\
|
yading@10
|
453 h->pred4x4[VERT_PRED ]= FUNCC(pred4x4_vertical , depth);\
|
yading@10
|
454 h->pred4x4[HOR_PRED ]= FUNCC(pred4x4_horizontal , depth);\
|
yading@10
|
455 h->pred4x4[DC_PRED ]= FUNCC(pred4x4_dc , depth);\
|
yading@10
|
456 h->pred4x4[DIAG_DOWN_LEFT_PRED ]= FUNCD(pred4x4_down_left_rv40);\
|
yading@10
|
457 h->pred4x4[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred4x4_down_right , depth);\
|
yading@10
|
458 h->pred4x4[VERT_RIGHT_PRED ]= FUNCC(pred4x4_vertical_right , depth);\
|
yading@10
|
459 h->pred4x4[HOR_DOWN_PRED ]= FUNCC(pred4x4_horizontal_down , depth);\
|
yading@10
|
460 h->pred4x4[VERT_LEFT_PRED ]= FUNCD(pred4x4_vertical_left_rv40);\
|
yading@10
|
461 h->pred4x4[HOR_UP_PRED ]= FUNCD(pred4x4_horizontal_up_rv40);\
|
yading@10
|
462 h->pred4x4[LEFT_DC_PRED ]= FUNCC(pred4x4_left_dc , depth);\
|
yading@10
|
463 h->pred4x4[TOP_DC_PRED ]= FUNCC(pred4x4_top_dc , depth);\
|
yading@10
|
464 h->pred4x4[DC_128_PRED ]= FUNCC(pred4x4_128_dc , depth);\
|
yading@10
|
465 h->pred4x4[DIAG_DOWN_LEFT_PRED_RV40_NODOWN]= FUNCD(pred4x4_down_left_rv40_nodown);\
|
yading@10
|
466 h->pred4x4[HOR_UP_PRED_RV40_NODOWN]= FUNCD(pred4x4_horizontal_up_rv40_nodown);\
|
yading@10
|
467 h->pred4x4[VERT_LEFT_PRED_RV40_NODOWN]= FUNCD(pred4x4_vertical_left_rv40_nodown);\
|
yading@10
|
468 }\
|
yading@10
|
469 \
|
yading@10
|
470 h->pred8x8l[VERT_PRED ]= FUNCC(pred8x8l_vertical , depth);\
|
yading@10
|
471 h->pred8x8l[HOR_PRED ]= FUNCC(pred8x8l_horizontal , depth);\
|
yading@10
|
472 h->pred8x8l[DC_PRED ]= FUNCC(pred8x8l_dc , depth);\
|
yading@10
|
473 h->pred8x8l[DIAG_DOWN_LEFT_PRED ]= FUNCC(pred8x8l_down_left , depth);\
|
yading@10
|
474 h->pred8x8l[DIAG_DOWN_RIGHT_PRED]= FUNCC(pred8x8l_down_right , depth);\
|
yading@10
|
475 h->pred8x8l[VERT_RIGHT_PRED ]= FUNCC(pred8x8l_vertical_right , depth);\
|
yading@10
|
476 h->pred8x8l[HOR_DOWN_PRED ]= FUNCC(pred8x8l_horizontal_down , depth);\
|
yading@10
|
477 h->pred8x8l[VERT_LEFT_PRED ]= FUNCC(pred8x8l_vertical_left , depth);\
|
yading@10
|
478 h->pred8x8l[HOR_UP_PRED ]= FUNCC(pred8x8l_horizontal_up , depth);\
|
yading@10
|
479 h->pred8x8l[LEFT_DC_PRED ]= FUNCC(pred8x8l_left_dc , depth);\
|
yading@10
|
480 h->pred8x8l[TOP_DC_PRED ]= FUNCC(pred8x8l_top_dc , depth);\
|
yading@10
|
481 h->pred8x8l[DC_128_PRED ]= FUNCC(pred8x8l_128_dc , depth);\
|
yading@10
|
482 \
|
yading@10
|
483 if (chroma_format_idc == 1) {\
|
yading@10
|
484 h->pred8x8[VERT_PRED8x8 ]= FUNCC(pred8x8_vertical , depth);\
|
yading@10
|
485 h->pred8x8[HOR_PRED8x8 ]= FUNCC(pred8x8_horizontal , depth);\
|
yading@10
|
486 } else {\
|
yading@10
|
487 h->pred8x8[VERT_PRED8x8 ]= FUNCC(pred8x16_vertical , depth);\
|
yading@10
|
488 h->pred8x8[HOR_PRED8x8 ]= FUNCC(pred8x16_horizontal , depth);\
|
yading@10
|
489 }\
|
yading@10
|
490 if (codec_id != AV_CODEC_ID_VP8) {\
|
yading@10
|
491 if (chroma_format_idc == 1) {\
|
yading@10
|
492 h->pred8x8[PLANE_PRED8x8]= FUNCC(pred8x8_plane , depth);\
|
yading@10
|
493 } else {\
|
yading@10
|
494 h->pred8x8[PLANE_PRED8x8]= FUNCC(pred8x16_plane , depth);\
|
yading@10
|
495 }\
|
yading@10
|
496 } else\
|
yading@10
|
497 h->pred8x8[PLANE_PRED8x8]= FUNCD(pred8x8_tm_vp8);\
|
yading@10
|
498 if(codec_id != AV_CODEC_ID_RV40 && codec_id != AV_CODEC_ID_VP8){\
|
yading@10
|
499 if (chroma_format_idc == 1) {\
|
yading@10
|
500 h->pred8x8[DC_PRED8x8 ]= FUNCC(pred8x8_dc , depth);\
|
yading@10
|
501 h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x8_left_dc , depth);\
|
yading@10
|
502 h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x8_top_dc , depth);\
|
yading@10
|
503 h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l0t, depth);\
|
yading@10
|
504 h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0lt, depth);\
|
yading@10
|
505 h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_l00, depth);\
|
yading@10
|
506 h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x8_mad_cow_dc_0l0, depth);\
|
yading@10
|
507 } else {\
|
yading@10
|
508 h->pred8x8[DC_PRED8x8 ]= FUNCC(pred8x16_dc , depth);\
|
yading@10
|
509 h->pred8x8[LEFT_DC_PRED8x8]= FUNCC(pred8x16_left_dc , depth);\
|
yading@10
|
510 h->pred8x8[TOP_DC_PRED8x8 ]= FUNCC(pred8x16_top_dc , depth);\
|
yading@10
|
511 h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_l0t, depth);\
|
yading@10
|
512 h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_0lt, depth);\
|
yading@10
|
513 h->pred8x8[ALZHEIMER_DC_L00_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_l00, depth);\
|
yading@10
|
514 h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8 ]= FUNC(pred8x16_mad_cow_dc_0l0, depth);\
|
yading@10
|
515 }\
|
yading@10
|
516 }else{\
|
yading@10
|
517 h->pred8x8[DC_PRED8x8 ]= FUNCD(pred8x8_dc_rv40);\
|
yading@10
|
518 h->pred8x8[LEFT_DC_PRED8x8]= FUNCD(pred8x8_left_dc_rv40);\
|
yading@10
|
519 h->pred8x8[TOP_DC_PRED8x8 ]= FUNCD(pred8x8_top_dc_rv40);\
|
yading@10
|
520 if (codec_id == AV_CODEC_ID_VP8) {\
|
yading@10
|
521 h->pred8x8[DC_127_PRED8x8]= FUNCC(pred8x8_127_dc , depth);\
|
yading@10
|
522 h->pred8x8[DC_129_PRED8x8]= FUNCC(pred8x8_129_dc , depth);\
|
yading@10
|
523 }\
|
yading@10
|
524 }\
|
yading@10
|
525 if (chroma_format_idc == 1) {\
|
yading@10
|
526 h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x8_128_dc , depth);\
|
yading@10
|
527 } else {\
|
yading@10
|
528 h->pred8x8[DC_128_PRED8x8 ]= FUNCC(pred8x16_128_dc , depth);\
|
yading@10
|
529 }\
|
yading@10
|
530 \
|
yading@10
|
531 h->pred16x16[DC_PRED8x8 ]= FUNCC(pred16x16_dc , depth);\
|
yading@10
|
532 h->pred16x16[VERT_PRED8x8 ]= FUNCC(pred16x16_vertical , depth);\
|
yading@10
|
533 h->pred16x16[HOR_PRED8x8 ]= FUNCC(pred16x16_horizontal , depth);\
|
yading@10
|
534 switch(codec_id){\
|
yading@10
|
535 case AV_CODEC_ID_SVQ3:\
|
yading@10
|
536 h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_plane_svq3);\
|
yading@10
|
537 break;\
|
yading@10
|
538 case AV_CODEC_ID_RV40:\
|
yading@10
|
539 h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_plane_rv40);\
|
yading@10
|
540 break;\
|
yading@10
|
541 case AV_CODEC_ID_VP8:\
|
yading@10
|
542 h->pred16x16[PLANE_PRED8x8 ]= FUNCD(pred16x16_tm_vp8);\
|
yading@10
|
543 h->pred16x16[DC_127_PRED8x8]= FUNCC(pred16x16_127_dc , depth);\
|
yading@10
|
544 h->pred16x16[DC_129_PRED8x8]= FUNCC(pred16x16_129_dc , depth);\
|
yading@10
|
545 break;\
|
yading@10
|
546 default:\
|
yading@10
|
547 h->pred16x16[PLANE_PRED8x8 ]= FUNCC(pred16x16_plane , depth);\
|
yading@10
|
548 break;\
|
yading@10
|
549 }\
|
yading@10
|
550 h->pred16x16[LEFT_DC_PRED8x8]= FUNCC(pred16x16_left_dc , depth);\
|
yading@10
|
551 h->pred16x16[TOP_DC_PRED8x8 ]= FUNCC(pred16x16_top_dc , depth);\
|
yading@10
|
552 h->pred16x16[DC_128_PRED8x8 ]= FUNCC(pred16x16_128_dc , depth);\
|
yading@10
|
553 \
|
yading@10
|
554 /* special lossless h/v prediction for h264 */ \
|
yading@10
|
555 h->pred4x4_add [VERT_PRED ]= FUNCC(pred4x4_vertical_add , depth);\
|
yading@10
|
556 h->pred4x4_add [ HOR_PRED ]= FUNCC(pred4x4_horizontal_add , depth);\
|
yading@10
|
557 h->pred8x8l_add [VERT_PRED ]= FUNCC(pred8x8l_vertical_add , depth);\
|
yading@10
|
558 h->pred8x8l_add [ HOR_PRED ]= FUNCC(pred8x8l_horizontal_add , depth);\
|
yading@10
|
559 if (chroma_format_idc == 1) {\
|
yading@10
|
560 h->pred8x8_add [VERT_PRED8x8]= FUNCC(pred8x8_vertical_add , depth);\
|
yading@10
|
561 h->pred8x8_add [ HOR_PRED8x8]= FUNCC(pred8x8_horizontal_add , depth);\
|
yading@10
|
562 } else {\
|
yading@10
|
563 h->pred8x8_add [VERT_PRED8x8]= FUNCC(pred8x16_vertical_add , depth);\
|
yading@10
|
564 h->pred8x8_add [ HOR_PRED8x8]= FUNCC(pred8x16_horizontal_add , depth);\
|
yading@10
|
565 }\
|
yading@10
|
566 h->pred16x16_add[VERT_PRED8x8]= FUNCC(pred16x16_vertical_add , depth);\
|
yading@10
|
567 h->pred16x16_add[ HOR_PRED8x8]= FUNCC(pred16x16_horizontal_add , depth);\
|
yading@10
|
568
|
yading@10
|
569 if(!chroma_format_idc)
|
yading@10
|
570 chroma_format_idc = 1;
|
yading@10
|
571
|
yading@10
|
572 switch (bit_depth) {
|
yading@10
|
573 case 9:
|
yading@10
|
574 H264_PRED(9)
|
yading@10
|
575 break;
|
yading@10
|
576 case 10:
|
yading@10
|
577 H264_PRED(10)
|
yading@10
|
578 break;
|
yading@10
|
579 case 12:
|
yading@10
|
580 H264_PRED(12)
|
yading@10
|
581 break;
|
yading@10
|
582 case 14:
|
yading@10
|
583 H264_PRED(14)
|
yading@10
|
584 break;
|
yading@10
|
585 default:
|
yading@10
|
586 av_assert0(bit_depth<=8);
|
yading@10
|
587 H264_PRED(8)
|
yading@10
|
588 break;
|
yading@10
|
589 }
|
yading@10
|
590
|
yading@10
|
591 if (ARCH_ARM) ff_h264_pred_init_arm(h, codec_id, bit_depth, chroma_format_idc);
|
yading@10
|
592 if (ARCH_X86) ff_h264_pred_init_x86(h, codec_id, bit_depth, chroma_format_idc);
|
yading@10
|
593 }
|