annotate ffmpeg/libavcodec/cavs.c @ 13:844d341cf643 tip

Back up before ISMIR
author Yading Song <yading.song@eecs.qmul.ac.uk>
date Thu, 31 Oct 2013 13:17:06 +0000
parents 6840f77b83aa
children
rev   line source
yading@10 1 /*
yading@10 2 * Chinese AVS video (AVS1-P2, JiZhun profile) decoder.
yading@10 3 * Copyright (c) 2006 Stefan Gehrer <stefan.gehrer@gmx.de>
yading@10 4 *
yading@10 5 * This file is part of FFmpeg.
yading@10 6 *
yading@10 7 * FFmpeg is free software; you can redistribute it and/or
yading@10 8 * modify it under the terms of the GNU Lesser General Public
yading@10 9 * License as published by the Free Software Foundation; either
yading@10 10 * version 2.1 of the License, or (at your option) any later version.
yading@10 11 *
yading@10 12 * FFmpeg is distributed in the hope that it will be useful,
yading@10 13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
yading@10 14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
yading@10 15 * Lesser General Public License for more details.
yading@10 16 *
yading@10 17 * You should have received a copy of the GNU Lesser General Public
yading@10 18 * License along with FFmpeg; if not, write to the Free Software
yading@10 19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
yading@10 20 */
yading@10 21
yading@10 22 /**
yading@10 23 * @file
yading@10 24 * Chinese AVS video (AVS1-P2, JiZhun profile) decoder
yading@10 25 * @author Stefan Gehrer <stefan.gehrer@gmx.de>
yading@10 26 */
yading@10 27
yading@10 28 #include "avcodec.h"
yading@10 29 #include "get_bits.h"
yading@10 30 #include "golomb.h"
yading@10 31 #include "h264chroma.h"
yading@10 32 #include "mathops.h"
yading@10 33 #include "cavs.h"
yading@10 34
/* Deblocking threshold "alpha". SET_PARAMS looks it up with
 * av_clip(qp_avg + h->alpha_offset, 0, 63), hence the 64 entries. */
yading@10 35 static const uint8_t alpha_tab[64] = {
yading@10 36 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 2, 2, 2, 3, 3,
yading@10 37 4, 4, 5, 5, 6, 7, 8, 9, 10, 11, 12, 13, 15, 16, 18, 20,
yading@10 38 22, 24, 26, 28, 30, 33, 33, 35, 35, 36, 37, 37, 39, 39, 42, 44,
yading@10 39 46, 48, 50, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64
yading@10 40 };
yading@10 41
/* Deblocking threshold "beta". SET_PARAMS looks it up with
 * av_clip(qp_avg + h->beta_offset, 0, 63), hence the 64 entries. */
yading@10 42 static const uint8_t beta_tab[64] = {
yading@10 43 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2,
yading@10 44 2, 2, 3, 3, 3, 3, 4, 4, 4, 4, 5, 5, 5, 5, 6, 6,
yading@10 45 6, 7, 7, 7, 8, 8, 8, 9, 9, 10, 10, 11, 11, 12, 13, 14,
yading@10 46 15, 16, 17, 18, 19, 20, 21, 22, 23, 23, 24, 24, 25, 25, 26, 27
yading@10 47 };
yading@10 48
/* Deblocking parameter "tc". SET_PARAMS looks it up with the same index as
 * alpha_tab, i.e. av_clip(qp_avg + h->alpha_offset, 0, 63). */
yading@10 49 static const uint8_t tc_tab[64] = {
yading@10 50 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
yading@10 51 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2,
yading@10 52 2, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3, 4, 4, 4,
yading@10 53 5, 5, 5, 6, 6, 6, 7, 7, 7, 7, 8, 8, 8, 9, 9, 9
yading@10 54 };
yading@10 55
yading@10 56 /** mark block as unavailable, i.e. out of picture
yading@10 57 or not yet decoded */
/* Copied into h->mv[] slots whose neighbour is missing (see ff_cavs_init_mb,
 * ff_cavs_next_mb, ff_cavs_init_pic) and used as the forced predictor for
 * P-skip in ff_cavs_mv.
 * NOTE(review): initializer order is presumably { x, y, dist, ref } -- confirm
 * against the cavs_vector declaration in cavs.h. */
yading@10 58 static const cavs_vector un_mv = { 0, 0, 1, NOT_AVAIL };
yading@10 59
/* Intra prediction mode remapping tables, indexed by the decoded mode and
 * applied through modify_pred() by ff_cavs_modify_mb_i():
 *   left_modifier_* when the left neighbour (A_AVAIL) is missing,
 *   top_modifier_*  when the top neighbour  (B_AVAIL) is missing,
 *   *_l for the luma modes, *_c for the chroma mode.
 * A -1 entry makes modify_pred() log "Illegal intra prediction mode" and
 * fall back to mode 0. */
yading@10 60 static const int8_t left_modifier_l[8] = { 0, -1, 6, -1, -1, 7, 6, 7 };
yading@10 61 static const int8_t top_modifier_l[8] = { -1, 1, 5, -1, -1, 5, 7, 7 };
yading@10 62 static const int8_t left_modifier_c[7] = { 5, -1, 2, -1, 6, 5, 6 };
yading@10 63 static const int8_t top_modifier_c[7] = { 4, 1, -1, -1, 4, 6, 6 };
yading@10 64
yading@10 65 /*****************************************************************************
yading@10 66 *
yading@10 67 * in-loop deblocking filter
yading@10 68 *
yading@10 69 ****************************************************************************/
yading@10 70
yading@10 71 static inline int get_bs(cavs_vector *mvP, cavs_vector *mvQ, int b)
yading@10 72 {
yading@10 73 if ((mvP->ref == REF_INTRA) || (mvQ->ref == REF_INTRA))
yading@10 74 return 2;
yading@10 75 if ((abs(mvP->x - mvQ->x) >= 4) || (abs(mvP->y - mvQ->y) >= 4))
yading@10 76 return 1;
yading@10 77 if (b) {
yading@10 78 mvP += MV_BWD_OFFS;
yading@10 79 mvQ += MV_BWD_OFFS;
yading@10 80 if ((abs(mvP->x - mvQ->x) >= 4) || (abs(mvP->y - mvQ->y) >= 4))
yading@10 81 return 1;
yading@10 82 } else {
yading@10 83 if (mvP->ref != mvQ->ref)
yading@10 84 return 1;
yading@10 85 }
yading@10 86 return 0;
yading@10 87 }
yading@10 88
/* Loads the filter parameters for the current edge. Expands to three plain
 * statements and relies on the locals qp_avg, alpha, beta, tc and the context
 * pointer h being in scope at the point of use (ff_cavs_filter). */
yading@10 89 #define SET_PARAMS \
yading@10 90 alpha = alpha_tab[av_clip(qp_avg + h->alpha_offset, 0, 63)]; \
yading@10 91 beta = beta_tab[av_clip(qp_avg + h->beta_offset, 0, 63)]; \
yading@10 92 tc = tc_tab[av_clip(qp_avg + h->alpha_offset, 0, 63)];
yading@10 93
yading@10 94 /**
yading@10 95 * in-loop deblocking filter for a single macroblock
yading@10 96 *
yading@10 97 * boundary strength (bs) mapping:
yading@10 98 *
yading@10 99 * --4---5--
yading@10 100 * 0 2 |
yading@10 101 * | 6 | 7 |
yading@10 102 * 1 3 |
yading@10 103 * ---------
yading@10 104 *
yading@10 105 */
yading@10 106 void ff_cavs_filter(AVSContext *h, enum cavs_mb mb_type)
yading@10 107 {
yading@10 108 uint8_t bs[8];
yading@10 109 int qp_avg, alpha, beta, tc;
yading@10 110 int i;
yading@10 111
yading@10 112 /* save un-deblocked lines */
yading@10 113 h->topleft_border_y = h->top_border_y[h->mbx * 16 + 15];
yading@10 114 h->topleft_border_u = h->top_border_u[h->mbx * 10 + 8];
yading@10 115 h->topleft_border_v = h->top_border_v[h->mbx * 10 + 8];
yading@10 116 memcpy(&h->top_border_y[h->mbx * 16], h->cy + 15 * h->l_stride, 16);
yading@10 117 memcpy(&h->top_border_u[h->mbx * 10 + 1], h->cu + 7 * h->c_stride, 8);
yading@10 118 memcpy(&h->top_border_v[h->mbx * 10 + 1], h->cv + 7 * h->c_stride, 8);
yading@10 119 for (i = 0; i < 8; i++) {
yading@10 120 h->left_border_y[i * 2 + 1] = *(h->cy + 15 + (i * 2 + 0) * h->l_stride);
yading@10 121 h->left_border_y[i * 2 + 2] = *(h->cy + 15 + (i * 2 + 1) * h->l_stride);
yading@10 122 h->left_border_u[i + 1] = *(h->cu + 7 + i * h->c_stride);
yading@10 123 h->left_border_v[i + 1] = *(h->cv + 7 + i * h->c_stride);
yading@10 124 }
yading@10 125 if (!h->loop_filter_disable) {
yading@10 126 /* determine bs */
yading@10 127 if (mb_type == I_8X8)
yading@10 128 memset(bs, 2, 8);
yading@10 129 else{
yading@10 130 memset(bs, 0, 8);
yading@10 131 if (ff_cavs_partition_flags[mb_type] & SPLITV) {
yading@10 132 bs[2] = get_bs(&h->mv[MV_FWD_X0], &h->mv[MV_FWD_X1], mb_type > P_8X8);
yading@10 133 bs[3] = get_bs(&h->mv[MV_FWD_X2], &h->mv[MV_FWD_X3], mb_type > P_8X8);
yading@10 134 }
yading@10 135 if (ff_cavs_partition_flags[mb_type] & SPLITH) {
yading@10 136 bs[6] = get_bs(&h->mv[MV_FWD_X0], &h->mv[MV_FWD_X2], mb_type > P_8X8);
yading@10 137 bs[7] = get_bs(&h->mv[MV_FWD_X1], &h->mv[MV_FWD_X3], mb_type > P_8X8);
yading@10 138 }
yading@10 139 bs[0] = get_bs(&h->mv[MV_FWD_A1], &h->mv[MV_FWD_X0], mb_type > P_8X8);
yading@10 140 bs[1] = get_bs(&h->mv[MV_FWD_A3], &h->mv[MV_FWD_X2], mb_type > P_8X8);
yading@10 141 bs[4] = get_bs(&h->mv[MV_FWD_B2], &h->mv[MV_FWD_X0], mb_type > P_8X8);
yading@10 142 bs[5] = get_bs(&h->mv[MV_FWD_B3], &h->mv[MV_FWD_X1], mb_type > P_8X8);
yading@10 143 }
yading@10 144 if (AV_RN64(bs)) {
yading@10 145 if (h->flags & A_AVAIL) {
yading@10 146 qp_avg = (h->qp + h->left_qp + 1) >> 1;
yading@10 147 SET_PARAMS;
yading@10 148 h->cdsp.cavs_filter_lv(h->cy, h->l_stride, alpha, beta, tc, bs[0], bs[1]);
yading@10 149 h->cdsp.cavs_filter_cv(h->cu, h->c_stride, alpha, beta, tc, bs[0], bs[1]);
yading@10 150 h->cdsp.cavs_filter_cv(h->cv, h->c_stride, alpha, beta, tc, bs[0], bs[1]);
yading@10 151 }
yading@10 152 qp_avg = h->qp;
yading@10 153 SET_PARAMS;
yading@10 154 h->cdsp.cavs_filter_lv(h->cy + 8, h->l_stride, alpha, beta, tc, bs[2], bs[3]);
yading@10 155 h->cdsp.cavs_filter_lh(h->cy + 8 * h->l_stride, h->l_stride, alpha, beta, tc, bs[6], bs[7]);
yading@10 156
yading@10 157 if (h->flags & B_AVAIL) {
yading@10 158 qp_avg = (h->qp + h->top_qp[h->mbx] + 1) >> 1;
yading@10 159 SET_PARAMS;
yading@10 160 h->cdsp.cavs_filter_lh(h->cy, h->l_stride, alpha, beta, tc, bs[4], bs[5]);
yading@10 161 h->cdsp.cavs_filter_ch(h->cu, h->c_stride, alpha, beta, tc, bs[4], bs[5]);
yading@10 162 h->cdsp.cavs_filter_ch(h->cv, h->c_stride, alpha, beta, tc, bs[4], bs[5]);
yading@10 163 }
yading@10 164 }
yading@10 165 }
yading@10 166 h->left_qp = h->qp;
yading@10 167 h->top_qp[h->mbx] = h->qp;
yading@10 168 }
yading@10 169
yading@10 170 #undef SET_PARAMS
yading@10 171
yading@10 172 /*****************************************************************************
yading@10 173 *
yading@10 174 * spatial intra prediction
yading@10 175 *
yading@10 176 ****************************************************************************/
yading@10 177
yading@10 178 void ff_cavs_load_intra_pred_luma(AVSContext *h, uint8_t *top,
yading@10 179 uint8_t **left, int block)
yading@10 180 {
yading@10 181 int i;
yading@10 182
yading@10 183 switch (block) {
yading@10 184 case 0:
yading@10 185 *left = h->left_border_y;
yading@10 186 h->left_border_y[0] = h->left_border_y[1];
yading@10 187 memset(&h->left_border_y[17], h->left_border_y[16], 9);
yading@10 188 memcpy(&top[1], &h->top_border_y[h->mbx * 16], 16);
yading@10 189 top[17] = top[16];
yading@10 190 top[0] = top[1];
yading@10 191 if ((h->flags & A_AVAIL) && (h->flags & B_AVAIL))
yading@10 192 h->left_border_y[0] = top[0] = h->topleft_border_y;
yading@10 193 break;
yading@10 194 case 1:
yading@10 195 *left = h->intern_border_y;
yading@10 196 for (i = 0; i < 8; i++)
yading@10 197 h->intern_border_y[i + 1] = *(h->cy + 7 + i * h->l_stride);
yading@10 198 memset(&h->intern_border_y[9], h->intern_border_y[8], 9);
yading@10 199 h->intern_border_y[0] = h->intern_border_y[1];
yading@10 200 memcpy(&top[1], &h->top_border_y[h->mbx * 16 + 8], 8);
yading@10 201 if (h->flags & C_AVAIL)
yading@10 202 memcpy(&top[9], &h->top_border_y[(h->mbx + 1) * 16], 8);
yading@10 203 else
yading@10 204 memset(&top[9], top[8], 9);
yading@10 205 top[17] = top[16];
yading@10 206 top[0] = top[1];
yading@10 207 if (h->flags & B_AVAIL)
yading@10 208 h->intern_border_y[0] = top[0] = h->top_border_y[h->mbx * 16 + 7];
yading@10 209 break;
yading@10 210 case 2:
yading@10 211 *left = &h->left_border_y[8];
yading@10 212 memcpy(&top[1], h->cy + 7 * h->l_stride, 16);
yading@10 213 top[17] = top[16];
yading@10 214 top[0] = top[1];
yading@10 215 if (h->flags & A_AVAIL)
yading@10 216 top[0] = h->left_border_y[8];
yading@10 217 break;
yading@10 218 case 3:
yading@10 219 *left = &h->intern_border_y[8];
yading@10 220 for (i = 0; i < 8; i++)
yading@10 221 h->intern_border_y[i + 9] = *(h->cy + 7 + (i + 8) * h->l_stride);
yading@10 222 memset(&h->intern_border_y[17], h->intern_border_y[16], 9);
yading@10 223 memcpy(&top[0], h->cy + 7 + 7 * h->l_stride, 9);
yading@10 224 memset(&top[9], top[8], 9);
yading@10 225 break;
yading@10 226 }
yading@10 227 }
yading@10 228
yading@10 229 void ff_cavs_load_intra_pred_chroma(AVSContext *h)
yading@10 230 {
yading@10 231 /* extend borders by one pixel */
yading@10 232 h->left_border_u[9] = h->left_border_u[8];
yading@10 233 h->left_border_v[9] = h->left_border_v[8];
yading@10 234 h->top_border_u[h->mbx * 10 + 9] = h->top_border_u[h->mbx * 10 + 8];
yading@10 235 h->top_border_v[h->mbx * 10 + 9] = h->top_border_v[h->mbx * 10 + 8];
yading@10 236 if (h->mbx && h->mby) {
yading@10 237 h->top_border_u[h->mbx * 10] = h->left_border_u[0] = h->topleft_border_u;
yading@10 238 h->top_border_v[h->mbx * 10] = h->left_border_v[0] = h->topleft_border_v;
yading@10 239 } else {
yading@10 240 h->left_border_u[0] = h->left_border_u[1];
yading@10 241 h->left_border_v[0] = h->left_border_v[1];
yading@10 242 h->top_border_u[h->mbx * 10] = h->top_border_u[h->mbx * 10 + 1];
yading@10 243 h->top_border_v[h->mbx * 10] = h->top_border_v[h->mbx * 10 + 1];
yading@10 244 }
yading@10 245 }
yading@10 246
/**
 * Vertical 8x8 intra prediction: every row of the block is a copy of the
 * eight samples top[1..8].
 *
 * Rows are written with memcpy() rather than through a uint64_t pointer cast,
 * so the store neither violates the aliasing rules nor requires d to be
 * 8-byte aligned.
 *
 * @param d      destination block (8 rows of 8 bytes)
 * @param top    samples above the block; top[1..8] are read
 * @param left   unused
 * @param stride distance in bytes between destination rows
 */
static void intra_pred_vert(uint8_t *d, uint8_t *top, uint8_t *left, int stride)
{
    uint8_t row[8];
    int y;

    (void)left;

    /* read the source row once, exactly like the original single load */
    memcpy(row, top + 1, sizeof(row));
    for (y = 0; y < 8; y++)
        memcpy(d + y * stride, row, sizeof(row));
}
yading@10 255
/**
 * Horizontal 8x8 intra prediction: row y of the block is filled with the
 * sample left[y + 1].
 *
 * memset() replaces the former store through a uint64_t pointer cast, which
 * violated the aliasing rules and assumed an 8-byte aligned destination.
 *
 * @param d      destination block (8 rows of 8 bytes)
 * @param top    unused
 * @param left   samples left of the block; left[1..8] are read
 * @param stride distance in bytes between destination rows
 */
static void intra_pred_horiz(uint8_t *d, uint8_t *top, uint8_t *left, int stride)
{
    int y;

    (void)top;

    for (y = 0; y < 8; y++)
        memset(d + y * stride, left[y + 1], 8);
}
yading@10 265
/**
 * DC 8x8 intra prediction without neighbours: the whole block is set to the
 * mid-grey value 128.
 *
 * memset() replaces the former store through a uint64_t pointer cast, which
 * violated the aliasing rules and assumed an 8-byte aligned destination.
 *
 * @param d      destination block (8 rows of 8 bytes)
 * @param top    unused
 * @param left   unused
 * @param stride distance in bytes between destination rows
 */
static void intra_pred_dc_128(uint8_t *d, uint8_t *top, uint8_t *left, int stride)
{
    int y;

    (void)top;
    (void)left;

    for (y = 0; y < 8; y++)
        memset(d + y * stride, 0x80, 8);
}
yading@10 273
yading@10 274 static void intra_pred_plane(uint8_t *d,uint8_t *top,uint8_t *left,int stride)
yading@10 275 {
yading@10 276 int x, y, ia;
yading@10 277 int ih = 0;
yading@10 278 int iv = 0;
yading@10 279 const uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;
yading@10 280
yading@10 281 for (x = 0; x < 4; x++) {
yading@10 282 ih += (x + 1) * (top [5 + x] - top [3 - x]);
yading@10 283 iv += (x + 1) * (left[5 + x] - left[3 - x]);
yading@10 284 }
yading@10 285 ia = (top[8] + left[8]) << 4;
yading@10 286 ih = (17 * ih + 16) >> 5;
yading@10 287 iv = (17 * iv + 16) >> 5;
yading@10 288 for (y = 0; y < 8; y++)
yading@10 289 for (x = 0; x < 8; x++)
yading@10 290 d[y * stride + x] = cm[(ia + (x - 3) * ih + (y - 3) * iv + 16) >> 5];
yading@10 291 }
yading@10 292
/* Rounded 3-tap (1, 2, 1) / 4 filter centred on ARRAY[INDEX]; reads the
 * elements INDEX - 1, INDEX and INDEX + 1. */
yading@10 293 #define LOWPASS(ARRAY,INDEX) \
yading@10 294 ((ARRAY[(INDEX) - 1] + 2 * ARRAY[(INDEX)] + ARRAY[(INDEX) + 1] + 2) >> 2)
yading@10 295
/**
 * Low-pass 8x8 intra prediction: each sample is the average of the filtered
 * top neighbour of its column and the filtered left neighbour of its row.
 */
static void intra_pred_lp(uint8_t *d, uint8_t *top, uint8_t *left, int stride)
{
    int row, col;

    for (row = 0; row < 8; row++) {
        uint8_t *out = d + row * stride;

        for (col = 0; col < 8; col++)
            out[col] = (LOWPASS(top, col + 1) + LOWPASS(left, row + 1)) >> 1;
    }
}
yading@10 303
/**
 * Down-left 8x8 intra prediction: the sample at (col, row) averages the
 * filtered top and left neighbours at index col + row + 2.
 */
static void intra_pred_down_left(uint8_t *d, uint8_t *top, uint8_t *left, int stride)
{
    int row, col;

    for (row = 0; row < 8; row++) {
        uint8_t *out = d + row * stride;

        for (col = 0; col < 8; col++) {
            const int pos = col + row + 2;

            out[col] = (LOWPASS(top, pos) + LOWPASS(left, pos)) >> 1;
        }
    }
}
yading@10 311
/**
 * Down-right 8x8 intra prediction: samples on the main diagonal use the
 * corner filter, samples above it the filtered top neighbours and samples
 * below it the filtered left neighbours.
 */
static void intra_pred_down_right(uint8_t *d, uint8_t *top, uint8_t *left, int stride)
{
    int row, col;

    for (row = 0; row < 8; row++) {
        uint8_t *out = d + row * stride;

        for (col = 0; col < 8; col++) {
            const int dist = col - row;   /* signed distance to the diagonal */

            if (dist > 0)
                out[col] = LOWPASS(top, dist);
            else if (dist < 0)
                out[col] = LOWPASS(left, -dist);
            else
                out[col] = (left[1] + 2 * top[0] + top[1] + 2) >> 2;
        }
    }
}
yading@10 324
/**
 * Left-only low-pass 8x8 intra prediction: every sample of a row takes the
 * filtered left neighbour of that row.
 */
static void intra_pred_lp_left(uint8_t *d, uint8_t *top, uint8_t *left, int stride)
{
    int row, col;

    for (row = 0; row < 8; row++) {
        uint8_t *out = d + row * stride;

        for (col = 0; col < 8; col++)
            out[col] = LOWPASS(left, row + 1);
    }
}
yading@10 332
/**
 * Top-only low-pass 8x8 intra prediction: every sample of a column takes the
 * filtered top neighbour of that column.
 */
static void intra_pred_lp_top(uint8_t *d, uint8_t *top, uint8_t *left, int stride)
{
    int row, col;

    for (row = 0; row < 8; row++) {
        uint8_t *out = d + row * stride;

        for (col = 0; col < 8; col++)
            out[col] = LOWPASS(top, col + 1);
    }
}
yading@10 340
yading@10 341 #undef LOWPASS
yading@10 342
yading@10 343 static inline void modify_pred(const int8_t *mod_table, int *mode)
yading@10 344 {
yading@10 345 *mode = mod_table[*mode];
yading@10 346 if (*mode < 0) {
yading@10 347 av_log(NULL, AV_LOG_ERROR, "Illegal intra prediction mode\n");
yading@10 348 *mode = 0;
yading@10 349 }
yading@10 350 }
yading@10 351
yading@10 352 void ff_cavs_modify_mb_i(AVSContext *h, int *pred_mode_uv)
yading@10 353 {
yading@10 354 /* save pred modes before they get modified */
yading@10 355 h->pred_mode_Y[3] = h->pred_mode_Y[5];
yading@10 356 h->pred_mode_Y[6] = h->pred_mode_Y[8];
yading@10 357 h->top_pred_Y[h->mbx * 2 + 0] = h->pred_mode_Y[7];
yading@10 358 h->top_pred_Y[h->mbx * 2 + 1] = h->pred_mode_Y[8];
yading@10 359
yading@10 360 /* modify pred modes according to availability of neighbour samples */
yading@10 361 if (!(h->flags & A_AVAIL)) {
yading@10 362 modify_pred(left_modifier_l, &h->pred_mode_Y[4]);
yading@10 363 modify_pred(left_modifier_l, &h->pred_mode_Y[7]);
yading@10 364 modify_pred(left_modifier_c, pred_mode_uv);
yading@10 365 }
yading@10 366 if (!(h->flags & B_AVAIL)) {
yading@10 367 modify_pred(top_modifier_l, &h->pred_mode_Y[4]);
yading@10 368 modify_pred(top_modifier_l, &h->pred_mode_Y[5]);
yading@10 369 modify_pred(top_modifier_c, pred_mode_uv);
yading@10 370 }
yading@10 371 }
yading@10 372
yading@10 373 /*****************************************************************************
yading@10 374 *
yading@10 375 * motion compensation
yading@10 376 *
yading@10 377 ****************************************************************************/
yading@10 378
yading@10 379 static inline void mc_dir_part(AVSContext *h, AVFrame *pic,
yading@10 380 int chroma_height,int delta,int list,uint8_t *dest_y,
yading@10 381 uint8_t *dest_cb,uint8_t *dest_cr,int src_x_offset,
yading@10 382 int src_y_offset,qpel_mc_func *qpix_op,
yading@10 383 h264_chroma_mc_func chroma_op,cavs_vector *mv)
yading@10 384 {
yading@10 385 const int mx= mv->x + src_x_offset*8;
yading@10 386 const int my= mv->y + src_y_offset*8;
yading@10 387 const int luma_xy= (mx&3) + ((my&3)<<2);
yading@10 388 uint8_t * src_y = pic->data[0] + (mx >> 2) + (my >> 2) * h->l_stride;
yading@10 389 uint8_t * src_cb = pic->data[1] + (mx >> 3) + (my >> 3) * h->c_stride;
yading@10 390 uint8_t * src_cr = pic->data[2] + (mx >> 3) + (my >> 3) * h->c_stride;
yading@10 391 int extra_width = 0;
yading@10 392 int extra_height= extra_width;
yading@10 393 int emu=0;
yading@10 394 const int full_mx= mx>>2;
yading@10 395 const int full_my= my>>2;
yading@10 396 const int pic_width = 16*h->mb_width;
yading@10 397 const int pic_height = 16*h->mb_height;
yading@10 398
yading@10 399 if (!pic->data[0])
yading@10 400 return;
yading@10 401 if(mx&7) extra_width -= 3;
yading@10 402 if(my&7) extra_height -= 3;
yading@10 403
yading@10 404 if( full_mx < 0-extra_width
yading@10 405 || full_my < 0-extra_height
yading@10 406 || full_mx + 16/*FIXME*/ > pic_width + extra_width
yading@10 407 || full_my + 16/*FIXME*/ > pic_height + extra_height){
yading@10 408 h->vdsp.emulated_edge_mc(h->edge_emu_buffer, src_y - 2 - 2*h->l_stride, h->l_stride,
yading@10 409 16+5, 16+5/*FIXME*/, full_mx-2, full_my-2, pic_width, pic_height);
yading@10 410 src_y= h->edge_emu_buffer + 2 + 2*h->l_stride;
yading@10 411 emu=1;
yading@10 412 }
yading@10 413
yading@10 414 qpix_op[luma_xy](dest_y, src_y, h->l_stride); //FIXME try variable height perhaps?
yading@10 415
yading@10 416 if(emu){
yading@10 417 h->vdsp.emulated_edge_mc(h->edge_emu_buffer, src_cb, h->c_stride,
yading@10 418 9, 9/*FIXME*/, (mx>>3), (my>>3), pic_width>>1, pic_height>>1);
yading@10 419 src_cb= h->edge_emu_buffer;
yading@10 420 }
yading@10 421 chroma_op(dest_cb, src_cb, h->c_stride, chroma_height, mx&7, my&7);
yading@10 422
yading@10 423 if(emu){
yading@10 424 h->vdsp.emulated_edge_mc(h->edge_emu_buffer, src_cr, h->c_stride,
yading@10 425 9, 9/*FIXME*/, (mx>>3), (my>>3), pic_width>>1, pic_height>>1);
yading@10 426 src_cr= h->edge_emu_buffer;
yading@10 427 }
yading@10 428 chroma_op(dest_cr, src_cr, h->c_stride, chroma_height, mx&7, my&7);
yading@10 429 }
yading@10 430
yading@10 431 static inline void mc_part_std(AVSContext *h,int chroma_height,int delta,
yading@10 432 uint8_t *dest_y,uint8_t *dest_cb,uint8_t *dest_cr,
yading@10 433 int x_offset, int y_offset,qpel_mc_func *qpix_put,
yading@10 434 h264_chroma_mc_func chroma_put,qpel_mc_func *qpix_avg,
yading@10 435 h264_chroma_mc_func chroma_avg, cavs_vector *mv)
yading@10 436 {
yading@10 437 qpel_mc_func *qpix_op= qpix_put;
yading@10 438 h264_chroma_mc_func chroma_op= chroma_put;
yading@10 439
yading@10 440 dest_y += 2*x_offset + 2*y_offset*h->l_stride;
yading@10 441 dest_cb += x_offset + y_offset*h->c_stride;
yading@10 442 dest_cr += x_offset + y_offset*h->c_stride;
yading@10 443 x_offset += 8*h->mbx;
yading@10 444 y_offset += 8*h->mby;
yading@10 445
yading@10 446 if(mv->ref >= 0){
yading@10 447 AVFrame *ref = h->DPB[mv->ref].f;
yading@10 448 mc_dir_part(h, ref, chroma_height, delta, 0,
yading@10 449 dest_y, dest_cb, dest_cr, x_offset, y_offset,
yading@10 450 qpix_op, chroma_op, mv);
yading@10 451
yading@10 452 qpix_op= qpix_avg;
yading@10 453 chroma_op= chroma_avg;
yading@10 454 }
yading@10 455
yading@10 456 if((mv+MV_BWD_OFFS)->ref >= 0){
yading@10 457 AVFrame *ref = h->DPB[0].f;
yading@10 458 mc_dir_part(h, ref, chroma_height, delta, 1,
yading@10 459 dest_y, dest_cb, dest_cr, x_offset, y_offset,
yading@10 460 qpix_op, chroma_op, mv+MV_BWD_OFFS);
yading@10 461 }
yading@10 462 }
yading@10 463
yading@10 464 void ff_cavs_inter(AVSContext *h, enum cavs_mb mb_type) {
yading@10 465 if(ff_cavs_partition_flags[mb_type] == 0){ // 16x16
yading@10 466 mc_part_std(h, 8, 0, h->cy, h->cu, h->cv, 0, 0,
yading@10 467 h->cdsp.put_cavs_qpel_pixels_tab[0],
yading@10 468 h->h264chroma.put_h264_chroma_pixels_tab[0],
yading@10 469 h->cdsp.avg_cavs_qpel_pixels_tab[0],
yading@10 470 h->h264chroma.avg_h264_chroma_pixels_tab[0],
yading@10 471 &h->mv[MV_FWD_X0]);
yading@10 472 }else{
yading@10 473 mc_part_std(h, 4, 0, h->cy, h->cu, h->cv, 0, 0,
yading@10 474 h->cdsp.put_cavs_qpel_pixels_tab[1],
yading@10 475 h->h264chroma.put_h264_chroma_pixels_tab[1],
yading@10 476 h->cdsp.avg_cavs_qpel_pixels_tab[1],
yading@10 477 h->h264chroma.avg_h264_chroma_pixels_tab[1],
yading@10 478 &h->mv[MV_FWD_X0]);
yading@10 479 mc_part_std(h, 4, 0, h->cy, h->cu, h->cv, 4, 0,
yading@10 480 h->cdsp.put_cavs_qpel_pixels_tab[1],
yading@10 481 h->h264chroma.put_h264_chroma_pixels_tab[1],
yading@10 482 h->cdsp.avg_cavs_qpel_pixels_tab[1],
yading@10 483 h->h264chroma.avg_h264_chroma_pixels_tab[1],
yading@10 484 &h->mv[MV_FWD_X1]);
yading@10 485 mc_part_std(h, 4, 0, h->cy, h->cu, h->cv, 0, 4,
yading@10 486 h->cdsp.put_cavs_qpel_pixels_tab[1],
yading@10 487 h->h264chroma.put_h264_chroma_pixels_tab[1],
yading@10 488 h->cdsp.avg_cavs_qpel_pixels_tab[1],
yading@10 489 h->h264chroma.avg_h264_chroma_pixels_tab[1],
yading@10 490 &h->mv[MV_FWD_X2]);
yading@10 491 mc_part_std(h, 4, 0, h->cy, h->cu, h->cv, 4, 4,
yading@10 492 h->cdsp.put_cavs_qpel_pixels_tab[1],
yading@10 493 h->h264chroma.put_h264_chroma_pixels_tab[1],
yading@10 494 h->cdsp.avg_cavs_qpel_pixels_tab[1],
yading@10 495 h->h264chroma.avg_h264_chroma_pixels_tab[1],
yading@10 496 &h->mv[MV_FWD_X3]);
yading@10 497 }
yading@10 498 }
yading@10 499
yading@10 500 /*****************************************************************************
yading@10 501 *
yading@10 502 * motion vector prediction
yading@10 503 *
yading@10 504 ****************************************************************************/
yading@10 505
yading@10 506 static inline void scale_mv(AVSContext *h, int *d_x, int *d_y, cavs_vector *src, int distp) {
yading@10 507 int den = h->scale_den[src->ref];
yading@10 508
yading@10 509 *d_x = (src->x*distp*den + 256 + (src->x>>31)) >> 9;
yading@10 510 *d_y = (src->y*distp*den + 256 + (src->y>>31)) >> 9;
yading@10 511 }
yading@10 512
yading@10 513 static inline void mv_pred_median(AVSContext *h, cavs_vector *mvP,
yading@10 514 cavs_vector *mvA, cavs_vector *mvB, cavs_vector *mvC) {
yading@10 515 int ax, ay, bx, by, cx, cy;
yading@10 516 int len_ab, len_bc, len_ca, len_mid;
yading@10 517
yading@10 518 /* scale candidates according to their temporal span */
yading@10 519 scale_mv(h, &ax, &ay, mvA, mvP->dist);
yading@10 520 scale_mv(h, &bx, &by, mvB, mvP->dist);
yading@10 521 scale_mv(h, &cx, &cy, mvC, mvP->dist);
yading@10 522 /* find the geometrical median of the three candidates */
yading@10 523 len_ab = abs(ax - bx) + abs(ay - by);
yading@10 524 len_bc = abs(bx - cx) + abs(by - cy);
yading@10 525 len_ca = abs(cx - ax) + abs(cy - ay);
yading@10 526 len_mid = mid_pred(len_ab, len_bc, len_ca);
yading@10 527 if(len_mid == len_ab) {
yading@10 528 mvP->x = cx;
yading@10 529 mvP->y = cy;
yading@10 530 } else if(len_mid == len_bc) {
yading@10 531 mvP->x = ax;
yading@10 532 mvP->y = ay;
yading@10 533 } else {
yading@10 534 mvP->x = bx;
yading@10 535 mvP->y = by;
yading@10 536 }
yading@10 537 }
yading@10 538
yading@10 539 void ff_cavs_mv(AVSContext *h, enum cavs_mv_loc nP, enum cavs_mv_loc nC,
yading@10 540 enum cavs_mv_pred mode, enum cavs_block size, int ref) {
yading@10 541 cavs_vector *mvP = &h->mv[nP];
yading@10 542 cavs_vector *mvA = &h->mv[nP-1];
yading@10 543 cavs_vector *mvB = &h->mv[nP-4];
yading@10 544 cavs_vector *mvC = &h->mv[nC];
yading@10 545 const cavs_vector *mvP2 = NULL;
yading@10 546
yading@10 547 mvP->ref = ref;
yading@10 548 mvP->dist = h->dist[mvP->ref];
yading@10 549 if(mvC->ref == NOT_AVAIL)
yading@10 550 mvC = &h->mv[nP-5]; // set to top-left (mvD)
yading@10 551 if((mode == MV_PRED_PSKIP) &&
yading@10 552 ((mvA->ref == NOT_AVAIL) || (mvB->ref == NOT_AVAIL) ||
yading@10 553 ((mvA->x | mvA->y | mvA->ref) == 0) ||
yading@10 554 ((mvB->x | mvB->y | mvB->ref) == 0) )) {
yading@10 555 mvP2 = &un_mv;
yading@10 556 /* if there is only one suitable candidate, take it */
yading@10 557 } else if((mvA->ref >= 0) && (mvB->ref < 0) && (mvC->ref < 0)) {
yading@10 558 mvP2= mvA;
yading@10 559 } else if((mvA->ref < 0) && (mvB->ref >= 0) && (mvC->ref < 0)) {
yading@10 560 mvP2= mvB;
yading@10 561 } else if((mvA->ref < 0) && (mvB->ref < 0) && (mvC->ref >= 0)) {
yading@10 562 mvP2= mvC;
yading@10 563 } else if(mode == MV_PRED_LEFT && mvA->ref == ref){
yading@10 564 mvP2= mvA;
yading@10 565 } else if(mode == MV_PRED_TOP && mvB->ref == ref){
yading@10 566 mvP2= mvB;
yading@10 567 } else if(mode == MV_PRED_TOPRIGHT && mvC->ref == ref){
yading@10 568 mvP2= mvC;
yading@10 569 }
yading@10 570 if(mvP2){
yading@10 571 mvP->x = mvP2->x;
yading@10 572 mvP->y = mvP2->y;
yading@10 573 }else
yading@10 574 mv_pred_median(h, mvP, mvA, mvB, mvC);
yading@10 575
yading@10 576 if(mode < MV_PRED_PSKIP) {
yading@10 577 mvP->x += get_se_golomb(&h->gb);
yading@10 578 mvP->y += get_se_golomb(&h->gb);
yading@10 579 }
yading@10 580 set_mvs(mvP,size);
yading@10 581 }
yading@10 582
yading@10 583 /*****************************************************************************
yading@10 584 *
yading@10 585 * macroblock level
yading@10 586 *
yading@10 587 ****************************************************************************/
yading@10 588
yading@10 589 /**
yading@10 590 * initialise predictors for motion vectors and intra prediction
yading@10 591 */
yading@10 592 void ff_cavs_init_mb(AVSContext *h) {
yading@10 593 int i;
yading@10 594
yading@10 595 /* copy predictors from top line (MB B and C) into cache */
yading@10 596 for(i=0;i<3;i++) {
yading@10 597 h->mv[MV_FWD_B2+i] = h->top_mv[0][h->mbx*2+i];
yading@10 598 h->mv[MV_BWD_B2+i] = h->top_mv[1][h->mbx*2+i];
yading@10 599 }
yading@10 600 h->pred_mode_Y[1] = h->top_pred_Y[h->mbx*2+0];
yading@10 601 h->pred_mode_Y[2] = h->top_pred_Y[h->mbx*2+1];
yading@10 602 /* clear top predictors if MB B is not available */
yading@10 603 if(!(h->flags & B_AVAIL)) {
yading@10 604 h->mv[MV_FWD_B2] = un_mv;
yading@10 605 h->mv[MV_FWD_B3] = un_mv;
yading@10 606 h->mv[MV_BWD_B2] = un_mv;
yading@10 607 h->mv[MV_BWD_B3] = un_mv;
yading@10 608 h->pred_mode_Y[1] = h->pred_mode_Y[2] = NOT_AVAIL;
yading@10 609 h->flags &= ~(C_AVAIL|D_AVAIL);
yading@10 610 } else if(h->mbx) {
yading@10 611 h->flags |= D_AVAIL;
yading@10 612 }
yading@10 613 if(h->mbx == h->mb_width-1) //MB C not available
yading@10 614 h->flags &= ~C_AVAIL;
yading@10 615 /* clear top-right predictors if MB C is not available */
yading@10 616 if(!(h->flags & C_AVAIL)) {
yading@10 617 h->mv[MV_FWD_C2] = un_mv;
yading@10 618 h->mv[MV_BWD_C2] = un_mv;
yading@10 619 }
yading@10 620 /* clear top-left predictors if MB D is not available */
yading@10 621 if(!(h->flags & D_AVAIL)) {
yading@10 622 h->mv[MV_FWD_D3] = un_mv;
yading@10 623 h->mv[MV_BWD_D3] = un_mv;
yading@10 624 }
yading@10 625 }
yading@10 626
yading@10 627 /**
yading@10 628 * save predictors for later macroblocks and increase
yading@10 629 * macroblock address
yading@10 630 * @return 0 if end of frame is reached, 1 otherwise
yading@10 631 */
yading@10 632 int ff_cavs_next_mb(AVSContext *h) {
yading@10 633 int i;
yading@10 634
yading@10 635 h->flags |= A_AVAIL;
yading@10 636 h->cy += 16;
yading@10 637 h->cu += 8;
yading@10 638 h->cv += 8;
yading@10 639 /* copy mvs as predictors to the left */
yading@10 640 for(i=0;i<=20;i+=4)
yading@10 641 h->mv[i] = h->mv[i+2];
yading@10 642 /* copy bottom mvs from cache to top line */
yading@10 643 h->top_mv[0][h->mbx*2+0] = h->mv[MV_FWD_X2];
yading@10 644 h->top_mv[0][h->mbx*2+1] = h->mv[MV_FWD_X3];
yading@10 645 h->top_mv[1][h->mbx*2+0] = h->mv[MV_BWD_X2];
yading@10 646 h->top_mv[1][h->mbx*2+1] = h->mv[MV_BWD_X3];
yading@10 647 /* next MB address */
yading@10 648 h->mbidx++;
yading@10 649 h->mbx++;
yading@10 650 if(h->mbx == h->mb_width) { //new mb line
yading@10 651 h->flags = B_AVAIL|C_AVAIL;
yading@10 652 /* clear left pred_modes */
yading@10 653 h->pred_mode_Y[3] = h->pred_mode_Y[6] = NOT_AVAIL;
yading@10 654 /* clear left mv predictors */
yading@10 655 for(i=0;i<=20;i+=4)
yading@10 656 h->mv[i] = un_mv;
yading@10 657 h->mbx = 0;
yading@10 658 h->mby++;
yading@10 659 /* re-calculate sample pointers */
yading@10 660 h->cy = h->cur.f->data[0] + h->mby * 16 * h->l_stride;
yading@10 661 h->cu = h->cur.f->data[1] + h->mby * 8 * h->c_stride;
yading@10 662 h->cv = h->cur.f->data[2] + h->mby * 8 * h->c_stride;
yading@10 663 if(h->mby == h->mb_height) { //frame end
yading@10 664 return 0;
yading@10 665 }
yading@10 666 }
yading@10 667 return 1;
yading@10 668 }
yading@10 669
yading@10 670 /*****************************************************************************
yading@10 671 *
yading@10 672 * frame level
yading@10 673 *
yading@10 674 ****************************************************************************/
yading@10 675
yading@10 676 int ff_cavs_init_pic(AVSContext *h) {
yading@10 677 int i;
yading@10 678
yading@10 679 /* clear some predictors */
yading@10 680 for(i=0;i<=20;i+=4)
yading@10 681 h->mv[i] = un_mv;
yading@10 682 h->mv[MV_BWD_X0] = ff_cavs_dir_mv;
yading@10 683 set_mvs(&h->mv[MV_BWD_X0], BLK_16X16);
yading@10 684 h->mv[MV_FWD_X0] = ff_cavs_dir_mv;
yading@10 685 set_mvs(&h->mv[MV_FWD_X0], BLK_16X16);
yading@10 686 h->pred_mode_Y[3] = h->pred_mode_Y[6] = NOT_AVAIL;
yading@10 687 h->cy = h->cur.f->data[0];
yading@10 688 h->cu = h->cur.f->data[1];
yading@10 689 h->cv = h->cur.f->data[2];
yading@10 690 h->l_stride = h->cur.f->linesize[0];
yading@10 691 h->c_stride = h->cur.f->linesize[1];
yading@10 692 h->luma_scan[2] = 8*h->l_stride;
yading@10 693 h->luma_scan[3] = 8*h->l_stride+8;
yading@10 694 h->mbx = h->mby = h->mbidx = 0;
yading@10 695 h->flags = 0;
yading@10 696
yading@10 697 return 0;
yading@10 698 }
yading@10 699
yading@10 700 /*****************************************************************************
yading@10 701 *
yading@10 702 * headers and interface
yading@10 703 *
yading@10 704 ****************************************************************************/
yading@10 705
yading@10 706 /**
yading@10 707 * some predictions require data from the top-neighbouring macroblock.
yading@10 708 * this data has to be stored for one complete row of macroblocks
yading@10 709 * and this storage space is allocated here
yading@10 710 */
yading@10 711 void ff_cavs_init_top_lines(AVSContext *h) {
yading@10 712 /* alloc top line of predictors */
yading@10 713 h->top_qp = av_mallocz( h->mb_width);
yading@10 714 h->top_mv[0] = av_mallocz((h->mb_width*2+1)*sizeof(cavs_vector));
yading@10 715 h->top_mv[1] = av_mallocz((h->mb_width*2+1)*sizeof(cavs_vector));
yading@10 716 h->top_pred_Y = av_mallocz( h->mb_width*2*sizeof(*h->top_pred_Y));
yading@10 717 h->top_border_y = av_mallocz((h->mb_width+1)*16);
yading@10 718 h->top_border_u = av_mallocz( h->mb_width * 10);
yading@10 719 h->top_border_v = av_mallocz( h->mb_width * 10);
yading@10 720
yading@10 721 /* alloc space for co-located MVs and types */
yading@10 722 h->col_mv = av_mallocz( h->mb_width*h->mb_height*4*sizeof(cavs_vector));
yading@10 723 h->col_type_base = av_mallocz(h->mb_width*h->mb_height);
yading@10 724 h->block = av_mallocz(64*sizeof(int16_t));
yading@10 725 }
yading@10 726
yading@10 727 av_cold int ff_cavs_init(AVCodecContext *avctx) {
yading@10 728 AVSContext *h = avctx->priv_data;
yading@10 729
yading@10 730 ff_dsputil_init(&h->dsp, avctx);
yading@10 731 ff_h264chroma_init(&h->h264chroma, 8);
yading@10 732 ff_videodsp_init(&h->vdsp, 8);
yading@10 733 ff_cavsdsp_init(&h->cdsp, avctx);
yading@10 734 ff_init_scantable_permutation(h->dsp.idct_permutation,
yading@10 735 h->cdsp.idct_perm);
yading@10 736 ff_init_scantable(h->dsp.idct_permutation, &h->scantable, ff_zigzag_direct);
yading@10 737
yading@10 738 h->avctx = avctx;
yading@10 739 avctx->pix_fmt= AV_PIX_FMT_YUV420P;
yading@10 740
yading@10 741 h->cur.f = av_frame_alloc();
yading@10 742 h->DPB[0].f = av_frame_alloc();
yading@10 743 h->DPB[1].f = av_frame_alloc();
yading@10 744 if (!h->cur.f || !h->DPB[0].f || !h->DPB[1].f) {
yading@10 745 ff_cavs_end(avctx);
yading@10 746 return AVERROR(ENOMEM);
yading@10 747 }
yading@10 748
yading@10 749 h->luma_scan[0] = 0;
yading@10 750 h->luma_scan[1] = 8;
yading@10 751 h->intra_pred_l[ INTRA_L_VERT] = intra_pred_vert;
yading@10 752 h->intra_pred_l[ INTRA_L_HORIZ] = intra_pred_horiz;
yading@10 753 h->intra_pred_l[ INTRA_L_LP] = intra_pred_lp;
yading@10 754 h->intra_pred_l[ INTRA_L_DOWN_LEFT] = intra_pred_down_left;
yading@10 755 h->intra_pred_l[INTRA_L_DOWN_RIGHT] = intra_pred_down_right;
yading@10 756 h->intra_pred_l[ INTRA_L_LP_LEFT] = intra_pred_lp_left;
yading@10 757 h->intra_pred_l[ INTRA_L_LP_TOP] = intra_pred_lp_top;
yading@10 758 h->intra_pred_l[ INTRA_L_DC_128] = intra_pred_dc_128;
yading@10 759 h->intra_pred_c[ INTRA_C_LP] = intra_pred_lp;
yading@10 760 h->intra_pred_c[ INTRA_C_HORIZ] = intra_pred_horiz;
yading@10 761 h->intra_pred_c[ INTRA_C_VERT] = intra_pred_vert;
yading@10 762 h->intra_pred_c[ INTRA_C_PLANE] = intra_pred_plane;
yading@10 763 h->intra_pred_c[ INTRA_C_LP_LEFT] = intra_pred_lp_left;
yading@10 764 h->intra_pred_c[ INTRA_C_LP_TOP] = intra_pred_lp_top;
yading@10 765 h->intra_pred_c[ INTRA_C_DC_128] = intra_pred_dc_128;
yading@10 766 h->mv[ 7] = un_mv;
yading@10 767 h->mv[19] = un_mv;
yading@10 768 return 0;
yading@10 769 }
yading@10 770
yading@10 771 av_cold int ff_cavs_end(AVCodecContext *avctx) {
yading@10 772 AVSContext *h = avctx->priv_data;
yading@10 773
yading@10 774 av_frame_free(&h->cur.f);
yading@10 775 av_frame_free(&h->DPB[0].f);
yading@10 776 av_frame_free(&h->DPB[1].f);
yading@10 777
yading@10 778 av_free(h->top_qp);
yading@10 779 av_free(h->top_mv[0]);
yading@10 780 av_free(h->top_mv[1]);
yading@10 781 av_free(h->top_pred_Y);
yading@10 782 av_free(h->top_border_y);
yading@10 783 av_free(h->top_border_u);
yading@10 784 av_free(h->top_border_v);
yading@10 785 av_free(h->col_mv);
yading@10 786 av_free(h->col_type_base);
yading@10 787 av_free(h->block);
yading@10 788 av_freep(&h->edge_emu_buffer);
yading@10 789 return 0;
yading@10 790 }