yading@10: ;***************************************************************************** yading@10: ;* MMX/SSE2/AVX-optimized 10-bit H.264 weighted prediction code yading@10: ;***************************************************************************** yading@10: ;* Copyright (C) 2005-2011 x264 project yading@10: ;* yading@10: ;* Authors: Daniel Kang yading@10: ;* yading@10: ;* This file is part of Libav. yading@10: ;* yading@10: ;* Libav is free software; you can redistribute it and/or yading@10: ;* modify it under the terms of the GNU Lesser General Public yading@10: ;* License as published by the Free Software Foundation; either yading@10: ;* version 2.1 of the License, or (at your option) any later version. yading@10: ;* yading@10: ;* Libav is distributed in the hope that it will be useful, yading@10: ;* but WITHOUT ANY WARRANTY; without even the implied warranty of yading@10: ;* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU yading@10: ;* Lesser General Public License for more details. yading@10: ;* yading@10: ;* You should have received a copy of the GNU Lesser General Public yading@10: ;* License along with Libav; if not, write to the Free Software yading@10: ;* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA yading@10: ;****************************************************************************** yading@10: yading@10: %include "libavutil/x86/x86util.asm" yading@10: yading@10: SECTION_RODATA 32 yading@10: yading@10: pw_pixel_max: times 8 dw ((1 << 10)-1) yading@10: sq_1: dq 1 yading@10: dq 0 yading@10: yading@10: cextern pw_1 yading@10: yading@10: SECTION .text yading@10: yading@10: ;----------------------------------------------------------------------------- yading@10: ; void h264_weight(uint8_t *dst, int stride, int height, int log2_denom, yading@10: ; int weight, int offset); yading@10: ;----------------------------------------------------------------------------- yading@10: %macro WEIGHT_PROLOGUE 0 yading@10: .prologue: yading@10: PROLOGUE 0,6,8 yading@10: movifnidn r0, r0mp yading@10: movifnidn r1d, r1m yading@10: movifnidn r2d, r2m yading@10: movifnidn r4d, r4m yading@10: movifnidn r5d, r5m yading@10: %endmacro yading@10: yading@10: %macro WEIGHT_SETUP 0 yading@10: mova m0, [pw_1] yading@10: movd m2, r3m yading@10: pslld m0, m2 ; 1<