;******************************************************************************
;* MMX optimized deinterlacing functions
;* Copyright (c) 2010 Vitor Sessak
;* Copyright (c) 2002 Michael Niedermayer
;*
;* This file is part of FFmpeg.
;*
;* FFmpeg is free software; you can redistribute it and/or
;* modify it under the terms of the GNU Lesser General Public
;* License as published by the Free Software Foundation; either
;* version 2.1 of the License, or (at your option) any later version.
;*
;* FFmpeg is distributed in the hope that it will be useful,
;* but WITHOUT ANY WARRANTY; without even the implied warranty of
;* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
;* Lesser General Public License for more details.
;*
;* You should have received a copy of the GNU Lesser General Public
;* License along with FFmpeg; if not, write to the Free Software
;* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
;******************************************************************************

; Project helper macros; cglobal, cextern, REP_RET and SECTION_RODATA used
; below are not defined in this file and are expected to come from here.
%include "libavutil/x86/x86util.asm"

SECTION_RODATA

; Constant defined outside this file; loaded once per call by DEINTERLACE.
cextern pw_4

SECTION .text

;------------------------------------------------------------------------------
; DEINTERLACE variant
;
; Emits one MMX line-deinterlacing function. %1 selects the variant:
;   inplace        -> deinterlace_line_inplace_mmx (5 line pointers + size)
;   anything else  -> deinterlace_line_mmx         (dst + 5 line pointers + size)
;
; Per group of 4 pixels, with every byte zero-extended to a 16-bit word:
;   t   = 4*(lum_m3 + lum_m1) + 2*lum_m2 + pw_4
;   t   = t - (lum_m4 + lum)        ; unsigned saturating, floors at 0
;   out = t >> 3, packed back to bytes with unsigned saturation
; pw_4 is defined outside this file; presumably four words of 4 acting as the
; rounding term for the >> 3 -- TODO confirm against its definition.
;
; Where the 4 result bytes go:
;   normal  : [dst]
;   inplace : [lum_m2]; before that, the original 4 bytes of lum_m2 are copied
;             to [lum_m4].
; NOTE: the prototype comment for the in-place variant declares every pointer
; const, yet that variant stores through lum_m4 and lum_m2.
;
; Loop contract (as written):
;   * Pixels are handled 4 at a time and the loop repeats while the remaining
;     count is > 0 (signed), so a size that is not a multiple of 4 makes the
;     last iteration touch up to 3 bytes past size on every line.
;   * The body runs before the count is tested, so size <= 0 still processes
;     one group of 4 pixels.
;   * No emms is issued in this block.
;     NOTE(review): callers presumably must clear MMX state themselves -- confirm.
;
; Register roles inside the loop:
;   mm0..mm4 = lum_m4, lum_m3, lum_m2, lum_m1, lum (4 pixels each)
;   mm6      = pw_4 (loaded once)     mm7 = 0 (unpack / pack helper)
;------------------------------------------------------------------------------
%macro DEINTERLACE 1
%ifidn %1, inplace
;void ff_deinterlace_line_inplace_mmx(const uint8_t *lum_m4, const uint8_t *lum_m3, const uint8_t *lum_m2, const uint8_t *lum_m1, const uint8_t *lum, int size)
cglobal deinterlace_line_inplace_mmx, 6,6,7,      lum_m4, lum_m3, lum_m2, lum_m1, lum, size
%else
;void ff_deinterlace_line_mmx(uint8_t *dst, const uint8_t *lum_m4, const uint8_t *lum_m3, const uint8_t *lum_m2, const uint8_t *lum_m1, const uint8_t *lum, int size)
cglobal deinterlace_line_mmx,         7,7,7, dst, lum_m4, lum_m3, lum_m2, lum_m1, lum, size
%endif
    pxor      mm7, mm7              ; mm7 = 0 for the whole call
    movq      mm6, [pw_4]           ; loop-invariant additive constant
.nextrow:
    movd      mm0, [lum_m4q]        ; load 4 pixels from each input line
    movd      mm1, [lum_m3q]
    movd      mm2, [lum_m2q]
%ifidn %1, inplace
    movd      [lum_m4q], mm2        ; keep the unfiltered lum_m2 pixels in lum_m4
%endif
    movd      mm3, [lum_m1q]
    movd      mm4, [lumq]
    punpcklbw mm0, mm7              ; widen bytes to words (high byte = 0)
    punpcklbw mm1, mm7
    punpcklbw mm2, mm7
    punpcklbw mm3, mm7
    punpcklbw mm4, mm7
    paddw     mm1, mm3              ; mm1 = lum_m3 + lum_m1
    psllw     mm2, 1                ; mm2 = 2*lum_m2
    paddw     mm0, mm4              ; mm0 = lum_m4 + lum
    psllw     mm1, 2                ; mm1 = 4*(lum_m3 + lum_m1)
    paddw     mm2, mm6              ; mm2 = 2*lum_m2 + pw_4
    paddw     mm1, mm2              ; mm1 = sum of the positively weighted taps
    psubusw   mm1, mm0              ; subtract outer taps; saturation floors at 0
    psrlw     mm1, 3                ; scale back down by 8
    packuswb  mm1, mm7              ; words -> bytes, clamped to 255
%ifidn %1, inplace
    movd      [lum_m2q], mm1        ; result overwrites the centre line
%else
    movd      [dstq], mm1
    add       dstq, 4
%endif
    add       lum_m4q, 4            ; advance every line by the 4 pixels done
    add       lum_m3q, 4
    add       lum_m2q, 4
    add       lum_m1q, 4
    add       lumq, 4
    sub       sized, 4
    jg        .nextrow              ; signed test: loop while pixels remain
    REP_RET
%endmacro

; Any argument other than `inplace` takes the %else branch of the macro, so
; the empty string emits the variant that writes to a separate dst buffer.
DEINTERLACE ""

; Emits the variant that writes its result into lum_m2 (and copies the old
; lum_m2 pixels into lum_m4).
DEINTERLACE inplace