yading@10
|
1 /*
|
yading@10
|
2 * Copyright (c) 2011 Mans Rullgard <mans@mansr.com>
|
yading@10
|
3 *
|
yading@10
|
4 * This file is part of Libav.
|
yading@10
|
5 *
|
yading@10
|
6 * Libav is free software; you can redistribute it and/or
|
yading@10
|
7 * modify it under the terms of the GNU Lesser General Public
|
yading@10
|
8 * License as published by the Free Software Foundation; either
|
yading@10
|
9 * version 2.1 of the License, or (at your option) any later version.
|
yading@10
|
10 *
|
yading@10
|
11 * Libav is distributed in the hope that it will be useful,
|
yading@10
|
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
|
yading@10
|
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
yading@10
|
14 * Lesser General Public License for more details.
|
yading@10
|
15 *
|
yading@10
|
16 * You should have received a copy of the GNU Lesser General Public
|
yading@10
|
17 * License along with Libav; if not, write to the Free Software
|
yading@10
|
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
yading@10
|
19 */
|
yading@10
|
20
|
yading@10
|
21 #ifndef AVCODEC_ARM_DCA_H
|
yading@10
|
22 #define AVCODEC_ARM_DCA_H
|
yading@10
|
23
|
yading@10
|
24 #include <stdint.h>
|
yading@10
|
25
|
yading@10
|
26 #include "config.h"
|
yading@10
|
27 #include "libavcodec/mathops.h"
|
yading@10
|
28
|
yading@10
|
29 #if HAVE_ARMV6_INLINE && AV_GCC_VERSION_AT_LEAST(4,4) && !CONFIG_THUMB
|
yading@10
|
30
|
yading@10
|
31 #define decode_blockcodes decode_blockcodes
|
yading@10
|
32 static inline int decode_blockcodes(int code1, int code2, int levels,
|
yading@10
|
33 int *values)
|
yading@10
|
34 {
|
yading@10
|
35 int v0, v1, v2, v3, v4, v5;
|
yading@10
|
36
|
yading@10
|
37 __asm__ ("smmul %0, %6, %10 \n"
|
yading@10
|
38 "smmul %3, %7, %10 \n"
|
yading@10
|
39 "smlabb %6, %0, %9, %6 \n"
|
yading@10
|
40 "smlabb %7, %3, %9, %7 \n"
|
yading@10
|
41 "smmul %1, %0, %10 \n"
|
yading@10
|
42 "smmul %4, %3, %10 \n"
|
yading@10
|
43 "sub %6, %6, %8, lsr #1 \n"
|
yading@10
|
44 "sub %7, %7, %8, lsr #1 \n"
|
yading@10
|
45 "smlabb %0, %1, %9, %0 \n"
|
yading@10
|
46 "smlabb %3, %4, %9, %3 \n"
|
yading@10
|
47 "smmul %2, %1, %10 \n"
|
yading@10
|
48 "smmul %5, %4, %10 \n"
|
yading@10
|
49 "str %6, [%11, #0] \n"
|
yading@10
|
50 "str %7, [%11, #16] \n"
|
yading@10
|
51 "sub %0, %0, %8, lsr #1 \n"
|
yading@10
|
52 "sub %3, %3, %8, lsr #1 \n"
|
yading@10
|
53 "smlabb %1, %2, %9, %1 \n"
|
yading@10
|
54 "smlabb %4, %5, %9, %4 \n"
|
yading@10
|
55 "smmul %6, %2, %10 \n"
|
yading@10
|
56 "smmul %7, %5, %10 \n"
|
yading@10
|
57 "str %0, [%11, #4] \n"
|
yading@10
|
58 "str %3, [%11, #20] \n"
|
yading@10
|
59 "sub %1, %1, %8, lsr #1 \n"
|
yading@10
|
60 "sub %4, %4, %8, lsr #1 \n"
|
yading@10
|
61 "smlabb %2, %6, %9, %2 \n"
|
yading@10
|
62 "smlabb %5, %7, %9, %5 \n"
|
yading@10
|
63 "str %1, [%11, #8] \n"
|
yading@10
|
64 "str %4, [%11, #24] \n"
|
yading@10
|
65 "sub %2, %2, %8, lsr #1 \n"
|
yading@10
|
66 "sub %5, %5, %8, lsr #1 \n"
|
yading@10
|
67 "str %2, [%11, #12] \n"
|
yading@10
|
68 "str %5, [%11, #28] \n"
|
yading@10
|
69 : "=&r"(v0), "=&r"(v1), "=&r"(v2),
|
yading@10
|
70 "=&r"(v3), "=&r"(v4), "=&r"(v5),
|
yading@10
|
71 "+&r"(code1), "+&r"(code2)
|
yading@10
|
72 : "r"(levels - 1), "r"(-levels),
|
yading@10
|
73 "r"(ff_inverse[levels]), "r"(values)
|
yading@10
|
74 : "memory");
|
yading@10
|
75
|
yading@10
|
76 return code1 | code2;
|
yading@10
|
77 }
|
yading@10
|
78
|
yading@10
|
79 #endif
|
yading@10
|
80
|
yading@10
|
81 #if HAVE_NEON_INLINE && HAVE_ASM_MOD_Y
|
yading@10
|
82
|
yading@10
|
83 #define int8x8_fmul_int32 int8x8_fmul_int32
|
yading@10
|
84 static inline void int8x8_fmul_int32(float *dst, const int8_t *src, int scale)
|
yading@10
|
85 {
|
yading@10
|
86 __asm__ ("vcvt.f32.s32 %2, %2, #4 \n"
|
yading@10
|
87 "vld1.8 {d0}, [%1,:64] \n"
|
yading@10
|
88 "vmovl.s8 q0, d0 \n"
|
yading@10
|
89 "vmovl.s16 q1, d1 \n"
|
yading@10
|
90 "vmovl.s16 q0, d0 \n"
|
yading@10
|
91 "vcvt.f32.s32 q0, q0 \n"
|
yading@10
|
92 "vcvt.f32.s32 q1, q1 \n"
|
yading@10
|
93 "vmul.f32 q0, q0, %y2 \n"
|
yading@10
|
94 "vmul.f32 q1, q1, %y2 \n"
|
yading@10
|
95 "vst1.32 {q0-q1}, [%m0,:128] \n"
|
yading@10
|
96 : "=Um"(*(float (*)[8])dst)
|
yading@10
|
97 : "r"(src), "x"(scale)
|
yading@10
|
98 : "d0", "d1", "d2", "d3");
|
yading@10
|
99 }
|
yading@10
|
100
|
yading@10
|
101 #endif
|
yading@10
|
102
|
yading@10
|
103 #endif /* AVCODEC_ARM_DCA_H */
|