Chris@69
|
1 /***********************************************************************
|
Chris@69
|
2 Copyright (c) 2006-2011, Skype Limited. All rights reserved.
|
Chris@69
|
3 Copyright (c) 2013 Parrot
|
Chris@69
|
4 Redistribution and use in source and binary forms, with or without
|
Chris@69
|
5 modification, are permitted provided that the following conditions
|
Chris@69
|
6 are met:
|
Chris@69
|
7 - Redistributions of source code must retain the above copyright notice,
|
Chris@69
|
8 this list of conditions and the following disclaimer.
|
Chris@69
|
9 - Redistributions in binary form must reproduce the above copyright
|
Chris@69
|
10 notice, this list of conditions and the following disclaimer in the
|
Chris@69
|
11 documentation and/or other materials provided with the distribution.
|
Chris@69
|
12 - Neither the name of Internet Society, IETF or IETF Trust, nor the
|
Chris@69
|
13 names of specific contributors, may be used to endorse or promote
|
Chris@69
|
14 products derived from this software without specific prior written
|
Chris@69
|
15 permission.
|
Chris@69
|
16 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
Chris@69
|
17 AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
Chris@69
|
18 IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
Chris@69
|
19 ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
Chris@69
|
20 LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
Chris@69
|
21 CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
Chris@69
|
22 SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
Chris@69
|
23 INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
Chris@69
|
24 CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
Chris@69
|
25 ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
Chris@69
|
26 POSSIBILITY OF SUCH DAMAGE.
|
Chris@69
|
27 ***********************************************************************/
|
Chris@69
|
28
|
Chris@69
|
29 #ifndef SILK_MACROS_ARMv5E_H
|
Chris@69
|
30 #define SILK_MACROS_ARMv5E_H
|
Chris@69
|
31
|
Chris@69
|
/* Left shift performed on the unsigned representation so that shifting a
   negative value does not invoke undefined behaviour. Intended only for
   macros that cannot include SigProc_FIX.h; everywhere else use
   silk_LSHIFT32() instead. */
#define SAFE_SHL(value, shift) ((opus_int32)((opus_uint32)(value) << (shift)))
|
Chris@69
|
36
|
Chris@69
|
37 /* (a32 * (opus_int32)((opus_int16)(b32))) >> 16 output have to be 32bit int */
|
Chris@69
|
38 #undef silk_SMULWB
|
Chris@69
|
39 static OPUS_INLINE opus_int32 silk_SMULWB_armv5e(opus_int32 a, opus_int16 b)
|
Chris@69
|
40 {
|
Chris@69
|
41 int res;
|
Chris@69
|
42 __asm__(
|
Chris@69
|
43 "#silk_SMULWB\n\t"
|
Chris@69
|
44 "smulwb %0, %1, %2\n\t"
|
Chris@69
|
45 : "=r"(res)
|
Chris@69
|
46 : "r"(a), "r"(b)
|
Chris@69
|
47 );
|
Chris@69
|
48 return res;
|
Chris@69
|
49 }
|
Chris@69
|
50 #define silk_SMULWB(a, b) (silk_SMULWB_armv5e(a, b))
|
Chris@69
|
51
|
Chris@69
|
52 /* a32 + (b32 * (opus_int32)((opus_int16)(c32))) >> 16 output have to be 32bit int */
|
Chris@69
|
53 #undef silk_SMLAWB
|
Chris@69
|
54 static OPUS_INLINE opus_int32 silk_SMLAWB_armv5e(opus_int32 a, opus_int32 b,
|
Chris@69
|
55 opus_int16 c)
|
Chris@69
|
56 {
|
Chris@69
|
57 int res;
|
Chris@69
|
58 __asm__(
|
Chris@69
|
59 "#silk_SMLAWB\n\t"
|
Chris@69
|
60 "smlawb %0, %1, %2, %3\n\t"
|
Chris@69
|
61 : "=r"(res)
|
Chris@69
|
62 : "r"(b), "r"(c), "r"(a)
|
Chris@69
|
63 );
|
Chris@69
|
64 return res;
|
Chris@69
|
65 }
|
Chris@69
|
66 #define silk_SMLAWB(a, b, c) (silk_SMLAWB_armv5e(a, b, c))
|
Chris@69
|
67
|
Chris@69
|
68 /* (a32 * (b32 >> 16)) >> 16 */
|
Chris@69
|
69 #undef silk_SMULWT
|
Chris@69
|
70 static OPUS_INLINE opus_int32 silk_SMULWT_armv5e(opus_int32 a, opus_int32 b)
|
Chris@69
|
71 {
|
Chris@69
|
72 int res;
|
Chris@69
|
73 __asm__(
|
Chris@69
|
74 "#silk_SMULWT\n\t"
|
Chris@69
|
75 "smulwt %0, %1, %2\n\t"
|
Chris@69
|
76 : "=r"(res)
|
Chris@69
|
77 : "r"(a), "r"(b)
|
Chris@69
|
78 );
|
Chris@69
|
79 return res;
|
Chris@69
|
80 }
|
Chris@69
|
81 #define silk_SMULWT(a, b) (silk_SMULWT_armv5e(a, b))
|
Chris@69
|
82
|
Chris@69
|
83 /* a32 + (b32 * (c32 >> 16)) >> 16 */
|
Chris@69
|
84 #undef silk_SMLAWT
|
Chris@69
|
85 static OPUS_INLINE opus_int32 silk_SMLAWT_armv5e(opus_int32 a, opus_int32 b,
|
Chris@69
|
86 opus_int32 c)
|
Chris@69
|
87 {
|
Chris@69
|
88 int res;
|
Chris@69
|
89 __asm__(
|
Chris@69
|
90 "#silk_SMLAWT\n\t"
|
Chris@69
|
91 "smlawt %0, %1, %2, %3\n\t"
|
Chris@69
|
92 : "=r"(res)
|
Chris@69
|
93 : "r"(b), "r"(c), "r"(a)
|
Chris@69
|
94 );
|
Chris@69
|
95 return res;
|
Chris@69
|
96 }
|
Chris@69
|
97 #define silk_SMLAWT(a, b, c) (silk_SMLAWT_armv5e(a, b, c))
|
Chris@69
|
98
|
Chris@69
|
99 /* (opus_int32)((opus_int16)(a3))) * (opus_int32)((opus_int16)(b32)) output have to be 32bit int */
|
Chris@69
|
100 #undef silk_SMULBB
|
Chris@69
|
101 static OPUS_INLINE opus_int32 silk_SMULBB_armv5e(opus_int32 a, opus_int32 b)
|
Chris@69
|
102 {
|
Chris@69
|
103 int res;
|
Chris@69
|
104 __asm__(
|
Chris@69
|
105 "#silk_SMULBB\n\t"
|
Chris@69
|
106 "smulbb %0, %1, %2\n\t"
|
Chris@69
|
107 : "=r"(res)
|
Chris@69
|
108 : "%r"(a), "r"(b)
|
Chris@69
|
109 );
|
Chris@69
|
110 return res;
|
Chris@69
|
111 }
|
Chris@69
|
112 #define silk_SMULBB(a, b) (silk_SMULBB_armv5e(a, b))
|
Chris@69
|
113
|
Chris@69
|
114 /* a32 + (opus_int32)((opus_int16)(b32)) * (opus_int32)((opus_int16)(c32)) output have to be 32bit int */
|
Chris@69
|
115 #undef silk_SMLABB
|
Chris@69
|
116 static OPUS_INLINE opus_int32 silk_SMLABB_armv5e(opus_int32 a, opus_int32 b,
|
Chris@69
|
117 opus_int32 c)
|
Chris@69
|
118 {
|
Chris@69
|
119 int res;
|
Chris@69
|
120 __asm__(
|
Chris@69
|
121 "#silk_SMLABB\n\t"
|
Chris@69
|
122 "smlabb %0, %1, %2, %3\n\t"
|
Chris@69
|
123 : "=r"(res)
|
Chris@69
|
124 : "%r"(b), "r"(c), "r"(a)
|
Chris@69
|
125 );
|
Chris@69
|
126 return res;
|
Chris@69
|
127 }
|
Chris@69
|
128 #define silk_SMLABB(a, b, c) (silk_SMLABB_armv5e(a, b, c))
|
Chris@69
|
129
|
Chris@69
|
130 /* (opus_int32)((opus_int16)(a32)) * (b32 >> 16) */
|
Chris@69
|
131 #undef silk_SMULBT
|
Chris@69
|
132 static OPUS_INLINE opus_int32 silk_SMULBT_armv5e(opus_int32 a, opus_int32 b)
|
Chris@69
|
133 {
|
Chris@69
|
134 int res;
|
Chris@69
|
135 __asm__(
|
Chris@69
|
136 "#silk_SMULBT\n\t"
|
Chris@69
|
137 "smulbt %0, %1, %2\n\t"
|
Chris@69
|
138 : "=r"(res)
|
Chris@69
|
139 : "r"(a), "r"(b)
|
Chris@69
|
140 );
|
Chris@69
|
141 return res;
|
Chris@69
|
142 }
|
Chris@69
|
143 #define silk_SMULBT(a, b) (silk_SMULBT_armv5e(a, b))
|
Chris@69
|
144
|
Chris@69
|
145 /* a32 + (opus_int32)((opus_int16)(b32)) * (c32 >> 16) */
|
Chris@69
|
146 #undef silk_SMLABT
|
Chris@69
|
147 static OPUS_INLINE opus_int32 silk_SMLABT_armv5e(opus_int32 a, opus_int32 b,
|
Chris@69
|
148 opus_int32 c)
|
Chris@69
|
149 {
|
Chris@69
|
150 int res;
|
Chris@69
|
151 __asm__(
|
Chris@69
|
152 "#silk_SMLABT\n\t"
|
Chris@69
|
153 "smlabt %0, %1, %2, %3\n\t"
|
Chris@69
|
154 : "=r"(res)
|
Chris@69
|
155 : "r"(b), "r"(c), "r"(a)
|
Chris@69
|
156 );
|
Chris@69
|
157 return res;
|
Chris@69
|
158 }
|
Chris@69
|
159 #define silk_SMLABT(a, b, c) (silk_SMLABT_armv5e(a, b, c))
|
Chris@69
|
160
|
Chris@69
|
161 /* add/subtract with output saturated */
|
Chris@69
|
162 #undef silk_ADD_SAT32
|
Chris@69
|
163 static OPUS_INLINE opus_int32 silk_ADD_SAT32_armv5e(opus_int32 a, opus_int32 b)
|
Chris@69
|
164 {
|
Chris@69
|
165 int res;
|
Chris@69
|
166 __asm__(
|
Chris@69
|
167 "#silk_ADD_SAT32\n\t"
|
Chris@69
|
168 "qadd %0, %1, %2\n\t"
|
Chris@69
|
169 : "=r"(res)
|
Chris@69
|
170 : "%r"(a), "r"(b)
|
Chris@69
|
171 );
|
Chris@69
|
172 return res;
|
Chris@69
|
173 }
|
Chris@69
|
174 #define silk_ADD_SAT32(a, b) (silk_ADD_SAT32_armv5e(a, b))
|
Chris@69
|
175
|
Chris@69
|
176 #undef silk_SUB_SAT32
|
Chris@69
|
177 static OPUS_INLINE opus_int32 silk_SUB_SAT32_armv5e(opus_int32 a, opus_int32 b)
|
Chris@69
|
178 {
|
Chris@69
|
179 int res;
|
Chris@69
|
180 __asm__(
|
Chris@69
|
181 "#silk_SUB_SAT32\n\t"
|
Chris@69
|
182 "qsub %0, %1, %2\n\t"
|
Chris@69
|
183 : "=r"(res)
|
Chris@69
|
184 : "r"(a), "r"(b)
|
Chris@69
|
185 );
|
Chris@69
|
186 return res;
|
Chris@69
|
187 }
|
Chris@69
|
188 #define silk_SUB_SAT32(a, b) (silk_SUB_SAT32_armv5e(a, b))
|
Chris@69
|
189
|
Chris@69
|
190 #undef silk_CLZ16
|
Chris@69
|
191 static OPUS_INLINE opus_int32 silk_CLZ16_armv5(opus_int16 in16)
|
Chris@69
|
192 {
|
Chris@69
|
193 int res;
|
Chris@69
|
194 __asm__(
|
Chris@69
|
195 "#silk_CLZ16\n\t"
|
Chris@69
|
196 "clz %0, %1;\n"
|
Chris@69
|
197 : "=r"(res)
|
Chris@69
|
198 : "r"(SAFE_SHL(in16,16)|0x8000)
|
Chris@69
|
199 );
|
Chris@69
|
200 return res;
|
Chris@69
|
201 }
|
Chris@69
|
202 #define silk_CLZ16(in16) (silk_CLZ16_armv5(in16))
|
Chris@69
|
203
|
Chris@69
|
204 #undef silk_CLZ32
|
Chris@69
|
205 static OPUS_INLINE opus_int32 silk_CLZ32_armv5(opus_int32 in32)
|
Chris@69
|
206 {
|
Chris@69
|
207 int res;
|
Chris@69
|
208 __asm__(
|
Chris@69
|
209 "#silk_CLZ32\n\t"
|
Chris@69
|
210 "clz %0, %1\n\t"
|
Chris@69
|
211 : "=r"(res)
|
Chris@69
|
212 : "r"(in32)
|
Chris@69
|
213 );
|
Chris@69
|
214 return res;
|
Chris@69
|
215 }
|
Chris@69
|
216 #define silk_CLZ32(in32) (silk_CLZ32_armv5(in32))
|
Chris@69
|
217
|
Chris@69
|
218 #undef SAFE_SHL
|
Chris@69
|
219
|
Chris@69
|
220 #endif /* SILK_MACROS_ARMv5E_H */
|