annotate src/opus-1.3/silk/arm/macros_armv5e.h @ 81:7029a4916348

Merge build update
author Chris Cannam
date Thu, 31 Oct 2019 13:36:58 +0000
parents 7aeed7906520
children
rev   line source
Chris@69 1 /***********************************************************************
Chris@69 2 Copyright (c) 2006-2011, Skype Limited. All rights reserved.
Chris@69 3 Copyright (c) 2013 Parrot
Chris@69 4 Redistribution and use in source and binary forms, with or without
Chris@69 5 modification, are permitted provided that the following conditions
Chris@69 6 are met:
Chris@69 7 - Redistributions of source code must retain the above copyright notice,
Chris@69 8 this list of conditions and the following disclaimer.
Chris@69 9 - Redistributions in binary form must reproduce the above copyright
Chris@69 10 notice, this list of conditions and the following disclaimer in the
Chris@69 11 documentation and/or other materials provided with the distribution.
Chris@69 12 - Neither the name of Internet Society, IETF or IETF Trust, nor the
Chris@69 13 names of specific contributors, may be used to endorse or promote
Chris@69 14 products derived from this software without specific prior written
Chris@69 15 permission.
Chris@69 16 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
Chris@69 17 AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
Chris@69 18 IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
Chris@69 19 ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
Chris@69 20 LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
Chris@69 21 CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
Chris@69 22 SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
Chris@69 23 INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
Chris@69 24 CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
Chris@69 25 ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
Chris@69 26 POSSIBILITY OF SUCH DAMAGE.
Chris@69 27 ***********************************************************************/
Chris@69 28
Chris@69 29 #ifndef SILK_MACROS_ARMv5E_H
Chris@69 30 #define SILK_MACROS_ARMv5E_H
Chris@69 31
/* SAFE_SHL(a, b): shift a left by b bits by way of opus_uint32, so that a
   negative a does not run into the undefined behaviour of a signed left
   shift. That is the only thing this macro protects against. Use it only
   in macros that cannot include SigProc_FIX.h; everywhere else, use
   silk_LSHIFT32(). */
#define SAFE_SHL(a,b) ((opus_int32)((opus_uint32)(a) << (b)))
Chris@69 36
Chris@69 37 /* (a32 * (opus_int32)((opus_int16)(b32))) >> 16 output have to be 32bit int */
Chris@69 38 #undef silk_SMULWB
Chris@69 39 static OPUS_INLINE opus_int32 silk_SMULWB_armv5e(opus_int32 a, opus_int16 b)
Chris@69 40 {
Chris@69 41 int res;
Chris@69 42 __asm__(
Chris@69 43 "#silk_SMULWB\n\t"
Chris@69 44 "smulwb %0, %1, %2\n\t"
Chris@69 45 : "=r"(res)
Chris@69 46 : "r"(a), "r"(b)
Chris@69 47 );
Chris@69 48 return res;
Chris@69 49 }
Chris@69 50 #define silk_SMULWB(a, b) (silk_SMULWB_armv5e(a, b))
Chris@69 51
Chris@69 52 /* a32 + (b32 * (opus_int32)((opus_int16)(c32))) >> 16 output have to be 32bit int */
Chris@69 53 #undef silk_SMLAWB
Chris@69 54 static OPUS_INLINE opus_int32 silk_SMLAWB_armv5e(opus_int32 a, opus_int32 b,
Chris@69 55 opus_int16 c)
Chris@69 56 {
Chris@69 57 int res;
Chris@69 58 __asm__(
Chris@69 59 "#silk_SMLAWB\n\t"
Chris@69 60 "smlawb %0, %1, %2, %3\n\t"
Chris@69 61 : "=r"(res)
Chris@69 62 : "r"(b), "r"(c), "r"(a)
Chris@69 63 );
Chris@69 64 return res;
Chris@69 65 }
Chris@69 66 #define silk_SMLAWB(a, b, c) (silk_SMLAWB_armv5e(a, b, c))
Chris@69 67
Chris@69 68 /* (a32 * (b32 >> 16)) >> 16 */
Chris@69 69 #undef silk_SMULWT
Chris@69 70 static OPUS_INLINE opus_int32 silk_SMULWT_armv5e(opus_int32 a, opus_int32 b)
Chris@69 71 {
Chris@69 72 int res;
Chris@69 73 __asm__(
Chris@69 74 "#silk_SMULWT\n\t"
Chris@69 75 "smulwt %0, %1, %2\n\t"
Chris@69 76 : "=r"(res)
Chris@69 77 : "r"(a), "r"(b)
Chris@69 78 );
Chris@69 79 return res;
Chris@69 80 }
Chris@69 81 #define silk_SMULWT(a, b) (silk_SMULWT_armv5e(a, b))
Chris@69 82
Chris@69 83 /* a32 + (b32 * (c32 >> 16)) >> 16 */
Chris@69 84 #undef silk_SMLAWT
Chris@69 85 static OPUS_INLINE opus_int32 silk_SMLAWT_armv5e(opus_int32 a, opus_int32 b,
Chris@69 86 opus_int32 c)
Chris@69 87 {
Chris@69 88 int res;
Chris@69 89 __asm__(
Chris@69 90 "#silk_SMLAWT\n\t"
Chris@69 91 "smlawt %0, %1, %2, %3\n\t"
Chris@69 92 : "=r"(res)
Chris@69 93 : "r"(b), "r"(c), "r"(a)
Chris@69 94 );
Chris@69 95 return res;
Chris@69 96 }
Chris@69 97 #define silk_SMLAWT(a, b, c) (silk_SMLAWT_armv5e(a, b, c))
Chris@69 98
Chris@69 99 /* (opus_int32)((opus_int16)(a3))) * (opus_int32)((opus_int16)(b32)) output have to be 32bit int */
Chris@69 100 #undef silk_SMULBB
Chris@69 101 static OPUS_INLINE opus_int32 silk_SMULBB_armv5e(opus_int32 a, opus_int32 b)
Chris@69 102 {
Chris@69 103 int res;
Chris@69 104 __asm__(
Chris@69 105 "#silk_SMULBB\n\t"
Chris@69 106 "smulbb %0, %1, %2\n\t"
Chris@69 107 : "=r"(res)
Chris@69 108 : "%r"(a), "r"(b)
Chris@69 109 );
Chris@69 110 return res;
Chris@69 111 }
Chris@69 112 #define silk_SMULBB(a, b) (silk_SMULBB_armv5e(a, b))
Chris@69 113
Chris@69 114 /* a32 + (opus_int32)((opus_int16)(b32)) * (opus_int32)((opus_int16)(c32)) output have to be 32bit int */
Chris@69 115 #undef silk_SMLABB
Chris@69 116 static OPUS_INLINE opus_int32 silk_SMLABB_armv5e(opus_int32 a, opus_int32 b,
Chris@69 117 opus_int32 c)
Chris@69 118 {
Chris@69 119 int res;
Chris@69 120 __asm__(
Chris@69 121 "#silk_SMLABB\n\t"
Chris@69 122 "smlabb %0, %1, %2, %3\n\t"
Chris@69 123 : "=r"(res)
Chris@69 124 : "%r"(b), "r"(c), "r"(a)
Chris@69 125 );
Chris@69 126 return res;
Chris@69 127 }
Chris@69 128 #define silk_SMLABB(a, b, c) (silk_SMLABB_armv5e(a, b, c))
Chris@69 129
Chris@69 130 /* (opus_int32)((opus_int16)(a32)) * (b32 >> 16) */
Chris@69 131 #undef silk_SMULBT
Chris@69 132 static OPUS_INLINE opus_int32 silk_SMULBT_armv5e(opus_int32 a, opus_int32 b)
Chris@69 133 {
Chris@69 134 int res;
Chris@69 135 __asm__(
Chris@69 136 "#silk_SMULBT\n\t"
Chris@69 137 "smulbt %0, %1, %2\n\t"
Chris@69 138 : "=r"(res)
Chris@69 139 : "r"(a), "r"(b)
Chris@69 140 );
Chris@69 141 return res;
Chris@69 142 }
Chris@69 143 #define silk_SMULBT(a, b) (silk_SMULBT_armv5e(a, b))
Chris@69 144
Chris@69 145 /* a32 + (opus_int32)((opus_int16)(b32)) * (c32 >> 16) */
Chris@69 146 #undef silk_SMLABT
Chris@69 147 static OPUS_INLINE opus_int32 silk_SMLABT_armv5e(opus_int32 a, opus_int32 b,
Chris@69 148 opus_int32 c)
Chris@69 149 {
Chris@69 150 int res;
Chris@69 151 __asm__(
Chris@69 152 "#silk_SMLABT\n\t"
Chris@69 153 "smlabt %0, %1, %2, %3\n\t"
Chris@69 154 : "=r"(res)
Chris@69 155 : "r"(b), "r"(c), "r"(a)
Chris@69 156 );
Chris@69 157 return res;
Chris@69 158 }
Chris@69 159 #define silk_SMLABT(a, b, c) (silk_SMLABT_armv5e(a, b, c))
Chris@69 160
Chris@69 161 /* add/subtract with output saturated */
Chris@69 162 #undef silk_ADD_SAT32
Chris@69 163 static OPUS_INLINE opus_int32 silk_ADD_SAT32_armv5e(opus_int32 a, opus_int32 b)
Chris@69 164 {
Chris@69 165 int res;
Chris@69 166 __asm__(
Chris@69 167 "#silk_ADD_SAT32\n\t"
Chris@69 168 "qadd %0, %1, %2\n\t"
Chris@69 169 : "=r"(res)
Chris@69 170 : "%r"(a), "r"(b)
Chris@69 171 );
Chris@69 172 return res;
Chris@69 173 }
Chris@69 174 #define silk_ADD_SAT32(a, b) (silk_ADD_SAT32_armv5e(a, b))
Chris@69 175
Chris@69 176 #undef silk_SUB_SAT32
Chris@69 177 static OPUS_INLINE opus_int32 silk_SUB_SAT32_armv5e(opus_int32 a, opus_int32 b)
Chris@69 178 {
Chris@69 179 int res;
Chris@69 180 __asm__(
Chris@69 181 "#silk_SUB_SAT32\n\t"
Chris@69 182 "qsub %0, %1, %2\n\t"
Chris@69 183 : "=r"(res)
Chris@69 184 : "r"(a), "r"(b)
Chris@69 185 );
Chris@69 186 return res;
Chris@69 187 }
Chris@69 188 #define silk_SUB_SAT32(a, b) (silk_SUB_SAT32_armv5e(a, b))
Chris@69 189
Chris@69 190 #undef silk_CLZ16
Chris@69 191 static OPUS_INLINE opus_int32 silk_CLZ16_armv5(opus_int16 in16)
Chris@69 192 {
Chris@69 193 int res;
Chris@69 194 __asm__(
Chris@69 195 "#silk_CLZ16\n\t"
Chris@69 196 "clz %0, %1;\n"
Chris@69 197 : "=r"(res)
Chris@69 198 : "r"(SAFE_SHL(in16,16)|0x8000)
Chris@69 199 );
Chris@69 200 return res;
Chris@69 201 }
Chris@69 202 #define silk_CLZ16(in16) (silk_CLZ16_armv5(in16))
Chris@69 203
Chris@69 204 #undef silk_CLZ32
Chris@69 205 static OPUS_INLINE opus_int32 silk_CLZ32_armv5(opus_int32 in32)
Chris@69 206 {
Chris@69 207 int res;
Chris@69 208 __asm__(
Chris@69 209 "#silk_CLZ32\n\t"
Chris@69 210 "clz %0, %1\n\t"
Chris@69 211 : "=r"(res)
Chris@69 212 : "r"(in32)
Chris@69 213 );
Chris@69 214 return res;
Chris@69 215 }
Chris@69 216 #define silk_CLZ32(in32) (silk_CLZ32_armv5(in32))
Chris@69 217
/* SAFE_SHL is a helper for this header only (silk_CLZ16 uses it); remove
   it again so it is not defined after this point. */
#undef SAFE_SHL
Chris@69 219
Chris@69 220 #endif /* SILK_MACROS_ARMv5E_H */