Chris@69: /*********************************************************************** Chris@69: Copyright (c) 2006-2011, Skype Limited. All rights reserved. Chris@69: Copyright (c) 2013 Parrot Chris@69: Redistribution and use in source and binary forms, with or without Chris@69: modification, are permitted provided that the following conditions Chris@69: are met: Chris@69: - Redistributions of source code must retain the above copyright notice, Chris@69: this list of conditions and the following disclaimer. Chris@69: - Redistributions in binary form must reproduce the above copyright Chris@69: notice, this list of conditions and the following disclaimer in the Chris@69: documentation and/or other materials provided with the distribution. Chris@69: - Neither the name of Internet Society, IETF or IETF Trust, nor the Chris@69: names of specific contributors, may be used to endorse or promote Chris@69: products derived from this software without specific prior written Chris@69: permission. Chris@69: THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" Chris@69: AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE Chris@69: IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE Chris@69: ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE Chris@69: LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR Chris@69: CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF Chris@69: SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS Chris@69: INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN Chris@69: CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) Chris@69: ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE Chris@69: POSSIBILITY OF SUCH DAMAGE. Chris@69: ***********************************************************************/ Chris@69: Chris@69: #ifndef SILK_MACROS_ARMv5E_H Chris@69: #define SILK_MACROS_ARMv5E_H Chris@69: Chris@69: /* This macro only avoids the undefined behaviour from a left shift of Chris@69: a negative value. It should only be used in macros that can't include Chris@69: SigProc_FIX.h. In other cases, use silk_LSHIFT32(). */ Chris@69: #define SAFE_SHL(a,b) ((opus_int32)((opus_uint32)(a) << (b))) Chris@69: Chris@69: /* (a32 * (opus_int32)((opus_int16)(b32))) >> 16 output have to be 32bit int */ Chris@69: #undef silk_SMULWB Chris@69: static OPUS_INLINE opus_int32 silk_SMULWB_armv5e(opus_int32 a, opus_int16 b) Chris@69: { Chris@69: int res; Chris@69: __asm__( Chris@69: "#silk_SMULWB\n\t" Chris@69: "smulwb %0, %1, %2\n\t" Chris@69: : "=r"(res) Chris@69: : "r"(a), "r"(b) Chris@69: ); Chris@69: return res; Chris@69: } Chris@69: #define silk_SMULWB(a, b) (silk_SMULWB_armv5e(a, b)) Chris@69: Chris@69: /* a32 + (b32 * (opus_int32)((opus_int16)(c32))) >> 16 output have to be 32bit int */ Chris@69: #undef silk_SMLAWB Chris@69: static OPUS_INLINE opus_int32 silk_SMLAWB_armv5e(opus_int32 a, opus_int32 b, Chris@69: opus_int16 c) Chris@69: { Chris@69: int res; Chris@69: __asm__( Chris@69: "#silk_SMLAWB\n\t" Chris@69: "smlawb %0, %1, %2, %3\n\t" Chris@69: : "=r"(res) Chris@69: : "r"(b), "r"(c), "r"(a) Chris@69: ); Chris@69: return res; Chris@69: } Chris@69: #define silk_SMLAWB(a, b, c) (silk_SMLAWB_armv5e(a, b, c)) Chris@69: Chris@69: /* (a32 * (b32 >> 16)) >> 16 */ Chris@69: #undef silk_SMULWT Chris@69: static OPUS_INLINE opus_int32 silk_SMULWT_armv5e(opus_int32 a, opus_int32 b) Chris@69: { Chris@69: int res; Chris@69: __asm__( Chris@69: "#silk_SMULWT\n\t" Chris@69: "smulwt %0, %1, %2\n\t" Chris@69: : "=r"(res) Chris@69: : "r"(a), "r"(b) Chris@69: ); Chris@69: return res; Chris@69: } Chris@69: #define silk_SMULWT(a, b) (silk_SMULWT_armv5e(a, b)) Chris@69: Chris@69: /* a32 + (b32 * (c32 >> 16)) >> 16 */ Chris@69: #undef silk_SMLAWT Chris@69: static OPUS_INLINE opus_int32 silk_SMLAWT_armv5e(opus_int32 a, opus_int32 b, Chris@69: opus_int32 c) Chris@69: { Chris@69: int res; Chris@69: __asm__( Chris@69: "#silk_SMLAWT\n\t" Chris@69: "smlawt %0, %1, %2, %3\n\t" Chris@69: : "=r"(res) Chris@69: : "r"(b), "r"(c), "r"(a) Chris@69: ); Chris@69: return res; Chris@69: } Chris@69: #define silk_SMLAWT(a, b, c) (silk_SMLAWT_armv5e(a, b, c)) Chris@69: Chris@69: /* (opus_int32)((opus_int16)(a3))) * (opus_int32)((opus_int16)(b32)) output have to be 32bit int */ Chris@69: #undef silk_SMULBB Chris@69: static OPUS_INLINE opus_int32 silk_SMULBB_armv5e(opus_int32 a, opus_int32 b) Chris@69: { Chris@69: int res; Chris@69: __asm__( Chris@69: "#silk_SMULBB\n\t" Chris@69: "smulbb %0, %1, %2\n\t" Chris@69: : "=r"(res) Chris@69: : "%r"(a), "r"(b) Chris@69: ); Chris@69: return res; Chris@69: } Chris@69: #define silk_SMULBB(a, b) (silk_SMULBB_armv5e(a, b)) Chris@69: Chris@69: /* a32 + (opus_int32)((opus_int16)(b32)) * (opus_int32)((opus_int16)(c32)) output have to be 32bit int */ Chris@69: #undef silk_SMLABB Chris@69: static OPUS_INLINE opus_int32 silk_SMLABB_armv5e(opus_int32 a, opus_int32 b, Chris@69: opus_int32 c) Chris@69: { Chris@69: int res; Chris@69: __asm__( Chris@69: "#silk_SMLABB\n\t" Chris@69: "smlabb %0, %1, %2, %3\n\t" Chris@69: : "=r"(res) Chris@69: : "%r"(b), "r"(c), "r"(a) Chris@69: ); Chris@69: return res; Chris@69: } Chris@69: #define silk_SMLABB(a, b, c) (silk_SMLABB_armv5e(a, b, c)) Chris@69: Chris@69: /* (opus_int32)((opus_int16)(a32)) * (b32 >> 16) */ Chris@69: #undef silk_SMULBT Chris@69: static OPUS_INLINE opus_int32 silk_SMULBT_armv5e(opus_int32 a, opus_int32 b) Chris@69: { Chris@69: int res; Chris@69: __asm__( Chris@69: "#silk_SMULBT\n\t" Chris@69: "smulbt %0, %1, %2\n\t" Chris@69: : "=r"(res) Chris@69: : "r"(a), "r"(b) Chris@69: ); Chris@69: return res; Chris@69: } Chris@69: #define silk_SMULBT(a, b) (silk_SMULBT_armv5e(a, b)) Chris@69: Chris@69: /* a32 + (opus_int32)((opus_int16)(b32)) * (c32 >> 16) */ Chris@69: #undef silk_SMLABT Chris@69: static OPUS_INLINE opus_int32 silk_SMLABT_armv5e(opus_int32 a, opus_int32 b, Chris@69: opus_int32 c) Chris@69: { Chris@69: int res; Chris@69: __asm__( Chris@69: "#silk_SMLABT\n\t" Chris@69: "smlabt %0, %1, %2, %3\n\t" Chris@69: : "=r"(res) Chris@69: : "r"(b), "r"(c), "r"(a) Chris@69: ); Chris@69: return res; Chris@69: } Chris@69: #define silk_SMLABT(a, b, c) (silk_SMLABT_armv5e(a, b, c)) Chris@69: Chris@69: /* add/subtract with output saturated */ Chris@69: #undef silk_ADD_SAT32 Chris@69: static OPUS_INLINE opus_int32 silk_ADD_SAT32_armv5e(opus_int32 a, opus_int32 b) Chris@69: { Chris@69: int res; Chris@69: __asm__( Chris@69: "#silk_ADD_SAT32\n\t" Chris@69: "qadd %0, %1, %2\n\t" Chris@69: : "=r"(res) Chris@69: : "%r"(a), "r"(b) Chris@69: ); Chris@69: return res; Chris@69: } Chris@69: #define silk_ADD_SAT32(a, b) (silk_ADD_SAT32_armv5e(a, b)) Chris@69: Chris@69: #undef silk_SUB_SAT32 Chris@69: static OPUS_INLINE opus_int32 silk_SUB_SAT32_armv5e(opus_int32 a, opus_int32 b) Chris@69: { Chris@69: int res; Chris@69: __asm__( Chris@69: "#silk_SUB_SAT32\n\t" Chris@69: "qsub %0, %1, %2\n\t" Chris@69: : "=r"(res) Chris@69: : "r"(a), "r"(b) Chris@69: ); Chris@69: return res; Chris@69: } Chris@69: #define silk_SUB_SAT32(a, b) (silk_SUB_SAT32_armv5e(a, b)) Chris@69: Chris@69: #undef silk_CLZ16 Chris@69: static OPUS_INLINE opus_int32 silk_CLZ16_armv5(opus_int16 in16) Chris@69: { Chris@69: int res; Chris@69: __asm__( Chris@69: "#silk_CLZ16\n\t" Chris@69: "clz %0, %1;\n" Chris@69: : "=r"(res) Chris@69: : "r"(SAFE_SHL(in16,16)|0x8000) Chris@69: ); Chris@69: return res; Chris@69: } Chris@69: #define silk_CLZ16(in16) (silk_CLZ16_armv5(in16)) Chris@69: Chris@69: #undef silk_CLZ32 Chris@69: static OPUS_INLINE opus_int32 silk_CLZ32_armv5(opus_int32 in32) Chris@69: { Chris@69: int res; Chris@69: __asm__( Chris@69: "#silk_CLZ32\n\t" Chris@69: "clz %0, %1\n\t" Chris@69: : "=r"(res) Chris@69: : "r"(in32) Chris@69: ); Chris@69: return res; Chris@69: } Chris@69: #define silk_CLZ32(in32) (silk_CLZ32_armv5(in32)) Chris@69: Chris@69: #undef SAFE_SHL Chris@69: Chris@69: #endif /* SILK_MACROS_ARMv5E_H */