annotate src/opus-1.3/silk/x86/main_sse.h @ 169:223a55898ab9 tip default

Add null config files
author Chris Cannam <cannam@all-day-breakfast.com>
date Mon, 02 Mar 2020 14:03:47 +0000
parents 4664ac0c1032
children
rev   line source
cannam@154 1 /* Copyright (c) 2014, Cisco Systems, INC
cannam@154 2 Written by XiangMingZhu WeiZhou MinPeng YanWang
cannam@154 3
cannam@154 4 Redistribution and use in source and binary forms, with or without
cannam@154 5 modification, are permitted provided that the following conditions
cannam@154 6 are met:
cannam@154 7
cannam@154 8 - Redistributions of source code must retain the above copyright
cannam@154 9 notice, this list of conditions and the following disclaimer.
cannam@154 10
cannam@154 11 - Redistributions in binary form must reproduce the above copyright
cannam@154 12 notice, this list of conditions and the following disclaimer in the
cannam@154 13 documentation and/or other materials provided with the distribution.
cannam@154 14
cannam@154 15 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
cannam@154 16 ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
cannam@154 17 LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
cannam@154 18 A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
cannam@154 19 OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
cannam@154 20 EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
cannam@154 21 PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
cannam@154 22 PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
cannam@154 23 LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
cannam@154 24 NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
cannam@154 25 SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
cannam@154 26 */
cannam@154 27
/* Include guard; it is closed by the last #endif of this header. */
cannam@154 28 #ifndef MAIN_SSE_H
cannam@154 29 #define MAIN_SSE_H
cannam@154 30
/* config.h is only included when the build defines HAVE_CONFIG_H. */
cannam@154 31 #ifdef HAVE_CONFIG_H
cannam@154 32 #include "config.h"
cannam@154 33 #endif
cannam@154 34
/* All declarations and macros below are visible only when
   OPUS_X86_MAY_HAVE_SSE4_1 is defined. */
cannam@154 35 # if defined(OPUS_X86_MAY_HAVE_SSE4_1)
cannam@154 36
/* silk_VQ_WMat_EC override.
   The whole region from this "#if 0" down to its matching #endif is compiled
   out. If it were enabled it would define OVERRIDE_silk_VQ_WMat_EC, declare
   the SSE4.1 routine and define silk_VQ_WMat_EC() as a macro that calls it. */
cannam@154 37 #if 0 /* FIXME: SSE disabled until silk_VQ_WMat_EC_sse4_1() gets updated. */
cannam@154 38 # define OVERRIDE_silk_VQ_WMat_EC
cannam@154 39
/* Prototype of the SSE4.1 implementation; note that it takes no arch argument. */
cannam@154 40 void silk_VQ_WMat_EC_sse4_1(
cannam@154 41 opus_int8 *ind, /* O index of best codebook vector */
cannam@154 42 opus_int32 *rate_dist_Q14, /* O best weighted quant error + mu * rate */
cannam@154 43 opus_int *gain_Q7, /* O sum of absolute LTP coefficients */
cannam@154 44 const opus_int16 *in_Q14, /* I input vector to be quantized */
cannam@154 45 const opus_int32 *W_Q18, /* I weighting matrix */
cannam@154 46 const opus_int8 *cb_Q7, /* I codebook */
cannam@154 47 const opus_uint8 *cb_gain_Q7, /* I codebook effective gain */
cannam@154 48 const opus_uint8 *cl_Q5, /* I code length for each codebook vector */
cannam@154 49 const opus_int mu_Q9, /* I tradeoff between weighted error and rate */
cannam@154 50 const opus_int32 max_gain_Q7, /* I maximum sum of absolute LTP coefficients */
cannam@154 51 opus_int L /* I number of vectors in codebook */
cannam@154 52 );
cannam@154 53
/* With OPUS_X86_PRESUME_SSE4_1 defined, the macro calls the SSE4.1 routine
   directly; arch is evaluated and discarded through (void)(arch). */
cannam@154 54 #if defined OPUS_X86_PRESUME_SSE4_1
cannam@154 55
cannam@154 56 #define silk_VQ_WMat_EC(ind, rate_dist_Q14, gain_Q7, in_Q14, W_Q18, cb_Q7, cb_gain_Q7, cl_Q5, \
cannam@154 57 mu_Q9, max_gain_Q7, L, arch) \
cannam@154 58 ((void)(arch),silk_VQ_WMat_EC_sse4_1(ind, rate_dist_Q14, gain_Q7, in_Q14, W_Q18, cb_Q7, cb_gain_Q7, cl_Q5, \
cannam@154 59 mu_Q9, max_gain_Q7, L))
cannam@154 60
/* Otherwise the macro calls through a table of function pointers indexed by
   (arch) & OPUS_ARCHMASK. The table has OPUS_ARCHMASK + 1 entries and is only
   declared here (extern); its definition is not in this header. */
cannam@154 61 #else
cannam@154 62
cannam@154 63 extern void (*const SILK_VQ_WMAT_EC_IMPL[OPUS_ARCHMASK + 1])(
cannam@154 64 opus_int8 *ind, /* O index of best codebook vector */
cannam@154 65 opus_int32 *rate_dist_Q14, /* O best weighted quant error + mu * rate */
cannam@154 66 opus_int *gain_Q7, /* O sum of absolute LTP coefficients */
cannam@154 67 const opus_int16 *in_Q14, /* I input vector to be quantized */
cannam@154 68 const opus_int32 *W_Q18, /* I weighting matrix */
cannam@154 69 const opus_int8 *cb_Q7, /* I codebook */
cannam@154 70 const opus_uint8 *cb_gain_Q7, /* I codebook effective gain */
cannam@154 71 const opus_uint8 *cl_Q5, /* I code length for each codebook vector */
cannam@154 72 const opus_int mu_Q9, /* I tradeoff between weighted error and rate */
cannam@154 73 const opus_int32 max_gain_Q7, /* I maximum sum of absolute LTP coefficients */
cannam@154 74 opus_int L /* I number of vectors in codebook */
cannam@154 75 );
cannam@154 76
cannam@154 77 # define silk_VQ_WMat_EC(ind, rate_dist_Q14, gain_Q7, in_Q14, W_Q18, cb_Q7, cb_gain_Q7, cl_Q5, \
cannam@154 78 mu_Q9, max_gain_Q7, L, arch) \
cannam@154 79 ((*SILK_VQ_WMAT_EC_IMPL[(arch) & OPUS_ARCHMASK])(ind, rate_dist_Q14, gain_Q7, in_Q14, W_Q18, cb_Q7, cb_gain_Q7, cl_Q5, \
cannam@154 80 mu_Q9, max_gain_Q7, L))
cannam@154 81
cannam@154 82 #endif /* OPUS_X86_PRESUME_SSE4_1 */
cannam@154 83 #endif /* #if 0 (silk_VQ_WMat_EC override) */
cannam@154 84
/* silk_NSQ and silk_NSQ_del_dec overrides.
   The "#if 0" below is not closed until the #endif that follows the
   silk_NSQ_del_dec macros, so BOTH the silk_NSQ section and the
   silk_NSQ_del_dec section are compiled out. */
cannam@154 85 #if 0 /* FIXME: SSE disabled until the NSQ code gets updated. */
cannam@154 86 # define OVERRIDE_silk_NSQ
cannam@154 87
/* Prototype of the SSE4.1 implementation; note that it takes no arch argument. */
cannam@154 88 void silk_NSQ_sse4_1(
cannam@154 89 const silk_encoder_state *psEncC, /* I Encoder State */
cannam@154 90 silk_nsq_state *NSQ, /* I/O NSQ state */
cannam@154 91 SideInfoIndices *psIndices, /* I/O Quantization Indices */
cannam@154 92 const opus_int32 x_Q3[], /* I Prefiltered input signal */
cannam@154 93 opus_int8 pulses[], /* O Quantized pulse signal */
cannam@154 94 const opus_int16 PredCoef_Q12[ 2 * MAX_LPC_ORDER ], /* I Short term prediction coefs */
cannam@154 95 const opus_int16 LTPCoef_Q14[ LTP_ORDER * MAX_NB_SUBFR ], /* I Long term prediction coefs */
cannam@154 96 const opus_int16 AR2_Q13[ MAX_NB_SUBFR * MAX_SHAPE_LPC_ORDER ], /* I Noise shaping coefs */
cannam@154 97 const opus_int HarmShapeGain_Q14[ MAX_NB_SUBFR ], /* I Long term shaping coefs */
cannam@154 98 const opus_int Tilt_Q14[ MAX_NB_SUBFR ], /* I Spectral tilt */
cannam@154 99 const opus_int32 LF_shp_Q14[ MAX_NB_SUBFR ], /* I Low frequency shaping coefs */
cannam@154 100 const opus_int32 Gains_Q16[ MAX_NB_SUBFR ], /* I Quantization step sizes */
cannam@154 101 const opus_int pitchL[ MAX_NB_SUBFR ], /* I Pitch lags */
cannam@154 102 const opus_int Lambda_Q10, /* I Rate/distortion tradeoff */
cannam@154 103 const opus_int LTP_scale_Q14 /* I LTP state scaling */
cannam@154 104 );
cannam@154 105
/* With OPUS_X86_PRESUME_SSE4_1 defined, silk_NSQ() calls the SSE4.1 routine
   directly; arch is evaluated and discarded through (void)(arch). */
cannam@154 106 #if defined OPUS_X86_PRESUME_SSE4_1
cannam@154 107
cannam@154 108 #define silk_NSQ(psEncC, NSQ, psIndices, x_Q3, pulses, PredCoef_Q12, LTPCoef_Q14, AR2_Q13, \
cannam@154 109 HarmShapeGain_Q14, Tilt_Q14, LF_shp_Q14, Gains_Q16, pitchL, Lambda_Q10, LTP_scale_Q14, arch) \
cannam@154 110 ((void)(arch),silk_NSQ_sse4_1(psEncC, NSQ, psIndices, x_Q3, pulses, PredCoef_Q12, LTPCoef_Q14, AR2_Q13, \
cannam@154 111 HarmShapeGain_Q14, Tilt_Q14, LF_shp_Q14, Gains_Q16, pitchL, Lambda_Q10, LTP_scale_Q14))
cannam@154 112
/* Otherwise silk_NSQ() calls through SILK_NSQ_IMPL, a table of
   OPUS_ARCHMASK + 1 function pointers indexed by (arch) & OPUS_ARCHMASK.
   The table is only declared here (extern). */
cannam@154 113 #else
cannam@154 114
cannam@154 115 extern void (*const SILK_NSQ_IMPL[OPUS_ARCHMASK + 1])(
cannam@154 116 const silk_encoder_state *psEncC, /* I Encoder State */
cannam@154 117 silk_nsq_state *NSQ, /* I/O NSQ state */
cannam@154 118 SideInfoIndices *psIndices, /* I/O Quantization Indices */
cannam@154 119 const opus_int32 x_Q3[], /* I Prefiltered input signal */
cannam@154 120 opus_int8 pulses[], /* O Quantized pulse signal */
cannam@154 121 const opus_int16 PredCoef_Q12[ 2 * MAX_LPC_ORDER ], /* I Short term prediction coefs */
cannam@154 122 const opus_int16 LTPCoef_Q14[ LTP_ORDER * MAX_NB_SUBFR ], /* I Long term prediction coefs */
cannam@154 123 const opus_int16 AR2_Q13[ MAX_NB_SUBFR * MAX_SHAPE_LPC_ORDER ], /* I Noise shaping coefs */
cannam@154 124 const opus_int HarmShapeGain_Q14[ MAX_NB_SUBFR ], /* I Long term shaping coefs */
cannam@154 125 const opus_int Tilt_Q14[ MAX_NB_SUBFR ], /* I Spectral tilt */
cannam@154 126 const opus_int32 LF_shp_Q14[ MAX_NB_SUBFR ], /* I Low frequency shaping coefs */
cannam@154 127 const opus_int32 Gains_Q16[ MAX_NB_SUBFR ], /* I Quantization step sizes */
cannam@154 128 const opus_int pitchL[ MAX_NB_SUBFR ], /* I Pitch lags */
cannam@154 129 const opus_int Lambda_Q10, /* I Rate/distortion tradeoff */
cannam@154 130 const opus_int LTP_scale_Q14 /* I LTP state scaling */
cannam@154 131 );
cannam@154 132
cannam@154 133 # define silk_NSQ(psEncC, NSQ, psIndices, x_Q3, pulses, PredCoef_Q12, LTPCoef_Q14, AR2_Q13, \
cannam@154 134 HarmShapeGain_Q14, Tilt_Q14, LF_shp_Q14, Gains_Q16, pitchL, Lambda_Q10, LTP_scale_Q14, arch) \
cannam@154 135 ((*SILK_NSQ_IMPL[(arch) & OPUS_ARCHMASK])(psEncC, NSQ, psIndices, x_Q3, pulses, PredCoef_Q12, LTPCoef_Q14, AR2_Q13, \
cannam@154 136 HarmShapeGain_Q14, Tilt_Q14, LF_shp_Q14, Gains_Q16, pitchL, Lambda_Q10, LTP_scale_Q14))
cannam@154 137
cannam@154 138 #endif /* OPUS_X86_PRESUME_SSE4_1 (silk_NSQ) */
cannam@154 139
/* silk_NSQ_del_dec section: still inside the "#if 0" opened above, so it is
   compiled out as well. It has the same parameter list as silk_NSQ. */
cannam@154 140 # define OVERRIDE_silk_NSQ_del_dec
cannam@154 141
cannam@154 142 void silk_NSQ_del_dec_sse4_1(
cannam@154 143 const silk_encoder_state *psEncC, /* I Encoder State */
cannam@154 144 silk_nsq_state *NSQ, /* I/O NSQ state */
cannam@154 145 SideInfoIndices *psIndices, /* I/O Quantization Indices */
cannam@154 146 const opus_int32 x_Q3[], /* I Prefiltered input signal */
cannam@154 147 opus_int8 pulses[], /* O Quantized pulse signal */
cannam@154 148 const opus_int16 PredCoef_Q12[ 2 * MAX_LPC_ORDER ], /* I Short term prediction coefs */
cannam@154 149 const opus_int16 LTPCoef_Q14[ LTP_ORDER * MAX_NB_SUBFR ], /* I Long term prediction coefs */
cannam@154 150 const opus_int16 AR2_Q13[ MAX_NB_SUBFR * MAX_SHAPE_LPC_ORDER ], /* I Noise shaping coefs */
cannam@154 151 const opus_int HarmShapeGain_Q14[ MAX_NB_SUBFR ], /* I Long term shaping coefs */
cannam@154 152 const opus_int Tilt_Q14[ MAX_NB_SUBFR ], /* I Spectral tilt */
cannam@154 153 const opus_int32 LF_shp_Q14[ MAX_NB_SUBFR ], /* I Low frequency shaping coefs */
cannam@154 154 const opus_int32 Gains_Q16[ MAX_NB_SUBFR ], /* I Quantization step sizes */
cannam@154 155 const opus_int pitchL[ MAX_NB_SUBFR ], /* I Pitch lags */
cannam@154 156 const opus_int Lambda_Q10, /* I Rate/distortion tradeoff */
cannam@154 157 const opus_int LTP_scale_Q14 /* I LTP state scaling */
cannam@154 158 );
cannam@154 159
/* Direct call when SSE4.1 is presumed; arch is evaluated and discarded. */
cannam@154 160 #if defined OPUS_X86_PRESUME_SSE4_1
cannam@154 161
cannam@154 162 #define silk_NSQ_del_dec(psEncC, NSQ, psIndices, x_Q3, pulses, PredCoef_Q12, LTPCoef_Q14, AR2_Q13, \
cannam@154 163 HarmShapeGain_Q14, Tilt_Q14, LF_shp_Q14, Gains_Q16, pitchL, Lambda_Q10, LTP_scale_Q14, arch) \
cannam@154 164 ((void)(arch),silk_NSQ_del_dec_sse4_1(psEncC, NSQ, psIndices, x_Q3, pulses, PredCoef_Q12, LTPCoef_Q14, AR2_Q13, \
cannam@154 165 HarmShapeGain_Q14, Tilt_Q14, LF_shp_Q14, Gains_Q16, pitchL, Lambda_Q10, LTP_scale_Q14))
cannam@154 166
/* Otherwise call through SILK_NSQ_DEL_DEC_IMPL, a table of
   OPUS_ARCHMASK + 1 function pointers indexed by (arch) & OPUS_ARCHMASK.
   The table is only declared here (extern). */
cannam@154 167 #else
cannam@154 168
cannam@154 169 extern void (*const SILK_NSQ_DEL_DEC_IMPL[OPUS_ARCHMASK + 1])(
cannam@154 170 const silk_encoder_state *psEncC, /* I Encoder State */
cannam@154 171 silk_nsq_state *NSQ, /* I/O NSQ state */
cannam@154 172 SideInfoIndices *psIndices, /* I/O Quantization Indices */
cannam@154 173 const opus_int32 x_Q3[], /* I Prefiltered input signal */
cannam@154 174 opus_int8 pulses[], /* O Quantized pulse signal */
cannam@154 175 const opus_int16 PredCoef_Q12[ 2 * MAX_LPC_ORDER ], /* I Short term prediction coefs */
cannam@154 176 const opus_int16 LTPCoef_Q14[ LTP_ORDER * MAX_NB_SUBFR ], /* I Long term prediction coefs */
cannam@154 177 const opus_int16 AR2_Q13[ MAX_NB_SUBFR * MAX_SHAPE_LPC_ORDER ], /* I Noise shaping coefs */
cannam@154 178 const opus_int HarmShapeGain_Q14[ MAX_NB_SUBFR ], /* I Long term shaping coefs */
cannam@154 179 const opus_int Tilt_Q14[ MAX_NB_SUBFR ], /* I Spectral tilt */
cannam@154 180 const opus_int32 LF_shp_Q14[ MAX_NB_SUBFR ], /* I Low frequency shaping coefs */
cannam@154 181 const opus_int32 Gains_Q16[ MAX_NB_SUBFR ], /* I Quantization step sizes */
cannam@154 182 const opus_int pitchL[ MAX_NB_SUBFR ], /* I Pitch lags */
cannam@154 183 const opus_int Lambda_Q10, /* I Rate/distortion tradeoff */
cannam@154 184 const opus_int LTP_scale_Q14 /* I LTP state scaling */
cannam@154 185 );
cannam@154 186
cannam@154 187 # define silk_NSQ_del_dec(psEncC, NSQ, psIndices, x_Q3, pulses, PredCoef_Q12, LTPCoef_Q14, AR2_Q13, \
cannam@154 188 HarmShapeGain_Q14, Tilt_Q14, LF_shp_Q14, Gains_Q16, pitchL, Lambda_Q10, LTP_scale_Q14, arch) \
cannam@154 189 ((*SILK_NSQ_DEL_DEC_IMPL[(arch) & OPUS_ARCHMASK])(psEncC, NSQ, psIndices, x_Q3, pulses, PredCoef_Q12, LTPCoef_Q14, AR2_Q13, \
cannam@154 190 HarmShapeGain_Q14, Tilt_Q14, LF_shp_Q14, Gains_Q16, pitchL, Lambda_Q10, LTP_scale_Q14))
cannam@154 191
cannam@154 192 #endif /* OPUS_X86_PRESUME_SSE4_1 (silk_NSQ_del_dec) */
cannam@154 193 #endif /* #if 0 (silk_NSQ and silk_NSQ_del_dec overrides) */
cannam@154 194
/* Declaration of silk_noise_shape_quantizer(); the definition is not in this
   header. This prototype is outside the "#if 0" regions, so it is active
   whenever OPUS_X86_MAY_HAVE_SSE4_1 is defined. Unlike the *_sse4_1 prototypes
   in this header, it takes an explicit arch argument as its last parameter. */
cannam@154 195 void silk_noise_shape_quantizer(
cannam@154 196 silk_nsq_state *NSQ, /* I/O NSQ state */
cannam@154 197 opus_int signalType, /* I Signal type */
cannam@154 198 const opus_int32 x_sc_Q10[], /* I */
cannam@154 199 opus_int8 pulses[], /* O */
cannam@154 200 opus_int16 xq[], /* O */
cannam@154 201 opus_int32 sLTP_Q15[], /* I/O LTP state */
cannam@154 202 const opus_int16 a_Q12[], /* I Short term prediction coefs */
cannam@154 203 const opus_int16 b_Q14[], /* I Long term prediction coefs */
cannam@154 204 const opus_int16 AR_shp_Q13[], /* I Noise shaping AR coefs */
cannam@154 205 opus_int lag, /* I Pitch lag */
cannam@154 206 opus_int32 HarmShapeFIRPacked_Q14, /* I */
cannam@154 207 opus_int Tilt_Q14, /* I Spectral tilt */
cannam@154 208 opus_int32 LF_shp_Q14, /* I */
cannam@154 209 opus_int32 Gain_Q16, /* I */
cannam@154 210 opus_int Lambda_Q10, /* I */
cannam@154 211 opus_int offset_Q10, /* I */
cannam@154 212 opus_int length, /* I Input length */
cannam@154 213 opus_int shapingLPCOrder, /* I Noise shaping AR filter order */
cannam@154 214 opus_int predictLPCOrder, /* I Prediction filter order */
cannam@154 215 int arch /* I Architecture */
cannam@154 216 );
cannam@154 217
cannam@154 218 /**************************/
cannam@154 219 /* Noise level estimation */
cannam@154 220 /**************************/
/* Declaration only; the definition is not in this header. The function
   returns nothing, so any result is delivered through psSilk_VAD (marked I/O). */
cannam@154 221 void silk_VAD_GetNoiseLevels(
cannam@154 222 const opus_int32 pX[ VAD_N_BANDS ], /* I subband energies */
cannam@154 223 silk_VAD_state *psSilk_VAD /* I/O Pointer to Silk VAD state */
cannam@154 224 );
cannam@154 225
/* silk_VAD_GetSA_Q8 override. This section is not wrapped in "#if 0", so it
   is active whenever OPUS_X86_MAY_HAVE_SSE4_1 is defined. */
cannam@154 226 # define OVERRIDE_silk_VAD_GetSA_Q8
cannam@154 227
/* Prototype of the SSE4.1 implementation; note that it takes no arch argument. */
cannam@154 228 opus_int silk_VAD_GetSA_Q8_sse4_1(
cannam@154 229 silk_encoder_state *psEnC,
cannam@154 230 const opus_int16 pIn[]
cannam@154 231 );
cannam@154 232
/* With OPUS_X86_PRESUME_SSE4_1 defined, call the SSE4.1 routine directly;
   arch is evaluated and discarded through (void)(arch). */
cannam@154 233 #if defined(OPUS_X86_PRESUME_SSE4_1)
cannam@154 234 #define silk_VAD_GetSA_Q8(psEnC, pIn, arch) ((void)(arch),silk_VAD_GetSA_Q8_sse4_1(psEnC, pIn))
cannam@154 235
/* Otherwise call through SILK_VAD_GETSA_Q8_IMPL, indexed by
   (arch) & OPUS_ARCHMASK. The macro is defined before the table is declared;
   that is harmless because the macro body is only expanded where it is used. */
cannam@154 236 #else
cannam@154 237
cannam@154 238 # define silk_VAD_GetSA_Q8(psEnC, pIn, arch) \
cannam@154 239 ((*SILK_VAD_GETSA_Q8_IMPL[(arch) & OPUS_ARCHMASK])(psEnC, pIn))
cannam@154 240
/* Table of OPUS_ARCHMASK + 1 function pointers; declared here (extern) only. */
cannam@154 241 extern opus_int (*const SILK_VAD_GETSA_Q8_IMPL[OPUS_ARCHMASK + 1])(
cannam@154 242 silk_encoder_state *psEnC,
cannam@154 243 const opus_int16 pIn[]);
cannam@154 244
cannam@154 245 #endif /* OPUS_X86_PRESUME_SSE4_1 (silk_VAD_GetSA_Q8) */
cannam@154 246
cannam@154 247 # endif /* OPUS_X86_MAY_HAVE_SSE4_1 */
cannam@154 248 #endif /* MAIN_SSE_H */