annotate src/fftw-3.3.5/dft/simd/common/n1fv_128.c @ 83:ae30d91d2ffe

Replace these with versions built using an older toolset (so as to avoid ABI incompatibilities when linking on Ubuntu 14.04 for packaging purposes)
author Chris Cannam
date Fri, 07 Feb 2020 11:51:13 +0000
parents 2cd0e3b3e1fd
children
rev   line source
Chris@42 1 /*
Chris@42 2 * Copyright (c) 2003, 2007-14 Matteo Frigo
Chris@42 3 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
Chris@42 4 *
Chris@42 5 * This program is free software; you can redistribute it and/or modify
Chris@42 6 * it under the terms of the GNU General Public License as published by
Chris@42 7 * the Free Software Foundation; either version 2 of the License, or
Chris@42 8 * (at your option) any later version.
Chris@42 9 *
Chris@42 10 * This program is distributed in the hope that it will be useful,
Chris@42 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Chris@42 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
Chris@42 13 * GNU General Public License for more details.
Chris@42 14 *
Chris@42 15 * You should have received a copy of the GNU General Public License
Chris@42 16 * along with this program; if not, write to the Free Software
Chris@42 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Chris@42 18 *
Chris@42 19 */
Chris@42 20
Chris@42 21 /* This file was automatically generated --- DO NOT EDIT */
Chris@42 22 /* Generated on Sat Jul 30 16:38:48 EDT 2016 */
Chris@42 23
Chris@42 24 #include "codelet-dft.h"
Chris@42 25
Chris@42 26 #ifdef HAVE_FMA
Chris@42 27
Chris@42 28 /* Generated by: ../../../genfft/gen_notw_c.native -fma -reorder-insns -schedule-for-pipeline -simd -compact -variables 4 -pipeline-latency 8 -n 128 -name n1fv_128 -include n1f.h */
Chris@42 29
Chris@42 30 /*
Chris@42 31 * This function contains 1082 FP additions, 642 FP multiplications,
Chris@42 32 * (or, 440 additions, 0 multiplications, 642 fused multiply/add),
Chris@42 33 * 295 stack variables, 31 constants, and 256 memory accesses
Chris@42 34 */
Chris@42 35 #include "n1f.h"
Chris@42 36
Chris@42 37 static void n1fv_128(const R *ri, const R *ii, R *ro, R *io, stride is, stride os, INT v, INT ivs, INT ovs)
Chris@42 38 {
Chris@42 39 DVK(KP903989293, +0.903989293123443331586200297230537048710132025);
Chris@42 40 DVK(KP941544065, +0.941544065183020778412509402599502357185589796);
Chris@42 41 DVK(KP357805721, +0.357805721314524104672487743774474392487532769);
Chris@42 42 DVK(KP472964775, +0.472964775891319928124438237972992463904131113);
Chris@42 43 DVK(KP857728610, +0.857728610000272069902269984284770137042490799);
Chris@42 44 DVK(KP970031253, +0.970031253194543992603984207286100251456865962);
Chris@42 45 DVK(KP250486960, +0.250486960191305461595702160124721208578685568);
Chris@42 46 DVK(KP998795456, +0.998795456205172392714771604759100694443203615);
Chris@42 47 DVK(KP740951125, +0.740951125354959091175616897495162729728955309);
Chris@42 48 DVK(KP599376933, +0.599376933681923766271389869014404232837890546);
Chris@42 49 DVK(KP906347169, +0.906347169019147157946142717268914412664134293);
Chris@42 50 DVK(KP049126849, +0.049126849769467254105343321271313617079695752);
Chris@42 51 DVK(KP989176509, +0.989176509964780973451673738016243063983689533);
Chris@42 52 DVK(KP803207531, +0.803207531480644909806676512963141923879569427);
Chris@42 53 DVK(KP741650546, +0.741650546272035369581266691172079863842265220);
Chris@42 54 DVK(KP956940335, +0.956940335732208864935797886980269969482849206);
Chris@42 55 DVK(KP148335987, +0.148335987538347428753676511486911367000625355);
Chris@42 56 DVK(KP881921264, +0.881921264348355029712756863660388349508442621);
Chris@42 57 DVK(KP303346683, +0.303346683607342391675883946941299872384187453);
Chris@42 58 DVK(KP534511135, +0.534511135950791641089685961295362908582039528);
Chris@42 59 DVK(KP773010453, +0.773010453362736960810906609758469800971041293);
Chris@42 60 DVK(KP995184726, +0.995184726672196886244836953109479921575474869);
Chris@42 61 DVK(KP820678790, +0.820678790828660330972281985331011598767386482);
Chris@42 62 DVK(KP098491403, +0.098491403357164253077197521291327432293052451);
Chris@42 63 DVK(KP831469612, +0.831469612302545237078788377617905756738560812);
Chris@42 64 DVK(KP980785280, +0.980785280403230449126182236134239036973933731);
Chris@42 65 DVK(KP198912367, +0.198912367379658006911597622644676228597850501);
Chris@42 66 DVK(KP668178637, +0.668178637919298919997757686523080761552472251);
Chris@42 67 DVK(KP923879532, +0.923879532511286756128183189396788286822416626);
Chris@42 68 DVK(KP414213562, +0.414213562373095048801688724209698078569671875);
Chris@42 69 DVK(KP707106781, +0.707106781186547524400844362104849039284835938);
Chris@42 70 {
Chris@42 71 INT i;
Chris@42 72 const R *xi;
Chris@42 73 R *xo;
Chris@42 74 xi = ri;
Chris@42 75 xo = ro;
Chris@42 76 for (i = v; i > 0; i = i - VL, xi = xi + (VL * ivs), xo = xo + (VL * ovs), MAKE_VOLATILE_STRIDE(256, is), MAKE_VOLATILE_STRIDE(256, os)) {
Chris@42 77 V T6a, T5J, T6b, T5K, T6B, T6C, T6J, T6A, T6o, T6j, T6r, T68, T6e, T5O, T5R;
Chris@42 78 V T6d, T6D, T6K;
Chris@42 79 {
Chris@42 80 V Tad, TcZ, T6Z, T8T, T4U, Tr, Tfq, TgG, Ted, Tgf, Td0, Tcc, T9k, T84, Tb6;
Chris@42 81 V Tbt, Td8, TdK, TeK, Tgq, TeV, Tgt, T7q, T94, T3p, T5X, T7B, T97, T2G, T5U;
Chris@42 82 V TbD, Tc0, Tdf, TdN, Tf5, Tgx, Tfg, TgA, T7J, T9b, T4E, T64, T7U, T9e, T3V;
Chris@42 83 V T61, Td2, Td3, T85, T72, T4V, TI, Tcd, Tas, TgH, Tek, Tgg, Tft, T86, T75;
Chris@42 84 V T4W, TZ, TaI, Tcg, Tdr, TdG, Tgi, Tet, Tgj, Teq, T8X, T7a, T5M, T1B, T8W;
Chris@42 85 V T7d, T5N, T1s, TaX, Tcf, Tdo, TdH, Tgl, TeC, Tgm, Tez, T90, T7h, T5P, T2c;
Chris@42 86 V T8Z, T7k, T5Q, T23, T3Y, T49, TdL, Tdb, Tbu, Tbl, Tgu, TeR, Tgr, TeY, Tf6;
Chris@42 87 V TbG, T5V, T3s, T5Y, T3f, T95, T7E, T98, T7x, T4g, T4f, T4q, TbH, T41, TbI;
Chris@42 88 V T44, T4h, T4j, T4k, Tf9, TbN;
Chris@42 89 {
Chris@42 90 V Tu, TF, Ty, TL, TW, Tah, Tx, Tag, Tee, Tz, TM, TN, Teh, Tan, TP;
Chris@42 91 V TQ;
Chris@42 92 {
Chris@42 93 V TeG, T2A, Tbq, TeT, Tbp, TeH, T3m, T2x, Td6, T7o, T2q, T3l, T7z, Tbr, T2D;
Chris@42 94 V T82, T83;
Chris@42 95 {
Chris@42 96 V Ta7, T3, Ta8, T4O, Taa, Tab, Ta, T4P, Te, Tc9, Th, Tca, Tl, Tc6, Tc7;
Chris@42 97 V To;
Chris@42 98 {
Chris@42 99 V T1, T2, T4M, T4N;
Chris@42 100 T1 = LD(&(xi[0]), ivs, &(xi[0]));
Chris@42 101 T2 = LD(&(xi[WS(is, 64)]), ivs, &(xi[0]));
Chris@42 102 T4M = LD(&(xi[WS(is, 32)]), ivs, &(xi[0]));
Chris@42 103 T4N = LD(&(xi[WS(is, 96)]), ivs, &(xi[0]));
Chris@42 104 {
Chris@42 105 V T4, T5, T7, T8;
Chris@42 106 T4 = LD(&(xi[WS(is, 16)]), ivs, &(xi[0]));
Chris@42 107 T5 = LD(&(xi[WS(is, 80)]), ivs, &(xi[0]));
Chris@42 108 T7 = LD(&(xi[WS(is, 112)]), ivs, &(xi[0]));
Chris@42 109 T8 = LD(&(xi[WS(is, 48)]), ivs, &(xi[0]));
Chris@42 110 {
Chris@42 111 V Tc, T6, T9, Td, Tf, Tg;
Chris@42 112 Tc = LD(&(xi[WS(is, 8)]), ivs, &(xi[0]));
Chris@42 113 Ta7 = VADD(T1, T2);
Chris@42 114 T3 = VSUB(T1, T2);
Chris@42 115 Ta8 = VADD(T4M, T4N);
Chris@42 116 T4O = VSUB(T4M, T4N);
Chris@42 117 Taa = VADD(T4, T5);
Chris@42 118 T6 = VSUB(T4, T5);
Chris@42 119 Tab = VADD(T7, T8);
Chris@42 120 T9 = VSUB(T7, T8);
Chris@42 121 Td = LD(&(xi[WS(is, 72)]), ivs, &(xi[0]));
Chris@42 122 Tf = LD(&(xi[WS(is, 40)]), ivs, &(xi[0]));
Chris@42 123 Tg = LD(&(xi[WS(is, 104)]), ivs, &(xi[0]));
Chris@42 124 {
Chris@42 125 V Tj, Tk, Tm, Tn;
Chris@42 126 Tj = LD(&(xi[WS(is, 120)]), ivs, &(xi[0]));
Chris@42 127 Tk = LD(&(xi[WS(is, 56)]), ivs, &(xi[0]));
Chris@42 128 Tm = LD(&(xi[WS(is, 88)]), ivs, &(xi[0]));
Chris@42 129 Tn = LD(&(xi[WS(is, 24)]), ivs, &(xi[0]));
Chris@42 130 Ta = VADD(T6, T9);
Chris@42 131 T4P = VSUB(T9, T6);
Chris@42 132 Te = VSUB(Tc, Td);
Chris@42 133 Tc9 = VADD(Tc, Td);
Chris@42 134 Th = VSUB(Tf, Tg);
Chris@42 135 Tca = VADD(Tf, Tg);
Chris@42 136 Tl = VSUB(Tj, Tk);
Chris@42 137 Tc6 = VADD(Tj, Tk);
Chris@42 138 Tc7 = VADD(Tn, Tm);
Chris@42 139 To = VSUB(Tm, Tn);
Chris@42 140 }
Chris@42 141 }
Chris@42 142 }
Chris@42 143 }
Chris@42 144 {
Chris@42 145 V T6X, Tb, Te9, Ta9, Tcb, Tea, T4R, Ti, Tfo, Tac, Tp, T4S, Tc8, Teb, T4Q;
Chris@42 146 T6X = VFNMS(LDK(KP707106781), Ta, T3);
Chris@42 147 Tb = VFMA(LDK(KP707106781), Ta, T3);
Chris@42 148 Te9 = VSUB(Ta7, Ta8);
Chris@42 149 Ta9 = VADD(Ta7, Ta8);
Chris@42 150 Tcb = VADD(Tc9, Tca);
Chris@42 151 Tea = VSUB(Tc9, Tca);
Chris@42 152 T4R = VFMA(LDK(KP414213562), Te, Th);
Chris@42 153 Ti = VFNMS(LDK(KP414213562), Th, Te);
Chris@42 154 Tfo = VSUB(Tab, Taa);
Chris@42 155 Tac = VADD(Taa, Tab);
Chris@42 156 Tp = VFNMS(LDK(KP414213562), To, Tl);
Chris@42 157 T4S = VFMA(LDK(KP414213562), Tl, To);
Chris@42 158 Tc8 = VADD(Tc6, Tc7);
Chris@42 159 Teb = VSUB(Tc6, Tc7);
Chris@42 160 T4Q = VFNMS(LDK(KP707106781), T4P, T4O);
Chris@42 161 T82 = VFMA(LDK(KP707106781), T4P, T4O);
Chris@42 162 {
Chris@42 163 V T4T, T6Y, Tq, Tfp, Tec;
Chris@42 164 T4T = VSUB(T4R, T4S);
Chris@42 165 T6Y = VADD(T4R, T4S);
Chris@42 166 T83 = VSUB(Tp, Ti);
Chris@42 167 Tq = VADD(Ti, Tp);
Chris@42 168 Tfp = VSUB(Teb, Tea);
Chris@42 169 Tec = VADD(Tea, Teb);
Chris@42 170 Tad = VSUB(Ta9, Tac);
Chris@42 171 TcZ = VADD(Ta9, Tac);
Chris@42 172 T6Z = VFMA(LDK(KP923879532), T6Y, T6X);
Chris@42 173 T8T = VFNMS(LDK(KP923879532), T6Y, T6X);
Chris@42 174 T4U = VFMA(LDK(KP923879532), T4T, T4Q);
Chris@42 175 T6a = VFNMS(LDK(KP923879532), T4T, T4Q);
Chris@42 176 Tr = VFMA(LDK(KP923879532), Tq, Tb);
Chris@42 177 T5J = VFNMS(LDK(KP923879532), Tq, Tb);
Chris@42 178 Tfq = VFMA(LDK(KP707106781), Tfp, Tfo);
Chris@42 179 TgG = VFNMS(LDK(KP707106781), Tfp, Tfo);
Chris@42 180 Ted = VFMA(LDK(KP707106781), Tec, Te9);
Chris@42 181 Tgf = VFNMS(LDK(KP707106781), Tec, Te9);
Chris@42 182 Td0 = VADD(Tcb, Tc8);
Chris@42 183 Tcc = VSUB(Tc8, Tcb);
Chris@42 184 }
Chris@42 185 }
Chris@42 186 }
Chris@42 187 {
Chris@42 188 V T2i, T3j, Tb2, T2B, Tb5, T3k, T2p, T2C;
Chris@42 189 {
Chris@42 190 V T2m, Tb0, Tb1, Tb3, T2l, T2n;
Chris@42 191 {
Chris@42 192 V T2g, T2h, T3h, T3i, T2j, T2k;
Chris@42 193 T2g = LD(&(xi[WS(is, 1)]), ivs, &(xi[WS(is, 1)]));
Chris@42 194 T2h = LD(&(xi[WS(is, 65)]), ivs, &(xi[WS(is, 1)]));
Chris@42 195 T3h = LD(&(xi[WS(is, 33)]), ivs, &(xi[WS(is, 1)]));
Chris@42 196 T3i = LD(&(xi[WS(is, 97)]), ivs, &(xi[WS(is, 1)]));
Chris@42 197 T2j = LD(&(xi[WS(is, 17)]), ivs, &(xi[WS(is, 1)]));
Chris@42 198 T2k = LD(&(xi[WS(is, 81)]), ivs, &(xi[WS(is, 1)]));
Chris@42 199 T2m = LD(&(xi[WS(is, 113)]), ivs, &(xi[WS(is, 1)]));
Chris@42 200 T9k = VFNMS(LDK(KP923879532), T83, T82);
Chris@42 201 T84 = VFMA(LDK(KP923879532), T83, T82);
Chris@42 202 T2i = VSUB(T2g, T2h);
Chris@42 203 Tb0 = VADD(T2g, T2h);
Chris@42 204 T3j = VSUB(T3h, T3i);
Chris@42 205 Tb1 = VADD(T3h, T3i);
Chris@42 206 Tb3 = VADD(T2j, T2k);
Chris@42 207 T2l = VSUB(T2j, T2k);
Chris@42 208 T2n = LD(&(xi[WS(is, 49)]), ivs, &(xi[WS(is, 1)]));
Chris@42 209 }
Chris@42 210 {
Chris@42 211 V T2r, T2s, T2u, T2v;
Chris@42 212 T2r = LD(&(xi[WS(is, 9)]), ivs, &(xi[WS(is, 1)]));
Chris@42 213 T2s = LD(&(xi[WS(is, 73)]), ivs, &(xi[WS(is, 1)]));
Chris@42 214 T2u = LD(&(xi[WS(is, 41)]), ivs, &(xi[WS(is, 1)]));
Chris@42 215 T2v = LD(&(xi[WS(is, 105)]), ivs, &(xi[WS(is, 1)]));
Chris@42 216 TeG = VSUB(Tb0, Tb1);
Chris@42 217 Tb2 = VADD(Tb0, Tb1);
Chris@42 218 {
Chris@42 219 V T2y, T2z, Tb4, T2o, Tbn, T2t, Tbo, T2w;
Chris@42 220 T2y = LD(&(xi[WS(is, 121)]), ivs, &(xi[WS(is, 1)]));
Chris@42 221 T2z = LD(&(xi[WS(is, 57)]), ivs, &(xi[WS(is, 1)]));
Chris@42 222 Tb4 = VADD(T2m, T2n);
Chris@42 223 T2o = VSUB(T2m, T2n);
Chris@42 224 Tbn = VADD(T2r, T2s);
Chris@42 225 T2t = VSUB(T2r, T2s);
Chris@42 226 Tbo = VADD(T2u, T2v);
Chris@42 227 T2w = VSUB(T2u, T2v);
Chris@42 228 T2B = LD(&(xi[WS(is, 25)]), ivs, &(xi[WS(is, 1)]));
Chris@42 229 T2A = VSUB(T2y, T2z);
Chris@42 230 Tbq = VADD(T2y, T2z);
Chris@42 231 TeT = VSUB(Tb3, Tb4);
Chris@42 232 Tb5 = VADD(Tb3, Tb4);
Chris@42 233 T3k = VSUB(T2l, T2o);
Chris@42 234 T2p = VADD(T2l, T2o);
Chris@42 235 Tbp = VADD(Tbn, Tbo);
Chris@42 236 TeH = VSUB(Tbn, Tbo);
Chris@42 237 T3m = VFMA(LDK(KP414213562), T2t, T2w);
Chris@42 238 T2x = VFNMS(LDK(KP414213562), T2w, T2t);
Chris@42 239 T2C = LD(&(xi[WS(is, 89)]), ivs, &(xi[WS(is, 1)]));
Chris@42 240 }
Chris@42 241 }
Chris@42 242 }
Chris@42 243 Td6 = VADD(Tb2, Tb5);
Chris@42 244 Tb6 = VSUB(Tb2, Tb5);
Chris@42 245 T7o = VFNMS(LDK(KP707106781), T2p, T2i);
Chris@42 246 T2q = VFMA(LDK(KP707106781), T2p, T2i);
Chris@42 247 T3l = VFMA(LDK(KP707106781), T3k, T3j);
Chris@42 248 T7z = VFNMS(LDK(KP707106781), T3k, T3j);
Chris@42 249 Tbr = VADD(T2B, T2C);
Chris@42 250 T2D = VSUB(T2B, T2C);
Chris@42 251 }
Chris@42 252 {
Chris@42 253 V Tf1, Tfe, Tf2, TbZ, T3M, T4B, Tdd, T3F, T7H, T4A, T7S, TbW, Tf3, T4C, T3T;
Chris@42 254 {
Chris@42 255 V T3x, T4y, Tbz, T3Q, TbC, T4z, T3E, T3R, T3P, TbU, TbV, T3S;
Chris@42 256 {
Chris@42 257 V T3y, T3z, T3B, T3C;
Chris@42 258 {
Chris@42 259 V T3v, T3w, T4w, T4x;
Chris@42 260 T3v = LD(&(xi[WS(is, 127)]), ivs, &(xi[WS(is, 1)]));
Chris@42 261 T3w = LD(&(xi[WS(is, 63)]), ivs, &(xi[WS(is, 1)]));
Chris@42 262 T4w = LD(&(xi[WS(is, 95)]), ivs, &(xi[WS(is, 1)]));
Chris@42 263 T4x = LD(&(xi[WS(is, 31)]), ivs, &(xi[WS(is, 1)]));
Chris@42 264 T3y = LD(&(xi[WS(is, 15)]), ivs, &(xi[WS(is, 1)]));
Chris@42 265 {
Chris@42 266 V Tbs, TeI, T3n, T2E, Tbx;
Chris@42 267 Tbs = VADD(Tbq, Tbr);
Chris@42 268 TeI = VSUB(Tbq, Tbr);
Chris@42 269 T3n = VFNMS(LDK(KP414213562), T2A, T2D);
Chris@42 270 T2E = VFMA(LDK(KP414213562), T2D, T2A);
Chris@42 271 T3x = VSUB(T3v, T3w);
Chris@42 272 Tbx = VADD(T3v, T3w);
Chris@42 273 {
Chris@42 274 V Tby, Td7, TeJ, TeU;
Chris@42 275 T4y = VSUB(T4w, T4x);
Chris@42 276 Tby = VADD(T4x, T4w);
Chris@42 277 Td7 = VADD(Tbp, Tbs);
Chris@42 278 Tbt = VSUB(Tbp, Tbs);
Chris@42 279 TeJ = VADD(TeH, TeI);
Chris@42 280 TeU = VSUB(TeH, TeI);
Chris@42 281 {
Chris@42 282 V T7p, T3o, T7A, T2F;
Chris@42 283 T7p = VSUB(T3m, T3n);
Chris@42 284 T3o = VADD(T3m, T3n);
Chris@42 285 T7A = VSUB(T2x, T2E);
Chris@42 286 T2F = VADD(T2x, T2E);
Chris@42 287 Tbz = VADD(Tbx, Tby);
Chris@42 288 Tf1 = VSUB(Tbx, Tby);
Chris@42 289 Td8 = VADD(Td6, Td7);
Chris@42 290 TdK = VSUB(Td6, Td7);
Chris@42 291 TeK = VFMA(LDK(KP707106781), TeJ, TeG);
Chris@42 292 Tgq = VFNMS(LDK(KP707106781), TeJ, TeG);
Chris@42 293 TeV = VFMA(LDK(KP707106781), TeU, TeT);
Chris@42 294 Tgt = VFNMS(LDK(KP707106781), TeU, TeT);
Chris@42 295 T7q = VFMA(LDK(KP923879532), T7p, T7o);
Chris@42 296 T94 = VFNMS(LDK(KP923879532), T7p, T7o);
Chris@42 297 T3p = VFMA(LDK(KP923879532), T3o, T3l);
Chris@42 298 T5X = VFNMS(LDK(KP923879532), T3o, T3l);
Chris@42 299 T7B = VFNMS(LDK(KP923879532), T7A, T7z);
Chris@42 300 T97 = VFMA(LDK(KP923879532), T7A, T7z);
Chris@42 301 T2G = VFMA(LDK(KP923879532), T2F, T2q);
Chris@42 302 T5U = VFNMS(LDK(KP923879532), T2F, T2q);
Chris@42 303 T3z = LD(&(xi[WS(is, 79)]), ivs, &(xi[WS(is, 1)]));
Chris@42 304 }
Chris@42 305 }
Chris@42 306 }
Chris@42 307 T3B = LD(&(xi[WS(is, 111)]), ivs, &(xi[WS(is, 1)]));
Chris@42 308 T3C = LD(&(xi[WS(is, 47)]), ivs, &(xi[WS(is, 1)]));
Chris@42 309 }
Chris@42 310 {
Chris@42 311 V T3G, T3H, T3J, T3K;
Chris@42 312 T3G = LD(&(xi[WS(is, 7)]), ivs, &(xi[WS(is, 1)]));
Chris@42 313 T3H = LD(&(xi[WS(is, 71)]), ivs, &(xi[WS(is, 1)]));
Chris@42 314 T3J = LD(&(xi[WS(is, 103)]), ivs, &(xi[WS(is, 1)]));
Chris@42 315 T3K = LD(&(xi[WS(is, 39)]), ivs, &(xi[WS(is, 1)]));
Chris@42 316 {
Chris@42 317 V T3N, T3A, TbA, T3D, TbB, T3I, TbX, T3L, TbY, T3O;
Chris@42 318 T3N = LD(&(xi[WS(is, 119)]), ivs, &(xi[WS(is, 1)]));
Chris@42 319 T3A = VSUB(T3y, T3z);
Chris@42 320 TbA = VADD(T3y, T3z);
Chris@42 321 T3D = VSUB(T3B, T3C);
Chris@42 322 TbB = VADD(T3B, T3C);
Chris@42 323 T3I = VSUB(T3G, T3H);
Chris@42 324 TbX = VADD(T3G, T3H);
Chris@42 325 T3L = VSUB(T3J, T3K);
Chris@42 326 TbY = VADD(T3K, T3J);
Chris@42 327 T3O = LD(&(xi[WS(is, 55)]), ivs, &(xi[WS(is, 1)]));
Chris@42 328 T3Q = LD(&(xi[WS(is, 87)]), ivs, &(xi[WS(is, 1)]));
Chris@42 329 Tfe = VSUB(TbB, TbA);
Chris@42 330 TbC = VADD(TbA, TbB);
Chris@42 331 T4z = VSUB(T3D, T3A);
Chris@42 332 T3E = VADD(T3A, T3D);
Chris@42 333 T3R = LD(&(xi[WS(is, 23)]), ivs, &(xi[WS(is, 1)]));
Chris@42 334 Tf2 = VSUB(TbX, TbY);
Chris@42 335 TbZ = VADD(TbX, TbY);
Chris@42 336 T3M = VFMA(LDK(KP414213562), T3L, T3I);
Chris@42 337 T4B = VFNMS(LDK(KP414213562), T3I, T3L);
Chris@42 338 T3P = VSUB(T3N, T3O);
Chris@42 339 TbU = VADD(T3N, T3O);
Chris@42 340 }
Chris@42 341 }
Chris@42 342 }
Chris@42 343 Tdd = VADD(Tbz, TbC);
Chris@42 344 TbD = VSUB(Tbz, TbC);
Chris@42 345 TbV = VADD(T3R, T3Q);
Chris@42 346 T3S = VSUB(T3Q, T3R);
Chris@42 347 T3F = VFMA(LDK(KP707106781), T3E, T3x);
Chris@42 348 T7H = VFNMS(LDK(KP707106781), T3E, T3x);
Chris@42 349 T4A = VFMA(LDK(KP707106781), T4z, T4y);
Chris@42 350 T7S = VFNMS(LDK(KP707106781), T4z, T4y);
Chris@42 351 TbW = VADD(TbU, TbV);
Chris@42 352 Tf3 = VSUB(TbU, TbV);
Chris@42 353 T4C = VFMA(LDK(KP414213562), T3P, T3S);
Chris@42 354 T3T = VFNMS(LDK(KP414213562), T3S, T3P);
Chris@42 355 }
Chris@42 356 {
Chris@42 357 V TD, Tae, TE, TJ, TK, TU, TV;
Chris@42 358 {
Chris@42 359 V Ts, Tt, Tde, Tf4, Tff;
Chris@42 360 Ts = LD(&(xi[WS(is, 4)]), ivs, &(xi[0]));
Chris@42 361 Tt = LD(&(xi[WS(is, 68)]), ivs, &(xi[0]));
Chris@42 362 TD = LD(&(xi[WS(is, 36)]), ivs, &(xi[0]));
Chris@42 363 Tde = VADD(TbZ, TbW);
Chris@42 364 Tc0 = VSUB(TbW, TbZ);
Chris@42 365 Tf4 = VADD(Tf2, Tf3);
Chris@42 366 Tff = VSUB(Tf3, Tf2);
Chris@42 367 {
Chris@42 368 V T7I, T4D, T7T, T3U;
Chris@42 369 T7I = VSUB(T4C, T4B);
Chris@42 370 T4D = VADD(T4B, T4C);
Chris@42 371 T7T = VSUB(T3T, T3M);
Chris@42 372 T3U = VADD(T3M, T3T);
Chris@42 373 Tae = VADD(Ts, Tt);
Chris@42 374 Tu = VSUB(Ts, Tt);
Chris@42 375 Tdf = VADD(Tdd, Tde);
Chris@42 376 TdN = VSUB(Tdd, Tde);
Chris@42 377 Tf5 = VFMA(LDK(KP707106781), Tf4, Tf1);
Chris@42 378 Tgx = VFNMS(LDK(KP707106781), Tf4, Tf1);
Chris@42 379 Tfg = VFMA(LDK(KP707106781), Tff, Tfe);
Chris@42 380 TgA = VFNMS(LDK(KP707106781), Tff, Tfe);
Chris@42 381 T7J = VFMA(LDK(KP923879532), T7I, T7H);
Chris@42 382 T9b = VFNMS(LDK(KP923879532), T7I, T7H);
Chris@42 383 T4E = VFMA(LDK(KP923879532), T4D, T4A);
Chris@42 384 T64 = VFNMS(LDK(KP923879532), T4D, T4A);
Chris@42 385 T7U = VFNMS(LDK(KP923879532), T7T, T7S);
Chris@42 386 T9e = VFMA(LDK(KP923879532), T7T, T7S);
Chris@42 387 T3V = VFMA(LDK(KP923879532), T3U, T3F);
Chris@42 388 T61 = VFNMS(LDK(KP923879532), T3U, T3F);
Chris@42 389 TE = LD(&(xi[WS(is, 100)]), ivs, &(xi[0]));
Chris@42 390 }
Chris@42 391 }
Chris@42 392 TJ = LD(&(xi[WS(is, 124)]), ivs, &(xi[0]));
Chris@42 393 TK = LD(&(xi[WS(is, 60)]), ivs, &(xi[0]));
Chris@42 394 TU = LD(&(xi[WS(is, 92)]), ivs, &(xi[0]));
Chris@42 395 TV = LD(&(xi[WS(is, 28)]), ivs, &(xi[0]));
Chris@42 396 {
Chris@42 397 V Tal, Tam, Tv, Tw, Taf;
Chris@42 398 Tv = LD(&(xi[WS(is, 20)]), ivs, &(xi[0]));
Chris@42 399 Tw = LD(&(xi[WS(is, 84)]), ivs, &(xi[0]));
Chris@42 400 Taf = VADD(TD, TE);
Chris@42 401 TF = VSUB(TD, TE);
Chris@42 402 Ty = LD(&(xi[WS(is, 116)]), ivs, &(xi[0]));
Chris@42 403 TL = VSUB(TJ, TK);
Chris@42 404 Tal = VADD(TJ, TK);
Chris@42 405 TW = VSUB(TU, TV);
Chris@42 406 Tam = VADD(TV, TU);
Chris@42 407 Tah = VADD(Tv, Tw);
Chris@42 408 Tx = VSUB(Tv, Tw);
Chris@42 409 Tag = VADD(Tae, Taf);
Chris@42 410 Tee = VSUB(Tae, Taf);
Chris@42 411 Tz = LD(&(xi[WS(is, 52)]), ivs, &(xi[0]));
Chris@42 412 TM = LD(&(xi[WS(is, 12)]), ivs, &(xi[0]));
Chris@42 413 TN = LD(&(xi[WS(is, 76)]), ivs, &(xi[0]));
Chris@42 414 Teh = VSUB(Tal, Tam);
Chris@42 415 Tan = VADD(Tal, Tam);
Chris@42 416 TP = LD(&(xi[WS(is, 108)]), ivs, &(xi[0]));
Chris@42 417 TQ = LD(&(xi[WS(is, 44)]), ivs, &(xi[0]));
Chris@42 418 }
Chris@42 419 }
Chris@42 420 }
Chris@42 421 }
Chris@42 422 {
Chris@42 423 V Tev, TeA, Tdm, TaP, Tew, TaV, T1U, T29, T7f, T1N, T28, T7i, Tex, TaS, T21;
Chris@42 424 V T2a;
Chris@42 425 {
Chris@42 426 V Tem, Ter, Ten, TaD, T1j, T1y, TaA, Tdp, T1c, T78, T7b, T1x, TaG, Teo, T1z;
Chris@42 427 V T1q;
Chris@42 428 {
Chris@42 429 V T14, T1v, Taw, Taz, T1b, T1w, T1n, T1o, T1m, TaE, TaF, T1p;
Chris@42 430 {
Chris@42 431 V Tau, Tav, T15, T16, T18, T19;
Chris@42 432 {
Chris@42 433 V T12, Tai, TA, Tao, TO, T13;
Chris@42 434 T12 = LD(&(xi[WS(is, 2)]), ivs, &(xi[0]));
Chris@42 435 Tai = VADD(Ty, Tz);
Chris@42 436 TA = VSUB(Ty, Tz);
Chris@42 437 Tao = VADD(TM, TN);
Chris@42 438 TO = VSUB(TM, TN);
Chris@42 439 T13 = LD(&(xi[WS(is, 66)]), ivs, &(xi[0]));
Chris@42 440 {
Chris@42 441 V T1t, Tap, TR, Taj, Tef, TG, TB, T1u;
Chris@42 442 T1t = LD(&(xi[WS(is, 34)]), ivs, &(xi[0]));
Chris@42 443 Tap = VADD(TP, TQ);
Chris@42 444 TR = VSUB(TP, TQ);
Chris@42 445 Taj = VADD(Tah, Tai);
Chris@42 446 Tef = VSUB(Tah, Tai);
Chris@42 447 TG = VSUB(Tx, TA);
Chris@42 448 TB = VADD(Tx, TA);
Chris@42 449 Tau = VADD(T12, T13);
Chris@42 450 T14 = VSUB(T12, T13);
Chris@42 451 T1u = LD(&(xi[WS(is, 98)]), ivs, &(xi[0]));
Chris@42 452 {
Chris@42 453 V Taq, Tei, TX, TS, Tak;
Chris@42 454 Taq = VADD(Tao, Tap);
Chris@42 455 Tei = VSUB(Tap, Tao);
Chris@42 456 TX = VSUB(TR, TO);
Chris@42 457 TS = VADD(TO, TR);
Chris@42 458 Tak = VSUB(Tag, Taj);
Chris@42 459 Td2 = VADD(Tag, Taj);
Chris@42 460 {
Chris@42 461 V Teg, Tfs, T71, TH;
Chris@42 462 Teg = VFNMS(LDK(KP414213562), Tef, Tee);
Chris@42 463 Tfs = VFMA(LDK(KP414213562), Tee, Tef);
Chris@42 464 T71 = VFNMS(LDK(KP707106781), TG, TF);
Chris@42 465 TH = VFMA(LDK(KP707106781), TG, TF);
Chris@42 466 {
Chris@42 467 V T70, TC, Tar, Tej, Tfr;
Chris@42 468 T70 = VFNMS(LDK(KP707106781), TB, Tu);
Chris@42 469 TC = VFMA(LDK(KP707106781), TB, Tu);
Chris@42 470 Tar = VSUB(Tan, Taq);
Chris@42 471 Td3 = VADD(Tan, Taq);
Chris@42 472 Tej = VFNMS(LDK(KP414213562), Tei, Teh);
Chris@42 473 Tfr = VFMA(LDK(KP414213562), Teh, Tei);
Chris@42 474 {
Chris@42 475 V T74, TY, T73, TT;
Chris@42 476 T74 = VFNMS(LDK(KP707106781), TX, TW);
Chris@42 477 TY = VFMA(LDK(KP707106781), TX, TW);
Chris@42 478 T73 = VFNMS(LDK(KP707106781), TS, TL);
Chris@42 479 TT = VFMA(LDK(KP707106781), TS, TL);
Chris@42 480 T85 = VFNMS(LDK(KP668178637), T70, T71);
Chris@42 481 T72 = VFMA(LDK(KP668178637), T71, T70);
Chris@42 482 T4V = VFMA(LDK(KP198912367), TC, TH);
Chris@42 483 TI = VFNMS(LDK(KP198912367), TH, TC);
Chris@42 484 Tcd = VSUB(Tar, Tak);
Chris@42 485 Tas = VADD(Tak, Tar);
Chris@42 486 TgH = VSUB(Tej, Teg);
Chris@42 487 Tek = VADD(Teg, Tej);
Chris@42 488 Tgg = VADD(Tfs, Tfr);
Chris@42 489 Tft = VSUB(Tfr, Tfs);
Chris@42 490 T86 = VFNMS(LDK(KP668178637), T73, T74);
Chris@42 491 T75 = VFMA(LDK(KP668178637), T74, T73);
Chris@42 492 T4W = VFMA(LDK(KP198912367), TT, TY);
Chris@42 493 TZ = VFNMS(LDK(KP198912367), TY, TT);
Chris@42 494 Tav = VADD(T1t, T1u);
Chris@42 495 T1v = VSUB(T1t, T1u);
Chris@42 496 }
Chris@42 497 }
Chris@42 498 }
Chris@42 499 }
Chris@42 500 }
Chris@42 501 }
Chris@42 502 T15 = LD(&(xi[WS(is, 18)]), ivs, &(xi[0]));
Chris@42 503 T16 = LD(&(xi[WS(is, 82)]), ivs, &(xi[0]));
Chris@42 504 T18 = LD(&(xi[WS(is, 114)]), ivs, &(xi[0]));
Chris@42 505 T19 = LD(&(xi[WS(is, 50)]), ivs, &(xi[0]));
Chris@42 506 {
Chris@42 507 V T1d, T1e, T1g, T1h, Tax, T17, Tay, T1a;
Chris@42 508 T1d = LD(&(xi[WS(is, 10)]), ivs, &(xi[0]));
Chris@42 509 Taw = VADD(Tau, Tav);
Chris@42 510 Tem = VSUB(Tau, Tav);
Chris@42 511 T1e = LD(&(xi[WS(is, 74)]), ivs, &(xi[0]));
Chris@42 512 T1g = LD(&(xi[WS(is, 42)]), ivs, &(xi[0]));
Chris@42 513 T1h = LD(&(xi[WS(is, 106)]), ivs, &(xi[0]));
Chris@42 514 Tax = VADD(T15, T16);
Chris@42 515 T17 = VSUB(T15, T16);
Chris@42 516 Tay = VADD(T18, T19);
Chris@42 517 T1a = VSUB(T18, T19);
Chris@42 518 {
Chris@42 519 V T1k, T1f, TaB, T1i, TaC, T1l;
Chris@42 520 T1k = LD(&(xi[WS(is, 122)]), ivs, &(xi[0]));
Chris@42 521 T1f = VSUB(T1d, T1e);
Chris@42 522 TaB = VADD(T1d, T1e);
Chris@42 523 T1i = VSUB(T1g, T1h);
Chris@42 524 TaC = VADD(T1g, T1h);
Chris@42 525 T1l = LD(&(xi[WS(is, 58)]), ivs, &(xi[0]));
Chris@42 526 Taz = VADD(Tax, Tay);
Chris@42 527 Ter = VSUB(Tax, Tay);
Chris@42 528 T1b = VADD(T17, T1a);
Chris@42 529 T1w = VSUB(T17, T1a);
Chris@42 530 T1n = LD(&(xi[WS(is, 26)]), ivs, &(xi[0]));
Chris@42 531 T1o = LD(&(xi[WS(is, 90)]), ivs, &(xi[0]));
Chris@42 532 Ten = VSUB(TaB, TaC);
Chris@42 533 TaD = VADD(TaB, TaC);
Chris@42 534 T1j = VFNMS(LDK(KP414213562), T1i, T1f);
Chris@42 535 T1y = VFMA(LDK(KP414213562), T1f, T1i);
Chris@42 536 T1m = VSUB(T1k, T1l);
Chris@42 537 TaE = VADD(T1k, T1l);
Chris@42 538 }
Chris@42 539 }
Chris@42 540 }
Chris@42 541 TaA = VSUB(Taw, Taz);
Chris@42 542 Tdp = VADD(Taw, Taz);
Chris@42 543 TaF = VADD(T1n, T1o);
Chris@42 544 T1p = VSUB(T1n, T1o);
Chris@42 545 T1c = VFMA(LDK(KP707106781), T1b, T14);
Chris@42 546 T78 = VFNMS(LDK(KP707106781), T1b, T14);
Chris@42 547 T7b = VFNMS(LDK(KP707106781), T1w, T1v);
Chris@42 548 T1x = VFMA(LDK(KP707106781), T1w, T1v);
Chris@42 549 TaG = VADD(TaE, TaF);
Chris@42 550 Teo = VSUB(TaE, TaF);
Chris@42 551 T1z = VFNMS(LDK(KP414213562), T1m, T1p);
Chris@42 552 T1q = VFMA(LDK(KP414213562), T1p, T1m);
Chris@42 553 }
Chris@42 554 {
Chris@42 555 V T1F, T26, T1Q, TaT, TaL, TaO, T27, T1M, T1Y, T1Z, TaU, T1T, TaQ, T1X, T20;
Chris@42 556 V TaR;
Chris@42 557 {
Chris@42 558 V T24, TaJ, T25, T1G, T1H, T1J, T1K, T1D, T1E;
Chris@42 559 T1D = LD(&(xi[WS(is, 126)]), ivs, &(xi[0]));
Chris@42 560 T1E = LD(&(xi[WS(is, 62)]), ivs, &(xi[0]));
Chris@42 561 T24 = LD(&(xi[WS(is, 94)]), ivs, &(xi[0]));
Chris@42 562 {
Chris@42 563 V TaH, Tdq, Tes, Tep;
Chris@42 564 TaH = VSUB(TaD, TaG);
Chris@42 565 Tdq = VADD(TaD, TaG);
Chris@42 566 Tes = VSUB(Ten, Teo);
Chris@42 567 Tep = VADD(Ten, Teo);
Chris@42 568 {
Chris@42 569 V T79, T1A, T7c, T1r;
Chris@42 570 T79 = VSUB(T1y, T1z);
Chris@42 571 T1A = VADD(T1y, T1z);
Chris@42 572 T7c = VSUB(T1j, T1q);
Chris@42 573 T1r = VADD(T1j, T1q);
Chris@42 574 TaJ = VADD(T1D, T1E);
Chris@42 575 T1F = VSUB(T1D, T1E);
Chris@42 576 TaI = VFNMS(LDK(KP414213562), TaH, TaA);
Chris@42 577 Tcg = VFMA(LDK(KP414213562), TaA, TaH);
Chris@42 578 Tdr = VADD(Tdp, Tdq);
Chris@42 579 TdG = VSUB(Tdp, Tdq);
Chris@42 580 Tgi = VFNMS(LDK(KP707106781), Tes, Ter);
Chris@42 581 Tet = VFMA(LDK(KP707106781), Tes, Ter);
Chris@42 582 Tgj = VFNMS(LDK(KP707106781), Tep, Tem);
Chris@42 583 Teq = VFMA(LDK(KP707106781), Tep, Tem);
Chris@42 584 T8X = VFNMS(LDK(KP923879532), T79, T78);
Chris@42 585 T7a = VFMA(LDK(KP923879532), T79, T78);
Chris@42 586 T5M = VFNMS(LDK(KP923879532), T1A, T1x);
Chris@42 587 T1B = VFMA(LDK(KP923879532), T1A, T1x);
Chris@42 588 T8W = VFMA(LDK(KP923879532), T7c, T7b);
Chris@42 589 T7d = VFNMS(LDK(KP923879532), T7c, T7b);
Chris@42 590 T5N = VFNMS(LDK(KP923879532), T1r, T1c);
Chris@42 591 T1s = VFMA(LDK(KP923879532), T1r, T1c);
Chris@42 592 T25 = LD(&(xi[WS(is, 30)]), ivs, &(xi[0]));
Chris@42 593 }
Chris@42 594 }
Chris@42 595 T1G = LD(&(xi[WS(is, 14)]), ivs, &(xi[0]));
Chris@42 596 T1H = LD(&(xi[WS(is, 78)]), ivs, &(xi[0]));
Chris@42 597 T1J = LD(&(xi[WS(is, 110)]), ivs, &(xi[0]));
Chris@42 598 T1K = LD(&(xi[WS(is, 46)]), ivs, &(xi[0]));
Chris@42 599 {
Chris@42 600 V T1R, T1I, TaM, T1L, TaN, T1S, T1O, T1P, TaK, T1V, T1W;
Chris@42 601 T1O = LD(&(xi[WS(is, 6)]), ivs, &(xi[0]));
Chris@42 602 T1P = LD(&(xi[WS(is, 70)]), ivs, &(xi[0]));
Chris@42 603 T26 = VSUB(T24, T25);
Chris@42 604 TaK = VADD(T25, T24);
Chris@42 605 T1R = LD(&(xi[WS(is, 102)]), ivs, &(xi[0]));
Chris@42 606 T1I = VSUB(T1G, T1H);
Chris@42 607 TaM = VADD(T1G, T1H);
Chris@42 608 T1L = VSUB(T1J, T1K);
Chris@42 609 TaN = VADD(T1J, T1K);
Chris@42 610 T1Q = VSUB(T1O, T1P);
Chris@42 611 TaT = VADD(T1O, T1P);
Chris@42 612 Tev = VSUB(TaJ, TaK);
Chris@42 613 TaL = VADD(TaJ, TaK);
Chris@42 614 T1S = LD(&(xi[WS(is, 38)]), ivs, &(xi[0]));
Chris@42 615 T1V = LD(&(xi[WS(is, 118)]), ivs, &(xi[0]));
Chris@42 616 T1W = LD(&(xi[WS(is, 54)]), ivs, &(xi[0]));
Chris@42 617 TeA = VSUB(TaN, TaM);
Chris@42 618 TaO = VADD(TaM, TaN);
Chris@42 619 T27 = VSUB(T1L, T1I);
Chris@42 620 T1M = VADD(T1I, T1L);
Chris@42 621 T1Y = LD(&(xi[WS(is, 86)]), ivs, &(xi[0]));
Chris@42 622 T1Z = LD(&(xi[WS(is, 22)]), ivs, &(xi[0]));
Chris@42 623 TaU = VADD(T1S, T1R);
Chris@42 624 T1T = VSUB(T1R, T1S);
Chris@42 625 TaQ = VADD(T1V, T1W);
Chris@42 626 T1X = VSUB(T1V, T1W);
Chris@42 627 }
Chris@42 628 }
Chris@42 629 Tdm = VADD(TaL, TaO);
Chris@42 630 TaP = VSUB(TaL, TaO);
Chris@42 631 T20 = VSUB(T1Y, T1Z);
Chris@42 632 TaR = VADD(T1Z, T1Y);
Chris@42 633 Tew = VSUB(TaT, TaU);
Chris@42 634 TaV = VADD(TaT, TaU);
Chris@42 635 T1U = VFMA(LDK(KP414213562), T1T, T1Q);
Chris@42 636 T29 = VFNMS(LDK(KP414213562), T1Q, T1T);
Chris@42 637 T7f = VFNMS(LDK(KP707106781), T1M, T1F);
Chris@42 638 T1N = VFMA(LDK(KP707106781), T1M, T1F);
Chris@42 639 T28 = VFMA(LDK(KP707106781), T27, T26);
Chris@42 640 T7i = VFNMS(LDK(KP707106781), T27, T26);
Chris@42 641 Tex = VSUB(TaQ, TaR);
Chris@42 642 TaS = VADD(TaQ, TaR);
Chris@42 643 T21 = VFNMS(LDK(KP414213562), T20, T1X);
Chris@42 644 T2a = VFMA(LDK(KP414213562), T1X, T20);
Chris@42 645 }
Chris@42 646 }
Chris@42 647 {
Chris@42 648 V T2J, T2U, T30, T3b, TeL, Tb9, TeO, Tbg, T2M, Tba, T2P, Tbb, T34, Tbh, T33;
Chris@42 649 V T35;
Chris@42 650 {
Chris@42 651 V T2H, T2I, T2S, T2T, T2Y, T2Z, T39, T3a;
Chris@42 652 T2H = LD(&(xi[WS(is, 5)]), ivs, &(xi[WS(is, 1)]));
Chris@42 653 {
Chris@42 654 V Tdn, TaW, Tey, TeB;
Chris@42 655 Tdn = VADD(TaV, TaS);
Chris@42 656 TaW = VSUB(TaS, TaV);
Chris@42 657 Tey = VADD(Tew, Tex);
Chris@42 658 TeB = VSUB(Tex, Tew);
Chris@42 659 {
Chris@42 660 V T2b, T7g, T22, T7j;
Chris@42 661 T2b = VADD(T29, T2a);
Chris@42 662 T7g = VSUB(T2a, T29);
Chris@42 663 T22 = VADD(T1U, T21);
Chris@42 664 T7j = VSUB(T21, T1U);
Chris@42 665 TaX = VFNMS(LDK(KP414213562), TaW, TaP);
Chris@42 666 Tcf = VFMA(LDK(KP414213562), TaP, TaW);
Chris@42 667 Tdo = VADD(Tdm, Tdn);
Chris@42 668 TdH = VSUB(Tdm, Tdn);
Chris@42 669 Tgl = VFNMS(LDK(KP707106781), TeB, TeA);
Chris@42 670 TeC = VFMA(LDK(KP707106781), TeB, TeA);
Chris@42 671 Tgm = VFNMS(LDK(KP707106781), Tey, Tev);
Chris@42 672 Tez = VFMA(LDK(KP707106781), Tey, Tev);
Chris@42 673 T90 = VFNMS(LDK(KP923879532), T7g, T7f);
Chris@42 674 T7h = VFMA(LDK(KP923879532), T7g, T7f);
Chris@42 675 T5P = VFNMS(LDK(KP923879532), T2b, T28);
Chris@42 676 T2c = VFMA(LDK(KP923879532), T2b, T28);
Chris@42 677 T8Z = VFMA(LDK(KP923879532), T7j, T7i);
Chris@42 678 T7k = VFNMS(LDK(KP923879532), T7j, T7i);
Chris@42 679 T5Q = VFNMS(LDK(KP923879532), T22, T1N);
Chris@42 680 T23 = VFMA(LDK(KP923879532), T22, T1N);
Chris@42 681 T2I = LD(&(xi[WS(is, 69)]), ivs, &(xi[WS(is, 1)]));
Chris@42 682 }
Chris@42 683 }
Chris@42 684 T2S = LD(&(xi[WS(is, 37)]), ivs, &(xi[WS(is, 1)]));
Chris@42 685 T2T = LD(&(xi[WS(is, 101)]), ivs, &(xi[WS(is, 1)]));
Chris@42 686 T2Y = LD(&(xi[WS(is, 125)]), ivs, &(xi[WS(is, 1)]));
Chris@42 687 T2Z = LD(&(xi[WS(is, 61)]), ivs, &(xi[WS(is, 1)]));
Chris@42 688 T39 = LD(&(xi[WS(is, 29)]), ivs, &(xi[WS(is, 1)]));
Chris@42 689 T3a = LD(&(xi[WS(is, 93)]), ivs, &(xi[WS(is, 1)]));
Chris@42 690 {
Chris@42 691 V T2K, Tbe, Tbf, T2L, T2N, T2O, Tb7, Tb8, T31, T32;
Chris@42 692 T2K = LD(&(xi[WS(is, 21)]), ivs, &(xi[WS(is, 1)]));
Chris@42 693 T2J = VSUB(T2H, T2I);
Chris@42 694 Tb7 = VADD(T2H, T2I);
Chris@42 695 T2U = VSUB(T2S, T2T);
Chris@42 696 Tb8 = VADD(T2S, T2T);
Chris@42 697 T30 = VSUB(T2Y, T2Z);
Chris@42 698 Tbe = VADD(T2Y, T2Z);
Chris@42 699 T3b = VSUB(T39, T3a);
Chris@42 700 Tbf = VADD(T39, T3a);
Chris@42 701 T2L = LD(&(xi[WS(is, 85)]), ivs, &(xi[WS(is, 1)]));
Chris@42 702 T2N = LD(&(xi[WS(is, 117)]), ivs, &(xi[WS(is, 1)]));
Chris@42 703 T2O = LD(&(xi[WS(is, 53)]), ivs, &(xi[WS(is, 1)]));
Chris@42 704 TeL = VSUB(Tb7, Tb8);
Chris@42 705 Tb9 = VADD(Tb7, Tb8);
Chris@42 706 T31 = LD(&(xi[WS(is, 13)]), ivs, &(xi[WS(is, 1)]));
Chris@42 707 T32 = LD(&(xi[WS(is, 77)]), ivs, &(xi[WS(is, 1)]));
Chris@42 708 TeO = VSUB(Tbe, Tbf);
Chris@42 709 Tbg = VADD(Tbe, Tbf);
Chris@42 710 T2M = VSUB(T2K, T2L);
Chris@42 711 Tba = VADD(T2K, T2L);
Chris@42 712 T2P = VSUB(T2N, T2O);
Chris@42 713 Tbb = VADD(T2N, T2O);
Chris@42 714 T34 = LD(&(xi[WS(is, 109)]), ivs, &(xi[WS(is, 1)]));
Chris@42 715 Tbh = VADD(T31, T32);
Chris@42 716 T33 = VSUB(T31, T32);
Chris@42 717 T35 = LD(&(xi[WS(is, 45)]), ivs, &(xi[WS(is, 1)]));
Chris@42 718 }
Chris@42 719 }
Chris@42 720 {
Chris@42 721 V T4d, T4e, T4o, T4p;
Chris@42 722 {
Chris@42 723 V T2X, T3q, T7t, T7C, T3r, T3e, T7D, T7w;
Chris@42 724 {
Chris@42 725 V T47, TbE, Tbd, Td9, TeW, TeN, T7s, T2W, T7r, T2R, TeP, Tbj, T37, T3c, T48;
Chris@42 726 {
Chris@42 727 V T3W, T3X, TeM, Tbc, T2Q, T2V, Tbi, T36;
Chris@42 728 T3W = LD(&(xi[WS(is, 3)]), ivs, &(xi[WS(is, 1)]));
Chris@42 729 T3X = LD(&(xi[WS(is, 67)]), ivs, &(xi[WS(is, 1)]));
Chris@42 730 TeM = VSUB(Tba, Tbb);
Chris@42 731 Tbc = VADD(Tba, Tbb);
Chris@42 732 T2Q = VADD(T2M, T2P);
Chris@42 733 T2V = VSUB(T2M, T2P);
Chris@42 734 T47 = LD(&(xi[WS(is, 99)]), ivs, &(xi[WS(is, 1)]));
Chris@42 735 Tbi = VADD(T34, T35);
Chris@42 736 T36 = VSUB(T34, T35);
Chris@42 737 TbE = VADD(T3W, T3X);
Chris@42 738 T3Y = VSUB(T3W, T3X);
Chris@42 739 Tbd = VSUB(Tb9, Tbc);
Chris@42 740 Td9 = VADD(Tb9, Tbc);
Chris@42 741 TeW = VFMA(LDK(KP414213562), TeL, TeM);
Chris@42 742 TeN = VFNMS(LDK(KP414213562), TeM, TeL);
Chris@42 743 T7s = VFNMS(LDK(KP707106781), T2V, T2U);
Chris@42 744 T2W = VFMA(LDK(KP707106781), T2V, T2U);
Chris@42 745 T7r = VFNMS(LDK(KP707106781), T2Q, T2J);
Chris@42 746 T2R = VFMA(LDK(KP707106781), T2Q, T2J);
Chris@42 747 TeP = VSUB(Tbh, Tbi);
Chris@42 748 Tbj = VADD(Tbh, Tbi);
Chris@42 749 T37 = VADD(T33, T36);
Chris@42 750 T3c = VSUB(T33, T36);
Chris@42 751 T48 = LD(&(xi[WS(is, 35)]), ivs, &(xi[WS(is, 1)]));
Chris@42 752 }
Chris@42 753 T2X = VFNMS(LDK(KP198912367), T2W, T2R);
Chris@42 754 T3q = VFMA(LDK(KP198912367), T2R, T2W);
Chris@42 755 T7t = VFMA(LDK(KP668178637), T7s, T7r);
Chris@42 756 T7C = VFNMS(LDK(KP668178637), T7r, T7s);
Chris@42 757 {
Chris@42 758 V Tbk, Tda, TeX, TeQ;
Chris@42 759 Tbk = VSUB(Tbg, Tbj);
Chris@42 760 Tda = VADD(Tbg, Tbj);
Chris@42 761 TeX = VFNMS(LDK(KP414213562), TeO, TeP);
Chris@42 762 TeQ = VFMA(LDK(KP414213562), TeP, TeO);
Chris@42 763 {
Chris@42 764 V T7v, T3d, T7u, T38, TbF;
Chris@42 765 T7v = VFNMS(LDK(KP707106781), T3c, T3b);
Chris@42 766 T3d = VFMA(LDK(KP707106781), T3c, T3b);
Chris@42 767 T7u = VFNMS(LDK(KP707106781), T37, T30);
Chris@42 768 T38 = VFMA(LDK(KP707106781), T37, T30);
Chris@42 769 T49 = VSUB(T47, T48);
Chris@42 770 TbF = VADD(T48, T47);
Chris@42 771 TdL = VSUB(Td9, Tda);
Chris@42 772 Tdb = VADD(Td9, Tda);
Chris@42 773 Tbu = VSUB(Tbd, Tbk);
Chris@42 774 Tbl = VADD(Tbd, Tbk);
Chris@42 775 Tgu = VSUB(TeN, TeQ);
Chris@42 776 TeR = VADD(TeN, TeQ);
Chris@42 777 Tgr = VSUB(TeW, TeX);
Chris@42 778 TeY = VADD(TeW, TeX);
Chris@42 779 T3r = VFNMS(LDK(KP198912367), T38, T3d);
Chris@42 780 T3e = VFMA(LDK(KP198912367), T3d, T38);
Chris@42 781 T7D = VFMA(LDK(KP668178637), T7u, T7v);
Chris@42 782 T7w = VFNMS(LDK(KP668178637), T7v, T7u);
Chris@42 783 Tf6 = VSUB(TbE, TbF);
Chris@42 784 TbG = VADD(TbE, TbF);
Chris@42 785 }
Chris@42 786 }
Chris@42 787 }
Chris@42 788 T4d = LD(&(xi[WS(is, 123)]), ivs, &(xi[WS(is, 1)]));
Chris@42 789 T5V = VSUB(T3q, T3r);
Chris@42 790 T3s = VADD(T3q, T3r);
Chris@42 791 T5Y = VSUB(T2X, T3e);
Chris@42 792 T3f = VADD(T2X, T3e);
Chris@42 793 T95 = VSUB(T7D, T7C);
Chris@42 794 T7E = VADD(T7C, T7D);
Chris@42 795 T98 = VSUB(T7t, T7w);
Chris@42 796 T7x = VADD(T7t, T7w);
Chris@42 797 T4e = LD(&(xi[WS(is, 59)]), ivs, &(xi[WS(is, 1)]));
Chris@42 798 T4o = LD(&(xi[WS(is, 91)]), ivs, &(xi[WS(is, 1)]));
Chris@42 799 T4p = LD(&(xi[WS(is, 27)]), ivs, &(xi[WS(is, 1)]));
Chris@42 800 }
Chris@42 801 {
Chris@42 802 V T3Z, T40, T42, T43, TbL, TbM;
Chris@42 803 T3Z = LD(&(xi[WS(is, 19)]), ivs, &(xi[WS(is, 1)]));
Chris@42 804 T40 = LD(&(xi[WS(is, 83)]), ivs, &(xi[WS(is, 1)]));
Chris@42 805 T42 = LD(&(xi[WS(is, 115)]), ivs, &(xi[WS(is, 1)]));
Chris@42 806 T43 = LD(&(xi[WS(is, 51)]), ivs, &(xi[WS(is, 1)]));
Chris@42 807 T4g = LD(&(xi[WS(is, 11)]), ivs, &(xi[WS(is, 1)]));
Chris@42 808 T4f = VSUB(T4d, T4e);
Chris@42 809 TbL = VADD(T4d, T4e);
Chris@42 810 T4q = VSUB(T4o, T4p);
Chris@42 811 TbM = VADD(T4p, T4o);
Chris@42 812 TbH = VADD(T3Z, T40);
Chris@42 813 T41 = VSUB(T3Z, T40);
Chris@42 814 TbI = VADD(T42, T43);
Chris@42 815 T44 = VSUB(T42, T43);
Chris@42 816 T4h = LD(&(xi[WS(is, 75)]), ivs, &(xi[WS(is, 1)]));
Chris@42 817 T4j = LD(&(xi[WS(is, 107)]), ivs, &(xi[WS(is, 1)]));
Chris@42 818 T4k = LD(&(xi[WS(is, 43)]), ivs, &(xi[WS(is, 1)]));
Chris@42 819 Tf9 = VSUB(TbL, TbM);
Chris@42 820 TbN = VADD(TbL, TbM);
Chris@42 821 }
Chris@42 822 }
Chris@42 823 }
Chris@42 824 }
Chris@42 825 }
Chris@42 826 {
Chris@42 827 V TgB, Tgy, T62, T4H, T65, T4u, T9c, T7X, T9f, T7Q, Tg0, Tga, TfF, TeF, TfT;
Chris@42 828 V TfU, TfP, Tg7, TfI, Tfy, TfA, Tf0, Tfz, Tfl, Tg2, TfS;
Chris@42 829 {
Chris@42 830 V Tc1, TbS, Tfc, Tfj, TdX, Te5, TdZ, TdR, Te7, Te3, TdU, Te4;
Chris@42 831 {
Chris@42 832 V TdF, TdS, Tdx, Td5, TdO, TdE, TdC, Tdt, Tdk;
Chris@42 833 {
Chris@42 834 V Tdc, TdA, T4F, T4c, T7V, T7M, T4G, T4t, T7W, T7P, TdB, Tdj;
Chris@42 835 {
Chris@42 836 V Td1, Tdg, TbK, Tf8, Tfh, T4b, T7L, T46, T7K, TbQ, Tfa, T4r, T4m, Td4;
Chris@42 837 TdF = VSUB(TcZ, Td0);
Chris@42 838 Td1 = VADD(TcZ, Td0);
Chris@42 839 {
Chris@42 840 V TbJ, Tf7, T4a, T45;
Chris@42 841 TbJ = VADD(TbH, TbI);
Chris@42 842 Tf7 = VSUB(TbI, TbH);
Chris@42 843 T4a = VSUB(T44, T41);
Chris@42 844 T45 = VADD(T41, T44);
Chris@42 845 {
Chris@42 846 V TbO, T4i, TbP, T4l;
Chris@42 847 TbO = VADD(T4g, T4h);
Chris@42 848 T4i = VSUB(T4g, T4h);
Chris@42 849 TbP = VADD(T4j, T4k);
Chris@42 850 T4l = VSUB(T4j, T4k);
Chris@42 851 Tdg = VADD(TbG, TbJ);
Chris@42 852 TbK = VSUB(TbG, TbJ);
Chris@42 853 Tf8 = VFMA(LDK(KP414213562), Tf7, Tf6);
Chris@42 854 Tfh = VFNMS(LDK(KP414213562), Tf6, Tf7);
Chris@42 855 T4b = VFMA(LDK(KP707106781), T4a, T49);
Chris@42 856 T7L = VFNMS(LDK(KP707106781), T4a, T49);
Chris@42 857 T46 = VFMA(LDK(KP707106781), T45, T3Y);
Chris@42 858 T7K = VFNMS(LDK(KP707106781), T45, T3Y);
Chris@42 859 TbQ = VADD(TbO, TbP);
Chris@42 860 Tfa = VSUB(TbP, TbO);
Chris@42 861 T4r = VSUB(T4l, T4i);
Chris@42 862 T4m = VADD(T4i, T4l);
Chris@42 863 Td4 = VADD(Td2, Td3);
Chris@42 864 TdS = VSUB(Td3, Td2);
Chris@42 865 }
Chris@42 866 }
Chris@42 867 Tdc = VSUB(Td8, Tdb);
Chris@42 868 TdA = VADD(Td8, Tdb);
Chris@42 869 T4F = VFNMS(LDK(KP198912367), T46, T4b);
Chris@42 870 T4c = VFMA(LDK(KP198912367), T4b, T46);
Chris@42 871 T7V = VFMA(LDK(KP668178637), T7K, T7L);
Chris@42 872 T7M = VFNMS(LDK(KP668178637), T7L, T7K);
Chris@42 873 {
Chris@42 874 V Tdh, TbR, Tfb, Tfi;
Chris@42 875 Tdh = VADD(TbN, TbQ);
Chris@42 876 TbR = VSUB(TbN, TbQ);
Chris@42 877 Tfb = VFNMS(LDK(KP414213562), Tfa, Tf9);
Chris@42 878 Tfi = VFMA(LDK(KP414213562), Tf9, Tfa);
Chris@42 879 {
Chris@42 880 V T4s, T7O, T4n, T7N, Tdi;
Chris@42 881 T4s = VFMA(LDK(KP707106781), T4r, T4q);
Chris@42 882 T7O = VFNMS(LDK(KP707106781), T4r, T4q);
Chris@42 883 T4n = VFMA(LDK(KP707106781), T4m, T4f);
Chris@42 884 T7N = VFNMS(LDK(KP707106781), T4m, T4f);
Chris@42 885 Tdx = VADD(Td1, Td4);
Chris@42 886 Td5 = VSUB(Td1, Td4);
Chris@42 887 TdO = VSUB(Tdh, Tdg);
Chris@42 888 Tdi = VADD(Tdg, Tdh);
Chris@42 889 Tc1 = VSUB(TbR, TbK);
Chris@42 890 TbS = VADD(TbK, TbR);
Chris@42 891 TgB = VSUB(Tfb, Tf8);
Chris@42 892 Tfc = VADD(Tf8, Tfb);
Chris@42 893 Tgy = VSUB(Tfi, Tfh);
Chris@42 894 Tfj = VADD(Tfh, Tfi);
Chris@42 895 T4G = VFMA(LDK(KP198912367), T4n, T4s);
Chris@42 896 T4t = VFNMS(LDK(KP198912367), T4s, T4n);
Chris@42 897 T7W = VFNMS(LDK(KP668178637), T7N, T7O);
Chris@42 898 T7P = VFMA(LDK(KP668178637), T7O, T7N);
Chris@42 899 TdB = VADD(Tdf, Tdi);
Chris@42 900 Tdj = VSUB(Tdf, Tdi);
Chris@42 901 }
Chris@42 902 }
Chris@42 903 }
Chris@42 904 T62 = VSUB(T4G, T4F);
Chris@42 905 T4H = VADD(T4F, T4G);
Chris@42 906 T65 = VSUB(T4t, T4c);
Chris@42 907 T4u = VADD(T4c, T4t);
Chris@42 908 T9c = VSUB(T7V, T7W);
Chris@42 909 T7X = VADD(T7V, T7W);
Chris@42 910 T9f = VSUB(T7P, T7M);
Chris@42 911 T7Q = VADD(T7M, T7P);
Chris@42 912 TdE = VSUB(TdB, TdA);
Chris@42 913 TdC = VADD(TdA, TdB);
Chris@42 914 Tdt = VSUB(Tdj, Tdc);
Chris@42 915 Tdk = VADD(Tdc, Tdj);
Chris@42 916 }
Chris@42 917 {
Chris@42 918 V TdT, Tdl, Tdv, TdJ, Te1, Te2, TdQ, Tdz, TdD, Tdu, Tdw;
Chris@42 919 {
Chris@42 920 V TdI, TdP, TdV, TdW, TdM, Tds, Tdy;
Chris@42 921 TdI = VADD(TdG, TdH);
Chris@42 922 TdT = VSUB(TdH, TdG);
Chris@42 923 TdP = VFNMS(LDK(KP414213562), TdO, TdN);
Chris@42 924 TdV = VFMA(LDK(KP414213562), TdN, TdO);
Chris@42 925 TdW = VFMA(LDK(KP414213562), TdK, TdL);
Chris@42 926 TdM = VFNMS(LDK(KP414213562), TdL, TdK);
Chris@42 927 Tdl = VFNMS(LDK(KP707106781), Tdk, Td5);
Chris@42 928 Tdv = VFMA(LDK(KP707106781), Tdk, Td5);
Chris@42 929 Tds = VSUB(Tdo, Tdr);
Chris@42 930 Tdy = VADD(Tdr, Tdo);
Chris@42 931 TdJ = VFMA(LDK(KP707106781), TdI, TdF);
Chris@42 932 Te1 = VFNMS(LDK(KP707106781), TdI, TdF);
Chris@42 933 TdX = VSUB(TdV, TdW);
Chris@42 934 Te2 = VADD(TdW, TdV);
Chris@42 935 Te5 = VSUB(TdP, TdM);
Chris@42 936 TdQ = VADD(TdM, TdP);
Chris@42 937 Tdz = VADD(Tdx, Tdy);
Chris@42 938 TdD = VSUB(Tdx, Tdy);
Chris@42 939 Tdu = VFNMS(LDK(KP707106781), Tdt, Tds);
Chris@42 940 Tdw = VFMA(LDK(KP707106781), Tdt, Tds);
Chris@42 941 }
Chris@42 942 TdZ = VFMA(LDK(KP923879532), TdQ, TdJ);
Chris@42 943 TdR = VFNMS(LDK(KP923879532), TdQ, TdJ);
Chris@42 944 Te7 = VFMA(LDK(KP923879532), Te2, Te1);
Chris@42 945 Te3 = VFNMS(LDK(KP923879532), Te2, Te1);
Chris@42 946 ST(&(xo[WS(os, 32)]), VFMAI(TdE, TdD), ovs, &(xo[0]));
Chris@42 947 ST(&(xo[WS(os, 96)]), VFNMSI(TdE, TdD), ovs, &(xo[0]));
Chris@42 948 ST(&(xo[0]), VADD(Tdz, TdC), ovs, &(xo[0]));
Chris@42 949 ST(&(xo[WS(os, 64)]), VSUB(Tdz, TdC), ovs, &(xo[0]));
Chris@42 950 ST(&(xo[WS(os, 16)]), VFMAI(Tdw, Tdv), ovs, &(xo[0]));
Chris@42 951 ST(&(xo[WS(os, 112)]), VFNMSI(Tdw, Tdv), ovs, &(xo[0]));
Chris@42 952 ST(&(xo[WS(os, 80)]), VFMAI(Tdu, Tdl), ovs, &(xo[0]));
Chris@42 953 ST(&(xo[WS(os, 48)]), VFNMSI(Tdu, Tdl), ovs, &(xo[0]));
Chris@42 954 TdU = VFMA(LDK(KP707106781), TdT, TdS);
Chris@42 955 Te4 = VFNMS(LDK(KP707106781), TdT, TdS);
Chris@42 956 }
Chris@42 957 }
Chris@42 958 {
Chris@42 959 V Tcx, TcJ, TcI, Tcy, TcA, Tbm, Tcp, TaZ, Tcs, Tci, Tbv, TcB, TcD, TbT, Tc2;
Chris@42 960 V TcE, Tat, TaY;
Chris@42 961 Tcx = VFNMS(LDK(KP707106781), Tas, Tad);
Chris@42 962 Tat = VFMA(LDK(KP707106781), Tas, Tad);
Chris@42 963 TaY = VADD(TaI, TaX);
Chris@42 964 TcJ = VSUB(TaX, TaI);
Chris@42 965 {
Chris@42 966 V Tce, Tch, Te8, Te6, TdY, Te0;
Chris@42 967 TcI = VFNMS(LDK(KP707106781), Tcd, Tcc);
Chris@42 968 Tce = VFMA(LDK(KP707106781), Tcd, Tcc);
Chris@42 969 Tch = VSUB(Tcf, Tcg);
Chris@42 970 Tcy = VADD(Tcg, Tcf);
Chris@42 971 Te8 = VFNMS(LDK(KP923879532), Te5, Te4);
Chris@42 972 Te6 = VFMA(LDK(KP923879532), Te5, Te4);
Chris@42 973 TdY = VFNMS(LDK(KP923879532), TdX, TdU);
Chris@42 974 Te0 = VFMA(LDK(KP923879532), TdX, TdU);
Chris@42 975 TcA = VFNMS(LDK(KP707106781), Tbl, Tb6);
Chris@42 976 Tbm = VFMA(LDK(KP707106781), Tbl, Tb6);
Chris@42 977 Tcp = VFNMS(LDK(KP923879532), TaY, Tat);
Chris@42 978 TaZ = VFMA(LDK(KP923879532), TaY, Tat);
Chris@42 979 Tcs = VFNMS(LDK(KP923879532), Tch, Tce);
Chris@42 980 Tci = VFMA(LDK(KP923879532), Tch, Tce);
Chris@42 981 ST(&(xo[WS(os, 88)]), VFNMSI(Te6, Te3), ovs, &(xo[0]));
Chris@42 982 ST(&(xo[WS(os, 40)]), VFMAI(Te6, Te3), ovs, &(xo[0]));
Chris@42 983 ST(&(xo[WS(os, 104)]), VFMAI(Te8, Te7), ovs, &(xo[0]));
Chris@42 984 ST(&(xo[WS(os, 24)]), VFNMSI(Te8, Te7), ovs, &(xo[0]));
Chris@42 985 ST(&(xo[WS(os, 8)]), VFMAI(Te0, TdZ), ovs, &(xo[0]));
Chris@42 986 ST(&(xo[WS(os, 120)]), VFNMSI(Te0, TdZ), ovs, &(xo[0]));
Chris@42 987 ST(&(xo[WS(os, 72)]), VFMAI(TdY, TdR), ovs, &(xo[0]));
Chris@42 988 ST(&(xo[WS(os, 56)]), VFNMSI(TdY, TdR), ovs, &(xo[0]));
Chris@42 989 Tbv = VFMA(LDK(KP707106781), Tbu, Tbt);
Chris@42 990 TcB = VFNMS(LDK(KP707106781), Tbu, Tbt);
Chris@42 991 TcD = VFNMS(LDK(KP707106781), TbS, TbD);
Chris@42 992 TbT = VFMA(LDK(KP707106781), TbS, TbD);
Chris@42 993 Tc2 = VFMA(LDK(KP707106781), Tc1, Tc0);
Chris@42 994 TcE = VFNMS(LDK(KP707106781), Tc1, Tc0);
Chris@42 995 }
Chris@42 996 {
Chris@42 997 V TcR, Tcz, TcU, TcK, Tcq, Tcl, Tct, Tc4;
Chris@42 998 {
Chris@42 999 V Tck, Tbw, Tcj, Tc3;
Chris@42 1000 Tck = VFMA(LDK(KP198912367), Tbm, Tbv);
Chris@42 1001 Tbw = VFNMS(LDK(KP198912367), Tbv, Tbm);
Chris@42 1002 Tcj = VFMA(LDK(KP198912367), TbT, Tc2);
Chris@42 1003 Tc3 = VFNMS(LDK(KP198912367), Tc2, TbT);
Chris@42 1004 TcR = VFNMS(LDK(KP923879532), Tcy, Tcx);
Chris@42 1005 Tcz = VFMA(LDK(KP923879532), Tcy, Tcx);
Chris@42 1006 TcU = VFMA(LDK(KP923879532), TcJ, TcI);
Chris@42 1007 TcK = VFNMS(LDK(KP923879532), TcJ, TcI);
Chris@42 1008 Tcq = VADD(Tck, Tcj);
Chris@42 1009 Tcl = VSUB(Tcj, Tck);
Chris@42 1010 Tct = VSUB(Tc3, Tbw);
Chris@42 1011 Tc4 = VADD(Tbw, Tc3);
Chris@42 1012 }
Chris@42 1013 {
Chris@42 1014 V TfN, Tel, TfY, Tfu, Tfw, Tfv, TcT, TcX, TcQ, TcO, TcW, TcY, TcP, TcH, TfZ;
Chris@42 1015 V TeE;
Chris@42 1016 {
Chris@42 1017 V Teu, TcS, TcN, TcV, TcG, TeD;
Chris@42 1018 TfN = VFNMS(LDK(KP923879532), Tek, Ted);
Chris@42 1019 Tel = VFMA(LDK(KP923879532), Tek, Ted);
Chris@42 1020 {
Chris@42 1021 V TcM, TcC, Tcr, Tcv;
Chris@42 1022 TcM = VFNMS(LDK(KP668178637), TcA, TcB);
Chris@42 1023 TcC = VFMA(LDK(KP668178637), TcB, TcA);
Chris@42 1024 Tcr = VFNMS(LDK(KP980785280), Tcq, Tcp);
Chris@42 1025 Tcv = VFMA(LDK(KP980785280), Tcq, Tcp);
Chris@42 1026 {
Chris@42 1027 V Tco, Tcm, Tcu, Tcw;
Chris@42 1028 Tco = VFMA(LDK(KP980785280), Tcl, Tci);
Chris@42 1029 Tcm = VFNMS(LDK(KP980785280), Tcl, Tci);
Chris@42 1030 Tcu = VFMA(LDK(KP980785280), Tct, Tcs);
Chris@42 1031 Tcw = VFNMS(LDK(KP980785280), Tct, Tcs);
Chris@42 1032 {
Chris@42 1033 V Tcn, Tc5, TcL, TcF;
Chris@42 1034 Tcn = VFMA(LDK(KP980785280), Tc4, TaZ);
Chris@42 1035 Tc5 = VFNMS(LDK(KP980785280), Tc4, TaZ);
Chris@42 1036 TcL = VFNMS(LDK(KP668178637), TcD, TcE);
Chris@42 1037 TcF = VFMA(LDK(KP668178637), TcE, TcD);
Chris@42 1038 TfY = VFNMS(LDK(KP923879532), Tft, Tfq);
Chris@42 1039 Tfu = VFMA(LDK(KP923879532), Tft, Tfq);
Chris@42 1040 Tfw = VFMA(LDK(KP198912367), Teq, Tet);
Chris@42 1041 Teu = VFNMS(LDK(KP198912367), Tet, Teq);
Chris@42 1042 ST(&(xo[WS(os, 92)]), VFNMSI(Tcu, Tcr), ovs, &(xo[0]));
Chris@42 1043 ST(&(xo[WS(os, 36)]), VFMAI(Tcu, Tcr), ovs, &(xo[0]));
Chris@42 1044 ST(&(xo[WS(os, 100)]), VFMAI(Tcw, Tcv), ovs, &(xo[0]));
Chris@42 1045 ST(&(xo[WS(os, 28)]), VFNMSI(Tcw, Tcv), ovs, &(xo[0]));
Chris@42 1046 ST(&(xo[WS(os, 4)]), VFMAI(Tco, Tcn), ovs, &(xo[0]));
Chris@42 1047 ST(&(xo[WS(os, 124)]), VFNMSI(Tco, Tcn), ovs, &(xo[0]));
Chris@42 1048 ST(&(xo[WS(os, 68)]), VFMAI(Tcm, Tc5), ovs, &(xo[0]));
Chris@42 1049 ST(&(xo[WS(os, 60)]), VFNMSI(Tcm, Tc5), ovs, &(xo[0]));
Chris@42 1050 TcS = VADD(TcM, TcL);
Chris@42 1051 TcN = VSUB(TcL, TcM);
Chris@42 1052 TcV = VSUB(TcF, TcC);
Chris@42 1053 TcG = VADD(TcC, TcF);
Chris@42 1054 TeD = VFNMS(LDK(KP198912367), TeC, Tez);
Chris@42 1055 Tfv = VFMA(LDK(KP198912367), Tez, TeC);
Chris@42 1056 }
Chris@42 1057 }
Chris@42 1058 }
Chris@42 1059 TcT = VFMA(LDK(KP831469612), TcS, TcR);
Chris@42 1060 TcX = VFNMS(LDK(KP831469612), TcS, TcR);
Chris@42 1061 TcQ = VFMA(LDK(KP831469612), TcN, TcK);
Chris@42 1062 TcO = VFNMS(LDK(KP831469612), TcN, TcK);
Chris@42 1063 TcW = VFNMS(LDK(KP831469612), TcV, TcU);
Chris@42 1064 TcY = VFMA(LDK(KP831469612), TcV, TcU);
Chris@42 1065 TcP = VFMA(LDK(KP831469612), TcG, Tcz);
Chris@42 1066 TcH = VFNMS(LDK(KP831469612), TcG, Tcz);
Chris@42 1067 TfZ = VSUB(TeD, Teu);
Chris@42 1068 TeE = VADD(Teu, TeD);
Chris@42 1069 }
Chris@42 1070 {
Chris@42 1071 V TfQ, TeS, TfO, Tfx, TeZ, TfR, Tfd, Tfk;
Chris@42 1072 TfQ = VFNMS(LDK(KP923879532), TeR, TeK);
Chris@42 1073 TeS = VFMA(LDK(KP923879532), TeR, TeK);
Chris@42 1074 ST(&(xo[WS(os, 84)]), VFMAI(TcW, TcT), ovs, &(xo[0]));
Chris@42 1075 ST(&(xo[WS(os, 44)]), VFNMSI(TcW, TcT), ovs, &(xo[0]));
Chris@42 1076 ST(&(xo[WS(os, 108)]), VFNMSI(TcY, TcX), ovs, &(xo[0]));
Chris@42 1077 ST(&(xo[WS(os, 20)]), VFMAI(TcY, TcX), ovs, &(xo[0]));
Chris@42 1078 ST(&(xo[WS(os, 116)]), VFMAI(TcQ, TcP), ovs, &(xo[0]));
Chris@42 1079 ST(&(xo[WS(os, 12)]), VFNMSI(TcQ, TcP), ovs, &(xo[0]));
Chris@42 1080 ST(&(xo[WS(os, 52)]), VFMAI(TcO, TcH), ovs, &(xo[0]));
Chris@42 1081 ST(&(xo[WS(os, 76)]), VFNMSI(TcO, TcH), ovs, &(xo[0]));
Chris@42 1082 Tg0 = VFNMS(LDK(KP980785280), TfZ, TfY);
Chris@42 1083 Tga = VFMA(LDK(KP980785280), TfZ, TfY);
Chris@42 1084 TfF = VFNMS(LDK(KP980785280), TeE, Tel);
Chris@42 1085 TeF = VFMA(LDK(KP980785280), TeE, Tel);
Chris@42 1086 TfO = VADD(Tfw, Tfv);
Chris@42 1087 Tfx = VSUB(Tfv, Tfw);
Chris@42 1088 TeZ = VFMA(LDK(KP923879532), TeY, TeV);
Chris@42 1089 TfR = VFNMS(LDK(KP923879532), TeY, TeV);
Chris@42 1090 TfT = VFNMS(LDK(KP923879532), Tfc, Tf5);
Chris@42 1091 Tfd = VFMA(LDK(KP923879532), Tfc, Tf5);
Chris@42 1092 Tfk = VFMA(LDK(KP923879532), Tfj, Tfg);
Chris@42 1093 TfU = VFNMS(LDK(KP923879532), Tfj, Tfg);
Chris@42 1094 TfP = VFMA(LDK(KP980785280), TfO, TfN);
Chris@42 1095 Tg7 = VFNMS(LDK(KP980785280), TfO, TfN);
Chris@42 1096 TfI = VFNMS(LDK(KP980785280), Tfx, Tfu);
Chris@42 1097 Tfy = VFMA(LDK(KP980785280), Tfx, Tfu);
Chris@42 1098 TfA = VFMA(LDK(KP098491403), TeS, TeZ);
Chris@42 1099 Tf0 = VFNMS(LDK(KP098491403), TeZ, TeS);
Chris@42 1100 Tfz = VFMA(LDK(KP098491403), Tfd, Tfk);
Chris@42 1101 Tfl = VFNMS(LDK(KP098491403), Tfk, Tfd);
Chris@42 1102 Tg2 = VFNMS(LDK(KP820678790), TfQ, TfR);
Chris@42 1103 TfS = VFMA(LDK(KP820678790), TfR, TfQ);
Chris@42 1104 }
Chris@42 1105 }
Chris@42 1106 }
Chris@42 1107 }
Chris@42 1108 }
Chris@42 1109 {
Chris@42 1110 V T8x, T8y, T8F, T8w, T8k, T8f, T8n, T80, T9l, T76, T87, T8U, T89, T7e, T7l;
Chris@42 1111 V T8a;
Chris@42 1112 {
Chris@42 1113 V The, Tho, TgT, Tgp, Th7, Th8, Thg, Th6, Th3, Thl, TgW, TgM, TgU, TgP, TgX;
Chris@42 1114 V TgE;
Chris@42 1115 {
Chris@42 1116 V Th1, TgI, TgK, TgJ;
Chris@42 1117 {
Chris@42 1118 V Tgh, Thc, Tgk, TfG, TfB, TfJ, Tfm, Tg1, TfV, Tgn, TfL, TfH;
Chris@42 1119 Th1 = VFMA(LDK(KP923879532), Tgg, Tgf);
Chris@42 1120 Tgh = VFNMS(LDK(KP923879532), Tgg, Tgf);
Chris@42 1121 Thc = VFNMS(LDK(KP923879532), TgH, TgG);
Chris@42 1122 TgI = VFMA(LDK(KP923879532), TgH, TgG);
Chris@42 1123 TgK = VFMA(LDK(KP668178637), Tgi, Tgj);
Chris@42 1124 Tgk = VFNMS(LDK(KP668178637), Tgj, Tgi);
Chris@42 1125 TfG = VADD(TfA, Tfz);
Chris@42 1126 TfB = VSUB(Tfz, TfA);
Chris@42 1127 TfJ = VSUB(Tfl, Tf0);
Chris@42 1128 Tfm = VADD(Tf0, Tfl);
Chris@42 1129 Tg1 = VFNMS(LDK(KP820678790), TfT, TfU);
Chris@42 1130 TfV = VFMA(LDK(KP820678790), TfU, TfT);
Chris@42 1131 Tgn = VFNMS(LDK(KP668178637), Tgm, Tgl);
Chris@42 1132 TgJ = VFMA(LDK(KP668178637), Tgl, Tgm);
Chris@42 1133 TfL = VFMA(LDK(KP995184726), TfG, TfF);
Chris@42 1134 TfH = VFNMS(LDK(KP995184726), TfG, TfF);
Chris@42 1135 {
Chris@42 1136 V TfE, TfC, TfM, TfK;
Chris@42 1137 TfE = VFMA(LDK(KP995184726), TfB, Tfy);
Chris@42 1138 TfC = VFNMS(LDK(KP995184726), TfB, Tfy);
Chris@42 1139 TfM = VFNMS(LDK(KP995184726), TfJ, TfI);
Chris@42 1140 TfK = VFMA(LDK(KP995184726), TfJ, TfI);
Chris@42 1141 {
Chris@42 1142 V TfD, Tfn, Tg8, Tg3;
Chris@42 1143 TfD = VFMA(LDK(KP995184726), Tfm, TeF);
Chris@42 1144 Tfn = VFNMS(LDK(KP995184726), Tfm, TeF);
Chris@42 1145 Tg8 = VADD(Tg2, Tg1);
Chris@42 1146 Tg3 = VSUB(Tg1, Tg2);
Chris@42 1147 {
Chris@42 1148 V Tgb, TfW, Thd, Tgo;
Chris@42 1149 Tgb = VSUB(TfV, TfS);
Chris@42 1150 TfW = VADD(TfS, TfV);
Chris@42 1151 Thd = VSUB(Tgn, Tgk);
Chris@42 1152 Tgo = VADD(Tgk, Tgn);
Chris@42 1153 ST(&(xo[WS(os, 98)]), VFMAI(TfM, TfL), ovs, &(xo[0]));
Chris@42 1154 ST(&(xo[WS(os, 30)]), VFNMSI(TfM, TfL), ovs, &(xo[0]));
Chris@42 1155 ST(&(xo[WS(os, 94)]), VFNMSI(TfK, TfH), ovs, &(xo[0]));
Chris@42 1156 ST(&(xo[WS(os, 34)]), VFMAI(TfK, TfH), ovs, &(xo[0]));
Chris@42 1157 ST(&(xo[WS(os, 2)]), VFMAI(TfE, TfD), ovs, &(xo[0]));
Chris@42 1158 ST(&(xo[WS(os, 126)]), VFNMSI(TfE, TfD), ovs, &(xo[0]));
Chris@42 1159 ST(&(xo[WS(os, 66)]), VFMAI(TfC, Tfn), ovs, &(xo[0]));
Chris@42 1160 ST(&(xo[WS(os, 62)]), VFNMSI(TfC, Tfn), ovs, &(xo[0]));
Chris@42 1161 {
Chris@42 1162 V Tgd, Tg9, Tg6, Tg4;
Chris@42 1163 Tgd = VFNMS(LDK(KP773010453), Tg8, Tg7);
Chris@42 1164 Tg9 = VFMA(LDK(KP773010453), Tg8, Tg7);
Chris@42 1165 Tg6 = VFMA(LDK(KP773010453), Tg3, Tg0);
Chris@42 1166 Tg4 = VFNMS(LDK(KP773010453), Tg3, Tg0);
Chris@42 1167 {
Chris@42 1168 V Tge, Tgc, Tg5, TfX;
Chris@42 1169 Tge = VFMA(LDK(KP773010453), Tgb, Tga);
Chris@42 1170 Tgc = VFNMS(LDK(KP773010453), Tgb, Tga);
Chris@42 1171 Tg5 = VFMA(LDK(KP773010453), TfW, TfP);
Chris@42 1172 TfX = VFNMS(LDK(KP773010453), TfW, TfP);
Chris@42 1173 The = VFMA(LDK(KP831469612), Thd, Thc);
Chris@42 1174 Tho = VFNMS(LDK(KP831469612), Thd, Thc);
Chris@42 1175 TgT = VFMA(LDK(KP831469612), Tgo, Tgh);
Chris@42 1176 Tgp = VFNMS(LDK(KP831469612), Tgo, Tgh);
Chris@42 1177 ST(&(xo[WS(os, 110)]), VFNMSI(Tge, Tgd), ovs, &(xo[0]));
Chris@42 1178 ST(&(xo[WS(os, 18)]), VFMAI(Tge, Tgd), ovs, &(xo[0]));
Chris@42 1179 ST(&(xo[WS(os, 82)]), VFMAI(Tgc, Tg9), ovs, &(xo[0]));
Chris@42 1180 ST(&(xo[WS(os, 46)]), VFNMSI(Tgc, Tg9), ovs, &(xo[0]));
Chris@42 1181 ST(&(xo[WS(os, 114)]), VFMAI(Tg6, Tg5), ovs, &(xo[0]));
Chris@42 1182 ST(&(xo[WS(os, 14)]), VFNMSI(Tg6, Tg5), ovs, &(xo[0]));
Chris@42 1183 ST(&(xo[WS(os, 50)]), VFMAI(Tg4, TfX), ovs, &(xo[0]));
Chris@42 1184 ST(&(xo[WS(os, 78)]), VFNMSI(Tg4, TfX), ovs, &(xo[0]));
Chris@42 1185 }
Chris@42 1186 }
Chris@42 1187 }
Chris@42 1188 }
Chris@42 1189 }
Chris@42 1190 }
Chris@42 1191 {
Chris@42 1192 V Th4, Tgs, Tgv, Th5, Tgz, TgC, Th2, TgL;
Chris@42 1193 Th4 = VFMA(LDK(KP923879532), Tgr, Tgq);
Chris@42 1194 Tgs = VFNMS(LDK(KP923879532), Tgr, Tgq);
Chris@42 1195 Tgv = VFMA(LDK(KP923879532), Tgu, Tgt);
Chris@42 1196 Th5 = VFNMS(LDK(KP923879532), Tgu, Tgt);
Chris@42 1197 Th7 = VFMA(LDK(KP923879532), Tgy, Tgx);
Chris@42 1198 Tgz = VFNMS(LDK(KP923879532), Tgy, Tgx);
Chris@42 1199 TgC = VFMA(LDK(KP923879532), TgB, TgA);
Chris@42 1200 Th8 = VFNMS(LDK(KP923879532), TgB, TgA);
Chris@42 1201 Th2 = VADD(TgK, TgJ);
Chris@42 1202 TgL = VSUB(TgJ, TgK);
Chris@42 1203 {
Chris@42 1204 V TgO, Tgw, TgN, TgD;
Chris@42 1205 TgO = VFMA(LDK(KP534511135), Tgs, Tgv);
Chris@42 1206 Tgw = VFNMS(LDK(KP534511135), Tgv, Tgs);
Chris@42 1207 TgN = VFMA(LDK(KP534511135), Tgz, TgC);
Chris@42 1208 TgD = VFNMS(LDK(KP534511135), TgC, Tgz);
Chris@42 1209 Thg = VFNMS(LDK(KP303346683), Th4, Th5);
Chris@42 1210 Th6 = VFMA(LDK(KP303346683), Th5, Th4);
Chris@42 1211 Th3 = VFMA(LDK(KP831469612), Th2, Th1);
Chris@42 1212 Thl = VFNMS(LDK(KP831469612), Th2, Th1);
Chris@42 1213 TgW = VFNMS(LDK(KP831469612), TgL, TgI);
Chris@42 1214 TgM = VFMA(LDK(KP831469612), TgL, TgI);
Chris@42 1215 TgU = VADD(TgO, TgN);
Chris@42 1216 TgP = VSUB(TgN, TgO);
Chris@42 1217 TgX = VSUB(TgD, Tgw);
Chris@42 1218 TgE = VADD(Tgw, TgD);
Chris@42 1219 }
Chris@42 1220 }
Chris@42 1221 }
Chris@42 1222 {
Chris@42 1223 V T8u, T8v, T7R, T8d, T7G, Thm, Thh, Thp, Tha, T7Y, Thr, Thn;
Chris@42 1224 {
Chris@42 1225 V T7y, T7F, TgZ, TgV;
Chris@42 1226 T8u = VFNMS(LDK(KP831469612), T7x, T7q);
Chris@42 1227 T7y = VFMA(LDK(KP831469612), T7x, T7q);
Chris@42 1228 T7F = VFMA(LDK(KP831469612), T7E, T7B);
Chris@42 1229 T8v = VFNMS(LDK(KP831469612), T7E, T7B);
Chris@42 1230 T8x = VFNMS(LDK(KP831469612), T7Q, T7J);
Chris@42 1231 T7R = VFMA(LDK(KP831469612), T7Q, T7J);
Chris@42 1232 TgZ = VFMA(LDK(KP881921264), TgU, TgT);
Chris@42 1233 TgV = VFNMS(LDK(KP881921264), TgU, TgT);
Chris@42 1234 {
Chris@42 1235 V TgS, TgQ, Th0, TgY;
Chris@42 1236 TgS = VFMA(LDK(KP881921264), TgP, TgM);
Chris@42 1237 TgQ = VFNMS(LDK(KP881921264), TgP, TgM);
Chris@42 1238 Th0 = VFNMS(LDK(KP881921264), TgX, TgW);
Chris@42 1239 TgY = VFMA(LDK(KP881921264), TgX, TgW);
Chris@42 1240 {
Chris@42 1241 V TgR, TgF, Thf, Th9;
Chris@42 1242 TgR = VFMA(LDK(KP881921264), TgE, Tgp);
Chris@42 1243 TgF = VFNMS(LDK(KP881921264), TgE, Tgp);
Chris@42 1244 Thf = VFNMS(LDK(KP303346683), Th7, Th8);
Chris@42 1245 Th9 = VFMA(LDK(KP303346683), Th8, Th7);
Chris@42 1246 T8d = VFNMS(LDK(KP148335987), T7y, T7F);
Chris@42 1247 T7G = VFMA(LDK(KP148335987), T7F, T7y);
Chris@42 1248 ST(&(xo[WS(os, 106)]), VFMAI(Th0, TgZ), ovs, &(xo[0]));
Chris@42 1249 ST(&(xo[WS(os, 22)]), VFNMSI(Th0, TgZ), ovs, &(xo[0]));
Chris@42 1250 ST(&(xo[WS(os, 86)]), VFNMSI(TgY, TgV), ovs, &(xo[0]));
Chris@42 1251 ST(&(xo[WS(os, 42)]), VFMAI(TgY, TgV), ovs, &(xo[0]));
Chris@42 1252 ST(&(xo[WS(os, 10)]), VFMAI(TgS, TgR), ovs, &(xo[0]));
Chris@42 1253 ST(&(xo[WS(os, 118)]), VFNMSI(TgS, TgR), ovs, &(xo[0]));
Chris@42 1254 ST(&(xo[WS(os, 74)]), VFMAI(TgQ, TgF), ovs, &(xo[0]));
Chris@42 1255 ST(&(xo[WS(os, 54)]), VFNMSI(TgQ, TgF), ovs, &(xo[0]));
Chris@42 1256 Thm = VADD(Thg, Thf);
Chris@42 1257 Thh = VSUB(Thf, Thg);
Chris@42 1258 Thp = VSUB(Th9, Th6);
Chris@42 1259 Tha = VADD(Th6, Th9);
Chris@42 1260 T7Y = VFMA(LDK(KP831469612), T7X, T7U);
Chris@42 1261 T8y = VFNMS(LDK(KP831469612), T7X, T7U);
Chris@42 1262 }
Chris@42 1263 }
Chris@42 1264 }
Chris@42 1265 Thr = VFNMS(LDK(KP956940335), Thm, Thl);
Chris@42 1266 Thn = VFMA(LDK(KP956940335), Thm, Thl);
Chris@42 1267 {
Chris@42 1268 V Thk, Thi, Ths, Thq;
Chris@42 1269 Thk = VFMA(LDK(KP956940335), Thh, The);
Chris@42 1270 Thi = VFNMS(LDK(KP956940335), Thh, The);
Chris@42 1271 Ths = VFMA(LDK(KP956940335), Thp, Tho);
Chris@42 1272 Thq = VFNMS(LDK(KP956940335), Thp, Tho);
Chris@42 1273 {
Chris@42 1274 V Thj, Thb, T8e, T7Z;
Chris@42 1275 Thj = VFMA(LDK(KP956940335), Tha, Th3);
Chris@42 1276 Thb = VFNMS(LDK(KP956940335), Tha, Th3);
Chris@42 1277 T8e = VFNMS(LDK(KP148335987), T7R, T7Y);
Chris@42 1278 T7Z = VFMA(LDK(KP148335987), T7Y, T7R);
Chris@42 1279 T8F = VFMA(LDK(KP741650546), T8u, T8v);
Chris@42 1280 T8w = VFNMS(LDK(KP741650546), T8v, T8u);
Chris@42 1281 ST(&(xo[WS(os, 102)]), VFNMSI(Ths, Thr), ovs, &(xo[0]));
Chris@42 1282 ST(&(xo[WS(os, 26)]), VFMAI(Ths, Thr), ovs, &(xo[0]));
Chris@42 1283 ST(&(xo[WS(os, 90)]), VFMAI(Thq, Thn), ovs, &(xo[0]));
Chris@42 1284 ST(&(xo[WS(os, 38)]), VFNMSI(Thq, Thn), ovs, &(xo[0]));
Chris@42 1285 ST(&(xo[WS(os, 122)]), VFMAI(Thk, Thj), ovs, &(xo[0]));
Chris@42 1286 ST(&(xo[WS(os, 6)]), VFNMSI(Thk, Thj), ovs, &(xo[0]));
Chris@42 1287 ST(&(xo[WS(os, 58)]), VFMAI(Thi, Thb), ovs, &(xo[0]));
Chris@42 1288 ST(&(xo[WS(os, 70)]), VFNMSI(Thi, Thb), ovs, &(xo[0]));
Chris@42 1289 T8k = VADD(T8d, T8e);
Chris@42 1290 T8f = VSUB(T8d, T8e);
Chris@42 1291 T8n = VSUB(T7Z, T7G);
Chris@42 1292 T80 = VADD(T7G, T7Z);
Chris@42 1293 }
Chris@42 1294 }
Chris@42 1295 T9l = VSUB(T75, T72);
Chris@42 1296 T76 = VADD(T72, T75);
Chris@42 1297 T87 = VSUB(T85, T86);
Chris@42 1298 T8U = VADD(T85, T86);
Chris@42 1299 T89 = VFNMS(LDK(KP303346683), T7a, T7d);
Chris@42 1300 T7e = VFMA(LDK(KP303346683), T7d, T7a);
Chris@42 1301 T7l = VFMA(LDK(KP303346683), T7k, T7h);
Chris@42 1302 T8a = VFNMS(LDK(KP303346683), T7h, T7k);
Chris@42 1303 }
Chris@42 1304 }
Chris@42 1305 {
Chris@42 1306 V T11, T5h, T5a, T55, T5d, T4K, T5C, T5x, T5F, T5q, T4X, T4Z, T1C, T2d, T50;
Chris@42 1307 {
Chris@42 1308 V T5k, T3g, T3t, T5l, T5n, T4v, T4I, T5o, T8G, T8z;
Chris@42 1309 T5k = VFNMS(LDK(KP980785280), T3f, T2G);
Chris@42 1310 T3g = VFMA(LDK(KP980785280), T3f, T2G);
Chris@42 1311 T8G = VFMA(LDK(KP741650546), T8x, T8y);
Chris@42 1312 T8z = VFNMS(LDK(KP741650546), T8y, T8x);
Chris@42 1313 {
Chris@42 1314 V T8r, T77, T8C, T88;
Chris@42 1315 T8r = VFNMS(LDK(KP831469612), T76, T6Z);
Chris@42 1316 T77 = VFMA(LDK(KP831469612), T76, T6Z);
Chris@42 1317 T8C = VFNMS(LDK(KP831469612), T87, T84);
Chris@42 1318 T88 = VFMA(LDK(KP831469612), T87, T84);
Chris@42 1319 {
Chris@42 1320 V T8D, T7m, T8s, T8b;
Chris@42 1321 T8D = VSUB(T7l, T7e);
Chris@42 1322 T7m = VADD(T7e, T7l);
Chris@42 1323 T8s = VADD(T89, T8a);
Chris@42 1324 T8b = VSUB(T89, T8a);
Chris@42 1325 {
Chris@42 1326 V T8M, T8H, T8P, T8A;
Chris@42 1327 T8M = VADD(T8F, T8G);
Chris@42 1328 T8H = VSUB(T8F, T8G);
Chris@42 1329 T8P = VSUB(T8z, T8w);
Chris@42 1330 T8A = VADD(T8w, T8z);
Chris@42 1331 {
Chris@42 1332 V T8E, T8O, T8j, T7n;
Chris@42 1333 T8E = VFNMS(LDK(KP956940335), T8D, T8C);
Chris@42 1334 T8O = VFMA(LDK(KP956940335), T8D, T8C);
Chris@42 1335 T8j = VFNMS(LDK(KP956940335), T7m, T77);
Chris@42 1336 T7n = VFMA(LDK(KP956940335), T7m, T77);
Chris@42 1337 {
Chris@42 1338 V T8t, T8L, T8m, T8c;
Chris@42 1339 T8t = VFNMS(LDK(KP956940335), T8s, T8r);
Chris@42 1340 T8L = VFMA(LDK(KP956940335), T8s, T8r);
Chris@42 1341 T8m = VFNMS(LDK(KP956940335), T8b, T88);
Chris@42 1342 T8c = VFMA(LDK(KP956940335), T8b, T88);
Chris@42 1343 {
Chris@42 1344 V T8K, T8I, T8S, T8Q;
Chris@42 1345 T8K = VFMA(LDK(KP803207531), T8H, T8E);
Chris@42 1346 T8I = VFNMS(LDK(KP803207531), T8H, T8E);
Chris@42 1347 T8S = VFMA(LDK(KP803207531), T8P, T8O);
Chris@42 1348 T8Q = VFNMS(LDK(KP803207531), T8P, T8O);
Chris@42 1349 {
Chris@42 1350 V T8p, T8l, T8h, T81;
Chris@42 1351 T8p = VFNMS(LDK(KP989176509), T8k, T8j);
Chris@42 1352 T8l = VFMA(LDK(KP989176509), T8k, T8j);
Chris@42 1353 T8h = VFMA(LDK(KP989176509), T80, T7n);
Chris@42 1354 T81 = VFNMS(LDK(KP989176509), T80, T7n);
Chris@42 1355 {
Chris@42 1356 V T8J, T8B, T8R, T8N;
Chris@42 1357 T8J = VFMA(LDK(KP803207531), T8A, T8t);
Chris@42 1358 T8B = VFNMS(LDK(KP803207531), T8A, T8t);
Chris@42 1359 T8R = VFMA(LDK(KP803207531), T8M, T8L);
Chris@42 1360 T8N = VFNMS(LDK(KP803207531), T8M, T8L);
Chris@42 1361 {
Chris@42 1362 V T8q, T8o, T8i, T8g;
Chris@42 1363 T8q = VFNMS(LDK(KP989176509), T8n, T8m);
Chris@42 1364 T8o = VFMA(LDK(KP989176509), T8n, T8m);
Chris@42 1365 T8i = VFMA(LDK(KP989176509), T8f, T8c);
Chris@42 1366 T8g = VFNMS(LDK(KP989176509), T8f, T8c);
Chris@42 1367 ST(&(xo[WS(os, 115)]), VFMAI(T8K, T8J), ovs, &(xo[WS(os, 1)]));
Chris@42 1368 ST(&(xo[WS(os, 13)]), VFNMSI(T8K, T8J), ovs, &(xo[WS(os, 1)]));
Chris@42 1369 ST(&(xo[WS(os, 51)]), VFMAI(T8I, T8B), ovs, &(xo[WS(os, 1)]));
Chris@42 1370 ST(&(xo[WS(os, 77)]), VFNMSI(T8I, T8B), ovs, &(xo[WS(os, 1)]));
Chris@42 1371 ST(&(xo[WS(os, 109)]), VFNMSI(T8S, T8R), ovs, &(xo[WS(os, 1)]));
Chris@42 1372 ST(&(xo[WS(os, 19)]), VFMAI(T8S, T8R), ovs, &(xo[WS(os, 1)]));
Chris@42 1373 ST(&(xo[WS(os, 83)]), VFMAI(T8Q, T8N), ovs, &(xo[WS(os, 1)]));
Chris@42 1374 ST(&(xo[WS(os, 45)]), VFNMSI(T8Q, T8N), ovs, &(xo[WS(os, 1)]));
Chris@42 1375 ST(&(xo[WS(os, 99)]), VFMAI(T8q, T8p), ovs, &(xo[WS(os, 1)]));
Chris@42 1376 ST(&(xo[WS(os, 29)]), VFNMSI(T8q, T8p), ovs, &(xo[WS(os, 1)]));
Chris@42 1377 ST(&(xo[WS(os, 93)]), VFNMSI(T8o, T8l), ovs, &(xo[WS(os, 1)]));
Chris@42 1378 ST(&(xo[WS(os, 35)]), VFMAI(T8o, T8l), ovs, &(xo[WS(os, 1)]));
Chris@42 1379 ST(&(xo[WS(os, 3)]), VFMAI(T8i, T8h), ovs, &(xo[WS(os, 1)]));
Chris@42 1380 ST(&(xo[WS(os, 125)]), VFNMSI(T8i, T8h), ovs, &(xo[WS(os, 1)]));
Chris@42 1381 ST(&(xo[WS(os, 67)]), VFMAI(T8g, T81), ovs, &(xo[WS(os, 1)]));
Chris@42 1382 ST(&(xo[WS(os, 61)]), VFNMSI(T8g, T81), ovs, &(xo[WS(os, 1)]));
Chris@42 1383 T3t = VFMA(LDK(KP980785280), T3s, T3p);
Chris@42 1384 T5l = VFNMS(LDK(KP980785280), T3s, T3p);
Chris@42 1385 }
Chris@42 1386 }
Chris@42 1387 }
Chris@42 1388 }
Chris@42 1389 }
Chris@42 1390 }
Chris@42 1391 }
Chris@42 1392 }
Chris@42 1393 }
Chris@42 1394 T5n = VFNMS(LDK(KP980785280), T4u, T3V);
Chris@42 1395 T4v = VFMA(LDK(KP980785280), T4u, T3V);
Chris@42 1396 T4I = VFMA(LDK(KP980785280), T4H, T4E);
Chris@42 1397 T5o = VFNMS(LDK(KP980785280), T4H, T4E);
Chris@42 1398 {
Chris@42 1399 V T53, T3u, T54, T4J, T5v, T5m, T5w, T5p, T10;
Chris@42 1400 T6b = VSUB(TZ, TI);
Chris@42 1401 T10 = VADD(TI, TZ);
Chris@42 1402 T53 = VFMA(LDK(KP049126849), T3g, T3t);
Chris@42 1403 T3u = VFNMS(LDK(KP049126849), T3t, T3g);
Chris@42 1404 T54 = VFMA(LDK(KP049126849), T4v, T4I);
Chris@42 1405 T4J = VFNMS(LDK(KP049126849), T4I, T4v);
Chris@42 1406 T5v = VFNMS(LDK(KP906347169), T5k, T5l);
Chris@42 1407 T5m = VFMA(LDK(KP906347169), T5l, T5k);
Chris@42 1408 T5w = VFNMS(LDK(KP906347169), T5n, T5o);
Chris@42 1409 T5p = VFMA(LDK(KP906347169), T5o, T5n);
Chris@42 1410 T11 = VFMA(LDK(KP980785280), T10, Tr);
Chris@42 1411 T5h = VFNMS(LDK(KP980785280), T10, Tr);
Chris@42 1412 T5a = VADD(T53, T54);
Chris@42 1413 T55 = VSUB(T53, T54);
Chris@42 1414 T5d = VSUB(T4J, T3u);
Chris@42 1415 T4K = VADD(T3u, T4J);
Chris@42 1416 T5C = VADD(T5v, T5w);
Chris@42 1417 T5x = VSUB(T5v, T5w);
Chris@42 1418 T5F = VSUB(T5p, T5m);
Chris@42 1419 T5q = VADD(T5m, T5p);
Chris@42 1420 T4X = VSUB(T4V, T4W);
Chris@42 1421 T5K = VADD(T4V, T4W);
Chris@42 1422 }
Chris@42 1423 T4Z = VFMA(LDK(KP098491403), T1s, T1B);
Chris@42 1424 T1C = VFNMS(LDK(KP098491403), T1B, T1s);
Chris@42 1425 T2d = VFNMS(LDK(KP098491403), T2c, T23);
Chris@42 1426 T50 = VFMA(LDK(KP098491403), T23, T2c);
Chris@42 1427 }
Chris@42 1428 {
Chris@42 1429 V T9y, T9t, T9B, T9i, T9o, T9n, T9F, T8V, T9Q, T9m, T9R, T92, Ta0, T9V, Ta3;
Chris@42 1430 V T9O;
Chris@42 1431 {
Chris@42 1432 V T9I, T9J, T9L, T9d, T5s, T4Y, T5t, T2e, T5i, T51, T9r, T9a, T9g, T9M, T96;
Chris@42 1433 V T99;
Chris@42 1434 T9I = VFMA(LDK(KP831469612), T95, T94);
Chris@42 1435 T96 = VFNMS(LDK(KP831469612), T95, T94);
Chris@42 1436 T99 = VFNMS(LDK(KP831469612), T98, T97);
Chris@42 1437 T9J = VFMA(LDK(KP831469612), T98, T97);
Chris@42 1438 T9L = VFMA(LDK(KP831469612), T9c, T9b);
Chris@42 1439 T9d = VFNMS(LDK(KP831469612), T9c, T9b);
Chris@42 1440 T5s = VFNMS(LDK(KP980785280), T4X, T4U);
Chris@42 1441 T4Y = VFMA(LDK(KP980785280), T4X, T4U);
Chris@42 1442 T5t = VSUB(T2d, T1C);
Chris@42 1443 T2e = VADD(T1C, T2d);
Chris@42 1444 T5i = VADD(T4Z, T50);
Chris@42 1445 T51 = VSUB(T4Z, T50);
Chris@42 1446 T9r = VFNMS(LDK(KP599376933), T96, T99);
Chris@42 1447 T9a = VFMA(LDK(KP599376933), T99, T96);
Chris@42 1448 T9g = VFNMS(LDK(KP831469612), T9f, T9e);
Chris@42 1449 T9M = VFMA(LDK(KP831469612), T9f, T9e);
Chris@42 1450 {
Chris@42 1451 V T5u, T5E, T8Y, T91;
Chris@42 1452 T5u = VFMA(LDK(KP995184726), T5t, T5s);
Chris@42 1453 T5E = VFNMS(LDK(KP995184726), T5t, T5s);
Chris@42 1454 {
Chris@42 1455 V T59, T2f, T5j, T5B;
Chris@42 1456 T59 = VFNMS(LDK(KP995184726), T2e, T11);
Chris@42 1457 T2f = VFMA(LDK(KP995184726), T2e, T11);
Chris@42 1458 T5j = VFMA(LDK(KP995184726), T5i, T5h);
Chris@42 1459 T5B = VFNMS(LDK(KP995184726), T5i, T5h);
Chris@42 1460 {
Chris@42 1461 V T5c, T52, T9s, T9h;
Chris@42 1462 T5c = VFNMS(LDK(KP995184726), T51, T4Y);
Chris@42 1463 T52 = VFMA(LDK(KP995184726), T51, T4Y);
Chris@42 1464 T9s = VFNMS(LDK(KP599376933), T9d, T9g);
Chris@42 1465 T9h = VFMA(LDK(KP599376933), T9g, T9d);
Chris@42 1466 {
Chris@42 1467 V T5A, T5y, T5I, T5G;
Chris@42 1468 T5A = VFMA(LDK(KP740951125), T5x, T5u);
Chris@42 1469 T5y = VFNMS(LDK(KP740951125), T5x, T5u);
Chris@42 1470 T5I = VFNMS(LDK(KP740951125), T5F, T5E);
Chris@42 1471 T5G = VFMA(LDK(KP740951125), T5F, T5E);
Chris@42 1472 {
Chris@42 1473 V T5f, T5b, T57, T4L;
Chris@42 1474 T5f = VFMA(LDK(KP998795456), T5a, T59);
Chris@42 1475 T5b = VFNMS(LDK(KP998795456), T5a, T59);
Chris@42 1476 T57 = VFMA(LDK(KP998795456), T4K, T2f);
Chris@42 1477 T4L = VFNMS(LDK(KP998795456), T4K, T2f);
Chris@42 1478 {
Chris@42 1479 V T5z, T5r, T5H, T5D;
Chris@42 1480 T5z = VFMA(LDK(KP740951125), T5q, T5j);
Chris@42 1481 T5r = VFNMS(LDK(KP740951125), T5q, T5j);
Chris@42 1482 T5H = VFNMS(LDK(KP740951125), T5C, T5B);
Chris@42 1483 T5D = VFMA(LDK(KP740951125), T5C, T5B);
Chris@42 1484 {
Chris@42 1485 V T5g, T5e, T58, T56;
Chris@42 1486 T5g = VFMA(LDK(KP998795456), T5d, T5c);
Chris@42 1487 T5e = VFNMS(LDK(KP998795456), T5d, T5c);
Chris@42 1488 T58 = VFMA(LDK(KP998795456), T55, T52);
Chris@42 1489 T56 = VFNMS(LDK(KP998795456), T55, T52);
Chris@42 1490 T9y = VADD(T9r, T9s);
Chris@42 1491 T9t = VSUB(T9r, T9s);
Chris@42 1492 T9B = VSUB(T9h, T9a);
Chris@42 1493 T9i = VADD(T9a, T9h);
Chris@42 1494 ST(&(xo[WS(os, 15)]), VFMAI(T5A, T5z), ovs, &(xo[WS(os, 1)]));
Chris@42 1495 ST(&(xo[WS(os, 113)]), VFNMSI(T5A, T5z), ovs, &(xo[WS(os, 1)]));
Chris@42 1496 ST(&(xo[WS(os, 79)]), VFMAI(T5y, T5r), ovs, &(xo[WS(os, 1)]));
Chris@42 1497 ST(&(xo[WS(os, 49)]), VFNMSI(T5y, T5r), ovs, &(xo[WS(os, 1)]));
Chris@42 1498 ST(&(xo[WS(os, 111)]), VFMAI(T5I, T5H), ovs, &(xo[WS(os, 1)]));
Chris@42 1499 ST(&(xo[WS(os, 17)]), VFNMSI(T5I, T5H), ovs, &(xo[WS(os, 1)]));
Chris@42 1500 ST(&(xo[WS(os, 81)]), VFNMSI(T5G, T5D), ovs, &(xo[WS(os, 1)]));
Chris@42 1501 ST(&(xo[WS(os, 47)]), VFMAI(T5G, T5D), ovs, &(xo[WS(os, 1)]));
Chris@42 1502 ST(&(xo[WS(os, 97)]), VFNMSI(T5g, T5f), ovs, &(xo[WS(os, 1)]));
Chris@42 1503 ST(&(xo[WS(os, 31)]), VFMAI(T5g, T5f), ovs, &(xo[WS(os, 1)]));
Chris@42 1504 ST(&(xo[WS(os, 95)]), VFMAI(T5e, T5b), ovs, &(xo[WS(os, 1)]));
Chris@42 1505 ST(&(xo[WS(os, 33)]), VFNMSI(T5e, T5b), ovs, &(xo[WS(os, 1)]));
Chris@42 1506 ST(&(xo[WS(os, 127)]), VFMAI(T58, T57), ovs, &(xo[WS(os, 1)]));
Chris@42 1507 ST(&(xo[WS(os, 1)]), VFNMSI(T58, T57), ovs, &(xo[WS(os, 1)]));
Chris@42 1508 ST(&(xo[WS(os, 63)]), VFMAI(T56, T4L), ovs, &(xo[WS(os, 1)]));
Chris@42 1509 ST(&(xo[WS(os, 65)]), VFNMSI(T56, T4L), ovs, &(xo[WS(os, 1)]));
Chris@42 1510 }
Chris@42 1511 }
Chris@42 1512 }
Chris@42 1513 }
Chris@42 1514 }
Chris@42 1515 }
Chris@42 1516 T9o = VFNMS(LDK(KP534511135), T8W, T8X);
Chris@42 1517 T8Y = VFMA(LDK(KP534511135), T8X, T8W);
Chris@42 1518 T91 = VFMA(LDK(KP534511135), T90, T8Z);
Chris@42 1519 T9n = VFNMS(LDK(KP534511135), T8Z, T90);
Chris@42 1520 {
Chris@42 1521 V T9T, T9K, T9U, T9N;
Chris@42 1522 T9T = VFMA(LDK(KP250486960), T9I, T9J);
Chris@42 1523 T9K = VFNMS(LDK(KP250486960), T9J, T9I);
Chris@42 1524 T9U = VFMA(LDK(KP250486960), T9L, T9M);
Chris@42 1525 T9N = VFNMS(LDK(KP250486960), T9M, T9L);
Chris@42 1526 T9F = VFNMS(LDK(KP831469612), T8U, T8T);
Chris@42 1527 T8V = VFMA(LDK(KP831469612), T8U, T8T);
Chris@42 1528 T9Q = VFNMS(LDK(KP831469612), T9l, T9k);
Chris@42 1529 T9m = VFMA(LDK(KP831469612), T9l, T9k);
Chris@42 1530 T9R = VSUB(T8Y, T91);
Chris@42 1531 T92 = VADD(T8Y, T91);
Chris@42 1532 Ta0 = VADD(T9T, T9U);
Chris@42 1533 T9V = VSUB(T9T, T9U);
Chris@42 1534 Ta3 = VSUB(T9N, T9K);
Chris@42 1535 T9O = VADD(T9K, T9N);
Chris@42 1536 }
Chris@42 1537 }
Chris@42 1538 }
Chris@42 1539 {
Chris@42 1540 V T6y, T6z, T63, T9Y, T9W, Ta6, Ta4, T9D, T9z, T9v, T9j, T6h, T60, T9H, T9Z;
Chris@42 1541 V T9A, T9q, T66, T9X, T9P;
Chris@42 1542 {
Chris@42 1543 V T5W, T9S, Ta2, T9x, T93, T5Z, T9G, T9p;
Chris@42 1544 T6y = VFMA(LDK(KP980785280), T5V, T5U);
Chris@42 1545 T5W = VFNMS(LDK(KP980785280), T5V, T5U);
Chris@42 1546 T9S = VFMA(LDK(KP881921264), T9R, T9Q);
Chris@42 1547 Ta2 = VFNMS(LDK(KP881921264), T9R, T9Q);
Chris@42 1548 T9x = VFNMS(LDK(KP881921264), T92, T8V);
Chris@42 1549 T93 = VFMA(LDK(KP881921264), T92, T8V);
Chris@42 1550 T5Z = VFMA(LDK(KP980785280), T5Y, T5X);
Chris@42 1551 T6z = VFNMS(LDK(KP980785280), T5Y, T5X);
Chris@42 1552 T6B = VFMA(LDK(KP980785280), T62, T61);
Chris@42 1553 T63 = VFNMS(LDK(KP980785280), T62, T61);
Chris@42 1554 T9G = VADD(T9o, T9n);
Chris@42 1555 T9p = VSUB(T9n, T9o);
Chris@42 1556 T9Y = VFMA(LDK(KP970031253), T9V, T9S);
Chris@42 1557 T9W = VFNMS(LDK(KP970031253), T9V, T9S);
Chris@42 1558 Ta6 = VFMA(LDK(KP970031253), Ta3, Ta2);
Chris@42 1559 Ta4 = VFNMS(LDK(KP970031253), Ta3, Ta2);
Chris@42 1560 T9D = VFNMS(LDK(KP857728610), T9y, T9x);
Chris@42 1561 T9z = VFMA(LDK(KP857728610), T9y, T9x);
Chris@42 1562 T9v = VFMA(LDK(KP857728610), T9i, T93);
Chris@42 1563 T9j = VFNMS(LDK(KP857728610), T9i, T93);
Chris@42 1564 T6h = VFMA(LDK(KP472964775), T5W, T5Z);
Chris@42 1565 T60 = VFNMS(LDK(KP472964775), T5Z, T5W);
Chris@42 1566 T9H = VFMA(LDK(KP881921264), T9G, T9F);
Chris@42 1567 T9Z = VFNMS(LDK(KP881921264), T9G, T9F);
Chris@42 1568 T9A = VFNMS(LDK(KP881921264), T9p, T9m);
Chris@42 1569 T9q = VFMA(LDK(KP881921264), T9p, T9m);
Chris@42 1570 T66 = VFMA(LDK(KP980785280), T65, T64);
Chris@42 1571 T6C = VFNMS(LDK(KP980785280), T65, T64);
Chris@42 1572 }
Chris@42 1573 T9X = VFMA(LDK(KP970031253), T9O, T9H);
Chris@42 1574 T9P = VFNMS(LDK(KP970031253), T9O, T9H);
Chris@42 1575 {
Chris@42 1576 V Ta5, Ta1, T9E, T9C;
Chris@42 1577 Ta5 = VFMA(LDK(KP970031253), Ta0, T9Z);
Chris@42 1578 Ta1 = VFNMS(LDK(KP970031253), Ta0, T9Z);
Chris@42 1579 T9E = VFNMS(LDK(KP857728610), T9B, T9A);
Chris@42 1580 T9C = VFMA(LDK(KP857728610), T9B, T9A);
Chris@42 1581 {
Chris@42 1582 V T9w, T9u, T6i, T67;
Chris@42 1583 T9w = VFMA(LDK(KP857728610), T9t, T9q);
Chris@42 1584 T9u = VFNMS(LDK(KP857728610), T9t, T9q);
Chris@42 1585 T6i = VFMA(LDK(KP472964775), T63, T66);
Chris@42 1586 T67 = VFNMS(LDK(KP472964775), T66, T63);
Chris@42 1587 T6J = VFNMS(LDK(KP357805721), T6y, T6z);
Chris@42 1588 T6A = VFMA(LDK(KP357805721), T6z, T6y);
Chris@42 1589 ST(&(xo[WS(os, 123)]), VFMAI(T9Y, T9X), ovs, &(xo[WS(os, 1)]));
Chris@42 1590 ST(&(xo[WS(os, 5)]), VFNMSI(T9Y, T9X), ovs, &(xo[WS(os, 1)]));
Chris@42 1591 ST(&(xo[WS(os, 59)]), VFMAI(T9W, T9P), ovs, &(xo[WS(os, 1)]));
Chris@42 1592 ST(&(xo[WS(os, 69)]), VFNMSI(T9W, T9P), ovs, &(xo[WS(os, 1)]));
Chris@42 1593 ST(&(xo[WS(os, 101)]), VFNMSI(Ta6, Ta5), ovs, &(xo[WS(os, 1)]));
Chris@42 1594 ST(&(xo[WS(os, 27)]), VFMAI(Ta6, Ta5), ovs, &(xo[WS(os, 1)]));
Chris@42 1595 ST(&(xo[WS(os, 91)]), VFMAI(Ta4, Ta1), ovs, &(xo[WS(os, 1)]));
Chris@42 1596 ST(&(xo[WS(os, 37)]), VFNMSI(Ta4, Ta1), ovs, &(xo[WS(os, 1)]));
Chris@42 1597 ST(&(xo[WS(os, 107)]), VFMAI(T9E, T9D), ovs, &(xo[WS(os, 1)]));
Chris@42 1598 ST(&(xo[WS(os, 21)]), VFNMSI(T9E, T9D), ovs, &(xo[WS(os, 1)]));
Chris@42 1599 ST(&(xo[WS(os, 85)]), VFNMSI(T9C, T9z), ovs, &(xo[WS(os, 1)]));
Chris@42 1600 ST(&(xo[WS(os, 43)]), VFMAI(T9C, T9z), ovs, &(xo[WS(os, 1)]));
Chris@42 1601 ST(&(xo[WS(os, 11)]), VFMAI(T9w, T9v), ovs, &(xo[WS(os, 1)]));
Chris@42 1602 ST(&(xo[WS(os, 117)]), VFNMSI(T9w, T9v), ovs, &(xo[WS(os, 1)]));
Chris@42 1603 ST(&(xo[WS(os, 75)]), VFMAI(T9u, T9j), ovs, &(xo[WS(os, 1)]));
Chris@42 1604 ST(&(xo[WS(os, 53)]), VFNMSI(T9u, T9j), ovs, &(xo[WS(os, 1)]));
Chris@42 1605 T6o = VADD(T6h, T6i);
Chris@42 1606 T6j = VSUB(T6h, T6i);
Chris@42 1607 T6r = VSUB(T67, T60);
Chris@42 1608 T68 = VADD(T60, T67);
Chris@42 1609 }
Chris@42 1610 }
Chris@42 1611 T6e = VFMA(LDK(KP820678790), T5M, T5N);
Chris@42 1612 T5O = VFNMS(LDK(KP820678790), T5N, T5M);
Chris@42 1613 T5R = VFNMS(LDK(KP820678790), T5Q, T5P);
Chris@42 1614 T6d = VFMA(LDK(KP820678790), T5P, T5Q);
Chris@42 1615 }
Chris@42 1616 }
Chris@42 1617 }
Chris@42 1618 }
Chris@42 1619 }
Chris@42 1620 }
Chris@42 1621 T6D = VFMA(LDK(KP357805721), T6C, T6B);
Chris@42 1622 T6K = VFNMS(LDK(KP357805721), T6B, T6C);
Chris@42 1623 {
Chris@42 1624 V T5L, T6v, T6c, T6G;
Chris@42 1625 T5L = VFNMS(LDK(KP980785280), T5K, T5J);
Chris@42 1626 T6v = VFMA(LDK(KP980785280), T5K, T5J);
Chris@42 1627 T6c = VFNMS(LDK(KP980785280), T6b, T6a);
Chris@42 1628 T6G = VFMA(LDK(KP980785280), T6b, T6a);
Chris@42 1629 {
Chris@42 1630 V T5S, T6H, T6f, T6w;
Chris@42 1631 T5S = VADD(T5O, T5R);
Chris@42 1632 T6H = VSUB(T5O, T5R);
Chris@42 1633 T6f = VSUB(T6d, T6e);
Chris@42 1634 T6w = VADD(T6e, T6d);
Chris@42 1635 {
Chris@42 1636 V T6L, T6Q, T6E, T6T;
Chris@42 1637 T6L = VSUB(T6J, T6K);
Chris@42 1638 T6Q = VADD(T6J, T6K);
Chris@42 1639 T6E = VADD(T6A, T6D);
Chris@42 1640 T6T = VSUB(T6D, T6A);
Chris@42 1641 {
Chris@42 1642 V T6S, T6I, T5T, T6n;
Chris@42 1643 T6S = VFNMS(LDK(KP773010453), T6H, T6G);
Chris@42 1644 T6I = VFMA(LDK(KP773010453), T6H, T6G);
Chris@42 1645 T5T = VFNMS(LDK(KP773010453), T5S, T5L);
Chris@42 1646 T6n = VFMA(LDK(KP773010453), T5S, T5L);
Chris@42 1647 {
Chris@42 1648 V T6P, T6x, T6g, T6q;
Chris@42 1649 T6P = VFNMS(LDK(KP773010453), T6w, T6v);
Chris@42 1650 T6x = VFMA(LDK(KP773010453), T6w, T6v);
Chris@42 1651 T6g = VFNMS(LDK(KP773010453), T6f, T6c);
Chris@42 1652 T6q = VFMA(LDK(KP773010453), T6f, T6c);
Chris@42 1653 {
Chris@42 1654 V T6M, T6O, T6U, T6W;
Chris@42 1655 T6M = VFNMS(LDK(KP941544065), T6L, T6I);
Chris@42 1656 T6O = VFMA(LDK(KP941544065), T6L, T6I);
Chris@42 1657 T6U = VFMA(LDK(KP941544065), T6T, T6S);
Chris@42 1658 T6W = VFNMS(LDK(KP941544065), T6T, T6S);
Chris@42 1659 {
Chris@42 1660 V T6p, T6t, T69, T6l;
Chris@42 1661 T6p = VFNMS(LDK(KP903989293), T6o, T6n);
Chris@42 1662 T6t = VFMA(LDK(KP903989293), T6o, T6n);
Chris@42 1663 T69 = VFNMS(LDK(KP903989293), T68, T5T);
Chris@42 1664 T6l = VFMA(LDK(KP903989293), T68, T5T);
Chris@42 1665 {
Chris@42 1666 V T6F, T6N, T6R, T6V;
Chris@42 1667 T6F = VFNMS(LDK(KP941544065), T6E, T6x);
Chris@42 1668 T6N = VFMA(LDK(KP941544065), T6E, T6x);
Chris@42 1669 T6R = VFMA(LDK(KP941544065), T6Q, T6P);
Chris@42 1670 T6V = VFNMS(LDK(KP941544065), T6Q, T6P);
Chris@42 1671 {
Chris@42 1672 V T6s, T6u, T6k, T6m;
Chris@42 1673 T6s = VFNMS(LDK(KP903989293), T6r, T6q);
Chris@42 1674 T6u = VFMA(LDK(KP903989293), T6r, T6q);
Chris@42 1675 T6k = VFNMS(LDK(KP903989293), T6j, T6g);
Chris@42 1676 T6m = VFMA(LDK(KP903989293), T6j, T6g);
Chris@42 1677 ST(&(xo[WS(os, 7)]), VFMAI(T6O, T6N), ovs, &(xo[WS(os, 1)]));
Chris@42 1678 ST(&(xo[WS(os, 121)]), VFNMSI(T6O, T6N), ovs, &(xo[WS(os, 1)]));
Chris@42 1679 ST(&(xo[WS(os, 71)]), VFMAI(T6M, T6F), ovs, &(xo[WS(os, 1)]));
Chris@42 1680 ST(&(xo[WS(os, 57)]), VFNMSI(T6M, T6F), ovs, &(xo[WS(os, 1)]));
Chris@42 1681 ST(&(xo[WS(os, 103)]), VFMAI(T6W, T6V), ovs, &(xo[WS(os, 1)]));
Chris@42 1682 ST(&(xo[WS(os, 25)]), VFNMSI(T6W, T6V), ovs, &(xo[WS(os, 1)]));
Chris@42 1683 ST(&(xo[WS(os, 89)]), VFNMSI(T6U, T6R), ovs, &(xo[WS(os, 1)]));
Chris@42 1684 ST(&(xo[WS(os, 39)]), VFMAI(T6U, T6R), ovs, &(xo[WS(os, 1)]));
Chris@42 1685 ST(&(xo[WS(os, 105)]), VFNMSI(T6u, T6t), ovs, &(xo[WS(os, 1)]));
Chris@42 1686 ST(&(xo[WS(os, 23)]), VFMAI(T6u, T6t), ovs, &(xo[WS(os, 1)]));
Chris@42 1687 ST(&(xo[WS(os, 87)]), VFMAI(T6s, T6p), ovs, &(xo[WS(os, 1)]));
Chris@42 1688 ST(&(xo[WS(os, 41)]), VFNMSI(T6s, T6p), ovs, &(xo[WS(os, 1)]));
Chris@42 1689 ST(&(xo[WS(os, 119)]), VFMAI(T6m, T6l), ovs, &(xo[WS(os, 1)]));
Chris@42 1690 ST(&(xo[WS(os, 9)]), VFNMSI(T6m, T6l), ovs, &(xo[WS(os, 1)]));
Chris@42 1691 ST(&(xo[WS(os, 55)]), VFMAI(T6k, T69), ovs, &(xo[WS(os, 1)]));
Chris@42 1692 ST(&(xo[WS(os, 73)]), VFNMSI(T6k, T69), ovs, &(xo[WS(os, 1)]));
Chris@42 1693 }
Chris@42 1694 }
Chris@42 1695 }
Chris@42 1696 }
Chris@42 1697 }
Chris@42 1698 }
Chris@42 1699 }
Chris@42 1700 }
Chris@42 1701 }
Chris@42 1702 }
Chris@42 1703 }
Chris@42 1704 VLEAVE();
Chris@42 1705 }
Chris@42 1706
/*
 * Descriptor handed to kdft_register() together with the n1fv_128 kernel
 * of the HAVE_FMA variant.
 *  - 128 matches the transform size given to the generator (-n 128).
 *  - XSIMD_STRING("n1fv_128") supplies the codelet's name string.
 *  - {440, 0, 642, 0} lines up with the operation counts quoted in this
 *    variant's generator comment (440 additions, 0 multiplications,
 *    642 fused multiply/add); the fourth entry is not explained here.
 *  - GENUS and the four trailing zeros are defined by kdft_desc and the
 *    included headers, not in this file -- NOTE(review): confirm their
 *    meaning against the kdft_desc declaration.
 */
Chris@42 1707 static const kdft_desc desc = { 128, XSIMD_STRING("n1fv_128"), {440, 0, 642, 0}, &GENUS, 0, 0, 0, 0 };
Chris@42 1708
/*
 * Registration entry point for this codelet: passes the planner `p`, the
 * n1fv_128 kernel function and its descriptor `desc` to kdft_register().
 * XSIMD(...) and X(...) are macros defined outside this file; presumably
 * they decorate the identifiers per SIMD flavour / precision -- confirm
 * against the project headers.
 */
Chris@42 1709 void XSIMD(codelet_n1fv_128) (planner *p) {
Chris@42 1710 X(kdft_register) (p, n1fv_128, &desc);
Chris@42 1711 }
Chris@42 1712
Chris@42 1713 #else /* HAVE_FMA */
Chris@42 1714
Chris@42 1715 /* Generated by: ../../../genfft/gen_notw_c.native -simd -compact -variables 4 -pipeline-latency 8 -n 128 -name n1fv_128 -include n1f.h */
Chris@42 1716
Chris@42 1717 /*
Chris@42 1718 * This function contains 1082 FP additions, 330 FP multiplications,
Chris@42 1719 * (or, 938 additions, 186 multiplications, 144 fused multiply/add),
Chris@42 1720 * 194 stack variables, 31 constants, and 256 memory accesses
Chris@42 1721 */
Chris@42 1722 #include "n1f.h"
Chris@42 1723
Chris@42 1724 static void n1fv_128(const R *ri, const R *ii, R *ro, R *io, stride is, stride os, INT v, INT ivs, INT ovs)
Chris@42 1725 {
Chris@42 1726 DVK(KP941544065, +0.941544065183020778412509402599502357185589796);
Chris@42 1727 DVK(KP336889853, +0.336889853392220050689253212619147570477766780);
Chris@42 1728 DVK(KP903989293, +0.903989293123443331586200297230537048710132025);
Chris@42 1729 DVK(KP427555093, +0.427555093430282094320966856888798534304578629);
Chris@42 1730 DVK(KP970031253, +0.970031253194543992603984207286100251456865962);
Chris@42 1731 DVK(KP242980179, +0.242980179903263889948274162077471118320990783);
Chris@42 1732 DVK(KP857728610, +0.857728610000272069902269984284770137042490799);
Chris@42 1733 DVK(KP514102744, +0.514102744193221726593693838968815772608049120);
Chris@42 1734 DVK(KP671558954, +0.671558954847018400625376850427421803228750632);
Chris@42 1735 DVK(KP740951125, +0.740951125354959091175616897495162729728955309);
Chris@42 1736 DVK(KP049067674, +0.049067674327418014254954976942682658314745363);
Chris@42 1737 DVK(KP998795456, +0.998795456205172392714771604759100694443203615);
Chris@42 1738 DVK(KP595699304, +0.595699304492433343467036528829969889511926338);
Chris@42 1739 DVK(KP803207531, +0.803207531480644909806676512963141923879569427);
Chris@42 1740 DVK(KP146730474, +0.146730474455361751658850129646717819706215317);
Chris@42 1741 DVK(KP989176509, +0.989176509964780973451673738016243063983689533);
Chris@42 1742 DVK(KP956940335, +0.956940335732208864935797886980269969482849206);
Chris@42 1743 DVK(KP290284677, +0.290284677254462367636192375817395274691476278);
Chris@42 1744 DVK(KP881921264, +0.881921264348355029712756863660388349508442621);
Chris@42 1745 DVK(KP471396736, +0.471396736825997648556387625905254377657460319);
Chris@42 1746 DVK(KP634393284, +0.634393284163645498215171613225493370675687095);
Chris@42 1747 DVK(KP773010453, +0.773010453362736960810906609758469800971041293);
Chris@42 1748 DVK(KP098017140, +0.098017140329560601994195563888641845861136673);
Chris@42 1749 DVK(KP995184726, +0.995184726672196886244836953109479921575474869);
Chris@42 1750 DVK(KP555570233, +0.555570233019602224742830813948532874374937191);
Chris@42 1751 DVK(KP831469612, +0.831469612302545237078788377617905756738560812);
Chris@42 1752 DVK(KP195090322, +0.195090322016128267848284868477022240927691618);
Chris@42 1753 DVK(KP980785280, +0.980785280403230449126182236134239036973933731);
Chris@42 1754 DVK(KP382683432, +0.382683432365089771728459984030398866761344562);
Chris@42 1755 DVK(KP923879532, +0.923879532511286756128183189396788286822416626);
Chris@42 1756 DVK(KP707106781, +0.707106781186547524400844362104849039284835938);
Chris@42 1757 {
Chris@42 1758 INT i;
Chris@42 1759 const R *xi;
Chris@42 1760 R *xo;
Chris@42 1761 xi = ri;
Chris@42 1762 xo = ro;
Chris@42 1763 for (i = v; i > 0; i = i - VL, xi = xi + (VL * ivs), xo = xo + (VL * ovs), MAKE_VOLATILE_STRIDE(256, is), MAKE_VOLATILE_STRIDE(256, os)) {
Chris@42 1764 V Tr, T5J, Ted, Tgf, Tfq, TgH, T4U, T6b, T6Z, T8T, Tad, TcZ, Tcc, Td0, T84;
Chris@42 1765 V T9l, Tb6, Tbt, T2G, T5X, TeV, Tgr, T3p, T5V, T7B, T95, TeK, Tgt, T7q, T97;
Chris@42 1766 V Td8, TdK, TbD, Tc0, T3V, T61, Tfg, TgB, T4E, T65, T7U, T9f, Tf5, Tgx, T7J;
Chris@42 1767 V T9b, Tdf, TdN, Td2, Td3, TI, T4V, Tft, Tgg, TZ, T4W, T75, T86, Tek, TgG;
Chris@42 1768 V T72, T85, Tas, Tcd, Tdp, Tdq, TdG, Teq, Tgm, Tet, Tgl, T1s, T5P, T1B, T5Q;
Chris@42 1769 V T7d, T8Z, TaI, Tcf, T7a, T90, Tdm, Tdn, TdH, Tez, Tgi, TeC, Tgj, T23, T5N;
Chris@42 1770 V T2c, T5M, T7k, T8X, TaX, Tcg, T7h, T8W, Tbl, Tbu, Tdb, TdL, TeY, Tgu, TeR;
Chris@42 1771 V Tgq, T7x, T98, T7E, T94, T3f, T5Y, T3s, T5U, TbS, Tc1, Tdi, TdO, Tfj, Tgy;
Chris@42 1772 V Tfc, TgA, T7Q, T9e, T7X, T9c, T4u, T64, T4H, T62;
Chris@42 1773 {
Chris@42 1774 V T3, Ta7, T4P, Ta8, Ta, Tab, T4M, Taa, Tc9, Tca, Ti, Tea, T4S, Tc6, Tc7;
Chris@42 1775 V Tp, Teb, T4R;
Chris@42 1776 {
Chris@42 1777 V T1, T2, T4N, T4O;
Chris@42 1778 T1 = LD(&(xi[0]), ivs, &(xi[0]));
Chris@42 1779 T2 = LD(&(xi[WS(is, 64)]), ivs, &(xi[0]));
Chris@42 1780 T3 = VSUB(T1, T2);
Chris@42 1781 Ta7 = VADD(T1, T2);
Chris@42 1782 T4N = LD(&(xi[WS(is, 32)]), ivs, &(xi[0]));
Chris@42 1783 T4O = LD(&(xi[WS(is, 96)]), ivs, &(xi[0]));
Chris@42 1784 T4P = VSUB(T4N, T4O);
Chris@42 1785 Ta8 = VADD(T4N, T4O);
Chris@42 1786 }
Chris@42 1787 {
Chris@42 1788 V T4, T5, T6, T7, T8, T9;
Chris@42 1789 T4 = LD(&(xi[WS(is, 16)]), ivs, &(xi[0]));
Chris@42 1790 T5 = LD(&(xi[WS(is, 80)]), ivs, &(xi[0]));
Chris@42 1791 T6 = VSUB(T4, T5);
Chris@42 1792 T7 = LD(&(xi[WS(is, 112)]), ivs, &(xi[0]));
Chris@42 1793 T8 = LD(&(xi[WS(is, 48)]), ivs, &(xi[0]));
Chris@42 1794 T9 = VSUB(T7, T8);
Chris@42 1795 Ta = VMUL(LDK(KP707106781), VADD(T6, T9));
Chris@42 1796 Tab = VADD(T7, T8);
Chris@42 1797 T4M = VMUL(LDK(KP707106781), VSUB(T9, T6));
Chris@42 1798 Taa = VADD(T4, T5);
Chris@42 1799 }
Chris@42 1800 {
Chris@42 1801 V Te, Th, Tl, To;
Chris@42 1802 {
Chris@42 1803 V Tc, Td, Tf, Tg;
Chris@42 1804 Tc = LD(&(xi[WS(is, 8)]), ivs, &(xi[0]));
Chris@42 1805 Td = LD(&(xi[WS(is, 72)]), ivs, &(xi[0]));
Chris@42 1806 Te = VSUB(Tc, Td);
Chris@42 1807 Tc9 = VADD(Tc, Td);
Chris@42 1808 Tf = LD(&(xi[WS(is, 40)]), ivs, &(xi[0]));
Chris@42 1809 Tg = LD(&(xi[WS(is, 104)]), ivs, &(xi[0]));
Chris@42 1810 Th = VSUB(Tf, Tg);
Chris@42 1811 Tca = VADD(Tf, Tg);
Chris@42 1812 }
Chris@42 1813 Ti = VFNMS(LDK(KP382683432), Th, VMUL(LDK(KP923879532), Te));
Chris@42 1814 Tea = VSUB(Tc9, Tca);
Chris@42 1815 T4S = VFMA(LDK(KP382683432), Te, VMUL(LDK(KP923879532), Th));
Chris@42 1816 {
Chris@42 1817 V Tj, Tk, Tm, Tn;
Chris@42 1818 Tj = LD(&(xi[WS(is, 120)]), ivs, &(xi[0]));
Chris@42 1819 Tk = LD(&(xi[WS(is, 56)]), ivs, &(xi[0]));
Chris@42 1820 Tl = VSUB(Tj, Tk);
Chris@42 1821 Tc6 = VADD(Tj, Tk);
Chris@42 1822 Tm = LD(&(xi[WS(is, 24)]), ivs, &(xi[0]));
Chris@42 1823 Tn = LD(&(xi[WS(is, 88)]), ivs, &(xi[0]));
Chris@42 1824 To = VSUB(Tm, Tn);
Chris@42 1825 Tc7 = VADD(Tm, Tn);
Chris@42 1826 }
Chris@42 1827 Tp = VFMA(LDK(KP923879532), Tl, VMUL(LDK(KP382683432), To));
Chris@42 1828 Teb = VSUB(Tc6, Tc7);
Chris@42 1829 T4R = VFNMS(LDK(KP923879532), To, VMUL(LDK(KP382683432), Tl));
Chris@42 1830 }
Chris@42 1831 {
Chris@42 1832 V Tb, Tq, Te9, Tec;
Chris@42 1833 Tb = VADD(T3, Ta);
Chris@42 1834 Tq = VADD(Ti, Tp);
Chris@42 1835 Tr = VADD(Tb, Tq);
Chris@42 1836 T5J = VSUB(Tb, Tq);
Chris@42 1837 Te9 = VSUB(Ta7, Ta8);
Chris@42 1838 Tec = VMUL(LDK(KP707106781), VADD(Tea, Teb));
Chris@42 1839 Ted = VADD(Te9, Tec);
Chris@42 1840 Tgf = VSUB(Te9, Tec);
Chris@42 1841 }
Chris@42 1842 {
Chris@42 1843 V Tfo, Tfp, T4Q, T4T;
Chris@42 1844 Tfo = VSUB(Tab, Taa);
Chris@42 1845 Tfp = VMUL(LDK(KP707106781), VSUB(Teb, Tea));
Chris@42 1846 Tfq = VADD(Tfo, Tfp);
Chris@42 1847 TgH = VSUB(Tfp, Tfo);
Chris@42 1848 T4Q = VSUB(T4M, T4P);
Chris@42 1849 T4T = VSUB(T4R, T4S);
Chris@42 1850 T4U = VADD(T4Q, T4T);
Chris@42 1851 T6b = VSUB(T4T, T4Q);
Chris@42 1852 }
Chris@42 1853 {
Chris@42 1854 V T6X, T6Y, Ta9, Tac;
Chris@42 1855 T6X = VSUB(T3, Ta);
Chris@42 1856 T6Y = VADD(T4S, T4R);
Chris@42 1857 T6Z = VADD(T6X, T6Y);
Chris@42 1858 T8T = VSUB(T6X, T6Y);
Chris@42 1859 Ta9 = VADD(Ta7, Ta8);
Chris@42 1860 Tac = VADD(Taa, Tab);
Chris@42 1861 Tad = VSUB(Ta9, Tac);
Chris@42 1862 TcZ = VADD(Ta9, Tac);
Chris@42 1863 }
Chris@42 1864 {
Chris@42 1865 V Tc8, Tcb, T82, T83;
Chris@42 1866 Tc8 = VADD(Tc6, Tc7);
Chris@42 1867 Tcb = VADD(Tc9, Tca);
Chris@42 1868 Tcc = VSUB(Tc8, Tcb);
Chris@42 1869 Td0 = VADD(Tcb, Tc8);
Chris@42 1870 T82 = VADD(T4P, T4M);
Chris@42 1871 T83 = VSUB(Tp, Ti);
Chris@42 1872 T84 = VADD(T82, T83);
Chris@42 1873 T9l = VSUB(T83, T82);
Chris@42 1874 }
Chris@42 1875 }
Chris@42 1876 {
Chris@42 1877 V Tb0, Tb1, T2i, Tb2, T3k, Tb3, Tb4, T2p, Tb5, T3h, T2x, TeH, T3n, Tbs, T2E;
Chris@42 1878 V TeI, T3m, Tbp, T2l, T2o, TeG, TeJ;
Chris@42 1879 {
Chris@42 1880 V T2g, T2h, T3i, T3j;
Chris@42 1881 T2g = LD(&(xi[WS(is, 1)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1882 T2h = LD(&(xi[WS(is, 65)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1883 Tb0 = VADD(T2g, T2h);
Chris@42 1884 T3i = LD(&(xi[WS(is, 33)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1885 T3j = LD(&(xi[WS(is, 97)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1886 Tb1 = VADD(T3i, T3j);
Chris@42 1887 T2i = VSUB(T2g, T2h);
Chris@42 1888 Tb2 = VADD(Tb0, Tb1);
Chris@42 1889 T3k = VSUB(T3i, T3j);
Chris@42 1890 }
Chris@42 1891 {
Chris@42 1892 V T2j, T2k, T2m, T2n;
Chris@42 1893 T2j = LD(&(xi[WS(is, 17)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1894 T2k = LD(&(xi[WS(is, 81)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1895 T2l = VSUB(T2j, T2k);
Chris@42 1896 Tb3 = VADD(T2j, T2k);
Chris@42 1897 T2m = LD(&(xi[WS(is, 113)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1898 T2n = LD(&(xi[WS(is, 49)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1899 T2o = VSUB(T2m, T2n);
Chris@42 1900 Tb4 = VADD(T2m, T2n);
Chris@42 1901 }
Chris@42 1902 T2p = VMUL(LDK(KP707106781), VADD(T2l, T2o));
Chris@42 1903 Tb5 = VADD(Tb3, Tb4);
Chris@42 1904 T3h = VMUL(LDK(KP707106781), VSUB(T2o, T2l));
Chris@42 1905 {
Chris@42 1906 V T2t, Tbq, T2w, Tbr;
Chris@42 1907 {
Chris@42 1908 V T2r, T2s, T2u, T2v;
Chris@42 1909 T2r = LD(&(xi[WS(is, 9)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1910 T2s = LD(&(xi[WS(is, 73)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1911 T2t = VSUB(T2r, T2s);
Chris@42 1912 Tbq = VADD(T2r, T2s);
Chris@42 1913 T2u = LD(&(xi[WS(is, 41)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1914 T2v = LD(&(xi[WS(is, 105)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1915 T2w = VSUB(T2u, T2v);
Chris@42 1916 Tbr = VADD(T2u, T2v);
Chris@42 1917 }
Chris@42 1918 T2x = VFNMS(LDK(KP382683432), T2w, VMUL(LDK(KP923879532), T2t));
Chris@42 1919 TeH = VSUB(Tbq, Tbr);
Chris@42 1920 T3n = VFMA(LDK(KP382683432), T2t, VMUL(LDK(KP923879532), T2w));
Chris@42 1921 Tbs = VADD(Tbq, Tbr);
Chris@42 1922 }
Chris@42 1923 {
Chris@42 1924 V T2A, Tbn, T2D, Tbo;
Chris@42 1925 {
Chris@42 1926 V T2y, T2z, T2B, T2C;
Chris@42 1927 T2y = LD(&(xi[WS(is, 121)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1928 T2z = LD(&(xi[WS(is, 57)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1929 T2A = VSUB(T2y, T2z);
Chris@42 1930 Tbn = VADD(T2y, T2z);
Chris@42 1931 T2B = LD(&(xi[WS(is, 25)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1932 T2C = LD(&(xi[WS(is, 89)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1933 T2D = VSUB(T2B, T2C);
Chris@42 1934 Tbo = VADD(T2B, T2C);
Chris@42 1935 }
Chris@42 1936 T2E = VFMA(LDK(KP923879532), T2A, VMUL(LDK(KP382683432), T2D));
Chris@42 1937 TeI = VSUB(Tbn, Tbo);
Chris@42 1938 T3m = VFNMS(LDK(KP923879532), T2D, VMUL(LDK(KP382683432), T2A));
Chris@42 1939 Tbp = VADD(Tbn, Tbo);
Chris@42 1940 }
Chris@42 1941 Tb6 = VSUB(Tb2, Tb5);
Chris@42 1942 Tbt = VSUB(Tbp, Tbs);
Chris@42 1943 {
Chris@42 1944 V T2q, T2F, TeT, TeU;
Chris@42 1945 T2q = VADD(T2i, T2p);
Chris@42 1946 T2F = VADD(T2x, T2E);
Chris@42 1947 T2G = VADD(T2q, T2F);
Chris@42 1948 T5X = VSUB(T2q, T2F);
Chris@42 1949 TeT = VSUB(Tb4, Tb3);
Chris@42 1950 TeU = VMUL(LDK(KP707106781), VSUB(TeI, TeH));
Chris@42 1951 TeV = VADD(TeT, TeU);
Chris@42 1952 Tgr = VSUB(TeU, TeT);
Chris@42 1953 }
Chris@42 1954 {
Chris@42 1955 V T3l, T3o, T7z, T7A;
Chris@42 1956 T3l = VSUB(T3h, T3k);
Chris@42 1957 T3o = VSUB(T3m, T3n);
Chris@42 1958 T3p = VADD(T3l, T3o);
Chris@42 1959 T5V = VSUB(T3o, T3l);
Chris@42 1960 T7z = VADD(T3k, T3h);
Chris@42 1961 T7A = VSUB(T2E, T2x);
Chris@42 1962 T7B = VADD(T7z, T7A);
Chris@42 1963 T95 = VSUB(T7A, T7z);
Chris@42 1964 }
Chris@42 1965 TeG = VSUB(Tb0, Tb1);
Chris@42 1966 TeJ = VMUL(LDK(KP707106781), VADD(TeH, TeI));
Chris@42 1967 TeK = VADD(TeG, TeJ);
Chris@42 1968 Tgt = VSUB(TeG, TeJ);
Chris@42 1969 {
Chris@42 1970 V T7o, T7p, Td6, Td7;
Chris@42 1971 T7o = VSUB(T2i, T2p);
Chris@42 1972 T7p = VADD(T3n, T3m);
Chris@42 1973 T7q = VADD(T7o, T7p);
Chris@42 1974 T97 = VSUB(T7o, T7p);
Chris@42 1975 Td6 = VADD(Tb2, Tb5);
Chris@42 1976 Td7 = VADD(Tbs, Tbp);
Chris@42 1977 Td8 = VADD(Td6, Td7);
Chris@42 1978 TdK = VSUB(Td6, Td7);
Chris@42 1979 }
Chris@42 1980 }
Chris@42 1981 {
Chris@42 1982 V Tbx, Tby, T3x, Tbz, T4z, TbA, TbB, T3E, TbC, T4w, T3M, Tf2, T4C, TbZ, T3T;
Chris@42 1983 V Tf3, T4B, TbW, T3A, T3D, Tf1, Tf4;
Chris@42 1984 {
Chris@42 1985 V T3v, T3w, T4x, T4y;
Chris@42 1986 T3v = LD(&(xi[WS(is, 127)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1987 T3w = LD(&(xi[WS(is, 63)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1988 Tbx = VADD(T3v, T3w);
Chris@42 1989 T4x = LD(&(xi[WS(is, 31)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1990 T4y = LD(&(xi[WS(is, 95)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1991 Tby = VADD(T4x, T4y);
Chris@42 1992 T3x = VSUB(T3v, T3w);
Chris@42 1993 Tbz = VADD(Tbx, Tby);
Chris@42 1994 T4z = VSUB(T4x, T4y);
Chris@42 1995 }
Chris@42 1996 {
Chris@42 1997 V T3y, T3z, T3B, T3C;
Chris@42 1998 T3y = LD(&(xi[WS(is, 15)]), ivs, &(xi[WS(is, 1)]));
Chris@42 1999 T3z = LD(&(xi[WS(is, 79)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2000 T3A = VSUB(T3y, T3z);
Chris@42 2001 TbA = VADD(T3y, T3z);
Chris@42 2002 T3B = LD(&(xi[WS(is, 111)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2003 T3C = LD(&(xi[WS(is, 47)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2004 T3D = VSUB(T3B, T3C);
Chris@42 2005 TbB = VADD(T3B, T3C);
Chris@42 2006 }
Chris@42 2007 T3E = VMUL(LDK(KP707106781), VADD(T3A, T3D));
Chris@42 2008 TbC = VADD(TbA, TbB);
Chris@42 2009 T4w = VMUL(LDK(KP707106781), VSUB(T3D, T3A));
Chris@42 2010 {
Chris@42 2011 V T3I, TbX, T3L, TbY;
Chris@42 2012 {
Chris@42 2013 V T3G, T3H, T3J, T3K;
Chris@42 2014 T3G = LD(&(xi[WS(is, 7)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2015 T3H = LD(&(xi[WS(is, 71)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2016 T3I = VSUB(T3G, T3H);
Chris@42 2017 TbX = VADD(T3G, T3H);
Chris@42 2018 T3J = LD(&(xi[WS(is, 39)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2019 T3K = LD(&(xi[WS(is, 103)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2020 T3L = VSUB(T3J, T3K);
Chris@42 2021 TbY = VADD(T3J, T3K);
Chris@42 2022 }
Chris@42 2023 T3M = VFNMS(LDK(KP382683432), T3L, VMUL(LDK(KP923879532), T3I));
Chris@42 2024 Tf2 = VSUB(TbX, TbY);
Chris@42 2025 T4C = VFMA(LDK(KP382683432), T3I, VMUL(LDK(KP923879532), T3L));
Chris@42 2026 TbZ = VADD(TbX, TbY);
Chris@42 2027 }
Chris@42 2028 {
Chris@42 2029 V T3P, TbU, T3S, TbV;
Chris@42 2030 {
Chris@42 2031 V T3N, T3O, T3Q, T3R;
Chris@42 2032 T3N = LD(&(xi[WS(is, 119)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2033 T3O = LD(&(xi[WS(is, 55)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2034 T3P = VSUB(T3N, T3O);
Chris@42 2035 TbU = VADD(T3N, T3O);
Chris@42 2036 T3Q = LD(&(xi[WS(is, 23)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2037 T3R = LD(&(xi[WS(is, 87)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2038 T3S = VSUB(T3Q, T3R);
Chris@42 2039 TbV = VADD(T3Q, T3R);
Chris@42 2040 }
Chris@42 2041 T3T = VFMA(LDK(KP923879532), T3P, VMUL(LDK(KP382683432), T3S));
Chris@42 2042 Tf3 = VSUB(TbU, TbV);
Chris@42 2043 T4B = VFNMS(LDK(KP923879532), T3S, VMUL(LDK(KP382683432), T3P));
Chris@42 2044 TbW = VADD(TbU, TbV);
Chris@42 2045 }
Chris@42 2046 TbD = VSUB(Tbz, TbC);
Chris@42 2047 Tc0 = VSUB(TbW, TbZ);
Chris@42 2048 {
Chris@42 2049 V T3F, T3U, Tfe, Tff;
Chris@42 2050 T3F = VADD(T3x, T3E);
Chris@42 2051 T3U = VADD(T3M, T3T);
Chris@42 2052 T3V = VADD(T3F, T3U);
Chris@42 2053 T61 = VSUB(T3F, T3U);
Chris@42 2054 Tfe = VSUB(TbB, TbA);
Chris@42 2055 Tff = VMUL(LDK(KP707106781), VSUB(Tf3, Tf2));
Chris@42 2056 Tfg = VADD(Tfe, Tff);
Chris@42 2057 TgB = VSUB(Tff, Tfe);
Chris@42 2058 }
Chris@42 2059 {
Chris@42 2060 V T4A, T4D, T7S, T7T;
Chris@42 2061 T4A = VSUB(T4w, T4z);
Chris@42 2062 T4D = VSUB(T4B, T4C);
Chris@42 2063 T4E = VADD(T4A, T4D);
Chris@42 2064 T65 = VSUB(T4D, T4A);
Chris@42 2065 T7S = VADD(T4z, T4w);
Chris@42 2066 T7T = VSUB(T3T, T3M);
Chris@42 2067 T7U = VADD(T7S, T7T);
Chris@42 2068 T9f = VSUB(T7T, T7S);
Chris@42 2069 }
Chris@42 2070 Tf1 = VSUB(Tbx, Tby);
Chris@42 2071 Tf4 = VMUL(LDK(KP707106781), VADD(Tf2, Tf3));
Chris@42 2072 Tf5 = VADD(Tf1, Tf4);
Chris@42 2073 Tgx = VSUB(Tf1, Tf4);
Chris@42 2074 {
Chris@42 2075 V T7H, T7I, Tdd, Tde;
Chris@42 2076 T7H = VSUB(T3x, T3E);
Chris@42 2077 T7I = VADD(T4C, T4B);
Chris@42 2078 T7J = VADD(T7H, T7I);
Chris@42 2079 T9b = VSUB(T7H, T7I);
Chris@42 2080 Tdd = VADD(Tbz, TbC);
Chris@42 2081 Tde = VADD(TbZ, TbW);
Chris@42 2082 Tdf = VADD(Tdd, Tde);
Chris@42 2083 TdN = VSUB(Tdd, Tde);
Chris@42 2084 }
Chris@42 2085 }
Chris@42 2086 {
Chris@42 2087 V Tu, Tee, TG, Tag, TL, Teh, TX, Tan, TB, Tef, TD, Taj, TS, Tei, TU;
Chris@42 2088 V Taq, Teg, Tej;
Chris@42 2089 {
Chris@42 2090 V Ts, Tt, Tae, TE, TF, Taf;
Chris@42 2091 Ts = LD(&(xi[WS(is, 4)]), ivs, &(xi[0]));
Chris@42 2092 Tt = LD(&(xi[WS(is, 68)]), ivs, &(xi[0]));
Chris@42 2093 Tae = VADD(Ts, Tt);
Chris@42 2094 TE = LD(&(xi[WS(is, 36)]), ivs, &(xi[0]));
Chris@42 2095 TF = LD(&(xi[WS(is, 100)]), ivs, &(xi[0]));
Chris@42 2096 Taf = VADD(TE, TF);
Chris@42 2097 Tu = VSUB(Ts, Tt);
Chris@42 2098 Tee = VSUB(Tae, Taf);
Chris@42 2099 TG = VSUB(TE, TF);
Chris@42 2100 Tag = VADD(Tae, Taf);
Chris@42 2101 }
Chris@42 2102 {
Chris@42 2103 V TJ, TK, Tal, TV, TW, Tam;
Chris@42 2104 TJ = LD(&(xi[WS(is, 124)]), ivs, &(xi[0]));
Chris@42 2105 TK = LD(&(xi[WS(is, 60)]), ivs, &(xi[0]));
Chris@42 2106 Tal = VADD(TJ, TK);
Chris@42 2107 TV = LD(&(xi[WS(is, 28)]), ivs, &(xi[0]));
Chris@42 2108 TW = LD(&(xi[WS(is, 92)]), ivs, &(xi[0]));
Chris@42 2109 Tam = VADD(TV, TW);
Chris@42 2110 TL = VSUB(TJ, TK);
Chris@42 2111 Teh = VSUB(Tal, Tam);
Chris@42 2112 TX = VSUB(TV, TW);
Chris@42 2113 Tan = VADD(Tal, Tam);
Chris@42 2114 }
Chris@42 2115 {
Chris@42 2116 V Tx, Tah, TA, Tai;
Chris@42 2117 {
Chris@42 2118 V Tv, Tw, Ty, Tz;
Chris@42 2119 Tv = LD(&(xi[WS(is, 20)]), ivs, &(xi[0]));
Chris@42 2120 Tw = LD(&(xi[WS(is, 84)]), ivs, &(xi[0]));
Chris@42 2121 Tx = VSUB(Tv, Tw);
Chris@42 2122 Tah = VADD(Tv, Tw);
Chris@42 2123 Ty = LD(&(xi[WS(is, 116)]), ivs, &(xi[0]));
Chris@42 2124 Tz = LD(&(xi[WS(is, 52)]), ivs, &(xi[0]));
Chris@42 2125 TA = VSUB(Ty, Tz);
Chris@42 2126 Tai = VADD(Ty, Tz);
Chris@42 2127 }
Chris@42 2128 TB = VMUL(LDK(KP707106781), VADD(Tx, TA));
Chris@42 2129 Tef = VSUB(Tai, Tah);
Chris@42 2130 TD = VMUL(LDK(KP707106781), VSUB(TA, Tx));
Chris@42 2131 Taj = VADD(Tah, Tai);
Chris@42 2132 }
Chris@42 2133 {
Chris@42 2134 V TO, Tao, TR, Tap;
Chris@42 2135 {
Chris@42 2136 V TM, TN, TP, TQ;
Chris@42 2137 TM = LD(&(xi[WS(is, 12)]), ivs, &(xi[0]));
Chris@42 2138 TN = LD(&(xi[WS(is, 76)]), ivs, &(xi[0]));
Chris@42 2139 TO = VSUB(TM, TN);
Chris@42 2140 Tao = VADD(TM, TN);
Chris@42 2141 TP = LD(&(xi[WS(is, 108)]), ivs, &(xi[0]));
Chris@42 2142 TQ = LD(&(xi[WS(is, 44)]), ivs, &(xi[0]));
Chris@42 2143 TR = VSUB(TP, TQ);
Chris@42 2144 Tap = VADD(TP, TQ);
Chris@42 2145 }
Chris@42 2146 TS = VMUL(LDK(KP707106781), VADD(TO, TR));
Chris@42 2147 Tei = VSUB(Tap, Tao);
Chris@42 2148 TU = VMUL(LDK(KP707106781), VSUB(TR, TO));
Chris@42 2149 Taq = VADD(Tao, Tap);
Chris@42 2150 }
Chris@42 2151 Td2 = VADD(Tag, Taj);
Chris@42 2152 Td3 = VADD(Tan, Taq);
Chris@42 2153 {
Chris@42 2154 V TC, TH, Tfr, Tfs;
Chris@42 2155 TC = VADD(Tu, TB);
Chris@42 2156 TH = VSUB(TD, TG);
Chris@42 2157 TI = VFMA(LDK(KP980785280), TC, VMUL(LDK(KP195090322), TH));
Chris@42 2158 T4V = VFNMS(LDK(KP195090322), TC, VMUL(LDK(KP980785280), TH));
Chris@42 2159 Tfr = VFNMS(LDK(KP382683432), Tee, VMUL(LDK(KP923879532), Tef));
Chris@42 2160 Tfs = VFMA(LDK(KP382683432), Teh, VMUL(LDK(KP923879532), Tei));
Chris@42 2161 Tft = VADD(Tfr, Tfs);
Chris@42 2162 Tgg = VSUB(Tfs, Tfr);
Chris@42 2163 }
Chris@42 2164 {
Chris@42 2165 V TT, TY, T73, T74;
Chris@42 2166 TT = VADD(TL, TS);
Chris@42 2167 TY = VSUB(TU, TX);
Chris@42 2168 TZ = VFNMS(LDK(KP195090322), TY, VMUL(LDK(KP980785280), TT));
Chris@42 2169 T4W = VFMA(LDK(KP195090322), TT, VMUL(LDK(KP980785280), TY));
Chris@42 2170 T73 = VSUB(TL, TS);
Chris@42 2171 T74 = VADD(TX, TU);
Chris@42 2172 T75 = VFNMS(LDK(KP555570233), T74, VMUL(LDK(KP831469612), T73));
Chris@42 2173 T86 = VFMA(LDK(KP555570233), T73, VMUL(LDK(KP831469612), T74));
Chris@42 2174 }
Chris@42 2175 Teg = VFMA(LDK(KP923879532), Tee, VMUL(LDK(KP382683432), Tef));
Chris@42 2176 Tej = VFNMS(LDK(KP382683432), Tei, VMUL(LDK(KP923879532), Teh));
Chris@42 2177 Tek = VADD(Teg, Tej);
Chris@42 2178 TgG = VSUB(Tej, Teg);
Chris@42 2179 {
Chris@42 2180 V T70, T71, Tak, Tar;
Chris@42 2181 T70 = VSUB(Tu, TB);
Chris@42 2182 T71 = VADD(TG, TD);
Chris@42 2183 T72 = VFMA(LDK(KP831469612), T70, VMUL(LDK(KP555570233), T71));
Chris@42 2184 T85 = VFNMS(LDK(KP555570233), T70, VMUL(LDK(KP831469612), T71));
Chris@42 2185 Tak = VSUB(Tag, Taj);
Chris@42 2186 Tar = VSUB(Tan, Taq);
Chris@42 2187 Tas = VMUL(LDK(KP707106781), VADD(Tak, Tar));
Chris@42 2188 Tcd = VMUL(LDK(KP707106781), VSUB(Tar, Tak));
Chris@42 2189 }
Chris@42 2190 }
Chris@42 2191 {
Chris@42 2192 V Tav, Tau, T1b, Taw, T1v, Tay, Tax, T18, Taz, T1w, T1j, Teo, T1z, TaD, T1q;
Chris@42 2193 V Ten, T1y, TaG, T14, T17, Tem, Tep;
Chris@42 2194 {
Chris@42 2195 V T19, T1a, T1t, T1u;
Chris@42 2196 T19 = LD(&(xi[WS(is, 34)]), ivs, &(xi[0]));
Chris@42 2197 T1a = LD(&(xi[WS(is, 98)]), ivs, &(xi[0]));
Chris@42 2198 Tav = VADD(T19, T1a);
Chris@42 2199 T1t = LD(&(xi[WS(is, 2)]), ivs, &(xi[0]));
Chris@42 2200 T1u = LD(&(xi[WS(is, 66)]), ivs, &(xi[0]));
Chris@42 2201 Tau = VADD(T1t, T1u);
Chris@42 2202 T1b = VSUB(T19, T1a);
Chris@42 2203 Taw = VADD(Tau, Tav);
Chris@42 2204 T1v = VSUB(T1t, T1u);
Chris@42 2205 }
Chris@42 2206 {
Chris@42 2207 V T12, T13, T15, T16;
Chris@42 2208 T12 = LD(&(xi[WS(is, 114)]), ivs, &(xi[0]));
Chris@42 2209 T13 = LD(&(xi[WS(is, 50)]), ivs, &(xi[0]));
Chris@42 2210 T14 = VSUB(T12, T13);
Chris@42 2211 Tay = VADD(T12, T13);
Chris@42 2212 T15 = LD(&(xi[WS(is, 18)]), ivs, &(xi[0]));
Chris@42 2213 T16 = LD(&(xi[WS(is, 82)]), ivs, &(xi[0]));
Chris@42 2214 T17 = VSUB(T15, T16);
Chris@42 2215 Tax = VADD(T15, T16);
Chris@42 2216 }
Chris@42 2217 T18 = VMUL(LDK(KP707106781), VSUB(T14, T17));
Chris@42 2218 Taz = VADD(Tax, Tay);
Chris@42 2219 T1w = VMUL(LDK(KP707106781), VADD(T17, T14));
Chris@42 2220 {
Chris@42 2221 V T1f, TaB, T1i, TaC;
Chris@42 2222 {
Chris@42 2223 V T1d, T1e, T1g, T1h;
Chris@42 2224 T1d = LD(&(xi[WS(is, 122)]), ivs, &(xi[0]));
Chris@42 2225 T1e = LD(&(xi[WS(is, 58)]), ivs, &(xi[0]));
Chris@42 2226 T1f = VSUB(T1d, T1e);
Chris@42 2227 TaB = VADD(T1d, T1e);
Chris@42 2228 T1g = LD(&(xi[WS(is, 26)]), ivs, &(xi[0]));
Chris@42 2229 T1h = LD(&(xi[WS(is, 90)]), ivs, &(xi[0]));
Chris@42 2230 T1i = VSUB(T1g, T1h);
Chris@42 2231 TaC = VADD(T1g, T1h);
Chris@42 2232 }
Chris@42 2233 T1j = VFNMS(LDK(KP923879532), T1i, VMUL(LDK(KP382683432), T1f));
Chris@42 2234 Teo = VSUB(TaB, TaC);
Chris@42 2235 T1z = VFMA(LDK(KP923879532), T1f, VMUL(LDK(KP382683432), T1i));
Chris@42 2236 TaD = VADD(TaB, TaC);
Chris@42 2237 }
Chris@42 2238 {
Chris@42 2239 V T1m, TaE, T1p, TaF;
Chris@42 2240 {
Chris@42 2241 V T1k, T1l, T1n, T1o;
Chris@42 2242 T1k = LD(&(xi[WS(is, 10)]), ivs, &(xi[0]));
Chris@42 2243 T1l = LD(&(xi[WS(is, 74)]), ivs, &(xi[0]));
Chris@42 2244 T1m = VSUB(T1k, T1l);
Chris@42 2245 TaE = VADD(T1k, T1l);
Chris@42 2246 T1n = LD(&(xi[WS(is, 42)]), ivs, &(xi[0]));
Chris@42 2247 T1o = LD(&(xi[WS(is, 106)]), ivs, &(xi[0]));
Chris@42 2248 T1p = VSUB(T1n, T1o);
Chris@42 2249 TaF = VADD(T1n, T1o);
Chris@42 2250 }
Chris@42 2251 T1q = VFMA(LDK(KP382683432), T1m, VMUL(LDK(KP923879532), T1p));
Chris@42 2252 Ten = VSUB(TaE, TaF);
Chris@42 2253 T1y = VFNMS(LDK(KP382683432), T1p, VMUL(LDK(KP923879532), T1m));
Chris@42 2254 TaG = VADD(TaE, TaF);
Chris@42 2255 }
Chris@42 2256 Tdp = VADD(Taw, Taz);
Chris@42 2257 Tdq = VADD(TaG, TaD);
Chris@42 2258 TdG = VSUB(Tdp, Tdq);
Chris@42 2259 Tem = VSUB(Tau, Tav);
Chris@42 2260 Tep = VMUL(LDK(KP707106781), VADD(Ten, Teo));
Chris@42 2261 Teq = VADD(Tem, Tep);
Chris@42 2262 Tgm = VSUB(Tem, Tep);
Chris@42 2263 {
Chris@42 2264 V Ter, Tes, T1c, T1r;
Chris@42 2265 Ter = VSUB(Tay, Tax);
Chris@42 2266 Tes = VMUL(LDK(KP707106781), VSUB(Teo, Ten));
Chris@42 2267 Tet = VADD(Ter, Tes);
Chris@42 2268 Tgl = VSUB(Tes, Ter);
Chris@42 2269 T1c = VSUB(T18, T1b);
Chris@42 2270 T1r = VSUB(T1j, T1q);
Chris@42 2271 T1s = VADD(T1c, T1r);
Chris@42 2272 T5P = VSUB(T1r, T1c);
Chris@42 2273 }
Chris@42 2274 {
Chris@42 2275 V T1x, T1A, T7b, T7c;
Chris@42 2276 T1x = VADD(T1v, T1w);
Chris@42 2277 T1A = VADD(T1y, T1z);
Chris@42 2278 T1B = VADD(T1x, T1A);
Chris@42 2279 T5Q = VSUB(T1x, T1A);
Chris@42 2280 T7b = VADD(T1b, T18);
Chris@42 2281 T7c = VSUB(T1z, T1y);
Chris@42 2282 T7d = VADD(T7b, T7c);
Chris@42 2283 T8Z = VSUB(T7c, T7b);
Chris@42 2284 }
Chris@42 2285 {
Chris@42 2286 V TaA, TaH, T78, T79;
Chris@42 2287 TaA = VSUB(Taw, Taz);
Chris@42 2288 TaH = VSUB(TaD, TaG);
Chris@42 2289 TaI = VFMA(LDK(KP923879532), TaA, VMUL(LDK(KP382683432), TaH));
Chris@42 2290 Tcf = VFNMS(LDK(KP382683432), TaA, VMUL(LDK(KP923879532), TaH));
Chris@42 2291 T78 = VSUB(T1v, T1w);
Chris@42 2292 T79 = VADD(T1q, T1j);
Chris@42 2293 T7a = VADD(T78, T79);
Chris@42 2294 T90 = VSUB(T78, T79);
Chris@42 2295 }
Chris@42 2296 }
Chris@42 2297 {
Chris@42 2298 V TaJ, TaK, T1F, TaL, T27, TaM, TaN, T1M, TaO, T24, T1U, Tew, T2a, TaV, T21;
Chris@42 2299 V Tex, T29, TaS, T1I, T1L, Tev, Tey;
Chris@42 2300 {
Chris@42 2301 V T1D, T1E, T25, T26;
Chris@42 2302 T1D = LD(&(xi[WS(is, 126)]), ivs, &(xi[0]));
Chris@42 2303 T1E = LD(&(xi[WS(is, 62)]), ivs, &(xi[0]));
Chris@42 2304 TaJ = VADD(T1D, T1E);
Chris@42 2305 T25 = LD(&(xi[WS(is, 30)]), ivs, &(xi[0]));
Chris@42 2306 T26 = LD(&(xi[WS(is, 94)]), ivs, &(xi[0]));
Chris@42 2307 TaK = VADD(T25, T26);
Chris@42 2308 T1F = VSUB(T1D, T1E);
Chris@42 2309 TaL = VADD(TaJ, TaK);
Chris@42 2310 T27 = VSUB(T25, T26);
Chris@42 2311 }
Chris@42 2312 {
Chris@42 2313 V T1G, T1H, T1J, T1K;
Chris@42 2314 T1G = LD(&(xi[WS(is, 14)]), ivs, &(xi[0]));
Chris@42 2315 T1H = LD(&(xi[WS(is, 78)]), ivs, &(xi[0]));
Chris@42 2316 T1I = VSUB(T1G, T1H);
Chris@42 2317 TaM = VADD(T1G, T1H);
Chris@42 2318 T1J = LD(&(xi[WS(is, 110)]), ivs, &(xi[0]));
Chris@42 2319 T1K = LD(&(xi[WS(is, 46)]), ivs, &(xi[0]));
Chris@42 2320 T1L = VSUB(T1J, T1K);
Chris@42 2321 TaN = VADD(T1J, T1K);
Chris@42 2322 }
Chris@42 2323 T1M = VMUL(LDK(KP707106781), VADD(T1I, T1L));
Chris@42 2324 TaO = VADD(TaM, TaN);
Chris@42 2325 T24 = VMUL(LDK(KP707106781), VSUB(T1L, T1I));
Chris@42 2326 {
Chris@42 2327 V T1Q, TaT, T1T, TaU;
Chris@42 2328 {
Chris@42 2329 V T1O, T1P, T1R, T1S;
Chris@42 2330 T1O = LD(&(xi[WS(is, 6)]), ivs, &(xi[0]));
Chris@42 2331 T1P = LD(&(xi[WS(is, 70)]), ivs, &(xi[0]));
Chris@42 2332 T1Q = VSUB(T1O, T1P);
Chris@42 2333 TaT = VADD(T1O, T1P);
Chris@42 2334 T1R = LD(&(xi[WS(is, 38)]), ivs, &(xi[0]));
Chris@42 2335 T1S = LD(&(xi[WS(is, 102)]), ivs, &(xi[0]));
Chris@42 2336 T1T = VSUB(T1R, T1S);
Chris@42 2337 TaU = VADD(T1R, T1S);
Chris@42 2338 }
Chris@42 2339 T1U = VFNMS(LDK(KP382683432), T1T, VMUL(LDK(KP923879532), T1Q));
Chris@42 2340 Tew = VSUB(TaT, TaU);
Chris@42 2341 T2a = VFMA(LDK(KP382683432), T1Q, VMUL(LDK(KP923879532), T1T));
Chris@42 2342 TaV = VADD(TaT, TaU);
Chris@42 2343 }
Chris@42 2344 {
Chris@42 2345 V T1X, TaQ, T20, TaR;
Chris@42 2346 {
Chris@42 2347 V T1V, T1W, T1Y, T1Z;
Chris@42 2348 T1V = LD(&(xi[WS(is, 118)]), ivs, &(xi[0]));
Chris@42 2349 T1W = LD(&(xi[WS(is, 54)]), ivs, &(xi[0]));
Chris@42 2350 T1X = VSUB(T1V, T1W);
Chris@42 2351 TaQ = VADD(T1V, T1W);
Chris@42 2352 T1Y = LD(&(xi[WS(is, 22)]), ivs, &(xi[0]));
Chris@42 2353 T1Z = LD(&(xi[WS(is, 86)]), ivs, &(xi[0]));
Chris@42 2354 T20 = VSUB(T1Y, T1Z);
Chris@42 2355 TaR = VADD(T1Y, T1Z);
Chris@42 2356 }
Chris@42 2357 T21 = VFMA(LDK(KP923879532), T1X, VMUL(LDK(KP382683432), T20));
Chris@42 2358 Tex = VSUB(TaQ, TaR);
Chris@42 2359 T29 = VFNMS(LDK(KP923879532), T20, VMUL(LDK(KP382683432), T1X));
Chris@42 2360 TaS = VADD(TaQ, TaR);
Chris@42 2361 }
Chris@42 2362 Tdm = VADD(TaL, TaO);
Chris@42 2363 Tdn = VADD(TaV, TaS);
Chris@42 2364 TdH = VSUB(Tdm, Tdn);
Chris@42 2365 Tev = VSUB(TaJ, TaK);
Chris@42 2366 Tey = VMUL(LDK(KP707106781), VADD(Tew, Tex));
Chris@42 2367 Tez = VADD(Tev, Tey);
Chris@42 2368 Tgi = VSUB(Tev, Tey);
Chris@42 2369 {
Chris@42 2370 V TeA, TeB, T1N, T22;
Chris@42 2371 TeA = VSUB(TaN, TaM);
Chris@42 2372 TeB = VMUL(LDK(KP707106781), VSUB(Tex, Tew));
Chris@42 2373 TeC = VADD(TeA, TeB);
Chris@42 2374 Tgj = VSUB(TeB, TeA);
Chris@42 2375 T1N = VADD(T1F, T1M);
Chris@42 2376 T22 = VADD(T1U, T21);
Chris@42 2377 T23 = VADD(T1N, T22);
Chris@42 2378 T5N = VSUB(T1N, T22);
Chris@42 2379 }
Chris@42 2380 {
Chris@42 2381 V T28, T2b, T7i, T7j;
Chris@42 2382 T28 = VSUB(T24, T27);
Chris@42 2383 T2b = VSUB(T29, T2a);
Chris@42 2384 T2c = VADD(T28, T2b);
Chris@42 2385 T5M = VSUB(T2b, T28);
Chris@42 2386 T7i = VADD(T27, T24);
Chris@42 2387 T7j = VSUB(T21, T1U);
Chris@42 2388 T7k = VADD(T7i, T7j);
Chris@42 2389 T8X = VSUB(T7j, T7i);
Chris@42 2390 }
Chris@42 2391 {
Chris@42 2392 V TaP, TaW, T7f, T7g;
Chris@42 2393 TaP = VSUB(TaL, TaO);
Chris@42 2394 TaW = VSUB(TaS, TaV);
Chris@42 2395 TaX = VFNMS(LDK(KP382683432), TaW, VMUL(LDK(KP923879532), TaP));
Chris@42 2396 Tcg = VFMA(LDK(KP382683432), TaP, VMUL(LDK(KP923879532), TaW));
Chris@42 2397 T7f = VSUB(T1F, T1M);
Chris@42 2398 T7g = VADD(T2a, T29);
Chris@42 2399 T7h = VADD(T7f, T7g);
Chris@42 2400 T8W = VSUB(T7f, T7g);
Chris@42 2401 }
Chris@42 2402 }
Chris@42 2403 {
Chris@42 2404 V T2J, TeL, T2V, Tb9, T30, TeO, T3c, Tbg, T2Q, TeM, T2S, Tbc, T37, TeP, T39;
Chris@42 2405 V Tbj;
Chris@42 2406 {
Chris@42 2407 V T2H, T2I, Tb7, T2T, T2U, Tb8;
Chris@42 2408 T2H = LD(&(xi[WS(is, 5)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2409 T2I = LD(&(xi[WS(is, 69)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2410 Tb7 = VADD(T2H, T2I);
Chris@42 2411 T2T = LD(&(xi[WS(is, 37)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2412 T2U = LD(&(xi[WS(is, 101)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2413 Tb8 = VADD(T2T, T2U);
Chris@42 2414 T2J = VSUB(T2H, T2I);
Chris@42 2415 TeL = VSUB(Tb7, Tb8);
Chris@42 2416 T2V = VSUB(T2T, T2U);
Chris@42 2417 Tb9 = VADD(Tb7, Tb8);
Chris@42 2418 }
Chris@42 2419 {
Chris@42 2420 V T2Y, T2Z, Tbe, T3a, T3b, Tbf;
Chris@42 2421 T2Y = LD(&(xi[WS(is, 125)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2422 T2Z = LD(&(xi[WS(is, 61)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2423 Tbe = VADD(T2Y, T2Z);
Chris@42 2424 T3a = LD(&(xi[WS(is, 29)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2425 T3b = LD(&(xi[WS(is, 93)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2426 Tbf = VADD(T3a, T3b);
Chris@42 2427 T30 = VSUB(T2Y, T2Z);
Chris@42 2428 TeO = VSUB(Tbe, Tbf);
Chris@42 2429 T3c = VSUB(T3a, T3b);
Chris@42 2430 Tbg = VADD(Tbe, Tbf);
Chris@42 2431 }
Chris@42 2432 {
Chris@42 2433 V T2M, Tba, T2P, Tbb;
Chris@42 2434 {
Chris@42 2435 V T2K, T2L, T2N, T2O;
Chris@42 2436 T2K = LD(&(xi[WS(is, 21)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2437 T2L = LD(&(xi[WS(is, 85)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2438 T2M = VSUB(T2K, T2L);
Chris@42 2439 Tba = VADD(T2K, T2L);
Chris@42 2440 T2N = LD(&(xi[WS(is, 117)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2441 T2O = LD(&(xi[WS(is, 53)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2442 T2P = VSUB(T2N, T2O);
Chris@42 2443 Tbb = VADD(T2N, T2O);
Chris@42 2444 }
Chris@42 2445 T2Q = VMUL(LDK(KP707106781), VADD(T2M, T2P));
Chris@42 2446 TeM = VSUB(Tbb, Tba);
Chris@42 2447 T2S = VMUL(LDK(KP707106781), VSUB(T2P, T2M));
Chris@42 2448 Tbc = VADD(Tba, Tbb);
Chris@42 2449 }
Chris@42 2450 {
Chris@42 2451 V T33, Tbh, T36, Tbi;
Chris@42 2452 {
Chris@42 2453 V T31, T32, T34, T35;
Chris@42 2454 T31 = LD(&(xi[WS(is, 13)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2455 T32 = LD(&(xi[WS(is, 77)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2456 T33 = VSUB(T31, T32);
Chris@42 2457 Tbh = VADD(T31, T32);
Chris@42 2458 T34 = LD(&(xi[WS(is, 109)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2459 T35 = LD(&(xi[WS(is, 45)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2460 T36 = VSUB(T34, T35);
Chris@42 2461 Tbi = VADD(T34, T35);
Chris@42 2462 }
Chris@42 2463 T37 = VMUL(LDK(KP707106781), VADD(T33, T36));
Chris@42 2464 TeP = VSUB(Tbi, Tbh);
Chris@42 2465 T39 = VMUL(LDK(KP707106781), VSUB(T36, T33));
Chris@42 2466 Tbj = VADD(Tbh, Tbi);
Chris@42 2467 }
Chris@42 2468 {
Chris@42 2469 V Tbd, Tbk, TeN, TeQ;
Chris@42 2470 Tbd = VSUB(Tb9, Tbc);
Chris@42 2471 Tbk = VSUB(Tbg, Tbj);
Chris@42 2472 Tbl = VMUL(LDK(KP707106781), VADD(Tbd, Tbk));
Chris@42 2473 Tbu = VMUL(LDK(KP707106781), VSUB(Tbk, Tbd));
Chris@42 2474 {
Chris@42 2475 V Td9, Tda, TeW, TeX;
Chris@42 2476 Td9 = VADD(Tb9, Tbc);
Chris@42 2477 Tda = VADD(Tbg, Tbj);
Chris@42 2478 Tdb = VADD(Td9, Tda);
Chris@42 2479 TdL = VSUB(Tda, Td9);
Chris@42 2480 TeW = VFNMS(LDK(KP382683432), TeL, VMUL(LDK(KP923879532), TeM));
Chris@42 2481 TeX = VFMA(LDK(KP382683432), TeO, VMUL(LDK(KP923879532), TeP));
Chris@42 2482 TeY = VADD(TeW, TeX);
Chris@42 2483 Tgu = VSUB(TeX, TeW);
Chris@42 2484 }
Chris@42 2485 TeN = VFMA(LDK(KP923879532), TeL, VMUL(LDK(KP382683432), TeM));
Chris@42 2486 TeQ = VFNMS(LDK(KP382683432), TeP, VMUL(LDK(KP923879532), TeO));
Chris@42 2487 TeR = VADD(TeN, TeQ);
Chris@42 2488 Tgq = VSUB(TeQ, TeN);
Chris@42 2489 {
Chris@42 2490 V T7t, T7C, T7w, T7D;
Chris@42 2491 {
Chris@42 2492 V T7r, T7s, T7u, T7v;
Chris@42 2493 T7r = VSUB(T2J, T2Q);
Chris@42 2494 T7s = VADD(T2V, T2S);
Chris@42 2495 T7t = VFMA(LDK(KP831469612), T7r, VMUL(LDK(KP555570233), T7s));
Chris@42 2496 T7C = VFNMS(LDK(KP555570233), T7r, VMUL(LDK(KP831469612), T7s));
Chris@42 2497 T7u = VSUB(T30, T37);
Chris@42 2498 T7v = VADD(T3c, T39);
Chris@42 2499 T7w = VFNMS(LDK(KP555570233), T7v, VMUL(LDK(KP831469612), T7u));
Chris@42 2500 T7D = VFMA(LDK(KP555570233), T7u, VMUL(LDK(KP831469612), T7v));
Chris@42 2501 }
Chris@42 2502 T7x = VADD(T7t, T7w);
Chris@42 2503 T98 = VSUB(T7D, T7C);
Chris@42 2504 T7E = VADD(T7C, T7D);
Chris@42 2505 T94 = VSUB(T7w, T7t);
Chris@42 2506 }
Chris@42 2507 {
Chris@42 2508 V T2X, T3q, T3e, T3r;
Chris@42 2509 {
Chris@42 2510 V T2R, T2W, T38, T3d;
Chris@42 2511 T2R = VADD(T2J, T2Q);
Chris@42 2512 T2W = VSUB(T2S, T2V);
Chris@42 2513 T2X = VFMA(LDK(KP980785280), T2R, VMUL(LDK(KP195090322), T2W));
Chris@42 2514 T3q = VFNMS(LDK(KP195090322), T2R, VMUL(LDK(KP980785280), T2W));
Chris@42 2515 T38 = VADD(T30, T37);
Chris@42 2516 T3d = VSUB(T39, T3c);
Chris@42 2517 T3e = VFNMS(LDK(KP195090322), T3d, VMUL(LDK(KP980785280), T38));
Chris@42 2518 T3r = VFMA(LDK(KP195090322), T38, VMUL(LDK(KP980785280), T3d));
Chris@42 2519 }
Chris@42 2520 T3f = VADD(T2X, T3e);
Chris@42 2521 T5Y = VSUB(T3r, T3q);
Chris@42 2522 T3s = VADD(T3q, T3r);
Chris@42 2523 T5U = VSUB(T3e, T2X);
Chris@42 2524 }
Chris@42 2525 }
Chris@42 2526 }
Chris@42 2527 {
Chris@42 2528 V T3Y, Tf6, T4a, TbG, T4f, Tf9, T4r, TbN, T45, Tf7, T47, TbJ, T4m, Tfa, T4o;
Chris@42 2529 V TbQ;
Chris@42 2530 {
Chris@42 2531 V T3W, T3X, TbE, T48, T49, TbF;
Chris@42 2532 T3W = LD(&(xi[WS(is, 3)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2533 T3X = LD(&(xi[WS(is, 67)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2534 TbE = VADD(T3W, T3X);
Chris@42 2535 T48 = LD(&(xi[WS(is, 35)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2536 T49 = LD(&(xi[WS(is, 99)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2537 TbF = VADD(T48, T49);
Chris@42 2538 T3Y = VSUB(T3W, T3X);
Chris@42 2539 Tf6 = VSUB(TbE, TbF);
Chris@42 2540 T4a = VSUB(T48, T49);
Chris@42 2541 TbG = VADD(TbE, TbF);
Chris@42 2542 }
Chris@42 2543 {
Chris@42 2544 V T4d, T4e, TbL, T4p, T4q, TbM;
Chris@42 2545 T4d = LD(&(xi[WS(is, 123)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2546 T4e = LD(&(xi[WS(is, 59)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2547 TbL = VADD(T4d, T4e);
Chris@42 2548 T4p = LD(&(xi[WS(is, 27)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2549 T4q = LD(&(xi[WS(is, 91)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2550 TbM = VADD(T4p, T4q);
Chris@42 2551 T4f = VSUB(T4d, T4e);
Chris@42 2552 Tf9 = VSUB(TbL, TbM);
Chris@42 2553 T4r = VSUB(T4p, T4q);
Chris@42 2554 TbN = VADD(TbL, TbM);
Chris@42 2555 }
Chris@42 2556 {
Chris@42 2557 V T41, TbH, T44, TbI;
Chris@42 2558 {
Chris@42 2559 V T3Z, T40, T42, T43;
Chris@42 2560 T3Z = LD(&(xi[WS(is, 19)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2561 T40 = LD(&(xi[WS(is, 83)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2562 T41 = VSUB(T3Z, T40);
Chris@42 2563 TbH = VADD(T3Z, T40);
Chris@42 2564 T42 = LD(&(xi[WS(is, 115)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2565 T43 = LD(&(xi[WS(is, 51)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2566 T44 = VSUB(T42, T43);
Chris@42 2567 TbI = VADD(T42, T43);
Chris@42 2568 }
Chris@42 2569 T45 = VMUL(LDK(KP707106781), VADD(T41, T44));
Chris@42 2570 Tf7 = VSUB(TbI, TbH);
Chris@42 2571 T47 = VMUL(LDK(KP707106781), VSUB(T44, T41));
Chris@42 2572 TbJ = VADD(TbH, TbI);
Chris@42 2573 }
Chris@42 2574 {
Chris@42 2575 V T4i, TbO, T4l, TbP;
Chris@42 2576 {
Chris@42 2577 V T4g, T4h, T4j, T4k;
Chris@42 2578 T4g = LD(&(xi[WS(is, 11)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2579 T4h = LD(&(xi[WS(is, 75)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2580 T4i = VSUB(T4g, T4h);
Chris@42 2581 TbO = VADD(T4g, T4h);
Chris@42 2582 T4j = LD(&(xi[WS(is, 107)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2583 T4k = LD(&(xi[WS(is, 43)]), ivs, &(xi[WS(is, 1)]));
Chris@42 2584 T4l = VSUB(T4j, T4k);
Chris@42 2585 TbP = VADD(T4j, T4k);
Chris@42 2586 }
Chris@42 2587 T4m = VMUL(LDK(KP707106781), VADD(T4i, T4l));
Chris@42 2588 Tfa = VSUB(TbP, TbO);
Chris@42 2589 T4o = VMUL(LDK(KP707106781), VSUB(T4l, T4i));
Chris@42 2590 TbQ = VADD(TbO, TbP);
Chris@42 2591 }
Chris@42 2592 {
Chris@42 2593 V TbK, TbR, Tf8, Tfb;
Chris@42 2594 TbK = VSUB(TbG, TbJ);
Chris@42 2595 TbR = VSUB(TbN, TbQ);
Chris@42 2596 TbS = VMUL(LDK(KP707106781), VADD(TbK, TbR));
Chris@42 2597 Tc1 = VMUL(LDK(KP707106781), VSUB(TbR, TbK));
Chris@42 2598 {
Chris@42 2599 V Tdg, Tdh, Tfh, Tfi;
Chris@42 2600 Tdg = VADD(TbG, TbJ);
Chris@42 2601 Tdh = VADD(TbN, TbQ);
Chris@42 2602 Tdi = VADD(Tdg, Tdh);
Chris@42 2603 TdO = VSUB(Tdh, Tdg);
Chris@42 2604 Tfh = VFNMS(LDK(KP382683432), Tf6, VMUL(LDK(KP923879532), Tf7));
Chris@42 2605 Tfi = VFMA(LDK(KP382683432), Tf9, VMUL(LDK(KP923879532), Tfa));
Chris@42 2606 Tfj = VADD(Tfh, Tfi);
Chris@42 2607 Tgy = VSUB(Tfi, Tfh);
Chris@42 2608 }
Chris@42 2609 Tf8 = VFMA(LDK(KP923879532), Tf6, VMUL(LDK(KP382683432), Tf7));
Chris@42 2610 Tfb = VFNMS(LDK(KP382683432), Tfa, VMUL(LDK(KP923879532), Tf9));
Chris@42 2611 Tfc = VADD(Tf8, Tfb);
Chris@42 2612 TgA = VSUB(Tfb, Tf8);
Chris@42 2613 {
Chris@42 2614 V T7M, T7V, T7P, T7W;
Chris@42 2615 {
Chris@42 2616 V T7K, T7L, T7N, T7O;
Chris@42 2617 T7K = VSUB(T3Y, T45);
Chris@42 2618 T7L = VADD(T4a, T47);
Chris@42 2619 T7M = VFMA(LDK(KP831469612), T7K, VMUL(LDK(KP555570233), T7L));
Chris@42 2620 T7V = VFNMS(LDK(KP555570233), T7K, VMUL(LDK(KP831469612), T7L));
Chris@42 2621 T7N = VSUB(T4f, T4m);
Chris@42 2622 T7O = VADD(T4r, T4o);
Chris@42 2623 T7P = VFNMS(LDK(KP555570233), T7O, VMUL(LDK(KP831469612), T7N));
Chris@42 2624 T7W = VFMA(LDK(KP555570233), T7N, VMUL(LDK(KP831469612), T7O));
Chris@42 2625 }
Chris@42 2626 T7Q = VADD(T7M, T7P);
Chris@42 2627 T9e = VSUB(T7P, T7M);
Chris@42 2628 T7X = VADD(T7V, T7W);
Chris@42 2629 T9c = VSUB(T7W, T7V);
Chris@42 2630 }
Chris@42 2631 {
Chris@42 2632 V T4c, T4F, T4t, T4G;
Chris@42 2633 {
Chris@42 2634 V T46, T4b, T4n, T4s;
Chris@42 2635 T46 = VADD(T3Y, T45);
Chris@42 2636 T4b = VSUB(T47, T4a);
Chris@42 2637 T4c = VFMA(LDK(KP980785280), T46, VMUL(LDK(KP195090322), T4b));
Chris@42 2638 T4F = VFNMS(LDK(KP195090322), T46, VMUL(LDK(KP980785280), T4b));
Chris@42 2639 T4n = VADD(T4f, T4m);
Chris@42 2640 T4s = VSUB(T4o, T4r);
Chris@42 2641 T4t = VFNMS(LDK(KP195090322), T4s, VMUL(LDK(KP980785280), T4n));
Chris@42 2642 T4G = VFMA(LDK(KP195090322), T4n, VMUL(LDK(KP980785280), T4s));
Chris@42 2643 }
Chris@42 2644 T4u = VADD(T4c, T4t);
Chris@42 2645 T64 = VSUB(T4t, T4c);
Chris@42 2646 T4H = VADD(T4F, T4G);
Chris@42 2647 T62 = VSUB(T4G, T4F);
Chris@42 2648 }
Chris@42 2649 }
Chris@42 2650 }
Chris@42 2651 {
Chris@42 2652 V Td5, Tdx, TdC, TdE, Tdk, Tdt, Tds, Tdy, Tdz, TdD;
Chris@42 2653 {
Chris@42 2654 V Td1, Td4, TdA, TdB;
Chris@42 2655 Td1 = VADD(TcZ, Td0);
Chris@42 2656 Td4 = VADD(Td2, Td3);
Chris@42 2657 Td5 = VSUB(Td1, Td4);
Chris@42 2658 Tdx = VADD(Td1, Td4);
Chris@42 2659 TdA = VADD(Td8, Tdb);
Chris@42 2660 TdB = VADD(Tdf, Tdi);
Chris@42 2661 TdC = VADD(TdA, TdB);
Chris@42 2662 TdE = VBYI(VSUB(TdB, TdA));
Chris@42 2663 }
Chris@42 2664 {
Chris@42 2665 V Tdc, Tdj, Tdo, Tdr;
Chris@42 2666 Tdc = VSUB(Td8, Tdb);
Chris@42 2667 Tdj = VSUB(Tdf, Tdi);
Chris@42 2668 Tdk = VMUL(LDK(KP707106781), VADD(Tdc, Tdj));
Chris@42 2669 Tdt = VMUL(LDK(KP707106781), VSUB(Tdj, Tdc));
Chris@42 2670 Tdo = VADD(Tdm, Tdn);
Chris@42 2671 Tdr = VADD(Tdp, Tdq);
Chris@42 2672 Tds = VSUB(Tdo, Tdr);
Chris@42 2673 Tdy = VADD(Tdr, Tdo);
Chris@42 2674 }
Chris@42 2675 Tdz = VADD(Tdx, Tdy);
Chris@42 2676 ST(&(xo[WS(os, 64)]), VSUB(Tdz, TdC), ovs, &(xo[0]));
Chris@42 2677 ST(&(xo[0]), VADD(Tdz, TdC), ovs, &(xo[0]));
Chris@42 2678 TdD = VSUB(Tdx, Tdy);
Chris@42 2679 ST(&(xo[WS(os, 96)]), VSUB(TdD, TdE), ovs, &(xo[0]));
Chris@42 2680 ST(&(xo[WS(os, 32)]), VADD(TdD, TdE), ovs, &(xo[0]));
Chris@42 2681 {
Chris@42 2682 V Tdl, Tdu, Tdv, Tdw;
Chris@42 2683 Tdl = VADD(Td5, Tdk);
Chris@42 2684 Tdu = VBYI(VADD(Tds, Tdt));
Chris@42 2685 ST(&(xo[WS(os, 112)]), VSUB(Tdl, Tdu), ovs, &(xo[0]));
Chris@42 2686 ST(&(xo[WS(os, 16)]), VADD(Tdl, Tdu), ovs, &(xo[0]));
Chris@42 2687 Tdv = VSUB(Td5, Tdk);
Chris@42 2688 Tdw = VBYI(VSUB(Tdt, Tds));
Chris@42 2689 ST(&(xo[WS(os, 80)]), VSUB(Tdv, Tdw), ovs, &(xo[0]));
Chris@42 2690 ST(&(xo[WS(os, 48)]), VADD(Tdv, Tdw), ovs, &(xo[0]));
Chris@42 2691 }
Chris@42 2692 }
Chris@42 2693 {
Chris@42 2694 V TdJ, Te4, TdX, Te5, TdQ, Te1, TdU, Te2;
Chris@42 2695 {
Chris@42 2696 V TdF, TdI, TdV, TdW;
Chris@42 2697 TdF = VSUB(TcZ, Td0);
Chris@42 2698 TdI = VMUL(LDK(KP707106781), VADD(TdG, TdH));
Chris@42 2699 TdJ = VADD(TdF, TdI);
Chris@42 2700 Te4 = VSUB(TdF, TdI);
Chris@42 2701 TdV = VFNMS(LDK(KP382683432), TdK, VMUL(LDK(KP923879532), TdL));
Chris@42 2702 TdW = VFMA(LDK(KP382683432), TdN, VMUL(LDK(KP923879532), TdO));
Chris@42 2703 TdX = VADD(TdV, TdW);
Chris@42 2704 Te5 = VSUB(TdW, TdV);
Chris@42 2705 }
Chris@42 2706 {
Chris@42 2707 V TdM, TdP, TdS, TdT;
Chris@42 2708 TdM = VFMA(LDK(KP923879532), TdK, VMUL(LDK(KP382683432), TdL));
Chris@42 2709 TdP = VFNMS(LDK(KP382683432), TdO, VMUL(LDK(KP923879532), TdN));
Chris@42 2710 TdQ = VADD(TdM, TdP);
Chris@42 2711 Te1 = VSUB(TdP, TdM);
Chris@42 2712 TdS = VSUB(Td3, Td2);
Chris@42 2713 TdT = VMUL(LDK(KP707106781), VSUB(TdH, TdG));
Chris@42 2714 TdU = VADD(TdS, TdT);
Chris@42 2715 Te2 = VSUB(TdT, TdS);
Chris@42 2716 }
Chris@42 2717 {
Chris@42 2718 V TdR, TdY, Te7, Te8;
Chris@42 2719 TdR = VADD(TdJ, TdQ);
Chris@42 2720 TdY = VBYI(VADD(TdU, TdX));
Chris@42 2721 ST(&(xo[WS(os, 120)]), VSUB(TdR, TdY), ovs, &(xo[0]));
Chris@42 2722 ST(&(xo[WS(os, 8)]), VADD(TdR, TdY), ovs, &(xo[0]));
Chris@42 2723 Te7 = VBYI(VADD(Te2, Te1));
Chris@42 2724 Te8 = VADD(Te4, Te5);
Chris@42 2725 ST(&(xo[WS(os, 24)]), VADD(Te7, Te8), ovs, &(xo[0]));
Chris@42 2726 ST(&(xo[WS(os, 104)]), VSUB(Te8, Te7), ovs, &(xo[0]));
Chris@42 2727 }
Chris@42 2728 {
Chris@42 2729 V TdZ, Te0, Te3, Te6;
Chris@42 2730 TdZ = VSUB(TdJ, TdQ);
Chris@42 2731 Te0 = VBYI(VSUB(TdX, TdU));
Chris@42 2732 ST(&(xo[WS(os, 72)]), VSUB(TdZ, Te0), ovs, &(xo[0]));
Chris@42 2733 ST(&(xo[WS(os, 56)]), VADD(TdZ, Te0), ovs, &(xo[0]));
Chris@42 2734 Te3 = VBYI(VSUB(Te1, Te2));
Chris@42 2735 Te6 = VSUB(Te4, Te5);
Chris@42 2736 ST(&(xo[WS(os, 40)]), VADD(Te3, Te6), ovs, &(xo[0]));
Chris@42 2737 ST(&(xo[WS(os, 88)]), VSUB(Te6, Te3), ovs, &(xo[0]));
Chris@42 2738 }
Chris@42 2739 }
Chris@42 2740 {
Chris@42 2741 V TaZ, Tcs, Tci, Tcq, Tc4, Tct, Tcl, Tcp;
Chris@42 2742 {
Chris@42 2743 V Tat, TaY, Tce, Tch;
Chris@42 2744 Tat = VADD(Tad, Tas);
Chris@42 2745 TaY = VADD(TaI, TaX);
Chris@42 2746 TaZ = VADD(Tat, TaY);
Chris@42 2747 Tcs = VSUB(Tat, TaY);
Chris@42 2748 Tce = VADD(Tcc, Tcd);
Chris@42 2749 Tch = VADD(Tcf, Tcg);
Chris@42 2750 Tci = VADD(Tce, Tch);
Chris@42 2751 Tcq = VSUB(Tch, Tce);
Chris@42 2752 {
Chris@42 2753 V Tbw, Tcj, Tc3, Tck;
Chris@42 2754 {
Chris@42 2755 V Tbm, Tbv, TbT, Tc2;
Chris@42 2756 Tbm = VADD(Tb6, Tbl);
Chris@42 2757 Tbv = VADD(Tbt, Tbu);
Chris@42 2758 Tbw = VFMA(LDK(KP980785280), Tbm, VMUL(LDK(KP195090322), Tbv));
Chris@42 2759 Tcj = VFNMS(LDK(KP195090322), Tbm, VMUL(LDK(KP980785280), Tbv));
Chris@42 2760 TbT = VADD(TbD, TbS);
Chris@42 2761 Tc2 = VADD(Tc0, Tc1);
Chris@42 2762 Tc3 = VFNMS(LDK(KP195090322), Tc2, VMUL(LDK(KP980785280), TbT));
Chris@42 2763 Tck = VFMA(LDK(KP195090322), TbT, VMUL(LDK(KP980785280), Tc2));
Chris@42 2764 }
Chris@42 2765 Tc4 = VADD(Tbw, Tc3);
Chris@42 2766 Tct = VSUB(Tck, Tcj);
Chris@42 2767 Tcl = VADD(Tcj, Tck);
Chris@42 2768 Tcp = VSUB(Tc3, Tbw);
Chris@42 2769 }
Chris@42 2770 }
Chris@42 2771 {
Chris@42 2772 V Tc5, Tcm, Tcv, Tcw;
Chris@42 2773 Tc5 = VADD(TaZ, Tc4);
Chris@42 2774 Tcm = VBYI(VADD(Tci, Tcl));
Chris@42 2775 ST(&(xo[WS(os, 124)]), VSUB(Tc5, Tcm), ovs, &(xo[0]));
Chris@42 2776 ST(&(xo[WS(os, 4)]), VADD(Tc5, Tcm), ovs, &(xo[0]));
Chris@42 2777 Tcv = VBYI(VADD(Tcq, Tcp));
Chris@42 2778 Tcw = VADD(Tcs, Tct);
Chris@42 2779 ST(&(xo[WS(os, 28)]), VADD(Tcv, Tcw), ovs, &(xo[0]));
Chris@42 2780 ST(&(xo[WS(os, 100)]), VSUB(Tcw, Tcv), ovs, &(xo[0]));
Chris@42 2781 }
Chris@42 2782 {
Chris@42 2783 V Tcn, Tco, Tcr, Tcu;
Chris@42 2784 Tcn = VSUB(TaZ, Tc4);
Chris@42 2785 Tco = VBYI(VSUB(Tcl, Tci));
Chris@42 2786 ST(&(xo[WS(os, 68)]), VSUB(Tcn, Tco), ovs, &(xo[0]));
Chris@42 2787 ST(&(xo[WS(os, 60)]), VADD(Tcn, Tco), ovs, &(xo[0]));
Chris@42 2788 Tcr = VBYI(VSUB(Tcp, Tcq));
Chris@42 2789 Tcu = VSUB(Tcs, Tct);
Chris@42 2790 ST(&(xo[WS(os, 36)]), VADD(Tcr, Tcu), ovs, &(xo[0]));
Chris@42 2791 ST(&(xo[WS(os, 92)]), VSUB(Tcu, Tcr), ovs, &(xo[0]));
Chris@42 2792 }
Chris@42 2793 }
Chris@42 2794 {
Chris@42 2795 V Tcz, TcU, TcK, TcS, TcG, TcV, TcN, TcR;
Chris@42 2796 {
Chris@42 2797 V Tcx, Tcy, TcI, TcJ;
Chris@42 2798 Tcx = VSUB(Tad, Tas);
Chris@42 2799 Tcy = VSUB(Tcg, Tcf);
Chris@42 2800 Tcz = VADD(Tcx, Tcy);
Chris@42 2801 TcU = VSUB(Tcx, Tcy);
Chris@42 2802 TcI = VSUB(Tcd, Tcc);
Chris@42 2803 TcJ = VSUB(TaX, TaI);
Chris@42 2804 TcK = VADD(TcI, TcJ);
Chris@42 2805 TcS = VSUB(TcJ, TcI);
Chris@42 2806 {
Chris@42 2807 V TcC, TcL, TcF, TcM;
Chris@42 2808 {
Chris@42 2809 V TcA, TcB, TcD, TcE;
Chris@42 2810 TcA = VSUB(Tb6, Tbl);
Chris@42 2811 TcB = VSUB(Tbu, Tbt);
Chris@42 2812 TcC = VFMA(LDK(KP831469612), TcA, VMUL(LDK(KP555570233), TcB));
Chris@42 2813 TcL = VFNMS(LDK(KP555570233), TcA, VMUL(LDK(KP831469612), TcB));
Chris@42 2814 TcD = VSUB(TbD, TbS);
Chris@42 2815 TcE = VSUB(Tc1, Tc0);
Chris@42 2816 TcF = VFNMS(LDK(KP555570233), TcE, VMUL(LDK(KP831469612), TcD));
Chris@42 2817 TcM = VFMA(LDK(KP555570233), TcD, VMUL(LDK(KP831469612), TcE));
Chris@42 2818 }
Chris@42 2819 TcG = VADD(TcC, TcF);
Chris@42 2820 TcV = VSUB(TcM, TcL);
Chris@42 2821 TcN = VADD(TcL, TcM);
Chris@42 2822 TcR = VSUB(TcF, TcC);
Chris@42 2823 }
Chris@42 2824 }
Chris@42 2825 {
Chris@42 2826 V TcH, TcO, TcX, TcY;
Chris@42 2827 TcH = VADD(Tcz, TcG);
Chris@42 2828 TcO = VBYI(VADD(TcK, TcN));
Chris@42 2829 ST(&(xo[WS(os, 116)]), VSUB(TcH, TcO), ovs, &(xo[0]));
Chris@42 2830 ST(&(xo[WS(os, 12)]), VADD(TcH, TcO), ovs, &(xo[0]));
Chris@42 2831 TcX = VBYI(VADD(TcS, TcR));
Chris@42 2832 TcY = VADD(TcU, TcV);
Chris@42 2833 ST(&(xo[WS(os, 20)]), VADD(TcX, TcY), ovs, &(xo[0]));
Chris@42 2834 ST(&(xo[WS(os, 108)]), VSUB(TcY, TcX), ovs, &(xo[0]));
Chris@42 2835 }
Chris@42 2836 {
Chris@42 2837 V TcP, TcQ, TcT, TcW;
Chris@42 2838 TcP = VSUB(Tcz, TcG);
Chris@42 2839 TcQ = VBYI(VSUB(TcN, TcK));
Chris@42 2840 ST(&(xo[WS(os, 76)]), VSUB(TcP, TcQ), ovs, &(xo[0]));
Chris@42 2841 ST(&(xo[WS(os, 52)]), VADD(TcP, TcQ), ovs, &(xo[0]));
Chris@42 2842 TcT = VBYI(VSUB(TcR, TcS));
Chris@42 2843 TcW = VSUB(TcU, TcV);
Chris@42 2844 ST(&(xo[WS(os, 44)]), VADD(TcT, TcW), ovs, &(xo[0]));
Chris@42 2845 ST(&(xo[WS(os, 84)]), VSUB(TcW, TcT), ovs, &(xo[0]));
Chris@42 2846 }
Chris@42 2847 }
Chris@42 2848 {
Chris@42 2849 V TeF, Tg8, TfI, Tg0, Tfy, Tga, TfG, TfP, Tfm, TfJ, TfB, TfF, TfW, Tgb, Tg3;
Chris@42 2850 V Tg7;
Chris@42 2851 {
Chris@42 2852 V Tel, TfY, TeE, TfZ, Teu, TeD;
Chris@42 2853 Tel = VADD(Ted, Tek);
Chris@42 2854 TfY = VSUB(Tft, Tfq);
Chris@42 2855 Teu = VFMA(LDK(KP980785280), Teq, VMUL(LDK(KP195090322), Tet));
Chris@42 2856 TeD = VFNMS(LDK(KP195090322), TeC, VMUL(LDK(KP980785280), Tez));
Chris@42 2857 TeE = VADD(Teu, TeD);
Chris@42 2858 TfZ = VSUB(TeD, Teu);
Chris@42 2859 TeF = VADD(Tel, TeE);
Chris@42 2860 Tg8 = VSUB(TfZ, TfY);
Chris@42 2861 TfI = VSUB(Tel, TeE);
Chris@42 2862 Tg0 = VADD(TfY, TfZ);
Chris@42 2863 }
Chris@42 2864 {
Chris@42 2865 V Tfu, TfN, Tfx, TfO, Tfv, Tfw;
Chris@42 2866 Tfu = VADD(Tfq, Tft);
Chris@42 2867 TfN = VSUB(Ted, Tek);
Chris@42 2868 Tfv = VFNMS(LDK(KP195090322), Teq, VMUL(LDK(KP980785280), Tet));
Chris@42 2869 Tfw = VFMA(LDK(KP195090322), Tez, VMUL(LDK(KP980785280), TeC));
Chris@42 2870 Tfx = VADD(Tfv, Tfw);
Chris@42 2871 TfO = VSUB(Tfw, Tfv);
Chris@42 2872 Tfy = VADD(Tfu, Tfx);
Chris@42 2873 Tga = VSUB(TfN, TfO);
Chris@42 2874 TfG = VSUB(Tfx, Tfu);
Chris@42 2875 TfP = VADD(TfN, TfO);
Chris@42 2876 }
Chris@42 2877 {
Chris@42 2878 V Tf0, Tfz, Tfl, TfA;
Chris@42 2879 {
Chris@42 2880 V TeS, TeZ, Tfd, Tfk;
Chris@42 2881 TeS = VADD(TeK, TeR);
Chris@42 2882 TeZ = VADD(TeV, TeY);
Chris@42 2883 Tf0 = VFMA(LDK(KP995184726), TeS, VMUL(LDK(KP098017140), TeZ));
Chris@42 2884 Tfz = VFNMS(LDK(KP098017140), TeS, VMUL(LDK(KP995184726), TeZ));
Chris@42 2885 Tfd = VADD(Tf5, Tfc);
Chris@42 2886 Tfk = VADD(Tfg, Tfj);
Chris@42 2887 Tfl = VFNMS(LDK(KP098017140), Tfk, VMUL(LDK(KP995184726), Tfd));
Chris@42 2888 TfA = VFMA(LDK(KP098017140), Tfd, VMUL(LDK(KP995184726), Tfk));
Chris@42 2889 }
Chris@42 2890 Tfm = VADD(Tf0, Tfl);
Chris@42 2891 TfJ = VSUB(TfA, Tfz);
Chris@42 2892 TfB = VADD(Tfz, TfA);
Chris@42 2893 TfF = VSUB(Tfl, Tf0);
Chris@42 2894 }
Chris@42 2895 {
Chris@42 2896 V TfS, Tg1, TfV, Tg2;
Chris@42 2897 {
Chris@42 2898 V TfQ, TfR, TfT, TfU;
Chris@42 2899 TfQ = VSUB(TeK, TeR);
Chris@42 2900 TfR = VSUB(TeY, TeV);
Chris@42 2901 TfS = VFMA(LDK(KP773010453), TfQ, VMUL(LDK(KP634393284), TfR));
Chris@42 2902 Tg1 = VFNMS(LDK(KP634393284), TfQ, VMUL(LDK(KP773010453), TfR));
Chris@42 2903 TfT = VSUB(Tf5, Tfc);
Chris@42 2904 TfU = VSUB(Tfj, Tfg);
Chris@42 2905 TfV = VFNMS(LDK(KP634393284), TfU, VMUL(LDK(KP773010453), TfT));
Chris@42 2906 Tg2 = VFMA(LDK(KP634393284), TfT, VMUL(LDK(KP773010453), TfU));
Chris@42 2907 }
Chris@42 2908 TfW = VADD(TfS, TfV);
Chris@42 2909 Tgb = VSUB(Tg2, Tg1);
Chris@42 2910 Tg3 = VADD(Tg1, Tg2);
Chris@42 2911 Tg7 = VSUB(TfV, TfS);
Chris@42 2912 }
Chris@42 2913 {
Chris@42 2914 V Tfn, TfC, Tg9, Tgc;
Chris@42 2915 Tfn = VADD(TeF, Tfm);
Chris@42 2916 TfC = VBYI(VADD(Tfy, TfB));
Chris@42 2917 ST(&(xo[WS(os, 126)]), VSUB(Tfn, TfC), ovs, &(xo[0]));
Chris@42 2918 ST(&(xo[WS(os, 2)]), VADD(Tfn, TfC), ovs, &(xo[0]));
Chris@42 2919 Tg9 = VBYI(VSUB(Tg7, Tg8));
Chris@42 2920 Tgc = VSUB(Tga, Tgb);
Chris@42 2921 ST(&(xo[WS(os, 46)]), VADD(Tg9, Tgc), ovs, &(xo[0]));
Chris@42 2922 ST(&(xo[WS(os, 82)]), VSUB(Tgc, Tg9), ovs, &(xo[0]));
Chris@42 2923 }
Chris@42 2924 {
Chris@42 2925 V Tgd, Tge, TfD, TfE;
Chris@42 2926 Tgd = VBYI(VADD(Tg8, Tg7));
Chris@42 2927 Tge = VADD(Tga, Tgb);
Chris@42 2928 ST(&(xo[WS(os, 18)]), VADD(Tgd, Tge), ovs, &(xo[0]));
Chris@42 2929 ST(&(xo[WS(os, 110)]), VSUB(Tge, Tgd), ovs, &(xo[0]));
Chris@42 2930 TfD = VSUB(TeF, Tfm);
Chris@42 2931 TfE = VBYI(VSUB(TfB, Tfy));
Chris@42 2932 ST(&(xo[WS(os, 66)]), VSUB(TfD, TfE), ovs, &(xo[0]));
Chris@42 2933 ST(&(xo[WS(os, 62)]), VADD(TfD, TfE), ovs, &(xo[0]));
Chris@42 2934 }
Chris@42 2935 {
Chris@42 2936 V TfH, TfK, TfX, Tg4;
Chris@42 2937 TfH = VBYI(VSUB(TfF, TfG));
Chris@42 2938 TfK = VSUB(TfI, TfJ);
Chris@42 2939 ST(&(xo[WS(os, 34)]), VADD(TfH, TfK), ovs, &(xo[0]));
Chris@42 2940 ST(&(xo[WS(os, 94)]), VSUB(TfK, TfH), ovs, &(xo[0]));
Chris@42 2941 TfX = VADD(TfP, TfW);
Chris@42 2942 Tg4 = VBYI(VADD(Tg0, Tg3));
Chris@42 2943 ST(&(xo[WS(os, 114)]), VSUB(TfX, Tg4), ovs, &(xo[0]));
Chris@42 2944 ST(&(xo[WS(os, 14)]), VADD(TfX, Tg4), ovs, &(xo[0]));
Chris@42 2945 }
Chris@42 2946 {
Chris@42 2947 V Tg5, Tg6, TfL, TfM;
Chris@42 2948 Tg5 = VSUB(TfP, TfW);
Chris@42 2949 Tg6 = VBYI(VSUB(Tg3, Tg0));
Chris@42 2950 ST(&(xo[WS(os, 78)]), VSUB(Tg5, Tg6), ovs, &(xo[0]));
Chris@42 2951 ST(&(xo[WS(os, 50)]), VADD(Tg5, Tg6), ovs, &(xo[0]));
Chris@42 2952 TfL = VBYI(VADD(TfG, TfF));
Chris@42 2953 TfM = VADD(TfI, TfJ);
Chris@42 2954 ST(&(xo[WS(os, 30)]), VADD(TfL, TfM), ovs, &(xo[0]));
Chris@42 2955 ST(&(xo[WS(os, 98)]), VSUB(TfM, TfL), ovs, &(xo[0]));
Chris@42 2956 }
Chris@42 2957 }
Chris@42 2958 {
Chris@42 2959 V Tgp, Thm, TgW, The, TgM, Tho, TgU, Th3, TgE, TgX, TgP, TgT, Tha, Thp, Thh;
Chris@42 2960 V Thl;
Chris@42 2961 {
Chris@42 2962 V Tgh, Thc, Tgo, Thd, Tgk, Tgn;
Chris@42 2963 Tgh = VSUB(Tgf, Tgg);
Chris@42 2964 Thc = VADD(TgH, TgG);
Chris@42 2965 Tgk = VFMA(LDK(KP555570233), Tgi, VMUL(LDK(KP831469612), Tgj));
Chris@42 2966 Tgn = VFNMS(LDK(KP555570233), Tgm, VMUL(LDK(KP831469612), Tgl));
Chris@42 2967 Tgo = VSUB(Tgk, Tgn);
Chris@42 2968 Thd = VADD(Tgn, Tgk);
Chris@42 2969 Tgp = VADD(Tgh, Tgo);
Chris@42 2970 Thm = VSUB(Thd, Thc);
Chris@42 2971 TgW = VSUB(Tgh, Tgo);
Chris@42 2972 The = VADD(Thc, Thd);
Chris@42 2973 }
Chris@42 2974 {
Chris@42 2975 V TgI, Th1, TgL, Th2, TgJ, TgK;
Chris@42 2976 TgI = VSUB(TgG, TgH);
Chris@42 2977 Th1 = VADD(Tgf, Tgg);
Chris@42 2978 TgJ = VFNMS(LDK(KP555570233), Tgj, VMUL(LDK(KP831469612), Tgi));
Chris@42 2979 TgK = VFMA(LDK(KP831469612), Tgm, VMUL(LDK(KP555570233), Tgl));
Chris@42 2980 TgL = VSUB(TgJ, TgK);
Chris@42 2981 Th2 = VADD(TgK, TgJ);
Chris@42 2982 TgM = VADD(TgI, TgL);
Chris@42 2983 Tho = VSUB(Th1, Th2);
Chris@42 2984 TgU = VSUB(TgL, TgI);
Chris@42 2985 Th3 = VADD(Th1, Th2);
Chris@42 2986 }
Chris@42 2987 {
Chris@42 2988 V Tgw, TgN, TgD, TgO;
Chris@42 2989 {
Chris@42 2990 V Tgs, Tgv, Tgz, TgC;
Chris@42 2991 Tgs = VSUB(Tgq, Tgr);
Chris@42 2992 Tgv = VSUB(Tgt, Tgu);
Chris@42 2993 Tgw = VFMA(LDK(KP471396736), Tgs, VMUL(LDK(KP881921264), Tgv));
Chris@42 2994 TgN = VFNMS(LDK(KP471396736), Tgv, VMUL(LDK(KP881921264), Tgs));
Chris@42 2995 Tgz = VSUB(Tgx, Tgy);
Chris@42 2996 TgC = VSUB(TgA, TgB);
Chris@42 2997 TgD = VFNMS(LDK(KP471396736), TgC, VMUL(LDK(KP881921264), Tgz));
Chris@42 2998 TgO = VFMA(LDK(KP881921264), TgC, VMUL(LDK(KP471396736), Tgz));
Chris@42 2999 }
Chris@42 3000 TgE = VADD(Tgw, TgD);
Chris@42 3001 TgX = VSUB(TgO, TgN);
Chris@42 3002 TgP = VADD(TgN, TgO);
Chris@42 3003 TgT = VSUB(TgD, Tgw);
Chris@42 3004 }
Chris@42 3005 {
Chris@42 3006 V Th6, Thf, Th9, Thg;
Chris@42 3007 {
Chris@42 3008 V Th4, Th5, Th7, Th8;
Chris@42 3009 Th4 = VADD(Tgr, Tgq);
Chris@42 3010 Th5 = VADD(Tgt, Tgu);
Chris@42 3011 Th6 = VFMA(LDK(KP290284677), Th4, VMUL(LDK(KP956940335), Th5));
Chris@42 3012 Thf = VFNMS(LDK(KP290284677), Th5, VMUL(LDK(KP956940335), Th4));
Chris@42 3013 Th7 = VADD(Tgx, Tgy);
Chris@42 3014 Th8 = VADD(TgB, TgA);
Chris@42 3015 Th9 = VFNMS(LDK(KP290284677), Th8, VMUL(LDK(KP956940335), Th7));
Chris@42 3016 Thg = VFMA(LDK(KP956940335), Th8, VMUL(LDK(KP290284677), Th7));
Chris@42 3017 }
Chris@42 3018 Tha = VADD(Th6, Th9);
Chris@42 3019 Thp = VSUB(Thg, Thf);
Chris@42 3020 Thh = VADD(Thf, Thg);
Chris@42 3021 Thl = VSUB(Th9, Th6);
Chris@42 3022 }
Chris@42 3023 {
Chris@42 3024 V TgF, TgQ, Thn, Thq;
Chris@42 3025 TgF = VADD(Tgp, TgE);
Chris@42 3026 TgQ = VBYI(VADD(TgM, TgP));
Chris@42 3027 ST(&(xo[WS(os, 118)]), VSUB(TgF, TgQ), ovs, &(xo[0]));
Chris@42 3028 ST(&(xo[WS(os, 10)]), VADD(TgF, TgQ), ovs, &(xo[0]));
Chris@42 3029 Thn = VBYI(VSUB(Thl, Thm));
Chris@42 3030 Thq = VSUB(Tho, Thp);
Chris@42 3031 ST(&(xo[WS(os, 38)]), VADD(Thn, Thq), ovs, &(xo[0]));
Chris@42 3032 ST(&(xo[WS(os, 90)]), VSUB(Thq, Thn), ovs, &(xo[0]));
Chris@42 3033 }
Chris@42 3034 {
Chris@42 3035 V Thr, Ths, TgR, TgS;
Chris@42 3036 Thr = VBYI(VADD(Thm, Thl));
Chris@42 3037 Ths = VADD(Tho, Thp);
Chris@42 3038 ST(&(xo[WS(os, 26)]), VADD(Thr, Ths), ovs, &(xo[0]));
Chris@42 3039 ST(&(xo[WS(os, 102)]), VSUB(Ths, Thr), ovs, &(xo[0]));
Chris@42 3040 TgR = VSUB(Tgp, TgE);
Chris@42 3041 TgS = VBYI(VSUB(TgP, TgM));
Chris@42 3042 ST(&(xo[WS(os, 74)]), VSUB(TgR, TgS), ovs, &(xo[0]));
Chris@42 3043 ST(&(xo[WS(os, 54)]), VADD(TgR, TgS), ovs, &(xo[0]));
Chris@42 3044 }
Chris@42 3045 {
Chris@42 3046 V TgV, TgY, Thb, Thi;
Chris@42 3047 TgV = VBYI(VSUB(TgT, TgU));
Chris@42 3048 TgY = VSUB(TgW, TgX);
Chris@42 3049 ST(&(xo[WS(os, 42)]), VADD(TgV, TgY), ovs, &(xo[0]));
Chris@42 3050 ST(&(xo[WS(os, 86)]), VSUB(TgY, TgV), ovs, &(xo[0]));
Chris@42 3051 Thb = VADD(Th3, Tha);
Chris@42 3052 Thi = VBYI(VADD(The, Thh));
Chris@42 3053 ST(&(xo[WS(os, 122)]), VSUB(Thb, Thi), ovs, &(xo[0]));
Chris@42 3054 ST(&(xo[WS(os, 6)]), VADD(Thb, Thi), ovs, &(xo[0]));
Chris@42 3055 }
Chris@42 3056 {
Chris@42 3057 V Thj, Thk, TgZ, Th0;
Chris@42 3058 Thj = VSUB(Th3, Tha);
Chris@42 3059 Thk = VBYI(VSUB(Thh, The));
Chris@42 3060 ST(&(xo[WS(os, 70)]), VSUB(Thj, Thk), ovs, &(xo[0]));
Chris@42 3061 ST(&(xo[WS(os, 58)]), VADD(Thj, Thk), ovs, &(xo[0]));
Chris@42 3062 TgZ = VBYI(VADD(TgU, TgT));
Chris@42 3063 Th0 = VADD(TgW, TgX);
Chris@42 3064 ST(&(xo[WS(os, 22)]), VADD(TgZ, Th0), ovs, &(xo[0]));
Chris@42 3065 ST(&(xo[WS(os, 106)]), VSUB(Th0, TgZ), ovs, &(xo[0]));
Chris@42 3066 }
Chris@42 3067 }
Chris@42 3068 {
Chris@42 3069 V T80, T8n, T8f, T8j, T8A, T8P, T8H, T8L, T7n, T8M, T8O, T8c, T8k, T8t, T8E;
Chris@42 3070 V T8m;
Chris@42 3071 {
Chris@42 3072 V T7G, T8d, T7Z, T8e;
Chris@42 3073 {
Chris@42 3074 V T7y, T7F, T7R, T7Y;
Chris@42 3075 T7y = VADD(T7q, T7x);
Chris@42 3076 T7F = VADD(T7B, T7E);
Chris@42 3077 T7G = VFMA(LDK(KP989176509), T7y, VMUL(LDK(KP146730474), T7F));
Chris@42 3078 T8d = VFNMS(LDK(KP146730474), T7y, VMUL(LDK(KP989176509), T7F));
Chris@42 3079 T7R = VADD(T7J, T7Q);
Chris@42 3080 T7Y = VADD(T7U, T7X);
Chris@42 3081 T7Z = VFNMS(LDK(KP146730474), T7Y, VMUL(LDK(KP989176509), T7R));
Chris@42 3082 T8e = VFMA(LDK(KP146730474), T7R, VMUL(LDK(KP989176509), T7Y));
Chris@42 3083 }
Chris@42 3084 T80 = VADD(T7G, T7Z);
Chris@42 3085 T8n = VSUB(T8e, T8d);
Chris@42 3086 T8f = VADD(T8d, T8e);
Chris@42 3087 T8j = VSUB(T7Z, T7G);
Chris@42 3088 }
Chris@42 3089 {
Chris@42 3090 V T8w, T8F, T8z, T8G;
Chris@42 3091 {
Chris@42 3092 V T8u, T8v, T8x, T8y;
Chris@42 3093 T8u = VSUB(T7q, T7x);
Chris@42 3094 T8v = VSUB(T7E, T7B);
Chris@42 3095 T8w = VFMA(LDK(KP803207531), T8u, VMUL(LDK(KP595699304), T8v));
Chris@42 3096 T8F = VFNMS(LDK(KP595699304), T8u, VMUL(LDK(KP803207531), T8v));
Chris@42 3097 T8x = VSUB(T7J, T7Q);
Chris@42 3098 T8y = VSUB(T7X, T7U);
Chris@42 3099 T8z = VFNMS(LDK(KP595699304), T8y, VMUL(LDK(KP803207531), T8x));
Chris@42 3100 T8G = VFMA(LDK(KP595699304), T8x, VMUL(LDK(KP803207531), T8y));
Chris@42 3101 }
Chris@42 3102 T8A = VADD(T8w, T8z);
Chris@42 3103 T8P = VSUB(T8G, T8F);
Chris@42 3104 T8H = VADD(T8F, T8G);
Chris@42 3105 T8L = VSUB(T8z, T8w);
Chris@42 3106 }
Chris@42 3107 {
Chris@42 3108 V T77, T8r, T88, T8C, T7m, T8D, T8b, T8s, T76, T87;
Chris@42 3109 T76 = VADD(T72, T75);
Chris@42 3110 T77 = VADD(T6Z, T76);
Chris@42 3111 T8r = VSUB(T6Z, T76);
Chris@42 3112 T87 = VADD(T85, T86);
Chris@42 3113 T88 = VADD(T84, T87);
Chris@42 3114 T8C = VSUB(T87, T84);
Chris@42 3115 {
Chris@42 3116 V T7e, T7l, T89, T8a;
Chris@42 3117 T7e = VFMA(LDK(KP956940335), T7a, VMUL(LDK(KP290284677), T7d));
Chris@42 3118 T7l = VFNMS(LDK(KP290284677), T7k, VMUL(LDK(KP956940335), T7h));
Chris@42 3119 T7m = VADD(T7e, T7l);
Chris@42 3120 T8D = VSUB(T7l, T7e);
Chris@42 3121 T89 = VFNMS(LDK(KP290284677), T7a, VMUL(LDK(KP956940335), T7d));
Chris@42 3122 T8a = VFMA(LDK(KP290284677), T7h, VMUL(LDK(KP956940335), T7k));
Chris@42 3123 T8b = VADD(T89, T8a);
Chris@42 3124 T8s = VSUB(T8a, T89);
Chris@42 3125 }
Chris@42 3126 T7n = VADD(T77, T7m);
Chris@42 3127 T8M = VSUB(T8D, T8C);
Chris@42 3128 T8O = VSUB(T8r, T8s);
Chris@42 3129 T8c = VADD(T88, T8b);
Chris@42 3130 T8k = VSUB(T8b, T88);
Chris@42 3131 T8t = VADD(T8r, T8s);
Chris@42 3132 T8E = VADD(T8C, T8D);
Chris@42 3133 T8m = VSUB(T77, T7m);
Chris@42 3134 }
Chris@42 3135 {
Chris@42 3136 V T81, T8g, T8N, T8Q;
Chris@42 3137 T81 = VADD(T7n, T80);
Chris@42 3138 T8g = VBYI(VADD(T8c, T8f));
Chris@42 3139 ST(&(xo[WS(os, 125)]), VSUB(T81, T8g), ovs, &(xo[WS(os, 1)]));
Chris@42 3140 ST(&(xo[WS(os, 3)]), VADD(T81, T8g), ovs, &(xo[WS(os, 1)]));
Chris@42 3141 T8N = VBYI(VSUB(T8L, T8M));
Chris@42 3142 T8Q = VSUB(T8O, T8P);
Chris@42 3143 ST(&(xo[WS(os, 45)]), VADD(T8N, T8Q), ovs, &(xo[WS(os, 1)]));
Chris@42 3144 ST(&(xo[WS(os, 83)]), VSUB(T8Q, T8N), ovs, &(xo[WS(os, 1)]));
Chris@42 3145 }
Chris@42 3146 {
Chris@42 3147 V T8R, T8S, T8h, T8i;
Chris@42 3148 T8R = VBYI(VADD(T8M, T8L));
Chris@42 3149 T8S = VADD(T8O, T8P);
Chris@42 3150 ST(&(xo[WS(os, 19)]), VADD(T8R, T8S), ovs, &(xo[WS(os, 1)]));
Chris@42 3151 ST(&(xo[WS(os, 109)]), VSUB(T8S, T8R), ovs, &(xo[WS(os, 1)]));
Chris@42 3152 T8h = VSUB(T7n, T80);
Chris@42 3153 T8i = VBYI(VSUB(T8f, T8c));
Chris@42 3154 ST(&(xo[WS(os, 67)]), VSUB(T8h, T8i), ovs, &(xo[WS(os, 1)]));
Chris@42 3155 ST(&(xo[WS(os, 61)]), VADD(T8h, T8i), ovs, &(xo[WS(os, 1)]));
Chris@42 3156 }
Chris@42 3157 {
Chris@42 3158 V T8l, T8o, T8B, T8I;
Chris@42 3159 T8l = VBYI(VSUB(T8j, T8k));
Chris@42 3160 T8o = VSUB(T8m, T8n);
Chris@42 3161 ST(&(xo[WS(os, 35)]), VADD(T8l, T8o), ovs, &(xo[WS(os, 1)]));
Chris@42 3162 ST(&(xo[WS(os, 93)]), VSUB(T8o, T8l), ovs, &(xo[WS(os, 1)]));
Chris@42 3163 T8B = VADD(T8t, T8A);
Chris@42 3164 T8I = VBYI(VADD(T8E, T8H));
Chris@42 3165 ST(&(xo[WS(os, 115)]), VSUB(T8B, T8I), ovs, &(xo[WS(os, 1)]));
Chris@42 3166 ST(&(xo[WS(os, 13)]), VADD(T8B, T8I), ovs, &(xo[WS(os, 1)]));
Chris@42 3167 }
Chris@42 3168 {
Chris@42 3169 V T8J, T8K, T8p, T8q;
Chris@42 3170 T8J = VSUB(T8t, T8A);
Chris@42 3171 T8K = VBYI(VSUB(T8H, T8E));
Chris@42 3172 ST(&(xo[WS(os, 77)]), VSUB(T8J, T8K), ovs, &(xo[WS(os, 1)]));
Chris@42 3173 ST(&(xo[WS(os, 51)]), VADD(T8J, T8K), ovs, &(xo[WS(os, 1)]));
Chris@42 3174 T8p = VBYI(VADD(T8k, T8j));
Chris@42 3175 T8q = VADD(T8m, T8n);
Chris@42 3176 ST(&(xo[WS(os, 29)]), VADD(T8p, T8q), ovs, &(xo[WS(os, 1)]));
Chris@42 3177 ST(&(xo[WS(os, 99)]), VSUB(T8q, T8p), ovs, &(xo[WS(os, 1)]));
Chris@42 3178 }
Chris@42 3179 }
Chris@42 3180 {
Chris@42 3181 V T4K, T5d, T55, T59, T5q, T5F, T5x, T5B, T2f, T5C, T5E, T52, T5a, T5j, T5u;
Chris@42 3182 V T5c;
Chris@42 3183 {
Chris@42 3184 V T3u, T53, T4J, T54;
Chris@42 3185 {
Chris@42 3186 V T3g, T3t, T4v, T4I;
Chris@42 3187 T3g = VADD(T2G, T3f);
Chris@42 3188 T3t = VADD(T3p, T3s);
Chris@42 3189 T3u = VFMA(LDK(KP998795456), T3g, VMUL(LDK(KP049067674), T3t));
Chris@42 3190 T53 = VFNMS(LDK(KP049067674), T3g, VMUL(LDK(KP998795456), T3t));
Chris@42 3191 T4v = VADD(T3V, T4u);
Chris@42 3192 T4I = VADD(T4E, T4H);
Chris@42 3193 T4J = VFNMS(LDK(KP049067674), T4I, VMUL(LDK(KP998795456), T4v));
Chris@42 3194 T54 = VFMA(LDK(KP049067674), T4v, VMUL(LDK(KP998795456), T4I));
Chris@42 3195 }
Chris@42 3196 T4K = VADD(T3u, T4J);
Chris@42 3197 T5d = VSUB(T54, T53);
Chris@42 3198 T55 = VADD(T53, T54);
Chris@42 3199 T59 = VSUB(T4J, T3u);
Chris@42 3200 }
Chris@42 3201 {
Chris@42 3202 V T5m, T5v, T5p, T5w;
Chris@42 3203 {
Chris@42 3204 V T5k, T5l, T5n, T5o;
Chris@42 3205 T5k = VSUB(T2G, T3f);
Chris@42 3206 T5l = VSUB(T3s, T3p);
Chris@42 3207 T5m = VFMA(LDK(KP740951125), T5k, VMUL(LDK(KP671558954), T5l));
Chris@42 3208 T5v = VFNMS(LDK(KP671558954), T5k, VMUL(LDK(KP740951125), T5l));
Chris@42 3209 T5n = VSUB(T3V, T4u);
Chris@42 3210 T5o = VSUB(T4H, T4E);
Chris@42 3211 T5p = VFNMS(LDK(KP671558954), T5o, VMUL(LDK(KP740951125), T5n));
Chris@42 3212 T5w = VFMA(LDK(KP671558954), T5n, VMUL(LDK(KP740951125), T5o));
Chris@42 3213 }
Chris@42 3214 T5q = VADD(T5m, T5p);
Chris@42 3215 T5F = VSUB(T5w, T5v);
Chris@42 3216 T5x = VADD(T5v, T5w);
Chris@42 3217 T5B = VSUB(T5p, T5m);
Chris@42 3218 }
Chris@42 3219 {
Chris@42 3220 V T11, T5h, T4Y, T5s, T2e, T5t, T51, T5i, T10, T4X;
Chris@42 3221 T10 = VADD(TI, TZ);
Chris@42 3222 T11 = VADD(Tr, T10);
Chris@42 3223 T5h = VSUB(Tr, T10);
Chris@42 3224 T4X = VADD(T4V, T4W);
Chris@42 3225 T4Y = VADD(T4U, T4X);
Chris@42 3226 T5s = VSUB(T4X, T4U);
Chris@42 3227 {
Chris@42 3228 V T1C, T2d, T4Z, T50;
Chris@42 3229 T1C = VFMA(LDK(KP098017140), T1s, VMUL(LDK(KP995184726), T1B));
Chris@42 3230 T2d = VFNMS(LDK(KP098017140), T2c, VMUL(LDK(KP995184726), T23));
Chris@42 3231 T2e = VADD(T1C, T2d);
Chris@42 3232 T5t = VSUB(T2d, T1C);
Chris@42 3233 T4Z = VFNMS(LDK(KP098017140), T1B, VMUL(LDK(KP995184726), T1s));
Chris@42 3234 T50 = VFMA(LDK(KP995184726), T2c, VMUL(LDK(KP098017140), T23));
Chris@42 3235 T51 = VADD(T4Z, T50);
Chris@42 3236 T5i = VSUB(T50, T4Z);
Chris@42 3237 }
Chris@42 3238 T2f = VADD(T11, T2e);
Chris@42 3239 T5C = VSUB(T5t, T5s);
Chris@42 3240 T5E = VSUB(T5h, T5i);
Chris@42 3241 T52 = VADD(T4Y, T51);
Chris@42 3242 T5a = VSUB(T51, T4Y);
Chris@42 3243 T5j = VADD(T5h, T5i);
Chris@42 3244 T5u = VADD(T5s, T5t);
Chris@42 3245 T5c = VSUB(T11, T2e);
Chris@42 3246 }
Chris@42 3247 {
Chris@42 3248 V T4L, T56, T5D, T5G;
Chris@42 3249 T4L = VADD(T2f, T4K);
Chris@42 3250 T56 = VBYI(VADD(T52, T55));
Chris@42 3251 ST(&(xo[WS(os, 127)]), VSUB(T4L, T56), ovs, &(xo[WS(os, 1)]));
Chris@42 3252 ST(&(xo[WS(os, 1)]), VADD(T4L, T56), ovs, &(xo[WS(os, 1)]));
Chris@42 3253 T5D = VBYI(VSUB(T5B, T5C));
Chris@42 3254 T5G = VSUB(T5E, T5F);
Chris@42 3255 ST(&(xo[WS(os, 47)]), VADD(T5D, T5G), ovs, &(xo[WS(os, 1)]));
Chris@42 3256 ST(&(xo[WS(os, 81)]), VSUB(T5G, T5D), ovs, &(xo[WS(os, 1)]));
Chris@42 3257 }
Chris@42 3258 {
Chris@42 3259 V T5H, T5I, T57, T58;
Chris@42 3260 T5H = VBYI(VADD(T5C, T5B));
Chris@42 3261 T5I = VADD(T5E, T5F);
Chris@42 3262 ST(&(xo[WS(os, 17)]), VADD(T5H, T5I), ovs, &(xo[WS(os, 1)]));
Chris@42 3263 ST(&(xo[WS(os, 111)]), VSUB(T5I, T5H), ovs, &(xo[WS(os, 1)]));
Chris@42 3264 T57 = VSUB(T2f, T4K);
Chris@42 3265 T58 = VBYI(VSUB(T55, T52));
Chris@42 3266 ST(&(xo[WS(os, 65)]), VSUB(T57, T58), ovs, &(xo[WS(os, 1)]));
Chris@42 3267 ST(&(xo[WS(os, 63)]), VADD(T57, T58), ovs, &(xo[WS(os, 1)]));
Chris@42 3268 }
Chris@42 3269 {
Chris@42 3270 V T5b, T5e, T5r, T5y;
Chris@42 3271 T5b = VBYI(VSUB(T59, T5a));
Chris@42 3272 T5e = VSUB(T5c, T5d);
Chris@42 3273 ST(&(xo[WS(os, 33)]), VADD(T5b, T5e), ovs, &(xo[WS(os, 1)]));
Chris@42 3274 ST(&(xo[WS(os, 95)]), VSUB(T5e, T5b), ovs, &(xo[WS(os, 1)]));
Chris@42 3275 T5r = VADD(T5j, T5q);
Chris@42 3276 T5y = VBYI(VADD(T5u, T5x));
Chris@42 3277 ST(&(xo[WS(os, 113)]), VSUB(T5r, T5y), ovs, &(xo[WS(os, 1)]));
Chris@42 3278 ST(&(xo[WS(os, 15)]), VADD(T5r, T5y), ovs, &(xo[WS(os, 1)]));
Chris@42 3279 }
Chris@42 3280 {
Chris@42 3281 V T5z, T5A, T5f, T5g;
Chris@42 3282 T5z = VSUB(T5j, T5q);
Chris@42 3283 T5A = VBYI(VSUB(T5x, T5u));
Chris@42 3284 ST(&(xo[WS(os, 79)]), VSUB(T5z, T5A), ovs, &(xo[WS(os, 1)]));
Chris@42 3285 ST(&(xo[WS(os, 49)]), VADD(T5z, T5A), ovs, &(xo[WS(os, 1)]));
Chris@42 3286 T5f = VBYI(VADD(T5a, T59));
Chris@42 3287 T5g = VADD(T5c, T5d);
Chris@42 3288 ST(&(xo[WS(os, 31)]), VADD(T5f, T5g), ovs, &(xo[WS(os, 1)]));
Chris@42 3289 ST(&(xo[WS(os, 97)]), VSUB(T5g, T5f), ovs, &(xo[WS(os, 1)]));
Chris@42 3290 }
Chris@42 3291 }
Chris@42 3292 {
Chris@42 3293 V T9i, T9B, T9t, T9x, T9O, Ta3, T9V, T9Z, T93, Ta0, Ta2, T9q, T9y, T9H, T9S;
Chris@42 3294 V T9A;
Chris@42 3295 {
Chris@42 3296 V T9a, T9r, T9h, T9s;
Chris@42 3297 {
Chris@42 3298 V T96, T99, T9d, T9g;
Chris@42 3299 T96 = VSUB(T94, T95);
Chris@42 3300 T99 = VSUB(T97, T98);
Chris@42 3301 T9a = VFMA(LDK(KP514102744), T96, VMUL(LDK(KP857728610), T99));
Chris@42 3302 T9r = VFNMS(LDK(KP514102744), T99, VMUL(LDK(KP857728610), T96));
Chris@42 3303 T9d = VSUB(T9b, T9c);
Chris@42 3304 T9g = VSUB(T9e, T9f);
Chris@42 3305 T9h = VFNMS(LDK(KP514102744), T9g, VMUL(LDK(KP857728610), T9d));
Chris@42 3306 T9s = VFMA(LDK(KP857728610), T9g, VMUL(LDK(KP514102744), T9d));
Chris@42 3307 }
Chris@42 3308 T9i = VADD(T9a, T9h);
Chris@42 3309 T9B = VSUB(T9s, T9r);
Chris@42 3310 T9t = VADD(T9r, T9s);
Chris@42 3311 T9x = VSUB(T9h, T9a);
Chris@42 3312 }
Chris@42 3313 {
Chris@42 3314 V T9K, T9T, T9N, T9U;
Chris@42 3315 {
Chris@42 3316 V T9I, T9J, T9L, T9M;
Chris@42 3317 T9I = VADD(T95, T94);
Chris@42 3318 T9J = VADD(T97, T98);
Chris@42 3319 T9K = VFMA(LDK(KP242980179), T9I, VMUL(LDK(KP970031253), T9J));
Chris@42 3320 T9T = VFNMS(LDK(KP242980179), T9J, VMUL(LDK(KP970031253), T9I));
Chris@42 3321 T9L = VADD(T9b, T9c);
Chris@42 3322 T9M = VADD(T9f, T9e);
Chris@42 3323 T9N = VFNMS(LDK(KP242980179), T9M, VMUL(LDK(KP970031253), T9L));
Chris@42 3324 T9U = VFMA(LDK(KP970031253), T9M, VMUL(LDK(KP242980179), T9L));
Chris@42 3325 }
Chris@42 3326 T9O = VADD(T9K, T9N);
Chris@42 3327 Ta3 = VSUB(T9U, T9T);
Chris@42 3328 T9V = VADD(T9T, T9U);
Chris@42 3329 T9Z = VSUB(T9N, T9K);
Chris@42 3330 }
Chris@42 3331 {
Chris@42 3332 V T8V, T9F, T9m, T9Q, T92, T9R, T9p, T9G, T8U, T9k;
Chris@42 3333 T8U = VSUB(T86, T85);
Chris@42 3334 T8V = VSUB(T8T, T8U);
Chris@42 3335 T9F = VADD(T8T, T8U);
Chris@42 3336 T9k = VSUB(T75, T72);
Chris@42 3337 T9m = VSUB(T9k, T9l);
Chris@42 3338 T9Q = VADD(T9l, T9k);
Chris@42 3339 {
Chris@42 3340 V T8Y, T91, T9n, T9o;
Chris@42 3341 T8Y = VFMA(LDK(KP471396736), T8W, VMUL(LDK(KP881921264), T8X));
Chris@42 3342 T91 = VFNMS(LDK(KP471396736), T90, VMUL(LDK(KP881921264), T8Z));
Chris@42 3343 T92 = VSUB(T8Y, T91);
Chris@42 3344 T9R = VADD(T91, T8Y);
Chris@42 3345 T9n = VFNMS(LDK(KP471396736), T8X, VMUL(LDK(KP881921264), T8W));
Chris@42 3346 T9o = VFMA(LDK(KP881921264), T90, VMUL(LDK(KP471396736), T8Z));
Chris@42 3347 T9p = VSUB(T9n, T9o);
Chris@42 3348 T9G = VADD(T9o, T9n);
Chris@42 3349 }
Chris@42 3350 T93 = VADD(T8V, T92);
Chris@42 3351 Ta0 = VSUB(T9R, T9Q);
Chris@42 3352 Ta2 = VSUB(T9F, T9G);
Chris@42 3353 T9q = VADD(T9m, T9p);
Chris@42 3354 T9y = VSUB(T9p, T9m);
Chris@42 3355 T9H = VADD(T9F, T9G);
Chris@42 3356 T9S = VADD(T9Q, T9R);
Chris@42 3357 T9A = VSUB(T8V, T92);
Chris@42 3358 }
Chris@42 3359 {
Chris@42 3360 V T9j, T9u, Ta1, Ta4;
Chris@42 3361 T9j = VADD(T93, T9i);
Chris@42 3362 T9u = VBYI(VADD(T9q, T9t));
Chris@42 3363 ST(&(xo[WS(os, 117)]), VSUB(T9j, T9u), ovs, &(xo[WS(os, 1)]));
Chris@42 3364 ST(&(xo[WS(os, 11)]), VADD(T9j, T9u), ovs, &(xo[WS(os, 1)]));
Chris@42 3365 Ta1 = VBYI(VSUB(T9Z, Ta0));
Chris@42 3366 Ta4 = VSUB(Ta2, Ta3);
Chris@42 3367 ST(&(xo[WS(os, 37)]), VADD(Ta1, Ta4), ovs, &(xo[WS(os, 1)]));
Chris@42 3368 ST(&(xo[WS(os, 91)]), VSUB(Ta4, Ta1), ovs, &(xo[WS(os, 1)]));
Chris@42 3369 }
Chris@42 3370 {
Chris@42 3371 V Ta5, Ta6, T9v, T9w;
Chris@42 3372 Ta5 = VBYI(VADD(Ta0, T9Z));
Chris@42 3373 Ta6 = VADD(Ta2, Ta3);
Chris@42 3374 ST(&(xo[WS(os, 27)]), VADD(Ta5, Ta6), ovs, &(xo[WS(os, 1)]));
Chris@42 3375 ST(&(xo[WS(os, 101)]), VSUB(Ta6, Ta5), ovs, &(xo[WS(os, 1)]));
Chris@42 3376 T9v = VSUB(T93, T9i);
Chris@42 3377 T9w = VBYI(VSUB(T9t, T9q));
Chris@42 3378 ST(&(xo[WS(os, 75)]), VSUB(T9v, T9w), ovs, &(xo[WS(os, 1)]));
Chris@42 3379 ST(&(xo[WS(os, 53)]), VADD(T9v, T9w), ovs, &(xo[WS(os, 1)]));
Chris@42 3380 }
Chris@42 3381 {
Chris@42 3382 V T9z, T9C, T9P, T9W;
Chris@42 3383 T9z = VBYI(VSUB(T9x, T9y));
Chris@42 3384 T9C = VSUB(T9A, T9B);
Chris@42 3385 ST(&(xo[WS(os, 43)]), VADD(T9z, T9C), ovs, &(xo[WS(os, 1)]));
Chris@42 3386 ST(&(xo[WS(os, 85)]), VSUB(T9C, T9z), ovs, &(xo[WS(os, 1)]));
Chris@42 3387 T9P = VADD(T9H, T9O);
Chris@42 3388 T9W = VBYI(VADD(T9S, T9V));
Chris@42 3389 ST(&(xo[WS(os, 123)]), VSUB(T9P, T9W), ovs, &(xo[WS(os, 1)]));
Chris@42 3390 ST(&(xo[WS(os, 5)]), VADD(T9P, T9W), ovs, &(xo[WS(os, 1)]));
Chris@42 3391 }
Chris@42 3392 {
Chris@42 3393 V T9X, T9Y, T9D, T9E;
Chris@42 3394 T9X = VSUB(T9H, T9O);
Chris@42 3395 T9Y = VBYI(VSUB(T9V, T9S));
Chris@42 3396 ST(&(xo[WS(os, 69)]), VSUB(T9X, T9Y), ovs, &(xo[WS(os, 1)]));
Chris@42 3397 ST(&(xo[WS(os, 59)]), VADD(T9X, T9Y), ovs, &(xo[WS(os, 1)]));
Chris@42 3398 T9D = VBYI(VADD(T9y, T9x));
Chris@42 3399 T9E = VADD(T9A, T9B);
Chris@42 3400 ST(&(xo[WS(os, 21)]), VADD(T9D, T9E), ovs, &(xo[WS(os, 1)]));
Chris@42 3401 ST(&(xo[WS(os, 107)]), VSUB(T9E, T9D), ovs, &(xo[WS(os, 1)]));
Chris@42 3402 }
Chris@42 3403 }
Chris@42 3404 {
Chris@42 3405 V T68, T6r, T6j, T6n, T6E, T6T, T6L, T6P, T5T, T6Q, T6S, T6g, T6o, T6x, T6I;
Chris@42 3406 V T6q;
Chris@42 3407 {
Chris@42 3408 V T60, T6h, T67, T6i;
Chris@42 3409 {
Chris@42 3410 V T5W, T5Z, T63, T66;
Chris@42 3411 T5W = VSUB(T5U, T5V);
Chris@42 3412 T5Z = VSUB(T5X, T5Y);
Chris@42 3413 T60 = VFMA(LDK(KP427555093), T5W, VMUL(LDK(KP903989293), T5Z));
Chris@42 3414 T6h = VFNMS(LDK(KP427555093), T5Z, VMUL(LDK(KP903989293), T5W));
Chris@42 3415 T63 = VSUB(T61, T62);
Chris@42 3416 T66 = VSUB(T64, T65);
Chris@42 3417 T67 = VFNMS(LDK(KP427555093), T66, VMUL(LDK(KP903989293), T63));
Chris@42 3418 T6i = VFMA(LDK(KP903989293), T66, VMUL(LDK(KP427555093), T63));
Chris@42 3419 }
Chris@42 3420 T68 = VADD(T60, T67);
Chris@42 3421 T6r = VSUB(T6i, T6h);
Chris@42 3422 T6j = VADD(T6h, T6i);
Chris@42 3423 T6n = VSUB(T67, T60);
Chris@42 3424 }
Chris@42 3425 {
Chris@42 3426 V T6A, T6J, T6D, T6K;
Chris@42 3427 {
Chris@42 3428 V T6y, T6z, T6B, T6C;
Chris@42 3429 T6y = VADD(T5V, T5U);
Chris@42 3430 T6z = VADD(T5X, T5Y);
Chris@42 3431 T6A = VFMA(LDK(KP336889853), T6y, VMUL(LDK(KP941544065), T6z));
Chris@42 3432 T6J = VFNMS(LDK(KP336889853), T6z, VMUL(LDK(KP941544065), T6y));
Chris@42 3433 T6B = VADD(T61, T62);
Chris@42 3434 T6C = VADD(T65, T64);
Chris@42 3435 T6D = VFNMS(LDK(KP336889853), T6C, VMUL(LDK(KP941544065), T6B));
Chris@42 3436 T6K = VFMA(LDK(KP941544065), T6C, VMUL(LDK(KP336889853), T6B));
Chris@42 3437 }
Chris@42 3438 T6E = VADD(T6A, T6D);
Chris@42 3439 T6T = VSUB(T6K, T6J);
Chris@42 3440 T6L = VADD(T6J, T6K);
Chris@42 3441 T6P = VSUB(T6D, T6A);
Chris@42 3442 }
Chris@42 3443 {
Chris@42 3444 V T5L, T6v, T6c, T6G, T5S, T6H, T6f, T6w, T5K, T6a;
Chris@42 3445 T5K = VSUB(T4W, T4V);
Chris@42 3446 T5L = VSUB(T5J, T5K);
Chris@42 3447 T6v = VADD(T5J, T5K);
Chris@42 3448 T6a = VSUB(TZ, TI);
Chris@42 3449 T6c = VSUB(T6a, T6b);
Chris@42 3450 T6G = VADD(T6b, T6a);
Chris@42 3451 {
Chris@42 3452 V T5O, T5R, T6d, T6e;
Chris@42 3453 T5O = VFMA(LDK(KP773010453), T5M, VMUL(LDK(KP634393284), T5N));
Chris@42 3454 T5R = VFNMS(LDK(KP634393284), T5Q, VMUL(LDK(KP773010453), T5P));
Chris@42 3455 T5S = VSUB(T5O, T5R);
Chris@42 3456 T6H = VADD(T5R, T5O);
Chris@42 3457 T6d = VFNMS(LDK(KP634393284), T5M, VMUL(LDK(KP773010453), T5N));
Chris@42 3458 T6e = VFMA(LDK(KP634393284), T5P, VMUL(LDK(KP773010453), T5Q));
Chris@42 3459 T6f = VSUB(T6d, T6e);
Chris@42 3460 T6w = VADD(T6e, T6d);
Chris@42 3461 }
Chris@42 3462 T5T = VADD(T5L, T5S);
Chris@42 3463 T6Q = VSUB(T6H, T6G);
Chris@42 3464 T6S = VSUB(T6v, T6w);
Chris@42 3465 T6g = VADD(T6c, T6f);
Chris@42 3466 T6o = VSUB(T6f, T6c);
Chris@42 3467 T6x = VADD(T6v, T6w);
Chris@42 3468 T6I = VADD(T6G, T6H);
Chris@42 3469 T6q = VSUB(T5L, T5S);
Chris@42 3470 }
Chris@42 3471 {
Chris@42 3472 V T69, T6k, T6R, T6U;
Chris@42 3473 T69 = VADD(T5T, T68);
Chris@42 3474 T6k = VBYI(VADD(T6g, T6j));
Chris@42 3475 ST(&(xo[WS(os, 119)]), VSUB(T69, T6k), ovs, &(xo[WS(os, 1)]));
Chris@42 3476 ST(&(xo[WS(os, 9)]), VADD(T69, T6k), ovs, &(xo[WS(os, 1)]));
Chris@42 3477 T6R = VBYI(VSUB(T6P, T6Q));
Chris@42 3478 T6U = VSUB(T6S, T6T);
Chris@42 3479 ST(&(xo[WS(os, 39)]), VADD(T6R, T6U), ovs, &(xo[WS(os, 1)]));
Chris@42 3480 ST(&(xo[WS(os, 89)]), VSUB(T6U, T6R), ovs, &(xo[WS(os, 1)]));
Chris@42 3481 }
Chris@42 3482 {
Chris@42 3483 V T6V, T6W, T6l, T6m;
Chris@42 3484 T6V = VBYI(VADD(T6Q, T6P));
Chris@42 3485 T6W = VADD(T6S, T6T);
Chris@42 3486 ST(&(xo[WS(os, 25)]), VADD(T6V, T6W), ovs, &(xo[WS(os, 1)]));
Chris@42 3487 ST(&(xo[WS(os, 103)]), VSUB(T6W, T6V), ovs, &(xo[WS(os, 1)]));
Chris@42 3488 T6l = VSUB(T5T, T68);
Chris@42 3489 T6m = VBYI(VSUB(T6j, T6g));
Chris@42 3490 ST(&(xo[WS(os, 73)]), VSUB(T6l, T6m), ovs, &(xo[WS(os, 1)]));
Chris@42 3491 ST(&(xo[WS(os, 55)]), VADD(T6l, T6m), ovs, &(xo[WS(os, 1)]));
Chris@42 3492 }
Chris@42 3493 {
Chris@42 3494 V T6p, T6s, T6F, T6M;
Chris@42 3495 T6p = VBYI(VSUB(T6n, T6o));
Chris@42 3496 T6s = VSUB(T6q, T6r);
Chris@42 3497 ST(&(xo[WS(os, 41)]), VADD(T6p, T6s), ovs, &(xo[WS(os, 1)]));
Chris@42 3498 ST(&(xo[WS(os, 87)]), VSUB(T6s, T6p), ovs, &(xo[WS(os, 1)]));
Chris@42 3499 T6F = VADD(T6x, T6E);
Chris@42 3500 T6M = VBYI(VADD(T6I, T6L));
Chris@42 3501 ST(&(xo[WS(os, 121)]), VSUB(T6F, T6M), ovs, &(xo[WS(os, 1)]));
Chris@42 3502 ST(&(xo[WS(os, 7)]), VADD(T6F, T6M), ovs, &(xo[WS(os, 1)]));
Chris@42 3503 }
Chris@42 3504 {
Chris@42 3505 V T6N, T6O, T6t, T6u;
Chris@42 3506 T6N = VSUB(T6x, T6E);
Chris@42 3507 T6O = VBYI(VSUB(T6L, T6I));
Chris@42 3508 ST(&(xo[WS(os, 71)]), VSUB(T6N, T6O), ovs, &(xo[WS(os, 1)]));
Chris@42 3509 ST(&(xo[WS(os, 57)]), VADD(T6N, T6O), ovs, &(xo[WS(os, 1)]));
Chris@42 3510 T6t = VBYI(VADD(T6o, T6n));
Chris@42 3511 T6u = VADD(T6q, T6r);
Chris@42 3512 ST(&(xo[WS(os, 23)]), VADD(T6t, T6u), ovs, &(xo[WS(os, 1)]));
Chris@42 3513 ST(&(xo[WS(os, 105)]), VSUB(T6u, T6t), ovs, &(xo[WS(os, 1)]));
Chris@42 3514 }
Chris@42 3515 }
Chris@42 3516 }
Chris@42 3517 }
Chris@42 3518 VLEAVE();
Chris@42 3519 }
Chris@42 3520
Chris@42 3521 static const kdft_desc desc = { 128, XSIMD_STRING("n1fv_128"), {938, 186, 144, 0}, &GENUS, 0, 0, 0, 0 }; /* Descriptor handed to kdft_register together with n1fv_128. The leading 128 matches the generator's "-n 128" and the string is the codelet name. NOTE(review): {938, 186, 144, 0} is presumably the operation-count tuple and the four trailing zeros presumably stride constraints -- confirm against the kdft_desc declaration in codelet-dft.h. */
Chris@42 3522
Chris@42 3523 void XSIMD(codelet_n1fv_128) (planner *p) { /* Registration entry point: passes the n1fv_128 codelet function and its descriptor to planner p. */
Chris@42 3524 X(kdft_register) (p, n1fv_128, &desc); /* desc is the file-scope kdft_desc defined just above this function */
Chris@42 3525 }
Chris@42 3526
Chris@42 3527 #endif /* HAVE_FMA */