annotate src/fftw-3.3.8/dft/simd/common/n1bv_128.c @ 83:ae30d91d2ffe

Replace these with versions built using an older toolset (so as to avoid ABI incompatibilities when linking on Ubuntu 14.04 for packaging purposes)
author Chris Cannam
date Fri, 07 Feb 2020 11:51:13 +0000
parents d0c2a83c1364
children
rev   line source
Chris@82 1 /*
Chris@82 2 * Copyright (c) 2003, 2007-14 Matteo Frigo
Chris@82 3 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
Chris@82 4 *
Chris@82 5 * This program is free software; you can redistribute it and/or modify
Chris@82 6 * it under the terms of the GNU General Public License as published by
Chris@82 7 * the Free Software Foundation; either version 2 of the License, or
Chris@82 8 * (at your option) any later version.
Chris@82 9 *
Chris@82 10 * This program is distributed in the hope that it will be useful,
Chris@82 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Chris@82 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
Chris@82 13 * GNU General Public License for more details.
Chris@82 14 *
Chris@82 15 * You should have received a copy of the GNU General Public License
Chris@82 16 * along with this program; if not, write to the Free Software
Chris@82 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Chris@82 18 *
Chris@82 19 */
Chris@82 20
Chris@82 21 /* This file was automatically generated --- DO NOT EDIT */
Chris@82 22 /* Generated on Thu May 24 08:05:00 EDT 2018 */
Chris@82 23
Chris@82 24 #include "dft/codelet-dft.h"
Chris@82 25
Chris@82 26 #if defined(ARCH_PREFERS_FMA) || defined(ISA_EXTENSION_PREFERS_FMA)
Chris@82 27
Chris@82 28 /* Generated by: ../../../genfft/gen_notw_c.native -fma -simd -compact -variables 4 -pipeline-latency 8 -sign 1 -n 128 -name n1bv_128 -include dft/simd/n1b.h */
Chris@82 29
Chris@82 30 /*
Chris@82 31 * This function contains 1082 FP additions, 642 FP multiplications,
Chris@82 32 * (or, 440 additions, 0 multiplications, 642 fused multiply/add),
Chris@82 33 * 194 stack variables, 31 constants, and 256 memory accesses
Chris@82 34 */
Chris@82 35 #include "dft/simd/n1b.h"
Chris@82 36
Chris@82 37 static void n1bv_128(const R *ri, const R *ii, R *ro, R *io, stride is, stride os, INT v, INT ivs, INT ovs)
Chris@82 38 {
Chris@82 39 DVK(KP941544065, +0.941544065183020778412509402599502357185589796);
Chris@82 40 DVK(KP903989293, +0.903989293123443331586200297230537048710132025);
Chris@82 41 DVK(KP357805721, +0.357805721314524104672487743774474392487532769);
Chris@82 42 DVK(KP472964775, +0.472964775891319928124438237972992463904131113);
Chris@82 43 DVK(KP970031253, +0.970031253194543992603984207286100251456865962);
Chris@82 44 DVK(KP857728610, +0.857728610000272069902269984284770137042490799);
Chris@82 45 DVK(KP250486960, +0.250486960191305461595702160124721208578685568);
Chris@82 46 DVK(KP599376933, +0.599376933681923766271389869014404232837890546);
Chris@82 47 DVK(KP740951125, +0.740951125354959091175616897495162729728955309);
Chris@82 48 DVK(KP998795456, +0.998795456205172392714771604759100694443203615);
Chris@82 49 DVK(KP906347169, +0.906347169019147157946142717268914412664134293);
Chris@82 50 DVK(KP049126849, +0.049126849769467254105343321271313617079695752);
Chris@82 51 DVK(KP803207531, +0.803207531480644909806676512963141923879569427);
Chris@82 52 DVK(KP989176509, +0.989176509964780973451673738016243063983689533);
Chris@82 53 DVK(KP741650546, +0.741650546272035369581266691172079863842265220);
Chris@82 54 DVK(KP148335987, +0.148335987538347428753676511486911367000625355);
Chris@82 55 DVK(KP956940335, +0.956940335732208864935797886980269969482849206);
Chris@82 56 DVK(KP881921264, +0.881921264348355029712756863660388349508442621);
Chris@82 57 DVK(KP303346683, +0.303346683607342391675883946941299872384187453);
Chris@82 58 DVK(KP534511135, +0.534511135950791641089685961295362908582039528);
Chris@82 59 DVK(KP773010453, +0.773010453362736960810906609758469800971041293);
Chris@82 60 DVK(KP995184726, +0.995184726672196886244836953109479921575474869);
Chris@82 61 DVK(KP820678790, +0.820678790828660330972281985331011598767386482);
Chris@82 62 DVK(KP098491403, +0.098491403357164253077197521291327432293052451);
Chris@82 63 DVK(KP831469612, +0.831469612302545237078788377617905756738560812);
Chris@82 64 DVK(KP980785280, +0.980785280403230449126182236134239036973933731);
Chris@82 65 DVK(KP668178637, +0.668178637919298919997757686523080761552472251);
Chris@82 66 DVK(KP198912367, +0.198912367379658006911597622644676228597850501);
Chris@82 67 DVK(KP923879532, +0.923879532511286756128183189396788286822416626);
Chris@82 68 DVK(KP707106781, +0.707106781186547524400844362104849039284835938);
Chris@82 69 DVK(KP414213562, +0.414213562373095048801688724209698078569671875);
Chris@82 70 {
Chris@82 71 INT i;
Chris@82 72 const R *xi;
Chris@82 73 R *xo;
Chris@82 74 xi = ii;
Chris@82 75 xo = io;
Chris@82 76 for (i = v; i > 0; i = i - VL, xi = xi + (VL * ivs), xo = xo + (VL * ovs), MAKE_VOLATILE_STRIDE(256, is), MAKE_VOLATILE_STRIDE(256, os)) {
Chris@82 77 V Tr, T5J, Ted, Tgf, Tfq, TgG, T4U, T6a, T6Z, T8T, Tad, TcZ, Tcc, Td0, T84;
Chris@82 78 V T9k, Tb6, Tbt, T2G, T5U, TeV, Tgt, T3p, T5X, T7B, T97, TeK, Tgq, T7q, T94;
Chris@82 79 V Td8, TdK, TbD, Tc0, T3V, T61, Tfg, TgA, T4E, T64, T7U, T9e, Tf5, Tgx, T7J;
Chris@82 80 V T9b, Tdf, TdN, Td2, Td3, TI, T4V, Tft, Tgg, TZ, T4W, T75, T86, Tek, TgH;
Chris@82 81 V T72, T85, Tas, Tcd, Tdm, Tdn, TdG, Teq, Tgj, Tet, Tgi, T1s, T5N, T1B, T5M;
Chris@82 82 V T7d, T8W, TaI, Tcf, T7a, T8X, Tdp, Tdq, TdH, Tez, Tgm, TeC, Tgl, T23, T5Q;
Chris@82 83 V T2c, T5P, T7k, T8Z, TaX, Tcg, T7h, T90, Tbl, Tbu, Tdb, TdL, TeY, Tgr, TeR;
Chris@82 84 V Tgu, T7x, T98, T7E, T95, T3f, T5Y, T3s, T5V, TbS, Tc1, Tdi, TdO, Tfj, Tgy;
Chris@82 85 V Tfc, TgB, T7Q, T9f, T7X, T9c, T4u, T65, T4H, T62;
Chris@82 86 {
Chris@82 87 V T3, Ta7, T4O, Ta8, Ta, Tab, T4P, Taa, Tc6, Tc7, Ti, Tea, T4R, Tc9, Tca;
Chris@82 88 V Tp, Teb, T4S;
Chris@82 89 {
Chris@82 90 V T1, T2, T4M, T4N;
Chris@82 91 T1 = LD(&(xi[0]), ivs, &(xi[0]));
Chris@82 92 T2 = LD(&(xi[WS(is, 64)]), ivs, &(xi[0]));
Chris@82 93 T3 = VSUB(T1, T2);
Chris@82 94 Ta7 = VADD(T1, T2);
Chris@82 95 T4M = LD(&(xi[WS(is, 32)]), ivs, &(xi[0]));
Chris@82 96 T4N = LD(&(xi[WS(is, 96)]), ivs, &(xi[0]));
Chris@82 97 T4O = VSUB(T4M, T4N);
Chris@82 98 Ta8 = VADD(T4M, T4N);
Chris@82 99 }
Chris@82 100 {
Chris@82 101 V T4, T5, T6, T7, T8, T9;
Chris@82 102 T4 = LD(&(xi[WS(is, 16)]), ivs, &(xi[0]));
Chris@82 103 T5 = LD(&(xi[WS(is, 80)]), ivs, &(xi[0]));
Chris@82 104 T6 = VSUB(T4, T5);
Chris@82 105 T7 = LD(&(xi[WS(is, 112)]), ivs, &(xi[0]));
Chris@82 106 T8 = LD(&(xi[WS(is, 48)]), ivs, &(xi[0]));
Chris@82 107 T9 = VSUB(T7, T8);
Chris@82 108 Ta = VADD(T6, T9);
Chris@82 109 Tab = VADD(T7, T8);
Chris@82 110 T4P = VSUB(T6, T9);
Chris@82 111 Taa = VADD(T4, T5);
Chris@82 112 }
Chris@82 113 {
Chris@82 114 V Te, Th, Tl, To;
Chris@82 115 {
Chris@82 116 V Tc, Td, Tf, Tg;
Chris@82 117 Tc = LD(&(xi[WS(is, 8)]), ivs, &(xi[0]));
Chris@82 118 Td = LD(&(xi[WS(is, 72)]), ivs, &(xi[0]));
Chris@82 119 Te = VSUB(Tc, Td);
Chris@82 120 Tc6 = VADD(Tc, Td);
Chris@82 121 Tf = LD(&(xi[WS(is, 40)]), ivs, &(xi[0]));
Chris@82 122 Tg = LD(&(xi[WS(is, 104)]), ivs, &(xi[0]));
Chris@82 123 Th = VSUB(Tf, Tg);
Chris@82 124 Tc7 = VADD(Tf, Tg);
Chris@82 125 }
Chris@82 126 Ti = VFNMS(LDK(KP414213562), Th, Te);
Chris@82 127 Tea = VSUB(Tc6, Tc7);
Chris@82 128 T4R = VFMA(LDK(KP414213562), Te, Th);
Chris@82 129 {
Chris@82 130 V Tj, Tk, Tm, Tn;
Chris@82 131 Tj = LD(&(xi[WS(is, 120)]), ivs, &(xi[0]));
Chris@82 132 Tk = LD(&(xi[WS(is, 56)]), ivs, &(xi[0]));
Chris@82 133 Tl = VSUB(Tj, Tk);
Chris@82 134 Tc9 = VADD(Tj, Tk);
Chris@82 135 Tm = LD(&(xi[WS(is, 88)]), ivs, &(xi[0]));
Chris@82 136 Tn = LD(&(xi[WS(is, 24)]), ivs, &(xi[0]));
Chris@82 137 To = VSUB(Tm, Tn);
Chris@82 138 Tca = VADD(Tn, Tm);
Chris@82 139 }
Chris@82 140 Tp = VFNMS(LDK(KP414213562), To, Tl);
Chris@82 141 Teb = VSUB(Tc9, Tca);
Chris@82 142 T4S = VFMA(LDK(KP414213562), Tl, To);
Chris@82 143 }
Chris@82 144 {
Chris@82 145 V Tb, Tq, Te9, Tec;
Chris@82 146 Tb = VFMA(LDK(KP707106781), Ta, T3);
Chris@82 147 Tq = VADD(Ti, Tp);
Chris@82 148 Tr = VFMA(LDK(KP923879532), Tq, Tb);
Chris@82 149 T5J = VFNMS(LDK(KP923879532), Tq, Tb);
Chris@82 150 Te9 = VSUB(Ta7, Ta8);
Chris@82 151 Tec = VADD(Tea, Teb);
Chris@82 152 Ted = VFMA(LDK(KP707106781), Tec, Te9);
Chris@82 153 Tgf = VFNMS(LDK(KP707106781), Tec, Te9);
Chris@82 154 }
Chris@82 155 {
Chris@82 156 V Tfo, Tfp, T4Q, T4T;
Chris@82 157 Tfo = VSUB(Taa, Tab);
Chris@82 158 Tfp = VSUB(Tea, Teb);
Chris@82 159 Tfq = VFMA(LDK(KP707106781), Tfp, Tfo);
Chris@82 160 TgG = VFNMS(LDK(KP707106781), Tfp, Tfo);
Chris@82 161 T4Q = VFMA(LDK(KP707106781), T4P, T4O);
Chris@82 162 T4T = VSUB(T4R, T4S);
Chris@82 163 T4U = VFMA(LDK(KP923879532), T4T, T4Q);
Chris@82 164 T6a = VFNMS(LDK(KP923879532), T4T, T4Q);
Chris@82 165 }
Chris@82 166 {
Chris@82 167 V T6X, T6Y, Ta9, Tac;
Chris@82 168 T6X = VFNMS(LDK(KP707106781), Ta, T3);
Chris@82 169 T6Y = VADD(T4R, T4S);
Chris@82 170 T6Z = VFMA(LDK(KP923879532), T6Y, T6X);
Chris@82 171 T8T = VFNMS(LDK(KP923879532), T6Y, T6X);
Chris@82 172 Ta9 = VADD(Ta7, Ta8);
Chris@82 173 Tac = VADD(Taa, Tab);
Chris@82 174 Tad = VSUB(Ta9, Tac);
Chris@82 175 TcZ = VADD(Ta9, Tac);
Chris@82 176 }
Chris@82 177 {
Chris@82 178 V Tc8, Tcb, T82, T83;
Chris@82 179 Tc8 = VADD(Tc6, Tc7);
Chris@82 180 Tcb = VADD(Tc9, Tca);
Chris@82 181 Tcc = VSUB(Tc8, Tcb);
Chris@82 182 Td0 = VADD(Tc8, Tcb);
Chris@82 183 T82 = VFNMS(LDK(KP707106781), T4P, T4O);
Chris@82 184 T83 = VSUB(Ti, Tp);
Chris@82 185 T84 = VFNMS(LDK(KP923879532), T83, T82);
Chris@82 186 T9k = VFMA(LDK(KP923879532), T83, T82);
Chris@82 187 }
Chris@82 188 }
Chris@82 189 {
Chris@82 190 V Tb0, Tb1, T2i, Tb2, T3j, Tb3, Tb4, T2p, Tb5, T3k, T2x, TeH, T3m, Tbp, T2E;
Chris@82 191 V TeI, T3n, Tbs, T2l, T2o, TeG, TeJ;
Chris@82 192 {
Chris@82 193 V T2g, T2h, T3h, T3i;
Chris@82 194 T2g = LD(&(xi[WS(is, 1)]), ivs, &(xi[WS(is, 1)]));
Chris@82 195 T2h = LD(&(xi[WS(is, 65)]), ivs, &(xi[WS(is, 1)]));
Chris@82 196 Tb0 = VADD(T2g, T2h);
Chris@82 197 T3h = LD(&(xi[WS(is, 33)]), ivs, &(xi[WS(is, 1)]));
Chris@82 198 T3i = LD(&(xi[WS(is, 97)]), ivs, &(xi[WS(is, 1)]));
Chris@82 199 Tb1 = VADD(T3h, T3i);
Chris@82 200 T2i = VSUB(T2g, T2h);
Chris@82 201 Tb2 = VADD(Tb0, Tb1);
Chris@82 202 T3j = VSUB(T3h, T3i);
Chris@82 203 }
Chris@82 204 {
Chris@82 205 V T2j, T2k, T2m, T2n;
Chris@82 206 T2j = LD(&(xi[WS(is, 17)]), ivs, &(xi[WS(is, 1)]));
Chris@82 207 T2k = LD(&(xi[WS(is, 81)]), ivs, &(xi[WS(is, 1)]));
Chris@82 208 T2l = VSUB(T2j, T2k);
Chris@82 209 Tb3 = VADD(T2j, T2k);
Chris@82 210 T2m = LD(&(xi[WS(is, 113)]), ivs, &(xi[WS(is, 1)]));
Chris@82 211 T2n = LD(&(xi[WS(is, 49)]), ivs, &(xi[WS(is, 1)]));
Chris@82 212 T2o = VSUB(T2m, T2n);
Chris@82 213 Tb4 = VADD(T2m, T2n);
Chris@82 214 }
Chris@82 215 T2p = VADD(T2l, T2o);
Chris@82 216 Tb5 = VADD(Tb3, Tb4);
Chris@82 217 T3k = VSUB(T2l, T2o);
Chris@82 218 {
Chris@82 219 V T2t, Tbn, T2w, Tbo;
Chris@82 220 {
Chris@82 221 V T2r, T2s, T2u, T2v;
Chris@82 222 T2r = LD(&(xi[WS(is, 9)]), ivs, &(xi[WS(is, 1)]));
Chris@82 223 T2s = LD(&(xi[WS(is, 73)]), ivs, &(xi[WS(is, 1)]));
Chris@82 224 T2t = VSUB(T2r, T2s);
Chris@82 225 Tbn = VADD(T2r, T2s);
Chris@82 226 T2u = LD(&(xi[WS(is, 41)]), ivs, &(xi[WS(is, 1)]));
Chris@82 227 T2v = LD(&(xi[WS(is, 105)]), ivs, &(xi[WS(is, 1)]));
Chris@82 228 T2w = VSUB(T2u, T2v);
Chris@82 229 Tbo = VADD(T2u, T2v);
Chris@82 230 }
Chris@82 231 T2x = VFNMS(LDK(KP414213562), T2w, T2t);
Chris@82 232 TeH = VSUB(Tbn, Tbo);
Chris@82 233 T3m = VFMA(LDK(KP414213562), T2t, T2w);
Chris@82 234 Tbp = VADD(Tbn, Tbo);
Chris@82 235 }
Chris@82 236 {
Chris@82 237 V T2A, Tbq, T2D, Tbr;
Chris@82 238 {
Chris@82 239 V T2y, T2z, T2B, T2C;
Chris@82 240 T2y = LD(&(xi[WS(is, 121)]), ivs, &(xi[WS(is, 1)]));
Chris@82 241 T2z = LD(&(xi[WS(is, 57)]), ivs, &(xi[WS(is, 1)]));
Chris@82 242 T2A = VSUB(T2y, T2z);
Chris@82 243 Tbq = VADD(T2y, T2z);
Chris@82 244 T2B = LD(&(xi[WS(is, 25)]), ivs, &(xi[WS(is, 1)]));
Chris@82 245 T2C = LD(&(xi[WS(is, 89)]), ivs, &(xi[WS(is, 1)]));
Chris@82 246 T2D = VSUB(T2B, T2C);
Chris@82 247 Tbr = VADD(T2B, T2C);
Chris@82 248 }
Chris@82 249 T2E = VFMA(LDK(KP414213562), T2D, T2A);
Chris@82 250 TeI = VSUB(Tbq, Tbr);
Chris@82 251 T3n = VFNMS(LDK(KP414213562), T2A, T2D);
Chris@82 252 Tbs = VADD(Tbq, Tbr);
Chris@82 253 }
Chris@82 254 Tb6 = VSUB(Tb2, Tb5);
Chris@82 255 Tbt = VSUB(Tbp, Tbs);
Chris@82 256 {
Chris@82 257 V T2q, T2F, TeT, TeU;
Chris@82 258 T2q = VFMA(LDK(KP707106781), T2p, T2i);
Chris@82 259 T2F = VADD(T2x, T2E);
Chris@82 260 T2G = VFMA(LDK(KP923879532), T2F, T2q);
Chris@82 261 T5U = VFNMS(LDK(KP923879532), T2F, T2q);
Chris@82 262 TeT = VSUB(Tb3, Tb4);
Chris@82 263 TeU = VSUB(TeH, TeI);
Chris@82 264 TeV = VFMA(LDK(KP707106781), TeU, TeT);
Chris@82 265 Tgt = VFNMS(LDK(KP707106781), TeU, TeT);
Chris@82 266 }
Chris@82 267 {
Chris@82 268 V T3l, T3o, T7z, T7A;
Chris@82 269 T3l = VFMA(LDK(KP707106781), T3k, T3j);
Chris@82 270 T3o = VADD(T3m, T3n);
Chris@82 271 T3p = VFMA(LDK(KP923879532), T3o, T3l);
Chris@82 272 T5X = VFNMS(LDK(KP923879532), T3o, T3l);
Chris@82 273 T7z = VFNMS(LDK(KP707106781), T3k, T3j);
Chris@82 274 T7A = VSUB(T2x, T2E);
Chris@82 275 T7B = VFNMS(LDK(KP923879532), T7A, T7z);
Chris@82 276 T97 = VFMA(LDK(KP923879532), T7A, T7z);
Chris@82 277 }
Chris@82 278 TeG = VSUB(Tb0, Tb1);
Chris@82 279 TeJ = VADD(TeH, TeI);
Chris@82 280 TeK = VFMA(LDK(KP707106781), TeJ, TeG);
Chris@82 281 Tgq = VFNMS(LDK(KP707106781), TeJ, TeG);
Chris@82 282 {
Chris@82 283 V T7o, T7p, Td6, Td7;
Chris@82 284 T7o = VFNMS(LDK(KP707106781), T2p, T2i);
Chris@82 285 T7p = VSUB(T3m, T3n);
Chris@82 286 T7q = VFMA(LDK(KP923879532), T7p, T7o);
Chris@82 287 T94 = VFNMS(LDK(KP923879532), T7p, T7o);
Chris@82 288 Td6 = VADD(Tb2, Tb5);
Chris@82 289 Td7 = VADD(Tbp, Tbs);
Chris@82 290 Td8 = VADD(Td6, Td7);
Chris@82 291 TdK = VSUB(Td6, Td7);
Chris@82 292 }
Chris@82 293 }
Chris@82 294 {
Chris@82 295 V Tbx, Tby, T3x, Tbz, T4y, TbA, TbB, T3E, TbC, T4z, T3M, Tf2, T4B, TbZ, T3T;
Chris@82 296 V Tf3, T4C, TbW, T3A, T3D, Tf1, Tf4;
Chris@82 297 {
Chris@82 298 V T3v, T3w, T4w, T4x;
Chris@82 299 T3v = LD(&(xi[WS(is, 127)]), ivs, &(xi[WS(is, 1)]));
Chris@82 300 T3w = LD(&(xi[WS(is, 63)]), ivs, &(xi[WS(is, 1)]));
Chris@82 301 Tbx = VADD(T3v, T3w);
Chris@82 302 T4w = LD(&(xi[WS(is, 95)]), ivs, &(xi[WS(is, 1)]));
Chris@82 303 T4x = LD(&(xi[WS(is, 31)]), ivs, &(xi[WS(is, 1)]));
Chris@82 304 Tby = VADD(T4x, T4w);
Chris@82 305 T3x = VSUB(T3v, T3w);
Chris@82 306 Tbz = VADD(Tbx, Tby);
Chris@82 307 T4y = VSUB(T4w, T4x);
Chris@82 308 }
Chris@82 309 {
Chris@82 310 V T3y, T3z, T3B, T3C;
Chris@82 311 T3y = LD(&(xi[WS(is, 15)]), ivs, &(xi[WS(is, 1)]));
Chris@82 312 T3z = LD(&(xi[WS(is, 79)]), ivs, &(xi[WS(is, 1)]));
Chris@82 313 T3A = VSUB(T3y, T3z);
Chris@82 314 TbA = VADD(T3y, T3z);
Chris@82 315 T3B = LD(&(xi[WS(is, 111)]), ivs, &(xi[WS(is, 1)]));
Chris@82 316 T3C = LD(&(xi[WS(is, 47)]), ivs, &(xi[WS(is, 1)]));
Chris@82 317 T3D = VSUB(T3B, T3C);
Chris@82 318 TbB = VADD(T3B, T3C);
Chris@82 319 }
Chris@82 320 T3E = VADD(T3A, T3D);
Chris@82 321 TbC = VADD(TbA, TbB);
Chris@82 322 T4z = VSUB(T3D, T3A);
Chris@82 323 {
Chris@82 324 V T3I, TbX, T3L, TbY;
Chris@82 325 {
Chris@82 326 V T3G, T3H, T3J, T3K;
Chris@82 327 T3G = LD(&(xi[WS(is, 7)]), ivs, &(xi[WS(is, 1)]));
Chris@82 328 T3H = LD(&(xi[WS(is, 71)]), ivs, &(xi[WS(is, 1)]));
Chris@82 329 T3I = VSUB(T3G, T3H);
Chris@82 330 TbX = VADD(T3G, T3H);
Chris@82 331 T3J = LD(&(xi[WS(is, 103)]), ivs, &(xi[WS(is, 1)]));
Chris@82 332 T3K = LD(&(xi[WS(is, 39)]), ivs, &(xi[WS(is, 1)]));
Chris@82 333 T3L = VSUB(T3J, T3K);
Chris@82 334 TbY = VADD(T3K, T3J);
Chris@82 335 }
Chris@82 336 T3M = VFMA(LDK(KP414213562), T3L, T3I);
Chris@82 337 Tf2 = VSUB(TbX, TbY);
Chris@82 338 T4B = VFNMS(LDK(KP414213562), T3I, T3L);
Chris@82 339 TbZ = VADD(TbX, TbY);
Chris@82 340 }
Chris@82 341 {
Chris@82 342 V T3P, TbU, T3S, TbV;
Chris@82 343 {
Chris@82 344 V T3N, T3O, T3Q, T3R;
Chris@82 345 T3N = LD(&(xi[WS(is, 119)]), ivs, &(xi[WS(is, 1)]));
Chris@82 346 T3O = LD(&(xi[WS(is, 55)]), ivs, &(xi[WS(is, 1)]));
Chris@82 347 T3P = VSUB(T3N, T3O);
Chris@82 348 TbU = VADD(T3N, T3O);
Chris@82 349 T3Q = LD(&(xi[WS(is, 87)]), ivs, &(xi[WS(is, 1)]));
Chris@82 350 T3R = LD(&(xi[WS(is, 23)]), ivs, &(xi[WS(is, 1)]));
Chris@82 351 T3S = VSUB(T3Q, T3R);
Chris@82 352 TbV = VADD(T3R, T3Q);
Chris@82 353 }
Chris@82 354 T3T = VFNMS(LDK(KP414213562), T3S, T3P);
Chris@82 355 Tf3 = VSUB(TbU, TbV);
Chris@82 356 T4C = VFMA(LDK(KP414213562), T3P, T3S);
Chris@82 357 TbW = VADD(TbU, TbV);
Chris@82 358 }
Chris@82 359 TbD = VSUB(Tbz, TbC);
Chris@82 360 Tc0 = VSUB(TbW, TbZ);
Chris@82 361 {
Chris@82 362 V T3F, T3U, Tfe, Tff;
Chris@82 363 T3F = VFMA(LDK(KP707106781), T3E, T3x);
Chris@82 364 T3U = VADD(T3M, T3T);
Chris@82 365 T3V = VFMA(LDK(KP923879532), T3U, T3F);
Chris@82 366 T61 = VFNMS(LDK(KP923879532), T3U, T3F);
Chris@82 367 Tfe = VSUB(TbB, TbA);
Chris@82 368 Tff = VSUB(Tf3, Tf2);
Chris@82 369 Tfg = VFMA(LDK(KP707106781), Tff, Tfe);
Chris@82 370 TgA = VFNMS(LDK(KP707106781), Tff, Tfe);
Chris@82 371 }
Chris@82 372 {
Chris@82 373 V T4A, T4D, T7S, T7T;
Chris@82 374 T4A = VFMA(LDK(KP707106781), T4z, T4y);
Chris@82 375 T4D = VADD(T4B, T4C);
Chris@82 376 T4E = VFMA(LDK(KP923879532), T4D, T4A);
Chris@82 377 T64 = VFNMS(LDK(KP923879532), T4D, T4A);
Chris@82 378 T7S = VFNMS(LDK(KP707106781), T4z, T4y);
Chris@82 379 T7T = VSUB(T3T, T3M);
Chris@82 380 T7U = VFNMS(LDK(KP923879532), T7T, T7S);
Chris@82 381 T9e = VFMA(LDK(KP923879532), T7T, T7S);
Chris@82 382 }
Chris@82 383 Tf1 = VSUB(Tbx, Tby);
Chris@82 384 Tf4 = VADD(Tf2, Tf3);
Chris@82 385 Tf5 = VFMA(LDK(KP707106781), Tf4, Tf1);
Chris@82 386 Tgx = VFNMS(LDK(KP707106781), Tf4, Tf1);
Chris@82 387 {
Chris@82 388 V T7H, T7I, Tdd, Tde;
Chris@82 389 T7H = VFNMS(LDK(KP707106781), T3E, T3x);
Chris@82 390 T7I = VSUB(T4C, T4B);
Chris@82 391 T7J = VFMA(LDK(KP923879532), T7I, T7H);
Chris@82 392 T9b = VFNMS(LDK(KP923879532), T7I, T7H);
Chris@82 393 Tdd = VADD(Tbz, TbC);
Chris@82 394 Tde = VADD(TbZ, TbW);
Chris@82 395 Tdf = VADD(Tdd, Tde);
Chris@82 396 TdN = VSUB(Tdd, Tde);
Chris@82 397 }
Chris@82 398 }
Chris@82 399 {
Chris@82 400 V Tu, Tee, TF, Tag, TL, Teh, TW, Tan, TB, Tef, TG, Taj, TS, Tei, TX;
Chris@82 401 V Taq, Teg, Tej;
Chris@82 402 {
Chris@82 403 V Ts, Tt, Tae, TD, TE, Taf;
Chris@82 404 Ts = LD(&(xi[WS(is, 4)]), ivs, &(xi[0]));
Chris@82 405 Tt = LD(&(xi[WS(is, 68)]), ivs, &(xi[0]));
Chris@82 406 Tae = VADD(Ts, Tt);
Chris@82 407 TD = LD(&(xi[WS(is, 36)]), ivs, &(xi[0]));
Chris@82 408 TE = LD(&(xi[WS(is, 100)]), ivs, &(xi[0]));
Chris@82 409 Taf = VADD(TD, TE);
Chris@82 410 Tu = VSUB(Ts, Tt);
Chris@82 411 Tee = VSUB(Tae, Taf);
Chris@82 412 TF = VSUB(TD, TE);
Chris@82 413 Tag = VADD(Tae, Taf);
Chris@82 414 }
Chris@82 415 {
Chris@82 416 V TJ, TK, Tal, TU, TV, Tam;
Chris@82 417 TJ = LD(&(xi[WS(is, 124)]), ivs, &(xi[0]));
Chris@82 418 TK = LD(&(xi[WS(is, 60)]), ivs, &(xi[0]));
Chris@82 419 Tal = VADD(TJ, TK);
Chris@82 420 TU = LD(&(xi[WS(is, 92)]), ivs, &(xi[0]));
Chris@82 421 TV = LD(&(xi[WS(is, 28)]), ivs, &(xi[0]));
Chris@82 422 Tam = VADD(TV, TU);
Chris@82 423 TL = VSUB(TJ, TK);
Chris@82 424 Teh = VSUB(Tal, Tam);
Chris@82 425 TW = VSUB(TU, TV);
Chris@82 426 Tan = VADD(Tal, Tam);
Chris@82 427 }
Chris@82 428 {
Chris@82 429 V Tx, Tah, TA, Tai;
Chris@82 430 {
Chris@82 431 V Tv, Tw, Ty, Tz;
Chris@82 432 Tv = LD(&(xi[WS(is, 20)]), ivs, &(xi[0]));
Chris@82 433 Tw = LD(&(xi[WS(is, 84)]), ivs, &(xi[0]));
Chris@82 434 Tx = VSUB(Tv, Tw);
Chris@82 435 Tah = VADD(Tv, Tw);
Chris@82 436 Ty = LD(&(xi[WS(is, 116)]), ivs, &(xi[0]));
Chris@82 437 Tz = LD(&(xi[WS(is, 52)]), ivs, &(xi[0]));
Chris@82 438 TA = VSUB(Ty, Tz);
Chris@82 439 Tai = VADD(Ty, Tz);
Chris@82 440 }
Chris@82 441 TB = VADD(Tx, TA);
Chris@82 442 Tef = VSUB(Tah, Tai);
Chris@82 443 TG = VSUB(Tx, TA);
Chris@82 444 Taj = VADD(Tah, Tai);
Chris@82 445 }
Chris@82 446 {
Chris@82 447 V TO, Tao, TR, Tap;
Chris@82 448 {
Chris@82 449 V TM, TN, TP, TQ;
Chris@82 450 TM = LD(&(xi[WS(is, 12)]), ivs, &(xi[0]));
Chris@82 451 TN = LD(&(xi[WS(is, 76)]), ivs, &(xi[0]));
Chris@82 452 TO = VSUB(TM, TN);
Chris@82 453 Tao = VADD(TM, TN);
Chris@82 454 TP = LD(&(xi[WS(is, 108)]), ivs, &(xi[0]));
Chris@82 455 TQ = LD(&(xi[WS(is, 44)]), ivs, &(xi[0]));
Chris@82 456 TR = VSUB(TP, TQ);
Chris@82 457 Tap = VADD(TP, TQ);
Chris@82 458 }
Chris@82 459 TS = VADD(TO, TR);
Chris@82 460 Tei = VSUB(Tap, Tao);
Chris@82 461 TX = VSUB(TR, TO);
Chris@82 462 Taq = VADD(Tao, Tap);
Chris@82 463 }
Chris@82 464 Td2 = VADD(Tag, Taj);
Chris@82 465 Td3 = VADD(Tan, Taq);
Chris@82 466 {
Chris@82 467 V TC, TH, Tfr, Tfs;
Chris@82 468 TC = VFMA(LDK(KP707106781), TB, Tu);
Chris@82 469 TH = VFMA(LDK(KP707106781), TG, TF);
Chris@82 470 TI = VFNMS(LDK(KP198912367), TH, TC);
Chris@82 471 T4V = VFMA(LDK(KP198912367), TC, TH);
Chris@82 472 Tfr = VFMA(LDK(KP414213562), Tee, Tef);
Chris@82 473 Tfs = VFMA(LDK(KP414213562), Teh, Tei);
Chris@82 474 Tft = VSUB(Tfr, Tfs);
Chris@82 475 Tgg = VADD(Tfr, Tfs);
Chris@82 476 }
Chris@82 477 {
Chris@82 478 V TT, TY, T73, T74;
Chris@82 479 TT = VFMA(LDK(KP707106781), TS, TL);
Chris@82 480 TY = VFMA(LDK(KP707106781), TX, TW);
Chris@82 481 TZ = VFNMS(LDK(KP198912367), TY, TT);
Chris@82 482 T4W = VFMA(LDK(KP198912367), TT, TY);
Chris@82 483 T73 = VFNMS(LDK(KP707106781), TS, TL);
Chris@82 484 T74 = VFNMS(LDK(KP707106781), TX, TW);
Chris@82 485 T75 = VFMA(LDK(KP668178637), T74, T73);
Chris@82 486 T86 = VFNMS(LDK(KP668178637), T73, T74);
Chris@82 487 }
Chris@82 488 Teg = VFNMS(LDK(KP414213562), Tef, Tee);
Chris@82 489 Tej = VFNMS(LDK(KP414213562), Tei, Teh);
Chris@82 490 Tek = VADD(Teg, Tej);
Chris@82 491 TgH = VSUB(Teg, Tej);
Chris@82 492 {
Chris@82 493 V T70, T71, Tak, Tar;
Chris@82 494 T70 = VFNMS(LDK(KP707106781), TB, Tu);
Chris@82 495 T71 = VFNMS(LDK(KP707106781), TG, TF);
Chris@82 496 T72 = VFMA(LDK(KP668178637), T71, T70);
Chris@82 497 T85 = VFNMS(LDK(KP668178637), T70, T71);
Chris@82 498 Tak = VSUB(Tag, Taj);
Chris@82 499 Tar = VSUB(Tan, Taq);
Chris@82 500 Tas = VADD(Tak, Tar);
Chris@82 501 Tcd = VSUB(Tak, Tar);
Chris@82 502 }
Chris@82 503 }
Chris@82 504 {
Chris@82 505 V Tau, Tav, T14, Taw, T1v, Tax, Tay, T1b, Taz, T1w, T1j, Ten, T1y, TaD, T1q;
Chris@82 506 V Teo, T1z, TaG, T17, T1a, Tem, Tep;
Chris@82 507 {
Chris@82 508 V T12, T13, T1t, T1u;
Chris@82 509 T12 = LD(&(xi[WS(is, 2)]), ivs, &(xi[0]));
Chris@82 510 T13 = LD(&(xi[WS(is, 66)]), ivs, &(xi[0]));
Chris@82 511 Tau = VADD(T12, T13);
Chris@82 512 T1t = LD(&(xi[WS(is, 34)]), ivs, &(xi[0]));
Chris@82 513 T1u = LD(&(xi[WS(is, 98)]), ivs, &(xi[0]));
Chris@82 514 Tav = VADD(T1t, T1u);
Chris@82 515 T14 = VSUB(T12, T13);
Chris@82 516 Taw = VADD(Tau, Tav);
Chris@82 517 T1v = VSUB(T1t, T1u);
Chris@82 518 }
Chris@82 519 {
Chris@82 520 V T15, T16, T18, T19;
Chris@82 521 T15 = LD(&(xi[WS(is, 18)]), ivs, &(xi[0]));
Chris@82 522 T16 = LD(&(xi[WS(is, 82)]), ivs, &(xi[0]));
Chris@82 523 T17 = VSUB(T15, T16);
Chris@82 524 Tax = VADD(T15, T16);
Chris@82 525 T18 = LD(&(xi[WS(is, 114)]), ivs, &(xi[0]));
Chris@82 526 T19 = LD(&(xi[WS(is, 50)]), ivs, &(xi[0]));
Chris@82 527 T1a = VSUB(T18, T19);
Chris@82 528 Tay = VADD(T18, T19);
Chris@82 529 }
Chris@82 530 T1b = VADD(T17, T1a);
Chris@82 531 Taz = VADD(Tax, Tay);
Chris@82 532 T1w = VSUB(T17, T1a);
Chris@82 533 {
Chris@82 534 V T1f, TaB, T1i, TaC;
Chris@82 535 {
Chris@82 536 V T1d, T1e, T1g, T1h;
Chris@82 537 T1d = LD(&(xi[WS(is, 10)]), ivs, &(xi[0]));
Chris@82 538 T1e = LD(&(xi[WS(is, 74)]), ivs, &(xi[0]));
Chris@82 539 T1f = VSUB(T1d, T1e);
Chris@82 540 TaB = VADD(T1d, T1e);
Chris@82 541 T1g = LD(&(xi[WS(is, 42)]), ivs, &(xi[0]));
Chris@82 542 T1h = LD(&(xi[WS(is, 106)]), ivs, &(xi[0]));
Chris@82 543 T1i = VSUB(T1g, T1h);
Chris@82 544 TaC = VADD(T1g, T1h);
Chris@82 545 }
Chris@82 546 T1j = VFNMS(LDK(KP414213562), T1i, T1f);
Chris@82 547 Ten = VSUB(TaB, TaC);
Chris@82 548 T1y = VFMA(LDK(KP414213562), T1f, T1i);
Chris@82 549 TaD = VADD(TaB, TaC);
Chris@82 550 }
Chris@82 551 {
Chris@82 552 V T1m, TaE, T1p, TaF;
Chris@82 553 {
Chris@82 554 V T1k, T1l, T1n, T1o;
Chris@82 555 T1k = LD(&(xi[WS(is, 122)]), ivs, &(xi[0]));
Chris@82 556 T1l = LD(&(xi[WS(is, 58)]), ivs, &(xi[0]));
Chris@82 557 T1m = VSUB(T1k, T1l);
Chris@82 558 TaE = VADD(T1k, T1l);
Chris@82 559 T1n = LD(&(xi[WS(is, 26)]), ivs, &(xi[0]));
Chris@82 560 T1o = LD(&(xi[WS(is, 90)]), ivs, &(xi[0]));
Chris@82 561 T1p = VSUB(T1n, T1o);
Chris@82 562 TaF = VADD(T1n, T1o);
Chris@82 563 }
Chris@82 564 T1q = VFMA(LDK(KP414213562), T1p, T1m);
Chris@82 565 Teo = VSUB(TaE, TaF);
Chris@82 566 T1z = VFNMS(LDK(KP414213562), T1m, T1p);
Chris@82 567 TaG = VADD(TaE, TaF);
Chris@82 568 }
Chris@82 569 Tdm = VADD(Taw, Taz);
Chris@82 570 Tdn = VADD(TaD, TaG);
Chris@82 571 TdG = VSUB(Tdm, Tdn);
Chris@82 572 Tem = VSUB(Tau, Tav);
Chris@82 573 Tep = VADD(Ten, Teo);
Chris@82 574 Teq = VFMA(LDK(KP707106781), Tep, Tem);
Chris@82 575 Tgj = VFNMS(LDK(KP707106781), Tep, Tem);
Chris@82 576 {
Chris@82 577 V Ter, Tes, T1c, T1r;
Chris@82 578 Ter = VSUB(Tax, Tay);
Chris@82 579 Tes = VSUB(Ten, Teo);
Chris@82 580 Tet = VFMA(LDK(KP707106781), Tes, Ter);
Chris@82 581 Tgi = VFNMS(LDK(KP707106781), Tes, Ter);
Chris@82 582 T1c = VFMA(LDK(KP707106781), T1b, T14);
Chris@82 583 T1r = VADD(T1j, T1q);
Chris@82 584 T1s = VFMA(LDK(KP923879532), T1r, T1c);
Chris@82 585 T5N = VFNMS(LDK(KP923879532), T1r, T1c);
Chris@82 586 }
Chris@82 587 {
Chris@82 588 V T1x, T1A, T7b, T7c;
Chris@82 589 T1x = VFMA(LDK(KP707106781), T1w, T1v);
Chris@82 590 T1A = VADD(T1y, T1z);
Chris@82 591 T1B = VFMA(LDK(KP923879532), T1A, T1x);
Chris@82 592 T5M = VFNMS(LDK(KP923879532), T1A, T1x);
Chris@82 593 T7b = VFNMS(LDK(KP707106781), T1w, T1v);
Chris@82 594 T7c = VSUB(T1j, T1q);
Chris@82 595 T7d = VFNMS(LDK(KP923879532), T7c, T7b);
Chris@82 596 T8W = VFMA(LDK(KP923879532), T7c, T7b);
Chris@82 597 }
Chris@82 598 {
Chris@82 599 V TaA, TaH, T78, T79;
Chris@82 600 TaA = VSUB(Taw, Taz);
Chris@82 601 TaH = VSUB(TaD, TaG);
Chris@82 602 TaI = VFNMS(LDK(KP414213562), TaH, TaA);
Chris@82 603 Tcf = VFMA(LDK(KP414213562), TaA, TaH);
Chris@82 604 T78 = VFNMS(LDK(KP707106781), T1b, T14);
Chris@82 605 T79 = VSUB(T1y, T1z);
Chris@82 606 T7a = VFMA(LDK(KP923879532), T79, T78);
Chris@82 607 T8X = VFNMS(LDK(KP923879532), T79, T78);
Chris@82 608 }
Chris@82 609 }
Chris@82 610 {
Chris@82 611 V TaJ, TaK, T1F, TaL, T26, TaM, TaN, T1M, TaO, T27, T1U, Tew, T29, TaV, T21;
Chris@82 612 V Tex, T2a, TaS, T1I, T1L, Tev, Tey;
Chris@82 613 {
Chris@82 614 V T1D, T1E, T24, T25;
Chris@82 615 T1D = LD(&(xi[WS(is, 126)]), ivs, &(xi[0]));
Chris@82 616 T1E = LD(&(xi[WS(is, 62)]), ivs, &(xi[0]));
Chris@82 617 TaJ = VADD(T1D, T1E);
Chris@82 618 T24 = LD(&(xi[WS(is, 94)]), ivs, &(xi[0]));
Chris@82 619 T25 = LD(&(xi[WS(is, 30)]), ivs, &(xi[0]));
Chris@82 620 TaK = VADD(T25, T24);
Chris@82 621 T1F = VSUB(T1D, T1E);
Chris@82 622 TaL = VADD(TaJ, TaK);
Chris@82 623 T26 = VSUB(T24, T25);
Chris@82 624 }
Chris@82 625 {
Chris@82 626 V T1G, T1H, T1J, T1K;
Chris@82 627 T1G = LD(&(xi[WS(is, 14)]), ivs, &(xi[0]));
Chris@82 628 T1H = LD(&(xi[WS(is, 78)]), ivs, &(xi[0]));
Chris@82 629 T1I = VSUB(T1G, T1H);
Chris@82 630 TaM = VADD(T1G, T1H);
Chris@82 631 T1J = LD(&(xi[WS(is, 110)]), ivs, &(xi[0]));
Chris@82 632 T1K = LD(&(xi[WS(is, 46)]), ivs, &(xi[0]));
Chris@82 633 T1L = VSUB(T1J, T1K);
Chris@82 634 TaN = VADD(T1J, T1K);
Chris@82 635 }
Chris@82 636 T1M = VADD(T1I, T1L);
Chris@82 637 TaO = VADD(TaM, TaN);
Chris@82 638 T27 = VSUB(T1L, T1I);
Chris@82 639 {
Chris@82 640 V T1Q, TaT, T1T, TaU;
Chris@82 641 {
Chris@82 642 V T1O, T1P, T1R, T1S;
Chris@82 643 T1O = LD(&(xi[WS(is, 6)]), ivs, &(xi[0]));
Chris@82 644 T1P = LD(&(xi[WS(is, 70)]), ivs, &(xi[0]));
Chris@82 645 T1Q = VSUB(T1O, T1P);
Chris@82 646 TaT = VADD(T1O, T1P);
Chris@82 647 T1R = LD(&(xi[WS(is, 102)]), ivs, &(xi[0]));
Chris@82 648 T1S = LD(&(xi[WS(is, 38)]), ivs, &(xi[0]));
Chris@82 649 T1T = VSUB(T1R, T1S);
Chris@82 650 TaU = VADD(T1S, T1R);
Chris@82 651 }
Chris@82 652 T1U = VFMA(LDK(KP414213562), T1T, T1Q);
Chris@82 653 Tew = VSUB(TaT, TaU);
Chris@82 654 T29 = VFNMS(LDK(KP414213562), T1Q, T1T);
Chris@82 655 TaV = VADD(TaT, TaU);
Chris@82 656 }
Chris@82 657 {
Chris@82 658 V T1X, TaQ, T20, TaR;
Chris@82 659 {
Chris@82 660 V T1V, T1W, T1Y, T1Z;
Chris@82 661 T1V = LD(&(xi[WS(is, 118)]), ivs, &(xi[0]));
Chris@82 662 T1W = LD(&(xi[WS(is, 54)]), ivs, &(xi[0]));
Chris@82 663 T1X = VSUB(T1V, T1W);
Chris@82 664 TaQ = VADD(T1V, T1W);
Chris@82 665 T1Y = LD(&(xi[WS(is, 86)]), ivs, &(xi[0]));
Chris@82 666 T1Z = LD(&(xi[WS(is, 22)]), ivs, &(xi[0]));
Chris@82 667 T20 = VSUB(T1Y, T1Z);
Chris@82 668 TaR = VADD(T1Z, T1Y);
Chris@82 669 }
Chris@82 670 T21 = VFNMS(LDK(KP414213562), T20, T1X);
Chris@82 671 Tex = VSUB(TaQ, TaR);
Chris@82 672 T2a = VFMA(LDK(KP414213562), T1X, T20);
Chris@82 673 TaS = VADD(TaQ, TaR);
Chris@82 674 }
Chris@82 675 Tdp = VADD(TaL, TaO);
Chris@82 676 Tdq = VADD(TaV, TaS);
Chris@82 677 TdH = VSUB(Tdp, Tdq);
Chris@82 678 Tev = VSUB(TaJ, TaK);
Chris@82 679 Tey = VADD(Tew, Tex);
Chris@82 680 Tez = VFMA(LDK(KP707106781), Tey, Tev);
Chris@82 681 Tgm = VFNMS(LDK(KP707106781), Tey, Tev);
Chris@82 682 {
Chris@82 683 V TeA, TeB, T1N, T22;
Chris@82 684 TeA = VSUB(TaN, TaM);
Chris@82 685 TeB = VSUB(Tex, Tew);
Chris@82 686 TeC = VFMA(LDK(KP707106781), TeB, TeA);
Chris@82 687 Tgl = VFNMS(LDK(KP707106781), TeB, TeA);
Chris@82 688 T1N = VFMA(LDK(KP707106781), T1M, T1F);
Chris@82 689 T22 = VADD(T1U, T21);
Chris@82 690 T23 = VFMA(LDK(KP923879532), T22, T1N);
Chris@82 691 T5Q = VFNMS(LDK(KP923879532), T22, T1N);
Chris@82 692 }
Chris@82 693 {
Chris@82 694 V T28, T2b, T7i, T7j;
Chris@82 695 T28 = VFMA(LDK(KP707106781), T27, T26);
Chris@82 696 T2b = VADD(T29, T2a);
Chris@82 697 T2c = VFMA(LDK(KP923879532), T2b, T28);
Chris@82 698 T5P = VFNMS(LDK(KP923879532), T2b, T28);
Chris@82 699 T7i = VFNMS(LDK(KP707106781), T27, T26);
Chris@82 700 T7j = VSUB(T21, T1U);
Chris@82 701 T7k = VFNMS(LDK(KP923879532), T7j, T7i);
Chris@82 702 T8Z = VFMA(LDK(KP923879532), T7j, T7i);
Chris@82 703 }
Chris@82 704 {
Chris@82 705 V TaP, TaW, T7f, T7g;
Chris@82 706 TaP = VSUB(TaL, TaO);
Chris@82 707 TaW = VSUB(TaS, TaV);
Chris@82 708 TaX = VFNMS(LDK(KP414213562), TaW, TaP);
Chris@82 709 Tcg = VFMA(LDK(KP414213562), TaP, TaW);
Chris@82 710 T7f = VFNMS(LDK(KP707106781), T1M, T1F);
Chris@82 711 T7g = VSUB(T2a, T29);
Chris@82 712 T7h = VFMA(LDK(KP923879532), T7g, T7f);
Chris@82 713 T90 = VFNMS(LDK(KP923879532), T7g, T7f);
Chris@82 714 }
Chris@82 715 }
Chris@82 716 {
Chris@82 717 V T2J, TeL, T2U, Tb9, T30, TeO, T3b, Tbg, T2Q, TeM, T2V, Tbc, T37, TeP, T3c;
Chris@82 718 V Tbj;
Chris@82 719 {
Chris@82 720 V T2H, T2I, Tb7, T2S, T2T, Tb8;
Chris@82 721 T2H = LD(&(xi[WS(is, 5)]), ivs, &(xi[WS(is, 1)]));
Chris@82 722 T2I = LD(&(xi[WS(is, 69)]), ivs, &(xi[WS(is, 1)]));
Chris@82 723 Tb7 = VADD(T2H, T2I);
Chris@82 724 T2S = LD(&(xi[WS(is, 37)]), ivs, &(xi[WS(is, 1)]));
Chris@82 725 T2T = LD(&(xi[WS(is, 101)]), ivs, &(xi[WS(is, 1)]));
Chris@82 726 Tb8 = VADD(T2S, T2T);
Chris@82 727 T2J = VSUB(T2H, T2I);
Chris@82 728 TeL = VSUB(Tb7, Tb8);
Chris@82 729 T2U = VSUB(T2S, T2T);
Chris@82 730 Tb9 = VADD(Tb7, Tb8);
Chris@82 731 }
Chris@82 732 {
Chris@82 733 V T2Y, T2Z, Tbe, T39, T3a, Tbf;
Chris@82 734 T2Y = LD(&(xi[WS(is, 125)]), ivs, &(xi[WS(is, 1)]));
Chris@82 735 T2Z = LD(&(xi[WS(is, 61)]), ivs, &(xi[WS(is, 1)]));
Chris@82 736 Tbe = VADD(T2Y, T2Z);
Chris@82 737 T39 = LD(&(xi[WS(is, 29)]), ivs, &(xi[WS(is, 1)]));
Chris@82 738 T3a = LD(&(xi[WS(is, 93)]), ivs, &(xi[WS(is, 1)]));
Chris@82 739 Tbf = VADD(T39, T3a);
Chris@82 740 T30 = VSUB(T2Y, T2Z);
Chris@82 741 TeO = VSUB(Tbe, Tbf);
Chris@82 742 T3b = VSUB(T39, T3a);
Chris@82 743 Tbg = VADD(Tbe, Tbf);
Chris@82 744 }
Chris@82 745 {
Chris@82 746 V T2M, Tba, T2P, Tbb;
Chris@82 747 {
Chris@82 748 V T2K, T2L, T2N, T2O;
Chris@82 749 T2K = LD(&(xi[WS(is, 21)]), ivs, &(xi[WS(is, 1)]));
Chris@82 750 T2L = LD(&(xi[WS(is, 85)]), ivs, &(xi[WS(is, 1)]));
Chris@82 751 T2M = VSUB(T2K, T2L);
Chris@82 752 Tba = VADD(T2K, T2L);
Chris@82 753 T2N = LD(&(xi[WS(is, 117)]), ivs, &(xi[WS(is, 1)]));
Chris@82 754 T2O = LD(&(xi[WS(is, 53)]), ivs, &(xi[WS(is, 1)]));
Chris@82 755 T2P = VSUB(T2N, T2O);
Chris@82 756 Tbb = VADD(T2N, T2O);
Chris@82 757 }
Chris@82 758 T2Q = VADD(T2M, T2P);
Chris@82 759 TeM = VSUB(Tba, Tbb);
Chris@82 760 T2V = VSUB(T2M, T2P);
Chris@82 761 Tbc = VADD(Tba, Tbb);
Chris@82 762 }
Chris@82 763 {
Chris@82 764 V T33, Tbh, T36, Tbi;
Chris@82 765 {
Chris@82 766 V T31, T32, T34, T35;
Chris@82 767 T31 = LD(&(xi[WS(is, 13)]), ivs, &(xi[WS(is, 1)]));
Chris@82 768 T32 = LD(&(xi[WS(is, 77)]), ivs, &(xi[WS(is, 1)]));
Chris@82 769 T33 = VSUB(T31, T32);
Chris@82 770 Tbh = VADD(T31, T32);
Chris@82 771 T34 = LD(&(xi[WS(is, 109)]), ivs, &(xi[WS(is, 1)]));
Chris@82 772 T35 = LD(&(xi[WS(is, 45)]), ivs, &(xi[WS(is, 1)]));
Chris@82 773 T36 = VSUB(T34, T35);
Chris@82 774 Tbi = VADD(T34, T35);
Chris@82 775 }
Chris@82 776 T37 = VADD(T33, T36);
Chris@82 777 TeP = VSUB(Tbh, Tbi);
Chris@82 778 T3c = VSUB(T33, T36);
Chris@82 779 Tbj = VADD(Tbh, Tbi);
Chris@82 780 }
Chris@82 781 {
Chris@82 782 V Tbd, Tbk, TeN, TeQ;
Chris@82 783 Tbd = VSUB(Tb9, Tbc);
Chris@82 784 Tbk = VSUB(Tbg, Tbj);
Chris@82 785 Tbl = VADD(Tbd, Tbk);
Chris@82 786 Tbu = VSUB(Tbd, Tbk);
Chris@82 787 {
Chris@82 788 V Td9, Tda, TeW, TeX;
Chris@82 789 Td9 = VADD(Tb9, Tbc);
Chris@82 790 Tda = VADD(Tbg, Tbj);
Chris@82 791 Tdb = VADD(Td9, Tda);
Chris@82 792 TdL = VSUB(Td9, Tda);
Chris@82 793 TeW = VFMA(LDK(KP414213562), TeL, TeM);
Chris@82 794 TeX = VFNMS(LDK(KP414213562), TeO, TeP);
Chris@82 795 TeY = VADD(TeW, TeX);
Chris@82 796 Tgr = VSUB(TeW, TeX);
Chris@82 797 }
Chris@82 798 TeN = VFNMS(LDK(KP414213562), TeM, TeL);
Chris@82 799 TeQ = VFMA(LDK(KP414213562), TeP, TeO);
Chris@82 800 TeR = VADD(TeN, TeQ);
Chris@82 801 Tgu = VSUB(TeN, TeQ);
Chris@82 802 {
Chris@82 803 V T7t, T7C, T7w, T7D;
Chris@82 804 {
Chris@82 805 V T7r, T7s, T7u, T7v;
Chris@82 806 T7r = VFNMS(LDK(KP707106781), T2Q, T2J);
Chris@82 807 T7s = VFNMS(LDK(KP707106781), T2V, T2U);
Chris@82 808 T7t = VFMA(LDK(KP668178637), T7s, T7r);
Chris@82 809 T7C = VFNMS(LDK(KP668178637), T7r, T7s);
Chris@82 810 T7u = VFNMS(LDK(KP707106781), T37, T30);
Chris@82 811 T7v = VFNMS(LDK(KP707106781), T3c, T3b);
Chris@82 812 T7w = VFNMS(LDK(KP668178637), T7v, T7u);
Chris@82 813 T7D = VFMA(LDK(KP668178637), T7u, T7v);
Chris@82 814 }
Chris@82 815 T7x = VADD(T7t, T7w);
Chris@82 816 T98 = VSUB(T7t, T7w);
Chris@82 817 T7E = VADD(T7C, T7D);
Chris@82 818 T95 = VSUB(T7D, T7C);
Chris@82 819 }
Chris@82 820 {
Chris@82 821 V T2X, T3q, T3e, T3r;
Chris@82 822 {
Chris@82 823 V T2R, T2W, T38, T3d;
Chris@82 824 T2R = VFMA(LDK(KP707106781), T2Q, T2J);
Chris@82 825 T2W = VFMA(LDK(KP707106781), T2V, T2U);
Chris@82 826 T2X = VFNMS(LDK(KP198912367), T2W, T2R);
Chris@82 827 T3q = VFMA(LDK(KP198912367), T2R, T2W);
Chris@82 828 T38 = VFMA(LDK(KP707106781), T37, T30);
Chris@82 829 T3d = VFMA(LDK(KP707106781), T3c, T3b);
Chris@82 830 T3e = VFMA(LDK(KP198912367), T3d, T38);
Chris@82 831 T3r = VFNMS(LDK(KP198912367), T38, T3d);
Chris@82 832 }
Chris@82 833 T3f = VADD(T2X, T3e);
Chris@82 834 T5Y = VSUB(T2X, T3e);
Chris@82 835 T3s = VADD(T3q, T3r);
Chris@82 836 T5V = VSUB(T3q, T3r);
Chris@82 837 }
Chris@82 838 }
Chris@82 839 }
Chris@82 840 {
Chris@82 841 V T3Y, Tf6, T49, TbG, T4f, Tf9, T4q, TbN, T45, Tf7, T4a, TbJ, T4m, Tfa, T4r;
Chris@82 842 V TbQ;
Chris@82 843 {
Chris@82 844 V T3W, T3X, TbE, T47, T48, TbF;
Chris@82 845 T3W = LD(&(xi[WS(is, 3)]), ivs, &(xi[WS(is, 1)]));
Chris@82 846 T3X = LD(&(xi[WS(is, 67)]), ivs, &(xi[WS(is, 1)]));
Chris@82 847 TbE = VADD(T3W, T3X);
Chris@82 848 T47 = LD(&(xi[WS(is, 99)]), ivs, &(xi[WS(is, 1)]));
Chris@82 849 T48 = LD(&(xi[WS(is, 35)]), ivs, &(xi[WS(is, 1)]));
Chris@82 850 TbF = VADD(T48, T47);
Chris@82 851 T3Y = VSUB(T3W, T3X);
Chris@82 852 Tf6 = VSUB(TbE, TbF);
Chris@82 853 T49 = VSUB(T47, T48);
Chris@82 854 TbG = VADD(TbE, TbF);
Chris@82 855 }
Chris@82 856 {
Chris@82 857 V T4d, T4e, TbL, T4o, T4p, TbM;
Chris@82 858 T4d = LD(&(xi[WS(is, 123)]), ivs, &(xi[WS(is, 1)]));
Chris@82 859 T4e = LD(&(xi[WS(is, 59)]), ivs, &(xi[WS(is, 1)]));
Chris@82 860 TbL = VADD(T4d, T4e);
Chris@82 861 T4o = LD(&(xi[WS(is, 91)]), ivs, &(xi[WS(is, 1)]));
Chris@82 862 T4p = LD(&(xi[WS(is, 27)]), ivs, &(xi[WS(is, 1)]));
Chris@82 863 TbM = VADD(T4p, T4o);
Chris@82 864 T4f = VSUB(T4d, T4e);
Chris@82 865 Tf9 = VSUB(TbL, TbM);
Chris@82 866 T4q = VSUB(T4o, T4p);
Chris@82 867 TbN = VADD(TbL, TbM);
Chris@82 868 }
Chris@82 869 {
Chris@82 870 V T41, TbH, T44, TbI;
Chris@82 871 {
Chris@82 872 V T3Z, T40, T42, T43;
Chris@82 873 T3Z = LD(&(xi[WS(is, 19)]), ivs, &(xi[WS(is, 1)]));
Chris@82 874 T40 = LD(&(xi[WS(is, 83)]), ivs, &(xi[WS(is, 1)]));
Chris@82 875 T41 = VSUB(T3Z, T40);
Chris@82 876 TbH = VADD(T3Z, T40);
Chris@82 877 T42 = LD(&(xi[WS(is, 115)]), ivs, &(xi[WS(is, 1)]));
Chris@82 878 T43 = LD(&(xi[WS(is, 51)]), ivs, &(xi[WS(is, 1)]));
Chris@82 879 T44 = VSUB(T42, T43);
Chris@82 880 TbI = VADD(T42, T43);
Chris@82 881 }
Chris@82 882 T45 = VADD(T41, T44);
Chris@82 883 Tf7 = VSUB(TbI, TbH);
Chris@82 884 T4a = VSUB(T44, T41);
Chris@82 885 TbJ = VADD(TbH, TbI);
Chris@82 886 }
Chris@82 887 {
Chris@82 888 V T4i, TbO, T4l, TbP;
Chris@82 889 {
Chris@82 890 V T4g, T4h, T4j, T4k;
Chris@82 891 T4g = LD(&(xi[WS(is, 11)]), ivs, &(xi[WS(is, 1)]));
Chris@82 892 T4h = LD(&(xi[WS(is, 75)]), ivs, &(xi[WS(is, 1)]));
Chris@82 893 T4i = VSUB(T4g, T4h);
Chris@82 894 TbO = VADD(T4g, T4h);
Chris@82 895 T4j = LD(&(xi[WS(is, 107)]), ivs, &(xi[WS(is, 1)]));
Chris@82 896 T4k = LD(&(xi[WS(is, 43)]), ivs, &(xi[WS(is, 1)]));
Chris@82 897 T4l = VSUB(T4j, T4k);
Chris@82 898 TbP = VADD(T4j, T4k);
Chris@82 899 }
Chris@82 900 T4m = VADD(T4i, T4l);
Chris@82 901 Tfa = VSUB(TbP, TbO);
Chris@82 902 T4r = VSUB(T4l, T4i);
Chris@82 903 TbQ = VADD(TbO, TbP);
Chris@82 904 }
Chris@82 905 {
Chris@82 906 V TbK, TbR, Tf8, Tfb;
Chris@82 907 TbK = VSUB(TbG, TbJ);
Chris@82 908 TbR = VSUB(TbN, TbQ);
Chris@82 909 TbS = VADD(TbK, TbR);
Chris@82 910 Tc1 = VSUB(TbR, TbK);
Chris@82 911 {
Chris@82 912 V Tdg, Tdh, Tfh, Tfi;
Chris@82 913 Tdg = VADD(TbG, TbJ);
Chris@82 914 Tdh = VADD(TbN, TbQ);
Chris@82 915 Tdi = VADD(Tdg, Tdh);
Chris@82 916 TdO = VSUB(Tdh, Tdg);
Chris@82 917 Tfh = VFNMS(LDK(KP414213562), Tf6, Tf7);
Chris@82 918 Tfi = VFMA(LDK(KP414213562), Tf9, Tfa);
Chris@82 919 Tfj = VADD(Tfh, Tfi);
Chris@82 920 Tgy = VSUB(Tfi, Tfh);
Chris@82 921 }
Chris@82 922 Tf8 = VFMA(LDK(KP414213562), Tf7, Tf6);
Chris@82 923 Tfb = VFNMS(LDK(KP414213562), Tfa, Tf9);
Chris@82 924 Tfc = VADD(Tf8, Tfb);
Chris@82 925 TgB = VSUB(Tfb, Tf8);
Chris@82 926 {
Chris@82 927 V T7M, T7V, T7P, T7W;
Chris@82 928 {
Chris@82 929 V T7K, T7L, T7N, T7O;
Chris@82 930 T7K = VFNMS(LDK(KP707106781), T45, T3Y);
Chris@82 931 T7L = VFNMS(LDK(KP707106781), T4a, T49);
Chris@82 932 T7M = VFNMS(LDK(KP668178637), T7L, T7K);
Chris@82 933 T7V = VFMA(LDK(KP668178637), T7K, T7L);
Chris@82 934 T7N = VFNMS(LDK(KP707106781), T4m, T4f);
Chris@82 935 T7O = VFNMS(LDK(KP707106781), T4r, T4q);
Chris@82 936 T7P = VFMA(LDK(KP668178637), T7O, T7N);
Chris@82 937 T7W = VFNMS(LDK(KP668178637), T7N, T7O);
Chris@82 938 }
Chris@82 939 T7Q = VADD(T7M, T7P);
Chris@82 940 T9f = VSUB(T7P, T7M);
Chris@82 941 T7X = VADD(T7V, T7W);
Chris@82 942 T9c = VSUB(T7V, T7W);
Chris@82 943 }
Chris@82 944 {
Chris@82 945 V T4c, T4F, T4t, T4G;
Chris@82 946 {
Chris@82 947 V T46, T4b, T4n, T4s;
Chris@82 948 T46 = VFMA(LDK(KP707106781), T45, T3Y);
Chris@82 949 T4b = VFMA(LDK(KP707106781), T4a, T49);
Chris@82 950 T4c = VFMA(LDK(KP198912367), T4b, T46);
Chris@82 951 T4F = VFNMS(LDK(KP198912367), T46, T4b);
Chris@82 952 T4n = VFMA(LDK(KP707106781), T4m, T4f);
Chris@82 953 T4s = VFMA(LDK(KP707106781), T4r, T4q);
Chris@82 954 T4t = VFNMS(LDK(KP198912367), T4s, T4n);
Chris@82 955 T4G = VFMA(LDK(KP198912367), T4n, T4s);
Chris@82 956 }
Chris@82 957 T4u = VADD(T4c, T4t);
Chris@82 958 T65 = VSUB(T4t, T4c);
Chris@82 959 T4H = VADD(T4F, T4G);
Chris@82 960 T62 = VSUB(T4G, T4F);
Chris@82 961 }
Chris@82 962 }
Chris@82 963 }
Chris@82 964 {
Chris@82 965 V Td5, Tdx, TdC, TdE, Tdk, Tdt, Tds, Tdy, Tdz, TdD;
Chris@82 966 {
Chris@82 967 V Td1, Td4, TdA, TdB;
Chris@82 968 Td1 = VADD(TcZ, Td0);
Chris@82 969 Td4 = VADD(Td2, Td3);
Chris@82 970 Td5 = VSUB(Td1, Td4);
Chris@82 971 Tdx = VADD(Td1, Td4);
Chris@82 972 TdA = VADD(Td8, Tdb);
Chris@82 973 TdB = VADD(Tdf, Tdi);
Chris@82 974 TdC = VSUB(TdA, TdB);
Chris@82 975 TdE = VADD(TdA, TdB);
Chris@82 976 }
Chris@82 977 {
Chris@82 978 V Tdc, Tdj, Tdo, Tdr;
Chris@82 979 Tdc = VSUB(Td8, Tdb);
Chris@82 980 Tdj = VSUB(Tdf, Tdi);
Chris@82 981 Tdk = VADD(Tdc, Tdj);
Chris@82 982 Tdt = VSUB(Tdc, Tdj);
Chris@82 983 Tdo = VADD(Tdm, Tdn);
Chris@82 984 Tdr = VADD(Tdp, Tdq);
Chris@82 985 Tds = VSUB(Tdo, Tdr);
Chris@82 986 Tdy = VADD(Tdo, Tdr);
Chris@82 987 }
Chris@82 988 Tdz = VSUB(Tdx, Tdy);
Chris@82 989 ST(&(xo[WS(os, 96)]), VFNMSI(TdC, Tdz), ovs, &(xo[0]));
Chris@82 990 ST(&(xo[WS(os, 32)]), VFMAI(TdC, Tdz), ovs, &(xo[0]));
Chris@82 991 TdD = VADD(Tdx, Tdy);
Chris@82 992 ST(&(xo[WS(os, 64)]), VSUB(TdD, TdE), ovs, &(xo[0]));
Chris@82 993 ST(&(xo[0]), VADD(TdD, TdE), ovs, &(xo[0]));
Chris@82 994 {
Chris@82 995 V Tdl, Tdu, Tdv, Tdw;
Chris@82 996 Tdl = VFNMS(LDK(KP707106781), Tdk, Td5);
Chris@82 997 Tdu = VFNMS(LDK(KP707106781), Tdt, Tds);
Chris@82 998 ST(&(xo[WS(os, 48)]), VFNMSI(Tdu, Tdl), ovs, &(xo[0]));
Chris@82 999 ST(&(xo[WS(os, 80)]), VFMAI(Tdu, Tdl), ovs, &(xo[0]));
Chris@82 1000 Tdv = VFMA(LDK(KP707106781), Tdk, Td5);
Chris@82 1001 Tdw = VFMA(LDK(KP707106781), Tdt, Tds);
Chris@82 1002 ST(&(xo[WS(os, 16)]), VFMAI(Tdw, Tdv), ovs, &(xo[0]));
Chris@82 1003 ST(&(xo[WS(os, 112)]), VFNMSI(Tdw, Tdv), ovs, &(xo[0]));
Chris@82 1004 }
Chris@82 1005 }
Chris@82 1006 {
Chris@82 1007 V TdJ, Te1, TdX, Te2, TdQ, Te5, TdU, Te4;
Chris@82 1008 {
Chris@82 1009 V TdF, TdI, TdV, TdW;
Chris@82 1010 TdF = VSUB(TcZ, Td0);
Chris@82 1011 TdI = VADD(TdG, TdH);
Chris@82 1012 TdJ = VFMA(LDK(KP707106781), TdI, TdF);
Chris@82 1013 Te1 = VFNMS(LDK(KP707106781), TdI, TdF);
Chris@82 1014 TdV = VFMA(LDK(KP414213562), TdK, TdL);
Chris@82 1015 TdW = VFMA(LDK(KP414213562), TdN, TdO);
Chris@82 1016 TdX = VSUB(TdV, TdW);
Chris@82 1017 Te2 = VADD(TdV, TdW);
Chris@82 1018 }
Chris@82 1019 {
Chris@82 1020 V TdM, TdP, TdS, TdT;
Chris@82 1021 TdM = VFNMS(LDK(KP414213562), TdL, TdK);
Chris@82 1022 TdP = VFNMS(LDK(KP414213562), TdO, TdN);
Chris@82 1023 TdQ = VADD(TdM, TdP);
Chris@82 1024 Te5 = VSUB(TdM, TdP);
Chris@82 1025 TdS = VSUB(Td2, Td3);
Chris@82 1026 TdT = VSUB(TdG, TdH);
Chris@82 1027 TdU = VFMA(LDK(KP707106781), TdT, TdS);
Chris@82 1028 Te4 = VFNMS(LDK(KP707106781), TdT, TdS);
Chris@82 1029 }
Chris@82 1030 {
Chris@82 1031 V TdR, TdY, Te7, Te8;
Chris@82 1032 TdR = VFNMS(LDK(KP923879532), TdQ, TdJ);
Chris@82 1033 TdY = VFNMS(LDK(KP923879532), TdX, TdU);
Chris@82 1034 ST(&(xo[WS(os, 56)]), VFNMSI(TdY, TdR), ovs, &(xo[0]));
Chris@82 1035 ST(&(xo[WS(os, 72)]), VFMAI(TdY, TdR), ovs, &(xo[0]));
Chris@82 1036 Te7 = VFMA(LDK(KP923879532), Te2, Te1);
Chris@82 1037 Te8 = VFNMS(LDK(KP923879532), Te5, Te4);
Chris@82 1038 ST(&(xo[WS(os, 24)]), VFNMSI(Te8, Te7), ovs, &(xo[0]));
Chris@82 1039 ST(&(xo[WS(os, 104)]), VFMAI(Te8, Te7), ovs, &(xo[0]));
Chris@82 1040 }
Chris@82 1041 {
Chris@82 1042 V TdZ, Te0, Te3, Te6;
Chris@82 1043 TdZ = VFMA(LDK(KP923879532), TdQ, TdJ);
Chris@82 1044 Te0 = VFMA(LDK(KP923879532), TdX, TdU);
Chris@82 1045 ST(&(xo[WS(os, 120)]), VFNMSI(Te0, TdZ), ovs, &(xo[0]));
Chris@82 1046 ST(&(xo[WS(os, 8)]), VFMAI(Te0, TdZ), ovs, &(xo[0]));
Chris@82 1047 Te3 = VFNMS(LDK(KP923879532), Te2, Te1);
Chris@82 1048 Te6 = VFMA(LDK(KP923879532), Te5, Te4);
Chris@82 1049 ST(&(xo[WS(os, 40)]), VFMAI(Te6, Te3), ovs, &(xo[0]));
Chris@82 1050 ST(&(xo[WS(os, 88)]), VFNMSI(Te6, Te3), ovs, &(xo[0]));
Chris@82 1051 }
Chris@82 1052 }
Chris@82 1053 {
Chris@82 1054 V TaZ, Tcp, Tci, Tcs, Tc4, Tct, Tcl, Tcq;
Chris@82 1055 {
Chris@82 1056 V Tat, TaY, Tce, Tch;
Chris@82 1057 Tat = VFMA(LDK(KP707106781), Tas, Tad);
Chris@82 1058 TaY = VADD(TaI, TaX);
Chris@82 1059 TaZ = VFMA(LDK(KP923879532), TaY, Tat);
Chris@82 1060 Tcp = VFNMS(LDK(KP923879532), TaY, Tat);
Chris@82 1061 Tce = VFMA(LDK(KP707106781), Tcd, Tcc);
Chris@82 1062 Tch = VSUB(Tcf, Tcg);
Chris@82 1063 Tci = VFMA(LDK(KP923879532), Tch, Tce);
Chris@82 1064 Tcs = VFNMS(LDK(KP923879532), Tch, Tce);
Chris@82 1065 {
Chris@82 1066 V Tbw, Tcj, Tc3, Tck;
Chris@82 1067 {
Chris@82 1068 V Tbm, Tbv, TbT, Tc2;
Chris@82 1069 Tbm = VFMA(LDK(KP707106781), Tbl, Tb6);
Chris@82 1070 Tbv = VFMA(LDK(KP707106781), Tbu, Tbt);
Chris@82 1071 Tbw = VFNMS(LDK(KP198912367), Tbv, Tbm);
Chris@82 1072 Tcj = VFMA(LDK(KP198912367), Tbm, Tbv);
Chris@82 1073 TbT = VFMA(LDK(KP707106781), TbS, TbD);
Chris@82 1074 Tc2 = VFMA(LDK(KP707106781), Tc1, Tc0);
Chris@82 1075 Tc3 = VFNMS(LDK(KP198912367), Tc2, TbT);
Chris@82 1076 Tck = VFMA(LDK(KP198912367), TbT, Tc2);
Chris@82 1077 }
Chris@82 1078 Tc4 = VADD(Tbw, Tc3);
Chris@82 1079 Tct = VSUB(Tbw, Tc3);
Chris@82 1080 Tcl = VSUB(Tcj, Tck);
Chris@82 1081 Tcq = VADD(Tcj, Tck);
Chris@82 1082 }
Chris@82 1083 }
Chris@82 1084 {
Chris@82 1085 V Tc5, Tcm, Tcv, Tcw;
Chris@82 1086 Tc5 = VFNMS(LDK(KP980785280), Tc4, TaZ);
Chris@82 1087 Tcm = VFNMS(LDK(KP980785280), Tcl, Tci);
Chris@82 1088 ST(&(xo[WS(os, 60)]), VFNMSI(Tcm, Tc5), ovs, &(xo[0]));
Chris@82 1089 ST(&(xo[WS(os, 68)]), VFMAI(Tcm, Tc5), ovs, &(xo[0]));
Chris@82 1090 Tcv = VFMA(LDK(KP980785280), Tcq, Tcp);
Chris@82 1091 Tcw = VFNMS(LDK(KP980785280), Tct, Tcs);
Chris@82 1092 ST(&(xo[WS(os, 28)]), VFNMSI(Tcw, Tcv), ovs, &(xo[0]));
Chris@82 1093 ST(&(xo[WS(os, 100)]), VFMAI(Tcw, Tcv), ovs, &(xo[0]));
Chris@82 1094 }
Chris@82 1095 {
Chris@82 1096 V Tcn, Tco, Tcr, Tcu;
Chris@82 1097 Tcn = VFMA(LDK(KP980785280), Tc4, TaZ);
Chris@82 1098 Tco = VFMA(LDK(KP980785280), Tcl, Tci);
Chris@82 1099 ST(&(xo[WS(os, 124)]), VFNMSI(Tco, Tcn), ovs, &(xo[0]));
Chris@82 1100 ST(&(xo[WS(os, 4)]), VFMAI(Tco, Tcn), ovs, &(xo[0]));
Chris@82 1101 Tcr = VFNMS(LDK(KP980785280), Tcq, Tcp);
Chris@82 1102 Tcu = VFMA(LDK(KP980785280), Tct, Tcs);
Chris@82 1103 ST(&(xo[WS(os, 36)]), VFMAI(Tcu, Tcr), ovs, &(xo[0]));
Chris@82 1104 ST(&(xo[WS(os, 92)]), VFNMSI(Tcu, Tcr), ovs, &(xo[0]));
Chris@82 1105 }
Chris@82 1106 }
Chris@82 1107 {
Chris@82 1108 V Tcz, TcR, TcK, TcU, TcG, TcV, TcN, TcS;
Chris@82 1109 {
Chris@82 1110 V Tcx, Tcy, TcI, TcJ;
Chris@82 1111 Tcx = VFNMS(LDK(KP707106781), Tas, Tad);
Chris@82 1112 Tcy = VADD(Tcf, Tcg);
Chris@82 1113 Tcz = VFMA(LDK(KP923879532), Tcy, Tcx);
Chris@82 1114 TcR = VFNMS(LDK(KP923879532), Tcy, Tcx);
Chris@82 1115 TcI = VFNMS(LDK(KP707106781), Tcd, Tcc);
Chris@82 1116 TcJ = VSUB(TaI, TaX);
Chris@82 1117 TcK = VFNMS(LDK(KP923879532), TcJ, TcI);
Chris@82 1118 TcU = VFMA(LDK(KP923879532), TcJ, TcI);
Chris@82 1119 {
Chris@82 1120 V TcC, TcL, TcF, TcM;
Chris@82 1121 {
Chris@82 1122 V TcA, TcB, TcD, TcE;
Chris@82 1123 TcA = VFNMS(LDK(KP707106781), Tbl, Tb6);
Chris@82 1124 TcB = VFNMS(LDK(KP707106781), Tbu, Tbt);
Chris@82 1125 TcC = VFMA(LDK(KP668178637), TcB, TcA);
Chris@82 1126 TcL = VFNMS(LDK(KP668178637), TcA, TcB);
Chris@82 1127 TcD = VFNMS(LDK(KP707106781), TbS, TbD);
Chris@82 1128 TcE = VFNMS(LDK(KP707106781), Tc1, Tc0);
Chris@82 1129 TcF = VFMA(LDK(KP668178637), TcE, TcD);
Chris@82 1130 TcM = VFNMS(LDK(KP668178637), TcD, TcE);
Chris@82 1131 }
Chris@82 1132 TcG = VADD(TcC, TcF);
Chris@82 1133 TcV = VSUB(TcC, TcF);
Chris@82 1134 TcN = VSUB(TcL, TcM);
Chris@82 1135 TcS = VADD(TcL, TcM);
Chris@82 1136 }
Chris@82 1137 }
Chris@82 1138 {
Chris@82 1139 V TcH, TcO, TcX, TcY;
Chris@82 1140 TcH = VFNMS(LDK(KP831469612), TcG, Tcz);
Chris@82 1141 TcO = VFNMS(LDK(KP831469612), TcN, TcK);
Chris@82 1142 ST(&(xo[WS(os, 76)]), VFNMSI(TcO, TcH), ovs, &(xo[0]));
Chris@82 1143 ST(&(xo[WS(os, 52)]), VFMAI(TcO, TcH), ovs, &(xo[0]));
Chris@82 1144 TcX = VFNMS(LDK(KP831469612), TcS, TcR);
Chris@82 1145 TcY = VFMA(LDK(KP831469612), TcV, TcU);
Chris@82 1146 ST(&(xo[WS(os, 20)]), VFMAI(TcY, TcX), ovs, &(xo[0]));
Chris@82 1147 ST(&(xo[WS(os, 108)]), VFNMSI(TcY, TcX), ovs, &(xo[0]));
Chris@82 1148 }
Chris@82 1149 {
Chris@82 1150 V TcP, TcQ, TcT, TcW;
Chris@82 1151 TcP = VFMA(LDK(KP831469612), TcG, Tcz);
Chris@82 1152 TcQ = VFMA(LDK(KP831469612), TcN, TcK);
Chris@82 1153 ST(&(xo[WS(os, 12)]), VFNMSI(TcQ, TcP), ovs, &(xo[0]));
Chris@82 1154 ST(&(xo[WS(os, 116)]), VFMAI(TcQ, TcP), ovs, &(xo[0]));
Chris@82 1155 TcT = VFMA(LDK(KP831469612), TcS, TcR);
Chris@82 1156 TcW = VFNMS(LDK(KP831469612), TcV, TcU);
Chris@82 1157 ST(&(xo[WS(os, 44)]), VFNMSI(TcW, TcT), ovs, &(xo[0]));
Chris@82 1158 ST(&(xo[WS(os, 84)]), VFMAI(TcW, TcT), ovs, &(xo[0]));
Chris@82 1159 }
Chris@82 1160 }
Chris@82 1161 {
Chris@82 1162 V TeF, Tga, TfF, Tg0, Tfy, Tg7, TfI, TfP, Tfm, TfJ, TfB, TfG, TfW, Tgb, Tg3;
Chris@82 1163 V Tg8;
Chris@82 1164 {
Chris@82 1165 V Tel, TfY, TeE, TfZ, Teu, TeD;
Chris@82 1166 Tel = VFMA(LDK(KP923879532), Tek, Ted);
Chris@82 1167 TfY = VFNMS(LDK(KP923879532), Tft, Tfq);
Chris@82 1168 Teu = VFNMS(LDK(KP198912367), Tet, Teq);
Chris@82 1169 TeD = VFNMS(LDK(KP198912367), TeC, Tez);
Chris@82 1170 TeE = VADD(Teu, TeD);
Chris@82 1171 TfZ = VSUB(Teu, TeD);
Chris@82 1172 TeF = VFMA(LDK(KP980785280), TeE, Tel);
Chris@82 1173 Tga = VFMA(LDK(KP980785280), TfZ, TfY);
Chris@82 1174 TfF = VFNMS(LDK(KP980785280), TeE, Tel);
Chris@82 1175 Tg0 = VFNMS(LDK(KP980785280), TfZ, TfY);
Chris@82 1176 }
Chris@82 1177 {
Chris@82 1178 V Tfu, TfN, Tfx, TfO, Tfv, Tfw;
Chris@82 1179 Tfu = VFMA(LDK(KP923879532), Tft, Tfq);
Chris@82 1180 TfN = VFNMS(LDK(KP923879532), Tek, Ted);
Chris@82 1181 Tfv = VFMA(LDK(KP198912367), Teq, Tet);
Chris@82 1182 Tfw = VFMA(LDK(KP198912367), Tez, TeC);
Chris@82 1183 Tfx = VSUB(Tfv, Tfw);
Chris@82 1184 TfO = VADD(Tfv, Tfw);
Chris@82 1185 Tfy = VFMA(LDK(KP980785280), Tfx, Tfu);
Chris@82 1186 Tg7 = VFNMS(LDK(KP980785280), TfO, TfN);
Chris@82 1187 TfI = VFNMS(LDK(KP980785280), Tfx, Tfu);
Chris@82 1188 TfP = VFMA(LDK(KP980785280), TfO, TfN);
Chris@82 1189 }
Chris@82 1190 {
Chris@82 1191 V Tf0, Tfz, Tfl, TfA;
Chris@82 1192 {
Chris@82 1193 V TeS, TeZ, Tfd, Tfk;
Chris@82 1194 TeS = VFMA(LDK(KP923879532), TeR, TeK);
Chris@82 1195 TeZ = VFMA(LDK(KP923879532), TeY, TeV);
Chris@82 1196 Tf0 = VFNMS(LDK(KP098491403), TeZ, TeS);
Chris@82 1197 Tfz = VFMA(LDK(KP098491403), TeS, TeZ);
Chris@82 1198 Tfd = VFMA(LDK(KP923879532), Tfc, Tf5);
Chris@82 1199 Tfk = VFMA(LDK(KP923879532), Tfj, Tfg);
Chris@82 1200 Tfl = VFNMS(LDK(KP098491403), Tfk, Tfd);
Chris@82 1201 TfA = VFMA(LDK(KP098491403), Tfd, Tfk);
Chris@82 1202 }
Chris@82 1203 Tfm = VADD(Tf0, Tfl);
Chris@82 1204 TfJ = VSUB(Tf0, Tfl);
Chris@82 1205 TfB = VSUB(Tfz, TfA);
Chris@82 1206 TfG = VADD(Tfz, TfA);
Chris@82 1207 }
Chris@82 1208 {
Chris@82 1209 V TfS, Tg1, TfV, Tg2;
Chris@82 1210 {
Chris@82 1211 V TfQ, TfR, TfT, TfU;
Chris@82 1212 TfQ = VFNMS(LDK(KP923879532), TeR, TeK);
Chris@82 1213 TfR = VFNMS(LDK(KP923879532), TeY, TeV);
Chris@82 1214 TfS = VFMA(LDK(KP820678790), TfR, TfQ);
Chris@82 1215 Tg1 = VFNMS(LDK(KP820678790), TfQ, TfR);
Chris@82 1216 TfT = VFNMS(LDK(KP923879532), Tfc, Tf5);
Chris@82 1217 TfU = VFNMS(LDK(KP923879532), Tfj, Tfg);
Chris@82 1218 TfV = VFMA(LDK(KP820678790), TfU, TfT);
Chris@82 1219 Tg2 = VFNMS(LDK(KP820678790), TfT, TfU);
Chris@82 1220 }
Chris@82 1221 TfW = VADD(TfS, TfV);
Chris@82 1222 Tgb = VSUB(TfS, TfV);
Chris@82 1223 Tg3 = VSUB(Tg1, Tg2);
Chris@82 1224 Tg8 = VADD(Tg1, Tg2);
Chris@82 1225 }
Chris@82 1226 {
Chris@82 1227 V Tfn, TfC, Tg9, Tgc;
Chris@82 1228 Tfn = VFNMS(LDK(KP995184726), Tfm, TeF);
Chris@82 1229 TfC = VFNMS(LDK(KP995184726), TfB, Tfy);
Chris@82 1230 ST(&(xo[WS(os, 62)]), VFNMSI(TfC, Tfn), ovs, &(xo[0]));
Chris@82 1231 ST(&(xo[WS(os, 66)]), VFMAI(TfC, Tfn), ovs, &(xo[0]));
Chris@82 1232 Tg9 = VFMA(LDK(KP773010453), Tg8, Tg7);
Chris@82 1233 Tgc = VFNMS(LDK(KP773010453), Tgb, Tga);
Chris@82 1234 ST(&(xo[WS(os, 46)]), VFNMSI(Tgc, Tg9), ovs, &(xo[0]));
Chris@82 1235 ST(&(xo[WS(os, 82)]), VFMAI(Tgc, Tg9), ovs, &(xo[0]));
Chris@82 1236 }
Chris@82 1237 {
Chris@82 1238 V Tgd, Tge, TfD, TfE;
Chris@82 1239 Tgd = VFNMS(LDK(KP773010453), Tg8, Tg7);
Chris@82 1240 Tge = VFMA(LDK(KP773010453), Tgb, Tga);
Chris@82 1241 ST(&(xo[WS(os, 18)]), VFMAI(Tge, Tgd), ovs, &(xo[0]));
Chris@82 1242 ST(&(xo[WS(os, 110)]), VFNMSI(Tge, Tgd), ovs, &(xo[0]));
Chris@82 1243 TfD = VFMA(LDK(KP995184726), Tfm, TeF);
Chris@82 1244 TfE = VFMA(LDK(KP995184726), TfB, Tfy);
Chris@82 1245 ST(&(xo[WS(os, 126)]), VFNMSI(TfE, TfD), ovs, &(xo[0]));
Chris@82 1246 ST(&(xo[WS(os, 2)]), VFMAI(TfE, TfD), ovs, &(xo[0]));
Chris@82 1247 }
Chris@82 1248 {
Chris@82 1249 V TfH, TfK, TfX, Tg4;
Chris@82 1250 TfH = VFNMS(LDK(KP995184726), TfG, TfF);
Chris@82 1251 TfK = VFMA(LDK(KP995184726), TfJ, TfI);
Chris@82 1252 ST(&(xo[WS(os, 34)]), VFMAI(TfK, TfH), ovs, &(xo[0]));
Chris@82 1253 ST(&(xo[WS(os, 94)]), VFNMSI(TfK, TfH), ovs, &(xo[0]));
Chris@82 1254 TfX = VFNMS(LDK(KP773010453), TfW, TfP);
Chris@82 1255 Tg4 = VFNMS(LDK(KP773010453), Tg3, Tg0);
Chris@82 1256 ST(&(xo[WS(os, 78)]), VFNMSI(Tg4, TfX), ovs, &(xo[0]));
Chris@82 1257 ST(&(xo[WS(os, 50)]), VFMAI(Tg4, TfX), ovs, &(xo[0]));
Chris@82 1258 }
Chris@82 1259 {
Chris@82 1260 V Tg5, Tg6, TfL, TfM;
Chris@82 1261 Tg5 = VFMA(LDK(KP773010453), TfW, TfP);
Chris@82 1262 Tg6 = VFMA(LDK(KP773010453), Tg3, Tg0);
Chris@82 1263 ST(&(xo[WS(os, 14)]), VFNMSI(Tg6, Tg5), ovs, &(xo[0]));
Chris@82 1264 ST(&(xo[WS(os, 114)]), VFMAI(Tg6, Tg5), ovs, &(xo[0]));
Chris@82 1265 TfL = VFMA(LDK(KP995184726), TfG, TfF);
Chris@82 1266 TfM = VFNMS(LDK(KP995184726), TfJ, TfI);
Chris@82 1267 ST(&(xo[WS(os, 30)]), VFNMSI(TfM, TfL), ovs, &(xo[0]));
Chris@82 1268 ST(&(xo[WS(os, 98)]), VFMAI(TfM, TfL), ovs, &(xo[0]));
Chris@82 1269 }
Chris@82 1270 }
Chris@82 1271 {
Chris@82 1272 V Tgp, Tho, TgT, The, TgM, Thl, TgW, Th3, TgE, TgX, TgP, TgU, Tha, Thp, Thh;
Chris@82 1273 V Thm;
Chris@82 1274 {
Chris@82 1275 V Tgh, Thc, Tgo, Thd, Tgk, Tgn;
Chris@82 1276 Tgh = VFNMS(LDK(KP923879532), Tgg, Tgf);
Chris@82 1277 Thc = VFNMS(LDK(KP923879532), TgH, TgG);
Chris@82 1278 Tgk = VFNMS(LDK(KP668178637), Tgj, Tgi);
Chris@82 1279 Tgn = VFNMS(LDK(KP668178637), Tgm, Tgl);
Chris@82 1280 Tgo = VADD(Tgk, Tgn);
Chris@82 1281 Thd = VSUB(Tgk, Tgn);
Chris@82 1282 Tgp = VFNMS(LDK(KP831469612), Tgo, Tgh);
Chris@82 1283 Tho = VFNMS(LDK(KP831469612), Thd, Thc);
Chris@82 1284 TgT = VFMA(LDK(KP831469612), Tgo, Tgh);
Chris@82 1285 The = VFMA(LDK(KP831469612), Thd, Thc);
Chris@82 1286 }
Chris@82 1287 {
Chris@82 1288 V TgI, Th1, TgL, Th2, TgJ, TgK;
Chris@82 1289 TgI = VFMA(LDK(KP923879532), TgH, TgG);
Chris@82 1290 Th1 = VFMA(LDK(KP923879532), Tgg, Tgf);
Chris@82 1291 TgJ = VFMA(LDK(KP668178637), Tgi, Tgj);
Chris@82 1292 TgK = VFMA(LDK(KP668178637), Tgl, Tgm);
Chris@82 1293 TgL = VSUB(TgJ, TgK);
Chris@82 1294 Th2 = VADD(TgJ, TgK);
Chris@82 1295 TgM = VFMA(LDK(KP831469612), TgL, TgI);
Chris@82 1296 Thl = VFNMS(LDK(KP831469612), Th2, Th1);
Chris@82 1297 TgW = VFNMS(LDK(KP831469612), TgL, TgI);
Chris@82 1298 Th3 = VFMA(LDK(KP831469612), Th2, Th1);
Chris@82 1299 }
Chris@82 1300 {
Chris@82 1301 V Tgw, TgN, TgD, TgO;
Chris@82 1302 {
Chris@82 1303 V Tgs, Tgv, Tgz, TgC;
Chris@82 1304 Tgs = VFNMS(LDK(KP923879532), Tgr, Tgq);
Chris@82 1305 Tgv = VFMA(LDK(KP923879532), Tgu, Tgt);
Chris@82 1306 Tgw = VFNMS(LDK(KP534511135), Tgv, Tgs);
Chris@82 1307 TgN = VFMA(LDK(KP534511135), Tgs, Tgv);
Chris@82 1308 Tgz = VFNMS(LDK(KP923879532), Tgy, Tgx);
Chris@82 1309 TgC = VFMA(LDK(KP923879532), TgB, TgA);
Chris@82 1310 TgD = VFNMS(LDK(KP534511135), TgC, Tgz);
Chris@82 1311 TgO = VFMA(LDK(KP534511135), Tgz, TgC);
Chris@82 1312 }
Chris@82 1313 TgE = VADD(Tgw, TgD);
Chris@82 1314 TgX = VSUB(Tgw, TgD);
Chris@82 1315 TgP = VSUB(TgN, TgO);
Chris@82 1316 TgU = VADD(TgN, TgO);
Chris@82 1317 }
Chris@82 1318 {
Chris@82 1319 V Th6, Thf, Th9, Thg;
Chris@82 1320 {
Chris@82 1321 V Th4, Th5, Th7, Th8;
Chris@82 1322 Th4 = VFMA(LDK(KP923879532), Tgr, Tgq);
Chris@82 1323 Th5 = VFNMS(LDK(KP923879532), Tgu, Tgt);
Chris@82 1324 Th6 = VFMA(LDK(KP303346683), Th5, Th4);
Chris@82 1325 Thf = VFNMS(LDK(KP303346683), Th4, Th5);
Chris@82 1326 Th7 = VFMA(LDK(KP923879532), Tgy, Tgx);
Chris@82 1327 Th8 = VFNMS(LDK(KP923879532), TgB, TgA);
Chris@82 1328 Th9 = VFMA(LDK(KP303346683), Th8, Th7);
Chris@82 1329 Thg = VFNMS(LDK(KP303346683), Th7, Th8);
Chris@82 1330 }
Chris@82 1331 Tha = VADD(Th6, Th9);
Chris@82 1332 Thp = VSUB(Th6, Th9);
Chris@82 1333 Thh = VSUB(Thf, Thg);
Chris@82 1334 Thm = VADD(Thf, Thg);
Chris@82 1335 }
Chris@82 1336 {
Chris@82 1337 V TgF, TgQ, Thn, Thq;
Chris@82 1338 TgF = VFNMS(LDK(KP881921264), TgE, Tgp);
Chris@82 1339 TgQ = VFNMS(LDK(KP881921264), TgP, TgM);
Chris@82 1340 ST(&(xo[WS(os, 54)]), VFNMSI(TgQ, TgF), ovs, &(xo[0]));
Chris@82 1341 ST(&(xo[WS(os, 74)]), VFMAI(TgQ, TgF), ovs, &(xo[0]));
Chris@82 1342 Thn = VFMA(LDK(KP956940335), Thm, Thl);
Chris@82 1343 Thq = VFNMS(LDK(KP956940335), Thp, Tho);
Chris@82 1344 ST(&(xo[WS(os, 38)]), VFNMSI(Thq, Thn), ovs, &(xo[0]));
Chris@82 1345 ST(&(xo[WS(os, 90)]), VFMAI(Thq, Thn), ovs, &(xo[0]));
Chris@82 1346 }
Chris@82 1347 {
Chris@82 1348 V Thr, Ths, TgR, TgS;
Chris@82 1349 Thr = VFNMS(LDK(KP956940335), Thm, Thl);
Chris@82 1350 Ths = VFMA(LDK(KP956940335), Thp, Tho);
Chris@82 1351 ST(&(xo[WS(os, 26)]), VFMAI(Ths, Thr), ovs, &(xo[0]));
Chris@82 1352 ST(&(xo[WS(os, 102)]), VFNMSI(Ths, Thr), ovs, &(xo[0]));
Chris@82 1353 TgR = VFMA(LDK(KP881921264), TgE, Tgp);
Chris@82 1354 TgS = VFMA(LDK(KP881921264), TgP, TgM);
Chris@82 1355 ST(&(xo[WS(os, 118)]), VFNMSI(TgS, TgR), ovs, &(xo[0]));
Chris@82 1356 ST(&(xo[WS(os, 10)]), VFMAI(TgS, TgR), ovs, &(xo[0]));
Chris@82 1357 }
Chris@82 1358 {
Chris@82 1359 V TgV, TgY, Thb, Thi;
Chris@82 1360 TgV = VFNMS(LDK(KP881921264), TgU, TgT);
Chris@82 1361 TgY = VFMA(LDK(KP881921264), TgX, TgW);
Chris@82 1362 ST(&(xo[WS(os, 42)]), VFMAI(TgY, TgV), ovs, &(xo[0]));
Chris@82 1363 ST(&(xo[WS(os, 86)]), VFNMSI(TgY, TgV), ovs, &(xo[0]));
Chris@82 1364 Thb = VFNMS(LDK(KP956940335), Tha, Th3);
Chris@82 1365 Thi = VFNMS(LDK(KP956940335), Thh, The);
Chris@82 1366 ST(&(xo[WS(os, 70)]), VFNMSI(Thi, Thb), ovs, &(xo[0]));
Chris@82 1367 ST(&(xo[WS(os, 58)]), VFMAI(Thi, Thb), ovs, &(xo[0]));
Chris@82 1368 }
Chris@82 1369 {
Chris@82 1370 V Thj, Thk, TgZ, Th0;
Chris@82 1371 Thj = VFMA(LDK(KP956940335), Tha, Th3);
Chris@82 1372 Thk = VFMA(LDK(KP956940335), Thh, The);
Chris@82 1373 ST(&(xo[WS(os, 6)]), VFNMSI(Thk, Thj), ovs, &(xo[0]));
Chris@82 1374 ST(&(xo[WS(os, 122)]), VFMAI(Thk, Thj), ovs, &(xo[0]));
Chris@82 1375 TgZ = VFMA(LDK(KP881921264), TgU, TgT);
Chris@82 1376 Th0 = VFNMS(LDK(KP881921264), TgX, TgW);
Chris@82 1377 ST(&(xo[WS(os, 22)]), VFNMSI(Th0, TgZ), ovs, &(xo[0]));
Chris@82 1378 ST(&(xo[WS(os, 106)]), VFMAI(Th0, TgZ), ovs, &(xo[0]));
Chris@82 1379 }
Chris@82 1380 }
Chris@82 1381 {
Chris@82 1382 V T80, T8n, T8f, T8k, T8A, T8P, T8H, T8M, T7n, T8L, T8O, T8c, T8j, T8t, T8E;
Chris@82 1383 V T8m;
Chris@82 1384 {
Chris@82 1385 V T7G, T8d, T7Z, T8e;
Chris@82 1386 {
Chris@82 1387 V T7y, T7F, T7R, T7Y;
Chris@82 1388 T7y = VFMA(LDK(KP831469612), T7x, T7q);
Chris@82 1389 T7F = VFMA(LDK(KP831469612), T7E, T7B);
Chris@82 1390 T7G = VFMA(LDK(KP148335987), T7F, T7y);
Chris@82 1391 T8d = VFNMS(LDK(KP148335987), T7y, T7F);
Chris@82 1392 T7R = VFMA(LDK(KP831469612), T7Q, T7J);
Chris@82 1393 T7Y = VFMA(LDK(KP831469612), T7X, T7U);
Chris@82 1394 T7Z = VFMA(LDK(KP148335987), T7Y, T7R);
Chris@82 1395 T8e = VFNMS(LDK(KP148335987), T7R, T7Y);
Chris@82 1396 }
Chris@82 1397 T80 = VADD(T7G, T7Z);
Chris@82 1398 T8n = VSUB(T7G, T7Z);
Chris@82 1399 T8f = VSUB(T8d, T8e);
Chris@82 1400 T8k = VADD(T8d, T8e);
Chris@82 1401 }
Chris@82 1402 {
Chris@82 1403 V T8w, T8F, T8z, T8G;
Chris@82 1404 {
Chris@82 1405 V T8u, T8v, T8x, T8y;
Chris@82 1406 T8u = VFNMS(LDK(KP831469612), T7x, T7q);
Chris@82 1407 T8v = VFNMS(LDK(KP831469612), T7E, T7B);
Chris@82 1408 T8w = VFNMS(LDK(KP741650546), T8v, T8u);
Chris@82 1409 T8F = VFMA(LDK(KP741650546), T8u, T8v);
Chris@82 1410 T8x = VFNMS(LDK(KP831469612), T7Q, T7J);
Chris@82 1411 T8y = VFNMS(LDK(KP831469612), T7X, T7U);
Chris@82 1412 T8z = VFNMS(LDK(KP741650546), T8y, T8x);
Chris@82 1413 T8G = VFMA(LDK(KP741650546), T8x, T8y);
Chris@82 1414 }
Chris@82 1415 T8A = VADD(T8w, T8z);
Chris@82 1416 T8P = VSUB(T8w, T8z);
Chris@82 1417 T8H = VSUB(T8F, T8G);
Chris@82 1418 T8M = VADD(T8F, T8G);
Chris@82 1419 }
Chris@82 1420 {
Chris@82 1421 V T77, T8r, T88, T8C, T7m, T8D, T8b, T8s, T76, T87;
Chris@82 1422 T76 = VADD(T72, T75);
Chris@82 1423 T77 = VFMA(LDK(KP831469612), T76, T6Z);
Chris@82 1424 T8r = VFNMS(LDK(KP831469612), T76, T6Z);
Chris@82 1425 T87 = VSUB(T85, T86);
Chris@82 1426 T88 = VFMA(LDK(KP831469612), T87, T84);
Chris@82 1427 T8C = VFNMS(LDK(KP831469612), T87, T84);
Chris@82 1428 {
Chris@82 1429 V T7e, T7l, T89, T8a;
Chris@82 1430 T7e = VFMA(LDK(KP303346683), T7d, T7a);
Chris@82 1431 T7l = VFMA(LDK(KP303346683), T7k, T7h);
Chris@82 1432 T7m = VADD(T7e, T7l);
Chris@82 1433 T8D = VSUB(T7e, T7l);
Chris@82 1434 T89 = VFNMS(LDK(KP303346683), T7a, T7d);
Chris@82 1435 T8a = VFNMS(LDK(KP303346683), T7h, T7k);
Chris@82 1436 T8b = VSUB(T89, T8a);
Chris@82 1437 T8s = VADD(T89, T8a);
Chris@82 1438 }
Chris@82 1439 T7n = VFMA(LDK(KP956940335), T7m, T77);
Chris@82 1440 T8L = VFMA(LDK(KP956940335), T8s, T8r);
Chris@82 1441 T8O = VFNMS(LDK(KP956940335), T8D, T8C);
Chris@82 1442 T8c = VFMA(LDK(KP956940335), T8b, T88);
Chris@82 1443 T8j = VFNMS(LDK(KP956940335), T7m, T77);
Chris@82 1444 T8t = VFNMS(LDK(KP956940335), T8s, T8r);
Chris@82 1445 T8E = VFMA(LDK(KP956940335), T8D, T8C);
Chris@82 1446 T8m = VFNMS(LDK(KP956940335), T8b, T88);
Chris@82 1447 }
Chris@82 1448 {
Chris@82 1449 V T81, T8g, T8N, T8Q;
Chris@82 1450 T81 = VFNMS(LDK(KP989176509), T80, T7n);
Chris@82 1451 T8g = VFNMS(LDK(KP989176509), T8f, T8c);
Chris@82 1452 ST(&(xo[WS(os, 67)]), VFNMSI(T8g, T81), ovs, &(xo[WS(os, 1)]));
Chris@82 1453 ST(&(xo[WS(os, 61)]), VFMAI(T8g, T81), ovs, &(xo[WS(os, 1)]));
Chris@82 1454 T8N = VFNMS(LDK(KP803207531), T8M, T8L);
Chris@82 1455 T8Q = VFMA(LDK(KP803207531), T8P, T8O);
Chris@82 1456 ST(&(xo[WS(os, 45)]), VFMAI(T8Q, T8N), ovs, &(xo[WS(os, 1)]));
Chris@82 1457 ST(&(xo[WS(os, 83)]), VFNMSI(T8Q, T8N), ovs, &(xo[WS(os, 1)]));
Chris@82 1458 }
Chris@82 1459 {
Chris@82 1460 V T8R, T8S, T8h, T8i;
Chris@82 1461 T8R = VFMA(LDK(KP803207531), T8M, T8L);
Chris@82 1462 T8S = VFNMS(LDK(KP803207531), T8P, T8O);
Chris@82 1463 ST(&(xo[WS(os, 19)]), VFNMSI(T8S, T8R), ovs, &(xo[WS(os, 1)]));
Chris@82 1464 ST(&(xo[WS(os, 109)]), VFMAI(T8S, T8R), ovs, &(xo[WS(os, 1)]));
Chris@82 1465 T8h = VFMA(LDK(KP989176509), T80, T7n);
Chris@82 1466 T8i = VFMA(LDK(KP989176509), T8f, T8c);
Chris@82 1467 ST(&(xo[WS(os, 3)]), VFNMSI(T8i, T8h), ovs, &(xo[WS(os, 1)]));
Chris@82 1468 ST(&(xo[WS(os, 125)]), VFMAI(T8i, T8h), ovs, &(xo[WS(os, 1)]));
Chris@82 1469 }
Chris@82 1470 {
Chris@82 1471 V T8l, T8o, T8B, T8I;
Chris@82 1472 T8l = VFMA(LDK(KP989176509), T8k, T8j);
Chris@82 1473 T8o = VFNMS(LDK(KP989176509), T8n, T8m);
Chris@82 1474 ST(&(xo[WS(os, 35)]), VFNMSI(T8o, T8l), ovs, &(xo[WS(os, 1)]));
Chris@82 1475 ST(&(xo[WS(os, 93)]), VFMAI(T8o, T8l), ovs, &(xo[WS(os, 1)]));
Chris@82 1476 T8B = VFNMS(LDK(KP803207531), T8A, T8t);
Chris@82 1477 T8I = VFNMS(LDK(KP803207531), T8H, T8E);
Chris@82 1478 ST(&(xo[WS(os, 51)]), VFNMSI(T8I, T8B), ovs, &(xo[WS(os, 1)]));
Chris@82 1479 ST(&(xo[WS(os, 77)]), VFMAI(T8I, T8B), ovs, &(xo[WS(os, 1)]));
Chris@82 1480 }
Chris@82 1481 {
Chris@82 1482 V T8J, T8K, T8p, T8q;
Chris@82 1483 T8J = VFMA(LDK(KP803207531), T8A, T8t);
Chris@82 1484 T8K = VFMA(LDK(KP803207531), T8H, T8E);
Chris@82 1485 ST(&(xo[WS(os, 115)]), VFNMSI(T8K, T8J), ovs, &(xo[WS(os, 1)]));
Chris@82 1486 ST(&(xo[WS(os, 13)]), VFMAI(T8K, T8J), ovs, &(xo[WS(os, 1)]));
Chris@82 1487 T8p = VFNMS(LDK(KP989176509), T8k, T8j);
Chris@82 1488 T8q = VFMA(LDK(KP989176509), T8n, T8m);
Chris@82 1489 ST(&(xo[WS(os, 29)]), VFMAI(T8q, T8p), ovs, &(xo[WS(os, 1)]));
Chris@82 1490 ST(&(xo[WS(os, 99)]), VFNMSI(T8q, T8p), ovs, &(xo[WS(os, 1)]));
Chris@82 1491 }
Chris@82 1492 }
Chris@82 1493 {
Chris@82 1494 V T4K, T5d, T55, T5a, T5q, T5F, T5x, T5C, T2f, T5B, T5E, T52, T59, T5j, T5u;
Chris@82 1495 V T5c;
Chris@82 1496 {
Chris@82 1497 V T3u, T53, T4J, T54;
Chris@82 1498 {
Chris@82 1499 V T3g, T3t, T4v, T4I;
Chris@82 1500 T3g = VFMA(LDK(KP980785280), T3f, T2G);
Chris@82 1501 T3t = VFMA(LDK(KP980785280), T3s, T3p);
Chris@82 1502 T3u = VFNMS(LDK(KP049126849), T3t, T3g);
Chris@82 1503 T53 = VFMA(LDK(KP049126849), T3g, T3t);
Chris@82 1504 T4v = VFMA(LDK(KP980785280), T4u, T3V);
Chris@82 1505 T4I = VFMA(LDK(KP980785280), T4H, T4E);
Chris@82 1506 T4J = VFNMS(LDK(KP049126849), T4I, T4v);
Chris@82 1507 T54 = VFMA(LDK(KP049126849), T4v, T4I);
Chris@82 1508 }
Chris@82 1509 T4K = VADD(T3u, T4J);
Chris@82 1510 T5d = VSUB(T3u, T4J);
Chris@82 1511 T55 = VSUB(T53, T54);
Chris@82 1512 T5a = VADD(T53, T54);
Chris@82 1513 }
Chris@82 1514 {
Chris@82 1515 V T5m, T5v, T5p, T5w;
Chris@82 1516 {
Chris@82 1517 V T5k, T5l, T5n, T5o;
Chris@82 1518 T5k = VFNMS(LDK(KP980785280), T3f, T2G);
Chris@82 1519 T5l = VFNMS(LDK(KP980785280), T3s, T3p);
Chris@82 1520 T5m = VFMA(LDK(KP906347169), T5l, T5k);
Chris@82 1521 T5v = VFNMS(LDK(KP906347169), T5k, T5l);
Chris@82 1522 T5n = VFNMS(LDK(KP980785280), T4u, T3V);
Chris@82 1523 T5o = VFNMS(LDK(KP980785280), T4H, T4E);
Chris@82 1524 T5p = VFMA(LDK(KP906347169), T5o, T5n);
Chris@82 1525 T5w = VFNMS(LDK(KP906347169), T5n, T5o);
Chris@82 1526 }
Chris@82 1527 T5q = VADD(T5m, T5p);
Chris@82 1528 T5F = VSUB(T5m, T5p);
Chris@82 1529 T5x = VSUB(T5v, T5w);
Chris@82 1530 T5C = VADD(T5v, T5w);
Chris@82 1531 }
Chris@82 1532 {
Chris@82 1533 V T11, T5h, T4Y, T5s, T2e, T5t, T51, T5i, T10, T4X;
Chris@82 1534 T10 = VADD(TI, TZ);
Chris@82 1535 T11 = VFMA(LDK(KP980785280), T10, Tr);
Chris@82 1536 T5h = VFNMS(LDK(KP980785280), T10, Tr);
Chris@82 1537 T4X = VSUB(T4V, T4W);
Chris@82 1538 T4Y = VFMA(LDK(KP980785280), T4X, T4U);
Chris@82 1539 T5s = VFNMS(LDK(KP980785280), T4X, T4U);
Chris@82 1540 {
Chris@82 1541 V T1C, T2d, T4Z, T50;
Chris@82 1542 T1C = VFNMS(LDK(KP098491403), T1B, T1s);
Chris@82 1543 T2d = VFNMS(LDK(KP098491403), T2c, T23);
Chris@82 1544 T2e = VADD(T1C, T2d);
Chris@82 1545 T5t = VSUB(T1C, T2d);
Chris@82 1546 T4Z = VFMA(LDK(KP098491403), T1s, T1B);
Chris@82 1547 T50 = VFMA(LDK(KP098491403), T23, T2c);
Chris@82 1548 T51 = VSUB(T4Z, T50);
Chris@82 1549 T5i = VADD(T4Z, T50);
Chris@82 1550 }
Chris@82 1551 T2f = VFMA(LDK(KP995184726), T2e, T11);
Chris@82 1552 T5B = VFNMS(LDK(KP995184726), T5i, T5h);
Chris@82 1553 T5E = VFMA(LDK(KP995184726), T5t, T5s);
Chris@82 1554 T52 = VFMA(LDK(KP995184726), T51, T4Y);
Chris@82 1555 T59 = VFNMS(LDK(KP995184726), T2e, T11);
Chris@82 1556 T5j = VFMA(LDK(KP995184726), T5i, T5h);
Chris@82 1557 T5u = VFNMS(LDK(KP995184726), T5t, T5s);
Chris@82 1558 T5c = VFNMS(LDK(KP995184726), T51, T4Y);
Chris@82 1559 }
Chris@82 1560 {
Chris@82 1561 V T4L, T56, T5D, T5G;
Chris@82 1562 T4L = VFNMS(LDK(KP998795456), T4K, T2f);
Chris@82 1563 T56 = VFNMS(LDK(KP998795456), T55, T52);
Chris@82 1564 ST(&(xo[WS(os, 63)]), VFNMSI(T56, T4L), ovs, &(xo[WS(os, 1)]));
Chris@82 1565 ST(&(xo[WS(os, 65)]), VFMAI(T56, T4L), ovs, &(xo[WS(os, 1)]));
Chris@82 1566 T5D = VFMA(LDK(KP740951125), T5C, T5B);
Chris@82 1567 T5G = VFNMS(LDK(KP740951125), T5F, T5E);
Chris@82 1568 ST(&(xo[WS(os, 47)]), VFNMSI(T5G, T5D), ovs, &(xo[WS(os, 1)]));
Chris@82 1569 ST(&(xo[WS(os, 81)]), VFMAI(T5G, T5D), ovs, &(xo[WS(os, 1)]));
Chris@82 1570 }
Chris@82 1571 {
Chris@82 1572 V T5H, T5I, T57, T58;
Chris@82 1573 T5H = VFNMS(LDK(KP740951125), T5C, T5B);
Chris@82 1574 T5I = VFMA(LDK(KP740951125), T5F, T5E);
Chris@82 1575 ST(&(xo[WS(os, 17)]), VFMAI(T5I, T5H), ovs, &(xo[WS(os, 1)]));
Chris@82 1576 ST(&(xo[WS(os, 111)]), VFNMSI(T5I, T5H), ovs, &(xo[WS(os, 1)]));
Chris@82 1577 T57 = VFMA(LDK(KP998795456), T4K, T2f);
Chris@82 1578 T58 = VFMA(LDK(KP998795456), T55, T52);
Chris@82 1579 ST(&(xo[WS(os, 127)]), VFNMSI(T58, T57), ovs, &(xo[WS(os, 1)]));
Chris@82 1580 ST(&(xo[WS(os, 1)]), VFMAI(T58, T57), ovs, &(xo[WS(os, 1)]));
Chris@82 1581 }
Chris@82 1582 {
Chris@82 1583 V T5b, T5e, T5r, T5y;
Chris@82 1584 T5b = VFNMS(LDK(KP998795456), T5a, T59);
Chris@82 1585 T5e = VFMA(LDK(KP998795456), T5d, T5c);
Chris@82 1586 ST(&(xo[WS(os, 33)]), VFMAI(T5e, T5b), ovs, &(xo[WS(os, 1)]));
Chris@82 1587 ST(&(xo[WS(os, 95)]), VFNMSI(T5e, T5b), ovs, &(xo[WS(os, 1)]));
Chris@82 1588 T5r = VFNMS(LDK(KP740951125), T5q, T5j);
Chris@82 1589 T5y = VFNMS(LDK(KP740951125), T5x, T5u);
Chris@82 1590 ST(&(xo[WS(os, 79)]), VFNMSI(T5y, T5r), ovs, &(xo[WS(os, 1)]));
Chris@82 1591 ST(&(xo[WS(os, 49)]), VFMAI(T5y, T5r), ovs, &(xo[WS(os, 1)]));
Chris@82 1592 }
Chris@82 1593 {
Chris@82 1594 V T5z, T5A, T5f, T5g;
Chris@82 1595 T5z = VFMA(LDK(KP740951125), T5q, T5j);
Chris@82 1596 T5A = VFMA(LDK(KP740951125), T5x, T5u);
Chris@82 1597 ST(&(xo[WS(os, 15)]), VFNMSI(T5A, T5z), ovs, &(xo[WS(os, 1)]));
Chris@82 1598 ST(&(xo[WS(os, 113)]), VFMAI(T5A, T5z), ovs, &(xo[WS(os, 1)]));
Chris@82 1599 T5f = VFMA(LDK(KP998795456), T5a, T59);
Chris@82 1600 T5g = VFNMS(LDK(KP998795456), T5d, T5c);
Chris@82 1601 ST(&(xo[WS(os, 31)]), VFNMSI(T5g, T5f), ovs, &(xo[WS(os, 1)]));
Chris@82 1602 ST(&(xo[WS(os, 97)]), VFMAI(T5g, T5f), ovs, &(xo[WS(os, 1)]));
Chris@82 1603 }
Chris@82 1604 }
Chris@82 1605 {
Chris@82 1606 V T9i, T9B, T9t, T9y, T9O, Ta3, T9V, Ta0, T93, T9Z, Ta2, T9q, T9x, T9H, T9S;
Chris@82 1607 V T9A;
Chris@82 1608 {
Chris@82 1609 V T9a, T9r, T9h, T9s;
Chris@82 1610 {
Chris@82 1611 V T96, T99, T9d, T9g;
Chris@82 1612 T96 = VFNMS(LDK(KP831469612), T95, T94);
Chris@82 1613 T99 = VFNMS(LDK(KP831469612), T98, T97);
Chris@82 1614 T9a = VFMA(LDK(KP599376933), T99, T96);
Chris@82 1615 T9r = VFNMS(LDK(KP599376933), T96, T99);
Chris@82 1616 T9d = VFNMS(LDK(KP831469612), T9c, T9b);
Chris@82 1617 T9g = VFNMS(LDK(KP831469612), T9f, T9e);
Chris@82 1618 T9h = VFMA(LDK(KP599376933), T9g, T9d);
Chris@82 1619 T9s = VFNMS(LDK(KP599376933), T9d, T9g);
Chris@82 1620 }
Chris@82 1621 T9i = VADD(T9a, T9h);
Chris@82 1622 T9B = VSUB(T9a, T9h);
Chris@82 1623 T9t = VSUB(T9r, T9s);
Chris@82 1624 T9y = VADD(T9r, T9s);
Chris@82 1625 }
Chris@82 1626 {
Chris@82 1627 V T9K, T9T, T9N, T9U;
Chris@82 1628 {
Chris@82 1629 V T9I, T9J, T9L, T9M;
Chris@82 1630 T9I = VFMA(LDK(KP831469612), T95, T94);
Chris@82 1631 T9J = VFMA(LDK(KP831469612), T98, T97);
Chris@82 1632 T9K = VFNMS(LDK(KP250486960), T9J, T9I);
Chris@82 1633 T9T = VFMA(LDK(KP250486960), T9I, T9J);
Chris@82 1634 T9L = VFMA(LDK(KP831469612), T9c, T9b);
Chris@82 1635 T9M = VFMA(LDK(KP831469612), T9f, T9e);
Chris@82 1636 T9N = VFNMS(LDK(KP250486960), T9M, T9L);
Chris@82 1637 T9U = VFMA(LDK(KP250486960), T9L, T9M);
Chris@82 1638 }
Chris@82 1639 T9O = VADD(T9K, T9N);
Chris@82 1640 Ta3 = VSUB(T9K, T9N);
Chris@82 1641 T9V = VSUB(T9T, T9U);
Chris@82 1642 Ta0 = VADD(T9T, T9U);
Chris@82 1643 }
Chris@82 1644 {
Chris@82 1645 V T8V, T9F, T9m, T9Q, T92, T9R, T9p, T9G, T8U, T9l;
Chris@82 1646 T8U = VADD(T85, T86);
Chris@82 1647 T8V = VFMA(LDK(KP831469612), T8U, T8T);
Chris@82 1648 T9F = VFNMS(LDK(KP831469612), T8U, T8T);
Chris@82 1649 T9l = VSUB(T72, T75);
Chris@82 1650 T9m = VFNMS(LDK(KP831469612), T9l, T9k);
Chris@82 1651 T9Q = VFMA(LDK(KP831469612), T9l, T9k);
Chris@82 1652 {
Chris@82 1653 V T8Y, T91, T9n, T9o;
Chris@82 1654 T8Y = VFMA(LDK(KP534511135), T8X, T8W);
Chris@82 1655 T91 = VFMA(LDK(KP534511135), T90, T8Z);
Chris@82 1656 T92 = VADD(T8Y, T91);
Chris@82 1657 T9R = VSUB(T8Y, T91);
Chris@82 1658 T9n = VFNMS(LDK(KP534511135), T8W, T8X);
Chris@82 1659 T9o = VFNMS(LDK(KP534511135), T8Z, T90);
Chris@82 1660 T9p = VSUB(T9n, T9o);
Chris@82 1661 T9G = VADD(T9n, T9o);
Chris@82 1662 }
Chris@82 1663 T93 = VFMA(LDK(KP881921264), T92, T8V);
Chris@82 1664 T9Z = VFNMS(LDK(KP881921264), T9G, T9F);
Chris@82 1665 Ta2 = VFNMS(LDK(KP881921264), T9R, T9Q);
Chris@82 1666 T9q = VFNMS(LDK(KP881921264), T9p, T9m);
Chris@82 1667 T9x = VFNMS(LDK(KP881921264), T92, T8V);
Chris@82 1668 T9H = VFMA(LDK(KP881921264), T9G, T9F);
Chris@82 1669 T9S = VFMA(LDK(KP881921264), T9R, T9Q);
Chris@82 1670 T9A = VFMA(LDK(KP881921264), T9p, T9m);
Chris@82 1671 }
Chris@82 1672 {
Chris@82 1673 V T9j, T9u, Ta1, Ta4;
Chris@82 1674 T9j = VFNMS(LDK(KP857728610), T9i, T93);
Chris@82 1675 T9u = VFNMS(LDK(KP857728610), T9t, T9q);
Chris@82 1676 ST(&(xo[WS(os, 75)]), VFNMSI(T9u, T9j), ovs, &(xo[WS(os, 1)]));
Chris@82 1677 ST(&(xo[WS(os, 53)]), VFMAI(T9u, T9j), ovs, &(xo[WS(os, 1)]));
Chris@82 1678 Ta1 = VFNMS(LDK(KP970031253), Ta0, T9Z);
Chris@82 1679 Ta4 = VFMA(LDK(KP970031253), Ta3, Ta2);
Chris@82 1680 ST(&(xo[WS(os, 37)]), VFMAI(Ta4, Ta1), ovs, &(xo[WS(os, 1)]));
Chris@82 1681 ST(&(xo[WS(os, 91)]), VFNMSI(Ta4, Ta1), ovs, &(xo[WS(os, 1)]));
Chris@82 1682 }
Chris@82 1683 {
Chris@82 1684 V Ta5, Ta6, T9v, T9w;
Chris@82 1685 Ta5 = VFMA(LDK(KP970031253), Ta0, T9Z);
Chris@82 1686 Ta6 = VFNMS(LDK(KP970031253), Ta3, Ta2);
Chris@82 1687 ST(&(xo[WS(os, 27)]), VFNMSI(Ta6, Ta5), ovs, &(xo[WS(os, 1)]));
Chris@82 1688 ST(&(xo[WS(os, 101)]), VFMAI(Ta6, Ta5), ovs, &(xo[WS(os, 1)]));
Chris@82 1689 T9v = VFMA(LDK(KP857728610), T9i, T93);
Chris@82 1690 T9w = VFMA(LDK(KP857728610), T9t, T9q);
Chris@82 1691 ST(&(xo[WS(os, 11)]), VFNMSI(T9w, T9v), ovs, &(xo[WS(os, 1)]));
Chris@82 1692 ST(&(xo[WS(os, 117)]), VFMAI(T9w, T9v), ovs, &(xo[WS(os, 1)]));
Chris@82 1693 }
Chris@82 1694 {
Chris@82 1695 V T9z, T9C, T9P, T9W;
Chris@82 1696 T9z = VFMA(LDK(KP857728610), T9y, T9x);
Chris@82 1697 T9C = VFNMS(LDK(KP857728610), T9B, T9A);
Chris@82 1698 ST(&(xo[WS(os, 43)]), VFNMSI(T9C, T9z), ovs, &(xo[WS(os, 1)]));
Chris@82 1699 ST(&(xo[WS(os, 85)]), VFMAI(T9C, T9z), ovs, &(xo[WS(os, 1)]));
Chris@82 1700 T9P = VFNMS(LDK(KP970031253), T9O, T9H);
Chris@82 1701 T9W = VFNMS(LDK(KP970031253), T9V, T9S);
Chris@82 1702 ST(&(xo[WS(os, 59)]), VFNMSI(T9W, T9P), ovs, &(xo[WS(os, 1)]));
Chris@82 1703 ST(&(xo[WS(os, 69)]), VFMAI(T9W, T9P), ovs, &(xo[WS(os, 1)]));
Chris@82 1704 }
Chris@82 1705 {
Chris@82 1706 V T9X, T9Y, T9D, T9E;
Chris@82 1707 T9X = VFMA(LDK(KP970031253), T9O, T9H);
Chris@82 1708 T9Y = VFMA(LDK(KP970031253), T9V, T9S);
Chris@82 1709 ST(&(xo[WS(os, 123)]), VFNMSI(T9Y, T9X), ovs, &(xo[WS(os, 1)]));
Chris@82 1710 ST(&(xo[WS(os, 5)]), VFMAI(T9Y, T9X), ovs, &(xo[WS(os, 1)]));
Chris@82 1711 T9D = VFNMS(LDK(KP857728610), T9y, T9x);
Chris@82 1712 T9E = VFMA(LDK(KP857728610), T9B, T9A);
Chris@82 1713 ST(&(xo[WS(os, 21)]), VFMAI(T9E, T9D), ovs, &(xo[WS(os, 1)]));
Chris@82 1714 ST(&(xo[WS(os, 107)]), VFNMSI(T9E, T9D), ovs, &(xo[WS(os, 1)]));
Chris@82 1715 }
Chris@82 1716 }
Chris@82 1717 {
Chris@82 1718 V T68, T6r, T6j, T6o, T6E, T6T, T6L, T6Q, T5T, T6P, T6S, T6g, T6n, T6x, T6I;
Chris@82 1719 V T6q;
Chris@82 1720 {
Chris@82 1721 V T60, T6h, T67, T6i;
Chris@82 1722 {
Chris@82 1723 V T5W, T5Z, T63, T66;
Chris@82 1724 T5W = VFNMS(LDK(KP980785280), T5V, T5U);
Chris@82 1725 T5Z = VFMA(LDK(KP980785280), T5Y, T5X);
Chris@82 1726 T60 = VFNMS(LDK(KP472964775), T5Z, T5W);
Chris@82 1727 T6h = VFMA(LDK(KP472964775), T5W, T5Z);
Chris@82 1728 T63 = VFNMS(LDK(KP980785280), T62, T61);
Chris@82 1729 T66 = VFMA(LDK(KP980785280), T65, T64);
Chris@82 1730 T67 = VFNMS(LDK(KP472964775), T66, T63);
Chris@82 1731 T6i = VFMA(LDK(KP472964775), T63, T66);
Chris@82 1732 }
Chris@82 1733 T68 = VADD(T60, T67);
Chris@82 1734 T6r = VSUB(T60, T67);
Chris@82 1735 T6j = VSUB(T6h, T6i);
Chris@82 1736 T6o = VADD(T6h, T6i);
Chris@82 1737 }
Chris@82 1738 {
Chris@82 1739 V T6A, T6J, T6D, T6K;
Chris@82 1740 {
Chris@82 1741 V T6y, T6z, T6B, T6C;
Chris@82 1742 T6y = VFMA(LDK(KP980785280), T5V, T5U);
Chris@82 1743 T6z = VFNMS(LDK(KP980785280), T5Y, T5X);
Chris@82 1744 T6A = VFMA(LDK(KP357805721), T6z, T6y);
Chris@82 1745 T6J = VFNMS(LDK(KP357805721), T6y, T6z);
Chris@82 1746 T6B = VFMA(LDK(KP980785280), T62, T61);
Chris@82 1747 T6C = VFNMS(LDK(KP980785280), T65, T64);
Chris@82 1748 T6D = VFMA(LDK(KP357805721), T6C, T6B);
Chris@82 1749 T6K = VFNMS(LDK(KP357805721), T6B, T6C);
Chris@82 1750 }
Chris@82 1751 T6E = VADD(T6A, T6D);
Chris@82 1752 T6T = VSUB(T6A, T6D);
Chris@82 1753 T6L = VSUB(T6J, T6K);
Chris@82 1754 T6Q = VADD(T6J, T6K);
Chris@82 1755 }
Chris@82 1756 {
Chris@82 1757 V T5L, T6v, T6c, T6G, T5S, T6H, T6f, T6w, T5K, T6b;
Chris@82 1758 T5K = VADD(T4V, T4W);
Chris@82 1759 T5L = VFNMS(LDK(KP980785280), T5K, T5J);
Chris@82 1760 T6v = VFMA(LDK(KP980785280), T5K, T5J);
Chris@82 1761 T6b = VSUB(TI, TZ);
Chris@82 1762 T6c = VFMA(LDK(KP980785280), T6b, T6a);
Chris@82 1763 T6G = VFNMS(LDK(KP980785280), T6b, T6a);
Chris@82 1764 {
Chris@82 1765 V T5O, T5R, T6d, T6e;
Chris@82 1766 T5O = VFNMS(LDK(KP820678790), T5N, T5M);
Chris@82 1767 T5R = VFNMS(LDK(KP820678790), T5Q, T5P);
Chris@82 1768 T5S = VADD(T5O, T5R);
Chris@82 1769 T6H = VSUB(T5O, T5R);
Chris@82 1770 T6d = VFMA(LDK(KP820678790), T5M, T5N);
Chris@82 1771 T6e = VFMA(LDK(KP820678790), T5P, T5Q);
Chris@82 1772 T6f = VSUB(T6d, T6e);
Chris@82 1773 T6w = VADD(T6d, T6e);
Chris@82 1774 }
Chris@82 1775 T5T = VFNMS(LDK(KP773010453), T5S, T5L);
Chris@82 1776 T6P = VFNMS(LDK(KP773010453), T6w, T6v);
Chris@82 1777 T6S = VFNMS(LDK(KP773010453), T6H, T6G);
Chris@82 1778 T6g = VFMA(LDK(KP773010453), T6f, T6c);
Chris@82 1779 T6n = VFMA(LDK(KP773010453), T5S, T5L);
Chris@82 1780 T6x = VFMA(LDK(KP773010453), T6w, T6v);
Chris@82 1781 T6I = VFMA(LDK(KP773010453), T6H, T6G);
Chris@82 1782 T6q = VFNMS(LDK(KP773010453), T6f, T6c);
Chris@82 1783 }
Chris@82 1784 {
Chris@82 1785 V T69, T6k, T6R, T6U;
Chris@82 1786 T69 = VFNMS(LDK(KP903989293), T68, T5T);
Chris@82 1787 T6k = VFNMS(LDK(KP903989293), T6j, T6g);
Chris@82 1788 ST(&(xo[WS(os, 55)]), VFNMSI(T6k, T69), ovs, &(xo[WS(os, 1)]));
Chris@82 1789 ST(&(xo[WS(os, 73)]), VFMAI(T6k, T69), ovs, &(xo[WS(os, 1)]));
Chris@82 1790 T6R = VFMA(LDK(KP941544065), T6Q, T6P);
Chris@82 1791 T6U = VFNMS(LDK(KP941544065), T6T, T6S);
Chris@82 1792 ST(&(xo[WS(os, 39)]), VFNMSI(T6U, T6R), ovs, &(xo[WS(os, 1)]));
Chris@82 1793 ST(&(xo[WS(os, 89)]), VFMAI(T6U, T6R), ovs, &(xo[WS(os, 1)]));
Chris@82 1794 }
Chris@82 1795 {
Chris@82 1796 V T6V, T6W, T6l, T6m;
Chris@82 1797 T6V = VFNMS(LDK(KP941544065), T6Q, T6P);
Chris@82 1798 T6W = VFMA(LDK(KP941544065), T6T, T6S);
Chris@82 1799 ST(&(xo[WS(os, 25)]), VFMAI(T6W, T6V), ovs, &(xo[WS(os, 1)]));
Chris@82 1800 ST(&(xo[WS(os, 103)]), VFNMSI(T6W, T6V), ovs, &(xo[WS(os, 1)]));
Chris@82 1801 T6l = VFMA(LDK(KP903989293), T68, T5T);
Chris@82 1802 T6m = VFMA(LDK(KP903989293), T6j, T6g);
Chris@82 1803 ST(&(xo[WS(os, 119)]), VFNMSI(T6m, T6l), ovs, &(xo[WS(os, 1)]));
Chris@82 1804 ST(&(xo[WS(os, 9)]), VFMAI(T6m, T6l), ovs, &(xo[WS(os, 1)]));
Chris@82 1805 }
Chris@82 1806 {
Chris@82 1807 V T6p, T6s, T6F, T6M;
Chris@82 1808 T6p = VFNMS(LDK(KP903989293), T6o, T6n);
Chris@82 1809 T6s = VFMA(LDK(KP903989293), T6r, T6q);
Chris@82 1810 ST(&(xo[WS(os, 41)]), VFMAI(T6s, T6p), ovs, &(xo[WS(os, 1)]));
Chris@82 1811 ST(&(xo[WS(os, 87)]), VFNMSI(T6s, T6p), ovs, &(xo[WS(os, 1)]));
Chris@82 1812 T6F = VFNMS(LDK(KP941544065), T6E, T6x);
Chris@82 1813 T6M = VFNMS(LDK(KP941544065), T6L, T6I);
Chris@82 1814 ST(&(xo[WS(os, 71)]), VFNMSI(T6M, T6F), ovs, &(xo[WS(os, 1)]));
Chris@82 1815 ST(&(xo[WS(os, 57)]), VFMAI(T6M, T6F), ovs, &(xo[WS(os, 1)]));
Chris@82 1816 }
Chris@82 1817 {
Chris@82 1818 V T6N, T6O, T6t, T6u;
Chris@82 1819 T6N = VFMA(LDK(KP941544065), T6E, T6x);
Chris@82 1820 T6O = VFMA(LDK(KP941544065), T6L, T6I);
Chris@82 1821 ST(&(xo[WS(os, 7)]), VFNMSI(T6O, T6N), ovs, &(xo[WS(os, 1)]));
Chris@82 1822 ST(&(xo[WS(os, 121)]), VFMAI(T6O, T6N), ovs, &(xo[WS(os, 1)]));
Chris@82 1823 T6t = VFMA(LDK(KP903989293), T6o, T6n);
Chris@82 1824 T6u = VFNMS(LDK(KP903989293), T6r, T6q);
Chris@82 1825 ST(&(xo[WS(os, 23)]), VFNMSI(T6u, T6t), ovs, &(xo[WS(os, 1)]));
Chris@82 1826 ST(&(xo[WS(os, 105)]), VFMAI(T6u, T6t), ovs, &(xo[WS(os, 1)]));
Chris@82 1827 }
Chris@82 1828 }
Chris@82 1829 }
Chris@82 1830 }
Chris@82 1831 VLEAVE();
Chris@82 1832 }
Chris@82 1833
/*
 * Codelet descriptor that is passed, together with the n1bv_128 kernel, to
 * kdft_register in the registration function below.
 * Initializer, in order: 128, the name string "n1bv_128" (wrapped by
 * XSIMD_STRING), the group {440, 0, 642, 0}, the address of GENUS, and four
 * trailing zeros.  The first three numbers of the group match the operation
 * counts quoted in this variant's generated header comment (440 additions,
 * 0 multiplications, 642 fused multiply/adds).
 * NOTE(review): 128 is presumably the transform size (the generator was run
 * with -n 128); the field names, the meaning of the fourth count and of the
 * trailing zeros are not visible here -- confirm against the kdft_desc
 * declaration.
 */
Chris@82 1834 static const kdft_desc desc = { 128, XSIMD_STRING("n1bv_128"), {440, 0, 642, 0}, &GENUS, 0, 0, 0, 0 };
Chris@82 1835
/*
 * Registration entry point for this codelet: hands the planner `p`, the
 * n1bv_128 kernel function and its descriptor `desc` to kdft_register.
 * Returns nothing.
 * NOTE(review): X() and XSIMD() are macros defined outside this file;
 * presumably they decorate the identifiers with library/ISA-specific
 * prefixes or suffixes -- confirm in the included headers.
 */
Chris@82 1836 void XSIMD(codelet_n1bv_128) (planner *p) {
Chris@82 1837 X(kdft_register) (p, n1bv_128, &desc);
Chris@82 1838 }
Chris@82 1839
Chris@82 1840 #else
Chris@82 1841
Chris@82 1842 /* Generated by: ../../../genfft/gen_notw_c.native -simd -compact -variables 4 -pipeline-latency 8 -sign 1 -n 128 -name n1bv_128 -include dft/simd/n1b.h */
Chris@82 1843
Chris@82 1844 /*
Chris@82 1845 * This function contains 1082 FP additions, 330 FP multiplications,
Chris@82 1846 * (or, 938 additions, 186 multiplications, 144 fused multiply/add),
Chris@82 1847 * 194 stack variables, 31 constants, and 256 memory accesses
Chris@82 1848 */
Chris@82 1849 #include "dft/simd/n1b.h"
Chris@82 1850
Chris@82 1851 static void n1bv_128(const R *ri, const R *ii, R *ro, R *io, stride is, stride os, INT v, INT ivs, INT ovs)
Chris@82 1852 {
Chris@82 1853 DVK(KP146730474, +0.146730474455361751658850129646717819706215317);
Chris@82 1854 DVK(KP989176509, +0.989176509964780973451673738016243063983689533);
Chris@82 1855 DVK(KP595699304, +0.595699304492433343467036528829969889511926338);
Chris@82 1856 DVK(KP803207531, +0.803207531480644909806676512963141923879569427);
Chris@82 1857 DVK(KP049067674, +0.049067674327418014254954976942682658314745363);
Chris@82 1858 DVK(KP998795456, +0.998795456205172392714771604759100694443203615);
Chris@82 1859 DVK(KP671558954, +0.671558954847018400625376850427421803228750632);
Chris@82 1860 DVK(KP740951125, +0.740951125354959091175616897495162729728955309);
Chris@82 1861 DVK(KP514102744, +0.514102744193221726593693838968815772608049120);
Chris@82 1862 DVK(KP857728610, +0.857728610000272069902269984284770137042490799);
Chris@82 1863 DVK(KP242980179, +0.242980179903263889948274162077471118320990783);
Chris@82 1864 DVK(KP970031253, +0.970031253194543992603984207286100251456865962);
Chris@82 1865 DVK(KP427555093, +0.427555093430282094320966856888798534304578629);
Chris@82 1866 DVK(KP903989293, +0.903989293123443331586200297230537048710132025);
Chris@82 1867 DVK(KP336889853, +0.336889853392220050689253212619147570477766780);
Chris@82 1868 DVK(KP941544065, +0.941544065183020778412509402599502357185589796);
Chris@82 1869 DVK(KP634393284, +0.634393284163645498215171613225493370675687095);
Chris@82 1870 DVK(KP773010453, +0.773010453362736960810906609758469800971041293);
Chris@82 1871 DVK(KP098017140, +0.098017140329560601994195563888641845861136673);
Chris@82 1872 DVK(KP995184726, +0.995184726672196886244836953109479921575474869);
Chris@82 1873 DVK(KP290284677, +0.290284677254462367636192375817395274691476278);
Chris@82 1874 DVK(KP956940335, +0.956940335732208864935797886980269969482849206);
Chris@82 1875 DVK(KP471396736, +0.471396736825997648556387625905254377657460319);
Chris@82 1876 DVK(KP881921264, +0.881921264348355029712756863660388349508442621);
Chris@82 1877 DVK(KP980785280, +0.980785280403230449126182236134239036973933731);
Chris@82 1878 DVK(KP195090322, +0.195090322016128267848284868477022240927691618);
Chris@82 1879 DVK(KP555570233, +0.555570233019602224742830813948532874374937191);
Chris@82 1880 DVK(KP831469612, +0.831469612302545237078788377617905756738560812);
Chris@82 1881 DVK(KP382683432, +0.382683432365089771728459984030398866761344562);
Chris@82 1882 DVK(KP923879532, +0.923879532511286756128183189396788286822416626);
Chris@82 1883 DVK(KP707106781, +0.707106781186547524400844362104849039284835938);
Chris@82 1884 {
Chris@82 1885 INT i;
Chris@82 1886 const R *xi;
Chris@82 1887 R *xo;
Chris@82 1888 xi = ii;
Chris@82 1889 xo = io;
Chris@82 1890 for (i = v; i > 0; i = i - VL, xi = xi + (VL * ivs), xo = xo + (VL * ovs), MAKE_VOLATILE_STRIDE(256, is), MAKE_VOLATILE_STRIDE(256, os)) {
Chris@82 1891 V T49, T6e, Tev, TgK, TfA, TgL, T4U, T5J, T7R, T9o, Tah, TdG, Tcw, TdB, T84;
Chris@82 1892 V T8T, Tfk, Tfo, T1G, T64, Tgs, Th6, T2p, T62, T7t, T9c, Tce, Tdm, T7i, T9e;
Chris@82 1893 V Tc8, Tdp, TgF, TgG, T4q, T4V, TeC, Tfx, T4H, T4W, T7X, T86, Tcr, TdH, T7U;
Chris@82 1894 V T85, Taw, TdC, Tf3, Tf7, Tr, T5X, Tgl, Th3, T1a, T5V, T7a, T95, TbD, Tdf;
Chris@82 1895 V T6Z, T97, Tbx, Tdi, Tgy, Tgz, TgA, TaN, Tdv, TeK, Tfu, T2W, T5M, T35, T5N;
Chris@82 1896 V T7F, T8X, TaI, Tdu, T7C, T8W, TgB, TgC, TgD, Tb4, Tdy, TeR, Tfv, T3x, T5P;
Chris@82 1897 V T3G, T5Q, T7M, T90, TaZ, Tdx, T7J, T8Z, Tbm, Tdg, TbG, Tdj, Tgo, Th4, Tf0;
Chris@82 1898 V Tf8, T76, T98, T7d, T94, T10, T5Y, T1d, T5U, TbX, Tdn, Tch, Tdq, Tgv, Th7;
Chris@82 1899 V Tfh, Tfp, T7p, T9f, T7w, T9b, T2f, T65, T2s, T61;
Chris@82 1900 {
Chris@82 1901 V T47, Ta8, T4O, Ta7, T44, Tcu, T4P, Tct, Taa, Tab, T3P, Tac, T4R, Tad, Tae;
Chris@82 1902 V T3W, Taf, T4S;
Chris@82 1903 {
Chris@82 1904 V T45, T46, T4M, T4N;
Chris@82 1905 T45 = LD(&(xi[WS(is, 32)]), ivs, &(xi[0]));
Chris@82 1906 T46 = LD(&(xi[WS(is, 96)]), ivs, &(xi[0]));
Chris@82 1907 T47 = VSUB(T45, T46);
Chris@82 1908 Ta8 = VADD(T45, T46);
Chris@82 1909 T4M = LD(&(xi[0]), ivs, &(xi[0]));
Chris@82 1910 T4N = LD(&(xi[WS(is, 64)]), ivs, &(xi[0]));
Chris@82 1911 T4O = VSUB(T4M, T4N);
Chris@82 1912 Ta7 = VADD(T4M, T4N);
Chris@82 1913 }
Chris@82 1914 {
Chris@82 1915 V T3Y, T3Z, T40, T41, T42, T43;
Chris@82 1916 T3Y = LD(&(xi[WS(is, 16)]), ivs, &(xi[0]));
Chris@82 1917 T3Z = LD(&(xi[WS(is, 80)]), ivs, &(xi[0]));
Chris@82 1918 T40 = VSUB(T3Y, T3Z);
Chris@82 1919 T41 = LD(&(xi[WS(is, 112)]), ivs, &(xi[0]));
Chris@82 1920 T42 = LD(&(xi[WS(is, 48)]), ivs, &(xi[0]));
Chris@82 1921 T43 = VSUB(T41, T42);
Chris@82 1922 T44 = VMUL(LDK(KP707106781), VSUB(T40, T43));
Chris@82 1923 Tcu = VADD(T41, T42);
Chris@82 1924 T4P = VMUL(LDK(KP707106781), VADD(T40, T43));
Chris@82 1925 Tct = VADD(T3Y, T3Z);
Chris@82 1926 }
Chris@82 1927 {
Chris@82 1928 V T3L, T3O, T3S, T3V;
Chris@82 1929 {
Chris@82 1930 V T3J, T3K, T3M, T3N;
Chris@82 1931 T3J = LD(&(xi[WS(is, 8)]), ivs, &(xi[0]));
Chris@82 1932 T3K = LD(&(xi[WS(is, 72)]), ivs, &(xi[0]));
Chris@82 1933 T3L = VSUB(T3J, T3K);
Chris@82 1934 Taa = VADD(T3J, T3K);
Chris@82 1935 T3M = LD(&(xi[WS(is, 40)]), ivs, &(xi[0]));
Chris@82 1936 T3N = LD(&(xi[WS(is, 104)]), ivs, &(xi[0]));
Chris@82 1937 T3O = VSUB(T3M, T3N);
Chris@82 1938 Tab = VADD(T3M, T3N);
Chris@82 1939 }
Chris@82 1940 T3P = VFNMS(LDK(KP382683432), T3O, VMUL(LDK(KP923879532), T3L));
Chris@82 1941 Tac = VSUB(Taa, Tab);
Chris@82 1942 T4R = VFMA(LDK(KP382683432), T3L, VMUL(LDK(KP923879532), T3O));
Chris@82 1943 {
Chris@82 1944 V T3Q, T3R, T3T, T3U;
Chris@82 1945 T3Q = LD(&(xi[WS(is, 120)]), ivs, &(xi[0]));
Chris@82 1946 T3R = LD(&(xi[WS(is, 56)]), ivs, &(xi[0]));
Chris@82 1947 T3S = VSUB(T3Q, T3R);
Chris@82 1948 Tad = VADD(T3Q, T3R);
Chris@82 1949 T3T = LD(&(xi[WS(is, 24)]), ivs, &(xi[0]));
Chris@82 1950 T3U = LD(&(xi[WS(is, 88)]), ivs, &(xi[0]));
Chris@82 1951 T3V = VSUB(T3T, T3U);
Chris@82 1952 Tae = VADD(T3T, T3U);
Chris@82 1953 }
Chris@82 1954 T3W = VFMA(LDK(KP923879532), T3S, VMUL(LDK(KP382683432), T3V));
Chris@82 1955 Taf = VSUB(Tad, Tae);
Chris@82 1956 T4S = VFNMS(LDK(KP382683432), T3S, VMUL(LDK(KP923879532), T3V));
Chris@82 1957 }
Chris@82 1958 {
Chris@82 1959 V T3X, T48, Tet, Teu;
Chris@82 1960 T3X = VSUB(T3P, T3W);
Chris@82 1961 T48 = VSUB(T44, T47);
Chris@82 1962 T49 = VSUB(T3X, T48);
Chris@82 1963 T6e = VADD(T48, T3X);
Chris@82 1964 Tet = VADD(Ta7, Ta8);
Chris@82 1965 Teu = VADD(Tct, Tcu);
Chris@82 1966 Tev = VSUB(Tet, Teu);
Chris@82 1967 TgK = VADD(Tet, Teu);
Chris@82 1968 }
Chris@82 1969 {
Chris@82 1970 V Tfy, Tfz, T4Q, T4T;
Chris@82 1971 Tfy = VADD(Taa, Tab);
Chris@82 1972 Tfz = VADD(Tad, Tae);
Chris@82 1973 TfA = VSUB(Tfy, Tfz);
Chris@82 1974 TgL = VADD(Tfy, Tfz);
Chris@82 1975 T4Q = VSUB(T4O, T4P);
Chris@82 1976 T4T = VSUB(T4R, T4S);
Chris@82 1977 T4U = VSUB(T4Q, T4T);
Chris@82 1978 T5J = VADD(T4Q, T4T);
Chris@82 1979 }
Chris@82 1980 {
Chris@82 1981 V T7P, T7Q, Ta9, Tag;
Chris@82 1982 T7P = VADD(T4R, T4S);
Chris@82 1983 T7Q = VADD(T47, T44);
Chris@82 1984 T7R = VSUB(T7P, T7Q);
Chris@82 1985 T9o = VADD(T7Q, T7P);
Chris@82 1986 Ta9 = VSUB(Ta7, Ta8);
Chris@82 1987 Tag = VMUL(LDK(KP707106781), VADD(Tac, Taf));
Chris@82 1988 Tah = VSUB(Ta9, Tag);
Chris@82 1989 TdG = VADD(Ta9, Tag);
Chris@82 1990 }
Chris@82 1991 {
Chris@82 1992 V Tcs, Tcv, T82, T83;
Chris@82 1993 Tcs = VMUL(LDK(KP707106781), VSUB(Tac, Taf));
Chris@82 1994 Tcv = VSUB(Tct, Tcu);
Chris@82 1995 Tcw = VSUB(Tcs, Tcv);
Chris@82 1996 TdB = VADD(Tcv, Tcs);
Chris@82 1997 T82 = VADD(T4O, T4P);
Chris@82 1998 T83 = VADD(T3P, T3W);
Chris@82 1999 T84 = VSUB(T82, T83);
Chris@82 2000 T8T = VADD(T82, T83);
Chris@82 2001 }
Chris@82 2002 }
Chris@82 2003 {
Chris@82 2004 V Tca, Tcb, T1i, Tfm, T2n, Tc5, Tc6, T1p, Tfn, T2k, T1x, Tfi, T2h, Tc0, T1E;
Chris@82 2005 V Tfj, T2i, Tc3, T1l, T1o, Tcc, Tcd;
Chris@82 2006 {
Chris@82 2007 V T1g, T1h, T2l, T2m;
Chris@82 2008 T1g = LD(&(xi[WS(is, 127)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2009 T1h = LD(&(xi[WS(is, 63)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2010 Tca = VADD(T1g, T1h);
Chris@82 2011 T2l = LD(&(xi[WS(is, 31)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2012 T2m = LD(&(xi[WS(is, 95)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2013 Tcb = VADD(T2l, T2m);
Chris@82 2014 T1i = VSUB(T1g, T1h);
Chris@82 2015 Tfm = VADD(Tca, Tcb);
Chris@82 2016 T2n = VSUB(T2l, T2m);
Chris@82 2017 }
Chris@82 2018 {
Chris@82 2019 V T1j, T1k, T1m, T1n;
Chris@82 2020 T1j = LD(&(xi[WS(is, 15)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2021 T1k = LD(&(xi[WS(is, 79)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2022 T1l = VSUB(T1j, T1k);
Chris@82 2023 Tc5 = VADD(T1j, T1k);
Chris@82 2024 T1m = LD(&(xi[WS(is, 111)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2025 T1n = LD(&(xi[WS(is, 47)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2026 T1o = VSUB(T1m, T1n);
Chris@82 2027 Tc6 = VADD(T1m, T1n);
Chris@82 2028 }
Chris@82 2029 T1p = VMUL(LDK(KP707106781), VADD(T1l, T1o));
Chris@82 2030 Tfn = VADD(Tc5, Tc6);
Chris@82 2031 T2k = VMUL(LDK(KP707106781), VSUB(T1l, T1o));
Chris@82 2032 {
Chris@82 2033 V T1t, TbY, T1w, TbZ;
Chris@82 2034 {
Chris@82 2035 V T1r, T1s, T1u, T1v;
Chris@82 2036 T1r = LD(&(xi[WS(is, 7)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2037 T1s = LD(&(xi[WS(is, 71)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2038 T1t = VSUB(T1r, T1s);
Chris@82 2039 TbY = VADD(T1r, T1s);
Chris@82 2040 T1u = LD(&(xi[WS(is, 39)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2041 T1v = LD(&(xi[WS(is, 103)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2042 T1w = VSUB(T1u, T1v);
Chris@82 2043 TbZ = VADD(T1u, T1v);
Chris@82 2044 }
Chris@82 2045 T1x = VFMA(LDK(KP382683432), T1t, VMUL(LDK(KP923879532), T1w));
Chris@82 2046 Tfi = VADD(TbY, TbZ);
Chris@82 2047 T2h = VFNMS(LDK(KP382683432), T1w, VMUL(LDK(KP923879532), T1t));
Chris@82 2048 Tc0 = VSUB(TbY, TbZ);
Chris@82 2049 }
Chris@82 2050 {
Chris@82 2051 V T1A, Tc2, T1D, Tc1;
Chris@82 2052 {
Chris@82 2053 V T1y, T1z, T1B, T1C;
Chris@82 2054 T1y = LD(&(xi[WS(is, 23)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2055 T1z = LD(&(xi[WS(is, 87)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2056 T1A = VSUB(T1y, T1z);
Chris@82 2057 Tc2 = VADD(T1y, T1z);
Chris@82 2058 T1B = LD(&(xi[WS(is, 119)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2059 T1C = LD(&(xi[WS(is, 55)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2060 T1D = VSUB(T1B, T1C);
Chris@82 2061 Tc1 = VADD(T1B, T1C);
Chris@82 2062 }
Chris@82 2063 T1E = VFNMS(LDK(KP382683432), T1D, VMUL(LDK(KP923879532), T1A));
Chris@82 2064 Tfj = VADD(Tc1, Tc2);
Chris@82 2065 T2i = VFMA(LDK(KP923879532), T1D, VMUL(LDK(KP382683432), T1A));
Chris@82 2066 Tc3 = VSUB(Tc1, Tc2);
Chris@82 2067 }
Chris@82 2068 Tfk = VSUB(Tfi, Tfj);
Chris@82 2069 Tfo = VSUB(Tfm, Tfn);
Chris@82 2070 {
Chris@82 2071 V T1q, T1F, Tgq, Tgr;
Chris@82 2072 T1q = VSUB(T1i, T1p);
Chris@82 2073 T1F = VSUB(T1x, T1E);
Chris@82 2074 T1G = VSUB(T1q, T1F);
Chris@82 2075 T64 = VADD(T1q, T1F);
Chris@82 2076 Tgq = VADD(Tfm, Tfn);
Chris@82 2077 Tgr = VADD(Tfi, Tfj);
Chris@82 2078 Tgs = VSUB(Tgq, Tgr);
Chris@82 2079 Th6 = VADD(Tgq, Tgr);
Chris@82 2080 }
Chris@82 2081 {
Chris@82 2082 V T2j, T2o, T7r, T7s;
Chris@82 2083 T2j = VSUB(T2h, T2i);
Chris@82 2084 T2o = VSUB(T2k, T2n);
Chris@82 2085 T2p = VSUB(T2j, T2o);
Chris@82 2086 T62 = VADD(T2o, T2j);
Chris@82 2087 T7r = VADD(T1x, T1E);
Chris@82 2088 T7s = VADD(T2n, T2k);
Chris@82 2089 T7t = VSUB(T7r, T7s);
Chris@82 2090 T9c = VADD(T7s, T7r);
Chris@82 2091 }
Chris@82 2092 Tcc = VSUB(Tca, Tcb);
Chris@82 2093 Tcd = VMUL(LDK(KP707106781), VADD(Tc0, Tc3));
Chris@82 2094 Tce = VSUB(Tcc, Tcd);
Chris@82 2095 Tdm = VADD(Tcc, Tcd);
Chris@82 2096 {
Chris@82 2097 V T7g, T7h, Tc4, Tc7;
Chris@82 2098 T7g = VADD(T1i, T1p);
Chris@82 2099 T7h = VADD(T2h, T2i);
Chris@82 2100 T7i = VSUB(T7g, T7h);
Chris@82 2101 T9e = VADD(T7g, T7h);
Chris@82 2102 Tc4 = VMUL(LDK(KP707106781), VSUB(Tc0, Tc3));
Chris@82 2103 Tc7 = VSUB(Tc5, Tc6);
Chris@82 2104 Tc8 = VSUB(Tc4, Tc7);
Chris@82 2105 Tdp = VADD(Tc7, Tc4);
Chris@82 2106 }
Chris@82 2107 }
Chris@82 2108 {
Chris@82 2109 V T4c, Tew, T4o, Tak, T4A, Tez, T4E, Tau, T4j, Tex, T4l, Tan, T4x, TeA, T4F;
Chris@82 2110 V Tar, Tcp, Tcq;
Chris@82 2111 {
Chris@82 2112 V T4a, T4b, Tai, T4m, T4n, Taj;
Chris@82 2113 T4a = LD(&(xi[WS(is, 4)]), ivs, &(xi[0]));
Chris@82 2114 T4b = LD(&(xi[WS(is, 68)]), ivs, &(xi[0]));
Chris@82 2115 Tai = VADD(T4a, T4b);
Chris@82 2116 T4m = LD(&(xi[WS(is, 36)]), ivs, &(xi[0]));
Chris@82 2117 T4n = LD(&(xi[WS(is, 100)]), ivs, &(xi[0]));
Chris@82 2118 Taj = VADD(T4m, T4n);
Chris@82 2119 T4c = VSUB(T4a, T4b);
Chris@82 2120 Tew = VADD(Tai, Taj);
Chris@82 2121 T4o = VSUB(T4m, T4n);
Chris@82 2122 Tak = VSUB(Tai, Taj);
Chris@82 2123 }
Chris@82 2124 {
Chris@82 2125 V T4y, T4z, Tat, T4C, T4D, Tas;
Chris@82 2126 T4y = LD(&(xi[WS(is, 28)]), ivs, &(xi[0]));
Chris@82 2127 T4z = LD(&(xi[WS(is, 92)]), ivs, &(xi[0]));
Chris@82 2128 Tat = VADD(T4y, T4z);
Chris@82 2129 T4C = LD(&(xi[WS(is, 124)]), ivs, &(xi[0]));
Chris@82 2130 T4D = LD(&(xi[WS(is, 60)]), ivs, &(xi[0]));
Chris@82 2131 Tas = VADD(T4C, T4D);
Chris@82 2132 T4A = VSUB(T4y, T4z);
Chris@82 2133 Tez = VADD(Tas, Tat);
Chris@82 2134 T4E = VSUB(T4C, T4D);
Chris@82 2135 Tau = VSUB(Tas, Tat);
Chris@82 2136 }
Chris@82 2137 {
Chris@82 2138 V T4f, Tal, T4i, Tam;
Chris@82 2139 {
Chris@82 2140 V T4d, T4e, T4g, T4h;
Chris@82 2141 T4d = LD(&(xi[WS(is, 20)]), ivs, &(xi[0]));
Chris@82 2142 T4e = LD(&(xi[WS(is, 84)]), ivs, &(xi[0]));
Chris@82 2143 T4f = VSUB(T4d, T4e);
Chris@82 2144 Tal = VADD(T4d, T4e);
Chris@82 2145 T4g = LD(&(xi[WS(is, 116)]), ivs, &(xi[0]));
Chris@82 2146 T4h = LD(&(xi[WS(is, 52)]), ivs, &(xi[0]));
Chris@82 2147 T4i = VSUB(T4g, T4h);
Chris@82 2148 Tam = VADD(T4g, T4h);
Chris@82 2149 }
Chris@82 2150 T4j = VMUL(LDK(KP707106781), VADD(T4f, T4i));
Chris@82 2151 Tex = VADD(Tal, Tam);
Chris@82 2152 T4l = VMUL(LDK(KP707106781), VSUB(T4f, T4i));
Chris@82 2153 Tan = VSUB(Tal, Tam);
Chris@82 2154 }
Chris@82 2155 {
Chris@82 2156 V T4t, Tap, T4w, Taq;
Chris@82 2157 {
Chris@82 2158 V T4r, T4s, T4u, T4v;
Chris@82 2159 T4r = LD(&(xi[WS(is, 12)]), ivs, &(xi[0]));
Chris@82 2160 T4s = LD(&(xi[WS(is, 76)]), ivs, &(xi[0]));
Chris@82 2161 T4t = VSUB(T4r, T4s);
Chris@82 2162 Tap = VADD(T4r, T4s);
Chris@82 2163 T4u = LD(&(xi[WS(is, 108)]), ivs, &(xi[0]));
Chris@82 2164 T4v = LD(&(xi[WS(is, 44)]), ivs, &(xi[0]));
Chris@82 2165 T4w = VSUB(T4u, T4v);
Chris@82 2166 Taq = VADD(T4u, T4v);
Chris@82 2167 }
Chris@82 2168 T4x = VMUL(LDK(KP707106781), VSUB(T4t, T4w));
Chris@82 2169 TeA = VADD(Tap, Taq);
Chris@82 2170 T4F = VMUL(LDK(KP707106781), VADD(T4t, T4w));
Chris@82 2171 Tar = VSUB(Tap, Taq);
Chris@82 2172 }
Chris@82 2173 TgF = VADD(Tew, Tex);
Chris@82 2174 TgG = VADD(Tez, TeA);
Chris@82 2175 {
Chris@82 2176 V T4k, T4p, Tey, TeB;
Chris@82 2177 T4k = VSUB(T4c, T4j);
Chris@82 2178 T4p = VSUB(T4l, T4o);
Chris@82 2179 T4q = VFNMS(LDK(KP555570233), T4p, VMUL(LDK(KP831469612), T4k));
Chris@82 2180 T4V = VFMA(LDK(KP831469612), T4p, VMUL(LDK(KP555570233), T4k));
Chris@82 2181 Tey = VSUB(Tew, Tex);
Chris@82 2182 TeB = VSUB(Tez, TeA);
Chris@82 2183 TeC = VMUL(LDK(KP707106781), VADD(Tey, TeB));
Chris@82 2184 Tfx = VMUL(LDK(KP707106781), VSUB(Tey, TeB));
Chris@82 2185 }
Chris@82 2186 {
Chris@82 2187 V T4B, T4G, T7V, T7W;
Chris@82 2188 T4B = VSUB(T4x, T4A);
Chris@82 2189 T4G = VSUB(T4E, T4F);
Chris@82 2190 T4H = VFMA(LDK(KP555570233), T4B, VMUL(LDK(KP831469612), T4G));
Chris@82 2191 T4W = VFNMS(LDK(KP555570233), T4G, VMUL(LDK(KP831469612), T4B));
Chris@82 2192 T7V = VADD(T4A, T4x);
Chris@82 2193 T7W = VADD(T4E, T4F);
Chris@82 2194 T7X = VFMA(LDK(KP195090322), T7V, VMUL(LDK(KP980785280), T7W));
Chris@82 2195 T86 = VFNMS(LDK(KP195090322), T7W, VMUL(LDK(KP980785280), T7V));
Chris@82 2196 }
Chris@82 2197 Tcp = VFNMS(LDK(KP382683432), Tan, VMUL(LDK(KP923879532), Tak));
Chris@82 2198 Tcq = VFMA(LDK(KP923879532), Tau, VMUL(LDK(KP382683432), Tar));
Chris@82 2199 Tcr = VSUB(Tcp, Tcq);
Chris@82 2200 TdH = VADD(Tcp, Tcq);
Chris@82 2201 {
Chris@82 2202 V T7S, T7T, Tao, Tav;
Chris@82 2203 T7S = VADD(T4c, T4j);
Chris@82 2204 T7T = VADD(T4o, T4l);
Chris@82 2205 T7U = VFNMS(LDK(KP195090322), T7T, VMUL(LDK(KP980785280), T7S));
Chris@82 2206 T85 = VFMA(LDK(KP980785280), T7T, VMUL(LDK(KP195090322), T7S));
Chris@82 2207 Tao = VFMA(LDK(KP382683432), Tak, VMUL(LDK(KP923879532), Tan));
Chris@82 2208 Tav = VFNMS(LDK(KP382683432), Tau, VMUL(LDK(KP923879532), Tar));
Chris@82 2209 Taw = VSUB(Tao, Tav);
Chris@82 2210 TdC = VADD(Tao, Tav);
Chris@82 2211 }
Chris@82 2212 }
Chris@82 2213 {
/* Input stage for the sixteen samples xi[WS(is, k)] with k = 1, 9, 17, ..., 121
 * (k = 1 mod 8). Samples 64 apart are paired (1/65, 33/97, 17/81, ...) into a
 * sum (VADD) and a difference (VSUB); these are then combined with the
 * constants KP707106781, KP382683432 and KP923879532. The values kept for
 * later are written to temporaries that are not declared in this block
 * (Tf3, Tf7, Tr, T5X, Tgl, Th3, T1a, T5V, T7a, T95, TbD, Tdf, T6Z, T97, Tbx,
 * Tdi).
 * NOTE(review): LD, LDK, VFMA and VFNMS are defined outside this chunk. Reading
 * the VFMA/VFNMS pairs below as plane rotations assumes VFMA(a, b, c) = a*b + c
 * and VFNMS(a, b, c) = c - a*b -- confirm against the SIMD support header. */
Chris@82 2214 V Tbz, TbA, T3, Tf5, T18, Tbu, Tbv, Ta, Tf6, T15, Ti, Tf1, T12, Tbp, Tp;
Chris@82 2215 V Tf2, T13, Tbs, T6, T9, TbB, TbC;
Chris@82 2216 {
Chris@82 2217 V T1, T2, T16, T17;
Chris@82 2218 T1 = LD(&(xi[WS(is, 1)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2219 T2 = LD(&(xi[WS(is, 65)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2220 Tbz = VADD(T1, T2); /* xi[1] + xi[65] */
Chris@82 2221 T16 = LD(&(xi[WS(is, 33)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2222 T17 = LD(&(xi[WS(is, 97)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2223 TbA = VADD(T16, T17); /* xi[33] + xi[97] */
Chris@82 2224 T3 = VSUB(T1, T2);
Chris@82 2225 Tf5 = VADD(Tbz, TbA); /* sum of inputs 1, 33, 65, 97 */
Chris@82 2226 T18 = VSUB(T16, T17);
Chris@82 2227 }
Chris@82 2228 {
Chris@82 2229 V T4, T5, T7, T8;
Chris@82 2230 T4 = LD(&(xi[WS(is, 17)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2231 T5 = LD(&(xi[WS(is, 81)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2232 T6 = VSUB(T4, T5);
Chris@82 2233 Tbu = VADD(T4, T5);
Chris@82 2234 T7 = LD(&(xi[WS(is, 113)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2235 T8 = LD(&(xi[WS(is, 49)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2236 T9 = VSUB(T7, T8);
Chris@82 2237 Tbv = VADD(T7, T8);
Chris@82 2238 }
Chris@82 2239 Ta = VMUL(LDK(KP707106781), VADD(T6, T9));
Chris@82 2240 Tf6 = VADD(Tbu, Tbv); /* sum of inputs 17, 49, 81, 113 */
Chris@82 2241 T15 = VMUL(LDK(KP707106781), VSUB(T6, T9));
Chris@82 2242 {
Chris@82 2243 V Te, Tbn, Th, Tbo;
Chris@82 2244 {
Chris@82 2245 V Tc, Td, Tf, Tg;
Chris@82 2246 Tc = LD(&(xi[WS(is, 9)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2247 Td = LD(&(xi[WS(is, 73)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2248 Te = VSUB(Tc, Td);
Chris@82 2249 Tbn = VADD(Tc, Td);
Chris@82 2250 Tf = LD(&(xi[WS(is, 41)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2251 Tg = LD(&(xi[WS(is, 105)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2252 Th = VSUB(Tf, Tg);
Chris@82 2253 Tbo = VADD(Tf, Tg);
Chris@82 2254 }
Chris@82 2255 Ti = VFMA(LDK(KP382683432), Te, VMUL(LDK(KP923879532), Th));
Chris@82 2256 Tf1 = VADD(Tbn, Tbo); /* sum of inputs 9, 41, 73, 105 */
Chris@82 2257 T12 = VFNMS(LDK(KP382683432), Th, VMUL(LDK(KP923879532), Te));
Chris@82 2258 Tbp = VSUB(Tbn, Tbo);
Chris@82 2259 }
Chris@82 2260 {
Chris@82 2261 V Tl, Tbr, To, Tbq;
Chris@82 2262 {
Chris@82 2263 V Tj, Tk, Tm, Tn;
Chris@82 2264 Tj = LD(&(xi[WS(is, 25)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2265 Tk = LD(&(xi[WS(is, 89)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2266 Tl = VSUB(Tj, Tk);
Chris@82 2267 Tbr = VADD(Tj, Tk);
Chris@82 2268 Tm = LD(&(xi[WS(is, 121)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2269 Tn = LD(&(xi[WS(is, 57)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2270 To = VSUB(Tm, Tn);
Chris@82 2271 Tbq = VADD(Tm, Tn);
Chris@82 2272 }
Chris@82 2273 Tp = VFNMS(LDK(KP382683432), To, VMUL(LDK(KP923879532), Tl));
Chris@82 2274 Tf2 = VADD(Tbq, Tbr); /* sum of inputs 25, 57, 89, 121 */
Chris@82 2275 T13 = VFMA(LDK(KP923879532), To, VMUL(LDK(KP382683432), Tl));
Chris@82 2276 Tbs = VSUB(Tbq, Tbr);
Chris@82 2277 }
Chris@82 2278 Tf3 = VSUB(Tf1, Tf2);
Chris@82 2279 Tf7 = VSUB(Tf5, Tf6);
Chris@82 2280 {
Chris@82 2281 V Tb, Tq, Tgj, Tgk;
Chris@82 2282 Tb = VSUB(T3, Ta);
Chris@82 2283 Tq = VSUB(Ti, Tp);
Chris@82 2284 Tr = VSUB(Tb, Tq);
Chris@82 2285 T5X = VADD(Tb, Tq);
Chris@82 2286 Tgj = VADD(Tf5, Tf6);
Chris@82 2287 Tgk = VADD(Tf1, Tf2);
Chris@82 2288 Tgl = VSUB(Tgj, Tgk);
Chris@82 2289 Th3 = VADD(Tgj, Tgk); /* sum of all sixteen inputs loaded in this block */
Chris@82 2290 }
Chris@82 2291 {
Chris@82 2292 V T14, T19, T78, T79;
Chris@82 2293 T14 = VSUB(T12, T13);
Chris@82 2294 T19 = VSUB(T15, T18);
Chris@82 2295 T1a = VSUB(T14, T19);
Chris@82 2296 T5V = VADD(T19, T14);
Chris@82 2297 T78 = VADD(Ti, Tp);
Chris@82 2298 T79 = VADD(T18, T15);
Chris@82 2299 T7a = VSUB(T78, T79);
Chris@82 2300 T95 = VADD(T79, T78);
Chris@82 2301 }
Chris@82 2302 TbB = VSUB(Tbz, TbA);
Chris@82 2303 TbC = VMUL(LDK(KP707106781), VADD(Tbp, Tbs));
Chris@82 2304 TbD = VSUB(TbB, TbC);
Chris@82 2305 Tdf = VADD(TbB, TbC);
Chris@82 2306 {
Chris@82 2307 V T6X, T6Y, Tbt, Tbw;
Chris@82 2308 T6X = VADD(T3, Ta);
Chris@82 2309 T6Y = VADD(T12, T13);
Chris@82 2310 T6Z = VSUB(T6X, T6Y);
Chris@82 2311 T97 = VADD(T6X, T6Y);
Chris@82 2312 Tbt = VMUL(LDK(KP707106781), VSUB(Tbp, Tbs));
Chris@82 2313 Tbw = VSUB(Tbu, Tbv);
Chris@82 2314 Tbx = VSUB(Tbt, Tbw);
Chris@82 2315 Tdi = VADD(Tbw, Tbt);
Chris@82 2316 }
Chris@82 2317 }
Chris@82 2318 {
/* Input stage for the sixteen samples xi[WS(is, k)] with k = 2, 10, 18, ..., 122
 * (k = 2 mod 8). Samples 64 apart are paired (34/98, 2/66, 18/82, ...) into a
 * sum and a difference, which are then combined with the constants
 * KP707106781, KP382683432 and KP923879532. Results kept for later are written
 * to temporaries not declared in this block (Tgy, Tgz, TgA, TaN, Tdv, TeK, Tfu,
 * T2W, T5M, T35, T5N, T7F, T8X, TaI, Tdu, T7C, T8W).
 * NOTE(review): LD, LDK, VFMA and VFNMS are defined outside this chunk; their
 * exact semantics (presumably fused a*b + c and c - a*b) should be confirmed
 * against the SIMD support header. */
Chris@82 2319 V TaK, TaJ, T2U, TeE, T2Z, TaF, TaG, T2R, TeF, T30, T2C, TeH, T32, TaA, T2J;
Chris@82 2320 V TeI, T33, TaD, T2N, T2Q, TaL, TaM;
Chris@82 2321 {
Chris@82 2322 V T2S, T2T, T2X, T2Y;
Chris@82 2323 T2S = LD(&(xi[WS(is, 34)]), ivs, &(xi[0]));
Chris@82 2324 T2T = LD(&(xi[WS(is, 98)]), ivs, &(xi[0]));
Chris@82 2325 TaK = VADD(T2S, T2T); /* xi[34] + xi[98] */
Chris@82 2326 T2X = LD(&(xi[WS(is, 2)]), ivs, &(xi[0]));
Chris@82 2327 T2Y = LD(&(xi[WS(is, 66)]), ivs, &(xi[0]));
Chris@82 2328 TaJ = VADD(T2X, T2Y); /* xi[2] + xi[66] */
Chris@82 2329 T2U = VSUB(T2S, T2T);
Chris@82 2330 TeE = VADD(TaJ, TaK); /* sum of inputs 2, 34, 66, 98 */
Chris@82 2331 T2Z = VSUB(T2X, T2Y);
Chris@82 2332 }
Chris@82 2333 {
Chris@82 2334 V T2L, T2M, T2O, T2P;
Chris@82 2335 T2L = LD(&(xi[WS(is, 18)]), ivs, &(xi[0]));
Chris@82 2336 T2M = LD(&(xi[WS(is, 82)]), ivs, &(xi[0]));
Chris@82 2337 T2N = VSUB(T2L, T2M);
Chris@82 2338 TaF = VADD(T2L, T2M);
Chris@82 2339 T2O = LD(&(xi[WS(is, 114)]), ivs, &(xi[0]));
Chris@82 2340 T2P = LD(&(xi[WS(is, 50)]), ivs, &(xi[0]));
Chris@82 2341 T2Q = VSUB(T2O, T2P);
Chris@82 2342 TaG = VADD(T2O, T2P);
Chris@82 2343 }
Chris@82 2344 T2R = VMUL(LDK(KP707106781), VSUB(T2N, T2Q));
Chris@82 2345 TeF = VADD(TaF, TaG); /* sum of inputs 18, 50, 82, 114 */
Chris@82 2346 T30 = VMUL(LDK(KP707106781), VADD(T2N, T2Q));
Chris@82 2347 {
Chris@82 2348 V T2y, Tay, T2B, Taz;
Chris@82 2349 {
Chris@82 2350 V T2w, T2x, T2z, T2A;
Chris@82 2351 T2w = LD(&(xi[WS(is, 10)]), ivs, &(xi[0]));
Chris@82 2352 T2x = LD(&(xi[WS(is, 74)]), ivs, &(xi[0]));
Chris@82 2353 T2y = VSUB(T2w, T2x);
Chris@82 2354 Tay = VADD(T2w, T2x);
Chris@82 2355 T2z = LD(&(xi[WS(is, 42)]), ivs, &(xi[0]));
Chris@82 2356 T2A = LD(&(xi[WS(is, 106)]), ivs, &(xi[0]));
Chris@82 2357 T2B = VSUB(T2z, T2A);
Chris@82 2358 Taz = VADD(T2z, T2A);
Chris@82 2359 }
Chris@82 2360 T2C = VFNMS(LDK(KP382683432), T2B, VMUL(LDK(KP923879532), T2y));
Chris@82 2361 TeH = VADD(Tay, Taz); /* sum of inputs 10, 42, 74, 106 */
Chris@82 2362 T32 = VFMA(LDK(KP382683432), T2y, VMUL(LDK(KP923879532), T2B));
Chris@82 2363 TaA = VSUB(Tay, Taz);
Chris@82 2364 }
Chris@82 2365 {
Chris@82 2366 V T2F, TaB, T2I, TaC;
Chris@82 2367 {
Chris@82 2368 V T2D, T2E, T2G, T2H;
Chris@82 2369 T2D = LD(&(xi[WS(is, 122)]), ivs, &(xi[0]));
Chris@82 2370 T2E = LD(&(xi[WS(is, 58)]), ivs, &(xi[0]));
Chris@82 2371 T2F = VSUB(T2D, T2E);
Chris@82 2372 TaB = VADD(T2D, T2E);
Chris@82 2373 T2G = LD(&(xi[WS(is, 26)]), ivs, &(xi[0]));
Chris@82 2374 T2H = LD(&(xi[WS(is, 90)]), ivs, &(xi[0]));
Chris@82 2375 T2I = VSUB(T2G, T2H);
Chris@82 2376 TaC = VADD(T2G, T2H);
Chris@82 2377 }
Chris@82 2378 T2J = VFMA(LDK(KP923879532), T2F, VMUL(LDK(KP382683432), T2I));
Chris@82 2379 TeI = VADD(TaB, TaC); /* sum of inputs 26, 58, 90, 122 */
Chris@82 2380 T33 = VFNMS(LDK(KP382683432), T2F, VMUL(LDK(KP923879532), T2I));
Chris@82 2381 TaD = VSUB(TaB, TaC);
Chris@82 2382 }
Chris@82 2383 Tgy = VADD(TeE, TeF);
Chris@82 2384 Tgz = VADD(TeH, TeI);
Chris@82 2385 TgA = VSUB(Tgy, Tgz);
Chris@82 2386 TaL = VSUB(TaJ, TaK);
Chris@82 2387 TaM = VMUL(LDK(KP707106781), VADD(TaA, TaD));
Chris@82 2388 TaN = VSUB(TaL, TaM);
Chris@82 2389 Tdv = VADD(TaL, TaM);
Chris@82 2390 {
Chris@82 2391 V TeG, TeJ, T2K, T2V;
Chris@82 2392 TeG = VSUB(TeE, TeF);
Chris@82 2393 TeJ = VSUB(TeH, TeI);
Chris@82 2394 TeK = VFMA(LDK(KP382683432), TeG, VMUL(LDK(KP923879532), TeJ));
Chris@82 2395 Tfu = VFNMS(LDK(KP382683432), TeJ, VMUL(LDK(KP923879532), TeG));
Chris@82 2396 T2K = VSUB(T2C, T2J);
Chris@82 2397 T2V = VSUB(T2R, T2U);
Chris@82 2398 T2W = VSUB(T2K, T2V);
Chris@82 2399 T5M = VADD(T2V, T2K);
Chris@82 2400 }
Chris@82 2401 {
Chris@82 2402 V T31, T34, T7D, T7E;
Chris@82 2403 T31 = VSUB(T2Z, T30);
Chris@82 2404 T34 = VSUB(T32, T33);
Chris@82 2405 T35 = VSUB(T31, T34);
Chris@82 2406 T5N = VADD(T31, T34);
Chris@82 2407 T7D = VADD(T32, T33);
Chris@82 2408 T7E = VADD(T2U, T2R);
Chris@82 2409 T7F = VSUB(T7D, T7E);
Chris@82 2410 T8X = VADD(T7E, T7D);
Chris@82 2411 }
Chris@82 2412 {
Chris@82 2413 V TaE, TaH, T7A, T7B;
Chris@82 2414 TaE = VMUL(LDK(KP707106781), VSUB(TaA, TaD));
Chris@82 2415 TaH = VSUB(TaF, TaG);
Chris@82 2416 TaI = VSUB(TaE, TaH);
Chris@82 2417 Tdu = VADD(TaH, TaE);
Chris@82 2418 T7A = VADD(T2Z, T30);
Chris@82 2419 T7B = VADD(T2C, T2J);
Chris@82 2420 T7C = VSUB(T7A, T7B);
Chris@82 2421 T8W = VADD(T7A, T7B);
Chris@82 2422 }
Chris@82 2423 }
Chris@82 2424 {
/* Input stage for the sixteen samples xi[WS(is, k)] with k = 6, 14, 22, ..., 126
 * (k = 6 mod 8). Samples 64 apart are paired (30/94, 126/62, 14/78, ...) into a
 * sum and a difference, which are then combined with the constants
 * KP707106781, KP382683432 and KP923879532. Results kept for later are written
 * to temporaries not declared in this block (TgB, TgC, TgD, Tb4, Tdy, TeR, Tfv,
 * T3x, T5P, T3G, T5Q, T7M, T90, TaZ, Tdx, T7J, T8Z).
 * NOTE(review): LD, LDK, VFMA and VFNMS are defined outside this chunk; their
 * exact semantics (presumably fused a*b + c and c - a*b) should be confirmed
 * against the SIMD support header. */
Chris@82 2425 V Tb1, Tb0, T3v, TeO, T3A, TaW, TaX, T3s, TeP, T3B, T3d, TeL, T3D, TaR, T3k;
Chris@82 2426 V TeM, T3E, TaU, T3o, T3r, Tb2, Tb3;
Chris@82 2427 {
Chris@82 2428 V T3t, T3u, T3y, T3z;
Chris@82 2429 T3t = LD(&(xi[WS(is, 30)]), ivs, &(xi[0]));
Chris@82 2430 T3u = LD(&(xi[WS(is, 94)]), ivs, &(xi[0]));
Chris@82 2431 Tb1 = VADD(T3t, T3u); /* xi[30] + xi[94] */
Chris@82 2432 T3y = LD(&(xi[WS(is, 126)]), ivs, &(xi[0]));
Chris@82 2433 T3z = LD(&(xi[WS(is, 62)]), ivs, &(xi[0]));
Chris@82 2434 Tb0 = VADD(T3y, T3z); /* xi[126] + xi[62] */
Chris@82 2435 T3v = VSUB(T3t, T3u);
Chris@82 2436 TeO = VADD(Tb0, Tb1); /* sum of inputs 30, 62, 94, 126 */
Chris@82 2437 T3A = VSUB(T3y, T3z);
Chris@82 2438 }
Chris@82 2439 {
Chris@82 2440 V T3m, T3n, T3p, T3q;
Chris@82 2441 T3m = LD(&(xi[WS(is, 14)]), ivs, &(xi[0]));
Chris@82 2442 T3n = LD(&(xi[WS(is, 78)]), ivs, &(xi[0]));
Chris@82 2443 T3o = VSUB(T3m, T3n);
Chris@82 2444 TaW = VADD(T3m, T3n);
Chris@82 2445 T3p = LD(&(xi[WS(is, 110)]), ivs, &(xi[0]));
Chris@82 2446 T3q = LD(&(xi[WS(is, 46)]), ivs, &(xi[0]));
Chris@82 2447 T3r = VSUB(T3p, T3q);
Chris@82 2448 TaX = VADD(T3p, T3q);
Chris@82 2449 }
Chris@82 2450 T3s = VMUL(LDK(KP707106781), VSUB(T3o, T3r));
Chris@82 2451 TeP = VADD(TaW, TaX); /* sum of inputs 14, 46, 78, 110 */
Chris@82 2452 T3B = VMUL(LDK(KP707106781), VADD(T3o, T3r));
Chris@82 2453 {
Chris@82 2454 V T39, TaP, T3c, TaQ;
Chris@82 2455 {
Chris@82 2456 V T37, T38, T3a, T3b;
Chris@82 2457 T37 = LD(&(xi[WS(is, 6)]), ivs, &(xi[0]));
Chris@82 2458 T38 = LD(&(xi[WS(is, 70)]), ivs, &(xi[0]));
Chris@82 2459 T39 = VSUB(T37, T38);
Chris@82 2460 TaP = VADD(T37, T38);
Chris@82 2461 T3a = LD(&(xi[WS(is, 38)]), ivs, &(xi[0]));
Chris@82 2462 T3b = LD(&(xi[WS(is, 102)]), ivs, &(xi[0]));
Chris@82 2463 T3c = VSUB(T3a, T3b);
Chris@82 2464 TaQ = VADD(T3a, T3b);
Chris@82 2465 }
Chris@82 2466 T3d = VFNMS(LDK(KP382683432), T3c, VMUL(LDK(KP923879532), T39));
Chris@82 2467 TeL = VADD(TaP, TaQ); /* sum of inputs 6, 38, 70, 102 */
Chris@82 2468 T3D = VFMA(LDK(KP382683432), T39, VMUL(LDK(KP923879532), T3c));
Chris@82 2469 TaR = VSUB(TaP, TaQ);
Chris@82 2470 }
Chris@82 2471 {
Chris@82 2472 V T3g, TaS, T3j, TaT;
Chris@82 2473 {
Chris@82 2474 V T3e, T3f, T3h, T3i;
Chris@82 2475 T3e = LD(&(xi[WS(is, 118)]), ivs, &(xi[0]));
Chris@82 2476 T3f = LD(&(xi[WS(is, 54)]), ivs, &(xi[0]));
Chris@82 2477 T3g = VSUB(T3e, T3f);
Chris@82 2478 TaS = VADD(T3e, T3f);
Chris@82 2479 T3h = LD(&(xi[WS(is, 22)]), ivs, &(xi[0]));
Chris@82 2480 T3i = LD(&(xi[WS(is, 86)]), ivs, &(xi[0]));
Chris@82 2481 T3j = VSUB(T3h, T3i);
Chris@82 2482 TaT = VADD(T3h, T3i);
Chris@82 2483 }
Chris@82 2484 T3k = VFMA(LDK(KP923879532), T3g, VMUL(LDK(KP382683432), T3j));
Chris@82 2485 TeM = VADD(TaS, TaT); /* sum of inputs 22, 54, 86, 118 */
Chris@82 2486 T3E = VFNMS(LDK(KP382683432), T3g, VMUL(LDK(KP923879532), T3j));
Chris@82 2487 TaU = VSUB(TaS, TaT);
Chris@82 2488 }
Chris@82 2489 TgB = VADD(TeO, TeP);
Chris@82 2490 TgC = VADD(TeL, TeM);
Chris@82 2491 TgD = VSUB(TgB, TgC);
Chris@82 2492 Tb2 = VSUB(Tb0, Tb1);
Chris@82 2493 Tb3 = VMUL(LDK(KP707106781), VADD(TaR, TaU));
Chris@82 2494 Tb4 = VSUB(Tb2, Tb3);
Chris@82 2495 Tdy = VADD(Tb2, Tb3);
Chris@82 2496 {
Chris@82 2497 V TeN, TeQ, T3l, T3w;
Chris@82 2498 TeN = VSUB(TeL, TeM);
Chris@82 2499 TeQ = VSUB(TeO, TeP);
Chris@82 2500 TeR = VFNMS(LDK(KP382683432), TeQ, VMUL(LDK(KP923879532), TeN));
Chris@82 2501 Tfv = VFMA(LDK(KP923879532), TeQ, VMUL(LDK(KP382683432), TeN));
Chris@82 2502 T3l = VSUB(T3d, T3k);
Chris@82 2503 T3w = VSUB(T3s, T3v);
Chris@82 2504 T3x = VSUB(T3l, T3w);
Chris@82 2505 T5P = VADD(T3w, T3l);
Chris@82 2506 }
Chris@82 2507 {
Chris@82 2508 V T3C, T3F, T7K, T7L;
Chris@82 2509 T3C = VSUB(T3A, T3B);
Chris@82 2510 T3F = VSUB(T3D, T3E);
Chris@82 2511 T3G = VSUB(T3C, T3F);
Chris@82 2512 T5Q = VADD(T3C, T3F);
Chris@82 2513 T7K = VADD(T3A, T3B);
Chris@82 2514 T7L = VADD(T3d, T3k);
Chris@82 2515 T7M = VSUB(T7K, T7L);
Chris@82 2516 T90 = VADD(T7K, T7L);
Chris@82 2517 }
Chris@82 2518 {
Chris@82 2519 V TaV, TaY, T7H, T7I;
Chris@82 2520 TaV = VMUL(LDK(KP707106781), VSUB(TaR, TaU));
Chris@82 2521 TaY = VSUB(TaW, TaX);
Chris@82 2522 TaZ = VSUB(TaV, TaY);
Chris@82 2523 Tdx = VADD(TaY, TaV);
Chris@82 2524 T7H = VADD(T3D, T3E);
Chris@82 2525 T7I = VADD(T3v, T3s);
Chris@82 2526 T7J = VSUB(T7H, T7I);
Chris@82 2527 T8Z = VADD(T7I, T7H);
Chris@82 2528 }
Chris@82 2529 }
Chris@82 2530 {
/* Input stage for the sixteen samples xi[WS(is, k)] with k = 5, 13, 21, ..., 125
 * (k = 5 mod 8). Samples 64 apart are paired (37/101, 5/69, 29/93, ...) into a
 * sum and a difference; later steps combine them with the constants
 * KP707106781, KP382683432, KP923879532, KP980785280, KP195090322,
 * KP831469612 and KP555570233. Results kept for later are written to
 * temporaries not declared in this block (Tbm, Tdg, TbG, Tdj, Tgo, Th4, Tf0,
 * Tf8, T76, T98, T7d, T94, T10, T5Y, T1d, T5U).
 * NOTE(review): LD, LDK, VFMA and VFNMS are defined outside this chunk; their
 * exact semantics (presumably fused a*b + c and c - a*b) should be confirmed
 * against the SIMD support header. */
Chris@82 2531 V TB, TeU, TF, Tba, TS, TeX, TW, Tbh, Ty, TeV, TG, Tbd, TP, TeY, TX;
Chris@82 2532 V Tbk;
Chris@82 2533 {
Chris@82 2534 V Tz, TA, Tb9, TD, TE, Tb8;
Chris@82 2535 Tz = LD(&(xi[WS(is, 37)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2536 TA = LD(&(xi[WS(is, 101)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2537 Tb9 = VADD(Tz, TA); /* xi[37] + xi[101] */
Chris@82 2538 TD = LD(&(xi[WS(is, 5)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2539 TE = LD(&(xi[WS(is, 69)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2540 Tb8 = VADD(TD, TE); /* xi[5] + xi[69] */
Chris@82 2541 TB = VSUB(Tz, TA);
Chris@82 2542 TeU = VADD(Tb8, Tb9); /* sum of inputs 5, 37, 69, 101 */
Chris@82 2543 TF = VSUB(TD, TE);
Chris@82 2544 Tba = VSUB(Tb8, Tb9);
Chris@82 2545 }
Chris@82 2546 {
Chris@82 2547 V TQ, TR, Tbg, TU, TV, Tbf;
Chris@82 2548 TQ = LD(&(xi[WS(is, 29)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2549 TR = LD(&(xi[WS(is, 93)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2550 Tbg = VADD(TQ, TR);
Chris@82 2551 TU = LD(&(xi[WS(is, 125)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2552 TV = LD(&(xi[WS(is, 61)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2553 Tbf = VADD(TU, TV);
Chris@82 2554 TS = VSUB(TQ, TR);
Chris@82 2555 TeX = VADD(Tbf, Tbg); /* sum of inputs 29, 61, 93, 125 */
Chris@82 2556 TW = VSUB(TU, TV);
Chris@82 2557 Tbh = VSUB(Tbf, Tbg);
Chris@82 2558 }
Chris@82 2559 {
Chris@82 2560 V Tu, Tbb, Tx, Tbc;
Chris@82 2561 {
Chris@82 2562 V Ts, Tt, Tv, Tw;
Chris@82 2563 Ts = LD(&(xi[WS(is, 21)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2564 Tt = LD(&(xi[WS(is, 85)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2565 Tu = VSUB(Ts, Tt);
Chris@82 2566 Tbb = VADD(Ts, Tt);
Chris@82 2567 Tv = LD(&(xi[WS(is, 117)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2568 Tw = LD(&(xi[WS(is, 53)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2569 Tx = VSUB(Tv, Tw);
Chris@82 2570 Tbc = VADD(Tv, Tw);
Chris@82 2571 }
Chris@82 2572 Ty = VMUL(LDK(KP707106781), VSUB(Tu, Tx));
Chris@82 2573 TeV = VADD(Tbb, Tbc); /* sum of inputs 21, 53, 85, 117 */
Chris@82 2574 TG = VMUL(LDK(KP707106781), VADD(Tu, Tx));
Chris@82 2575 Tbd = VSUB(Tbb, Tbc);
Chris@82 2576 }
Chris@82 2577 {
Chris@82 2578 V TL, Tbi, TO, Tbj;
Chris@82 2579 {
Chris@82 2580 V TJ, TK, TM, TN;
Chris@82 2581 TJ = LD(&(xi[WS(is, 13)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2582 TK = LD(&(xi[WS(is, 77)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2583 TL = VSUB(TJ, TK);
Chris@82 2584 Tbi = VADD(TJ, TK);
Chris@82 2585 TM = LD(&(xi[WS(is, 109)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2586 TN = LD(&(xi[WS(is, 45)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2587 TO = VSUB(TM, TN);
Chris@82 2588 Tbj = VADD(TM, TN);
Chris@82 2589 }
Chris@82 2590 TP = VMUL(LDK(KP707106781), VSUB(TL, TO));
Chris@82 2591 TeY = VADD(Tbi, Tbj); /* sum of inputs 13, 45, 77, 109 */
Chris@82 2592 TX = VMUL(LDK(KP707106781), VADD(TL, TO));
Chris@82 2593 Tbk = VSUB(Tbi, Tbj);
Chris@82 2594 }
Chris@82 2595 {
Chris@82 2596 V Tbe, Tbl, TeW, TeZ;
Chris@82 2597 Tbe = VFNMS(LDK(KP382683432), Tbd, VMUL(LDK(KP923879532), Tba));
Chris@82 2598 Tbl = VFMA(LDK(KP923879532), Tbh, VMUL(LDK(KP382683432), Tbk));
Chris@82 2599 Tbm = VSUB(Tbe, Tbl);
Chris@82 2600 Tdg = VADD(Tbe, Tbl);
Chris@82 2601 {
Chris@82 2602 V TbE, TbF, Tgm, Tgn;
Chris@82 2603 TbE = VFMA(LDK(KP382683432), Tba, VMUL(LDK(KP923879532), Tbd));
Chris@82 2604 TbF = VFNMS(LDK(KP382683432), Tbh, VMUL(LDK(KP923879532), Tbk));
Chris@82 2605 TbG = VSUB(TbE, TbF);
Chris@82 2606 Tdj = VADD(TbE, TbF);
Chris@82 2607 Tgm = VADD(TeU, TeV);
Chris@82 2608 Tgn = VADD(TeX, TeY);
Chris@82 2609 Tgo = VSUB(Tgm, Tgn);
Chris@82 2610 Th4 = VADD(Tgm, Tgn); /* sum of all sixteen inputs loaded in this block */
Chris@82 2611 }
Chris@82 2612 TeW = VSUB(TeU, TeV);
Chris@82 2613 TeZ = VSUB(TeX, TeY);
Chris@82 2614 Tf0 = VMUL(LDK(KP707106781), VSUB(TeW, TeZ));
Chris@82 2615 Tf8 = VMUL(LDK(KP707106781), VADD(TeW, TeZ));
Chris@82 2616 {
Chris@82 2617 V T72, T7b, T75, T7c;
Chris@82 2618 {
Chris@82 2619 V T70, T71, T73, T74;
Chris@82 2620 T70 = VADD(TB, Ty);
Chris@82 2621 T71 = VADD(TF, TG);
Chris@82 2622 T72 = VFMA(LDK(KP980785280), T70, VMUL(LDK(KP195090322), T71));
Chris@82 2623 T7b = VFNMS(LDK(KP195090322), T70, VMUL(LDK(KP980785280), T71));
Chris@82 2624 T73 = VADD(TS, TP);
Chris@82 2625 T74 = VADD(TW, TX);
Chris@82 2626 T75 = VFNMS(LDK(KP195090322), T74, VMUL(LDK(KP980785280), T73));
Chris@82 2627 T7c = VFMA(LDK(KP195090322), T73, VMUL(LDK(KP980785280), T74));
Chris@82 2628 }
Chris@82 2629 T76 = VSUB(T72, T75);
Chris@82 2630 T98 = VADD(T7b, T7c);
Chris@82 2631 T7d = VSUB(T7b, T7c);
Chris@82 2632 T94 = VADD(T72, T75);
Chris@82 2633 }
Chris@82 2634 {
Chris@82 2635 V TI, T1b, TZ, T1c;
Chris@82 2636 {
Chris@82 2637 V TC, TH, TT, TY;
Chris@82 2638 TC = VSUB(Ty, TB);
Chris@82 2639 TH = VSUB(TF, TG);
Chris@82 2640 TI = VFMA(LDK(KP831469612), TC, VMUL(LDK(KP555570233), TH));
Chris@82 2641 T1b = VFNMS(LDK(KP555570233), TC, VMUL(LDK(KP831469612), TH));
Chris@82 2642 TT = VSUB(TP, TS);
Chris@82 2643 TY = VSUB(TW, TX);
Chris@82 2644 TZ = VFNMS(LDK(KP555570233), TY, VMUL(LDK(KP831469612), TT));
Chris@82 2645 T1c = VFMA(LDK(KP555570233), TT, VMUL(LDK(KP831469612), TY));
Chris@82 2646 }
Chris@82 2647 T10 = VSUB(TI, TZ);
Chris@82 2648 T5Y = VADD(T1b, T1c);
Chris@82 2649 T1d = VSUB(T1b, T1c);
Chris@82 2650 T5U = VADD(TI, TZ);
Chris@82 2651 }
Chris@82 2652 }
Chris@82 2653 }
Chris@82 2654 {
/* Input stage for the sixteen samples xi[WS(is, k)] with k = 3, 11, 19, ..., 123
 * (k = 3 mod 8). Samples 64 apart are paired (35/99, 3/67, 27/91, ...) into a
 * sum and a difference; later steps combine them with the constants
 * KP707106781, KP382683432, KP923879532, KP980785280, KP195090322,
 * KP831469612 and KP555570233. Results kept for later are written to
 * temporaries not declared in this block (TbX, Tdn, Tch, Tdq, Tgv, Th7, Tfh,
 * Tfp, T7p, T9f, T7w, T9b, T2f, T65, T2s, T61).
 * NOTE(review): LD, LDK, VFMA and VFNMS are defined outside this chunk; their
 * exact semantics (presumably fused a*b + c and c - a*b) should be confirmed
 * against the SIMD support header. */
Chris@82 2655 V T1Q, Tfb, T1U, TbL, T27, Tfe, T2b, TbS, T1N, Tfc, T1V, TbO, T24, Tff, T2c;
Chris@82 2656 V TbV;
Chris@82 2657 {
Chris@82 2658 V T1O, T1P, TbK, T1S, T1T, TbJ;
Chris@82 2659 T1O = LD(&(xi[WS(is, 35)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2660 T1P = LD(&(xi[WS(is, 99)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2661 TbK = VADD(T1O, T1P); /* xi[35] + xi[99] */
Chris@82 2662 T1S = LD(&(xi[WS(is, 3)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2663 T1T = LD(&(xi[WS(is, 67)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2664 TbJ = VADD(T1S, T1T); /* xi[3] + xi[67] */
Chris@82 2665 T1Q = VSUB(T1O, T1P);
Chris@82 2666 Tfb = VADD(TbJ, TbK); /* sum of inputs 3, 35, 67, 99 */
Chris@82 2667 T1U = VSUB(T1S, T1T);
Chris@82 2668 TbL = VSUB(TbJ, TbK);
Chris@82 2669 }
Chris@82 2670 {
Chris@82 2671 V T25, T26, TbR, T29, T2a, TbQ;
Chris@82 2672 T25 = LD(&(xi[WS(is, 27)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2673 T26 = LD(&(xi[WS(is, 91)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2674 TbR = VADD(T25, T26);
Chris@82 2675 T29 = LD(&(xi[WS(is, 123)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2676 T2a = LD(&(xi[WS(is, 59)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2677 TbQ = VADD(T29, T2a);
Chris@82 2678 T27 = VSUB(T25, T26);
Chris@82 2679 Tfe = VADD(TbQ, TbR); /* sum of inputs 27, 59, 91, 123 */
Chris@82 2680 T2b = VSUB(T29, T2a);
Chris@82 2681 TbS = VSUB(TbQ, TbR);
Chris@82 2682 }
Chris@82 2683 {
Chris@82 2684 V T1J, TbM, T1M, TbN;
Chris@82 2685 {
Chris@82 2686 V T1H, T1I, T1K, T1L;
Chris@82 2687 T1H = LD(&(xi[WS(is, 19)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2688 T1I = LD(&(xi[WS(is, 83)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2689 T1J = VSUB(T1H, T1I);
Chris@82 2690 TbM = VADD(T1H, T1I);
Chris@82 2691 T1K = LD(&(xi[WS(is, 115)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2692 T1L = LD(&(xi[WS(is, 51)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2693 T1M = VSUB(T1K, T1L);
Chris@82 2694 TbN = VADD(T1K, T1L);
Chris@82 2695 }
Chris@82 2696 T1N = VMUL(LDK(KP707106781), VSUB(T1J, T1M));
Chris@82 2697 Tfc = VADD(TbM, TbN); /* sum of inputs 19, 51, 83, 115 */
Chris@82 2698 T1V = VMUL(LDK(KP707106781), VADD(T1J, T1M));
Chris@82 2699 TbO = VSUB(TbM, TbN);
Chris@82 2700 }
Chris@82 2701 {
Chris@82 2702 V T20, TbT, T23, TbU;
Chris@82 2703 {
Chris@82 2704 V T1Y, T1Z, T21, T22;
Chris@82 2705 T1Y = LD(&(xi[WS(is, 11)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2706 T1Z = LD(&(xi[WS(is, 75)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2707 T20 = VSUB(T1Y, T1Z);
Chris@82 2708 TbT = VADD(T1Y, T1Z);
Chris@82 2709 T21 = LD(&(xi[WS(is, 107)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2710 T22 = LD(&(xi[WS(is, 43)]), ivs, &(xi[WS(is, 1)]));
Chris@82 2711 T23 = VSUB(T21, T22);
Chris@82 2712 TbU = VADD(T21, T22);
Chris@82 2713 }
Chris@82 2714 T24 = VMUL(LDK(KP707106781), VSUB(T20, T23));
Chris@82 2715 Tff = VADD(TbT, TbU); /* sum of inputs 11, 43, 75, 107 */
Chris@82 2716 T2c = VMUL(LDK(KP707106781), VADD(T20, T23));
Chris@82 2717 TbV = VSUB(TbT, TbU);
Chris@82 2718 }
Chris@82 2719 {
Chris@82 2720 V TbP, TbW, Tfd, Tfg;
Chris@82 2721 TbP = VFNMS(LDK(KP382683432), TbO, VMUL(LDK(KP923879532), TbL));
Chris@82 2722 TbW = VFMA(LDK(KP923879532), TbS, VMUL(LDK(KP382683432), TbV));
Chris@82 2723 TbX = VSUB(TbP, TbW);
Chris@82 2724 Tdn = VADD(TbP, TbW);
Chris@82 2725 {
Chris@82 2726 V Tcf, Tcg, Tgt, Tgu;
Chris@82 2727 Tcf = VFMA(LDK(KP382683432), TbL, VMUL(LDK(KP923879532), TbO));
Chris@82 2728 Tcg = VFNMS(LDK(KP382683432), TbS, VMUL(LDK(KP923879532), TbV));
Chris@82 2729 Tch = VSUB(Tcf, Tcg);
Chris@82 2730 Tdq = VADD(Tcf, Tcg);
Chris@82 2731 Tgt = VADD(Tfb, Tfc);
Chris@82 2732 Tgu = VADD(Tfe, Tff);
Chris@82 2733 Tgv = VSUB(Tgt, Tgu);
Chris@82 2734 Th7 = VADD(Tgt, Tgu); /* sum of all sixteen inputs loaded in this block */
Chris@82 2735 }
Chris@82 2736 Tfd = VSUB(Tfb, Tfc);
Chris@82 2737 Tfg = VSUB(Tfe, Tff);
Chris@82 2738 Tfh = VMUL(LDK(KP707106781), VSUB(Tfd, Tfg));
Chris@82 2739 Tfp = VMUL(LDK(KP707106781), VADD(Tfd, Tfg));
Chris@82 2740 {
Chris@82 2741 V T7l, T7u, T7o, T7v;
Chris@82 2742 {
Chris@82 2743 V T7j, T7k, T7m, T7n;
Chris@82 2744 T7j = VADD(T1Q, T1N);
Chris@82 2745 T7k = VADD(T1U, T1V);
Chris@82 2746 T7l = VFMA(LDK(KP980785280), T7j, VMUL(LDK(KP195090322), T7k));
Chris@82 2747 T7u = VFNMS(LDK(KP195090322), T7j, VMUL(LDK(KP980785280), T7k));
Chris@82 2748 T7m = VADD(T27, T24);
Chris@82 2749 T7n = VADD(T2b, T2c);
Chris@82 2750 T7o = VFNMS(LDK(KP195090322), T7n, VMUL(LDK(KP980785280), T7m));
Chris@82 2751 T7v = VFMA(LDK(KP195090322), T7m, VMUL(LDK(KP980785280), T7n));
Chris@82 2752 }
Chris@82 2753 T7p = VSUB(T7l, T7o);
Chris@82 2754 T9f = VADD(T7u, T7v);
Chris@82 2755 T7w = VSUB(T7u, T7v);
Chris@82 2756 T9b = VADD(T7l, T7o);
Chris@82 2757 }
Chris@82 2758 {
Chris@82 2759 V T1X, T2q, T2e, T2r;
Chris@82 2760 {
Chris@82 2761 V T1R, T1W, T28, T2d;
Chris@82 2762 T1R = VSUB(T1N, T1Q);
Chris@82 2763 T1W = VSUB(T1U, T1V);
Chris@82 2764 T1X = VFMA(LDK(KP831469612), T1R, VMUL(LDK(KP555570233), T1W));
Chris@82 2765 T2q = VFNMS(LDK(KP555570233), T1R, VMUL(LDK(KP831469612), T1W));
Chris@82 2766 T28 = VSUB(T24, T27);
Chris@82 2767 T2d = VSUB(T2b, T2c);
Chris@82 2768 T2e = VFNMS(LDK(KP555570233), T2d, VMUL(LDK(KP831469612), T28));
Chris@82 2769 T2r = VFMA(LDK(KP555570233), T28, VMUL(LDK(KP831469612), T2d));
Chris@82 2770 }
Chris@82 2771 T2f = VSUB(T1X, T2e);
Chris@82 2772 T65 = VADD(T2q, T2r);
Chris@82 2773 T2s = VSUB(T2q, T2r);
Chris@82 2774 T61 = VADD(T1X, T2e);
Chris@82 2775 }
Chris@82 2776 }
Chris@82 2777 }
Chris@82 2778 {
/* Output stage for xo[WS(os, k)], k = 8, 24, 40, 56, 72, 88, 104, 120.
 * Reads Tgl, Tgo, Tgs, Tgv, TgA, TgD, TgF, TgG, TgK and TgL, none of which is
 * declared in this block, combines them using KP382683432, KP923879532 and
 * KP707106781, and issues the eight ST calls below. Each pair of stores writes
 * the sum and the difference of the same two values to indices k and 128 - k.
 * NOTE(review): VBYI, VFMA, VFNMS and ST are defined outside this chunk; VBYI
 * presumably multiplies by the imaginary unit -- confirm against the SIMD
 * support header. */
Chris@82 2779 V Tgx, TgW, TgR, TgZ, TgI, TgY, TgO, TgV;
Chris@82 2780 {
Chris@82 2781 V Tgp, Tgw, TgP, TgQ;
Chris@82 2782 Tgp = VFNMS(LDK(KP382683432), Tgo, VMUL(LDK(KP923879532), Tgl));
Chris@82 2783 Tgw = VFMA(LDK(KP923879532), Tgs, VMUL(LDK(KP382683432), Tgv));
Chris@82 2784 Tgx = VSUB(Tgp, Tgw);
Chris@82 2785 TgW = VADD(Tgp, Tgw);
Chris@82 2786 TgP = VFMA(LDK(KP382683432), Tgl, VMUL(LDK(KP923879532), Tgo));
Chris@82 2787 TgQ = VFNMS(LDK(KP382683432), Tgs, VMUL(LDK(KP923879532), Tgv));
Chris@82 2788 TgR = VSUB(TgP, TgQ);
Chris@82 2789 TgZ = VADD(TgP, TgQ);
Chris@82 2790 }
Chris@82 2791 {
Chris@82 2792 V TgE, TgH, TgM, TgN;
Chris@82 2793 TgE = VMUL(LDK(KP707106781), VSUB(TgA, TgD));
Chris@82 2794 TgH = VSUB(TgF, TgG);
Chris@82 2795 TgI = VSUB(TgE, TgH);
Chris@82 2796 TgY = VADD(TgH, TgE);
Chris@82 2797 TgM = VSUB(TgK, TgL);
Chris@82 2798 TgN = VMUL(LDK(KP707106781), VADD(TgA, TgD));
Chris@82 2799 TgO = VSUB(TgM, TgN);
Chris@82 2800 TgV = VADD(TgM, TgN);
Chris@82 2801 }
Chris@82 2802 {
Chris@82 2803 V TgJ, TgS, Th1, Th2;
Chris@82 2804 TgJ = VBYI(VSUB(Tgx, TgI));
Chris@82 2805 TgS = VSUB(TgO, TgR);
Chris@82 2806 ST(&(xo[WS(os, 40)]), VADD(TgJ, TgS), ovs, &(xo[0])); /* outputs 40 and 88 */
Chris@82 2807 ST(&(xo[WS(os, 88)]), VSUB(TgS, TgJ), ovs, &(xo[0]));
Chris@82 2808 Th1 = VSUB(TgV, TgW);
Chris@82 2809 Th2 = VBYI(VSUB(TgZ, TgY));
Chris@82 2810 ST(&(xo[WS(os, 72)]), VSUB(Th1, Th2), ovs, &(xo[0])); /* outputs 72 and 56 */
Chris@82 2811 ST(&(xo[WS(os, 56)]), VADD(Th1, Th2), ovs, &(xo[0]));
Chris@82 2812 }
Chris@82 2813 {
Chris@82 2814 V TgT, TgU, TgX, Th0;
Chris@82 2815 TgT = VBYI(VADD(TgI, Tgx));
Chris@82 2816 TgU = VADD(TgO, TgR);
Chris@82 2817 ST(&(xo[WS(os, 24)]), VADD(TgT, TgU), ovs, &(xo[0])); /* outputs 24 and 104 */
Chris@82 2818 ST(&(xo[WS(os, 104)]), VSUB(TgU, TgT), ovs, &(xo[0]));
Chris@82 2819 TgX = VADD(TgV, TgW);
Chris@82 2820 Th0 = VBYI(VADD(TgY, TgZ));
Chris@82 2821 ST(&(xo[WS(os, 120)]), VSUB(TgX, Th0), ovs, &(xo[0])); /* outputs 120 and 8 */
Chris@82 2822 ST(&(xo[WS(os, 8)]), VADD(TgX, Th0), ovs, &(xo[0]));
Chris@82 2823 }
Chris@82 2824 }
Chris@82 2825 {
/* Output stage for xo[WS(os, k)] with k a multiple of 16
 * (0, 16, 32, 48, 64, 80, 96, 112).
 * Reads Th3, Th4, Th6, Th7, Tgy, Tgz, TgB, TgC, TgK, TgL, TgF and TgG, none of
 * which is declared in this block; the only constant used is KP707106781.
 * xo[0] receives Thr + Ths and xo[64] receives Thr - Ths, where Ths sums
 * Th3, Th4, Th6, Th7 and Thr sums Tgy, Tgz, TgB, TgC, TgK, TgL, TgF, TgG.
 * NOTE(review): VBYI and ST are defined outside this chunk; VBYI presumably
 * multiplies by the imaginary unit -- confirm against the SIMD support
 * header. */
Chris@82 2826 V Th9, Thh, Thq, Ths, Thc, Thm, Thg, Thl, Thn, Thr;
Chris@82 2827 {
Chris@82 2828 V Th5, Th8, Tho, Thp;
Chris@82 2829 Th5 = VSUB(Th3, Th4);
Chris@82 2830 Th8 = VSUB(Th6, Th7);
Chris@82 2831 Th9 = VMUL(LDK(KP707106781), VSUB(Th5, Th8));
Chris@82 2832 Thh = VMUL(LDK(KP707106781), VADD(Th5, Th8));
Chris@82 2833 Tho = VADD(Th3, Th4);
Chris@82 2834 Thp = VADD(Th6, Th7);
Chris@82 2835 Thq = VBYI(VSUB(Tho, Thp));
Chris@82 2836 Ths = VADD(Tho, Thp);
Chris@82 2837 }
Chris@82 2838 {
Chris@82 2839 V Tha, Thb, The, Thf;
Chris@82 2840 Tha = VADD(Tgy, Tgz);
Chris@82 2841 Thb = VADD(TgB, TgC);
Chris@82 2842 Thc = VSUB(Tha, Thb);
Chris@82 2843 Thm = VADD(Tha, Thb);
Chris@82 2844 The = VADD(TgK, TgL);
Chris@82 2845 Thf = VADD(TgF, TgG);
Chris@82 2846 Thg = VSUB(The, Thf);
Chris@82 2847 Thl = VADD(The, Thf);
Chris@82 2848 }
Chris@82 2849 Thn = VSUB(Thl, Thm);
Chris@82 2850 ST(&(xo[WS(os, 96)]), VSUB(Thn, Thq), ovs, &(xo[0])); /* outputs 96 and 32 */
Chris@82 2851 ST(&(xo[WS(os, 32)]), VADD(Thn, Thq), ovs, &(xo[0]));
Chris@82 2852 Thr = VADD(Thl, Thm);
Chris@82 2853 ST(&(xo[WS(os, 64)]), VSUB(Thr, Ths), ovs, &(xo[0])); /* outputs 64 and 0 */
Chris@82 2854 ST(&(xo[0]), VADD(Thr, Ths), ovs, &(xo[0]));
Chris@82 2855 {
Chris@82 2856 V Thd, Thi, Thj, Thk;
Chris@82 2857 Thd = VBYI(VSUB(Th9, Thc));
Chris@82 2858 Thi = VSUB(Thg, Thh);
Chris@82 2859 ST(&(xo[WS(os, 48)]), VADD(Thd, Thi), ovs, &(xo[0])); /* outputs 48 and 80 */
Chris@82 2860 ST(&(xo[WS(os, 80)]), VSUB(Thi, Thd), ovs, &(xo[0]));
Chris@82 2861 Thj = VBYI(VADD(Thc, Th9));
Chris@82 2862 Thk = VADD(Thg, Thh);
Chris@82 2863 ST(&(xo[WS(os, 16)]), VADD(Thj, Thk), ovs, &(xo[0])); /* outputs 16 and 112 */
Chris@82 2864 ST(&(xo[WS(os, 112)]), VSUB(Thk, Thj), ovs, &(xo[0]));
Chris@82 2865 }
Chris@82 2866 }
Chris@82 2867 {
/* Output stage for xo[WS(os, k)], k = 12, 20, 44, 52, 76, 84, 108, 116.
 * Reads Tev, TeC, TeK, TeR, Tfu, Tfv, Tfx, TfA, Tf0, Tf3, Tf7, Tf8, Tfh, Tfk,
 * Tfo and Tfp, none of which is declared in this block. It forms differences
 * of those inputs, combines them using KP831469612 and KP555570233, and
 * stores the results. Each pair of stores writes the sum and the difference
 * of the same two values to indices k and 128 - k.
 * NOTE(review): VBYI, VFMA, VFNMS and ST are defined outside this chunk; VBYI
 * presumably multiplies by the imaginary unit -- confirm against the SIMD
 * support header. */
Chris@82 2868 V TeT, TfM, TfC, TfK, Tfs, TfN, TfF, TfJ;
Chris@82 2869 {
Chris@82 2870 V TeD, TeS, Tfw, TfB;
Chris@82 2871 TeD = VSUB(Tev, TeC);
Chris@82 2872 TeS = VSUB(TeK, TeR);
Chris@82 2873 TeT = VSUB(TeD, TeS);
Chris@82 2874 TfM = VADD(TeD, TeS);
Chris@82 2875 Tfw = VSUB(Tfu, Tfv);
Chris@82 2876 TfB = VSUB(Tfx, TfA);
Chris@82 2877 TfC = VSUB(Tfw, TfB);
Chris@82 2878 TfK = VADD(TfB, Tfw);
Chris@82 2879 {
Chris@82 2880 V Tfa, TfD, Tfr, TfE;
Chris@82 2881 {
Chris@82 2882 V Tf4, Tf9, Tfl, Tfq;
Chris@82 2883 Tf4 = VSUB(Tf0, Tf3);
Chris@82 2884 Tf9 = VSUB(Tf7, Tf8);
Chris@82 2885 Tfa = VFMA(LDK(KP831469612), Tf4, VMUL(LDK(KP555570233), Tf9));
Chris@82 2886 TfD = VFNMS(LDK(KP555570233), Tf4, VMUL(LDK(KP831469612), Tf9));
Chris@82 2887 Tfl = VSUB(Tfh, Tfk);
Chris@82 2888 Tfq = VSUB(Tfo, Tfp);
Chris@82 2889 Tfr = VFNMS(LDK(KP555570233), Tfq, VMUL(LDK(KP831469612), Tfl));
Chris@82 2890 TfE = VFMA(LDK(KP555570233), Tfl, VMUL(LDK(KP831469612), Tfq));
Chris@82 2891 }
Chris@82 2892 Tfs = VSUB(Tfa, Tfr);
Chris@82 2893 TfN = VADD(TfD, TfE);
Chris@82 2894 TfF = VSUB(TfD, TfE);
Chris@82 2895 TfJ = VADD(Tfa, Tfr);
Chris@82 2896 }
Chris@82 2897 }
Chris@82 2898 {
Chris@82 2899 V Tft, TfG, TfP, TfQ;
Chris@82 2900 Tft = VADD(TeT, Tfs);
Chris@82 2901 TfG = VBYI(VADD(TfC, TfF));
Chris@82 2902 ST(&(xo[WS(os, 108)]), VSUB(Tft, TfG), ovs, &(xo[0])); /* outputs 108 and 20 */
Chris@82 2903 ST(&(xo[WS(os, 20)]), VADD(Tft, TfG), ovs, &(xo[0]));
Chris@82 2904 TfP = VBYI(VADD(TfK, TfJ));
Chris@82 2905 TfQ = VADD(TfM, TfN);
Chris@82 2906 ST(&(xo[WS(os, 12)]), VADD(TfP, TfQ), ovs, &(xo[0])); /* outputs 12 and 116 */
Chris@82 2907 ST(&(xo[WS(os, 116)]), VSUB(TfQ, TfP), ovs, &(xo[0]));
Chris@82 2908 }
Chris@82 2909 {
Chris@82 2910 V TfH, TfI, TfL, TfO;
Chris@82 2911 TfH = VSUB(TeT, Tfs);
Chris@82 2912 TfI = VBYI(VSUB(TfF, TfC));
Chris@82 2913 ST(&(xo[WS(os, 84)]), VSUB(TfH, TfI), ovs, &(xo[0])); /* outputs 84 and 44 */
Chris@82 2914 ST(&(xo[WS(os, 44)]), VADD(TfH, TfI), ovs, &(xo[0]));
Chris@82 2915 TfL = VBYI(VSUB(TfJ, TfK));
Chris@82 2916 TfO = VSUB(TfM, TfN);
Chris@82 2917 ST(&(xo[WS(os, 52)]), VADD(TfL, TfO), ovs, &(xo[0])); /* outputs 52 and 76 */
Chris@82 2918 ST(&(xo[WS(os, 76)]), VSUB(TfO, TfL), ovs, &(xo[0]));
Chris@82 2919 }
Chris@82 2920 }
Chris@82 2921 {
/* Output stage for xo[WS(os, k)], k = 4, 28, 36, 60, 68, 92, 100, 124.
 * Reads Tev, TeC, TeK, TeR, Tfu, Tfv, Tfx, TfA, Tf0, Tf3, Tf7, Tf8, Tfh, Tfk,
 * Tfo and Tfp, none of which is declared in this block. It forms sums of
 * those inputs, combines them using KP980785280 and KP195090322, and stores
 * the results. Each pair of stores writes the sum and the difference of the
 * same two values to indices k and 128 - k.
 * NOTE(review): VBYI, VFMA, VFNMS and ST are defined outside this chunk; VBYI
 * presumably multiplies by the imaginary unit -- confirm against the SIMD
 * support header. */
Chris@82 2922 V TfT, Tge, Tg4, Tgc, Tg0, Tgf, Tg7, Tgb;
Chris@82 2923 {
Chris@82 2924 V TfR, TfS, Tg2, Tg3;
Chris@82 2925 TfR = VADD(Tev, TeC);
Chris@82 2926 TfS = VADD(Tfu, Tfv);
Chris@82 2927 TfT = VSUB(TfR, TfS);
Chris@82 2928 Tge = VADD(TfR, TfS);
Chris@82 2929 Tg2 = VADD(TeK, TeR);
Chris@82 2930 Tg3 = VADD(TfA, Tfx);
Chris@82 2931 Tg4 = VSUB(Tg2, Tg3);
Chris@82 2932 Tgc = VADD(Tg3, Tg2);
Chris@82 2933 {
Chris@82 2934 V TfW, Tg5, TfZ, Tg6;
Chris@82 2935 {
Chris@82 2936 V TfU, TfV, TfX, TfY;
Chris@82 2937 TfU = VADD(Tf3, Tf0);
Chris@82 2938 TfV = VADD(Tf7, Tf8);
Chris@82 2939 TfW = VFMA(LDK(KP980785280), TfU, VMUL(LDK(KP195090322), TfV));
Chris@82 2940 Tg5 = VFNMS(LDK(KP195090322), TfU, VMUL(LDK(KP980785280), TfV));
Chris@82 2941 TfX = VADD(Tfk, Tfh);
Chris@82 2942 TfY = VADD(Tfo, Tfp);
Chris@82 2943 TfZ = VFNMS(LDK(KP195090322), TfY, VMUL(LDK(KP980785280), TfX));
Chris@82 2944 Tg6 = VFMA(LDK(KP195090322), TfX, VMUL(LDK(KP980785280), TfY));
Chris@82 2945 }
Chris@82 2946 Tg0 = VSUB(TfW, TfZ);
Chris@82 2947 Tgf = VADD(Tg5, Tg6);
Chris@82 2948 Tg7 = VSUB(Tg5, Tg6);
Chris@82 2949 Tgb = VADD(TfW, TfZ);
Chris@82 2950 }
Chris@82 2951 }
Chris@82 2952 {
Chris@82 2953 V Tg1, Tg8, Tgh, Tgi;
Chris@82 2954 Tg1 = VADD(TfT, Tg0);
Chris@82 2955 Tg8 = VBYI(VADD(Tg4, Tg7));
Chris@82 2956 ST(&(xo[WS(os, 100)]), VSUB(Tg1, Tg8), ovs, &(xo[0])); /* outputs 100 and 28 */
Chris@82 2957 ST(&(xo[WS(os, 28)]), VADD(Tg1, Tg8), ovs, &(xo[0]));
Chris@82 2958 Tgh = VBYI(VADD(Tgc, Tgb));
Chris@82 2959 Tgi = VADD(Tge, Tgf);
Chris@82 2960 ST(&(xo[WS(os, 4)]), VADD(Tgh, Tgi), ovs, &(xo[0])); /* outputs 4 and 124 */
Chris@82 2961 ST(&(xo[WS(os, 124)]), VSUB(Tgi, Tgh), ovs, &(xo[0]));
Chris@82 2962 }
Chris@82 2963 {
Chris@82 2964 V Tg9, Tga, Tgd, Tgg;
Chris@82 2965 Tg9 = VSUB(TfT, Tg0);
Chris@82 2966 Tga = VBYI(VSUB(Tg7, Tg4));
Chris@82 2967 ST(&(xo[WS(os, 92)]), VSUB(Tg9, Tga), ovs, &(xo[0])); /* outputs 92 and 36 */
Chris@82 2968 ST(&(xo[WS(os, 36)]), VADD(Tg9, Tga), ovs, &(xo[0]));
Chris@82 2969 Tgd = VBYI(VSUB(Tgb, Tgc));
Chris@82 2970 Tgg = VSUB(Tge, Tgf);
Chris@82 2971 ST(&(xo[WS(os, 60)]), VADD(Tgd, Tgg), ovs, &(xo[0])); /* outputs 60 and 68 */
Chris@82 2972 ST(&(xo[WS(os, 68)]), VSUB(Tgg, Tgd), ovs, &(xo[0]));
Chris@82 2973 }
Chris@82 2974 }
Chris@82 2975 {
Chris@82 2976 V Tb7, Td8, TcI, Td0, Tcy, Tda, TcG, TcP, Tck, TcJ, TcB, TcF, TcW, Tdb, Td3;
Chris@82 2977 V Td7;
Chris@82 2978 {
Chris@82 2979 V Tax, TcZ, Tb6, TcY, TaO, Tb5;
Chris@82 2980 Tax = VSUB(Tah, Taw);
Chris@82 2981 TcZ = VADD(Tcw, Tcr);
Chris@82 2982 TaO = VFMA(LDK(KP831469612), TaI, VMUL(LDK(KP555570233), TaN));
Chris@82 2983 Tb5 = VFNMS(LDK(KP555570233), Tb4, VMUL(LDK(KP831469612), TaZ));
Chris@82 2984 Tb6 = VSUB(TaO, Tb5);
Chris@82 2985 TcY = VADD(TaO, Tb5);
Chris@82 2986 Tb7 = VSUB(Tax, Tb6);
Chris@82 2987 Td8 = VADD(TcZ, TcY);
Chris@82 2988 TcI = VADD(Tax, Tb6);
Chris@82 2989 Td0 = VSUB(TcY, TcZ);
Chris@82 2990 }
Chris@82 2991 {
Chris@82 2992 V Tcx, TcN, Tco, TcO, Tcm, Tcn;
Chris@82 2993 Tcx = VSUB(Tcr, Tcw);
Chris@82 2994 TcN = VADD(Tah, Taw);
Chris@82 2995 Tcm = VFNMS(LDK(KP555570233), TaI, VMUL(LDK(KP831469612), TaN));
Chris@82 2996 Tcn = VFMA(LDK(KP555570233), TaZ, VMUL(LDK(KP831469612), Tb4));
Chris@82 2997 Tco = VSUB(Tcm, Tcn);
Chris@82 2998 TcO = VADD(Tcm, Tcn);
Chris@82 2999 Tcy = VSUB(Tco, Tcx);
Chris@82 3000 Tda = VADD(TcN, TcO);
Chris@82 3001 TcG = VADD(Tcx, Tco);
Chris@82 3002 TcP = VSUB(TcN, TcO);
Chris@82 3003 }
Chris@82 3004 {
Chris@82 3005 V TbI, Tcz, Tcj, TcA;
Chris@82 3006 {
Chris@82 3007 V Tby, TbH, Tc9, Tci;
Chris@82 3008 Tby = VSUB(Tbm, Tbx);
Chris@82 3009 TbH = VSUB(TbD, TbG);
Chris@82 3010 TbI = VFMA(LDK(KP881921264), Tby, VMUL(LDK(KP471396736), TbH));
Chris@82 3011 Tcz = VFNMS(LDK(KP471396736), Tby, VMUL(LDK(KP881921264), TbH));
Chris@82 3012 Tc9 = VSUB(TbX, Tc8);
Chris@82 3013 Tci = VSUB(Tce, Tch);
Chris@82 3014 Tcj = VFNMS(LDK(KP471396736), Tci, VMUL(LDK(KP881921264), Tc9));
Chris@82 3015 TcA = VFMA(LDK(KP471396736), Tc9, VMUL(LDK(KP881921264), Tci));
Chris@82 3016 }
Chris@82 3017 Tck = VSUB(TbI, Tcj);
Chris@82 3018 TcJ = VADD(Tcz, TcA);
Chris@82 3019 TcB = VSUB(Tcz, TcA);
Chris@82 3020 TcF = VADD(TbI, Tcj);
Chris@82 3021 }
Chris@82 3022 {
Chris@82 3023 V TcS, Td1, TcV, Td2;
Chris@82 3024 {
Chris@82 3025 V TcQ, TcR, TcT, TcU;
Chris@82 3026 TcQ = VADD(Tbx, Tbm);
Chris@82 3027 TcR = VADD(TbD, TbG);
Chris@82 3028 TcS = VFMA(LDK(KP956940335), TcQ, VMUL(LDK(KP290284677), TcR));
Chris@82 3029 Td1 = VFNMS(LDK(KP290284677), TcQ, VMUL(LDK(KP956940335), TcR));
Chris@82 3030 TcT = VADD(Tc8, TbX);
Chris@82 3031 TcU = VADD(Tce, Tch);
Chris@82 3032 TcV = VFNMS(LDK(KP290284677), TcU, VMUL(LDK(KP956940335), TcT));
Chris@82 3033 Td2 = VFMA(LDK(KP290284677), TcT, VMUL(LDK(KP956940335), TcU));
Chris@82 3034 }
Chris@82 3035 TcW = VSUB(TcS, TcV);
Chris@82 3036 Tdb = VADD(Td1, Td2);
Chris@82 3037 Td3 = VSUB(Td1, Td2);
Chris@82 3038 Td7 = VADD(TcS, TcV);
Chris@82 3039 }
Chris@82 3040 {
Chris@82 3041 V Tcl, TcC, Td9, Tdc;
Chris@82 3042 Tcl = VADD(Tb7, Tck);
Chris@82 3043 TcC = VBYI(VADD(Tcy, TcB));
Chris@82 3044 ST(&(xo[WS(os, 106)]), VSUB(Tcl, TcC), ovs, &(xo[0]));
Chris@82 3045 ST(&(xo[WS(os, 22)]), VADD(Tcl, TcC), ovs, &(xo[0]));
Chris@82 3046 Td9 = VBYI(VSUB(Td7, Td8));
Chris@82 3047 Tdc = VSUB(Tda, Tdb);
Chris@82 3048 ST(&(xo[WS(os, 58)]), VADD(Td9, Tdc), ovs, &(xo[0]));
Chris@82 3049 ST(&(xo[WS(os, 70)]), VSUB(Tdc, Td9), ovs, &(xo[0]));
Chris@82 3050 }
Chris@82 3051 {
Chris@82 3052 V Tdd, Tde, TcD, TcE;
Chris@82 3053 Tdd = VBYI(VADD(Td8, Td7));
Chris@82 3054 Tde = VADD(Tda, Tdb);
Chris@82 3055 ST(&(xo[WS(os, 6)]), VADD(Tdd, Tde), ovs, &(xo[0]));
Chris@82 3056 ST(&(xo[WS(os, 122)]), VSUB(Tde, Tdd), ovs, &(xo[0]));
Chris@82 3057 TcD = VSUB(Tb7, Tck);
Chris@82 3058 TcE = VBYI(VSUB(TcB, Tcy));
Chris@82 3059 ST(&(xo[WS(os, 86)]), VSUB(TcD, TcE), ovs, &(xo[0]));
Chris@82 3060 ST(&(xo[WS(os, 42)]), VADD(TcD, TcE), ovs, &(xo[0]));
Chris@82 3061 }
Chris@82 3062 {
Chris@82 3063 V TcH, TcK, TcX, Td4;
Chris@82 3064 TcH = VBYI(VSUB(TcF, TcG));
Chris@82 3065 TcK = VSUB(TcI, TcJ);
Chris@82 3066 ST(&(xo[WS(os, 54)]), VADD(TcH, TcK), ovs, &(xo[0]));
Chris@82 3067 ST(&(xo[WS(os, 74)]), VSUB(TcK, TcH), ovs, &(xo[0]));
Chris@82 3068 TcX = VADD(TcP, TcW);
Chris@82 3069 Td4 = VBYI(VADD(Td0, Td3));
Chris@82 3070 ST(&(xo[WS(os, 102)]), VSUB(TcX, Td4), ovs, &(xo[0]));
Chris@82 3071 ST(&(xo[WS(os, 26)]), VADD(TcX, Td4), ovs, &(xo[0]));
Chris@82 3072 }
Chris@82 3073 {
Chris@82 3074 V Td5, Td6, TcL, TcM;
Chris@82 3075 Td5 = VSUB(TcP, TcW);
Chris@82 3076 Td6 = VBYI(VSUB(Td3, Td0));
Chris@82 3077 ST(&(xo[WS(os, 90)]), VSUB(Td5, Td6), ovs, &(xo[0]));
Chris@82 3078 ST(&(xo[WS(os, 38)]), VADD(Td5, Td6), ovs, &(xo[0]));
Chris@82 3079 TcL = VBYI(VADD(TcG, TcF));
Chris@82 3080 TcM = VADD(TcI, TcJ);
Chris@82 3081 ST(&(xo[WS(os, 10)]), VADD(TcL, TcM), ovs, &(xo[0]));
Chris@82 3082 ST(&(xo[WS(os, 118)]), VSUB(TcM, TcL), ovs, &(xo[0]));
Chris@82 3083 }
Chris@82 3084 }
Chris@82 3085 {
Chris@82 3086 V TdE, Tel, TdW, Tee, TdM, Teo, TdT, Tea, Tdt, TdX, TdP, TdU, Te7, Tep, Teh;
Chris@82 3087 V Tem;
Chris@82 3088 {
Chris@82 3089 V TdD, Tec, TdA, Ted, Tdw, Tdz;
Chris@82 3090 TdD = VADD(TdB, TdC);
Chris@82 3091 Tec = VSUB(TdG, TdH);
Chris@82 3092 Tdw = VFMA(LDK(KP980785280), Tdu, VMUL(LDK(KP195090322), Tdv));
Chris@82 3093 Tdz = VFNMS(LDK(KP195090322), Tdy, VMUL(LDK(KP980785280), Tdx));
Chris@82 3094 TdA = VADD(Tdw, Tdz);
Chris@82 3095 Ted = VSUB(Tdw, Tdz);
Chris@82 3096 TdE = VSUB(TdA, TdD);
Chris@82 3097 Tel = VADD(Tec, Ted);
Chris@82 3098 TdW = VADD(TdD, TdA);
Chris@82 3099 Tee = VSUB(Tec, Ted);
Chris@82 3100 }
Chris@82 3101 {
Chris@82 3102 V TdI, Te9, TdL, Te8, TdJ, TdK;
Chris@82 3103 TdI = VADD(TdG, TdH);
Chris@82 3104 Te9 = VSUB(TdC, TdB);
Chris@82 3105 TdJ = VFNMS(LDK(KP195090322), Tdu, VMUL(LDK(KP980785280), Tdv));
Chris@82 3106 TdK = VFMA(LDK(KP195090322), Tdx, VMUL(LDK(KP980785280), Tdy));
Chris@82 3107 TdL = VADD(TdJ, TdK);
Chris@82 3108 Te8 = VSUB(TdJ, TdK);
Chris@82 3109 TdM = VSUB(TdI, TdL);
Chris@82 3110 Teo = VADD(Te9, Te8);
Chris@82 3111 TdT = VADD(TdI, TdL);
Chris@82 3112 Tea = VSUB(Te8, Te9);
Chris@82 3113 }
Chris@82 3114 {
Chris@82 3115 V Tdl, TdN, Tds, TdO;
Chris@82 3116 {
Chris@82 3117 V Tdh, Tdk, Tdo, Tdr;
Chris@82 3118 Tdh = VADD(Tdf, Tdg);
Chris@82 3119 Tdk = VADD(Tdi, Tdj);
Chris@82 3120 Tdl = VFNMS(LDK(KP098017140), Tdk, VMUL(LDK(KP995184726), Tdh));
Chris@82 3121 TdN = VFMA(LDK(KP098017140), Tdh, VMUL(LDK(KP995184726), Tdk));
Chris@82 3122 Tdo = VADD(Tdm, Tdn);
Chris@82 3123 Tdr = VADD(Tdp, Tdq);
Chris@82 3124 Tds = VFMA(LDK(KP995184726), Tdo, VMUL(LDK(KP098017140), Tdr));
Chris@82 3125 TdO = VFNMS(LDK(KP098017140), Tdo, VMUL(LDK(KP995184726), Tdr));
Chris@82 3126 }
Chris@82 3127 Tdt = VSUB(Tdl, Tds);
Chris@82 3128 TdX = VADD(TdN, TdO);
Chris@82 3129 TdP = VSUB(TdN, TdO);
Chris@82 3130 TdU = VADD(Tdl, Tds);
Chris@82 3131 }
Chris@82 3132 {
Chris@82 3133 V Te3, Tef, Te6, Teg;
Chris@82 3134 {
Chris@82 3135 V Te1, Te2, Te4, Te5;
Chris@82 3136 Te1 = VSUB(Tdf, Tdg);
Chris@82 3137 Te2 = VSUB(Tdj, Tdi);
Chris@82 3138 Te3 = VFNMS(LDK(KP634393284), Te2, VMUL(LDK(KP773010453), Te1));
Chris@82 3139 Tef = VFMA(LDK(KP634393284), Te1, VMUL(LDK(KP773010453), Te2));
Chris@82 3140 Te4 = VSUB(Tdm, Tdn);
Chris@82 3141 Te5 = VSUB(Tdq, Tdp);
Chris@82 3142 Te6 = VFMA(LDK(KP773010453), Te4, VMUL(LDK(KP634393284), Te5));
Chris@82 3143 Teg = VFNMS(LDK(KP634393284), Te4, VMUL(LDK(KP773010453), Te5));
Chris@82 3144 }
Chris@82 3145 Te7 = VSUB(Te3, Te6);
Chris@82 3146 Tep = VADD(Tef, Teg);
Chris@82 3147 Teh = VSUB(Tef, Teg);
Chris@82 3148 Tem = VADD(Te3, Te6);
Chris@82 3149 }
Chris@82 3150 {
Chris@82 3151 V TdF, TdQ, Ten, Teq;
Chris@82 3152 TdF = VBYI(VSUB(Tdt, TdE));
Chris@82 3153 TdQ = VSUB(TdM, TdP);
Chris@82 3154 ST(&(xo[WS(os, 34)]), VADD(TdF, TdQ), ovs, &(xo[0]));
Chris@82 3155 ST(&(xo[WS(os, 94)]), VSUB(TdQ, TdF), ovs, &(xo[0]));
Chris@82 3156 Ten = VADD(Tel, Tem);
Chris@82 3157 Teq = VBYI(VADD(Teo, Tep));
Chris@82 3158 ST(&(xo[WS(os, 114)]), VSUB(Ten, Teq), ovs, &(xo[0]));
Chris@82 3159 ST(&(xo[WS(os, 14)]), VADD(Ten, Teq), ovs, &(xo[0]));
Chris@82 3160 }
Chris@82 3161 {
Chris@82 3162 V Ter, Tes, TdR, TdS;
Chris@82 3163 Ter = VSUB(Tel, Tem);
Chris@82 3164 Tes = VBYI(VSUB(Tep, Teo));
Chris@82 3165 ST(&(xo[WS(os, 78)]), VSUB(Ter, Tes), ovs, &(xo[0]));
Chris@82 3166 ST(&(xo[WS(os, 50)]), VADD(Ter, Tes), ovs, &(xo[0]));
Chris@82 3167 TdR = VBYI(VADD(TdE, Tdt));
Chris@82 3168 TdS = VADD(TdM, TdP);
Chris@82 3169 ST(&(xo[WS(os, 30)]), VADD(TdR, TdS), ovs, &(xo[0]));
Chris@82 3170 ST(&(xo[WS(os, 98)]), VSUB(TdS, TdR), ovs, &(xo[0]));
Chris@82 3171 }
Chris@82 3172 {
Chris@82 3173 V TdV, TdY, Teb, Tei;
Chris@82 3174 TdV = VADD(TdT, TdU);
Chris@82 3175 TdY = VBYI(VADD(TdW, TdX));
Chris@82 3176 ST(&(xo[WS(os, 126)]), VSUB(TdV, TdY), ovs, &(xo[0]));
Chris@82 3177 ST(&(xo[WS(os, 2)]), VADD(TdV, TdY), ovs, &(xo[0]));
Chris@82 3178 Teb = VBYI(VSUB(Te7, Tea));
Chris@82 3179 Tei = VSUB(Tee, Teh);
Chris@82 3180 ST(&(xo[WS(os, 46)]), VADD(Teb, Tei), ovs, &(xo[0]));
Chris@82 3181 ST(&(xo[WS(os, 82)]), VSUB(Tei, Teb), ovs, &(xo[0]));
Chris@82 3182 }
Chris@82 3183 {
Chris@82 3184 V Tej, Tek, TdZ, Te0;
Chris@82 3185 Tej = VBYI(VADD(Tea, Te7));
Chris@82 3186 Tek = VADD(Tee, Teh);
Chris@82 3187 ST(&(xo[WS(os, 18)]), VADD(Tej, Tek), ovs, &(xo[0]));
Chris@82 3188 ST(&(xo[WS(os, 110)]), VSUB(Tek, Tej), ovs, &(xo[0]));
Chris@82 3189 TdZ = VSUB(TdT, TdU);
Chris@82 3190 Te0 = VBYI(VSUB(TdX, TdW));
Chris@82 3191 ST(&(xo[WS(os, 66)]), VSUB(TdZ, Te0), ovs, &(xo[0]));
Chris@82 3192 ST(&(xo[WS(os, 62)]), VADD(TdZ, Te0), ovs, &(xo[0]));
Chris@82 3193 }
Chris@82 3194 }
Chris@82 3195 {
Chris@82 3196 V T7z, T8n, T8f, T8k, T8x, T8P, T8H, T8M, T80, T8L, T8O, T8c, T8j, T8A, T8E;
Chris@82 3197 V T8m;
Chris@82 3198 {
Chris@82 3199 V T7f, T8d, T7y, T8e;
Chris@82 3200 {
Chris@82 3201 V T77, T7e, T7q, T7x;
Chris@82 3202 T77 = VADD(T6Z, T76);
Chris@82 3203 T7e = VADD(T7a, T7d);
Chris@82 3204 T7f = VFNMS(LDK(KP336889853), T7e, VMUL(LDK(KP941544065), T77));
Chris@82 3205 T8d = VFMA(LDK(KP336889853), T77, VMUL(LDK(KP941544065), T7e));
Chris@82 3206 T7q = VADD(T7i, T7p);
Chris@82 3207 T7x = VADD(T7t, T7w);
Chris@82 3208 T7y = VFMA(LDK(KP941544065), T7q, VMUL(LDK(KP336889853), T7x));
Chris@82 3209 T8e = VFNMS(LDK(KP336889853), T7q, VMUL(LDK(KP941544065), T7x));
Chris@82 3210 }
Chris@82 3211 T7z = VSUB(T7f, T7y);
Chris@82 3212 T8n = VADD(T8d, T8e);
Chris@82 3213 T8f = VSUB(T8d, T8e);
Chris@82 3214 T8k = VADD(T7f, T7y);
Chris@82 3215 }
Chris@82 3216 {
Chris@82 3217 V T8t, T8F, T8w, T8G;
Chris@82 3218 {
Chris@82 3219 V T8r, T8s, T8u, T8v;
Chris@82 3220 T8r = VSUB(T6Z, T76);
Chris@82 3221 T8s = VSUB(T7d, T7a);
Chris@82 3222 T8t = VFNMS(LDK(KP427555093), T8s, VMUL(LDK(KP903989293), T8r));
Chris@82 3223 T8F = VFMA(LDK(KP427555093), T8r, VMUL(LDK(KP903989293), T8s));
Chris@82 3224 T8u = VSUB(T7i, T7p);
Chris@82 3225 T8v = VSUB(T7w, T7t);
Chris@82 3226 T8w = VFMA(LDK(KP903989293), T8u, VMUL(LDK(KP427555093), T8v));
Chris@82 3227 T8G = VFNMS(LDK(KP427555093), T8u, VMUL(LDK(KP903989293), T8v));
Chris@82 3228 }
Chris@82 3229 T8x = VSUB(T8t, T8w);
Chris@82 3230 T8P = VADD(T8F, T8G);
Chris@82 3231 T8H = VSUB(T8F, T8G);
Chris@82 3232 T8M = VADD(T8t, T8w);
Chris@82 3233 }
Chris@82 3234 {
Chris@82 3235 V T7Z, T8z, T88, T8C, T7O, T8D, T8b, T8y, T7Y, T87;
Chris@82 3236 T7Y = VSUB(T7U, T7X);
Chris@82 3237 T7Z = VADD(T7R, T7Y);
Chris@82 3238 T8z = VSUB(T7Y, T7R);
Chris@82 3239 T87 = VSUB(T85, T86);
Chris@82 3240 T88 = VADD(T84, T87);
Chris@82 3241 T8C = VSUB(T84, T87);
Chris@82 3242 {
Chris@82 3243 V T7G, T7N, T89, T8a;
Chris@82 3244 T7G = VFMA(LDK(KP634393284), T7C, VMUL(LDK(KP773010453), T7F));
Chris@82 3245 T7N = VFNMS(LDK(KP634393284), T7M, VMUL(LDK(KP773010453), T7J));
Chris@82 3246 T7O = VADD(T7G, T7N);
Chris@82 3247 T8D = VSUB(T7G, T7N);
Chris@82 3248 T89 = VFNMS(LDK(KP634393284), T7F, VMUL(LDK(KP773010453), T7C));
Chris@82 3249 T8a = VFMA(LDK(KP773010453), T7M, VMUL(LDK(KP634393284), T7J));
Chris@82 3250 T8b = VADD(T89, T8a);
Chris@82 3251 T8y = VSUB(T89, T8a);
Chris@82 3252 }
Chris@82 3253 T80 = VSUB(T7O, T7Z);
Chris@82 3254 T8L = VADD(T8C, T8D);
Chris@82 3255 T8O = VADD(T8z, T8y);
Chris@82 3256 T8c = VSUB(T88, T8b);
Chris@82 3257 T8j = VADD(T88, T8b);
Chris@82 3258 T8A = VSUB(T8y, T8z);
Chris@82 3259 T8E = VSUB(T8C, T8D);
Chris@82 3260 T8m = VADD(T7Z, T7O);
Chris@82 3261 }
Chris@82 3262 {
Chris@82 3263 V T81, T8g, T8N, T8Q;
Chris@82 3264 T81 = VBYI(VSUB(T7z, T80));
Chris@82 3265 T8g = VSUB(T8c, T8f);
Chris@82 3266 ST(&(xo[WS(os, 39)]), VADD(T81, T8g), ovs, &(xo[WS(os, 1)]));
Chris@82 3267 ST(&(xo[WS(os, 89)]), VSUB(T8g, T81), ovs, &(xo[WS(os, 1)]));
Chris@82 3268 T8N = VADD(T8L, T8M);
Chris@82 3269 T8Q = VBYI(VADD(T8O, T8P));
Chris@82 3270 ST(&(xo[WS(os, 119)]), VSUB(T8N, T8Q), ovs, &(xo[WS(os, 1)]));
Chris@82 3271 ST(&(xo[WS(os, 9)]), VADD(T8N, T8Q), ovs, &(xo[WS(os, 1)]));
Chris@82 3272 }
Chris@82 3273 {
Chris@82 3274 V T8R, T8S, T8h, T8i;
Chris@82 3275 T8R = VSUB(T8L, T8M);
Chris@82 3276 T8S = VBYI(VSUB(T8P, T8O));
Chris@82 3277 ST(&(xo[WS(os, 73)]), VSUB(T8R, T8S), ovs, &(xo[WS(os, 1)]));
Chris@82 3278 ST(&(xo[WS(os, 55)]), VADD(T8R, T8S), ovs, &(xo[WS(os, 1)]));
Chris@82 3279 T8h = VBYI(VADD(T80, T7z));
Chris@82 3280 T8i = VADD(T8c, T8f);
Chris@82 3281 ST(&(xo[WS(os, 25)]), VADD(T8h, T8i), ovs, &(xo[WS(os, 1)]));
Chris@82 3282 ST(&(xo[WS(os, 103)]), VSUB(T8i, T8h), ovs, &(xo[WS(os, 1)]));
Chris@82 3283 }
Chris@82 3284 {
Chris@82 3285 V T8l, T8o, T8B, T8I;
Chris@82 3286 T8l = VADD(T8j, T8k);
Chris@82 3287 T8o = VBYI(VADD(T8m, T8n));
Chris@82 3288 ST(&(xo[WS(os, 121)]), VSUB(T8l, T8o), ovs, &(xo[WS(os, 1)]));
Chris@82 3289 ST(&(xo[WS(os, 7)]), VADD(T8l, T8o), ovs, &(xo[WS(os, 1)]));
Chris@82 3290 T8B = VBYI(VSUB(T8x, T8A));
Chris@82 3291 T8I = VSUB(T8E, T8H);
Chris@82 3292 ST(&(xo[WS(os, 41)]), VADD(T8B, T8I), ovs, &(xo[WS(os, 1)]));
Chris@82 3293 ST(&(xo[WS(os, 87)]), VSUB(T8I, T8B), ovs, &(xo[WS(os, 1)]));
Chris@82 3294 }
Chris@82 3295 {
Chris@82 3296 V T8J, T8K, T8p, T8q;
Chris@82 3297 T8J = VBYI(VADD(T8A, T8x));
Chris@82 3298 T8K = VADD(T8E, T8H);
Chris@82 3299 ST(&(xo[WS(os, 23)]), VADD(T8J, T8K), ovs, &(xo[WS(os, 1)]));
Chris@82 3300 ST(&(xo[WS(os, 105)]), VSUB(T8K, T8J), ovs, &(xo[WS(os, 1)]));
Chris@82 3301 T8p = VSUB(T8j, T8k);
Chris@82 3302 T8q = VBYI(VSUB(T8n, T8m));
Chris@82 3303 ST(&(xo[WS(os, 71)]), VSUB(T8p, T8q), ovs, &(xo[WS(os, 1)]));
Chris@82 3304 ST(&(xo[WS(os, 57)]), VADD(T8p, T8q), ovs, &(xo[WS(os, 1)]));
Chris@82 3305 }
Chris@82 3306 }
Chris@82 3307 {
Chris@82 3308 V T2v, T5d, T55, T5a, T5n, T5F, T5x, T5C, T4K, T5B, T5E, T52, T59, T5q, T5u;
Chris@82 3309 V T5c;
Chris@82 3310 {
Chris@82 3311 V T1f, T53, T2u, T54;
Chris@82 3312 {
Chris@82 3313 V T11, T1e, T2g, T2t;
Chris@82 3314 T11 = VADD(Tr, T10);
Chris@82 3315 T1e = VADD(T1a, T1d);
Chris@82 3316 T1f = VFNMS(LDK(KP242980179), T1e, VMUL(LDK(KP970031253), T11));
Chris@82 3317 T53 = VFMA(LDK(KP242980179), T11, VMUL(LDK(KP970031253), T1e));
Chris@82 3318 T2g = VADD(T1G, T2f);
Chris@82 3319 T2t = VADD(T2p, T2s);
Chris@82 3320 T2u = VFMA(LDK(KP970031253), T2g, VMUL(LDK(KP242980179), T2t));
Chris@82 3321 T54 = VFNMS(LDK(KP242980179), T2g, VMUL(LDK(KP970031253), T2t));
Chris@82 3322 }
Chris@82 3323 T2v = VSUB(T1f, T2u);
Chris@82 3324 T5d = VADD(T53, T54);
Chris@82 3325 T55 = VSUB(T53, T54);
Chris@82 3326 T5a = VADD(T1f, T2u);
Chris@82 3327 }
Chris@82 3328 {
Chris@82 3329 V T5j, T5v, T5m, T5w;
Chris@82 3330 {
Chris@82 3331 V T5h, T5i, T5k, T5l;
Chris@82 3332 T5h = VSUB(Tr, T10);
Chris@82 3333 T5i = VSUB(T1d, T1a);
Chris@82 3334 T5j = VFNMS(LDK(KP514102744), T5i, VMUL(LDK(KP857728610), T5h));
Chris@82 3335 T5v = VFMA(LDK(KP514102744), T5h, VMUL(LDK(KP857728610), T5i));
Chris@82 3336 T5k = VSUB(T1G, T2f);
Chris@82 3337 T5l = VSUB(T2s, T2p);
Chris@82 3338 T5m = VFMA(LDK(KP857728610), T5k, VMUL(LDK(KP514102744), T5l));
Chris@82 3339 T5w = VFNMS(LDK(KP514102744), T5k, VMUL(LDK(KP857728610), T5l));
Chris@82 3340 }
Chris@82 3341 T5n = VSUB(T5j, T5m);
Chris@82 3342 T5F = VADD(T5v, T5w);
Chris@82 3343 T5x = VSUB(T5v, T5w);
Chris@82 3344 T5C = VADD(T5j, T5m);
Chris@82 3345 }
Chris@82 3346 {
Chris@82 3347 V T4J, T5p, T4Y, T5s, T3I, T5t, T51, T5o, T4I, T4X;
Chris@82 3348 T4I = VSUB(T4q, T4H);
Chris@82 3349 T4J = VADD(T49, T4I);
Chris@82 3350 T5p = VSUB(T4I, T49);
Chris@82 3351 T4X = VSUB(T4V, T4W);
Chris@82 3352 T4Y = VADD(T4U, T4X);
Chris@82 3353 T5s = VSUB(T4U, T4X);
Chris@82 3354 {
Chris@82 3355 V T36, T3H, T4Z, T50;
Chris@82 3356 T36 = VFMA(LDK(KP881921264), T2W, VMUL(LDK(KP471396736), T35));
Chris@82 3357 T3H = VFNMS(LDK(KP471396736), T3G, VMUL(LDK(KP881921264), T3x));
Chris@82 3358 T3I = VADD(T36, T3H);
Chris@82 3359 T5t = VSUB(T36, T3H);
Chris@82 3360 T4Z = VFNMS(LDK(KP471396736), T2W, VMUL(LDK(KP881921264), T35));
Chris@82 3361 T50 = VFMA(LDK(KP471396736), T3x, VMUL(LDK(KP881921264), T3G));
Chris@82 3362 T51 = VADD(T4Z, T50);
Chris@82 3363 T5o = VSUB(T4Z, T50);
Chris@82 3364 }
Chris@82 3365 T4K = VSUB(T3I, T4J);
Chris@82 3366 T5B = VADD(T5s, T5t);
Chris@82 3367 T5E = VADD(T5p, T5o);
Chris@82 3368 T52 = VSUB(T4Y, T51);
Chris@82 3369 T59 = VADD(T4Y, T51);
Chris@82 3370 T5q = VSUB(T5o, T5p);
Chris@82 3371 T5u = VSUB(T5s, T5t);
Chris@82 3372 T5c = VADD(T4J, T3I);
Chris@82 3373 }
Chris@82 3374 {
Chris@82 3375 V T4L, T56, T5D, T5G;
Chris@82 3376 T4L = VBYI(VSUB(T2v, T4K));
Chris@82 3377 T56 = VSUB(T52, T55);
Chris@82 3378 ST(&(xo[WS(os, 37)]), VADD(T4L, T56), ovs, &(xo[WS(os, 1)]));
Chris@82 3379 ST(&(xo[WS(os, 91)]), VSUB(T56, T4L), ovs, &(xo[WS(os, 1)]));
Chris@82 3380 T5D = VADD(T5B, T5C);
Chris@82 3381 T5G = VBYI(VADD(T5E, T5F));
Chris@82 3382 ST(&(xo[WS(os, 117)]), VSUB(T5D, T5G), ovs, &(xo[WS(os, 1)]));
Chris@82 3383 ST(&(xo[WS(os, 11)]), VADD(T5D, T5G), ovs, &(xo[WS(os, 1)]));
Chris@82 3384 }
Chris@82 3385 {
Chris@82 3386 V T5H, T5I, T57, T58;
Chris@82 3387 T5H = VSUB(T5B, T5C);
Chris@82 3388 T5I = VBYI(VSUB(T5F, T5E));
Chris@82 3389 ST(&(xo[WS(os, 75)]), VSUB(T5H, T5I), ovs, &(xo[WS(os, 1)]));
Chris@82 3390 ST(&(xo[WS(os, 53)]), VADD(T5H, T5I), ovs, &(xo[WS(os, 1)]));
Chris@82 3391 T57 = VBYI(VADD(T4K, T2v));
Chris@82 3392 T58 = VADD(T52, T55);
Chris@82 3393 ST(&(xo[WS(os, 27)]), VADD(T57, T58), ovs, &(xo[WS(os, 1)]));
Chris@82 3394 ST(&(xo[WS(os, 101)]), VSUB(T58, T57), ovs, &(xo[WS(os, 1)]));
Chris@82 3395 }
Chris@82 3396 {
Chris@82 3397 V T5b, T5e, T5r, T5y;
Chris@82 3398 T5b = VADD(T59, T5a);
Chris@82 3399 T5e = VBYI(VADD(T5c, T5d));
Chris@82 3400 ST(&(xo[WS(os, 123)]), VSUB(T5b, T5e), ovs, &(xo[WS(os, 1)]));
Chris@82 3401 ST(&(xo[WS(os, 5)]), VADD(T5b, T5e), ovs, &(xo[WS(os, 1)]));
Chris@82 3402 T5r = VBYI(VSUB(T5n, T5q));
Chris@82 3403 T5y = VSUB(T5u, T5x);
Chris@82 3404 ST(&(xo[WS(os, 43)]), VADD(T5r, T5y), ovs, &(xo[WS(os, 1)]));
Chris@82 3405 ST(&(xo[WS(os, 85)]), VSUB(T5y, T5r), ovs, &(xo[WS(os, 1)]));
Chris@82 3406 }
Chris@82 3407 {
Chris@82 3408 V T5z, T5A, T5f, T5g;
Chris@82 3409 T5z = VBYI(VADD(T5q, T5n));
Chris@82 3410 T5A = VADD(T5u, T5x);
Chris@82 3411 ST(&(xo[WS(os, 21)]), VADD(T5z, T5A), ovs, &(xo[WS(os, 1)]));
Chris@82 3412 ST(&(xo[WS(os, 107)]), VSUB(T5A, T5z), ovs, &(xo[WS(os, 1)]));
Chris@82 3413 T5f = VSUB(T59, T5a);
Chris@82 3414 T5g = VBYI(VSUB(T5d, T5c));
Chris@82 3415 ST(&(xo[WS(os, 69)]), VSUB(T5f, T5g), ovs, &(xo[WS(os, 1)]));
Chris@82 3416 ST(&(xo[WS(os, 59)]), VADD(T5f, T5g), ovs, &(xo[WS(os, 1)]));
Chris@82 3417 }
Chris@82 3418 }
Chris@82 3419 {
Chris@82 3420 V T9i, T9B, T9t, T9x, T9O, Ta3, T9V, T9Z, T93, Ta0, Ta2, T9q, T9y, T9H, T9S;
Chris@82 3421 V T9A;
Chris@82 3422 {
Chris@82 3423 V T9a, T9r, T9h, T9s;
Chris@82 3424 {
Chris@82 3425 V T96, T99, T9d, T9g;
Chris@82 3426 T96 = VSUB(T94, T95);
Chris@82 3427 T99 = VSUB(T97, T98);
Chris@82 3428 T9a = VFMA(LDK(KP740951125), T96, VMUL(LDK(KP671558954), T99));
Chris@82 3429 T9r = VFNMS(LDK(KP671558954), T96, VMUL(LDK(KP740951125), T99));
Chris@82 3430 T9d = VSUB(T9b, T9c);
Chris@82 3431 T9g = VSUB(T9e, T9f);
Chris@82 3432 T9h = VFNMS(LDK(KP671558954), T9g, VMUL(LDK(KP740951125), T9d));
Chris@82 3433 T9s = VFMA(LDK(KP671558954), T9d, VMUL(LDK(KP740951125), T9g));
Chris@82 3434 }
Chris@82 3435 T9i = VSUB(T9a, T9h);
Chris@82 3436 T9B = VADD(T9r, T9s);
Chris@82 3437 T9t = VSUB(T9r, T9s);
Chris@82 3438 T9x = VADD(T9a, T9h);
Chris@82 3439 }
Chris@82 3440 {
Chris@82 3441 V T9K, T9T, T9N, T9U;
Chris@82 3442 {
Chris@82 3443 V T9I, T9J, T9L, T9M;
Chris@82 3444 T9I = VADD(T95, T94);
Chris@82 3445 T9J = VADD(T97, T98);
Chris@82 3446 T9K = VFMA(LDK(KP998795456), T9I, VMUL(LDK(KP049067674), T9J));
Chris@82 3447 T9T = VFNMS(LDK(KP049067674), T9I, VMUL(LDK(KP998795456), T9J));
Chris@82 3448 T9L = VADD(T9c, T9b);
Chris@82 3449 T9M = VADD(T9e, T9f);
Chris@82 3450 T9N = VFNMS(LDK(KP049067674), T9M, VMUL(LDK(KP998795456), T9L));
Chris@82 3451 T9U = VFMA(LDK(KP049067674), T9L, VMUL(LDK(KP998795456), T9M));
Chris@82 3452 }
Chris@82 3453 T9O = VSUB(T9K, T9N);
Chris@82 3454 Ta3 = VADD(T9T, T9U);
Chris@82 3455 T9V = VSUB(T9T, T9U);
Chris@82 3456 T9Z = VADD(T9K, T9N);
Chris@82 3457 }
Chris@82 3458 {
Chris@82 3459 V T8V, T9F, T9p, T9R, T92, T9Q, T9m, T9G, T8U, T9n;
Chris@82 3460 T8U = VADD(T7U, T7X);
Chris@82 3461 T8V = VSUB(T8T, T8U);
Chris@82 3462 T9F = VADD(T8T, T8U);
Chris@82 3463 T9n = VADD(T85, T86);
Chris@82 3464 T9p = VSUB(T9n, T9o);
Chris@82 3465 T9R = VADD(T9o, T9n);
Chris@82 3466 {
Chris@82 3467 V T8Y, T91, T9k, T9l;
Chris@82 3468 T8Y = VFMA(LDK(KP098017140), T8W, VMUL(LDK(KP995184726), T8X));
Chris@82 3469 T91 = VFNMS(LDK(KP098017140), T90, VMUL(LDK(KP995184726), T8Z));
Chris@82 3470 T92 = VSUB(T8Y, T91);
Chris@82 3471 T9Q = VADD(T8Y, T91);
Chris@82 3472 T9k = VFNMS(LDK(KP098017140), T8X, VMUL(LDK(KP995184726), T8W));
Chris@82 3473 T9l = VFMA(LDK(KP995184726), T90, VMUL(LDK(KP098017140), T8Z));
Chris@82 3474 T9m = VSUB(T9k, T9l);
Chris@82 3475 T9G = VADD(T9k, T9l);
Chris@82 3476 }
Chris@82 3477 T93 = VSUB(T8V, T92);
Chris@82 3478 Ta0 = VADD(T9R, T9Q);
Chris@82 3479 Ta2 = VADD(T9F, T9G);
Chris@82 3480 T9q = VSUB(T9m, T9p);
Chris@82 3481 T9y = VADD(T9p, T9m);
Chris@82 3482 T9H = VSUB(T9F, T9G);
Chris@82 3483 T9S = VSUB(T9Q, T9R);
Chris@82 3484 T9A = VADD(T8V, T92);
Chris@82 3485 }
Chris@82 3486 {
Chris@82 3487 V T9j, T9u, Ta1, Ta4;
Chris@82 3488 T9j = VADD(T93, T9i);
Chris@82 3489 T9u = VBYI(VADD(T9q, T9t));
Chris@82 3490 ST(&(xo[WS(os, 111)]), VSUB(T9j, T9u), ovs, &(xo[WS(os, 1)]));
Chris@82 3491 ST(&(xo[WS(os, 17)]), VADD(T9j, T9u), ovs, &(xo[WS(os, 1)]));
Chris@82 3492 Ta1 = VBYI(VSUB(T9Z, Ta0));
Chris@82 3493 Ta4 = VSUB(Ta2, Ta3);
Chris@82 3494 ST(&(xo[WS(os, 63)]), VADD(Ta1, Ta4), ovs, &(xo[WS(os, 1)]));
Chris@82 3495 ST(&(xo[WS(os, 65)]), VSUB(Ta4, Ta1), ovs, &(xo[WS(os, 1)]));
Chris@82 3496 }
Chris@82 3497 {
Chris@82 3498 V Ta5, Ta6, T9v, T9w;
Chris@82 3499 Ta5 = VBYI(VADD(Ta0, T9Z));
Chris@82 3500 Ta6 = VADD(Ta2, Ta3);
Chris@82 3501 ST(&(xo[WS(os, 1)]), VADD(Ta5, Ta6), ovs, &(xo[WS(os, 1)]));
Chris@82 3502 ST(&(xo[WS(os, 127)]), VSUB(Ta6, Ta5), ovs, &(xo[WS(os, 1)]));
Chris@82 3503 T9v = VSUB(T93, T9i);
Chris@82 3504 T9w = VBYI(VSUB(T9t, T9q));
Chris@82 3505 ST(&(xo[WS(os, 81)]), VSUB(T9v, T9w), ovs, &(xo[WS(os, 1)]));
Chris@82 3506 ST(&(xo[WS(os, 47)]), VADD(T9v, T9w), ovs, &(xo[WS(os, 1)]));
Chris@82 3507 }
Chris@82 3508 {
Chris@82 3509 V T9z, T9C, T9P, T9W;
Chris@82 3510 T9z = VBYI(VSUB(T9x, T9y));
Chris@82 3511 T9C = VSUB(T9A, T9B);
Chris@82 3512 ST(&(xo[WS(os, 49)]), VADD(T9z, T9C), ovs, &(xo[WS(os, 1)]));
Chris@82 3513 ST(&(xo[WS(os, 79)]), VSUB(T9C, T9z), ovs, &(xo[WS(os, 1)]));
Chris@82 3514 T9P = VADD(T9H, T9O);
Chris@82 3515 T9W = VBYI(VADD(T9S, T9V));
Chris@82 3516 ST(&(xo[WS(os, 97)]), VSUB(T9P, T9W), ovs, &(xo[WS(os, 1)]));
Chris@82 3517 ST(&(xo[WS(os, 31)]), VADD(T9P, T9W), ovs, &(xo[WS(os, 1)]));
Chris@82 3518 }
Chris@82 3519 {
Chris@82 3520 V T9X, T9Y, T9D, T9E;
Chris@82 3521 T9X = VSUB(T9H, T9O);
Chris@82 3522 T9Y = VBYI(VSUB(T9V, T9S));
Chris@82 3523 ST(&(xo[WS(os, 95)]), VSUB(T9X, T9Y), ovs, &(xo[WS(os, 1)]));
Chris@82 3524 ST(&(xo[WS(os, 33)]), VADD(T9X, T9Y), ovs, &(xo[WS(os, 1)]));
Chris@82 3525 T9D = VBYI(VADD(T9y, T9x));
Chris@82 3526 T9E = VADD(T9A, T9B);
Chris@82 3527 ST(&(xo[WS(os, 15)]), VADD(T9D, T9E), ovs, &(xo[WS(os, 1)]));
Chris@82 3528 ST(&(xo[WS(os, 113)]), VSUB(T9E, T9D), ovs, &(xo[WS(os, 1)]));
Chris@82 3529 }
Chris@82 3530 }
Chris@82 3531 {
Chris@82 3532 V T68, T6r, T6j, T6n, T6E, T6T, T6L, T6P, T5T, T6Q, T6S, T6g, T6o, T6x, T6I;
Chris@82 3533 V T6q;
Chris@82 3534 {
Chris@82 3535 V T60, T6h, T67, T6i;
Chris@82 3536 {
Chris@82 3537 V T5W, T5Z, T63, T66;
Chris@82 3538 T5W = VSUB(T5U, T5V);
Chris@82 3539 T5Z = VSUB(T5X, T5Y);
Chris@82 3540 T60 = VFMA(LDK(KP803207531), T5W, VMUL(LDK(KP595699304), T5Z));
Chris@82 3541 T6h = VFNMS(LDK(KP595699304), T5W, VMUL(LDK(KP803207531), T5Z));
Chris@82 3542 T63 = VSUB(T61, T62);
Chris@82 3543 T66 = VSUB(T64, T65);
Chris@82 3544 T67 = VFNMS(LDK(KP595699304), T66, VMUL(LDK(KP803207531), T63));
Chris@82 3545 T6i = VFMA(LDK(KP595699304), T63, VMUL(LDK(KP803207531), T66));
Chris@82 3546 }
Chris@82 3547 T68 = VSUB(T60, T67);
Chris@82 3548 T6r = VADD(T6h, T6i);
Chris@82 3549 T6j = VSUB(T6h, T6i);
Chris@82 3550 T6n = VADD(T60, T67);
Chris@82 3551 }
Chris@82 3552 {
Chris@82 3553 V T6A, T6J, T6D, T6K;
Chris@82 3554 {
Chris@82 3555 V T6y, T6z, T6B, T6C;
Chris@82 3556 T6y = VADD(T5V, T5U);
Chris@82 3557 T6z = VADD(T5X, T5Y);
Chris@82 3558 T6A = VFMA(LDK(KP989176509), T6y, VMUL(LDK(KP146730474), T6z));
Chris@82 3559 T6J = VFNMS(LDK(KP146730474), T6y, VMUL(LDK(KP989176509), T6z));
Chris@82 3560 T6B = VADD(T62, T61);
Chris@82 3561 T6C = VADD(T64, T65);
Chris@82 3562 T6D = VFNMS(LDK(KP146730474), T6C, VMUL(LDK(KP989176509), T6B));
Chris@82 3563 T6K = VFMA(LDK(KP146730474), T6B, VMUL(LDK(KP989176509), T6C));
Chris@82 3564 }
Chris@82 3565 T6E = VSUB(T6A, T6D);
Chris@82 3566 T6T = VADD(T6J, T6K);
Chris@82 3567 T6L = VSUB(T6J, T6K);
Chris@82 3568 T6P = VADD(T6A, T6D);
Chris@82 3569 }
Chris@82 3570 {
Chris@82 3571 V T5L, T6v, T6f, T6H, T5S, T6G, T6c, T6w, T5K, T6d;
Chris@82 3572 T5K = VADD(T4q, T4H);
Chris@82 3573 T5L = VSUB(T5J, T5K);
Chris@82 3574 T6v = VADD(T5J, T5K);
Chris@82 3575 T6d = VADD(T4V, T4W);
Chris@82 3576 T6f = VSUB(T6d, T6e);
Chris@82 3577 T6H = VADD(T6e, T6d);
Chris@82 3578 {
Chris@82 3579 V T5O, T5R, T6a, T6b;
Chris@82 3580 T5O = VFMA(LDK(KP956940335), T5M, VMUL(LDK(KP290284677), T5N));
Chris@82 3581 T5R = VFNMS(LDK(KP290284677), T5Q, VMUL(LDK(KP956940335), T5P));
Chris@82 3582 T5S = VSUB(T5O, T5R);
Chris@82 3583 T6G = VADD(T5O, T5R);
Chris@82 3584 T6a = VFNMS(LDK(KP290284677), T5M, VMUL(LDK(KP956940335), T5N));
Chris@82 3585 T6b = VFMA(LDK(KP290284677), T5P, VMUL(LDK(KP956940335), T5Q));
Chris@82 3586 T6c = VSUB(T6a, T6b);
Chris@82 3587 T6w = VADD(T6a, T6b);
Chris@82 3588 }
Chris@82 3589 T5T = VSUB(T5L, T5S);
Chris@82 3590 T6Q = VADD(T6H, T6G);
Chris@82 3591 T6S = VADD(T6v, T6w);
Chris@82 3592 T6g = VSUB(T6c, T6f);
Chris@82 3593 T6o = VADD(T6f, T6c);
Chris@82 3594 T6x = VSUB(T6v, T6w);
Chris@82 3595 T6I = VSUB(T6G, T6H);
Chris@82 3596 T6q = VADD(T5L, T5S);
Chris@82 3597 }
Chris@82 3598 {
Chris@82 3599 V T69, T6k, T6R, T6U;
Chris@82 3600 T69 = VADD(T5T, T68);
Chris@82 3601 T6k = VBYI(VADD(T6g, T6j));
Chris@82 3602 ST(&(xo[WS(os, 109)]), VSUB(T69, T6k), ovs, &(xo[WS(os, 1)]));
Chris@82 3603 ST(&(xo[WS(os, 19)]), VADD(T69, T6k), ovs, &(xo[WS(os, 1)]));
Chris@82 3604 T6R = VBYI(VSUB(T6P, T6Q));
Chris@82 3605 T6U = VSUB(T6S, T6T);
Chris@82 3606 ST(&(xo[WS(os, 61)]), VADD(T6R, T6U), ovs, &(xo[WS(os, 1)]));
Chris@82 3607 ST(&(xo[WS(os, 67)]), VSUB(T6U, T6R), ovs, &(xo[WS(os, 1)]));
Chris@82 3608 }
Chris@82 3609 {
Chris@82 3610 V T6V, T6W, T6l, T6m;
Chris@82 3611 T6V = VBYI(VADD(T6Q, T6P));
Chris@82 3612 T6W = VADD(T6S, T6T);
Chris@82 3613 ST(&(xo[WS(os, 3)]), VADD(T6V, T6W), ovs, &(xo[WS(os, 1)]));
Chris@82 3614 ST(&(xo[WS(os, 125)]), VSUB(T6W, T6V), ovs, &(xo[WS(os, 1)]));
Chris@82 3615 T6l = VSUB(T5T, T68);
Chris@82 3616 T6m = VBYI(VSUB(T6j, T6g));
Chris@82 3617 ST(&(xo[WS(os, 83)]), VSUB(T6l, T6m), ovs, &(xo[WS(os, 1)]));
Chris@82 3618 ST(&(xo[WS(os, 45)]), VADD(T6l, T6m), ovs, &(xo[WS(os, 1)]));
Chris@82 3619 }
Chris@82 3620 {
Chris@82 3621 V T6p, T6s, T6F, T6M;
Chris@82 3622 T6p = VBYI(VSUB(T6n, T6o));
Chris@82 3623 T6s = VSUB(T6q, T6r);
Chris@82 3624 ST(&(xo[WS(os, 51)]), VADD(T6p, T6s), ovs, &(xo[WS(os, 1)]));
Chris@82 3625 ST(&(xo[WS(os, 77)]), VSUB(T6s, T6p), ovs, &(xo[WS(os, 1)]));
Chris@82 3626 T6F = VADD(T6x, T6E);
Chris@82 3627 T6M = VBYI(VADD(T6I, T6L));
Chris@82 3628 ST(&(xo[WS(os, 99)]), VSUB(T6F, T6M), ovs, &(xo[WS(os, 1)]));
Chris@82 3629 ST(&(xo[WS(os, 29)]), VADD(T6F, T6M), ovs, &(xo[WS(os, 1)]));
Chris@82 3630 }
Chris@82 3631 {
Chris@82 3632 V T6N, T6O, T6t, T6u;
Chris@82 3633 T6N = VSUB(T6x, T6E);
Chris@82 3634 T6O = VBYI(VSUB(T6L, T6I));
Chris@82 3635 ST(&(xo[WS(os, 93)]), VSUB(T6N, T6O), ovs, &(xo[WS(os, 1)]));
Chris@82 3636 ST(&(xo[WS(os, 35)]), VADD(T6N, T6O), ovs, &(xo[WS(os, 1)]));
Chris@82 3637 T6t = VBYI(VADD(T6o, T6n));
Chris@82 3638 T6u = VADD(T6q, T6r);
Chris@82 3639 ST(&(xo[WS(os, 13)]), VADD(T6t, T6u), ovs, &(xo[WS(os, 1)]));
Chris@82 3640 ST(&(xo[WS(os, 115)]), VSUB(T6u, T6t), ovs, &(xo[WS(os, 1)]));
Chris@82 3641 }
Chris@82 3642 }
Chris@82 3643 }
Chris@82 3644 }
Chris@82 3645 VLEAVE();
Chris@82 3646 }
Chris@82 3647
/*
 * Descriptor for this codelet, handed to kdft_register by the registration
 * function that follows. Its initializer carries, in order: the value 128,
 * the name string "n1bv_128" (wrapped in XSIMD_STRING), the four-element
 * list {938, 186, 144, 0}, the address of GENUS, and four trailing zeros.
 * NOTE(review): the four-element list is presumably the operation counts
 * (adds, muls, fused multiply-adds, other) and the trailing zeros presumably
 * mean "no stride constraints" -- confirm against the kdft_desc definition.
 */
Chris@82 3648 static const kdft_desc desc = { 128, XSIMD_STRING("n1bv_128"), {938, 186, 144, 0}, &GENUS, 0, 0, 0, 0 };
Chris@82 3649
/*
 * Registration entry point for this codelet: forwards the planner `p`, the
 * n1bv_128 codelet function, and the address of `desc` to kdft_register.
 * NOTE(review): XSIMD(...) and X(...) look like project name-mangling macros;
 * the exact exported symbol name depends on their definitions -- confirm.
 */
Chris@82 3650 void XSIMD(codelet_n1bv_128) (planner *p) {
Chris@82 3651 X(kdft_register) (p, n1bv_128, &desc);
Chris@82 3652 }
Chris@82 3653
Chris@82 3654 #endif