annotate src/fftw-3.3.5/rdft/scalar/r2cf/r2cf_128.c @ 83:ae30d91d2ffe

Replace these with versions built using an older toolset (so as to avoid ABI compatibilities when linking on Ubuntu 14.04 for packaging purposes)
author Chris Cannam
date Fri, 07 Feb 2020 11:51:13 +0000
parents 2cd0e3b3e1fd
children
rev   line source
Chris@42 1 /*
Chris@42 2 * Copyright (c) 2003, 2007-14 Matteo Frigo
Chris@42 3 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
Chris@42 4 *
Chris@42 5 * This program is free software; you can redistribute it and/or modify
Chris@42 6 * it under the terms of the GNU General Public License as published by
Chris@42 7 * the Free Software Foundation; either version 2 of the License, or
Chris@42 8 * (at your option) any later version.
Chris@42 9 *
Chris@42 10 * This program is distributed in the hope that it will be useful,
Chris@42 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Chris@42 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
Chris@42 13 * GNU General Public License for more details.
Chris@42 14 *
Chris@42 15 * You should have received a copy of the GNU General Public License
Chris@42 16 * along with this program; if not, write to the Free Software
Chris@42 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Chris@42 18 *
Chris@42 19 */
Chris@42 20
Chris@42 21 /* This file was automatically generated --- DO NOT EDIT */
Chris@42 22 /* Generated on Sat Jul 30 16:46:09 EDT 2016 */
Chris@42 23
Chris@42 24 #include "codelet-rdft.h"
Chris@42 25
Chris@42 26 #ifdef HAVE_FMA
Chris@42 27
Chris@42 28 /* Generated by: ../../../genfft/gen_r2cf.native -fma -reorder-insns -schedule-for-pipeline -compact -variables 4 -pipeline-latency 4 -n 128 -name r2cf_128 -include r2cf.h */
Chris@42 29
Chris@42 30 /*
Chris@42 31 * This function contains 956 FP additions, 516 FP multiplications,
Chris@42 32 * (or, 440 additions, 0 multiplications, 516 fused multiply/add),
Chris@42 33 * 229 stack variables, 31 constants, and 256 memory accesses
Chris@42 34 */
Chris@42 35 #include "r2cf.h"
Chris@42 36
Chris@42 37 static void r2cf_128(R *R0, R *R1, R *Cr, R *Ci, stride rs, stride csr, stride csi, INT v, INT ivs, INT ovs)
Chris@42 38 {
Chris@42 39 DK(KP989176509, +0.989176509964780973451673738016243063983689533);
Chris@42 40 DK(KP803207531, +0.803207531480644909806676512963141923879569427);
Chris@42 41 DK(KP148335987, +0.148335987538347428753676511486911367000625355);
Chris@42 42 DK(KP741650546, +0.741650546272035369581266691172079863842265220);
Chris@42 43 DK(KP998795456, +0.998795456205172392714771604759100694443203615);
Chris@42 44 DK(KP740951125, +0.740951125354959091175616897495162729728955309);
Chris@42 45 DK(KP049126849, +0.049126849769467254105343321271313617079695752);
Chris@42 46 DK(KP906347169, +0.906347169019147157946142717268914412664134293);
Chris@42 47 DK(KP857728610, +0.857728610000272069902269984284770137042490799);
Chris@42 48 DK(KP970031253, +0.970031253194543992603984207286100251456865962);
Chris@42 49 DK(KP599376933, +0.599376933681923766271389869014404232837890546);
Chris@42 50 DK(KP250486960, +0.250486960191305461595702160124721208578685568);
Chris@42 51 DK(KP941544065, +0.941544065183020778412509402599502357185589796);
Chris@42 52 DK(KP903989293, +0.903989293123443331586200297230537048710132025);
Chris@42 53 DK(KP472964775, +0.472964775891319928124438237972992463904131113);
Chris@42 54 DK(KP357805721, +0.357805721314524104672487743774474392487532769);
Chris@42 55 DK(KP773010453, +0.773010453362736960810906609758469800971041293);
Chris@42 56 DK(KP995184726, +0.995184726672196886244836953109479921575474869);
Chris@42 57 DK(KP098491403, +0.098491403357164253077197521291327432293052451);
Chris@42 58 DK(KP820678790, +0.820678790828660330972281985331011598767386482);
Chris@42 59 DK(KP956940335, +0.956940335732208864935797886980269969482849206);
Chris@42 60 DK(KP881921264, +0.881921264348355029712756863660388349508442621);
Chris@42 61 DK(KP534511135, +0.534511135950791641089685961295362908582039528);
Chris@42 62 DK(KP303346683, +0.303346683607342391675883946941299872384187453);
Chris@42 63 DK(KP831469612, +0.831469612302545237078788377617905756738560812);
Chris@42 64 DK(KP980785280, +0.980785280403230449126182236134239036973933731);
Chris@42 65 DK(KP923879532, +0.923879532511286756128183189396788286822416626);
Chris@42 66 DK(KP198912367, +0.198912367379658006911597622644676228597850501);
Chris@42 67 DK(KP668178637, +0.668178637919298919997757686523080761552472251);
Chris@42 68 DK(KP414213562, +0.414213562373095048801688724209698078569671875);
Chris@42 69 DK(KP707106781, +0.707106781186547524400844362104849039284835938);
Chris@42 70 {
Chris@42 71 INT i;
Chris@42 72 for (i = v; i > 0; i = i - 1, R0 = R0 + ivs, R1 = R1 + ivs, Cr = Cr + ovs, Ci = Ci + ovs, MAKE_VOLATILE_STRIDE(512, rs), MAKE_VOLATILE_STRIDE(512, csr), MAKE_VOLATILE_STRIDE(512, csi)) {
Chris@42 73 E T95, T96;
Chris@42 74 {
Chris@42 75 E TcD, TdR, T5P, T8v, T27, T7r, Tf, Ta5, T7s, T5S, T8w, T2e, TdS, TcG, Tbn;
Chris@42 76 E Tu, TcK, TdU, TK, Ta6, T7w, T8y, T2o, T5U, TcN, TdV, TZ, Ta7, T7z, T8z;
Chris@42 77 E T2x, T5V, T1g, Taa, Tab, T1v, Tew, TcX, Tex, TcU, T6A, T2M, T9b, T7E, T9a;
Chris@42 78 E T7H, T6z, T2T, TeO, TdK, TeL, Tdz, T9p, T8d, T6O, T5G, T6L, T4X, Tc3, TaV;
Chris@42 79 E Tc4, Tbi, T9s, T8o, TeH, Tdp, TeE, Tde, T9i, T7U, T6H, T4r, T6E, T3I, TbW;
Chris@42 80 E Tao, TbX, TaL, T9l, T85, T1L, Tad, Tae, T20, Tez, Td6, TeA, Td3, T6x, T37;
Chris@42 81 E T9e, T7L, T9d, T7O, T6w, T3e, TbZ, T3Z, T4s, Tc0, TeF, Tds, T4t, T4g, T87;
Chris@42 82 E T80, TeI, Tdl, T86, T7X, TaM, TaD, Tb2, Tc6, T8e, T8f, T5e, T5H, Tb9, Tc7;
Chris@42 83 E TeM, TdN, T5I, T5v, T8q, T8j, TeP, TdG;
Chris@42 84 {
Chris@42 85 E T7G, T2S, T2P, T7F;
Chris@42 86 {
Chris@42 87 E T28, Ti, Tn, T2c, Ts, T29, Tl, To;
Chris@42 88 {
Chris@42 89 E T4, T23, T3, T25, Td, T5, T8, T9;
Chris@42 90 {
Chris@42 91 E T1, T2, Tb, Tc;
Chris@42 92 T1 = R0[0];
Chris@42 93 T2 = R0[WS(rs, 32)];
Chris@42 94 Tb = R0[WS(rs, 56)];
Chris@42 95 Tc = R0[WS(rs, 24)];
Chris@42 96 T4 = R0[WS(rs, 16)];
Chris@42 97 T23 = T1 - T2;
Chris@42 98 T3 = T1 + T2;
Chris@42 99 T25 = Tb - Tc;
Chris@42 100 Td = Tb + Tc;
Chris@42 101 T5 = R0[WS(rs, 48)];
Chris@42 102 T8 = R0[WS(rs, 8)];
Chris@42 103 T9 = R0[WS(rs, 40)];
Chris@42 104 }
Chris@42 105 {
Chris@42 106 E Tq, Tr, Tj, Tk;
Chris@42 107 {
Chris@42 108 E Tg, T5N, T6, T24, Ta, Th;
Chris@42 109 Tg = R0[WS(rs, 4)];
Chris@42 110 T5N = T4 - T5;
Chris@42 111 T6 = T4 + T5;
Chris@42 112 T24 = T8 - T9;
Chris@42 113 Ta = T8 + T9;
Chris@42 114 Th = R0[WS(rs, 36)];
Chris@42 115 {
Chris@42 116 E T7, T26, T5O, Te;
Chris@42 117 TcD = T3 - T6;
Chris@42 118 T7 = T3 + T6;
Chris@42 119 T26 = T24 + T25;
Chris@42 120 T5O = T25 - T24;
Chris@42 121 TdR = Td - Ta;
Chris@42 122 Te = Ta + Td;
Chris@42 123 T5P = FNMS(KP707106781, T5O, T5N);
Chris@42 124 T8v = FMA(KP707106781, T5O, T5N);
Chris@42 125 T27 = FMA(KP707106781, T26, T23);
Chris@42 126 T7r = FNMS(KP707106781, T26, T23);
Chris@42 127 Tf = T7 + Te;
Chris@42 128 Ta5 = T7 - Te;
Chris@42 129 T28 = Tg - Th;
Chris@42 130 Ti = Tg + Th;
Chris@42 131 }
Chris@42 132 }
Chris@42 133 Tq = R0[WS(rs, 12)];
Chris@42 134 Tr = R0[WS(rs, 44)];
Chris@42 135 Tj = R0[WS(rs, 20)];
Chris@42 136 Tk = R0[WS(rs, 52)];
Chris@42 137 Tn = R0[WS(rs, 60)];
Chris@42 138 T2c = Tq - Tr;
Chris@42 139 Ts = Tq + Tr;
Chris@42 140 T29 = Tj - Tk;
Chris@42 141 Tl = Tj + Tk;
Chris@42 142 To = R0[WS(rs, 28)];
Chris@42 143 }
Chris@42 144 }
Chris@42 145 {
Chris@42 146 E T2g, T2l, T2h, TF, TcI, TC, T2i, TI;
Chris@42 147 {
Chris@42 148 E Ty, TG, TB, TH;
Chris@42 149 {
Chris@42 150 E Tw, T5Q, T2a, TcE, Tm, T2b, Tp, Tx;
Chris@42 151 Tw = R0[WS(rs, 2)];
Chris@42 152 T5Q = FMA(KP414213562, T28, T29);
Chris@42 153 T2a = FNMS(KP414213562, T29, T28);
Chris@42 154 TcE = Ti - Tl;
Chris@42 155 Tm = Ti + Tl;
Chris@42 156 T2b = Tn - To;
Chris@42 157 Tp = Tn + To;
Chris@42 158 Tx = R0[WS(rs, 34)];
Chris@42 159 {
Chris@42 160 E Tz, TA, TD, TE;
Chris@42 161 Tz = R0[WS(rs, 18)];
Chris@42 162 {
Chris@42 163 E T5R, T2d, TcF, Tt;
Chris@42 164 T5R = FNMS(KP414213562, T2b, T2c);
Chris@42 165 T2d = FMA(KP414213562, T2c, T2b);
Chris@42 166 TcF = Tp - Ts;
Chris@42 167 Tt = Tp + Ts;
Chris@42 168 T2g = Tw - Tx;
Chris@42 169 Ty = Tw + Tx;
Chris@42 170 T7s = T5Q - T5R;
Chris@42 171 T5S = T5Q + T5R;
Chris@42 172 T8w = T2d - T2a;
Chris@42 173 T2e = T2a + T2d;
Chris@42 174 TdS = TcF - TcE;
Chris@42 175 TcG = TcE + TcF;
Chris@42 176 Tbn = Tt - Tm;
Chris@42 177 Tu = Tm + Tt;
Chris@42 178 TA = R0[WS(rs, 50)];
Chris@42 179 }
Chris@42 180 TD = R0[WS(rs, 10)];
Chris@42 181 TE = R0[WS(rs, 42)];
Chris@42 182 TG = R0[WS(rs, 58)];
Chris@42 183 T2l = Tz - TA;
Chris@42 184 TB = Tz + TA;
Chris@42 185 T2h = TD - TE;
Chris@42 186 TF = TD + TE;
Chris@42 187 TH = R0[WS(rs, 26)];
Chris@42 188 }
Chris@42 189 }
Chris@42 190 TcI = Ty - TB;
Chris@42 191 TC = Ty + TB;
Chris@42 192 T2i = TG - TH;
Chris@42 193 TI = TG + TH;
Chris@42 194 }
Chris@42 195 {
Chris@42 196 E T2p, T2u, T2q, TU, TcL, TR, T2r, TX;
Chris@42 197 {
Chris@42 198 E TN, TV, TQ, TW;
Chris@42 199 {
Chris@42 200 E T2k, T7u, T2n, T7v, TL, TM;
Chris@42 201 TL = R0[WS(rs, 62)];
Chris@42 202 TM = R0[WS(rs, 30)];
Chris@42 203 {
Chris@42 204 E TJ, TcJ, T2m, T2j;
Chris@42 205 TJ = TF + TI;
Chris@42 206 TcJ = TI - TF;
Chris@42 207 T2m = T2h - T2i;
Chris@42 208 T2j = T2h + T2i;
Chris@42 209 TcK = FMA(KP414213562, TcJ, TcI);
Chris@42 210 TdU = FNMS(KP414213562, TcI, TcJ);
Chris@42 211 TK = TC + TJ;
Chris@42 212 Ta6 = TC - TJ;
Chris@42 213 T2k = FMA(KP707106781, T2j, T2g);
Chris@42 214 T7u = FNMS(KP707106781, T2j, T2g);
Chris@42 215 T2n = FMA(KP707106781, T2m, T2l);
Chris@42 216 T7v = FNMS(KP707106781, T2m, T2l);
Chris@42 217 T2p = TL - TM;
Chris@42 218 TN = TL + TM;
Chris@42 219 }
Chris@42 220 T7w = FMA(KP668178637, T7v, T7u);
Chris@42 221 T8y = FNMS(KP668178637, T7u, T7v);
Chris@42 222 T2o = FNMS(KP198912367, T2n, T2k);
Chris@42 223 T5U = FMA(KP198912367, T2k, T2n);
Chris@42 224 {
Chris@42 225 E TO, TP, TS, TT;
Chris@42 226 TO = R0[WS(rs, 14)];
Chris@42 227 TP = R0[WS(rs, 46)];
Chris@42 228 TS = R0[WS(rs, 6)];
Chris@42 229 TT = R0[WS(rs, 38)];
Chris@42 230 TV = R0[WS(rs, 54)];
Chris@42 231 T2u = TO - TP;
Chris@42 232 TQ = TO + TP;
Chris@42 233 T2q = TS - TT;
Chris@42 234 TU = TS + TT;
Chris@42 235 TW = R0[WS(rs, 22)];
Chris@42 236 }
Chris@42 237 }
Chris@42 238 TcL = TN - TQ;
Chris@42 239 TR = TN + TQ;
Chris@42 240 T2r = TV - TW;
Chris@42 241 TX = TV + TW;
Chris@42 242 }
Chris@42 243 {
Chris@42 244 E T2A, T14, T2N, T17, T1b, T1e, T2D, T2O, T1r, T2I, T1q, T2Q, T2H, TcR, T1n;
Chris@42 245 E T1s, T15, T16;
Chris@42 246 {
Chris@42 247 E T2t, T7x, T2w, T7y, T12, T13;
Chris@42 248 T12 = R0[WS(rs, 1)];
Chris@42 249 T13 = R0[WS(rs, 33)];
Chris@42 250 {
Chris@42 251 E TY, TcM, T2v, T2s;
Chris@42 252 TY = TU + TX;
Chris@42 253 TcM = TX - TU;
Chris@42 254 T2v = T2q - T2r;
Chris@42 255 T2s = T2q + T2r;
Chris@42 256 TcN = FNMS(KP414213562, TcM, TcL);
Chris@42 257 TdV = FMA(KP414213562, TcL, TcM);
Chris@42 258 TZ = TR + TY;
Chris@42 259 Ta7 = TR - TY;
Chris@42 260 T2t = FMA(KP707106781, T2s, T2p);
Chris@42 261 T7x = FNMS(KP707106781, T2s, T2p);
Chris@42 262 T2w = FMA(KP707106781, T2v, T2u);
Chris@42 263 T7y = FNMS(KP707106781, T2v, T2u);
Chris@42 264 T2A = T12 - T13;
Chris@42 265 T14 = T12 + T13;
Chris@42 266 }
Chris@42 267 T7z = FNMS(KP668178637, T7y, T7x);
Chris@42 268 T8z = FMA(KP668178637, T7x, T7y);
Chris@42 269 T2x = FMA(KP198912367, T2w, T2t);
Chris@42 270 T5V = FNMS(KP198912367, T2t, T2w);
Chris@42 271 T15 = R0[WS(rs, 17)];
Chris@42 272 T16 = R0[WS(rs, 49)];
Chris@42 273 }
Chris@42 274 {
Chris@42 275 E T1c, T2B, T1d, T19, T1a;
Chris@42 276 T19 = R0[WS(rs, 9)];
Chris@42 277 T1a = R0[WS(rs, 41)];
Chris@42 278 T1c = R0[WS(rs, 57)];
Chris@42 279 T2N = T15 - T16;
Chris@42 280 T17 = T15 + T16;
Chris@42 281 T2B = T19 - T1a;
Chris@42 282 T1b = T19 + T1a;
Chris@42 283 T1d = R0[WS(rs, 25)];
Chris@42 284 {
Chris@42 285 E T1k, T2F, T1j, T1l, T1h, T1i, T2C;
Chris@42 286 T1h = R0[WS(rs, 5)];
Chris@42 287 T1i = R0[WS(rs, 37)];
Chris@42 288 T2C = T1c - T1d;
Chris@42 289 T1e = T1c + T1d;
Chris@42 290 T1k = R0[WS(rs, 21)];
Chris@42 291 T2F = T1h - T1i;
Chris@42 292 T1j = T1h + T1i;
Chris@42 293 T2D = T2B + T2C;
Chris@42 294 T2O = T2B - T2C;
Chris@42 295 T1l = R0[WS(rs, 53)];
Chris@42 296 {
Chris@42 297 E T1o, T1p, T2G, T1m;
Chris@42 298 T1o = R0[WS(rs, 61)];
Chris@42 299 T1p = R0[WS(rs, 29)];
Chris@42 300 T1r = R0[WS(rs, 13)];
Chris@42 301 T2G = T1k - T1l;
Chris@42 302 T1m = T1k + T1l;
Chris@42 303 T2I = T1o - T1p;
Chris@42 304 T1q = T1o + T1p;
Chris@42 305 T2Q = FMA(KP414213562, T2F, T2G);
Chris@42 306 T2H = FNMS(KP414213562, T2G, T2F);
Chris@42 307 TcR = T1j - T1m;
Chris@42 308 T1n = T1j + T1m;
Chris@42 309 T1s = R0[WS(rs, 45)];
Chris@42 310 }
Chris@42 311 }
Chris@42 312 }
Chris@42 313 {
Chris@42 314 E TcQ, TcV, T2K, T2R, T1u, TcT, TcW, TcS;
Chris@42 315 {
Chris@42 316 E T18, T1f, T1t, T2J;
Chris@42 317 T18 = T14 + T17;
Chris@42 318 TcQ = T14 - T17;
Chris@42 319 TcV = T1e - T1b;
Chris@42 320 T1f = T1b + T1e;
Chris@42 321 T1t = T1r + T1s;
Chris@42 322 T2J = T1r - T1s;
Chris@42 323 T1g = T18 + T1f;
Chris@42 324 Taa = T18 - T1f;
Chris@42 325 T2K = FMA(KP414213562, T2J, T2I);
Chris@42 326 T2R = FNMS(KP414213562, T2I, T2J);
Chris@42 327 T1u = T1q + T1t;
Chris@42 328 TcS = T1q - T1t;
Chris@42 329 }
Chris@42 330 TcT = TcR + TcS;
Chris@42 331 TcW = TcS - TcR;
Chris@42 332 {
Chris@42 333 E T7C, T2E, T2L, T7D;
Chris@42 334 T7C = FNMS(KP707106781, T2D, T2A);
Chris@42 335 T2E = FMA(KP707106781, T2D, T2A);
Chris@42 336 Tab = T1u - T1n;
Chris@42 337 T1v = T1n + T1u;
Chris@42 338 Tew = FNMS(KP707106781, TcW, TcV);
Chris@42 339 TcX = FMA(KP707106781, TcW, TcV);
Chris@42 340 Tex = FNMS(KP707106781, TcT, TcQ);
Chris@42 341 TcU = FMA(KP707106781, TcT, TcQ);
Chris@42 342 T2L = T2H + T2K;
Chris@42 343 T7G = T2K - T2H;
Chris@42 344 T7D = T2Q - T2R;
Chris@42 345 T2S = T2Q + T2R;
Chris@42 346 T2P = FMA(KP707106781, T2O, T2N);
Chris@42 347 T7F = FNMS(KP707106781, T2O, T2N);
Chris@42 348 T6A = FNMS(KP923879532, T2L, T2E);
Chris@42 349 T2M = FMA(KP923879532, T2L, T2E);
Chris@42 350 T9b = FNMS(KP923879532, T7D, T7C);
Chris@42 351 T7E = FMA(KP923879532, T7D, T7C);
Chris@42 352 }
Chris@42 353 }
Chris@42 354 }
Chris@42 355 }
Chris@42 356 }
Chris@42 357 }
Chris@42 358 {
Chris@42 359 E T83, T84, T8m, T8n;
Chris@42 360 {
Chris@42 361 E TaP, T4z, TaQ, T5A, TaS, TaT, T4G, T5B, T4O, T5D, Tbh, Tdw, T4R, Tbc, T4S;
Chris@42 362 E T4T;
Chris@42 363 {
Chris@42 364 E T4x, T4y, T5y, T5z;
Chris@42 365 T4x = R1[WS(rs, 63)];
Chris@42 366 T9a = FNMS(KP923879532, T7G, T7F);
Chris@42 367 T7H = FMA(KP923879532, T7G, T7F);
Chris@42 368 T6z = FNMS(KP923879532, T2S, T2P);
Chris@42 369 T2T = FMA(KP923879532, T2S, T2P);
Chris@42 370 T4y = R1[WS(rs, 31)];
Chris@42 371 T5y = R1[WS(rs, 47)];
Chris@42 372 T5z = R1[WS(rs, 15)];
Chris@42 373 {
Chris@42 374 E T4A, T4B, T4D, T4E;
Chris@42 375 T4A = R1[WS(rs, 7)];
Chris@42 376 TaP = T4x + T4y;
Chris@42 377 T4z = T4x - T4y;
Chris@42 378 TaQ = T5z + T5y;
Chris@42 379 T5A = T5y - T5z;
Chris@42 380 T4B = R1[WS(rs, 39)];
Chris@42 381 T4D = R1[WS(rs, 55)];
Chris@42 382 T4E = R1[WS(rs, 23)];
Chris@42 383 {
Chris@42 384 E T4K, Tbf, Tbg, T4N, T4P, T4Q;
Chris@42 385 {
Chris@42 386 E T4I, T4C, T4F, T4J, T4L, T4M;
Chris@42 387 T4I = R1[WS(rs, 3)];
Chris@42 388 TaS = T4A + T4B;
Chris@42 389 T4C = T4A - T4B;
Chris@42 390 TaT = T4D + T4E;
Chris@42 391 T4F = T4D - T4E;
Chris@42 392 T4J = R1[WS(rs, 35)];
Chris@42 393 T4L = R1[WS(rs, 51)];
Chris@42 394 T4M = R1[WS(rs, 19)];
Chris@42 395 T4G = T4C + T4F;
Chris@42 396 T5B = T4F - T4C;
Chris@42 397 T4K = T4I - T4J;
Chris@42 398 Tbf = T4I + T4J;
Chris@42 399 Tbg = T4M + T4L;
Chris@42 400 T4N = T4L - T4M;
Chris@42 401 }
Chris@42 402 T4P = R1[WS(rs, 59)];
Chris@42 403 T4Q = R1[WS(rs, 27)];
Chris@42 404 T4O = FMA(KP414213562, T4N, T4K);
Chris@42 405 T5D = FNMS(KP414213562, T4K, T4N);
Chris@42 406 Tbh = Tbf + Tbg;
Chris@42 407 Tdw = Tbf - Tbg;
Chris@42 408 T4R = T4P - T4Q;
Chris@42 409 Tbc = T4P + T4Q;
Chris@42 410 T4S = R1[WS(rs, 43)];
Chris@42 411 T4T = R1[WS(rs, 11)];
Chris@42 412 }
Chris@42 413 }
Chris@42 414 }
Chris@42 415 {
Chris@42 416 E T4H, T8b, TaR, Tdv, TdI, TaU, T4U, Tbd, T5C;
Chris@42 417 T4H = FMA(KP707106781, T4G, T4z);
Chris@42 418 T8b = FNMS(KP707106781, T4G, T4z);
Chris@42 419 TaR = TaP + TaQ;
Chris@42 420 Tdv = TaP - TaQ;
Chris@42 421 TdI = TaT - TaS;
Chris@42 422 TaU = TaS + TaT;
Chris@42 423 T4U = T4S - T4T;
Chris@42 424 Tbd = T4T + T4S;
Chris@42 425 T8m = FNMS(KP707106781, T5B, T5A);
Chris@42 426 T5C = FMA(KP707106781, T5B, T5A);
Chris@42 427 {
Chris@42 428 E Tbe, Tdx, T5E, T4V;
Chris@42 429 Tbe = Tbc + Tbd;
Chris@42 430 Tdx = Tbc - Tbd;
Chris@42 431 T5E = FMA(KP414213562, T4R, T4U);
Chris@42 432 T4V = FNMS(KP414213562, T4U, T4R);
Chris@42 433 {
Chris@42 434 E Tdy, TdJ, T5F, T8c, T4W;
Chris@42 435 Tdy = Tdw + Tdx;
Chris@42 436 TdJ = Tdx - Tdw;
Chris@42 437 T5F = T5D + T5E;
Chris@42 438 T8c = T5E - T5D;
Chris@42 439 T8n = T4V - T4O;
Chris@42 440 T4W = T4O + T4V;
Chris@42 441 TeO = FNMS(KP707106781, TdJ, TdI);
Chris@42 442 TdK = FMA(KP707106781, TdJ, TdI);
Chris@42 443 TeL = FNMS(KP707106781, Tdy, Tdv);
Chris@42 444 Tdz = FMA(KP707106781, Tdy, Tdv);
Chris@42 445 T9p = FNMS(KP923879532, T8c, T8b);
Chris@42 446 T8d = FMA(KP923879532, T8c, T8b);
Chris@42 447 T6O = FNMS(KP923879532, T5F, T5C);
Chris@42 448 T5G = FMA(KP923879532, T5F, T5C);
Chris@42 449 T6L = FNMS(KP923879532, T4W, T4H);
Chris@42 450 T4X = FMA(KP923879532, T4W, T4H);
Chris@42 451 }
Chris@42 452 Tc3 = TaR + TaU;
Chris@42 453 TaV = TaR - TaU;
Chris@42 454 Tc4 = Tbh + Tbe;
Chris@42 455 Tbi = Tbe - Tbh;
Chris@42 456 }
Chris@42 457 }
Chris@42 458 }
Chris@42 459 {
Chris@42 460 E Tai, T3k, Taj, T4l, Tal, Tam, T4m, T3r, T3D, TaF, T3C, Tdb, TaK, T3z, T4o;
Chris@42 461 E T3E;
Chris@42 462 {
Chris@42 463 E T4j, T4k, T3i, T3j;
Chris@42 464 T3i = R1[0];
Chris@42 465 T3j = R1[WS(rs, 32)];
Chris@42 466 T4j = R1[WS(rs, 16)];
Chris@42 467 T9s = FMA(KP923879532, T8n, T8m);
Chris@42 468 T8o = FNMS(KP923879532, T8n, T8m);
Chris@42 469 Tai = T3i + T3j;
Chris@42 470 T3k = T3i - T3j;
Chris@42 471 T4k = R1[WS(rs, 48)];
Chris@42 472 {
Chris@42 473 E T3o, T3n, T3p, T3l, T3m;
Chris@42 474 T3l = R1[WS(rs, 8)];
Chris@42 475 T3m = R1[WS(rs, 40)];
Chris@42 476 T3o = R1[WS(rs, 56)];
Chris@42 477 Taj = T4j + T4k;
Chris@42 478 T4l = T4j - T4k;
Chris@42 479 T3n = T3l - T3m;
Chris@42 480 Tal = T3l + T3m;
Chris@42 481 T3p = R1[WS(rs, 24)];
Chris@42 482 {
Chris@42 483 E T3w, TaI, T3v, T3x, T3t, T3u, T3q;
Chris@42 484 T3t = R1[WS(rs, 4)];
Chris@42 485 T3u = R1[WS(rs, 36)];
Chris@42 486 T3q = T3o - T3p;
Chris@42 487 Tam = T3o + T3p;
Chris@42 488 T3w = R1[WS(rs, 20)];
Chris@42 489 TaI = T3t + T3u;
Chris@42 490 T3v = T3t - T3u;
Chris@42 491 T4m = T3n - T3q;
Chris@42 492 T3r = T3n + T3q;
Chris@42 493 T3x = R1[WS(rs, 52)];
Chris@42 494 {
Chris@42 495 E T3A, T3B, TaJ, T3y;
Chris@42 496 T3A = R1[WS(rs, 60)];
Chris@42 497 T3B = R1[WS(rs, 28)];
Chris@42 498 T3D = R1[WS(rs, 12)];
Chris@42 499 TaJ = T3w + T3x;
Chris@42 500 T3y = T3w - T3x;
Chris@42 501 TaF = T3A + T3B;
Chris@42 502 T3C = T3A - T3B;
Chris@42 503 Tdb = TaI - TaJ;
Chris@42 504 TaK = TaI + TaJ;
Chris@42 505 T3z = FNMS(KP414213562, T3y, T3v);
Chris@42 506 T4o = FMA(KP414213562, T3v, T3y);
Chris@42 507 T3E = R1[WS(rs, 44)];
Chris@42 508 }
Chris@42 509 }
Chris@42 510 }
Chris@42 511 }
Chris@42 512 {
Chris@42 513 E T3s, T7S, Tak, Tda, Tdn, Tan, T3F, TaG, T4n;
Chris@42 514 T3s = FMA(KP707106781, T3r, T3k);
Chris@42 515 T7S = FNMS(KP707106781, T3r, T3k);
Chris@42 516 Tak = Tai + Taj;
Chris@42 517 Tda = Tai - Taj;
Chris@42 518 Tdn = Tam - Tal;
Chris@42 519 Tan = Tal + Tam;
Chris@42 520 T3F = T3D - T3E;
Chris@42 521 TaG = T3D + T3E;
Chris@42 522 T83 = FNMS(KP707106781, T4m, T4l);
Chris@42 523 T4n = FMA(KP707106781, T4m, T4l);
Chris@42 524 {
Chris@42 525 E TaH, Tdc, T4p, T3G;
Chris@42 526 TaH = TaF + TaG;
Chris@42 527 Tdc = TaF - TaG;
Chris@42 528 T4p = FNMS(KP414213562, T3C, T3F);
Chris@42 529 T3G = FMA(KP414213562, T3F, T3C);
Chris@42 530 {
Chris@42 531 E Tdd, Tdo, T4q, T7T, T3H;
Chris@42 532 Tdd = Tdb + Tdc;
Chris@42 533 Tdo = Tdc - Tdb;
Chris@42 534 T4q = T4o + T4p;
Chris@42 535 T7T = T4o - T4p;
Chris@42 536 T84 = T3G - T3z;
Chris@42 537 T3H = T3z + T3G;
Chris@42 538 TeH = FNMS(KP707106781, Tdo, Tdn);
Chris@42 539 Tdp = FMA(KP707106781, Tdo, Tdn);
Chris@42 540 TeE = FNMS(KP707106781, Tdd, Tda);
Chris@42 541 Tde = FMA(KP707106781, Tdd, Tda);
Chris@42 542 T9i = FNMS(KP923879532, T7T, T7S);
Chris@42 543 T7U = FMA(KP923879532, T7T, T7S);
Chris@42 544 T6H = FNMS(KP923879532, T4q, T4n);
Chris@42 545 T4r = FMA(KP923879532, T4q, T4n);
Chris@42 546 T6E = FNMS(KP923879532, T3H, T3s);
Chris@42 547 T3I = FMA(KP923879532, T3H, T3s);
Chris@42 548 }
Chris@42 549 TbW = Tak + Tan;
Chris@42 550 Tao = Tak - Tan;
Chris@42 551 TbX = TaK + TaH;
Chris@42 552 TaL = TaH - TaK;
Chris@42 553 }
Chris@42 554 }
Chris@42 555 }
Chris@42 556 {
Chris@42 557 E T7N, T3d, T3a, T7M;
Chris@42 558 {
Chris@42 559 E T2V, T1z, T38, T1C, T1G, T1J, T2Y, T39, T1W, T33, T1V, T3b, T32, Td0, T1S;
Chris@42 560 E T1X;
Chris@42 561 {
Chris@42 562 E T1A, T1B, T1x, T1y;
Chris@42 563 T1x = R0[WS(rs, 63)];
Chris@42 564 T1y = R0[WS(rs, 31)];
Chris@42 565 T1A = R0[WS(rs, 15)];
Chris@42 566 T9l = FNMS(KP923879532, T84, T83);
Chris@42 567 T85 = FMA(KP923879532, T84, T83);
Chris@42 568 T2V = T1x - T1y;
Chris@42 569 T1z = T1x + T1y;
Chris@42 570 T1B = R0[WS(rs, 47)];
Chris@42 571 {
Chris@42 572 E T1H, T2W, T1I, T1E, T1F;
Chris@42 573 T1E = R0[WS(rs, 7)];
Chris@42 574 T1F = R0[WS(rs, 39)];
Chris@42 575 T1H = R0[WS(rs, 55)];
Chris@42 576 T38 = T1A - T1B;
Chris@42 577 T1C = T1A + T1B;
Chris@42 578 T2W = T1E - T1F;
Chris@42 579 T1G = T1E + T1F;
Chris@42 580 T1I = R0[WS(rs, 23)];
Chris@42 581 {
Chris@42 582 E T1P, T30, T1O, T1Q, T1M, T1N, T2X;
Chris@42 583 T1M = R0[WS(rs, 3)];
Chris@42 584 T1N = R0[WS(rs, 35)];
Chris@42 585 T2X = T1H - T1I;
Chris@42 586 T1J = T1H + T1I;
Chris@42 587 T1P = R0[WS(rs, 19)];
Chris@42 588 T30 = T1M - T1N;
Chris@42 589 T1O = T1M + T1N;
Chris@42 590 T2Y = T2W + T2X;
Chris@42 591 T39 = T2W - T2X;
Chris@42 592 T1Q = R0[WS(rs, 51)];
Chris@42 593 {
Chris@42 594 E T1T, T1U, T31, T1R;
Chris@42 595 T1T = R0[WS(rs, 59)];
Chris@42 596 T1U = R0[WS(rs, 27)];
Chris@42 597 T1W = R0[WS(rs, 11)];
Chris@42 598 T31 = T1P - T1Q;
Chris@42 599 T1R = T1P + T1Q;
Chris@42 600 T33 = T1T - T1U;
Chris@42 601 T1V = T1T + T1U;
Chris@42 602 T3b = FMA(KP414213562, T30, T31);
Chris@42 603 T32 = FNMS(KP414213562, T31, T30);
Chris@42 604 Td0 = T1O - T1R;
Chris@42 605 T1S = T1O + T1R;
Chris@42 606 T1X = R0[WS(rs, 43)];
Chris@42 607 }
Chris@42 608 }
Chris@42 609 }
Chris@42 610 }
Chris@42 611 {
Chris@42 612 E TcZ, Td4, T35, T3c, T1Z, Td2, Td5, Td1;
Chris@42 613 {
Chris@42 614 E T1D, T1K, T1Y, T34;
Chris@42 615 T1D = T1z + T1C;
Chris@42 616 TcZ = T1z - T1C;
Chris@42 617 Td4 = T1J - T1G;
Chris@42 618 T1K = T1G + T1J;
Chris@42 619 T1Y = T1W + T1X;
Chris@42 620 T34 = T1W - T1X;
Chris@42 621 T1L = T1D + T1K;
Chris@42 622 Tad = T1D - T1K;
Chris@42 623 T35 = FMA(KP414213562, T34, T33);
Chris@42 624 T3c = FNMS(KP414213562, T33, T34);
Chris@42 625 T1Z = T1V + T1Y;
Chris@42 626 Td1 = T1V - T1Y;
Chris@42 627 }
Chris@42 628 Td2 = Td0 + Td1;
Chris@42 629 Td5 = Td1 - Td0;
Chris@42 630 {
Chris@42 631 E T7J, T2Z, T36, T7K;
Chris@42 632 T7J = FNMS(KP707106781, T2Y, T2V);
Chris@42 633 T2Z = FMA(KP707106781, T2Y, T2V);
Chris@42 634 Tae = T1Z - T1S;
Chris@42 635 T20 = T1S + T1Z;
Chris@42 636 Tez = FNMS(KP707106781, Td5, Td4);
Chris@42 637 Td6 = FMA(KP707106781, Td5, Td4);
Chris@42 638 TeA = FNMS(KP707106781, Td2, TcZ);
Chris@42 639 Td3 = FMA(KP707106781, Td2, TcZ);
Chris@42 640 T36 = T32 + T35;
Chris@42 641 T7N = T35 - T32;
Chris@42 642 T7K = T3b - T3c;
Chris@42 643 T3d = T3b + T3c;
Chris@42 644 T3a = FMA(KP707106781, T39, T38);
Chris@42 645 T7M = FNMS(KP707106781, T39, T38);
Chris@42 646 T6x = FNMS(KP923879532, T36, T2Z);
Chris@42 647 T37 = FMA(KP923879532, T36, T2Z);
Chris@42 648 T9e = FNMS(KP923879532, T7K, T7J);
Chris@42 649 T7L = FMA(KP923879532, T7K, T7J);
Chris@42 650 }
Chris@42 651 }
Chris@42 652 }
Chris@42 653 {
Chris@42 654 E Tav, T7V, T7W, TaC;
Chris@42 655 {
Chris@42 656 E T3L, T3W, Tdf, Tar, T42, T4d, Tay, Tdi, T46, Tau, Tdg, T3X, T3S, Taz, T45;
Chris@42 657 E T47, Taw, Tax;
Chris@42 658 {
Chris@42 659 E T3J, T3K, T3U, T3V;
Chris@42 660 T3J = R1[WS(rs, 2)];
Chris@42 661 T9d = FNMS(KP923879532, T7N, T7M);
Chris@42 662 T7O = FMA(KP923879532, T7N, T7M);
Chris@42 663 T6w = FNMS(KP923879532, T3d, T3a);
Chris@42 664 T3e = FMA(KP923879532, T3d, T3a);
Chris@42 665 T3K = R1[WS(rs, 34)];
Chris@42 666 T3U = R1[WS(rs, 18)];
Chris@42 667 T3V = R1[WS(rs, 50)];
Chris@42 668 {
Chris@42 669 E T40, Tap, Taq, T41, T4b, T4c;
Chris@42 670 T40 = R1[WS(rs, 62)];
Chris@42 671 T3L = T3J - T3K;
Chris@42 672 Tap = T3J + T3K;
Chris@42 673 T3W = T3U - T3V;
Chris@42 674 Taq = T3U + T3V;
Chris@42 675 T41 = R1[WS(rs, 30)];
Chris@42 676 T4b = R1[WS(rs, 14)];
Chris@42 677 T4c = R1[WS(rs, 46)];
Chris@42 678 Tdf = Tap - Taq;
Chris@42 679 Tar = Tap + Taq;
Chris@42 680 T42 = T40 - T41;
Chris@42 681 Taw = T40 + T41;
Chris@42 682 Tax = T4b + T4c;
Chris@42 683 T4d = T4b - T4c;
Chris@42 684 }
Chris@42 685 }
Chris@42 686 {
Chris@42 687 E T3M, T3N, T3P, T3Q;
Chris@42 688 T3M = R1[WS(rs, 10)];
Chris@42 689 Tay = Taw + Tax;
Chris@42 690 Tdi = Taw - Tax;
Chris@42 691 T3N = R1[WS(rs, 42)];
Chris@42 692 T3P = R1[WS(rs, 58)];
Chris@42 693 T3Q = R1[WS(rs, 26)];
Chris@42 694 {
Chris@42 695 E T43, Tas, T3O, Tat, T3R, T44;
Chris@42 696 T43 = R1[WS(rs, 6)];
Chris@42 697 Tas = T3M + T3N;
Chris@42 698 T3O = T3M - T3N;
Chris@42 699 Tat = T3P + T3Q;
Chris@42 700 T3R = T3P - T3Q;
Chris@42 701 T44 = R1[WS(rs, 38)];
Chris@42 702 T46 = R1[WS(rs, 54)];
Chris@42 703 Tau = Tas + Tat;
Chris@42 704 Tdg = Tat - Tas;
Chris@42 705 T3X = T3O - T3R;
Chris@42 706 T3S = T3O + T3R;
Chris@42 707 Taz = T43 + T44;
Chris@42 708 T45 = T43 - T44;
Chris@42 709 T47 = R1[WS(rs, 22)];
Chris@42 710 }
Chris@42 711 }
Chris@42 712 {
Chris@42 713 E Tdq, Tdh, T49, T4e, Tdr, Tdk;
Chris@42 714 Tav = Tar - Tau;
Chris@42 715 TbZ = Tar + Tau;
Chris@42 716 {
Chris@42 717 E T3T, T3Y, TaA, T48, Tdj, TaB;
Chris@42 718 T3T = FMA(KP707106781, T3S, T3L);
Chris@42 719 T7V = FNMS(KP707106781, T3S, T3L);
Chris@42 720 T7W = FNMS(KP707106781, T3X, T3W);
Chris@42 721 T3Y = FMA(KP707106781, T3X, T3W);
Chris@42 722 TaA = T46 + T47;
Chris@42 723 T48 = T46 - T47;
Chris@42 724 Tdq = FNMS(KP414213562, Tdf, Tdg);
Chris@42 725 Tdh = FMA(KP414213562, Tdg, Tdf);
Chris@42 726 T3Z = FNMS(KP198912367, T3Y, T3T);
Chris@42 727 T4s = FMA(KP198912367, T3T, T3Y);
Chris@42 728 Tdj = TaA - Taz;
Chris@42 729 TaB = Taz + TaA;
Chris@42 730 T49 = T45 + T48;
Chris@42 731 T4e = T45 - T48;
Chris@42 732 TaC = Tay - TaB;
Chris@42 733 Tc0 = Tay + TaB;
Chris@42 734 Tdr = FMA(KP414213562, Tdi, Tdj);
Chris@42 735 Tdk = FNMS(KP414213562, Tdj, Tdi);
Chris@42 736 }
Chris@42 737 {
Chris@42 738 E T7Z, T7Y, T4f, T4a;
Chris@42 739 T7Z = FNMS(KP707106781, T4e, T4d);
Chris@42 740 T4f = FMA(KP707106781, T4e, T4d);
Chris@42 741 T4a = FMA(KP707106781, T49, T42);
Chris@42 742 T7Y = FNMS(KP707106781, T49, T42);
Chris@42 743 TeF = Tdr - Tdq;
Chris@42 744 Tds = Tdq + Tdr;
Chris@42 745 T4t = FNMS(KP198912367, T4a, T4f);
Chris@42 746 T4g = FMA(KP198912367, T4f, T4a);
Chris@42 747 T87 = FMA(KP668178637, T7Y, T7Z);
Chris@42 748 T80 = FNMS(KP668178637, T7Z, T7Y);
Chris@42 749 TeI = Tdh - Tdk;
Chris@42 750 Tdl = Tdh + Tdk;
Chris@42 751 }
Chris@42 752 }
Chris@42 753 }
Chris@42 754 {
Chris@42 755 E T50, T5b, TdA, TaY, T5h, T5s, Tb5, TdD, T5l, Tb1, TdB, T5c, T57, Tb6, T5k;
Chris@42 756 E T5m, Tb3, Tb4;
Chris@42 757 {
Chris@42 758 E T4Y, T4Z, T59, T5a;
Chris@42 759 T4Y = R1[WS(rs, 1)];
Chris@42 760 T86 = FNMS(KP668178637, T7V, T7W);
Chris@42 761 T7X = FMA(KP668178637, T7W, T7V);
Chris@42 762 TaM = TaC - Tav;
Chris@42 763 TaD = Tav + TaC;
Chris@42 764 T4Z = R1[WS(rs, 33)];
Chris@42 765 T59 = R1[WS(rs, 49)];
Chris@42 766 T5a = R1[WS(rs, 17)];
Chris@42 767 {
Chris@42 768 E T5f, TaW, TaX, T5g, T5q, T5r;
Chris@42 769 T5f = R1[WS(rs, 61)];
Chris@42 770 T50 = T4Y - T4Z;
Chris@42 771 TaW = T4Y + T4Z;
Chris@42 772 T5b = T59 - T5a;
Chris@42 773 TaX = T5a + T59;
Chris@42 774 T5g = R1[WS(rs, 29)];
Chris@42 775 T5q = R1[WS(rs, 45)];
Chris@42 776 T5r = R1[WS(rs, 13)];
Chris@42 777 TdA = TaW - TaX;
Chris@42 778 TaY = TaW + TaX;
Chris@42 779 T5h = T5f - T5g;
Chris@42 780 Tb3 = T5f + T5g;
Chris@42 781 Tb4 = T5r + T5q;
Chris@42 782 T5s = T5q - T5r;
Chris@42 783 }
Chris@42 784 }
Chris@42 785 {
Chris@42 786 E T51, T52, T54, T55;
Chris@42 787 T51 = R1[WS(rs, 9)];
Chris@42 788 Tb5 = Tb3 + Tb4;
Chris@42 789 TdD = Tb3 - Tb4;
Chris@42 790 T52 = R1[WS(rs, 41)];
Chris@42 791 T54 = R1[WS(rs, 57)];
Chris@42 792 T55 = R1[WS(rs, 25)];
Chris@42 793 {
Chris@42 794 E T5i, TaZ, T53, Tb0, T56, T5j;
Chris@42 795 T5i = R1[WS(rs, 5)];
Chris@42 796 TaZ = T51 + T52;
Chris@42 797 T53 = T51 - T52;
Chris@42 798 Tb0 = T54 + T55;
Chris@42 799 T56 = T54 - T55;
Chris@42 800 T5j = R1[WS(rs, 37)];
Chris@42 801 T5l = R1[WS(rs, 53)];
Chris@42 802 Tb1 = TaZ + Tb0;
Chris@42 803 TdB = Tb0 - TaZ;
Chris@42 804 T5c = T56 - T53;
Chris@42 805 T57 = T53 + T56;
Chris@42 806 Tb6 = T5i + T5j;
Chris@42 807 T5k = T5i - T5j;
Chris@42 808 T5m = R1[WS(rs, 21)];
Chris@42 809 }
Chris@42 810 }
Chris@42 811 {
Chris@42 812 E TdL, TdC, T5o, T5t, TdM, TdF;
Chris@42 813 Tb2 = TaY - Tb1;
Chris@42 814 Tc6 = TaY + Tb1;
Chris@42 815 {
Chris@42 816 E T58, T5d, Tb7, T5n, TdE, Tb8;
Chris@42 817 T58 = FMA(KP707106781, T57, T50);
Chris@42 818 T8e = FNMS(KP707106781, T57, T50);
Chris@42 819 T8f = FNMS(KP707106781, T5c, T5b);
Chris@42 820 T5d = FMA(KP707106781, T5c, T5b);
Chris@42 821 Tb7 = T5l + T5m;
Chris@42 822 T5n = T5l - T5m;
Chris@42 823 TdL = FNMS(KP414213562, TdA, TdB);
Chris@42 824 TdC = FMA(KP414213562, TdB, TdA);
Chris@42 825 T5e = FMA(KP198912367, T5d, T58);
Chris@42 826 T5H = FNMS(KP198912367, T58, T5d);
Chris@42 827 TdE = Tb7 - Tb6;
Chris@42 828 Tb8 = Tb6 + Tb7;
Chris@42 829 T5o = T5k + T5n;
Chris@42 830 T5t = T5n - T5k;
Chris@42 831 Tb9 = Tb5 - Tb8;
Chris@42 832 Tc7 = Tb5 + Tb8;
Chris@42 833 TdM = FMA(KP414213562, TdD, TdE);
Chris@42 834 TdF = FNMS(KP414213562, TdE, TdD);
Chris@42 835 }
Chris@42 836 {
Chris@42 837 E T8i, T8h, T5u, T5p;
Chris@42 838 T8i = FNMS(KP707106781, T5t, T5s);
Chris@42 839 T5u = FMA(KP707106781, T5t, T5s);
Chris@42 840 T5p = FMA(KP707106781, T5o, T5h);
Chris@42 841 T8h = FNMS(KP707106781, T5o, T5h);
Chris@42 842 TeM = TdM - TdL;
Chris@42 843 TdN = TdL + TdM;
Chris@42 844 T5I = FMA(KP198912367, T5p, T5u);
Chris@42 845 T5v = FNMS(KP198912367, T5u, T5p);
Chris@42 846 T8q = FNMS(KP668178637, T8h, T8i);
Chris@42 847 T8j = FMA(KP668178637, T8i, T8h);
Chris@42 848 TeP = TdF - TdC;
Chris@42 849 TdG = TdC + TdF;
Chris@42 850 }
Chris@42 851 }
Chris@42 852 }
Chris@42 853 }
Chris@42 854 }
Chris@42 855 }
Chris@42 856 }
Chris@42 857 {
Chris@42 858 E T8p, T8g, TcH, TdW, TdT, TcO, Tfp, Tfk, Tfj, Tfq;
Chris@42 859 {
Chris@42 860 E Tbj, Tba, Tcy, Tco, TcB, Tcl, Tcx, Tcv, Tcz, Tcr;
Chris@42 861 {
Chris@42 862 E Tch, Tct, Tcp, Tcq, Tci, T1w, TbV, T11, Tcf, Tc9, T21, Tcj, Tcm, TbY, Tc1;
Chris@42 863 E Tcn, Tcu, Tck;
Chris@42 864 {
Chris@42 865 E Tv, T10, Tc5, Tc8;
Chris@42 866 Tch = Tf - Tu;
Chris@42 867 Tv = Tf + Tu;
Chris@42 868 T8p = FMA(KP668178637, T8e, T8f);
Chris@42 869 T8g = FNMS(KP668178637, T8f, T8e);
Chris@42 870 Tbj = Tb9 - Tb2;
Chris@42 871 Tba = Tb2 + Tb9;
Chris@42 872 T10 = TK + TZ;
Chris@42 873 Tct = TZ - TK;
Chris@42 874 Tcp = Tc3 - Tc4;
Chris@42 875 Tc5 = Tc3 + Tc4;
Chris@42 876 Tc8 = Tc6 + Tc7;
Chris@42 877 Tcq = Tc7 - Tc6;
Chris@42 878 Tci = T1g - T1v;
Chris@42 879 T1w = T1g + T1v;
Chris@42 880 TbV = Tv - T10;
Chris@42 881 T11 = Tv + T10;
Chris@42 882 Tcf = Tc5 + Tc8;
Chris@42 883 Tc9 = Tc5 - Tc8;
Chris@42 884 T21 = T1L + T20;
Chris@42 885 Tcj = T1L - T20;
Chris@42 886 Tcm = TbW - TbX;
Chris@42 887 TbY = TbW + TbX;
Chris@42 888 Tc1 = TbZ + Tc0;
Chris@42 889 Tcn = Tc0 - TbZ;
Chris@42 890 }
Chris@42 891 {
Chris@42 892 E Tcb, T22, Tce, Tc2;
Chris@42 893 Tcb = T21 - T1w;
Chris@42 894 T22 = T1w + T21;
Chris@42 895 Tce = TbY + Tc1;
Chris@42 896 Tc2 = TbY - Tc1;
Chris@42 897 {
Chris@42 898 E Tcd, Tcg, Tca, Tcc;
Chris@42 899 Tcd = T11 + T22;
Chris@42 900 Cr[WS(csr, 32)] = T11 - T22;
Chris@42 901 Tcg = Tce + Tcf;
Chris@42 902 Ci[WS(csi, 32)] = Tcf - Tce;
Chris@42 903 Tca = Tc2 + Tc9;
Chris@42 904 Tcc = Tc9 - Tc2;
Chris@42 905 Cr[0] = Tcd + Tcg;
Chris@42 906 Cr[WS(csr, 64)] = Tcd - Tcg;
Chris@42 907 Ci[WS(csi, 48)] = FMS(KP707106781, Tcc, Tcb);
Chris@42 908 Ci[WS(csi, 16)] = FMA(KP707106781, Tcc, Tcb);
Chris@42 909 Cr[WS(csr, 16)] = FMA(KP707106781, Tca, TbV);
Chris@42 910 Cr[WS(csr, 48)] = FNMS(KP707106781, Tca, TbV);
Chris@42 911 Tcu = Tcj - Tci;
Chris@42 912 Tck = Tci + Tcj;
Chris@42 913 Tcy = FNMS(KP414213562, Tcm, Tcn);
Chris@42 914 Tco = FMA(KP414213562, Tcn, Tcm);
Chris@42 915 }
Chris@42 916 }
Chris@42 917 TcB = FNMS(KP707106781, Tck, Tch);
Chris@42 918 Tcl = FMA(KP707106781, Tck, Tch);
Chris@42 919 Tcx = FMA(KP707106781, Tcu, Tct);
Chris@42 920 Tcv = FNMS(KP707106781, Tcu, Tct);
Chris@42 921 Tcz = FMA(KP414213562, Tcp, Tcq);
Chris@42 922 Tcr = FNMS(KP414213562, Tcq, Tcp);
Chris@42 923 }
Chris@42 924 {
Chris@42 925 E TbT, TbO, TbN, TbU;
Chris@42 926 {
Chris@42 927 E Ta9, TbB, Tbb, TbL, Tbp, TbM, Tag, Tbk, TbR, TbJ, Tbw, TaO, TbC, Tbs, TbQ;
Chris@42 928 E TbG;
Chris@42 929 {
Chris@42 930 E Tbq, Tbr, TbH, TbI;
Chris@42 931 {
Chris@42 932 E Tbo, Ta8, Tac, Taf;
Chris@42 933 Tbo = Ta7 - Ta6;
Chris@42 934 Ta8 = Ta6 + Ta7;
Chris@42 935 {
Chris@42 936 E TcC, TcA, Tcw, Tcs;
Chris@42 937 TcC = Tcz - Tcy;
Chris@42 938 TcA = Tcy + Tcz;
Chris@42 939 Tcw = Tcr - Tco;
Chris@42 940 Tcs = Tco + Tcr;
Chris@42 941 Cr[WS(csr, 24)] = FMA(KP923879532, TcC, TcB);
Chris@42 942 Cr[WS(csr, 40)] = FNMS(KP923879532, TcC, TcB);
Chris@42 943 Ci[WS(csi, 56)] = FMS(KP923879532, TcA, Tcx);
Chris@42 944 Ci[WS(csi, 8)] = FMA(KP923879532, TcA, Tcx);
Chris@42 945 Ci[WS(csi, 40)] = FMA(KP923879532, Tcw, Tcv);
Chris@42 946 Ci[WS(csi, 24)] = FMS(KP923879532, Tcw, Tcv);
Chris@42 947 Cr[WS(csr, 8)] = FMA(KP923879532, Tcs, Tcl);
Chris@42 948 Cr[WS(csr, 56)] = FNMS(KP923879532, Tcs, Tcl);
Chris@42 949 Ta9 = FMA(KP707106781, Ta8, Ta5);
Chris@42 950 TbB = FNMS(KP707106781, Ta8, Ta5);
Chris@42 951 }
Chris@42 952 Tbq = FNMS(KP414213562, Taa, Tab);
Chris@42 953 Tac = FMA(KP414213562, Tab, Taa);
Chris@42 954 Taf = FNMS(KP414213562, Tae, Tad);
Chris@42 955 Tbr = FMA(KP414213562, Tad, Tae);
Chris@42 956 Tbb = FMA(KP707106781, Tba, TaV);
Chris@42 957 TbH = FNMS(KP707106781, Tba, TaV);
Chris@42 958 TbL = FNMS(KP707106781, Tbo, Tbn);
Chris@42 959 Tbp = FMA(KP707106781, Tbo, Tbn);
Chris@42 960 TbM = Taf - Tac;
Chris@42 961 Tag = Tac + Taf;
Chris@42 962 TbI = FNMS(KP707106781, Tbj, Tbi);
Chris@42 963 Tbk = FMA(KP707106781, Tbj, Tbi);
Chris@42 964 }
Chris@42 965 {
Chris@42 966 E TbE, TbF, TaE, TaN;
Chris@42 967 TbE = FNMS(KP707106781, TaD, Tao);
Chris@42 968 TaE = FMA(KP707106781, TaD, Tao);
Chris@42 969 TaN = FMA(KP707106781, TaM, TaL);
Chris@42 970 TbF = FNMS(KP707106781, TaM, TaL);
Chris@42 971 TbR = FNMS(KP668178637, TbH, TbI);
Chris@42 972 TbJ = FMA(KP668178637, TbI, TbH);
Chris@42 973 Tbw = FNMS(KP198912367, TaE, TaN);
Chris@42 974 TaO = FMA(KP198912367, TaN, TaE);
Chris@42 975 TbC = Tbr - Tbq;
Chris@42 976 Tbs = Tbq + Tbr;
Chris@42 977 TbQ = FMA(KP668178637, TbE, TbF);
Chris@42 978 TbG = FNMS(KP668178637, TbF, TbE);
Chris@42 979 }
Chris@42 980 }
Chris@42 981 {
Chris@42 982 E Tbz, Tah, Tbv, Tbt, Tbx, Tbl;
Chris@42 983 Tbz = FNMS(KP923879532, Tag, Ta9);
Chris@42 984 Tah = FMA(KP923879532, Tag, Ta9);
Chris@42 985 Tbv = FMA(KP923879532, Tbs, Tbp);
Chris@42 986 Tbt = FNMS(KP923879532, Tbs, Tbp);
Chris@42 987 Tbx = FMA(KP198912367, Tbb, Tbk);
Chris@42 988 Tbl = FNMS(KP198912367, Tbk, Tbb);
Chris@42 989 {
Chris@42 990 E TbD, TbK, TbP, TbS;
Chris@42 991 TbT = FNMS(KP923879532, TbC, TbB);
Chris@42 992 TbD = FMA(KP923879532, TbC, TbB);
Chris@42 993 {
Chris@42 994 E TbA, Tby, Tbu, Tbm;
Chris@42 995 TbA = Tbx - Tbw;
Chris@42 996 Tby = Tbw + Tbx;
Chris@42 997 Tbu = Tbl - TaO;
Chris@42 998 Tbm = TaO + Tbl;
Chris@42 999 Cr[WS(csr, 28)] = FMA(KP980785280, TbA, Tbz);
Chris@42 1000 Cr[WS(csr, 36)] = FNMS(KP980785280, TbA, Tbz);
Chris@42 1001 Ci[WS(csi, 60)] = FMS(KP980785280, Tby, Tbv);
Chris@42 1002 Ci[WS(csi, 4)] = FMA(KP980785280, Tby, Tbv);
Chris@42 1003 Ci[WS(csi, 36)] = FMA(KP980785280, Tbu, Tbt);
Chris@42 1004 Ci[WS(csi, 28)] = FMS(KP980785280, Tbu, Tbt);
Chris@42 1005 Cr[WS(csr, 4)] = FMA(KP980785280, Tbm, Tah);
Chris@42 1006 Cr[WS(csr, 60)] = FNMS(KP980785280, Tbm, Tah);
Chris@42 1007 TbK = TbG + TbJ;
Chris@42 1008 TbO = TbJ - TbG;
Chris@42 1009 }
Chris@42 1010 TbN = FMA(KP923879532, TbM, TbL);
Chris@42 1011 TbP = FNMS(KP923879532, TbM, TbL);
Chris@42 1012 TbS = TbQ + TbR;
Chris@42 1013 TbU = TbQ - TbR;
Chris@42 1014 Cr[WS(csr, 12)] = FMA(KP831469612, TbK, TbD);
Chris@42 1015 Cr[WS(csr, 52)] = FNMS(KP831469612, TbK, TbD);
Chris@42 1016 Ci[WS(csi, 52)] = FNMS(KP831469612, TbS, TbP);
Chris@42 1017 Ci[WS(csi, 12)] = -(FMA(KP831469612, TbS, TbP));
Chris@42 1018 }
Chris@42 1019 }
Chris@42 1020 }
Chris@42 1021 {
Chris@42 1022 E TeN, Tf7, Tev, Tfm, Tfc, TeQ, TeX, TeW, Tfn, Tff, Tfi, TeC, Tf2, TeK, Tfh;
Chris@42 1023 E TeV, Tf8;
Chris@42 1024 {
Chris@42 1025 E TeG, TeJ, Tfd, Tfe, Tey, TeB, TeT, TeU;
Chris@42 1026 {
Chris@42 1027 E Tet, Teu, Tfa, Tfb;
Chris@42 1028 TcH = FMA(KP707106781, TcG, TcD);
Chris@42 1029 Tet = FNMS(KP707106781, TcG, TcD);
Chris@42 1030 Ci[WS(csi, 44)] = FMS(KP831469612, TbO, TbN);
Chris@42 1031 Ci[WS(csi, 20)] = FMA(KP831469612, TbO, TbN);
Chris@42 1032 Cr[WS(csr, 20)] = FMA(KP831469612, TbU, TbT);
Chris@42 1033 Cr[WS(csr, 44)] = FNMS(KP831469612, TbU, TbT);
Chris@42 1034 Teu = TdV - TdU;
Chris@42 1035 TdW = TdU + TdV;
Chris@42 1036 TeG = FNMS(KP923879532, TeF, TeE);
Chris@42 1037 Tfa = FMA(KP923879532, TeF, TeE);
Chris@42 1038 Tfb = FMA(KP923879532, TeI, TeH);
Chris@42 1039 TeJ = FNMS(KP923879532, TeI, TeH);
Chris@42 1040 TeN = FNMS(KP923879532, TeM, TeL);
Chris@42 1041 Tfd = FMA(KP923879532, TeM, TeL);
Chris@42 1042 Tf7 = FMA(KP923879532, Teu, Tet);
Chris@42 1043 Tev = FNMS(KP923879532, Teu, Tet);
Chris@42 1044 Tfm = FMA(KP303346683, Tfa, Tfb);
Chris@42 1045 Tfc = FNMS(KP303346683, Tfb, Tfa);
Chris@42 1046 Tfe = FNMS(KP923879532, TeP, TeO);
Chris@42 1047 TeQ = FMA(KP923879532, TeP, TeO);
Chris@42 1048 TeX = FNMS(KP668178637, Tew, Tex);
Chris@42 1049 Tey = FMA(KP668178637, Tex, Tew);
Chris@42 1050 TeB = FNMS(KP668178637, TeA, Tez);
Chris@42 1051 TeW = FMA(KP668178637, Tez, TeA);
Chris@42 1052 }
Chris@42 1053 Tfn = FNMS(KP303346683, Tfd, Tfe);
Chris@42 1054 Tff = FMA(KP303346683, Tfe, Tfd);
Chris@42 1055 Tfi = Tey + TeB;
Chris@42 1056 TeC = Tey - TeB;
Chris@42 1057 TdT = FMA(KP707106781, TdS, TdR);
Chris@42 1058 TeT = FNMS(KP707106781, TdS, TdR);
Chris@42 1059 TeU = TcN - TcK;
Chris@42 1060 TcO = TcK + TcN;
Chris@42 1061 Tf2 = FNMS(KP534511135, TeG, TeJ);
Chris@42 1062 TeK = FMA(KP534511135, TeJ, TeG);
Chris@42 1063 Tfh = FNMS(KP923879532, TeU, TeT);
Chris@42 1064 TeV = FMA(KP923879532, TeU, TeT);
Chris@42 1065 }
Chris@42 1066 {
Chris@42 1067 E Tf5, TeD, TeY, Tf3, TeR;
Chris@42 1068 Tf5 = FNMS(KP831469612, TeC, Tev);
Chris@42 1069 TeD = FMA(KP831469612, TeC, Tev);
Chris@42 1070 Tf8 = TeX + TeW;
Chris@42 1071 TeY = TeW - TeX;
Chris@42 1072 Tf3 = FMA(KP534511135, TeN, TeQ);
Chris@42 1073 TeR = FNMS(KP534511135, TeQ, TeN);
Chris@42 1074 {
Chris@42 1075 E Tf1, TeZ, Tf6, Tf4, Tf0, TeS;
Chris@42 1076 Tf1 = FMA(KP831469612, TeY, TeV);
Chris@42 1077 TeZ = FNMS(KP831469612, TeY, TeV);
Chris@42 1078 Tf6 = Tf3 - Tf2;
Chris@42 1079 Tf4 = Tf2 + Tf3;
Chris@42 1080 Tf0 = TeR - TeK;
Chris@42 1081 TeS = TeK + TeR;
Chris@42 1082 Ci[WS(csi, 54)] = FMS(KP881921264, Tf4, Tf1);
Chris@42 1083 Ci[WS(csi, 10)] = FMA(KP881921264, Tf4, Tf1);
Chris@42 1084 Ci[WS(csi, 42)] = FMA(KP881921264, Tf0, TeZ);
Chris@42 1085 Ci[WS(csi, 22)] = FMS(KP881921264, Tf0, TeZ);
Chris@42 1086 Cr[WS(csr, 10)] = FMA(KP881921264, TeS, TeD);
Chris@42 1087 Cr[WS(csr, 54)] = FNMS(KP881921264, TeS, TeD);
Chris@42 1088 Cr[WS(csr, 42)] = FNMS(KP881921264, Tf6, Tf5);
Chris@42 1089 Cr[WS(csr, 22)] = FMA(KP881921264, Tf6, Tf5);
Chris@42 1090 }
Chris@42 1091 }
Chris@42 1092 {
Chris@42 1093 E Tf9, Tfg, Tfl, Tfo;
Chris@42 1094 Tfp = FNMS(KP831469612, Tf8, Tf7);
Chris@42 1095 Tf9 = FMA(KP831469612, Tf8, Tf7);
Chris@42 1096 Tfg = Tfc + Tff;
Chris@42 1097 Tfk = Tff - Tfc;
Chris@42 1098 Tfj = FNMS(KP831469612, Tfi, Tfh);
Chris@42 1099 Tfl = FMA(KP831469612, Tfi, Tfh);
Chris@42 1100 Tfo = Tfm + Tfn;
Chris@42 1101 Tfq = Tfm - Tfn;
Chris@42 1102 Cr[WS(csr, 6)] = FMA(KP956940335, Tfg, Tf9);
Chris@42 1103 Cr[WS(csr, 58)] = FNMS(KP956940335, Tfg, Tf9);
Chris@42 1104 Ci[WS(csi, 58)] = FNMS(KP956940335, Tfo, Tfl);
Chris@42 1105 Ci[WS(csi, 6)] = -(FMA(KP956940335, Tfo, Tfl));
Chris@42 1106 }
Chris@42 1107 }
Chris@42 1108 }
Chris@42 1109 }
Chris@42 1110 {
Chris@42 1111 E T2f, T5W, T5T, T2y, T5J, T5w, T4u, T4h, T7p, T7q;
Chris@42 1112 {
Chris@42 1113 E Ter, Tem, Tel, Tes;
Chris@42 1114 {
Chris@42 1115 E TdH, Te9, TcP, Teo, Tee, TdO, TdY, TdZ, Tep, Teh, Tek, Td8, Te4, Tdu, Tej;
Chris@42 1116 E TdX, Tea;
Chris@42 1117 {
Chris@42 1118 E Tdm, Tdt, Tef, Teg, TcY, Td7, Tec, Ted;
Chris@42 1119 Ci[WS(csi, 38)] = FMS(KP956940335, Tfk, Tfj);
Chris@42 1120 Ci[WS(csi, 26)] = FMA(KP956940335, Tfk, Tfj);
Chris@42 1121 Cr[WS(csr, 26)] = FMA(KP956940335, Tfq, Tfp);
Chris@42 1122 Cr[WS(csr, 38)] = FNMS(KP956940335, Tfq, Tfp);
Chris@42 1123 Tdm = FMA(KP923879532, Tdl, Tde);
Chris@42 1124 Tec = FNMS(KP923879532, Tdl, Tde);
Chris@42 1125 Ted = FNMS(KP923879532, Tds, Tdp);
Chris@42 1126 Tdt = FMA(KP923879532, Tds, Tdp);
Chris@42 1127 TdH = FMA(KP923879532, TdG, Tdz);
Chris@42 1128 Tef = FNMS(KP923879532, TdG, Tdz);
Chris@42 1129 Te9 = FNMS(KP923879532, TcO, TcH);
Chris@42 1130 TcP = FMA(KP923879532, TcO, TcH);
Chris@42 1131 Teo = FMA(KP820678790, Tec, Ted);
Chris@42 1132 Tee = FNMS(KP820678790, Ted, Tec);
Chris@42 1133 Teg = FNMS(KP923879532, TdN, TdK);
Chris@42 1134 TdO = FMA(KP923879532, TdN, TdK);
Chris@42 1135 TdY = FNMS(KP198912367, TcU, TcX);
Chris@42 1136 TcY = FMA(KP198912367, TcX, TcU);
Chris@42 1137 Td7 = FNMS(KP198912367, Td6, Td3);
Chris@42 1138 TdZ = FMA(KP198912367, Td3, Td6);
Chris@42 1139 Tep = FNMS(KP820678790, Tef, Teg);
Chris@42 1140 Teh = FMA(KP820678790, Teg, Tef);
Chris@42 1141 Tek = Td7 - TcY;
Chris@42 1142 Td8 = TcY + Td7;
Chris@42 1143 Te4 = FNMS(KP098491403, Tdm, Tdt);
Chris@42 1144 Tdu = FMA(KP098491403, Tdt, Tdm);
Chris@42 1145 Tej = FNMS(KP923879532, TdW, TdT);
Chris@42 1146 TdX = FMA(KP923879532, TdW, TdT);
Chris@42 1147 }
Chris@42 1148 {
Chris@42 1149 E Te7, Td9, Te0, Te5, TdP;
Chris@42 1150 Te7 = FNMS(KP980785280, Td8, TcP);
Chris@42 1151 Td9 = FMA(KP980785280, Td8, TcP);
Chris@42 1152 Tea = TdZ - TdY;
Chris@42 1153 Te0 = TdY + TdZ;
Chris@42 1154 Te5 = FMA(KP098491403, TdH, TdO);
Chris@42 1155 TdP = FNMS(KP098491403, TdO, TdH);
Chris@42 1156 {
Chris@42 1157 E Te3, Te1, Te8, Te6, Te2, TdQ;
Chris@42 1158 Te3 = FMA(KP980785280, Te0, TdX);
Chris@42 1159 Te1 = FNMS(KP980785280, Te0, TdX);
Chris@42 1160 Te8 = Te5 - Te4;
Chris@42 1161 Te6 = Te4 + Te5;
Chris@42 1162 Te2 = TdP - Tdu;
Chris@42 1163 TdQ = Tdu + TdP;
Chris@42 1164 Ci[WS(csi, 62)] = FMS(KP995184726, Te6, Te3);
Chris@42 1165 Ci[WS(csi, 2)] = FMA(KP995184726, Te6, Te3);
Chris@42 1166 Ci[WS(csi, 34)] = FMA(KP995184726, Te2, Te1);
Chris@42 1167 Ci[WS(csi, 30)] = FMS(KP995184726, Te2, Te1);
Chris@42 1168 Cr[WS(csr, 2)] = FMA(KP995184726, TdQ, Td9);
Chris@42 1169 Cr[WS(csr, 62)] = FNMS(KP995184726, TdQ, Td9);
Chris@42 1170 Cr[WS(csr, 34)] = FNMS(KP995184726, Te8, Te7);
Chris@42 1171 Cr[WS(csr, 30)] = FMA(KP995184726, Te8, Te7);
Chris@42 1172 }
Chris@42 1173 }
Chris@42 1174 {
Chris@42 1175 E Teb, Tei, Ten, Teq;
Chris@42 1176 Ter = FNMS(KP980785280, Tea, Te9);
Chris@42 1177 Teb = FMA(KP980785280, Tea, Te9);
Chris@42 1178 Tei = Tee + Teh;
Chris@42 1179 Tem = Teh - Tee;
Chris@42 1180 Tel = FMA(KP980785280, Tek, Tej);
Chris@42 1181 Ten = FNMS(KP980785280, Tek, Tej);
Chris@42 1182 Teq = Teo + Tep;
Chris@42 1183 Tes = Teo - Tep;
Chris@42 1184 Cr[WS(csr, 14)] = FMA(KP773010453, Tei, Teb);
Chris@42 1185 Cr[WS(csr, 50)] = FNMS(KP773010453, Tei, Teb);
Chris@42 1186 Ci[WS(csi, 50)] = FNMS(KP773010453, Teq, Ten);
Chris@42 1187 Ci[WS(csi, 14)] = -(FMA(KP773010453, Teq, Ten));
Chris@42 1188 }
Chris@42 1189 }
Chris@42 1190 {
Chris@42 1191 E T77, T6v, T7i, T6C, T78, T6Y, T7h, T6V, T6N, T7d, T6P, T6F, T6I;
Chris@42 1192 {
Chris@42 1193 E T6W, T6X, T6T, T6U, T6M;
Chris@42 1194 {
Chris@42 1195 E T6t, T6u, T6y, T6B;
Chris@42 1196 T2f = FMA(KP923879532, T2e, T27);
Chris@42 1197 T6t = FNMS(KP923879532, T2e, T27);
Chris@42 1198 Ci[WS(csi, 46)] = FMS(KP773010453, Tem, Tel);
Chris@42 1199 Ci[WS(csi, 18)] = FMA(KP773010453, Tem, Tel);
Chris@42 1200 Cr[WS(csr, 18)] = FMA(KP773010453, Tes, Ter);
Chris@42 1201 Cr[WS(csr, 46)] = FNMS(KP773010453, Tes, Ter);
Chris@42 1202 T6u = T5U - T5V;
Chris@42 1203 T5W = T5U + T5V;
Chris@42 1204 T6W = FNMS(KP820678790, T6w, T6x);
Chris@42 1205 T6y = FMA(KP820678790, T6x, T6w);
Chris@42 1206 T6B = FNMS(KP820678790, T6A, T6z);
Chris@42 1207 T6X = FMA(KP820678790, T6z, T6A);
Chris@42 1208 T77 = FMA(KP980785280, T6u, T6t);
Chris@42 1209 T6v = FNMS(KP980785280, T6u, T6t);
Chris@42 1210 T7i = T6B + T6y;
Chris@42 1211 T6C = T6y - T6B;
Chris@42 1212 }
Chris@42 1213 T5T = FMA(KP923879532, T5S, T5P);
Chris@42 1214 T6T = FNMS(KP923879532, T5S, T5P);
Chris@42 1215 T6U = T2x - T2o;
Chris@42 1216 T2y = T2o + T2x;
Chris@42 1217 T5J = T5H + T5I;
Chris@42 1218 T6M = T5I - T5H;
Chris@42 1219 T78 = T6X + T6W;
Chris@42 1220 T6Y = T6W - T6X;
Chris@42 1221 T7h = FMA(KP980785280, T6U, T6T);
Chris@42 1222 T6V = FNMS(KP980785280, T6U, T6T);
Chris@42 1223 T6N = FNMS(KP980785280, T6M, T6L);
Chris@42 1224 T7d = FMA(KP980785280, T6M, T6L);
Chris@42 1225 T6P = T5v - T5e;
Chris@42 1226 T5w = T5e + T5v;
Chris@42 1227 T4u = T4s + T4t;
Chris@42 1228 T6F = T4s - T4t;
Chris@42 1229 T6I = T4g - T3Z;
Chris@42 1230 T4h = T3Z + T4g;
Chris@42 1231 }
Chris@42 1232 {
Chris@42 1233 E T75, T7f, T7n, T7c, T7m, T76;
Chris@42 1234 {
Chris@42 1235 E T6D, T72, T6R, T73, T6K, T71, T6Z, T7e, T6Q, T74, T70, T6S;
Chris@42 1236 T75 = FNMS(KP773010453, T6C, T6v);
Chris@42 1237 T6D = FMA(KP773010453, T6C, T6v);
Chris@42 1238 T7e = FNMS(KP980785280, T6P, T6O);
Chris@42 1239 T6Q = FMA(KP980785280, T6P, T6O);
Chris@42 1240 {
Chris@42 1241 E T7a, T6G, T7b, T6J;
Chris@42 1242 T7a = FMA(KP980785280, T6F, T6E);
Chris@42 1243 T6G = FNMS(KP980785280, T6F, T6E);
Chris@42 1244 T7b = FMA(KP980785280, T6I, T6H);
Chris@42 1245 T6J = FNMS(KP980785280, T6I, T6H);
Chris@42 1246 T7f = FMA(KP357805721, T7e, T7d);
Chris@42 1247 T7n = FNMS(KP357805721, T7d, T7e);
Chris@42 1248 T72 = FMA(KP472964775, T6N, T6Q);
Chris@42 1249 T6R = FNMS(KP472964775, T6Q, T6N);
Chris@42 1250 T7c = FMA(KP357805721, T7b, T7a);
Chris@42 1251 T7m = FNMS(KP357805721, T7a, T7b);
Chris@42 1252 T73 = FMA(KP472964775, T6G, T6J);
Chris@42 1253 T6K = FNMS(KP472964775, T6J, T6G);
Chris@42 1254 }
Chris@42 1255 T71 = FNMS(KP773010453, T6Y, T6V);
Chris@42 1256 T6Z = FMA(KP773010453, T6Y, T6V);
Chris@42 1257 T74 = T72 - T73;
Chris@42 1258 T76 = T73 + T72;
Chris@42 1259 T70 = T6R - T6K;
Chris@42 1260 T6S = T6K + T6R;
Chris@42 1261 Ci[WS(csi, 55)] = FMA(KP903989293, T74, T71);
Chris@42 1262 Ci[WS(csi, 9)] = FMS(KP903989293, T74, T71);
Chris@42 1263 Cr[WS(csr, 9)] = FMA(KP903989293, T6S, T6D);
Chris@42 1264 Cr[WS(csr, 55)] = FNMS(KP903989293, T6S, T6D);
Chris@42 1265 Ci[WS(csi, 41)] = FMS(KP903989293, T70, T6Z);
Chris@42 1266 Ci[WS(csi, 23)] = FMA(KP903989293, T70, T6Z);
Chris@42 1267 }
Chris@42 1268 {
Chris@42 1269 E T7k, T7j, T7l, T7o, T79, T7g;
Chris@42 1270 T7p = FNMS(KP773010453, T78, T77);
Chris@42 1271 T79 = FMA(KP773010453, T78, T77);
Chris@42 1272 T7g = T7c + T7f;
Chris@42 1273 T7k = T7f - T7c;
Chris@42 1274 T7j = FNMS(KP773010453, T7i, T7h);
Chris@42 1275 T7l = FMA(KP773010453, T7i, T7h);
Chris@42 1276 Cr[WS(csr, 23)] = FMA(KP903989293, T76, T75);
Chris@42 1277 Cr[WS(csr, 41)] = FNMS(KP903989293, T76, T75);
Chris@42 1278 Cr[WS(csr, 7)] = FMA(KP941544065, T7g, T79);
Chris@42 1279 Cr[WS(csr, 57)] = FNMS(KP941544065, T7g, T79);
Chris@42 1280 T7o = T7m - T7n;
Chris@42 1281 T7q = T7m + T7n;
Chris@42 1282 Ci[WS(csi, 57)] = FMS(KP941544065, T7o, T7l);
Chris@42 1283 Ci[WS(csi, 7)] = FMA(KP941544065, T7o, T7l);
Chris@42 1284 Ci[WS(csi, 39)] = FMA(KP941544065, T7k, T7j);
Chris@42 1285 Ci[WS(csi, 25)] = FMS(KP941544065, T7k, T7j);
Chris@42 1286 }
Chris@42 1287 }
Chris@42 1288 }
Chris@42 1289 }
Chris@42 1290 {
Chris@42 1291 E T7t, T8A, T8x, T7A, T8r, T8k, T88, T81, Ta3, Ta4, T6r, T6s;
Chris@42 1292 {
Chris@42 1293 E T9L, T99, T9W, T9g, T9M, T9C, T9V, T9z, T9k, T9O, T9T, Ta0, T9H, T9v, T9m;
Chris@42 1294 {
Chris@42 1295 E T9B, T9c, T9f, T9A, T97, T98;
Chris@42 1296 T7t = FMA(KP923879532, T7s, T7r);
Chris@42 1297 T97 = FNMS(KP923879532, T7s, T7r);
Chris@42 1298 T98 = T8z - T8y;
Chris@42 1299 T8A = T8y + T8z;
Chris@42 1300 T9B = FNMS(KP534511135, T9a, T9b);
Chris@42 1301 T9c = FMA(KP534511135, T9b, T9a);
Chris@42 1302 Cr[WS(csr, 25)] = FNMS(KP941544065, T7q, T7p);
Chris@42 1303 Cr[WS(csr, 39)] = FMA(KP941544065, T7q, T7p);
Chris@42 1304 T9L = FMA(KP831469612, T98, T97);
Chris@42 1305 T99 = FNMS(KP831469612, T98, T97);
Chris@42 1306 T9f = FNMS(KP534511135, T9e, T9d);
Chris@42 1307 T9A = FMA(KP534511135, T9d, T9e);
Chris@42 1308 {
Chris@42 1309 E T9x, T9y, T9q, T9t;
Chris@42 1310 T8x = FMA(KP923879532, T8w, T8v);
Chris@42 1311 T9x = FNMS(KP923879532, T8w, T8v);
Chris@42 1312 T9W = T9c + T9f;
Chris@42 1313 T9g = T9c - T9f;
Chris@42 1314 T9M = T9B + T9A;
Chris@42 1315 T9C = T9A - T9B;
Chris@42 1316 T9y = T7z - T7w;
Chris@42 1317 T7A = T7w + T7z;
Chris@42 1318 T8r = T8p + T8q;
Chris@42 1319 T9q = T8p - T8q;
Chris@42 1320 T9t = T8j - T8g;
Chris@42 1321 T8k = T8g + T8j;
Chris@42 1322 {
Chris@42 1323 E T9R, T9r, T9S, T9u, T9j;
Chris@42 1324 T88 = T86 + T87;
Chris@42 1325 T9j = T87 - T86;
Chris@42 1326 T9V = FNMS(KP831469612, T9y, T9x);
Chris@42 1327 T9z = FMA(KP831469612, T9y, T9x);
Chris@42 1328 T9R = FMA(KP831469612, T9q, T9p);
Chris@42 1329 T9r = FNMS(KP831469612, T9q, T9p);
Chris@42 1330 T9S = FMA(KP831469612, T9t, T9s);
Chris@42 1331 T9u = FNMS(KP831469612, T9t, T9s);
Chris@42 1332 T9k = FNMS(KP831469612, T9j, T9i);
Chris@42 1333 T9O = FMA(KP831469612, T9j, T9i);
Chris@42 1334 T9T = FNMS(KP250486960, T9S, T9R);
Chris@42 1335 Ta0 = FMA(KP250486960, T9R, T9S);
Chris@42 1336 T9H = FNMS(KP599376933, T9r, T9u);
Chris@42 1337 T9v = FMA(KP599376933, T9u, T9r);
Chris@42 1338 T9m = T7X - T80;
Chris@42 1339 T81 = T7X + T80;
Chris@42 1340 }
Chris@42 1341 }
Chris@42 1342 }
Chris@42 1343 {
Chris@42 1344 E T9J, T9h, T9F, T9D, T9P, T9n;
Chris@42 1345 T9J = FNMS(KP881921264, T9g, T99);
Chris@42 1346 T9h = FMA(KP881921264, T9g, T99);
Chris@42 1347 T9F = FMA(KP881921264, T9C, T9z);
Chris@42 1348 T9D = FNMS(KP881921264, T9C, T9z);
Chris@42 1349 T9P = FMA(KP831469612, T9m, T9l);
Chris@42 1350 T9n = FNMS(KP831469612, T9m, T9l);
Chris@42 1351 {
Chris@42 1352 E T9Y, T9X, T9Z, Ta2;
Chris@42 1353 {
Chris@42 1354 E T9N, Ta1, T9G, T9o, T9U, T9Q;
Chris@42 1355 Ta3 = FNMS(KP881921264, T9M, T9L);
Chris@42 1356 T9N = FMA(KP881921264, T9M, T9L);
Chris@42 1357 T9Q = FNMS(KP250486960, T9P, T9O);
Chris@42 1358 Ta1 = FMA(KP250486960, T9O, T9P);
Chris@42 1359 T9G = FNMS(KP599376933, T9k, T9n);
Chris@42 1360 T9o = FMA(KP599376933, T9n, T9k);
Chris@42 1361 T9U = T9Q + T9T;
Chris@42 1362 T9Y = T9T - T9Q;
Chris@42 1363 T9X = FNMS(KP881921264, T9W, T9V);
Chris@42 1364 T9Z = FMA(KP881921264, T9W, T9V);
Chris@42 1365 {
Chris@42 1366 E T9K, T9I, T9E, T9w;
Chris@42 1367 T9K = T9G + T9H;
Chris@42 1368 T9I = T9G - T9H;
Chris@42 1369 T9E = T9v - T9o;
Chris@42 1370 T9w = T9o + T9v;
Chris@42 1371 Cr[WS(csr, 5)] = FMA(KP970031253, T9U, T9N);
Chris@42 1372 Cr[WS(csr, 59)] = FNMS(KP970031253, T9U, T9N);
Chris@42 1373 Cr[WS(csr, 21)] = FNMS(KP857728610, T9K, T9J);
Chris@42 1374 Cr[WS(csr, 43)] = FMA(KP857728610, T9K, T9J);
Chris@42 1375 Ci[WS(csi, 53)] = FMS(KP857728610, T9I, T9F);
Chris@42 1376 Ci[WS(csi, 11)] = FMA(KP857728610, T9I, T9F);
Chris@42 1377 Ci[WS(csi, 43)] = FMA(KP857728610, T9E, T9D);
Chris@42 1378 Ci[WS(csi, 21)] = FMS(KP857728610, T9E, T9D);
Chris@42 1379 Cr[WS(csr, 11)] = FMA(KP857728610, T9w, T9h);
Chris@42 1380 Cr[WS(csr, 53)] = FNMS(KP857728610, T9w, T9h);
Chris@42 1381 Ta2 = Ta0 - Ta1;
Chris@42 1382 Ta4 = Ta1 + Ta0;
Chris@42 1383 }
Chris@42 1384 }
Chris@42 1385 Ci[WS(csi, 59)] = FMA(KP970031253, Ta2, T9Z);
Chris@42 1386 Ci[WS(csi, 5)] = FMS(KP970031253, Ta2, T9Z);
Chris@42 1387 Ci[WS(csi, 37)] = FMS(KP970031253, T9Y, T9X);
Chris@42 1388 Ci[WS(csi, 27)] = FMA(KP970031253, T9Y, T9X);
Chris@42 1389 }
Chris@42 1390 }
Chris@42 1391 }
Chris@42 1392 {
Chris@42 1393 E T69, T2z, T6k, T3g, T6a, T60, T6j, T5X, T4i, T6c, T6h, T6p, T64, T5L;
Chris@42 1394 {
Chris@42 1395 E T5Y, T2U, T3f, T5Z;
Chris@42 1396 T5Y = FMA(KP098491403, T2M, T2T);
Chris@42 1397 T2U = FNMS(KP098491403, T2T, T2M);
Chris@42 1398 Cr[WS(csr, 27)] = FMA(KP970031253, Ta4, Ta3);
Chris@42 1399 Cr[WS(csr, 37)] = FNMS(KP970031253, Ta4, Ta3);
Chris@42 1400 T69 = FNMS(KP980785280, T2y, T2f);
Chris@42 1401 T2z = FMA(KP980785280, T2y, T2f);
Chris@42 1402 T3f = FMA(KP098491403, T3e, T37);
Chris@42 1403 T5Z = FNMS(KP098491403, T37, T3e);
Chris@42 1404 T6k = T3f - T2U;
Chris@42 1405 T3g = T2U + T3f;
Chris@42 1406 T6a = T5Y - T5Z;
Chris@42 1407 T60 = T5Y + T5Z;
Chris@42 1408 {
Chris@42 1409 E T6f, T5x, T6g, T5K;
Chris@42 1410 T6j = FNMS(KP980785280, T5W, T5T);
Chris@42 1411 T5X = FMA(KP980785280, T5W, T5T);
Chris@42 1412 T6f = FNMS(KP980785280, T5w, T4X);
Chris@42 1413 T5x = FMA(KP980785280, T5w, T4X);
Chris@42 1414 T6g = FNMS(KP980785280, T5J, T5G);
Chris@42 1415 T5K = FMA(KP980785280, T5J, T5G);
Chris@42 1416 T4i = FMA(KP980785280, T4h, T3I);
Chris@42 1417 T6c = FNMS(KP980785280, T4h, T3I);
Chris@42 1418 T6h = FMA(KP906347169, T6g, T6f);
Chris@42 1419 T6p = FNMS(KP906347169, T6f, T6g);
Chris@42 1420 T64 = FMA(KP049126849, T5x, T5K);
Chris@42 1421 T5L = FNMS(KP049126849, T5K, T5x);
Chris@42 1422 }
Chris@42 1423 }
Chris@42 1424 {
Chris@42 1425 E T67, T3h, T63, T61, T6d, T4v;
Chris@42 1426 T67 = FNMS(KP995184726, T3g, T2z);
Chris@42 1427 T3h = FMA(KP995184726, T3g, T2z);
Chris@42 1428 T63 = FMA(KP995184726, T60, T5X);
Chris@42 1429 T61 = FNMS(KP995184726, T60, T5X);
Chris@42 1430 T6d = FNMS(KP980785280, T4u, T4r);
Chris@42 1431 T4v = FMA(KP980785280, T4u, T4r);
Chris@42 1432 {
Chris@42 1433 E T6m, T6l, T6n, T6q;
Chris@42 1434 {
Chris@42 1435 E T6b, T6o, T65, T4w, T6i, T6e;
Chris@42 1436 T6r = FNMS(KP995184726, T6a, T69);
Chris@42 1437 T6b = FMA(KP995184726, T6a, T69);
Chris@42 1438 T6e = FMA(KP906347169, T6d, T6c);
Chris@42 1439 T6o = FNMS(KP906347169, T6c, T6d);
Chris@42 1440 T65 = FMA(KP049126849, T4i, T4v);
Chris@42 1441 T4w = FNMS(KP049126849, T4v, T4i);
Chris@42 1442 T6i = T6e + T6h;
Chris@42 1443 T6m = T6h - T6e;
Chris@42 1444 T6l = FNMS(KP995184726, T6k, T6j);
Chris@42 1445 T6n = FMA(KP995184726, T6k, T6j);
Chris@42 1446 {
Chris@42 1447 E T68, T66, T62, T5M;
Chris@42 1448 T68 = T65 + T64;
Chris@42 1449 T66 = T64 - T65;
Chris@42 1450 T62 = T5L - T4w;
Chris@42 1451 T5M = T4w + T5L;
Chris@42 1452 Cr[WS(csr, 15)] = FMA(KP740951125, T6i, T6b);
Chris@42 1453 Cr[WS(csr, 49)] = FNMS(KP740951125, T6i, T6b);
Chris@42 1454 Cr[WS(csr, 31)] = FMA(KP998795456, T68, T67);
Chris@42 1455 Cr[WS(csr, 33)] = FNMS(KP998795456, T68, T67);
Chris@42 1456 Ci[WS(csi, 63)] = FMA(KP998795456, T66, T63);
Chris@42 1457 Ci[WS(csi, 1)] = FMS(KP998795456, T66, T63);
Chris@42 1458 Ci[WS(csi, 33)] = FMS(KP998795456, T62, T61);
Chris@42 1459 Ci[WS(csi, 31)] = FMA(KP998795456, T62, T61);
Chris@42 1460 Cr[WS(csr, 1)] = FMA(KP998795456, T5M, T3h);
Chris@42 1461 Cr[WS(csr, 63)] = FNMS(KP998795456, T5M, T3h);
Chris@42 1462 T6q = T6o - T6p;
Chris@42 1463 T6s = T6o + T6p;
Chris@42 1464 }
Chris@42 1465 }
Chris@42 1466 Ci[WS(csi, 49)] = FMS(KP740951125, T6q, T6n);
Chris@42 1467 Ci[WS(csi, 15)] = FMA(KP740951125, T6q, T6n);
Chris@42 1468 Ci[WS(csi, 47)] = FMA(KP740951125, T6m, T6l);
Chris@42 1469 Ci[WS(csi, 17)] = FMS(KP740951125, T6m, T6l);
Chris@42 1470 }
Chris@42 1471 }
Chris@42 1472 }
Chris@42 1473 {
Chris@42 1474 E T8N, T7B, T8Y, T7Q, T8O, T8E, T8X, T8B, T82, T8Q, T8V, T92, T8J, T8t;
Chris@42 1475 {
Chris@42 1476 E T8C, T7I, T7P, T8D;
Chris@42 1477 T8C = FNMS(KP303346683, T7E, T7H);
Chris@42 1478 T7I = FMA(KP303346683, T7H, T7E);
Chris@42 1479 Cr[WS(csr, 17)] = FNMS(KP740951125, T6s, T6r);
Chris@42 1480 Cr[WS(csr, 47)] = FMA(KP740951125, T6s, T6r);
Chris@42 1481 T8N = FNMS(KP831469612, T7A, T7t);
Chris@42 1482 T7B = FMA(KP831469612, T7A, T7t);
Chris@42 1483 T7P = FNMS(KP303346683, T7O, T7L);
Chris@42 1484 T8D = FMA(KP303346683, T7L, T7O);
Chris@42 1485 T8Y = T7P - T7I;
Chris@42 1486 T7Q = T7I + T7P;
Chris@42 1487 T8O = T8D - T8C;
Chris@42 1488 T8E = T8C + T8D;
Chris@42 1489 {
Chris@42 1490 E T8T, T8l, T8U, T8s;
Chris@42 1491 T8X = FNMS(KP831469612, T8A, T8x);
Chris@42 1492 T8B = FMA(KP831469612, T8A, T8x);
Chris@42 1493 T8T = FNMS(KP831469612, T8k, T8d);
Chris@42 1494 T8l = FMA(KP831469612, T8k, T8d);
Chris@42 1495 T8U = FNMS(KP831469612, T8r, T8o);
Chris@42 1496 T8s = FMA(KP831469612, T8r, T8o);
Chris@42 1497 T82 = FMA(KP831469612, T81, T7U);
Chris@42 1498 T8Q = FNMS(KP831469612, T81, T7U);
Chris@42 1499 T8V = FNMS(KP741650546, T8U, T8T);
Chris@42 1500 T92 = FMA(KP741650546, T8T, T8U);
Chris@42 1501 T8J = FNMS(KP148335987, T8l, T8s);
Chris@42 1502 T8t = FMA(KP148335987, T8s, T8l);
Chris@42 1503 }
Chris@42 1504 }
Chris@42 1505 {
Chris@42 1506 E T8L, T7R, T8H, T8F, T8R, T89;
Chris@42 1507 T8L = FNMS(KP956940335, T7Q, T7B);
Chris@42 1508 T7R = FMA(KP956940335, T7Q, T7B);
Chris@42 1509 T8H = FMA(KP956940335, T8E, T8B);
Chris@42 1510 T8F = FNMS(KP956940335, T8E, T8B);
Chris@42 1511 T8R = FNMS(KP831469612, T88, T85);
Chris@42 1512 T89 = FMA(KP831469612, T88, T85);
Chris@42 1513 {
Chris@42 1514 E T90, T8Z, T91, T94;
Chris@42 1515 {
Chris@42 1516 E T8P, T93, T8I, T8a, T8W, T8S;
Chris@42 1517 T95 = FNMS(KP956940335, T8O, T8N);
Chris@42 1518 T8P = FMA(KP956940335, T8O, T8N);
Chris@42 1519 T8S = FNMS(KP741650546, T8R, T8Q);
Chris@42 1520 T93 = FMA(KP741650546, T8Q, T8R);
Chris@42 1521 T8I = FNMS(KP148335987, T82, T89);
Chris@42 1522 T8a = FMA(KP148335987, T89, T82);
Chris@42 1523 T8W = T8S + T8V;
Chris@42 1524 T90 = T8V - T8S;
Chris@42 1525 T8Z = FMA(KP956940335, T8Y, T8X);
Chris@42 1526 T91 = FNMS(KP956940335, T8Y, T8X);
Chris@42 1527 {
Chris@42 1528 E T8M, T8K, T8G, T8u;
Chris@42 1529 T8M = T8I + T8J;
Chris@42 1530 T8K = T8I - T8J;
Chris@42 1531 T8G = T8t - T8a;
Chris@42 1532 T8u = T8a + T8t;
Chris@42 1533 Cr[WS(csr, 13)] = FMA(KP803207531, T8W, T8P);
Chris@42 1534 Cr[WS(csr, 51)] = FNMS(KP803207531, T8W, T8P);
Chris@42 1535 Cr[WS(csr, 29)] = FNMS(KP989176509, T8M, T8L);
Chris@42 1536 Cr[WS(csr, 35)] = FMA(KP989176509, T8M, T8L);
Chris@42 1537 Ci[WS(csi, 61)] = FMS(KP989176509, T8K, T8H);
Chris@42 1538 Ci[WS(csi, 3)] = FMA(KP989176509, T8K, T8H);
Chris@42 1539 Ci[WS(csi, 35)] = FMA(KP989176509, T8G, T8F);
Chris@42 1540 Ci[WS(csi, 29)] = FMS(KP989176509, T8G, T8F);
Chris@42 1541 Cr[WS(csr, 3)] = FMA(KP989176509, T8u, T7R);
Chris@42 1542 Cr[WS(csr, 61)] = FNMS(KP989176509, T8u, T7R);
Chris@42 1543 T94 = T92 - T93;
Chris@42 1544 T96 = T93 + T92;
Chris@42 1545 }
Chris@42 1546 }
Chris@42 1547 Ci[WS(csi, 51)] = FMA(KP803207531, T94, T91);
Chris@42 1548 Ci[WS(csi, 13)] = FMS(KP803207531, T94, T91);
Chris@42 1549 Ci[WS(csi, 45)] = FMS(KP803207531, T90, T8Z);
Chris@42 1550 Ci[WS(csi, 19)] = FMA(KP803207531, T90, T8Z);
Chris@42 1551 }
Chris@42 1552 }
Chris@42 1553 }
Chris@42 1554 }
Chris@42 1555 }
Chris@42 1556 }
Chris@42 1557 }
Chris@42 1558 Cr[WS(csr, 19)] = FMA(KP803207531, T96, T95);
Chris@42 1559 Cr[WS(csr, 45)] = FNMS(KP803207531, T96, T95);
Chris@42 1560 }
Chris@42 1561 }
Chris@42 1562 }
Chris@42 1563
Chris@42 1564 static const kr2c_desc desc = { 128, "r2cf_128", {440, 0, 516, 0}, &GENUS };
Chris@42 1565
Chris@42 1566 void X(codelet_r2cf_128) (planner *p) {
Chris@42 1567 X(kr2c_register) (p, r2cf_128, &desc);
Chris@42 1568 }
Chris@42 1569
Chris@42 1570 #else /* HAVE_FMA */
Chris@42 1571
Chris@42 1572 /* Generated by: ../../../genfft/gen_r2cf.native -compact -variables 4 -pipeline-latency 4 -n 128 -name r2cf_128 -include r2cf.h */
Chris@42 1573
Chris@42 1574 /*
Chris@42 1575 * This function contains 956 FP additions, 330 FP multiplications,
Chris@42 1576 * (or, 812 additions, 186 multiplications, 144 fused multiply/add),
Chris@42 1577 * 186 stack variables, 31 constants, and 256 memory accesses
Chris@42 1578 */
Chris@42 1579 #include "r2cf.h"
Chris@42 1580
Chris@42 1581 static void r2cf_128(R *R0, R *R1, R *Cr, R *Ci, stride rs, stride csr, stride csi, INT v, INT ivs, INT ovs)
Chris@42 1582 {
Chris@42 1583 DK(KP803207531, +0.803207531480644909806676512963141923879569427);
Chris@42 1584 DK(KP595699304, +0.595699304492433343467036528829969889511926338);
Chris@42 1585 DK(KP146730474, +0.146730474455361751658850129646717819706215317);
Chris@42 1586 DK(KP989176509, +0.989176509964780973451673738016243063983689533);
Chris@42 1587 DK(KP740951125, +0.740951125354959091175616897495162729728955309);
Chris@42 1588 DK(KP671558954, +0.671558954847018400625376850427421803228750632);
Chris@42 1589 DK(KP049067674, +0.049067674327418014254954976942682658314745363);
Chris@42 1590 DK(KP998795456, +0.998795456205172392714771604759100694443203615);
Chris@42 1591 DK(KP242980179, +0.242980179903263889948274162077471118320990783);
Chris@42 1592 DK(KP970031253, +0.970031253194543992603984207286100251456865962);
Chris@42 1593 DK(KP514102744, +0.514102744193221726593693838968815772608049120);
Chris@42 1594 DK(KP857728610, +0.857728610000272069902269984284770137042490799);
Chris@42 1595 DK(KP336889853, +0.336889853392220050689253212619147570477766780);
Chris@42 1596 DK(KP941544065, +0.941544065183020778412509402599502357185589796);
Chris@42 1597 DK(KP427555093, +0.427555093430282094320966856888798534304578629);
Chris@42 1598 DK(KP903989293, +0.903989293123443331586200297230537048710132025);
Chris@42 1599 DK(KP098017140, +0.098017140329560601994195563888641845861136673);
Chris@42 1600 DK(KP995184726, +0.995184726672196886244836953109479921575474869);
Chris@42 1601 DK(KP634393284, +0.634393284163645498215171613225493370675687095);
Chris@42 1602 DK(KP773010453, +0.773010453362736960810906609758469800971041293);
Chris@42 1603 DK(KP881921264, +0.881921264348355029712756863660388349508442621);
Chris@42 1604 DK(KP471396736, +0.471396736825997648556387625905254377657460319);
Chris@42 1605 DK(KP956940335, +0.956940335732208864935797886980269969482849206);
Chris@42 1606 DK(KP290284677, +0.290284677254462367636192375817395274691476278);
Chris@42 1607 DK(KP555570233, +0.555570233019602224742830813948532874374937191);
Chris@42 1608 DK(KP831469612, +0.831469612302545237078788377617905756738560812);
Chris@42 1609 DK(KP195090322, +0.195090322016128267848284868477022240927691618);
Chris@42 1610 DK(KP980785280, +0.980785280403230449126182236134239036973933731);
Chris@42 1611 DK(KP382683432, +0.382683432365089771728459984030398866761344562);
Chris@42 1612 DK(KP923879532, +0.923879532511286756128183189396788286822416626);
Chris@42 1613 DK(KP707106781, +0.707106781186547524400844362104849039284835938);
Chris@42 1614 {
Chris@42 1615 INT i;
Chris@42 1616 for (i = v; i > 0; i = i - 1, R0 = R0 + ivs, R1 = R1 + ivs, Cr = Cr + ovs, Ci = Ci + ovs, MAKE_VOLATILE_STRIDE(512, rs), MAKE_VOLATILE_STRIDE(512, csr), MAKE_VOLATILE_STRIDE(512, csi)) {
Chris@42 1617 E TcD, TdU, T27, T7r, T5S, T8y, Tf, Ta5, Tu, Tbq, TcG, TdV, T2e, T8z, T5V;
Chris@42 1618 E T7s, TK, Ta6, TcK, TdX, T2o, T5X, T7w, T8B, TZ, Ta7, TcN, TdY, T2x, T5Y;
Chris@42 1619 E T7z, T8C, T1g, Taa, TcU, TeA, TcX, Tez, T1v, Tab, T2M, T6z, T7E, T9e, T7H;
Chris@42 1620 E T9d, T2T, T6A, T4X, T6L, Tdz, TeL, TdK, TeP, T5G, T6P, T8d, T9p, TaV, Tc3;
Chris@42 1621 E Tbi, Tc4, T8o, T9t, T3I, T6H, Tde, TeH, Tdp, TeF, T4r, T6F, T7U, T9l, Tao;
Chris@42 1622 E TbW, TaL, TbX, T85, T9j, T1L, Tad, Td3, Tew, Td6, Tex, T20, Tae, T37, T6x;
Chris@42 1623 E T7L, T9a, T7O, T9b, T3e, T6w, TbZ, Tc0, T3Z, T4s, Tds, TeI, T4g, T4t, T80;
Chris@42 1624 E T87, Tdl, TeE, T7X, T86, TaD, TaM, Tc6, Tc7, T5e, T5H, TdN, TeM, T5v, T5I;
Chris@42 1625 E T8j, T8q, TdG, TeO, T8g, T8p, Tba, Tbj;
Chris@42 1626 {
Chris@42 1627 E T3, T23, Td, T25, T6, T5R, Ta, T24;
Chris@42 1628 {
Chris@42 1629 E T1, T2, Tb, Tc;
Chris@42 1630 T1 = R0[0];
Chris@42 1631 T2 = R0[WS(rs, 32)];
Chris@42 1632 T3 = T1 + T2;
Chris@42 1633 T23 = T1 - T2;
Chris@42 1634 Tb = R0[WS(rs, 56)];
Chris@42 1635 Tc = R0[WS(rs, 24)];
Chris@42 1636 Td = Tb + Tc;
Chris@42 1637 T25 = Tb - Tc;
Chris@42 1638 }
Chris@42 1639 {
Chris@42 1640 E T4, T5, T8, T9;
Chris@42 1641 T4 = R0[WS(rs, 16)];
Chris@42 1642 T5 = R0[WS(rs, 48)];
Chris@42 1643 T6 = T4 + T5;
Chris@42 1644 T5R = T4 - T5;
Chris@42 1645 T8 = R0[WS(rs, 8)];
Chris@42 1646 T9 = R0[WS(rs, 40)];
Chris@42 1647 Ta = T8 + T9;
Chris@42 1648 T24 = T8 - T9;
Chris@42 1649 }
Chris@42 1650 TcD = T3 - T6;
Chris@42 1651 TdU = Td - Ta;
Chris@42 1652 {
Chris@42 1653 E T26, T5Q, T7, Te;
Chris@42 1654 T26 = KP707106781 * (T24 + T25);
Chris@42 1655 T27 = T23 + T26;
Chris@42 1656 T7r = T23 - T26;
Chris@42 1657 T5Q = KP707106781 * (T25 - T24);
Chris@42 1658 T5S = T5Q - T5R;
Chris@42 1659 T8y = T5R + T5Q;
Chris@42 1660 T7 = T3 + T6;
Chris@42 1661 Te = Ta + Td;
Chris@42 1662 Tf = T7 + Te;
Chris@42 1663 Ta5 = T7 - Te;
Chris@42 1664 }
Chris@42 1665 }
Chris@42 1666 {
Chris@42 1667 E Ti, T28, Ts, T2c, Tl, T29, Tp, T2b;
Chris@42 1668 {
Chris@42 1669 E Tg, Th, Tq, Tr;
Chris@42 1670 Tg = R0[WS(rs, 4)];
Chris@42 1671 Th = R0[WS(rs, 36)];
Chris@42 1672 Ti = Tg + Th;
Chris@42 1673 T28 = Tg - Th;
Chris@42 1674 Tq = R0[WS(rs, 12)];
Chris@42 1675 Tr = R0[WS(rs, 44)];
Chris@42 1676 Ts = Tq + Tr;
Chris@42 1677 T2c = Tq - Tr;
Chris@42 1678 }
Chris@42 1679 {
Chris@42 1680 E Tj, Tk, Tn, To;
Chris@42 1681 Tj = R0[WS(rs, 20)];
Chris@42 1682 Tk = R0[WS(rs, 52)];
Chris@42 1683 Tl = Tj + Tk;
Chris@42 1684 T29 = Tj - Tk;
Chris@42 1685 Tn = R0[WS(rs, 60)];
Chris@42 1686 To = R0[WS(rs, 28)];
Chris@42 1687 Tp = Tn + To;
Chris@42 1688 T2b = Tn - To;
Chris@42 1689 }
Chris@42 1690 {
Chris@42 1691 E Tm, Tt, TcE, TcF;
Chris@42 1692 Tm = Ti + Tl;
Chris@42 1693 Tt = Tp + Ts;
Chris@42 1694 Tu = Tm + Tt;
Chris@42 1695 Tbq = Tt - Tm;
Chris@42 1696 TcE = Ti - Tl;
Chris@42 1697 TcF = Tp - Ts;
Chris@42 1698 TcG = KP707106781 * (TcE + TcF);
Chris@42 1699 TdV = KP707106781 * (TcF - TcE);
Chris@42 1700 }
Chris@42 1701 {
Chris@42 1702 E T2a, T2d, T5T, T5U;
Chris@42 1703 T2a = FNMS(KP382683432, T29, KP923879532 * T28);
Chris@42 1704 T2d = FMA(KP923879532, T2b, KP382683432 * T2c);
Chris@42 1705 T2e = T2a + T2d;
Chris@42 1706 T8z = T2d - T2a;
Chris@42 1707 T5T = FNMS(KP923879532, T2c, KP382683432 * T2b);
Chris@42 1708 T5U = FMA(KP382683432, T28, KP923879532 * T29);
Chris@42 1709 T5V = T5T - T5U;
Chris@42 1710 T7s = T5U + T5T;
Chris@42 1711 }
Chris@42 1712 }
Chris@42 1713 {
Chris@42 1714 E Ty, T2g, TB, T2m, TF, T2l, TI, T2j;
Chris@42 1715 {
Chris@42 1716 E Tw, Tx, Tz, TA;
Chris@42 1717 Tw = R0[WS(rs, 2)];
Chris@42 1718 Tx = R0[WS(rs, 34)];
Chris@42 1719 Ty = Tw + Tx;
Chris@42 1720 T2g = Tw - Tx;
Chris@42 1721 Tz = R0[WS(rs, 18)];
Chris@42 1722 TA = R0[WS(rs, 50)];
Chris@42 1723 TB = Tz + TA;
Chris@42 1724 T2m = Tz - TA;
Chris@42 1725 {
Chris@42 1726 E TD, TE, T2h, TG, TH, T2i;
Chris@42 1727 TD = R0[WS(rs, 10)];
Chris@42 1728 TE = R0[WS(rs, 42)];
Chris@42 1729 T2h = TD - TE;
Chris@42 1730 TG = R0[WS(rs, 58)];
Chris@42 1731 TH = R0[WS(rs, 26)];
Chris@42 1732 T2i = TG - TH;
Chris@42 1733 TF = TD + TE;
Chris@42 1734 T2l = KP707106781 * (T2i - T2h);
Chris@42 1735 TI = TG + TH;
Chris@42 1736 T2j = KP707106781 * (T2h + T2i);
Chris@42 1737 }
Chris@42 1738 }
Chris@42 1739 {
Chris@42 1740 E TC, TJ, TcI, TcJ;
Chris@42 1741 TC = Ty + TB;
Chris@42 1742 TJ = TF + TI;
Chris@42 1743 TK = TC + TJ;
Chris@42 1744 Ta6 = TC - TJ;
Chris@42 1745 TcI = Ty - TB;
Chris@42 1746 TcJ = TI - TF;
Chris@42 1747 TcK = FMA(KP923879532, TcI, KP382683432 * TcJ);
Chris@42 1748 TdX = FNMS(KP382683432, TcI, KP923879532 * TcJ);
Chris@42 1749 }
Chris@42 1750 {
Chris@42 1751 E T2k, T2n, T7u, T7v;
Chris@42 1752 T2k = T2g + T2j;
Chris@42 1753 T2n = T2l - T2m;
Chris@42 1754 T2o = FMA(KP980785280, T2k, KP195090322 * T2n);
Chris@42 1755 T5X = FNMS(KP195090322, T2k, KP980785280 * T2n);
Chris@42 1756 T7u = T2g - T2j;
Chris@42 1757 T7v = T2m + T2l;
Chris@42 1758 T7w = FMA(KP831469612, T7u, KP555570233 * T7v);
Chris@42 1759 T8B = FNMS(KP555570233, T7u, KP831469612 * T7v);
Chris@42 1760 }
Chris@42 1761 }
Chris@42 1762 {
Chris@42 1763 E TN, T2p, TQ, T2v, TU, T2u, TX, T2s;
Chris@42 1764 {
Chris@42 1765 E TL, TM, TO, TP;
Chris@42 1766 TL = R0[WS(rs, 62)];
Chris@42 1767 TM = R0[WS(rs, 30)];
Chris@42 1768 TN = TL + TM;
Chris@42 1769 T2p = TL - TM;
Chris@42 1770 TO = R0[WS(rs, 14)];
Chris@42 1771 TP = R0[WS(rs, 46)];
Chris@42 1772 TQ = TO + TP;
Chris@42 1773 T2v = TO - TP;
Chris@42 1774 {
Chris@42 1775 E TS, TT, T2q, TV, TW, T2r;
Chris@42 1776 TS = R0[WS(rs, 6)];
Chris@42 1777 TT = R0[WS(rs, 38)];
Chris@42 1778 T2q = TS - TT;
Chris@42 1779 TV = R0[WS(rs, 54)];
Chris@42 1780 TW = R0[WS(rs, 22)];
Chris@42 1781 T2r = TV - TW;
Chris@42 1782 TU = TS + TT;
Chris@42 1783 T2u = KP707106781 * (T2r - T2q);
Chris@42 1784 TX = TV + TW;
Chris@42 1785 T2s = KP707106781 * (T2q + T2r);
Chris@42 1786 }
Chris@42 1787 }
Chris@42 1788 {
Chris@42 1789 E TR, TY, TcL, TcM;
Chris@42 1790 TR = TN + TQ;
Chris@42 1791 TY = TU + TX;
Chris@42 1792 TZ = TR + TY;
Chris@42 1793 Ta7 = TR - TY;
Chris@42 1794 TcL = TN - TQ;
Chris@42 1795 TcM = TX - TU;
Chris@42 1796 TcN = FNMS(KP382683432, TcM, KP923879532 * TcL);
Chris@42 1797 TdY = FMA(KP382683432, TcL, KP923879532 * TcM);
Chris@42 1798 }
Chris@42 1799 {
Chris@42 1800 E T2t, T2w, T7x, T7y;
Chris@42 1801 T2t = T2p + T2s;
Chris@42 1802 T2w = T2u - T2v;
Chris@42 1803 T2x = FNMS(KP195090322, T2w, KP980785280 * T2t);
Chris@42 1804 T5Y = FMA(KP195090322, T2t, KP980785280 * T2w);
Chris@42 1805 T7x = T2p - T2s;
Chris@42 1806 T7y = T2v + T2u;
Chris@42 1807 T7z = FNMS(KP555570233, T7y, KP831469612 * T7x);
Chris@42 1808 T8C = FMA(KP555570233, T7x, KP831469612 * T7y);
Chris@42 1809 }
Chris@42 1810 }
Chris@42 1811 {
Chris@42 1812 E T14, T2N, T17, T2D, T1b, T2O, T1e, T2C, T1j, T1m, T2K, TcR, T2Q, T1q, T1t;
Chris@42 1813 E T2H, TcS, T2R;
Chris@42 1814 {
Chris@42 1815 E T12, T13, T15, T16;
Chris@42 1816 T12 = R0[WS(rs, 1)];
Chris@42 1817 T13 = R0[WS(rs, 33)];
Chris@42 1818 T14 = T12 + T13;
Chris@42 1819 T2N = T12 - T13;
Chris@42 1820 T15 = R0[WS(rs, 17)];
Chris@42 1821 T16 = R0[WS(rs, 49)];
Chris@42 1822 T17 = T15 + T16;
Chris@42 1823 T2D = T15 - T16;
Chris@42 1824 }
Chris@42 1825 {
Chris@42 1826 E T19, T1a, T2B, T1c, T1d, T2A;
Chris@42 1827 T19 = R0[WS(rs, 9)];
Chris@42 1828 T1a = R0[WS(rs, 41)];
Chris@42 1829 T2B = T19 - T1a;
Chris@42 1830 T1c = R0[WS(rs, 57)];
Chris@42 1831 T1d = R0[WS(rs, 25)];
Chris@42 1832 T2A = T1c - T1d;
Chris@42 1833 T1b = T19 + T1a;
Chris@42 1834 T2O = KP707106781 * (T2B + T2A);
Chris@42 1835 T1e = T1c + T1d;
Chris@42 1836 T2C = KP707106781 * (T2A - T2B);
Chris@42 1837 }
Chris@42 1838 {
Chris@42 1839 E T2I, T2J, T2F, T2G;
Chris@42 1840 {
Chris@42 1841 E T1h, T1i, T1k, T1l;
Chris@42 1842 T1h = R0[WS(rs, 5)];
Chris@42 1843 T1i = R0[WS(rs, 37)];
Chris@42 1844 T1j = T1h + T1i;
Chris@42 1845 T2I = T1h - T1i;
Chris@42 1846 T1k = R0[WS(rs, 21)];
Chris@42 1847 T1l = R0[WS(rs, 53)];
Chris@42 1848 T1m = T1k + T1l;
Chris@42 1849 T2J = T1k - T1l;
Chris@42 1850 }
Chris@42 1851 T2K = FMA(KP382683432, T2I, KP923879532 * T2J);
Chris@42 1852 TcR = T1j - T1m;
Chris@42 1853 T2Q = FNMS(KP382683432, T2J, KP923879532 * T2I);
Chris@42 1854 {
Chris@42 1855 E T1o, T1p, T1r, T1s;
Chris@42 1856 T1o = R0[WS(rs, 61)];
Chris@42 1857 T1p = R0[WS(rs, 29)];
Chris@42 1858 T1q = T1o + T1p;
Chris@42 1859 T2F = T1o - T1p;
Chris@42 1860 T1r = R0[WS(rs, 13)];
Chris@42 1861 T1s = R0[WS(rs, 45)];
Chris@42 1862 T1t = T1r + T1s;
Chris@42 1863 T2G = T1r - T1s;
Chris@42 1864 }
Chris@42 1865 T2H = FNMS(KP923879532, T2G, KP382683432 * T2F);
Chris@42 1866 TcS = T1q - T1t;
Chris@42 1867 T2R = FMA(KP923879532, T2F, KP382683432 * T2G);
Chris@42 1868 }
Chris@42 1869 {
Chris@42 1870 E T18, T1f, TcQ, TcT;
Chris@42 1871 T18 = T14 + T17;
Chris@42 1872 T1f = T1b + T1e;
Chris@42 1873 T1g = T18 + T1f;
Chris@42 1874 Taa = T18 - T1f;
Chris@42 1875 TcQ = T14 - T17;
Chris@42 1876 TcT = KP707106781 * (TcR + TcS);
Chris@42 1877 TcU = TcQ + TcT;
Chris@42 1878 TeA = TcQ - TcT;
Chris@42 1879 }
Chris@42 1880 {
Chris@42 1881 E TcV, TcW, T1n, T1u;
Chris@42 1882 TcV = T1e - T1b;
Chris@42 1883 TcW = KP707106781 * (TcS - TcR);
Chris@42 1884 TcX = TcV + TcW;
Chris@42 1885 Tez = TcW - TcV;
Chris@42 1886 T1n = T1j + T1m;
Chris@42 1887 T1u = T1q + T1t;
Chris@42 1888 T1v = T1n + T1u;
Chris@42 1889 Tab = T1u - T1n;
Chris@42 1890 }
Chris@42 1891 {
Chris@42 1892 E T2E, T2L, T7C, T7D;
Chris@42 1893 T2E = T2C - T2D;
Chris@42 1894 T2L = T2H - T2K;
Chris@42 1895 T2M = T2E + T2L;
Chris@42 1896 T6z = T2L - T2E;
Chris@42 1897 T7C = T2N - T2O;
Chris@42 1898 T7D = T2K + T2H;
Chris@42 1899 T7E = T7C + T7D;
Chris@42 1900 T9e = T7C - T7D;
Chris@42 1901 }
Chris@42 1902 {
Chris@42 1903 E T7F, T7G, T2P, T2S;
Chris@42 1904 T7F = T2D + T2C;
Chris@42 1905 T7G = T2R - T2Q;
Chris@42 1906 T7H = T7F + T7G;
Chris@42 1907 T9d = T7G - T7F;
Chris@42 1908 T2P = T2N + T2O;
Chris@42 1909 T2S = T2Q + T2R;
Chris@42 1910 T2T = T2P + T2S;
Chris@42 1911 T6A = T2P - T2S;
Chris@42 1912 }
Chris@42 1913 }
Chris@42 1914 {
Chris@42 1915 E T4z, TaP, T5B, TaQ, T4G, TaT, T5y, TaS, Tbf, Tbg, T4O, Tdw, T5E, Tbc, Tbd;
Chris@42 1916 E T4V, Tdx, T5D;
Chris@42 1917 {
Chris@42 1918 E T4x, T4y, T5z, T5A;
Chris@42 1919 T4x = R1[WS(rs, 63)];
Chris@42 1920 T4y = R1[WS(rs, 31)];
Chris@42 1921 T4z = T4x - T4y;
Chris@42 1922 TaP = T4x + T4y;
Chris@42 1923 T5z = R1[WS(rs, 15)];
Chris@42 1924 T5A = R1[WS(rs, 47)];
Chris@42 1925 T5B = T5z - T5A;
Chris@42 1926 TaQ = T5z + T5A;
Chris@42 1927 }
Chris@42 1928 {
Chris@42 1929 E T4A, T4B, T4C, T4D, T4E, T4F;
Chris@42 1930 T4A = R1[WS(rs, 7)];
Chris@42 1931 T4B = R1[WS(rs, 39)];
Chris@42 1932 T4C = T4A - T4B;
Chris@42 1933 T4D = R1[WS(rs, 55)];
Chris@42 1934 T4E = R1[WS(rs, 23)];
Chris@42 1935 T4F = T4D - T4E;
Chris@42 1936 T4G = KP707106781 * (T4C + T4F);
Chris@42 1937 TaT = T4D + T4E;
Chris@42 1938 T5y = KP707106781 * (T4F - T4C);
Chris@42 1939 TaS = T4A + T4B;
Chris@42 1940 }
Chris@42 1941 {
Chris@42 1942 E T4K, T4N, T4R, T4U;
Chris@42 1943 {
Chris@42 1944 E T4I, T4J, T4L, T4M;
Chris@42 1945 T4I = R1[WS(rs, 3)];
Chris@42 1946 T4J = R1[WS(rs, 35)];
Chris@42 1947 T4K = T4I - T4J;
Chris@42 1948 Tbf = T4I + T4J;
Chris@42 1949 T4L = R1[WS(rs, 19)];
Chris@42 1950 T4M = R1[WS(rs, 51)];
Chris@42 1951 T4N = T4L - T4M;
Chris@42 1952 Tbg = T4L + T4M;
Chris@42 1953 }
Chris@42 1954 T4O = FNMS(KP382683432, T4N, KP923879532 * T4K);
Chris@42 1955 Tdw = Tbf - Tbg;
Chris@42 1956 T5E = FMA(KP382683432, T4K, KP923879532 * T4N);
Chris@42 1957 {
Chris@42 1958 E T4P, T4Q, T4S, T4T;
Chris@42 1959 T4P = R1[WS(rs, 59)];
Chris@42 1960 T4Q = R1[WS(rs, 27)];
Chris@42 1961 T4R = T4P - T4Q;
Chris@42 1962 Tbc = T4P + T4Q;
Chris@42 1963 T4S = R1[WS(rs, 11)];
Chris@42 1964 T4T = R1[WS(rs, 43)];
Chris@42 1965 T4U = T4S - T4T;
Chris@42 1966 Tbd = T4S + T4T;
Chris@42 1967 }
Chris@42 1968 T4V = FMA(KP923879532, T4R, KP382683432 * T4U);
Chris@42 1969 Tdx = Tbc - Tbd;
Chris@42 1970 T5D = FNMS(KP923879532, T4U, KP382683432 * T4R);
Chris@42 1971 }
Chris@42 1972 {
Chris@42 1973 E T4H, T4W, Tdv, Tdy;
Chris@42 1974 T4H = T4z + T4G;
Chris@42 1975 T4W = T4O + T4V;
Chris@42 1976 T4X = T4H + T4W;
Chris@42 1977 T6L = T4H - T4W;
Chris@42 1978 Tdv = TaP - TaQ;
Chris@42 1979 Tdy = KP707106781 * (Tdw + Tdx);
Chris@42 1980 Tdz = Tdv + Tdy;
Chris@42 1981 TeL = Tdv - Tdy;
Chris@42 1982 }
Chris@42 1983 {
Chris@42 1984 E TdI, TdJ, T5C, T5F;
Chris@42 1985 TdI = TaT - TaS;
Chris@42 1986 TdJ = KP707106781 * (Tdx - Tdw);
Chris@42 1987 TdK = TdI + TdJ;
Chris@42 1988 TeP = TdJ - TdI;
Chris@42 1989 T5C = T5y - T5B;
Chris@42 1990 T5F = T5D - T5E;
Chris@42 1991 T5G = T5C + T5F;
Chris@42 1992 T6P = T5F - T5C;
Chris@42 1993 }
Chris@42 1994 {
Chris@42 1995 E T8b, T8c, TaR, TaU;
Chris@42 1996 T8b = T4z - T4G;
Chris@42 1997 T8c = T5E + T5D;
Chris@42 1998 T8d = T8b + T8c;
Chris@42 1999 T9p = T8b - T8c;
Chris@42 2000 TaR = TaP + TaQ;
Chris@42 2001 TaU = TaS + TaT;
Chris@42 2002 TaV = TaR - TaU;
Chris@42 2003 Tc3 = TaR + TaU;
Chris@42 2004 }
Chris@42 2005 {
Chris@42 2006 E Tbe, Tbh, T8m, T8n;
Chris@42 2007 Tbe = Tbc + Tbd;
Chris@42 2008 Tbh = Tbf + Tbg;
Chris@42 2009 Tbi = Tbe - Tbh;
Chris@42 2010 Tc4 = Tbh + Tbe;
Chris@42 2011 T8m = T5B + T5y;
Chris@42 2012 T8n = T4V - T4O;
Chris@42 2013 T8o = T8m + T8n;
Chris@42 2014 T9t = T8n - T8m;
Chris@42 2015 }
Chris@42 2016 }
Chris@42 2017 {
Chris@42 2018 E T3k, Tai, T4m, Taj, T3r, Tam, T4j, Tal, TaI, TaJ, T3z, Tdb, T4p, TaF, TaG;
Chris@42 2019 E T3G, Tdc, T4o;
Chris@42 2020 {
Chris@42 2021 E T3i, T3j, T4k, T4l;
Chris@42 2022 T3i = R1[0];
Chris@42 2023 T3j = R1[WS(rs, 32)];
Chris@42 2024 T3k = T3i - T3j;
Chris@42 2025 Tai = T3i + T3j;
Chris@42 2026 T4k = R1[WS(rs, 16)];
Chris@42 2027 T4l = R1[WS(rs, 48)];
Chris@42 2028 T4m = T4k - T4l;
Chris@42 2029 Taj = T4k + T4l;
Chris@42 2030 }
Chris@42 2031 {
Chris@42 2032 E T3l, T3m, T3n, T3o, T3p, T3q;
Chris@42 2033 T3l = R1[WS(rs, 8)];
Chris@42 2034 T3m = R1[WS(rs, 40)];
Chris@42 2035 T3n = T3l - T3m;
Chris@42 2036 T3o = R1[WS(rs, 56)];
Chris@42 2037 T3p = R1[WS(rs, 24)];
Chris@42 2038 T3q = T3o - T3p;
Chris@42 2039 T3r = KP707106781 * (T3n + T3q);
Chris@42 2040 Tam = T3o + T3p;
Chris@42 2041 T4j = KP707106781 * (T3q - T3n);
Chris@42 2042 Tal = T3l + T3m;
Chris@42 2043 }
Chris@42 2044 {
Chris@42 2045 E T3v, T3y, T3C, T3F;
Chris@42 2046 {
Chris@42 2047 E T3t, T3u, T3w, T3x;
Chris@42 2048 T3t = R1[WS(rs, 4)];
Chris@42 2049 T3u = R1[WS(rs, 36)];
Chris@42 2050 T3v = T3t - T3u;
Chris@42 2051 TaI = T3t + T3u;
Chris@42 2052 T3w = R1[WS(rs, 20)];
Chris@42 2053 T3x = R1[WS(rs, 52)];
Chris@42 2054 T3y = T3w - T3x;
Chris@42 2055 TaJ = T3w + T3x;
Chris@42 2056 }
Chris@42 2057 T3z = FNMS(KP382683432, T3y, KP923879532 * T3v);
Chris@42 2058 Tdb = TaI - TaJ;
Chris@42 2059 T4p = FMA(KP382683432, T3v, KP923879532 * T3y);
Chris@42 2060 {
Chris@42 2061 E T3A, T3B, T3D, T3E;
Chris@42 2062 T3A = R1[WS(rs, 60)];
Chris@42 2063 T3B = R1[WS(rs, 28)];
Chris@42 2064 T3C = T3A - T3B;
Chris@42 2065 TaF = T3A + T3B;
Chris@42 2066 T3D = R1[WS(rs, 12)];
Chris@42 2067 T3E = R1[WS(rs, 44)];
Chris@42 2068 T3F = T3D - T3E;
Chris@42 2069 TaG = T3D + T3E;
Chris@42 2070 }
Chris@42 2071 T3G = FMA(KP923879532, T3C, KP382683432 * T3F);
Chris@42 2072 Tdc = TaF - TaG;
Chris@42 2073 T4o = FNMS(KP923879532, T3F, KP382683432 * T3C);
Chris@42 2074 }
Chris@42 2075 {
Chris@42 2076 E T3s, T3H, Tda, Tdd;
Chris@42 2077 T3s = T3k + T3r;
Chris@42 2078 T3H = T3z + T3G;
Chris@42 2079 T3I = T3s + T3H;
Chris@42 2080 T6H = T3s - T3H;
Chris@42 2081 Tda = Tai - Taj;
Chris@42 2082 Tdd = KP707106781 * (Tdb + Tdc);
Chris@42 2083 Tde = Tda + Tdd;
Chris@42 2084 TeH = Tda - Tdd;
Chris@42 2085 }
Chris@42 2086 {
Chris@42 2087 E Tdn, Tdo, T4n, T4q;
Chris@42 2088 Tdn = Tam - Tal;
Chris@42 2089 Tdo = KP707106781 * (Tdc - Tdb);
Chris@42 2090 Tdp = Tdn + Tdo;
Chris@42 2091 TeF = Tdo - Tdn;
Chris@42 2092 T4n = T4j - T4m;
Chris@42 2093 T4q = T4o - T4p;
Chris@42 2094 T4r = T4n + T4q;
Chris@42 2095 T6F = T4q - T4n;
Chris@42 2096 }
Chris@42 2097 {
Chris@42 2098 E T7S, T7T, Tak, Tan;
Chris@42 2099 T7S = T3k - T3r;
Chris@42 2100 T7T = T4p + T4o;
Chris@42 2101 T7U = T7S + T7T;
Chris@42 2102 T9l = T7S - T7T;
Chris@42 2103 Tak = Tai + Taj;
Chris@42 2104 Tan = Tal + Tam;
Chris@42 2105 Tao = Tak - Tan;
Chris@42 2106 TbW = Tak + Tan;
Chris@42 2107 }
Chris@42 2108 {
Chris@42 2109 E TaH, TaK, T83, T84;
Chris@42 2110 TaH = TaF + TaG;
Chris@42 2111 TaK = TaI + TaJ;
Chris@42 2112 TaL = TaH - TaK;
Chris@42 2113 TbX = TaK + TaH;
Chris@42 2114 T83 = T4m + T4j;
Chris@42 2115 T84 = T3G - T3z;
Chris@42 2116 T85 = T83 + T84;
Chris@42 2117 T9j = T84 - T83;
Chris@42 2118 }
Chris@42 2119 }
Chris@42 2120 {
Chris@42 2121 E T1z, T2V, T1C, T39, T1G, T38, T1J, T2Y, T1O, T1R, T32, Td0, T3c, T1V, T1Y;
Chris@42 2122 E T35, Td1, T3b;
Chris@42 2123 {
Chris@42 2124 E T1x, T1y, T1A, T1B;
Chris@42 2125 T1x = R0[WS(rs, 63)];
Chris@42 2126 T1y = R0[WS(rs, 31)];
Chris@42 2127 T1z = T1x + T1y;
Chris@42 2128 T2V = T1x - T1y;
Chris@42 2129 T1A = R0[WS(rs, 15)];
Chris@42 2130 T1B = R0[WS(rs, 47)];
Chris@42 2131 T1C = T1A + T1B;
Chris@42 2132 T39 = T1A - T1B;
Chris@42 2133 }
Chris@42 2134 {
Chris@42 2135 E T1E, T1F, T2W, T1H, T1I, T2X;
Chris@42 2136 T1E = R0[WS(rs, 7)];
Chris@42 2137 T1F = R0[WS(rs, 39)];
Chris@42 2138 T2W = T1E - T1F;
Chris@42 2139 T1H = R0[WS(rs, 55)];
Chris@42 2140 T1I = R0[WS(rs, 23)];
Chris@42 2141 T2X = T1H - T1I;
Chris@42 2142 T1G = T1E + T1F;
Chris@42 2143 T38 = KP707106781 * (T2X - T2W);
Chris@42 2144 T1J = T1H + T1I;
Chris@42 2145 T2Y = KP707106781 * (T2W + T2X);
Chris@42 2146 }
Chris@42 2147 {
Chris@42 2148 E T30, T31, T33, T34;
Chris@42 2149 {
Chris@42 2150 E T1M, T1N, T1P, T1Q;
Chris@42 2151 T1M = R0[WS(rs, 3)];
Chris@42 2152 T1N = R0[WS(rs, 35)];
Chris@42 2153 T1O = T1M + T1N;
Chris@42 2154 T30 = T1M - T1N;
Chris@42 2155 T1P = R0[WS(rs, 19)];
Chris@42 2156 T1Q = R0[WS(rs, 51)];
Chris@42 2157 T1R = T1P + T1Q;
Chris@42 2158 T31 = T1P - T1Q;
Chris@42 2159 }
Chris@42 2160 T32 = FNMS(KP382683432, T31, KP923879532 * T30);
Chris@42 2161 Td0 = T1O - T1R;
Chris@42 2162 T3c = FMA(KP382683432, T30, KP923879532 * T31);
Chris@42 2163 {
Chris@42 2164 E T1T, T1U, T1W, T1X;
Chris@42 2165 T1T = R0[WS(rs, 59)];
Chris@42 2166 T1U = R0[WS(rs, 27)];
Chris@42 2167 T1V = T1T + T1U;
Chris@42 2168 T33 = T1T - T1U;
Chris@42 2169 T1W = R0[WS(rs, 11)];
Chris@42 2170 T1X = R0[WS(rs, 43)];
Chris@42 2171 T1Y = T1W + T1X;
Chris@42 2172 T34 = T1W - T1X;
Chris@42 2173 }
Chris@42 2174 T35 = FMA(KP923879532, T33, KP382683432 * T34);
Chris@42 2175 Td1 = T1V - T1Y;
Chris@42 2176 T3b = FNMS(KP923879532, T34, KP382683432 * T33);
Chris@42 2177 }
Chris@42 2178 {
Chris@42 2179 E T1D, T1K, TcZ, Td2;
Chris@42 2180 T1D = T1z + T1C;
Chris@42 2181 T1K = T1G + T1J;
Chris@42 2182 T1L = T1D + T1K;
Chris@42 2183 Tad = T1D - T1K;
Chris@42 2184 TcZ = T1z - T1C;
Chris@42 2185 Td2 = KP707106781 * (Td0 + Td1);
Chris@42 2186 Td3 = TcZ + Td2;
Chris@42 2187 Tew = TcZ - Td2;
Chris@42 2188 }
Chris@42 2189 {
Chris@42 2190 E Td4, Td5, T1S, T1Z;
Chris@42 2191 Td4 = T1J - T1G;
Chris@42 2192 Td5 = KP707106781 * (Td1 - Td0);
Chris@42 2193 Td6 = Td4 + Td5;
Chris@42 2194 Tex = Td5 - Td4;
Chris@42 2195 T1S = T1O + T1R;
Chris@42 2196 T1Z = T1V + T1Y;
Chris@42 2197 T20 = T1S + T1Z;
Chris@42 2198 Tae = T1Z - T1S;
Chris@42 2199 }
Chris@42 2200 {
Chris@42 2201 E T2Z, T36, T7J, T7K;
Chris@42 2202 T2Z = T2V + T2Y;
Chris@42 2203 T36 = T32 + T35;
Chris@42 2204 T37 = T2Z + T36;
Chris@42 2205 T6x = T2Z - T36;
Chris@42 2206 T7J = T2V - T2Y;
Chris@42 2207 T7K = T3c + T3b;
Chris@42 2208 T7L = T7J + T7K;
Chris@42 2209 T9a = T7J - T7K;
Chris@42 2210 }
Chris@42 2211 {
Chris@42 2212 E T7M, T7N, T3a, T3d;
Chris@42 2213 T7M = T39 + T38;
Chris@42 2214 T7N = T35 - T32;
Chris@42 2215 T7O = T7M + T7N;
Chris@42 2216 T9b = T7N - T7M;
Chris@42 2217 T3a = T38 - T39;
Chris@42 2218 T3d = T3b - T3c;
Chris@42 2219 T3e = T3a + T3d;
Chris@42 2220 T6w = T3d - T3a;
Chris@42 2221 }
Chris@42 2222 }
Chris@42 2223 {
Chris@42 2224 E T3L, Tdf, T3X, Tar, T42, Tdi, T4e, Tay, T3S, Tdg, T3U, Tau, T49, Tdj, T4b;
Chris@42 2225 E TaB, Tdh, Tdk;
Chris@42 2226 {
Chris@42 2227 E T3J, T3K, Tap, T3V, T3W, Taq;
Chris@42 2228 T3J = R1[WS(rs, 2)];
Chris@42 2229 T3K = R1[WS(rs, 34)];
Chris@42 2230 Tap = T3J + T3K;
Chris@42 2231 T3V = R1[WS(rs, 18)];
Chris@42 2232 T3W = R1[WS(rs, 50)];
Chris@42 2233 Taq = T3V + T3W;
Chris@42 2234 T3L = T3J - T3K;
Chris@42 2235 Tdf = Tap - Taq;
Chris@42 2236 T3X = T3V - T3W;
Chris@42 2237 Tar = Tap + Taq;
Chris@42 2238 }
Chris@42 2239 {
Chris@42 2240 E T40, T41, Taw, T4c, T4d, Tax;
Chris@42 2241 T40 = R1[WS(rs, 62)];
Chris@42 2242 T41 = R1[WS(rs, 30)];
Chris@42 2243 Taw = T40 + T41;
Chris@42 2244 T4c = R1[WS(rs, 14)];
Chris@42 2245 T4d = R1[WS(rs, 46)];
Chris@42 2246 Tax = T4c + T4d;
Chris@42 2247 T42 = T40 - T41;
Chris@42 2248 Tdi = Taw - Tax;
Chris@42 2249 T4e = T4c - T4d;
Chris@42 2250 Tay = Taw + Tax;
Chris@42 2251 }
Chris@42 2252 {
Chris@42 2253 E T3O, Tas, T3R, Tat;
Chris@42 2254 {
Chris@42 2255 E T3M, T3N, T3P, T3Q;
Chris@42 2256 T3M = R1[WS(rs, 10)];
Chris@42 2257 T3N = R1[WS(rs, 42)];
Chris@42 2258 T3O = T3M - T3N;
Chris@42 2259 Tas = T3M + T3N;
Chris@42 2260 T3P = R1[WS(rs, 58)];
Chris@42 2261 T3Q = R1[WS(rs, 26)];
Chris@42 2262 T3R = T3P - T3Q;
Chris@42 2263 Tat = T3P + T3Q;
Chris@42 2264 }
Chris@42 2265 T3S = KP707106781 * (T3O + T3R);
Chris@42 2266 Tdg = Tat - Tas;
Chris@42 2267 T3U = KP707106781 * (T3R - T3O);
Chris@42 2268 Tau = Tas + Tat;
Chris@42 2269 }
Chris@42 2270 {
Chris@42 2271 E T45, Taz, T48, TaA;
Chris@42 2272 {
Chris@42 2273 E T43, T44, T46, T47;
Chris@42 2274 T43 = R1[WS(rs, 6)];
Chris@42 2275 T44 = R1[WS(rs, 38)];
Chris@42 2276 T45 = T43 - T44;
Chris@42 2277 Taz = T43 + T44;
Chris@42 2278 T46 = R1[WS(rs, 54)];
Chris@42 2279 T47 = R1[WS(rs, 22)];
Chris@42 2280 T48 = T46 - T47;
Chris@42 2281 TaA = T46 + T47;
Chris@42 2282 }
Chris@42 2283 T49 = KP707106781 * (T45 + T48);
Chris@42 2284 Tdj = TaA - Taz;
Chris@42 2285 T4b = KP707106781 * (T48 - T45);
Chris@42 2286 TaB = Taz + TaA;
Chris@42 2287 }
Chris@42 2288 TbZ = Tar + Tau;
Chris@42 2289 Tc0 = Tay + TaB;
Chris@42 2290 {
Chris@42 2291 E T3T, T3Y, Tdq, Tdr;
Chris@42 2292 T3T = T3L + T3S;
Chris@42 2293 T3Y = T3U - T3X;
Chris@42 2294 T3Z = FMA(KP980785280, T3T, KP195090322 * T3Y);
Chris@42 2295 T4s = FNMS(KP195090322, T3T, KP980785280 * T3Y);
Chris@42 2296 Tdq = FNMS(KP382683432, Tdf, KP923879532 * Tdg);
Chris@42 2297 Tdr = FMA(KP382683432, Tdi, KP923879532 * Tdj);
Chris@42 2298 Tds = Tdq + Tdr;
Chris@42 2299 TeI = Tdr - Tdq;
Chris@42 2300 }
Chris@42 2301 {
Chris@42 2302 E T4a, T4f, T7Y, T7Z;
Chris@42 2303 T4a = T42 + T49;
Chris@42 2304 T4f = T4b - T4e;
Chris@42 2305 T4g = FNMS(KP195090322, T4f, KP980785280 * T4a);
Chris@42 2306 T4t = FMA(KP195090322, T4a, KP980785280 * T4f);
Chris@42 2307 T7Y = T42 - T49;
Chris@42 2308 T7Z = T4e + T4b;
Chris@42 2309 T80 = FNMS(KP555570233, T7Z, KP831469612 * T7Y);
Chris@42 2310 T87 = FMA(KP555570233, T7Y, KP831469612 * T7Z);
Chris@42 2311 }
Chris@42 2312 Tdh = FMA(KP923879532, Tdf, KP382683432 * Tdg);
Chris@42 2313 Tdk = FNMS(KP382683432, Tdj, KP923879532 * Tdi);
Chris@42 2314 Tdl = Tdh + Tdk;
Chris@42 2315 TeE = Tdk - Tdh;
Chris@42 2316 {
Chris@42 2317 E T7V, T7W, Tav, TaC;
Chris@42 2318 T7V = T3L - T3S;
Chris@42 2319 T7W = T3X + T3U;
Chris@42 2320 T7X = FMA(KP831469612, T7V, KP555570233 * T7W);
Chris@42 2321 T86 = FNMS(KP555570233, T7V, KP831469612 * T7W);
Chris@42 2322 Tav = Tar - Tau;
Chris@42 2323 TaC = Tay - TaB;
Chris@42 2324 TaD = KP707106781 * (Tav + TaC);
Chris@42 2325 TaM = KP707106781 * (TaC - Tav);
Chris@42 2326 }
Chris@42 2327 }
Chris@42 2328 {
Chris@42 2329 E T50, TdA, T5c, TaY, T5h, TdD, T5t, Tb5, T57, TdB, T59, Tb1, T5o, TdE, T5q;
Chris@42 2330 E Tb8, TdC, TdF;
Chris@42 2331 {
Chris@42 2332 E T4Y, T4Z, TaW, T5a, T5b, TaX;
Chris@42 2333 T4Y = R1[WS(rs, 1)];
Chris@42 2334 T4Z = R1[WS(rs, 33)];
Chris@42 2335 TaW = T4Y + T4Z;
Chris@42 2336 T5a = R1[WS(rs, 17)];
Chris@42 2337 T5b = R1[WS(rs, 49)];
Chris@42 2338 TaX = T5a + T5b;
Chris@42 2339 T50 = T4Y - T4Z;
Chris@42 2340 TdA = TaW - TaX;
Chris@42 2341 T5c = T5a - T5b;
Chris@42 2342 TaY = TaW + TaX;
Chris@42 2343 }
Chris@42 2344 {
Chris@42 2345 E T5f, T5g, Tb3, T5r, T5s, Tb4;
Chris@42 2346 T5f = R1[WS(rs, 61)];
Chris@42 2347 T5g = R1[WS(rs, 29)];
Chris@42 2348 Tb3 = T5f + T5g;
Chris@42 2349 T5r = R1[WS(rs, 13)];
Chris@42 2350 T5s = R1[WS(rs, 45)];
Chris@42 2351 Tb4 = T5r + T5s;
Chris@42 2352 T5h = T5f - T5g;
Chris@42 2353 TdD = Tb3 - Tb4;
Chris@42 2354 T5t = T5r - T5s;
Chris@42 2355 Tb5 = Tb3 + Tb4;
Chris@42 2356 }
Chris@42 2357 {
Chris@42 2358 E T53, TaZ, T56, Tb0;
Chris@42 2359 {
Chris@42 2360 E T51, T52, T54, T55;
Chris@42 2361 T51 = R1[WS(rs, 9)];
Chris@42 2362 T52 = R1[WS(rs, 41)];
Chris@42 2363 T53 = T51 - T52;
Chris@42 2364 TaZ = T51 + T52;
Chris@42 2365 T54 = R1[WS(rs, 57)];
Chris@42 2366 T55 = R1[WS(rs, 25)];
Chris@42 2367 T56 = T54 - T55;
Chris@42 2368 Tb0 = T54 + T55;
Chris@42 2369 }
Chris@42 2370 T57 = KP707106781 * (T53 + T56);
Chris@42 2371 TdB = Tb0 - TaZ;
Chris@42 2372 T59 = KP707106781 * (T56 - T53);
Chris@42 2373 Tb1 = TaZ + Tb0;
Chris@42 2374 }
Chris@42 2375 {
Chris@42 2376 E T5k, Tb6, T5n, Tb7;
Chris@42 2377 {
Chris@42 2378 E T5i, T5j, T5l, T5m;
Chris@42 2379 T5i = R1[WS(rs, 5)];
Chris@42 2380 T5j = R1[WS(rs, 37)];
Chris@42 2381 T5k = T5i - T5j;
Chris@42 2382 Tb6 = T5i + T5j;
Chris@42 2383 T5l = R1[WS(rs, 53)];
Chris@42 2384 T5m = R1[WS(rs, 21)];
Chris@42 2385 T5n = T5l - T5m;
Chris@42 2386 Tb7 = T5l + T5m;
Chris@42 2387 }
Chris@42 2388 T5o = KP707106781 * (T5k + T5n);
Chris@42 2389 TdE = Tb7 - Tb6;
Chris@42 2390 T5q = KP707106781 * (T5n - T5k);
Chris@42 2391 Tb8 = Tb6 + Tb7;
Chris@42 2392 }
Chris@42 2393 Tc6 = TaY + Tb1;
Chris@42 2394 Tc7 = Tb5 + Tb8;
Chris@42 2395 {
Chris@42 2396 E T58, T5d, TdL, TdM;
Chris@42 2397 T58 = T50 + T57;
Chris@42 2398 T5d = T59 - T5c;
Chris@42 2399 T5e = FMA(KP980785280, T58, KP195090322 * T5d);
Chris@42 2400 T5H = FNMS(KP195090322, T58, KP980785280 * T5d);
Chris@42 2401 TdL = FNMS(KP382683432, TdA, KP923879532 * TdB);
Chris@42 2402 TdM = FMA(KP382683432, TdD, KP923879532 * TdE);
Chris@42 2403 TdN = TdL + TdM;
Chris@42 2404 TeM = TdM - TdL;
Chris@42 2405 }
Chris@42 2406 {
Chris@42 2407 E T5p, T5u, T8h, T8i;
Chris@42 2408 T5p = T5h + T5o;
Chris@42 2409 T5u = T5q - T5t;
Chris@42 2410 T5v = FNMS(KP195090322, T5u, KP980785280 * T5p);
Chris@42 2411 T5I = FMA(KP195090322, T5p, KP980785280 * T5u);
Chris@42 2412 T8h = T5h - T5o;
Chris@42 2413 T8i = T5t + T5q;
Chris@42 2414 T8j = FNMS(KP555570233, T8i, KP831469612 * T8h);
Chris@42 2415 T8q = FMA(KP555570233, T8h, KP831469612 * T8i);
Chris@42 2416 }
Chris@42 2417 TdC = FMA(KP923879532, TdA, KP382683432 * TdB);
Chris@42 2418 TdF = FNMS(KP382683432, TdE, KP923879532 * TdD);
Chris@42 2419 TdG = TdC + TdF;
Chris@42 2420 TeO = TdF - TdC;
Chris@42 2421 {
Chris@42 2422 E T8e, T8f, Tb2, Tb9;
Chris@42 2423 T8e = T50 - T57;
Chris@42 2424 T8f = T5c + T59;
Chris@42 2425 T8g = FMA(KP831469612, T8e, KP555570233 * T8f);
Chris@42 2426 T8p = FNMS(KP555570233, T8e, KP831469612 * T8f);
Chris@42 2427 Tb2 = TaY - Tb1;
Chris@42 2428 Tb9 = Tb5 - Tb8;
Chris@42 2429 Tba = KP707106781 * (Tb2 + Tb9);
Chris@42 2430 Tbj = KP707106781 * (Tb9 - Tb2);
Chris@42 2431 }
Chris@42 2432 }
Chris@42 2433 {
Chris@42 2434 E T11, TbV, Tc9, Tcf, T22, Tcb, Tc2, Tce;
Chris@42 2435 {
Chris@42 2436 E Tv, T10, Tc5, Tc8;
Chris@42 2437 Tv = Tf + Tu;
Chris@42 2438 T10 = TK + TZ;
Chris@42 2439 T11 = Tv + T10;
Chris@42 2440 TbV = Tv - T10;
Chris@42 2441 Tc5 = Tc3 + Tc4;
Chris@42 2442 Tc8 = Tc6 + Tc7;
Chris@42 2443 Tc9 = Tc5 - Tc8;
Chris@42 2444 Tcf = Tc5 + Tc8;
Chris@42 2445 }
Chris@42 2446 {
Chris@42 2447 E T1w, T21, TbY, Tc1;
Chris@42 2448 T1w = T1g + T1v;
Chris@42 2449 T21 = T1L + T20;
Chris@42 2450 T22 = T1w + T21;
Chris@42 2451 Tcb = T21 - T1w;
Chris@42 2452 TbY = TbW + TbX;
Chris@42 2453 Tc1 = TbZ + Tc0;
Chris@42 2454 Tc2 = TbY - Tc1;
Chris@42 2455 Tce = TbY + Tc1;
Chris@42 2456 }
Chris@42 2457 Cr[WS(csr, 32)] = T11 - T22;
Chris@42 2458 Ci[WS(csi, 32)] = Tcf - Tce;
Chris@42 2459 {
Chris@42 2460 E Tca, Tcc, Tcd, Tcg;
Chris@42 2461 Tca = KP707106781 * (Tc2 + Tc9);
Chris@42 2462 Cr[WS(csr, 48)] = TbV - Tca;
Chris@42 2463 Cr[WS(csr, 16)] = TbV + Tca;
Chris@42 2464 Tcc = KP707106781 * (Tc9 - Tc2);
Chris@42 2465 Ci[WS(csi, 16)] = Tcb + Tcc;
Chris@42 2466 Ci[WS(csi, 48)] = Tcc - Tcb;
Chris@42 2467 Tcd = T11 + T22;
Chris@42 2468 Tcg = Tce + Tcf;
Chris@42 2469 Cr[WS(csr, 64)] = Tcd - Tcg;
Chris@42 2470 Cr[0] = Tcd + Tcg;
Chris@42 2471 }
Chris@42 2472 }
Chris@42 2473 {
Chris@42 2474 E Tch, Tcu, Tck, Tct, Tco, Tcy, Tcr, Tcz, Tci, Tcj;
Chris@42 2475 Tch = Tf - Tu;
Chris@42 2476 Tcu = TZ - TK;
Chris@42 2477 Tci = T1g - T1v;
Chris@42 2478 Tcj = T1L - T20;
Chris@42 2479 Tck = KP707106781 * (Tci + Tcj);
Chris@42 2480 Tct = KP707106781 * (Tcj - Tci);
Chris@42 2481 {
Chris@42 2482 E Tcm, Tcn, Tcp, Tcq;
Chris@42 2483 Tcm = TbW - TbX;
Chris@42 2484 Tcn = Tc0 - TbZ;
Chris@42 2485 Tco = FMA(KP923879532, Tcm, KP382683432 * Tcn);
Chris@42 2486 Tcy = FNMS(KP382683432, Tcm, KP923879532 * Tcn);
Chris@42 2487 Tcp = Tc3 - Tc4;
Chris@42 2488 Tcq = Tc7 - Tc6;
Chris@42 2489 Tcr = FNMS(KP382683432, Tcq, KP923879532 * Tcp);
Chris@42 2490 Tcz = FMA(KP382683432, Tcp, KP923879532 * Tcq);
Chris@42 2491 }
Chris@42 2492 {
Chris@42 2493 E Tcl, Tcs, Tcx, TcA;
Chris@42 2494 Tcl = Tch + Tck;
Chris@42 2495 Tcs = Tco + Tcr;
Chris@42 2496 Cr[WS(csr, 56)] = Tcl - Tcs;
Chris@42 2497 Cr[WS(csr, 8)] = Tcl + Tcs;
Chris@42 2498 Tcx = Tcu + Tct;
Chris@42 2499 TcA = Tcy + Tcz;
Chris@42 2500 Ci[WS(csi, 8)] = Tcx + TcA;
Chris@42 2501 Ci[WS(csi, 56)] = TcA - Tcx;
Chris@42 2502 }
Chris@42 2503 {
Chris@42 2504 E Tcv, Tcw, TcB, TcC;
Chris@42 2505 Tcv = Tct - Tcu;
Chris@42 2506 Tcw = Tcr - Tco;
Chris@42 2507 Ci[WS(csi, 24)] = Tcv + Tcw;
Chris@42 2508 Ci[WS(csi, 40)] = Tcw - Tcv;
Chris@42 2509 TcB = Tch - Tck;
Chris@42 2510 TcC = Tcz - Tcy;
Chris@42 2511 Cr[WS(csr, 40)] = TcB - TcC;
Chris@42 2512 Cr[WS(csr, 24)] = TcB + TcC;
Chris@42 2513 }
Chris@42 2514 }
Chris@42 2515 {
Chris@42 2516 E Ta9, TbB, Tbs, TbM, Tag, TbL, TbJ, TbR, TaO, Tbw, Tbp, TbC, TbG, TbQ, Tbl;
Chris@42 2517 E Tbx, Ta8, Tbr;
Chris@42 2518 Ta8 = KP707106781 * (Ta6 + Ta7);
Chris@42 2519 Ta9 = Ta5 + Ta8;
Chris@42 2520 TbB = Ta5 - Ta8;
Chris@42 2521 Tbr = KP707106781 * (Ta7 - Ta6);
Chris@42 2522 Tbs = Tbq + Tbr;
Chris@42 2523 TbM = Tbr - Tbq;
Chris@42 2524 {
Chris@42 2525 E Tac, Taf, TbH, TbI;
Chris@42 2526 Tac = FMA(KP923879532, Taa, KP382683432 * Tab);
Chris@42 2527 Taf = FNMS(KP382683432, Tae, KP923879532 * Tad);
Chris@42 2528 Tag = Tac + Taf;
Chris@42 2529 TbL = Taf - Tac;
Chris@42 2530 TbH = TaV - Tba;
Chris@42 2531 TbI = Tbj - Tbi;
Chris@42 2532 TbJ = FNMS(KP555570233, TbI, KP831469612 * TbH);
Chris@42 2533 TbR = FMA(KP555570233, TbH, KP831469612 * TbI);
Chris@42 2534 }
Chris@42 2535 {
Chris@42 2536 E TaE, TaN, Tbn, Tbo;
Chris@42 2537 TaE = Tao + TaD;
Chris@42 2538 TaN = TaL + TaM;
Chris@42 2539 TaO = FMA(KP980785280, TaE, KP195090322 * TaN);
Chris@42 2540 Tbw = FNMS(KP195090322, TaE, KP980785280 * TaN);
Chris@42 2541 Tbn = FNMS(KP382683432, Taa, KP923879532 * Tab);
Chris@42 2542 Tbo = FMA(KP382683432, Tad, KP923879532 * Tae);
Chris@42 2543 Tbp = Tbn + Tbo;
Chris@42 2544 TbC = Tbo - Tbn;
Chris@42 2545 }
Chris@42 2546 {
Chris@42 2547 E TbE, TbF, Tbb, Tbk;
Chris@42 2548 TbE = Tao - TaD;
Chris@42 2549 TbF = TaM - TaL;
Chris@42 2550 TbG = FMA(KP831469612, TbE, KP555570233 * TbF);
Chris@42 2551 TbQ = FNMS(KP555570233, TbE, KP831469612 * TbF);
Chris@42 2552 Tbb = TaV + Tba;
Chris@42 2553 Tbk = Tbi + Tbj;
Chris@42 2554 Tbl = FNMS(KP195090322, Tbk, KP980785280 * Tbb);
Chris@42 2555 Tbx = FMA(KP195090322, Tbb, KP980785280 * Tbk);
Chris@42 2556 }
Chris@42 2557 {
Chris@42 2558 E Tah, Tbm, Tbv, Tby;
Chris@42 2559 Tah = Ta9 + Tag;
Chris@42 2560 Tbm = TaO + Tbl;
Chris@42 2561 Cr[WS(csr, 60)] = Tah - Tbm;
Chris@42 2562 Cr[WS(csr, 4)] = Tah + Tbm;
Chris@42 2563 Tbv = Tbs + Tbp;
Chris@42 2564 Tby = Tbw + Tbx;
Chris@42 2565 Ci[WS(csi, 4)] = Tbv + Tby;
Chris@42 2566 Ci[WS(csi, 60)] = Tby - Tbv;
Chris@42 2567 }
Chris@42 2568 {
Chris@42 2569 E Tbt, Tbu, Tbz, TbA;
Chris@42 2570 Tbt = Tbp - Tbs;
Chris@42 2571 Tbu = Tbl - TaO;
Chris@42 2572 Ci[WS(csi, 28)] = Tbt + Tbu;
Chris@42 2573 Ci[WS(csi, 36)] = Tbu - Tbt;
Chris@42 2574 Tbz = Ta9 - Tag;
Chris@42 2575 TbA = Tbx - Tbw;
Chris@42 2576 Cr[WS(csr, 36)] = Tbz - TbA;
Chris@42 2577 Cr[WS(csr, 28)] = Tbz + TbA;
Chris@42 2578 }
Chris@42 2579 {
Chris@42 2580 E TbD, TbK, TbP, TbS;
Chris@42 2581 TbD = TbB + TbC;
Chris@42 2582 TbK = TbG + TbJ;
Chris@42 2583 Cr[WS(csr, 52)] = TbD - TbK;
Chris@42 2584 Cr[WS(csr, 12)] = TbD + TbK;
Chris@42 2585 TbP = TbM + TbL;
Chris@42 2586 TbS = TbQ + TbR;
Chris@42 2587 Ci[WS(csi, 12)] = TbP + TbS;
Chris@42 2588 Ci[WS(csi, 52)] = TbS - TbP;
Chris@42 2589 }
Chris@42 2590 {
Chris@42 2591 E TbN, TbO, TbT, TbU;
Chris@42 2592 TbN = TbL - TbM;
Chris@42 2593 TbO = TbJ - TbG;
Chris@42 2594 Ci[WS(csi, 20)] = TbN + TbO;
Chris@42 2595 Ci[WS(csi, 44)] = TbO - TbN;
Chris@42 2596 TbT = TbB - TbC;
Chris@42 2597 TbU = TbR - TbQ;
Chris@42 2598 Cr[WS(csr, 44)] = TbT - TbU;
Chris@42 2599 Cr[WS(csr, 20)] = TbT + TbU;
Chris@42 2600 }
Chris@42 2601 }
Chris@42 2602 {
Chris@42 2603 E Tev, Tf7, Tfc, Tfm, Tff, Tfn, TeC, Tfh, TeK, Tf2, TeV, Tf8, TeY, Tfi, TeR;
Chris@42 2604 E Tf3;
Chris@42 2605 {
Chris@42 2606 E Tet, Teu, Tfa, Tfb;
Chris@42 2607 Tet = TcD - TcG;
Chris@42 2608 Teu = TdY - TdX;
Chris@42 2609 Tev = Tet - Teu;
Chris@42 2610 Tf7 = Tet + Teu;
Chris@42 2611 Tfa = TeF + TeE;
Chris@42 2612 Tfb = TeH + TeI;
Chris@42 2613 Tfc = FMA(KP290284677, Tfa, KP956940335 * Tfb);
Chris@42 2614 Tfm = FNMS(KP290284677, Tfb, KP956940335 * Tfa);
Chris@42 2615 }
Chris@42 2616 {
Chris@42 2617 E Tfd, Tfe, Tey, TeB;
Chris@42 2618 Tfd = TeL + TeM;
Chris@42 2619 Tfe = TeP + TeO;
Chris@42 2620 Tff = FNMS(KP290284677, Tfe, KP956940335 * Tfd);
Chris@42 2621 Tfn = FMA(KP956940335, Tfe, KP290284677 * Tfd);
Chris@42 2622 Tey = FMA(KP555570233, Tew, KP831469612 * Tex);
Chris@42 2623 TeB = FNMS(KP555570233, TeA, KP831469612 * Tez);
Chris@42 2624 TeC = Tey - TeB;
Chris@42 2625 Tfh = TeB + Tey;
Chris@42 2626 }
Chris@42 2627 {
Chris@42 2628 E TeG, TeJ, TeT, TeU;
Chris@42 2629 TeG = TeE - TeF;
Chris@42 2630 TeJ = TeH - TeI;
Chris@42 2631 TeK = FMA(KP471396736, TeG, KP881921264 * TeJ);
Chris@42 2632 Tf2 = FNMS(KP471396736, TeJ, KP881921264 * TeG);
Chris@42 2633 TeT = FNMS(KP555570233, Tex, KP831469612 * Tew);
Chris@42 2634 TeU = FMA(KP831469612, TeA, KP555570233 * Tez);
Chris@42 2635 TeV = TeT - TeU;
Chris@42 2636 Tf8 = TeU + TeT;
Chris@42 2637 }
Chris@42 2638 {
Chris@42 2639 E TeW, TeX, TeN, TeQ;
Chris@42 2640 TeW = TcN - TcK;
Chris@42 2641 TeX = TdV - TdU;
Chris@42 2642 TeY = TeW - TeX;
Chris@42 2643 Tfi = TeX + TeW;
Chris@42 2644 TeN = TeL - TeM;
Chris@42 2645 TeQ = TeO - TeP;
Chris@42 2646 TeR = FNMS(KP471396736, TeQ, KP881921264 * TeN);
Chris@42 2647 Tf3 = FMA(KP881921264, TeQ, KP471396736 * TeN);
Chris@42 2648 }
Chris@42 2649 {
Chris@42 2650 E TeD, TeS, Tf1, Tf4;
Chris@42 2651 TeD = Tev + TeC;
Chris@42 2652 TeS = TeK + TeR;
Chris@42 2653 Cr[WS(csr, 54)] = TeD - TeS;
Chris@42 2654 Cr[WS(csr, 10)] = TeD + TeS;
Chris@42 2655 Tf1 = TeY + TeV;
Chris@42 2656 Tf4 = Tf2 + Tf3;
Chris@42 2657 Ci[WS(csi, 10)] = Tf1 + Tf4;
Chris@42 2658 Ci[WS(csi, 54)] = Tf4 - Tf1;
Chris@42 2659 }
Chris@42 2660 {
Chris@42 2661 E TeZ, Tf0, Tf5, Tf6;
Chris@42 2662 TeZ = TeV - TeY;
Chris@42 2663 Tf0 = TeR - TeK;
Chris@42 2664 Ci[WS(csi, 22)] = TeZ + Tf0;
Chris@42 2665 Ci[WS(csi, 42)] = Tf0 - TeZ;
Chris@42 2666 Tf5 = Tev - TeC;
Chris@42 2667 Tf6 = Tf3 - Tf2;
Chris@42 2668 Cr[WS(csr, 42)] = Tf5 - Tf6;
Chris@42 2669 Cr[WS(csr, 22)] = Tf5 + Tf6;
Chris@42 2670 }
Chris@42 2671 {
Chris@42 2672 E Tf9, Tfg, Tfl, Tfo;
Chris@42 2673 Tf9 = Tf7 + Tf8;
Chris@42 2674 Tfg = Tfc + Tff;
Chris@42 2675 Cr[WS(csr, 58)] = Tf9 - Tfg;
Chris@42 2676 Cr[WS(csr, 6)] = Tf9 + Tfg;
Chris@42 2677 Tfl = Tfi + Tfh;
Chris@42 2678 Tfo = Tfm + Tfn;
Chris@42 2679 Ci[WS(csi, 6)] = Tfl + Tfo;
Chris@42 2680 Ci[WS(csi, 58)] = Tfo - Tfl;
Chris@42 2681 }
Chris@42 2682 {
Chris@42 2683 E Tfj, Tfk, Tfp, Tfq;
Chris@42 2684 Tfj = Tfh - Tfi;
Chris@42 2685 Tfk = Tff - Tfc;
Chris@42 2686 Ci[WS(csi, 26)] = Tfj + Tfk;
Chris@42 2687 Ci[WS(csi, 38)] = Tfk - Tfj;
Chris@42 2688 Tfp = Tf7 - Tf8;
Chris@42 2689 Tfq = Tfn - Tfm;
Chris@42 2690 Cr[WS(csr, 38)] = Tfp - Tfq;
Chris@42 2691 Cr[WS(csr, 26)] = Tfp + Tfq;
Chris@42 2692 }
Chris@42 2693 }
Chris@42 2694 {
Chris@42 2695 E TcP, Te9, Tee, Teo, Teh, Tep, Td8, Tej, Tdu, Te4, TdT, Tea, Te0, Tek, TdP;
Chris@42 2696 E Te5;
Chris@42 2697 {
Chris@42 2698 E TcH, TcO, Tec, Ted;
Chris@42 2699 TcH = TcD + TcG;
Chris@42 2700 TcO = TcK + TcN;
Chris@42 2701 TcP = TcH + TcO;
Chris@42 2702 Te9 = TcH - TcO;
Chris@42 2703 Tec = Tde - Tdl;
Chris@42 2704 Ted = Tds - Tdp;
Chris@42 2705 Tee = FMA(KP773010453, Tec, KP634393284 * Ted);
Chris@42 2706 Teo = FNMS(KP634393284, Tec, KP773010453 * Ted);
Chris@42 2707 }
Chris@42 2708 {
Chris@42 2709 E Tef, Teg, TcY, Td7;
Chris@42 2710 Tef = Tdz - TdG;
Chris@42 2711 Teg = TdN - TdK;
Chris@42 2712 Teh = FNMS(KP634393284, Teg, KP773010453 * Tef);
Chris@42 2713 Tep = FMA(KP634393284, Tef, KP773010453 * Teg);
Chris@42 2714 TcY = FMA(KP980785280, TcU, KP195090322 * TcX);
Chris@42 2715 Td7 = FNMS(KP195090322, Td6, KP980785280 * Td3);
Chris@42 2716 Td8 = TcY + Td7;
Chris@42 2717 Tej = Td7 - TcY;
Chris@42 2718 }
Chris@42 2719 {
Chris@42 2720 E Tdm, Tdt, TdR, TdS;
Chris@42 2721 Tdm = Tde + Tdl;
Chris@42 2722 Tdt = Tdp + Tds;
Chris@42 2723 Tdu = FMA(KP995184726, Tdm, KP098017140 * Tdt);
Chris@42 2724 Te4 = FNMS(KP098017140, Tdm, KP995184726 * Tdt);
Chris@42 2725 TdR = FNMS(KP195090322, TcU, KP980785280 * TcX);
Chris@42 2726 TdS = FMA(KP195090322, Td3, KP980785280 * Td6);
Chris@42 2727 TdT = TdR + TdS;
Chris@42 2728 Tea = TdS - TdR;
Chris@42 2729 }
Chris@42 2730 {
Chris@42 2731 E TdW, TdZ, TdH, TdO;
Chris@42 2732 TdW = TdU + TdV;
Chris@42 2733 TdZ = TdX + TdY;
Chris@42 2734 Te0 = TdW + TdZ;
Chris@42 2735 Tek = TdZ - TdW;
Chris@42 2736 TdH = Tdz + TdG;
Chris@42 2737 TdO = TdK + TdN;
Chris@42 2738 TdP = FNMS(KP098017140, TdO, KP995184726 * TdH);
Chris@42 2739 Te5 = FMA(KP098017140, TdH, KP995184726 * TdO);
Chris@42 2740 }
Chris@42 2741 {
Chris@42 2742 E Td9, TdQ, Te3, Te6;
Chris@42 2743 Td9 = TcP + Td8;
Chris@42 2744 TdQ = Tdu + TdP;
Chris@42 2745 Cr[WS(csr, 62)] = Td9 - TdQ;
Chris@42 2746 Cr[WS(csr, 2)] = Td9 + TdQ;
Chris@42 2747 Te3 = Te0 + TdT;
Chris@42 2748 Te6 = Te4 + Te5;
Chris@42 2749 Ci[WS(csi, 2)] = Te3 + Te6;
Chris@42 2750 Ci[WS(csi, 62)] = Te6 - Te3;
Chris@42 2751 }
Chris@42 2752 {
Chris@42 2753 E Te1, Te2, Te7, Te8;
Chris@42 2754 Te1 = TdT - Te0;
Chris@42 2755 Te2 = TdP - Tdu;
Chris@42 2756 Ci[WS(csi, 30)] = Te1 + Te2;
Chris@42 2757 Ci[WS(csi, 34)] = Te2 - Te1;
Chris@42 2758 Te7 = TcP - Td8;
Chris@42 2759 Te8 = Te5 - Te4;
Chris@42 2760 Cr[WS(csr, 34)] = Te7 - Te8;
Chris@42 2761 Cr[WS(csr, 30)] = Te7 + Te8;
Chris@42 2762 }
Chris@42 2763 {
Chris@42 2764 E Teb, Tei, Ten, Teq;
Chris@42 2765 Teb = Te9 + Tea;
Chris@42 2766 Tei = Tee + Teh;
Chris@42 2767 Cr[WS(csr, 50)] = Teb - Tei;
Chris@42 2768 Cr[WS(csr, 14)] = Teb + Tei;
Chris@42 2769 Ten = Tek + Tej;
Chris@42 2770 Teq = Teo + Tep;
Chris@42 2771 Ci[WS(csi, 14)] = Ten + Teq;
Chris@42 2772 Ci[WS(csi, 50)] = Teq - Ten;
Chris@42 2773 }
Chris@42 2774 {
Chris@42 2775 E Tel, Tem, Ter, Tes;
Chris@42 2776 Tel = Tej - Tek;
Chris@42 2777 Tem = Teh - Tee;
Chris@42 2778 Ci[WS(csi, 18)] = Tel + Tem;
Chris@42 2779 Ci[WS(csi, 46)] = Tem - Tel;
Chris@42 2780 Ter = Te9 - Tea;
Chris@42 2781 Tes = Tep - Teo;
Chris@42 2782 Cr[WS(csr, 46)] = Ter - Tes;
Chris@42 2783 Cr[WS(csr, 18)] = Ter + Tes;
Chris@42 2784 }
Chris@42 2785 }
Chris@42 2786 {
Chris@42 2787 E T6v, T77, T6C, T7h, T6Y, T7i, T6V, T78, T6R, T7n, T73, T7f, T6K, T7m, T72;
Chris@42 2788 E T7c;
Chris@42 2789 {
Chris@42 2790 E T6t, T6u, T6T, T6U;
Chris@42 2791 T6t = T27 - T2e;
Chris@42 2792 T6u = T5Y - T5X;
Chris@42 2793 T6v = T6t - T6u;
Chris@42 2794 T77 = T6t + T6u;
Chris@42 2795 {
Chris@42 2796 E T6y, T6B, T6W, T6X;
Chris@42 2797 T6y = FMA(KP773010453, T6w, KP634393284 * T6x);
Chris@42 2798 T6B = FNMS(KP634393284, T6A, KP773010453 * T6z);
Chris@42 2799 T6C = T6y - T6B;
Chris@42 2800 T7h = T6B + T6y;
Chris@42 2801 T6W = T2x - T2o;
Chris@42 2802 T6X = T5V - T5S;
Chris@42 2803 T6Y = T6W - T6X;
Chris@42 2804 T7i = T6X + T6W;
Chris@42 2805 }
Chris@42 2806 T6T = FNMS(KP634393284, T6w, KP773010453 * T6x);
Chris@42 2807 T6U = FMA(KP634393284, T6z, KP773010453 * T6A);
Chris@42 2808 T6V = T6T - T6U;
Chris@42 2809 T78 = T6U + T6T;
Chris@42 2810 {
Chris@42 2811 E T6N, T7d, T6Q, T7e, T6M, T6O;
Chris@42 2812 T6M = T5I - T5H;
Chris@42 2813 T6N = T6L - T6M;
Chris@42 2814 T7d = T6L + T6M;
Chris@42 2815 T6O = T5v - T5e;
Chris@42 2816 T6Q = T6O - T6P;
Chris@42 2817 T7e = T6P + T6O;
Chris@42 2818 T6R = FNMS(KP427555093, T6Q, KP903989293 * T6N);
Chris@42 2819 T7n = FMA(KP941544065, T7e, KP336889853 * T7d);
Chris@42 2820 T73 = FMA(KP903989293, T6Q, KP427555093 * T6N);
Chris@42 2821 T7f = FNMS(KP336889853, T7e, KP941544065 * T7d);
Chris@42 2822 }
Chris@42 2823 {
Chris@42 2824 E T6G, T7a, T6J, T7b, T6E, T6I;
Chris@42 2825 T6E = T4g - T3Z;
Chris@42 2826 T6G = T6E - T6F;
Chris@42 2827 T7a = T6F + T6E;
Chris@42 2828 T6I = T4t - T4s;
Chris@42 2829 T6J = T6H - T6I;
Chris@42 2830 T7b = T6H + T6I;
Chris@42 2831 T6K = FMA(KP427555093, T6G, KP903989293 * T6J);
Chris@42 2832 T7m = FNMS(KP336889853, T7b, KP941544065 * T7a);
Chris@42 2833 T72 = FNMS(KP427555093, T6J, KP903989293 * T6G);
Chris@42 2834 T7c = FMA(KP336889853, T7a, KP941544065 * T7b);
Chris@42 2835 }
Chris@42 2836 }
Chris@42 2837 {
Chris@42 2838 E T6D, T6S, T71, T74;
Chris@42 2839 T6D = T6v + T6C;
Chris@42 2840 T6S = T6K + T6R;
Chris@42 2841 Cr[WS(csr, 55)] = T6D - T6S;
Chris@42 2842 Cr[WS(csr, 9)] = T6D + T6S;
Chris@42 2843 T71 = T6Y + T6V;
Chris@42 2844 T74 = T72 + T73;
Chris@42 2845 Ci[WS(csi, 9)] = T71 + T74;
Chris@42 2846 Ci[WS(csi, 55)] = T74 - T71;
Chris@42 2847 }
Chris@42 2848 {
Chris@42 2849 E T6Z, T70, T75, T76;
Chris@42 2850 T6Z = T6V - T6Y;
Chris@42 2851 T70 = T6R - T6K;
Chris@42 2852 Ci[WS(csi, 23)] = T6Z + T70;
Chris@42 2853 Ci[WS(csi, 41)] = T70 - T6Z;
Chris@42 2854 T75 = T6v - T6C;
Chris@42 2855 T76 = T73 - T72;
Chris@42 2856 Cr[WS(csr, 41)] = T75 - T76;
Chris@42 2857 Cr[WS(csr, 23)] = T75 + T76;
Chris@42 2858 }
Chris@42 2859 {
Chris@42 2860 E T79, T7g, T7l, T7o;
Chris@42 2861 T79 = T77 + T78;
Chris@42 2862 T7g = T7c + T7f;
Chris@42 2863 Cr[WS(csr, 57)] = T79 - T7g;
Chris@42 2864 Cr[WS(csr, 7)] = T79 + T7g;
Chris@42 2865 T7l = T7i + T7h;
Chris@42 2866 T7o = T7m + T7n;
Chris@42 2867 Ci[WS(csi, 7)] = T7l + T7o;
Chris@42 2868 Ci[WS(csi, 57)] = T7o - T7l;
Chris@42 2869 }
Chris@42 2870 {
Chris@42 2871 E T7j, T7k, T7p, T7q;
Chris@42 2872 T7j = T7h - T7i;
Chris@42 2873 T7k = T7f - T7c;
Chris@42 2874 Ci[WS(csi, 25)] = T7j + T7k;
Chris@42 2875 Ci[WS(csi, 39)] = T7k - T7j;
Chris@42 2876 T7p = T77 - T78;
Chris@42 2877 T7q = T7n - T7m;
Chris@42 2878 Cr[WS(csr, 39)] = T7p - T7q;
Chris@42 2879 Cr[WS(csr, 25)] = T7p + T7q;
Chris@42 2880 }
Chris@42 2881 }
Chris@42 2882 {
Chris@42 2883 E T99, T9L, T9g, T9V, T9C, T9W, T9z, T9M, T9v, Ta1, T9H, T9T, T9o, Ta0, T9G;
Chris@42 2884 E T9Q;
Chris@42 2885 {
Chris@42 2886 E T97, T98, T9x, T9y;
Chris@42 2887 T97 = T7r - T7s;
Chris@42 2888 T98 = T8C - T8B;
Chris@42 2889 T99 = T97 - T98;
Chris@42 2890 T9L = T97 + T98;
Chris@42 2891 {
Chris@42 2892 E T9c, T9f, T9A, T9B;
Chris@42 2893 T9c = FMA(KP471396736, T9a, KP881921264 * T9b);
Chris@42 2894 T9f = FNMS(KP471396736, T9e, KP881921264 * T9d);
Chris@42 2895 T9g = T9c - T9f;
Chris@42 2896 T9V = T9f + T9c;
Chris@42 2897 T9A = T7z - T7w;
Chris@42 2898 T9B = T8z - T8y;
Chris@42 2899 T9C = T9A - T9B;
Chris@42 2900 T9W = T9B + T9A;
Chris@42 2901 }
Chris@42 2902 T9x = FNMS(KP471396736, T9b, KP881921264 * T9a);
Chris@42 2903 T9y = FMA(KP881921264, T9e, KP471396736 * T9d);
Chris@42 2904 T9z = T9x - T9y;
Chris@42 2905 T9M = T9y + T9x;
Chris@42 2906 {
Chris@42 2907 E T9r, T9R, T9u, T9S, T9q, T9s;
Chris@42 2908 T9q = T8q - T8p;
Chris@42 2909 T9r = T9p - T9q;
Chris@42 2910 T9R = T9p + T9q;
Chris@42 2911 T9s = T8j - T8g;
Chris@42 2912 T9u = T9s - T9t;
Chris@42 2913 T9S = T9t + T9s;
Chris@42 2914 T9v = FNMS(KP514102744, T9u, KP857728610 * T9r);
Chris@42 2915 Ta1 = FMA(KP970031253, T9S, KP242980179 * T9R);
Chris@42 2916 T9H = FMA(KP857728610, T9u, KP514102744 * T9r);
Chris@42 2917 T9T = FNMS(KP242980179, T9S, KP970031253 * T9R);
Chris@42 2918 }
Chris@42 2919 {
Chris@42 2920 E T9k, T9O, T9n, T9P, T9i, T9m;
Chris@42 2921 T9i = T80 - T7X;
Chris@42 2922 T9k = T9i - T9j;
Chris@42 2923 T9O = T9j + T9i;
Chris@42 2924 T9m = T87 - T86;
Chris@42 2925 T9n = T9l - T9m;
Chris@42 2926 T9P = T9l + T9m;
Chris@42 2927 T9o = FMA(KP514102744, T9k, KP857728610 * T9n);
Chris@42 2928 Ta0 = FNMS(KP242980179, T9P, KP970031253 * T9O);
Chris@42 2929 T9G = FNMS(KP514102744, T9n, KP857728610 * T9k);
Chris@42 2930 T9Q = FMA(KP242980179, T9O, KP970031253 * T9P);
Chris@42 2931 }
Chris@42 2932 }
Chris@42 2933 {
Chris@42 2934 E T9h, T9w, T9F, T9I;
Chris@42 2935 T9h = T99 + T9g;
Chris@42 2936 T9w = T9o + T9v;
Chris@42 2937 Cr[WS(csr, 53)] = T9h - T9w;
Chris@42 2938 Cr[WS(csr, 11)] = T9h + T9w;
Chris@42 2939 T9F = T9C + T9z;
Chris@42 2940 T9I = T9G + T9H;
Chris@42 2941 Ci[WS(csi, 11)] = T9F + T9I;
Chris@42 2942 Ci[WS(csi, 53)] = T9I - T9F;
Chris@42 2943 }
Chris@42 2944 {
Chris@42 2945 E T9D, T9E, T9J, T9K;
Chris@42 2946 T9D = T9z - T9C;
Chris@42 2947 T9E = T9v - T9o;
Chris@42 2948 Ci[WS(csi, 21)] = T9D + T9E;
Chris@42 2949 Ci[WS(csi, 43)] = T9E - T9D;
Chris@42 2950 T9J = T99 - T9g;
Chris@42 2951 T9K = T9H - T9G;
Chris@42 2952 Cr[WS(csr, 43)] = T9J - T9K;
Chris@42 2953 Cr[WS(csr, 21)] = T9J + T9K;
Chris@42 2954 }
Chris@42 2955 {
Chris@42 2956 E T9N, T9U, T9Z, Ta2;
Chris@42 2957 T9N = T9L + T9M;
Chris@42 2958 T9U = T9Q + T9T;
Chris@42 2959 Cr[WS(csr, 59)] = T9N - T9U;
Chris@42 2960 Cr[WS(csr, 5)] = T9N + T9U;
Chris@42 2961 T9Z = T9W + T9V;
Chris@42 2962 Ta2 = Ta0 + Ta1;
Chris@42 2963 Ci[WS(csi, 5)] = T9Z + Ta2;
Chris@42 2964 Ci[WS(csi, 59)] = Ta2 - T9Z;
Chris@42 2965 }
Chris@42 2966 {
Chris@42 2967 E T9X, T9Y, Ta3, Ta4;
Chris@42 2968 T9X = T9V - T9W;
Chris@42 2969 T9Y = T9T - T9Q;
Chris@42 2970 Ci[WS(csi, 27)] = T9X + T9Y;
Chris@42 2971 Ci[WS(csi, 37)] = T9Y - T9X;
Chris@42 2972 Ta3 = T9L - T9M;
Chris@42 2973 Ta4 = Ta1 - Ta0;
Chris@42 2974 Cr[WS(csr, 37)] = Ta3 - Ta4;
Chris@42 2975 Cr[WS(csr, 27)] = Ta3 + Ta4;
Chris@42 2976 }
Chris@42 2977 }
Chris@42 2978 {
Chris@42 2979 E T2z, T69, T3g, T6j, T60, T6k, T5P, T6a, T5L, T6p, T65, T6h, T4w, T6o, T64;
Chris@42 2980 E T6e;
Chris@42 2981 {
Chris@42 2982 E T2f, T2y, T5N, T5O;
Chris@42 2983 T2f = T27 + T2e;
Chris@42 2984 T2y = T2o + T2x;
Chris@42 2985 T2z = T2f + T2y;
Chris@42 2986 T69 = T2f - T2y;
Chris@42 2987 {
Chris@42 2988 E T2U, T3f, T5W, T5Z;
Chris@42 2989 T2U = FMA(KP098017140, T2M, KP995184726 * T2T);
Chris@42 2990 T3f = FNMS(KP098017140, T3e, KP995184726 * T37);
Chris@42 2991 T3g = T2U + T3f;
Chris@42 2992 T6j = T3f - T2U;
Chris@42 2993 T5W = T5S + T5V;
Chris@42 2994 T5Z = T5X + T5Y;
Chris@42 2995 T60 = T5W + T5Z;
Chris@42 2996 T6k = T5Z - T5W;
Chris@42 2997 }
Chris@42 2998 T5N = FNMS(KP098017140, T2T, KP995184726 * T2M);
Chris@42 2999 T5O = FMA(KP995184726, T3e, KP098017140 * T37);
Chris@42 3000 T5P = T5N + T5O;
Chris@42 3001 T6a = T5O - T5N;
Chris@42 3002 {
Chris@42 3003 E T5x, T6f, T5K, T6g, T5w, T5J;
Chris@42 3004 T5w = T5e + T5v;
Chris@42 3005 T5x = T4X + T5w;
Chris@42 3006 T6f = T4X - T5w;
Chris@42 3007 T5J = T5H + T5I;
Chris@42 3008 T5K = T5G + T5J;
Chris@42 3009 T6g = T5J - T5G;
Chris@42 3010 T5L = FNMS(KP049067674, T5K, KP998795456 * T5x);
Chris@42 3011 T6p = FMA(KP671558954, T6f, KP740951125 * T6g);
Chris@42 3012 T65 = FMA(KP049067674, T5x, KP998795456 * T5K);
Chris@42 3013 T6h = FNMS(KP671558954, T6g, KP740951125 * T6f);
Chris@42 3014 }
Chris@42 3015 {
Chris@42 3016 E T4i, T6c, T4v, T6d, T4h, T4u;
Chris@42 3017 T4h = T3Z + T4g;
Chris@42 3018 T4i = T3I + T4h;
Chris@42 3019 T6c = T3I - T4h;
Chris@42 3020 T4u = T4s + T4t;
Chris@42 3021 T4v = T4r + T4u;
Chris@42 3022 T6d = T4u - T4r;
Chris@42 3023 T4w = FMA(KP998795456, T4i, KP049067674 * T4v);
Chris@42 3024 T6o = FNMS(KP671558954, T6c, KP740951125 * T6d);
Chris@42 3025 T64 = FNMS(KP049067674, T4i, KP998795456 * T4v);
Chris@42 3026 T6e = FMA(KP740951125, T6c, KP671558954 * T6d);
Chris@42 3027 }
Chris@42 3028 }
Chris@42 3029 {
Chris@42 3030 E T3h, T5M, T63, T66;
Chris@42 3031 T3h = T2z + T3g;
Chris@42 3032 T5M = T4w + T5L;
Chris@42 3033 Cr[WS(csr, 63)] = T3h - T5M;
Chris@42 3034 Cr[WS(csr, 1)] = T3h + T5M;
Chris@42 3035 T63 = T60 + T5P;
Chris@42 3036 T66 = T64 + T65;
Chris@42 3037 Ci[WS(csi, 1)] = T63 + T66;
Chris@42 3038 Ci[WS(csi, 63)] = T66 - T63;
Chris@42 3039 }
Chris@42 3040 {
Chris@42 3041 E T61, T62, T67, T68;
Chris@42 3042 T61 = T5P - T60;
Chris@42 3043 T62 = T5L - T4w;
Chris@42 3044 Ci[WS(csi, 31)] = T61 + T62;
Chris@42 3045 Ci[WS(csi, 33)] = T62 - T61;
Chris@42 3046 T67 = T2z - T3g;
Chris@42 3047 T68 = T65 - T64;
Chris@42 3048 Cr[WS(csr, 33)] = T67 - T68;
Chris@42 3049 Cr[WS(csr, 31)] = T67 + T68;
Chris@42 3050 }
Chris@42 3051 {
Chris@42 3052 E T6b, T6i, T6n, T6q;
Chris@42 3053 T6b = T69 + T6a;
Chris@42 3054 T6i = T6e + T6h;
Chris@42 3055 Cr[WS(csr, 49)] = T6b - T6i;
Chris@42 3056 Cr[WS(csr, 15)] = T6b + T6i;
Chris@42 3057 T6n = T6k + T6j;
Chris@42 3058 T6q = T6o + T6p;
Chris@42 3059 Ci[WS(csi, 15)] = T6n + T6q;
Chris@42 3060 Ci[WS(csi, 49)] = T6q - T6n;
Chris@42 3061 }
Chris@42 3062 {
Chris@42 3063 E T6l, T6m, T6r, T6s;
Chris@42 3064 T6l = T6j - T6k;
Chris@42 3065 T6m = T6h - T6e;
Chris@42 3066 Ci[WS(csi, 17)] = T6l + T6m;
Chris@42 3067 Ci[WS(csi, 47)] = T6m - T6l;
Chris@42 3068 T6r = T69 - T6a;
Chris@42 3069 T6s = T6p - T6o;
Chris@42 3070 Cr[WS(csr, 47)] = T6r - T6s;
Chris@42 3071 Cr[WS(csr, 17)] = T6r + T6s;
Chris@42 3072 }
Chris@42 3073 }
Chris@42 3074 {
Chris@42 3075 E T7B, T8N, T7Q, T8X, T8E, T8Y, T8x, T8O, T8t, T93, T8J, T8V, T8a, T92, T8I;
Chris@42 3076 E T8S;
Chris@42 3077 {
Chris@42 3078 E T7t, T7A, T8v, T8w;
Chris@42 3079 T7t = T7r + T7s;
Chris@42 3080 T7A = T7w + T7z;
Chris@42 3081 T7B = T7t + T7A;
Chris@42 3082 T8N = T7t - T7A;
Chris@42 3083 {
Chris@42 3084 E T7I, T7P, T8A, T8D;
Chris@42 3085 T7I = FMA(KP956940335, T7E, KP290284677 * T7H);
Chris@42 3086 T7P = FNMS(KP290284677, T7O, KP956940335 * T7L);
Chris@42 3087 T7Q = T7I + T7P;
Chris@42 3088 T8X = T7P - T7I;
Chris@42 3089 T8A = T8y + T8z;
Chris@42 3090 T8D = T8B + T8C;
Chris@42 3091 T8E = T8A + T8D;
Chris@42 3092 T8Y = T8D - T8A;
Chris@42 3093 }
Chris@42 3094 T8v = FNMS(KP290284677, T7E, KP956940335 * T7H);
Chris@42 3095 T8w = FMA(KP290284677, T7L, KP956940335 * T7O);
Chris@42 3096 T8x = T8v + T8w;
Chris@42 3097 T8O = T8w - T8v;
Chris@42 3098 {
Chris@42 3099 E T8l, T8T, T8s, T8U, T8k, T8r;
Chris@42 3100 T8k = T8g + T8j;
Chris@42 3101 T8l = T8d + T8k;
Chris@42 3102 T8T = T8d - T8k;
Chris@42 3103 T8r = T8p + T8q;
Chris@42 3104 T8s = T8o + T8r;
Chris@42 3105 T8U = T8r - T8o;
Chris@42 3106 T8t = FNMS(KP146730474, T8s, KP989176509 * T8l);
Chris@42 3107 T93 = FMA(KP595699304, T8T, KP803207531 * T8U);
Chris@42 3108 T8J = FMA(KP146730474, T8l, KP989176509 * T8s);
Chris@42 3109 T8V = FNMS(KP595699304, T8U, KP803207531 * T8T);
Chris@42 3110 }
Chris@42 3111 {
Chris@42 3112 E T82, T8Q, T89, T8R, T81, T88;
Chris@42 3113 T81 = T7X + T80;
Chris@42 3114 T82 = T7U + T81;
Chris@42 3115 T8Q = T7U - T81;
Chris@42 3116 T88 = T86 + T87;
Chris@42 3117 T89 = T85 + T88;
Chris@42 3118 T8R = T88 - T85;
Chris@42 3119 T8a = FMA(KP989176509, T82, KP146730474 * T89);
Chris@42 3120 T92 = FNMS(KP595699304, T8Q, KP803207531 * T8R);
Chris@42 3121 T8I = FNMS(KP146730474, T82, KP989176509 * T89);
Chris@42 3122 T8S = FMA(KP803207531, T8Q, KP595699304 * T8R);
Chris@42 3123 }
Chris@42 3124 }
Chris@42 3125 {
Chris@42 3126 E T7R, T8u, T8H, T8K;
Chris@42 3127 T7R = T7B + T7Q;
Chris@42 3128 T8u = T8a + T8t;
Chris@42 3129 Cr[WS(csr, 61)] = T7R - T8u;
Chris@42 3130 Cr[WS(csr, 3)] = T7R + T8u;
Chris@42 3131 T8H = T8E + T8x;
Chris@42 3132 T8K = T8I + T8J;
Chris@42 3133 Ci[WS(csi, 3)] = T8H + T8K;
Chris@42 3134 Ci[WS(csi, 61)] = T8K - T8H;
Chris@42 3135 }
Chris@42 3136 {
Chris@42 3137 E T8F, T8G, T8L, T8M;
Chris@42 3138 T8F = T8x - T8E;
Chris@42 3139 T8G = T8t - T8a;
Chris@42 3140 Ci[WS(csi, 29)] = T8F + T8G;
Chris@42 3141 Ci[WS(csi, 35)] = T8G - T8F;
Chris@42 3142 T8L = T7B - T7Q;
Chris@42 3143 T8M = T8J - T8I;
Chris@42 3144 Cr[WS(csr, 35)] = T8L - T8M;
Chris@42 3145 Cr[WS(csr, 29)] = T8L + T8M;
Chris@42 3146 }
Chris@42 3147 {
Chris@42 3148 E T8P, T8W, T91, T94;
Chris@42 3149 T8P = T8N + T8O;
Chris@42 3150 T8W = T8S + T8V;
Chris@42 3151 Cr[WS(csr, 51)] = T8P - T8W;
Chris@42 3152 Cr[WS(csr, 13)] = T8P + T8W;
Chris@42 3153 T91 = T8Y + T8X;
Chris@42 3154 T94 = T92 + T93;
Chris@42 3155 Ci[WS(csi, 13)] = T91 + T94;
Chris@42 3156 Ci[WS(csi, 51)] = T94 - T91;
Chris@42 3157 }
Chris@42 3158 {
Chris@42 3159 E T8Z, T90, T95, T96;
Chris@42 3160 T8Z = T8X - T8Y;
Chris@42 3161 T90 = T8V - T8S;
Chris@42 3162 Ci[WS(csi, 19)] = T8Z + T90;
Chris@42 3163 Ci[WS(csi, 45)] = T90 - T8Z;
Chris@42 3164 T95 = T8N - T8O;
Chris@42 3165 T96 = T93 - T92;
Chris@42 3166 Cr[WS(csr, 45)] = T95 - T96;
Chris@42 3167 Cr[WS(csr, 19)] = T95 + T96;
Chris@42 3168 }
Chris@42 3169 }
Chris@42 3170 }
Chris@42 3171 }
Chris@42 3172 }
Chris@42 3173
Chris@42 3174 static const kr2c_desc desc = { 128, "r2cf_128", {812, 186, 144, 0}, &GENUS };
Chris@42 3175
Chris@42 3176 void X(codelet_r2cf_128) (planner *p) {
Chris@42 3177 X(kr2c_register) (p, r2cf_128, &desc);
Chris@42 3178 }
Chris@42 3179
Chris@42 3180 #endif /* HAVE_FMA */