(*
 * Copyright (c) 1997-1999 Massachusetts Institute of Technology
 * Copyright (c) 2003, 2007-14 Matteo Frigo
 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 *
 *)

open Util
open Genutil
open C

(* Codelet flavour selected with -dit / -dif.  In [generate], DIT applies
   the twiddle multiplication to the loaded inputs before the transform,
   DIF applies it to the outputs of the transform. *)
type ditdif = DIT | DIF
let ditdif = ref DIT

(* NOTE(review): the <number> placeholder was absent in the annotated copy
   of this file; it is restored here on the assumption that -n carries the
   size later returned by [check_size] -- confirm against the shared
   option parser. *)
let usage = "Usage: " ^ Sys.argv.(0) ^ " -n <number> [ -dit | -dif ]"

(* Set by -reload-twiddle.  When false, [generate] calls the twiddle
   function once and shares that single result for every index. *)
let reload_twiddle = ref false

(* Stride specialisations requested with -with-rs / -with-vs / -with-ms.
   All three default to [Stride_variable]. *)
let urs = ref Stride_variable
let uvs = ref Stride_variable
let ums = ref Stride_variable

(* Command-line options specific to this generator.  [main] appends
   [Twiddle.speclist] to this list before parsing. *)
let speclist = [
  "-dit",
  Arg.Unit(fun () -> ditdif := DIT),
  " generate a DIT codelet";

  "-dif",
  Arg.Unit(fun () -> ditdif := DIF),
  " generate a DIF codelet";

  "-reload-twiddle",
  Arg.Unit(fun () -> reload_twiddle := true),
  " do not collect common twiddle factors";

  "-with-rs",
  Arg.String(fun x -> urs := arg_to_stride x),
  " specialize for given input stride";

  "-with-vs",
  Arg.String(fun x -> uvs := arg_to_stride x),
  " specialize for given vector stride";

  "-with-ms",
  Arg.String(fun x -> ums := arg_to_stride x),
  " specialize for given ms"
]

(* [generate n] returns, as one string, the text of the codelet for size
   [n]: the unparsed function, followed by the twiddle instruction table,
   the [ct_desc] descriptor and the registration function.

   The result depends on the global option refs above as well as on
   [Genutil.sign] and [Magic.codelet_name]. *)
let generate n =
  (* Names of the identifiers that appear in the emitted code. *)
  let rioarray = "x"
  and rs = "rs" and vs = "vs"
  and twarray = "W"
  and m = "m" and mb = "mb" and me = "me" and ms = "ms" in

  let sign = !Genutil.sign
  and name = !Magic.codelet_name
  (* Each helper hands [choose_simd] the plain expression together with
     the same expression multiplied by the named symbol. *)
  and byvl x = choose_simd x (ctimes (CVar "VL", x))
  and bytwvl x = choose_simd x (ctimes (CVar "TWVL", x))
  and bytwvl_vl x = choose_simd x (ctimes (CVar "(TWVL/VL)", x)) in
  let ename = expand_name name in

  let (bytwiddle, num_twiddles, twdesc) = Twiddle.twiddle_policy 0 true in
  let nt = num_twiddles n in

  (* Use the strides given on the command line when present, otherwise
     the runtime stride variables. *)
  let svs = either_stride (!uvs) (C.SVar vs)
  and srs = either_stride (!urs) (C.SVar rs) in
  let sms = stride_to_string "ms" !ums in

  (* Twiddle multiplier, indexed by [v].  With -reload-twiddle the
     multiplier is requested through [array n]; otherwise it is computed
     once and the same value is returned for every [v]. *)
  let byw =
    if !reload_twiddle then
      array n (fun _ -> bytwiddle n sign (twiddle_array nt twarray))
    else
      let a = bytwiddle n sign (twiddle_array nt twarray)
      in fun _ -> a
  in

  let locations = unique_v_array_c n n in

  (* Input and output views are built from identical arguments: both
     subscript [rioarray] and share [locations].  The second accessor is
     named "BUG" -- presumably a sentinel that is never expected to show
     up in the emitted code; TODO confirm. *)
  let ioi =
    locative_v_array_c n n
      (C.varray_subscript rioarray svs srs)
      (C.varray_subscript "BUG" svs srs)
      locations sms
  and ioo =
    locative_v_array_c n n
      (C.varray_subscript rioarray svs srs)
      (C.varray_subscript "BUG" svs srs)
      locations sms
  in

  let lioi = load_v_array_c n n ioi in
  let fft = Trig.dft_via_rdft in
  let output =
    match !ditdif with
    | DIT -> array n (fun v -> fft sign n (byw v (lioi v)))
    | DIF -> array n (fun v -> byw v (fft sign n (lioi v)))
  in

  (* The results are stored transposed. *)
  let odag = store_v_array_c n n ioo (transpose output) in
  let annot = standard_optimizer odag in

  let vm = CVar m and vmb = CVar mb and vme = CVar me in

  (* Emitted body: point x at ri or ii depending on the sign, then loop m
     from mb up to me.  W is first offset by mb * nt (scaled through
     [bytwvl_vl]); every iteration advances m, x and W and re-applies
     [make_volatile_stride] to rs and vs. *)
  let body = Block (
    [Decl ("INT", m);
     Decl (C.realtypep, rioarray)],
    [Stmt_assign (CVar rioarray,
                  CVar (if (sign < 0) then "ri" else "ii"));
     For (list_to_comma
            [Expr_assign (vm, vmb);
             Expr_assign (CVar twarray,
                          CPlus [CVar twarray;
                                 ctimes (vmb,
                                         bytwvl_vl (Integer nt))])],
          Binop (" < ", vm, vme),
          list_to_comma
            [Expr_assign (vm, CPlus [vm; byvl (Integer 1)]);
             Expr_assign (CVar rioarray, CPlus [CVar rioarray;
                                                byvl (CVar sms)]);
             Expr_assign (CVar twarray, CPlus [CVar twarray;
                                               bytwvl (Integer nt)]);
             make_volatile_stride (2*n) (CVar rs);
             make_volatile_stride (2*n) (CVar vs)
            ],
          Asch annot)]) in

  let tree =
    Fcn (("static void"), ename,
         [Decl (C.realtypep, "ri");
          Decl (C.realtypep, "ii");
          Decl (C.constrealtypep, twarray);
          Decl (C.stridetype, rs);
          Decl (C.stridetype, vs);
          Decl ("INT", mb);
          Decl ("INT", me);
          Decl ("INT", ms)],
         finalize_fcn body)
  in
  let twinstr =
    Printf.sprintf "static const tw_instr twinstr[] = %s;\n\n"
      (twinstr_to_string "VL" (twdesc n))

  and desc =
    Printf.sprintf
      "static const ct_desc desc = {%d, %s, twinstr, &GENUS, %s, %s, %s, %s};\n\n"
      n (stringify name) (flops_of tree)
      (stride_to_solverparm !urs)
      (stride_to_solverparm !uvs)
      (stride_to_solverparm !ums)

  (* Registration hook named in the emitted code; it follows the flavour. *)
  and register =
    match !ditdif with
    | DIT -> "X(kdft_ditsq_register)"
    | DIF -> "X(kdft_difsq_register)"
  in
  let init =
    "\n" ^
    twinstr ^
    desc ^
    (declare_register_fcn name) ^
    (Printf.sprintf "{\n%s(p, %s, &desc);\n}" register ename)
  in

  (unparse tree) ^ "\n" ^ init


(* Parse the command line, then print the generated codelet on stdout. *)
let main () =
  begin
    parse (speclist @ Twiddle.speclist) usage;
    print_string (generate (check_size ()))
  end

(* [let ()] rather than [let _] so that the unit type of [main ()] is
   checked by the compiler. *)
let () = main ()