(*
 * Copyright (c) 1997-1999 Massachusetts Institute of Technology
 * Copyright (c) 2003, 2007-11 Matteo Frigo
 * Copyright (c) 2003, 2007-11 Massachusetts Institute of Technology
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 *
 *)

(* utilities common to all generators *)
open Util

(* [choose_simd a b] is [b] when [Simdmagic.simd_mode] is set and [a]
   otherwise. *)
let choose_simd a b = if !Simdmagic.simd_mode then b else a

(* [unique_array n]: one [Unique.make ()] value per index, built with
   [array] (from Util). *)
let unique_array n = array n (fun _ -> Unique.make ())

(* Like [unique_array], but every index holds a pair of unique values
   (one for the real part, one for the imaginary part). *)
let unique_array_c n =
  array n (fun _ ->
    (Unique.make (), Unique.make ()))

(* [veclen] independent [unique_array_c n] arrays. *)
let unique_v_array_c veclen n =
  array veclen (fun _ ->
    unique_array_c n)

(* [locative_array_c n rarr iarr loc vs]: for each index [i], a pair of
   locative variables (real, imaginary).  [loc i] supplies the two
   locations; both variables of a pair share one freshly made class. *)
let locative_array_c n rarr iarr loc vs =
  array n (fun i ->
    let klass = Unique.make () in
    let (rloc, iloc) = loc i in
    (Variable.make_locative rloc klass rarr i vs,
     Variable.make_locative iloc klass iarr i vs))

(* Vector version of [locative_array_c]: [rarr], [iarr] and [loc] are
   additionally indexed by the vector lane [v]. *)
let locative_v_array_c veclen n rarr iarr loc vs =
  array veclen (fun v ->
    array n (fun i ->
      let klass = Unique.make () in
      let (rloc, iloc) = loc v i in
      (Variable.make_locative rloc klass (rarr v) i vs,
       Variable.make_locative iloc klass (iarr v) i vs)))

(* [temporary_array n]: one [Variable.make_temporary ()] per index. *)
let temporary_array n =
  array n (fun _ -> Variable.make_temporary ())

(* [temporary_array_c n]: pairs (real, imaginary) of temporaries taken
   from two separate temporary arrays.
   NOTE: this function used to be defined a second time, verbatim, after
   [temporary_v_array_c]; the redundant copy has been removed. *)
let temporary_array_c n =
  let tmpr = temporary_array n
  and tmpi = temporary_array n
  in
  array n (fun i -> (tmpr i, tmpi i))

(* [veclen] independent [temporary_array_c n] arrays. *)
let temporary_v_array_c veclen n =
  array veclen (fun _ -> temporary_array_c n)

(* Load a complex value from a (real, imaginary) pair of variables. *)
let load_c (vr, vi) = Complex.make (Expr.Load vr, Expr.Load vi)

(* Load only the real variable of the pair; the imaginary part of the
   result is the constant [Number.zero]. *)
let load_r (vr, _) = Complex.make (Expr.Load vr, Expr.Num (Number.zero))

(* [twiddle_array nt w]: [nt/2] complex constants.  Entry [i] reads its
   real part from subscript [2*i] of [w] and its imaginary part from
   subscript [2*i + 1].  The stride passed to [C.array_subscript] is
   [C.SInteger 1] in scalar mode and [C.SConst "TWVL"] in SIMD mode. *)
let twiddle_array nt w =
  array (nt/2) (fun i ->
    let stride = choose_simd (C.SInteger 1) (C.SConst "TWVL")
    and klass = Unique.make () in
    let (refr, refi) = (C.array_subscript w stride (2 * i),
                        C.array_subscript w stride (2 * i + 1))
    in
    let (kr, ki) = (Variable.make_constant klass refr,
                    Variable.make_constant klass refi)
    in
    load_c (kr, ki))


(* Complex / real-only loads of every element of [var]. *)
let load_array_c n var = array n (fun i -> load_c (var i))
let load_array_r n var = array n (fun i -> load_r (var i))

(* [load_array_hc n var]:
     - for [i < n - i], the complex load of [var i];
     - for [i > n - i], [Complex.i] times the complex load of
       [var (n - i)];
     - for [i = n - i], the real-only load of [var i]. *)
let load_array_hc n var =
  array n (fun i ->
    if (i < n - i) then
      load_c (var i)
    else if (i > n - i) then
      Complex.times Complex.i (load_c (var (n - i)))
    else
      load_r (var i))

(* [veclen] arrays, lane [v] being [load_array_c n (var v)]. *)
let load_v_array_c veclen n var =
  array veclen (fun v -> load_array_c n (var v))

(* Store the real and imaginary parts of [x] into the variable pair;
   returns the two stores as a list. *)
let store_c (vr, vi) x = [Complex.store_real vr x; Complex.store_imag vi x]
(* Store only the real part of [x] into the real variable. *)
let store_r (vr, _) x = Complex.store_real vr x
(* Store only the imaginary part of [x] into the imaginary variable. *)
let store_i (_, vi) x = Complex.store_imag vi x

(* Flat list of the (real, imaginary) assignments produced by
   [Complex.assign (dst i) (src i)] for each [i] in [iota n]. *)
let assign_array_c n dst src =
  List.flatten
    (rmap (iota n)
       (fun i ->
         let (ar, ai) = Complex.assign (dst i) (src i)
         in [ar; ai]))

(* [assign_array_c] applied lane by lane (outer iteration over [v]). *)
let assign_v_array_c veclen n dst src =
  List.flatten
    (rmap (iota veclen)
       (fun v ->
         assign_array_c n (dst v) (src v)))

(* Same assignments as [assign_v_array_c], but iterating over the element
   index [i] on the outside and the lane [v] on the inside. *)
let vassign_v_array_c veclen n dst src =
  List.flatten
    (rmap (iota n) (fun i ->
      List.flatten
        (rmap (iota veclen)
           (fun v ->
             let (ar, ai) = Complex.assign (dst v i) (src v i)
             in [ar; ai]))))

(* One real-part store per index. *)
let store_array_r n dst src =
  rmap (iota n)
    (fun i -> store_r (dst i) (src i))

(* Real and imaginary stores for every index, flattened. *)
let store_array_c n dst src =
  List.flatten
    (rmap (iota n)
       (fun i -> store_c (dst i) (src i)))

(* [store_array_hc n dst src]: complex store for [i < n - i], nothing for
   [i > n - i], and a store of the real part only when [i = n - i]. *)
let store_array_hc n dst src =
  List.flatten
    (rmap (iota n)
       (fun i ->
         if (i < n - i) then
           store_c (dst i) (src i)
         else if (i > n - i) then
           []
         else
           [store_r (dst i) (Complex.real (src i))]))


(* [store_array_c] applied lane by lane. *)
let store_v_array_c veclen n dst src =
  List.flatten
    (rmap (iota veclen)
       (fun v ->
         store_array_c n (dst v) (src v)))


(* [elementwise f n a]: array of size [n] whose element [i] is [f (a i)]. *)
let elementwise f n a = array n (fun i -> f (a i))
let conj_array_c = elementwise Complex.conj
let real_array_c = elementwise Complex.real
let imag_array_c = elementwise Complex.imag

(* Two-level ([veclen] by [n]) version of [elementwise]. *)
let elementwise_v f veclen n a =
  array veclen (fun v ->
    array n (fun i -> f (a v i)))
let conj_v_array_c = elementwise_v Complex.conj
let real_v_array_c = elementwise_v Complex.real
let imag_v_array_c = elementwise_v Complex.imag


(* [transpose f] swaps the two arguments of [f]. *)
let transpose f i j = f j i
(* [symmetrize f i j] always calls [f] with the smaller index first. *)
let symmetrize f i j = if i <= j then f i j else f j i

(* utilities for command-line parsing *)

(* Anonymous-argument handler for [Arg.parse]: always fails. *)
let standard_arg_parse_fail _ = failwith "too many arguments"

(* [dump_to_file fnam dump x]: when [fnam] is non-empty, open it for
   writing and run [dump] with a string printer bound to that channel.
   The channel is closed even if [dump] raises (the exception is then
   re-raised); previously it was leaked in that case.  Does nothing when
   [fnam] is the empty string. *)
let dump_to_file fnam (dump : (string -> unit) -> 'a -> unit) x =
  if String.length fnam > 0 then begin
    let ochan = open_out fnam in
    (try dump (output_string ochan) x
     with e -> close_out_noerr ochan; raise e);
    close_out ochan
  end

(* Dump [alist] with [To_alist.dump] to [!Magic.dag_dump_file], if set. *)
let dump_dag alist =
  dump_to_file !Magic.dag_dump_file To_alist.dump alist

(* Dump [alist] with [Expr.dump] to [!Magic.alist_dump_file], if set. *)
let dump_alist alist =
  dump_to_file !Magic.alist_dump_file Expr.dump alist

(* Dump [asched] with [Annotate.dump] to [!Magic.asched_dump_file],
   if set. *)
let dump_asched asched =
  dump_to_file !Magic.asched_dump_file Annotate.dump asched

(* utilities for optimization *)

(* Simplify [dag] with [Algsimp.algsimp], convert it to an assignment
   list, emit the optional dumps, then schedule it.  The scheduler used
   depends on [!Magic.precompute_twiddles]. *)
let standard_scheduler dag =
  let optim = Algsimp.algsimp dag in
  let alist = To_alist.to_assignments optim in
  let () = dump_alist alist in
  let () = dump_dag alist in
  if !Magic.precompute_twiddles then
    Schedule.isolate_precomputations_and_schedule alist
  else
    Schedule.schedule alist

(* Schedule [dag], annotate the schedule (starting from an empty list),
   emit the optional dump and return the annotated schedule. *)
let standard_optimizer dag =
  let sched = standard_scheduler dag in
  let annot = Annotate.annotate [] sched in
  let () = dump_asched annot in
  annot

(* Values set from the command line by [speclist]. *)
let size = ref None
let sign = ref (-1)

(* "-n" records the codelet size; "-sign" stores 1 for a positive argument
   and -1 for anything else. *)
let speclist = [
  "-n", Arg.Int(fun i -> size := Some i), " generate a codelet of size ";
  "-sign",
  Arg.Int(fun i ->
    if (i > 0) then
      sign := 1
    else
      sign := (-1)),
  " sign of transform";
]

(* Return the size given with -n.
   Raises [Failure "must specify -n"] when it was not supplied. *)
let check_size () =
  match !size with
  | Some i -> i
  | None -> failwith "must specify -n"

(* Replace the empty name by "noname". *)
let expand_name name = if name = "" then "noname" else name

(* C prototype text of the registration function for codelet [name]; the
   empty name yields the NAME-macro form.  The X / XSIMD wrapper is
   selected by [choose_simd]. *)
let declare_register_fcn name =
  if name = "" then
    "void NAME(planner *p)\n"
  else
    "void " ^ (choose_simd "X" "XSIMD") ^
      "(codelet_" ^ name ^ ")(planner *p)\n"

(* C string-literal text for [name] (wrapped in XSIMD_STRING in SIMD
   mode), or STRINGIZE(NAME) for the empty name. *)
let stringify name =
  if name = "" then "STRINGIZE(NAME)" else
    choose_simd ("\"" ^ name ^ "\"")
      ("XSIMD_STRING(\"" ^ name ^ "\")")

(* Parse the command line with the caller's options followed by the
   options declared here, in [Magic] and in [Simdmagic]. *)
let parse user_speclist usage =
  Arg.parse
    (user_speclist @ speclist @ Magic.speclist @ Simdmagic.speclist)
    standard_arg_parse_fail
    usage

(* Render an int list as "a, b, c"; the empty list gives "". *)
let list_to_c l = String.concat ", " (List.map string_of_int l)

(* Right-nested [C.Comma] of a list with at least two elements.
   Raises [Failure "list_to_comma"] on shorter lists. *)
let rec list_to_comma = function
  | [a; b] -> C.Comma (a, b)
  | a :: b -> C.Comma (a, list_to_comma b)
  | _ -> failwith "list_to_comma"


type stride = Stride_variable | Fixed_int of int | Fixed_string of string

(* [either_stride a b]: the fixed stride described by [a] when there is
   one, otherwise the fallback [b]. *)
let either_stride a b =
  match a with
    Fixed_int x -> C.SInteger x
  | Fixed_string x -> C.SConst x
  | Stride_variable -> b

(* True for every stride except [Stride_variable]. *)
let stride_fixed = function
    Stride_variable -> false
  | Fixed_int _ | Fixed_string _ -> true

(* Interpret a command-line stride: [Fixed_int] when [s] parses with
   [int_of_string], [Fixed_string s] otherwise.  The handler matches any
   [Failure] rather than a specific message, so it does not depend on the
   exact text carried by the exception. *)
let arg_to_stride s =
  try
    Fixed_int (int_of_string s)
  with Failure _ ->
    Fixed_string s

(* Text of the stride; a variable stride is rendered as "0". *)
let stride_to_solverparm = function
    Stride_variable -> "0"
  | Fixed_int x -> string_of_int x
  | Fixed_string x -> x

(* [stride_to_string s stride]: text of a fixed stride, or [s] for a
   variable one. *)
let stride_to_string s = function
    Stride_variable -> s
  | Fixed_int x -> string_of_int x
  | Fixed_string x -> x

(* output the command line *)
(* Every element of [Sys.argv] followed by one space (so the result ends
   with a space). *)
let cmdline () =
  String.concat "" (List.map (fun a -> a ^ " ") (Array.to_list Sys.argv))

(* Text of the generated file: "Generated by" banner, cost summary from
   [C.print_cost], optional #include of [!Magic.inklude], then the
   function body unparsed by [Simd] or [C] depending on the mode. *)
let unparse tree =
  "/* Generated by: " ^ (cmdline ()) ^ "*/\n\n" ^
  (C.print_cost tree) ^
  (if String.length !Magic.inklude > 0
  then
    (Printf.sprintf "#include \"%s\"\n\n" !Magic.inklude)
  else "") ^
  (if !Simdmagic.simd_mode then
    Simd.unparse_function tree
  else
    C.unparse_function tree)

(* Wrap [ast] in a block whose declarations are the constants extracted
   from it and whose statements are [ast] followed by [C.Simd_leavefun].
   If the result is a block containing exactly one inner block, the two
   declaration lists are merged into a single block. *)
let finalize_fcn ast =
  let mergedecls = function
      C.Block (d1, [C.Block (d2, s)]) -> C.Block (d1 @ d2, s)
    | x -> x
  and extract_constants =
    if !Simdmagic.simd_mode then
      Simd.extract_constants
    else
      C.extract_constants

  in mergedecls (C.Block (extract_constants ast, [ast; C.Simd_leavefun]))

(* Render a twiddle instruction with the SIMD or the plain C printer. *)
let twinstr_to_string vl x =
  if !Simdmagic.simd_mode then
    Twiddle.twinstr_to_simd_string vl x
  else
    Twiddle.twinstr_to_c_string x

(* C call expression MAKE_VOLATILE_STRIDE(n, x). *)
let make_volatile_stride n x =
  C.CCall ("MAKE_VOLATILE_STRIDE", C.Comma((C.Integer n), x))