Chris@19: (* Chris@19: * Copyright (c) 1997-1999 Massachusetts Institute of Technology Chris@19: * Copyright (c) 2003, 2007-14 Matteo Frigo Chris@19: * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology Chris@19: * Chris@19: * This program is free software; you can redistribute it and/or modify Chris@19: * it under the terms of the GNU General Public License as published by Chris@19: * the Free Software Foundation; either version 2 of the License, or Chris@19: * (at your option) any later version. Chris@19: * Chris@19: * This program is distributed in the hope that it will be useful, Chris@19: * but WITHOUT ANY WARRANTY; without even the implied warranty of Chris@19: * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the Chris@19: * GNU General Public License for more details. Chris@19: * Chris@19: * You should have received a copy of the GNU General Public License Chris@19: * along with this program; if not, write to the Free Software Chris@19: * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA Chris@19: * Chris@19: *) Chris@19: Chris@19: (* generation of trigonometric transforms *) Chris@19: Chris@19: open Util Chris@19: open Genutil Chris@19: open C Chris@19: Chris@19: Chris@19: let usage = "Usage: " ^ Sys.argv.(0) ^ " -n " Chris@19: Chris@19: let uistride = ref Stride_variable Chris@19: let uostride = ref Stride_variable Chris@19: let uivstride = ref Stride_variable Chris@19: let uovstride = ref Stride_variable Chris@19: let normalization = ref 1 Chris@19: Chris@19: type mode = Chris@19: | MDCT Chris@19: | MDCT_MP3 Chris@19: | MDCT_VORBIS Chris@19: | MDCT_WINDOW Chris@19: | MDCT_WINDOW_SYM Chris@19: | IMDCT Chris@19: | IMDCT_MP3 Chris@19: | IMDCT_VORBIS Chris@19: | IMDCT_WINDOW Chris@19: | IMDCT_WINDOW_SYM Chris@19: | NONE Chris@19: Chris@19: let mode = ref NONE Chris@19: Chris@19: let speclist = [ Chris@19: "-with-istride", Chris@19: Arg.String(fun x -> uistride := arg_to_stride x), Chris@19: " specialize for given input stride"; Chris@19: Chris@19: "-with-ostride", Chris@19: Arg.String(fun x -> uostride := arg_to_stride x), Chris@19: " specialize for given output stride"; Chris@19: Chris@19: "-with-ivstride", Chris@19: Arg.String(fun x -> uivstride := arg_to_stride x), Chris@19: " specialize for given input vector stride"; Chris@19: Chris@19: "-with-ovstride", Chris@19: Arg.String(fun x -> uovstride := arg_to_stride x), Chris@19: " specialize for given output vector stride"; Chris@19: Chris@19: "-normalization", Chris@19: Arg.String(fun x -> normalization := int_of_string x), Chris@19: " normalization integer to divide by"; Chris@19: Chris@19: "-mdct", Chris@19: Arg.Unit(fun () -> mode := MDCT), Chris@19: " generate an MDCT codelet"; Chris@19: Chris@19: "-mdct-mp3", Chris@19: Arg.Unit(fun () -> mode := MDCT_MP3), Chris@19: " generate an MDCT codelet with MP3 windowing"; Chris@19: Chris@19: "-mdct-window", Chris@19: Arg.Unit(fun () -> mode := MDCT_WINDOW), Chris@19: " generate an MDCT codelet with window array"; Chris@19: Chris@19: "-mdct-window-sym", Chris@19: Arg.Unit(fun () -> mode := MDCT_WINDOW_SYM), Chris@19: " generate an MDCT codelet with symmetric window array"; Chris@19: Chris@19: "-imdct", Chris@19: Arg.Unit(fun () -> mode := IMDCT), Chris@19: " generate an IMDCT codelet"; Chris@19: Chris@19: "-imdct-mp3", Chris@19: Arg.Unit(fun () -> mode := IMDCT_MP3), Chris@19: " generate an IMDCT codelet with MP3 windowing"; Chris@19: Chris@19: "-imdct-window", Chris@19: Arg.Unit(fun () -> mode := IMDCT_WINDOW), Chris@19: " generate an IMDCT codelet with window array"; Chris@19: Chris@19: "-imdct-window-sym", Chris@19: Arg.Unit(fun () -> mode := IMDCT_WINDOW_SYM), Chris@19: " generate an IMDCT codelet with symmetric window array"; Chris@19: ] Chris@19: Chris@19: let unity_window n i = Complex.one Chris@19: Chris@19: (* MP3 window(k) = sin(pi/(2n) * (k + 1/2)) *) Chris@19: let mp3_window n k = Chris@19: Complex.imag (Complex.exp (8 * n) (2*k + 1)) Chris@19: Chris@19: (* Vorbis window(k) = sin(pi/2 * (mp3_window(k))^2) Chris@19: ... this is transcendental, though, so we can't do it with our Chris@19: current Complex.exp function *) Chris@19: Chris@19: let window_array n w = Chris@19: array n (fun i -> Chris@19: let stride = C.SInteger 1 Chris@19: and klass = Unique.make () in Chris@19: let refr = C.array_subscript w stride i in Chris@19: let kr = Variable.make_constant klass refr in Chris@19: load_r (kr, kr)) Chris@19: Chris@19: let load_window w n i = w i Chris@19: let load_window_sym w n i = w (if (i < n) then i else (2*n - 1 - i)) Chris@19: Chris@19: (* fixme: use same locations for input and output so that it works in-place? *) Chris@19: Chris@19: (* Note: only correct for even n! *) Chris@19: let load_array_mdct window n rarr iarr locations = Chris@19: let twon = 2 * n in Chris@19: let arr = load_array_c twon Chris@19: (locative_array_c twon rarr iarr locations "BUG") in Chris@19: let arrw = fun i -> Complex.times (window n i) (arr i) in Chris@19: array n Chris@19: ((Complex.times Complex.half) @@ Chris@19: (fun i -> Chris@19: if (i < n/2) then Chris@19: Complex.uminus (Complex.plus [arrw (i + n + n/2); Chris@19: arrw (n + n/2 - 1 - i)]) Chris@19: else Chris@19: Complex.plus [arrw (i - n/2); Chris@19: Complex.uminus (arrw (n + n/2 - 1 - i))])) Chris@19: Chris@19: let store_array_mdct window n rarr iarr locations arr = Chris@19: store_array_r n (locative_array_c n rarr iarr locations "BUG") arr Chris@19: Chris@19: let load_array_imdct window n rarr iarr locations = Chris@19: load_array_c n (locative_array_c n rarr iarr locations "BUG") Chris@19: Chris@19: let store_array_imdct window n rarr iarr locations arr = Chris@19: let n2 = n/2 in Chris@19: let threen2 = 3*n2 in Chris@19: let arr2 = fun i -> Chris@19: if (i < n2) then Chris@19: arr (i + n2) Chris@19: else if (i < threen2) then Chris@19: Complex.uminus (arr (threen2 - 1 - i)) Chris@19: else Chris@19: Complex.uminus (arr (i - threen2)) Chris@19: in Chris@19: let arr2w = fun i -> Complex.times (window n i) (arr2 i) in Chris@19: let twon = 2 * n in Chris@19: store_array_r twon (locative_array_c twon rarr iarr locations "BUG") arr2w Chris@19: Chris@19: let window_param = function Chris@19: MDCT_WINDOW -> true Chris@19: | MDCT_WINDOW_SYM -> true Chris@19: | IMDCT_WINDOW -> true Chris@19: | IMDCT_WINDOW_SYM -> true Chris@19: | _ -> false Chris@19: Chris@19: let generate n mode = Chris@19: let iarray = "I" Chris@19: and oarray = "O" Chris@19: and istride = "istride" Chris@19: and ostride = "ostride" Chris@19: and window = "W" Chris@19: and name = !Magic.codelet_name in Chris@19: Chris@19: let vistride = either_stride (!uistride) (C.SVar istride) Chris@19: and vostride = either_stride (!uostride) (C.SVar ostride) Chris@19: in Chris@19: Chris@19: let sivs = stride_to_string "ovs" !uovstride in Chris@19: let sovs = stride_to_string "ivs" !uivstride in Chris@19: Chris@19: let (transform, load_input, store_output) = match mode with Chris@19: | MDCT -> Trig.dctIV, load_array_mdct unity_window, Chris@19: store_array_mdct unity_window Chris@19: | MDCT_MP3 -> Trig.dctIV, load_array_mdct mp3_window, Chris@19: store_array_mdct unity_window Chris@19: | MDCT_WINDOW -> Trig.dctIV, load_array_mdct Chris@19: (load_window (window_array (2 * n) window)), Chris@19: store_array_mdct unity_window Chris@19: | MDCT_WINDOW_SYM -> Trig.dctIV, load_array_mdct Chris@19: (load_window_sym (window_array n window)), Chris@19: store_array_mdct unity_window Chris@19: | IMDCT -> Trig.dctIV, load_array_imdct unity_window, Chris@19: store_array_imdct unity_window Chris@19: | IMDCT_MP3 -> Trig.dctIV, load_array_imdct unity_window, Chris@19: store_array_imdct mp3_window Chris@19: | IMDCT_WINDOW -> Trig.dctIV, load_array_imdct unity_window, Chris@19: store_array_imdct (load_window (window_array (2 * n) window)) Chris@19: | IMDCT_WINDOW_SYM -> Trig.dctIV, load_array_imdct unity_window, Chris@19: store_array_imdct (load_window_sym (window_array n window)) Chris@19: | _ -> failwith "must specify transform kind" Chris@19: in Chris@19: Chris@19: let locations = unique_array_c (2*n) in Chris@19: let input = Chris@19: load_input n Chris@19: (C.array_subscript iarray vistride) Chris@19: (C.array_subscript "BUG" vistride) Chris@19: locations Chris@19: in Chris@19: let output = (Complex.times (Complex.inverse_int !normalization)) Chris@19: @@ (transform n input) in Chris@19: let odag = Chris@19: store_output n Chris@19: (C.array_subscript oarray vostride) Chris@19: (C.array_subscript "BUG" vostride) Chris@19: locations Chris@19: output Chris@19: in Chris@19: let annot = standard_optimizer odag in Chris@19: Chris@19: let tree = Chris@19: Fcn ("void", name, Chris@19: ([Decl (C.constrealtypep, iarray); Chris@19: Decl (C.realtypep, oarray)] Chris@19: @ (if stride_fixed !uistride then [] Chris@19: else [Decl (C.stridetype, istride)]) Chris@19: @ (if stride_fixed !uostride then [] Chris@19: else [Decl (C.stridetype, ostride)]) Chris@19: @ (choose_simd [] Chris@19: (if stride_fixed !uivstride then [] else Chris@19: [Decl ("int", sivs)])) Chris@19: @ (choose_simd [] Chris@19: (if stride_fixed !uovstride then [] else Chris@19: [Decl ("int", sovs)])) Chris@19: @ (if (not (window_param mode)) then [] Chris@19: else [Decl (C.constrealtypep, window)]) Chris@19: ), Chris@19: finalize_fcn (Asch annot)) Chris@19: Chris@19: in Chris@19: (unparse tree) ^ "\n" Chris@19: Chris@19: Chris@19: let main () = Chris@19: begin Chris@19: parse speclist usage; Chris@19: print_string (generate (check_size ()) !mode); Chris@19: end Chris@19: Chris@19: let _ = main()