annotate src/fftw-3.3.3/genfft/twiddle.ml @ 168:ceec0dd9ec9c

Replace these with versions built using an older toolset (so as to avoid ABI incompatibilities when linking on Ubuntu 14.04 for packaging purposes)
author Chris Cannam <cannam@all-day-breakfast.com>
date Fri, 07 Feb 2020 11:51:13 +0000
parents 89f5e221ed7b
children
rev   line source
cannam@95 1 (*
cannam@95 2 * Copyright (c) 1997-1999 Massachusetts Institute of Technology
cannam@95 3 * Copyright (c) 2003, 2007-11 Matteo Frigo
cannam@95 4 * Copyright (c) 2003, 2007-11 Massachusetts Institute of Technology
cannam@95 5 *
cannam@95 6 * This program is free software; you can redistribute it and/or modify
cannam@95 7 * it under the terms of the GNU General Public License as published by
cannam@95 8 * the Free Software Foundation; either version 2 of the License, or
cannam@95 9 * (at your option) any later version.
cannam@95 10 *
cannam@95 11 * This program is distributed in the hope that it will be useful,
cannam@95 12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
cannam@95 13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
cannam@95 14 * GNU General Public License for more details.
cannam@95 15 *
cannam@95 16 * You should have received a copy of the GNU General Public License
cannam@95 17 * along with this program; if not, write to the Free Software
cannam@95 18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
cannam@95 19 *
cannam@95 20 *)
cannam@95 21
cannam@95 22 (* policies for loading/computing twiddle factors *)
cannam@95 23 open Complex
cannam@95 24 open Util
cannam@95 25
(* Opcode of a twiddle instruction. *)
type twop =
  | TW_FULL
  | TW_CEXP
  | TW_NEXT

(* [optostring op] is the name of the constructor [op], spelled exactly
   as in the type definition. *)
let optostring op =
  match op with
  | TW_FULL -> "TW_FULL"
  | TW_CEXP -> "TW_CEXP"
  | TW_NEXT -> "TW_NEXT"
cannam@95 32
(* A twiddle instruction: an opcode followed by its two integer operands. *)
type twinstr = twop * int * int
cannam@95 34
(* [unroll_twfull l] rewrites the instruction list [l] so that it no
   longer contains TW_FULL: each [(TW_FULL, v, n)] is replaced by the
   TW_CEXP instructions [(TW_CEXP, v, i)] that [forall [] cons 1 n]
   generates (presumably i = 1 .. n-1 -- confirm against Util.forall).
   All other instructions are kept as they are, in order. *)
let rec unroll_twfull = function
  | [] -> []
  | (TW_FULL, v, n) :: rest ->
      let expanded = forall [] cons 1 n (fun i -> (TW_CEXP, v, i)) in
      expanded @ unroll_twfull rest
  | instr :: rest -> instr :: unroll_twfull rest
cannam@95 41
(* [twinstr_to_c_string l] renders the instruction list [l] as a
   brace-enclosed initializer: every instruction becomes
   "{ OP, a, b }" on a line of its own, entries are separated by ",\n",
   and the empty list yields "{}". *)
let twinstr_to_c_string l =
  let render (op, a, b) =
    Printf.sprintf "{ %s, %d, %d }" (optostring op) a b
  in
  let body =
    match List.map render l with
    | [] -> ""
    | entries -> "\n" ^ String.concat ",\n" entries
  in
  "{" ^ body ^ "}"
cannam@95 48
(* [twinstr_to_simd_string vl l] renders [l] for the SIMD case.  TW_FULL
   entries are first expanded with [unroll_twfull]; after that
     - [(TW_NEXT, 1, 0)] prints as "{TW_NEXT, <vl>, 0}",
     - [(TW_CEXP, v, b)] prints as "VTW(v,b)",
     - anything else raises [Failure "twinstr_to_simd_string"].
   Entries each start on a new line and are separated by ",\n"; an
   empty list yields "{}". *)
let twinstr_to_simd_string vl l =
  let render = function
    | (TW_NEXT, 1, 0) -> "{TW_NEXT, " ^ vl ^ ", 0}"
    | (TW_CEXP, v, b) -> Printf.sprintf "VTW(%d,%d)" v b
    | (TW_NEXT, _, _) | (TW_FULL, _, _) ->
        failwith "twinstr_to_simd_string"
  in
  let body =
    match List.map render (unroll_twfull l) with
    | [] -> ""
    | entries -> "\n" ^ String.concat ",\n" entries
  in
  "{" ^ body ^ "}"
cannam@95 59
(* [pow m n] is [m] raised to the non-negative integer power [n], with
   [pow m 0 = 1].  The product uses native integers, so it wraps on
   overflow.
   Raises [Invalid_argument] when [n] is negative; the plain recursion
   on [n - 1] would otherwise never reach 0 and exhaust the stack. *)
let pow m n =
  if n < 0 then invalid_arg "Twiddle.pow: negative exponent"
  else
    (* accumulate the product so the loop runs in constant stack *)
    let rec go acc k = if k = 0 then acc else go (acc * m) (k - 1) in
    go 1 n
cannam@95 63
(* [is_pow m n] is true when [n] is obtained from 1 by multiplying by
   [m] zero or more times, i.e. n = m^k for some k >= 0.

   Guards that keep the recursion finite:
     - n = 0 is rejected up front: 0 mod m = 0 and 0 / m = 0, so the
       division step would repeat forever;
     - bases -1, 0 and 1 never shrink [n] (or divide by zero), so for
       them only the trivial case n = 1 is accepted. *)
let rec is_pow m n =
  n = 1
  || (n <> 0 && (m > 1 || m < -1) && n mod m = 0 && is_pow m (n / m))
cannam@95 66
(* [log m n] is the integer logarithm of [n] in base [m]: the number of
   times [n] can be divided by [m] before the quotient drops below [m].
   For an exact power, [log m (m^k) = k]; in general the result is the
   floor of the logarithm.  [log m 1 = 0] for every [m].

   Note that this definition shadows the floating-point [log] of the
   standard library for the rest of the file.

   Raises [Invalid_argument] when [n < 1], or when [n > 1] and [m < 2]:
   in those cases repeated division never terminates sensibly.  The
   loop stops at the first quotient below [m] rather than waiting for
   exactly 1, so inputs such as [log 3 2] (where 2 / 3 = 0 skips 1)
   terminate as well. *)
let log m n =
  if n = 1 then 0
  else if n < 1 then invalid_arg "Twiddle.log: argument must be >= 1"
  else if m < 2 then invalid_arg "Twiddle.log: base must be >= 2"
  else
    let rec count acc k = if k < m then acc else count (acc + 1) (k / m) in
    count 0 n
cannam@95 68
(* [largest_power_smaller_than m i] scans downward from [i] and returns
   the first value accepted by [is_pow m].  Despite the name the bound
   is inclusive: when [i] is itself a power of [m], [i] is returned.

   Raises [Invalid_argument] when [i < 1]: every power of [m] is at
   least 1 (m^0), so there is nothing to find and the downward scan
   would not terminate. *)
let rec largest_power_smaller_than m i =
  if i < 1 then
    invalid_arg "Twiddle.largest_power_smaller_than: argument must be >= 1"
  else if is_pow m i then i
  else largest_power_smaller_than m (i - 1)
cannam@95 72
(* [smallest_power_larger_than m i] scans upward from [i] and returns
   the first value accepted by [is_pow m].  Despite the name the bound
   is inclusive: when [i] is itself a power of [m], [i] is returned.

   For [i <= 1] the answer is 1 (= m^0), returned directly: an upward
   scan from a non-positive [i] would have to test 0, which is not a
   valid argument for the power test. *)
let rec smallest_power_larger_than m i =
  if i <= 1 then 1
  else if is_pow m i then i
  else smallest_power_larger_than m (i + 1)
cannam@95 76
(* [rec_array n f] ties the knot for a function defined by open
   recursion over the indices 0 .. n-1.

   [f self i] computes entry [i] and may call [self j] for other
   entries.  Every [self j] goes through an array of [n] lazy cells, so
   each entry reached that way is computed at most once; [j] must be a
   valid index of that array.  The returned function applies [f]
   directly to its argument -- only the recursive [self] calls are
   cached. *)
let rec_array n f =
  (* placeholder, replaced below before any cell can be forced *)
  let compute = ref (fun _ -> Complex.zero) in
  let cells = Array.init n (fun i -> lazy (!compute i)) in
  let lookup i = Lazy.force cells.(i) in
  let entry i = f lookup i in
  compute := entry;
  entry
cannam@95 85
cannam@95 86
(* [ctimes use_complex_arith a b] multiplies [a] by [b], using
   [Complex.ctimes] when [use_complex_arith] is set and [Complex.times]
   otherwise. *)
let ctimes use_complex_arith a b =
  let multiply =
    if use_complex_arith then Complex.ctimes else Complex.times
  in
  multiply a b
cannam@95 92
(* [ctimesj use_complex_arith a b] multiplies the conjugate of [a] by
   [b]: through [Complex.ctimesj] when [use_complex_arith] is set,
   otherwise as [Complex.times (Complex.conj a) b]. *)
let ctimesj use_complex_arith a b =
  match use_complex_arith with
  | true -> Complex.ctimesj a b
  | false -> Complex.times (Complex.conj a) b
cannam@95 98
(* [make_bytwiddle sign use_complex_arith g f i] is input [f i]
   multiplied by twiddle factor [g i]:
     - index 0 is returned untouched ([g] is not consulted);
     - when [sign = 1] the product is [ctimes (g i) (f i)];
     - for any other [sign] it is [ctimesj (g i) (f i)], i.e. the
       conjugated factor is used. *)
let make_bytwiddle sign use_complex_arith g f i =
  match i with
  | 0 -> f 0
  | _ ->
      let multiply = if sign = 1 then ctimes else ctimesj in
      multiply use_complex_arith (g i) (f i)
cannam@95 106
cannam@95 107 (* various policies for computing/loading twiddle factors *)
cannam@95 108
(* Policy "load all": every twiddle factor is read from the table.
   Returns the triple [(bytwiddle, twidlen, twdesc)]:
     - [bytwiddle n sign w f] multiplies input [i] (for i > 0) by
       table entry [w (i - 1)]; its first argument is ignored;
     - [twidlen n] is [2 * (n - 1)];
     - [twdesc r] is one TW_FULL instruction for [v] and [r], followed
       by the terminating [(TW_NEXT, 1, 0)]. *)
let twiddle_policy_load_all v use_complex_arith =
  let bytwiddle _n sign w f =
    let table_entry i = w (i - 1) in
    make_bytwiddle sign use_complex_arith table_entry f
  in
  let twidlen n = 2 * (n - 1) in
  let twdesc r = [ (TW_FULL, v, r); (TW_NEXT, 1, 0) ] in
  (bytwiddle, twidlen, twdesc)
cannam@95 115
(*
 * Policy "log2": only the factors whose index is a power of two are
 * loaded; the others are built by multiplication.
 *
 *   if i is a power of two, then load w (log i)
 *   else let x = largest power of 2 less than i in
 *        let y = i - x in
 *        compute w^{x+y} = w^x * w^y
 *
 * Returns the triple (bytwiddle, twidlen, twdesc); twdesc lists one
 * TW_CEXP per positive power of two found in (iota n), followed by the
 * terminating (TW_NEXT, 1, 0).
 *)
let twiddle_policy_log2 v use_complex_arith =
  let bytwiddle n sign w f =
    (* factor i, expressed through already-known smaller factors *)
    let derive self i =
      if i = 0 then Complex.one
      else if is_pow 2 i then w (log 2 i)
      else
        let hi = largest_power_smaller_than 2 i in
        let lo = i - hi in
        ctimes use_complex_arith (self hi) (self lo)
    in
    make_bytwiddle sign use_complex_arith (rec_array n derive) f
  in
  let twidlen n = 2 * log 2 (largest_power_smaller_than 2 ((2 * n) - 1)) in
  let twdesc n =
    let loaded i = i > 0 && is_pow 2 i in
    let loads =
      List.map (fun i -> (TW_CEXP, v, i)) (List.filter loaded (iota n))
    in
    loads @ [ (TW_NEXT, 1, 0) ]
  in
  (bytwiddle, twidlen, twdesc)
cannam@95 143
(* Policy "log3": factors whose index is a power of three are loaded
   (plus, in one case, the factor for index n - 1); every other factor
   is a product of two smaller ones, using the conjugate where the
   index is closer to the next power of three than to the previous one.
   Returns the triple [(bytwiddle, twidlen, twdesc)]. *)
let twiddle_policy_log3 v use_complex_arith =
  (* smallest [count] such that 1 + 3 + ... + 3^(count-1) >= n - 1;
     [step] is the next power of three, [reach] the sum so far *)
  let rec terms_needed count step reach n =
    if reach >= n - 1 then count
    else terms_needed (count + 1) (3 * step) (reach + step) n
  in
  let bytwiddle n sign w f =
    let nterms = terms_needed 0 1 0 n in
    let maxterm = pow 3 (nterms - 1) in
    let derive self i =
      if i = 0 then Complex.one
      else if is_pow 3 i then w (log 3 i)
      else if i = n - 1 && maxterm >= n then
        (* the last table slot holds index n - 1 instead of 3^(nterms-1);
           see the [min] in [twdesc] *)
        w (nterms - 1)
      else
        let above = smallest_power_larger_than 3 i in
        if i + i >= above then
          (* closer to the power above: w^i = conj (w^(p - i)) * w^p *)
          let pivot = min above (n - 1) in
          ctimesj use_complex_arith (self (pivot - i)) (self pivot)
        else
          let below = largest_power_smaller_than 3 i in
          ctimes use_complex_arith (self (i - below)) (self below)
    in
    make_bytwiddle sign use_complex_arith (rec_array (3 * n) derive) f
  in
  let twidlen n = 2 * terms_needed 0 1 0 n in
  let twdesc n =
    (* index 3^k, capped at n - 1 *)
    let load k = (TW_CEXP, v, min (pow 3 k) (n - 1)) in
    List.map load (iota (twidlen n / 2)) @ [ (TW_NEXT, 1, 0) ]
  in
  (bytwiddle, twidlen, twdesc)
cannam@95 173
(* The policy in effect; starts out as [twiddle_policy_load_all] and is
   reassigned by the command-line handlers built with [set_policy]. *)
let current_twiddle_policy = ref twiddle_policy_load_all

(* [twiddle_policy v] applies the policy currently stored in
   [current_twiddle_policy] to [v].  The argument lands in the policy's
   first parameter ([v] in the policy definitions); the policy's
   [use_complex_arith] flag is the next argument the caller supplies.
   The reference is read at call time, so a policy selected after this
   definition is honoured. *)
let twiddle_policy v =
  let policy = !current_twiddle_policy in
  policy v
cannam@95 178
(* [set_policy x] is an [Arg.Unit] action that makes [x] the current
   twiddle policy when the option is seen. *)
let set_policy x =
  let install () = current_twiddle_policy := x in
  Arg.Unit install

(* [set_policy_int x] is an [Arg.Int] action: the option's integer
   argument [i] is passed to [x], and the resulting policy [x i]
   becomes the current one. *)
let set_policy_int x =
  let install i = current_twiddle_policy := x i in
  Arg.Int install
cannam@95 181
(* Help text shared by all twiddle-policy options. *)
let undocumented = " Undocumented twiddle policy"

(* Command-line options, in the (key, action, doc) form used by the
   [Arg] module; each one selects the corresponding twiddle policy. *)
let speclist =
  List.map
    (fun (flag, policy) -> (flag, set_policy policy, undocumented))
    [
      ("-twiddle-load-all", twiddle_policy_load_all);
      ("-twiddle-log2", twiddle_policy_log2);
      ("-twiddle-log3", twiddle_policy_log3);
    ]