annotate src/fftw-3.3.3/support/addchain.c @ 127:7867fa7e1b6b

Current fftw source
author Chris Cannam <cannam@all-day-breakfast.com>
date Tue, 18 Oct 2016 13:40:26 +0100
parents 89f5e221ed7b
children
rev   line source
cannam@95 1 /* addition-chain optimizer */
cannam@95 2 #include <stdio.h>
cannam@95 3 #include <stdlib.h>
cannam@95 4 #include <unistd.h>
cannam@95 5
/* Cost given to every table entry that has not been derived yet; also the
   initial value of best_so_far. */
#define INFTY 100000

/* Nonzero: print each improved answer as soon as the search finds it. */
static int verbose;

/* Cost model used by optimize(). */
static int ldcost = 2;    /* cost of an entry that is selected directly */
static int sqcost = 10;   /* added when entry i+i is derived from entry i */
static int mulcost = 18;  /* added when entry i+j or i-j is derived from i, j */
static int reflcost = 8;  /* added when entry i+j is derived from i, j, i-j */

/* Best selection seen so far (t values) and its total cost. */
static int *answer;
static int best_so_far;
cannam@95 15
cannam@95 16 static void print_answer(int n, int t)
cannam@95 17 {
cannam@95 18 int i;
cannam@95 19 printf("| (%d, %d) -> [", n, t);
cannam@95 20 for (i = 0; i < t; ++i)
cannam@95 21 printf("%d;", answer[i]);
cannam@95 22 printf("] (* %d *)\n", best_so_far);
cannam@95 23 }
cannam@95 24
/*
 * Relaxation steps used by optimize().
 *
 * DO(i, j, k, cst):     if k is a valid index, lower A[k] to
 *                       A[i] + A[j] + cst when that is cheaper.
 * DO3(i, j, l, k, cst): same, with the three-term sum
 *                       A[i] + A[j] + A[l] + cst.
 *
 * Both macros deliberately pick up `n` (table size), `A` (cost table) and
 * `changed` (set to 1 on every improvement) from the scope in which they
 * are expanded.
 *
 * They are wrapped in do { } while (0) so that they behave as a single
 * statement (safe in an unbraced if/else), every argument is parenthesized,
 * and the target index is evaluated exactly once.  Indices outside
 * [0, n) are ignored; A[i], A[j], A[l] are only read when k is in range.
 */
#define DO(i, j, k, cst)                                        \
    do {                                                        \
        int do_k_ = (k);                                        \
        if (do_k_ >= 0 && do_k_ < n) {                          \
            int do_c_ = A[(i)] + A[(j)] + (cst);                \
            if (do_c_ < A[do_k_]) {                             \
                A[do_k_] = do_c_;                               \
                changed = 1;                                    \
            }                                                   \
        }                                                       \
    } while (0)

#define DO3(i, j, l, k, cst)                                    \
    do {                                                        \
        int do_k_ = (k);                                        \
        if (do_k_ >= 0 && do_k_ < n) {                          \
            int do_c_ = A[(i)] + A[(j)] + A[(l)] + (cst);       \
            if (do_c_ < A[do_k_]) {                             \
                A[do_k_] = do_c_;                               \
                changed = 1;                                    \
            }                                                   \
        }                                                       \
    } while (0)
cannam@95 42
cannam@95 43 static int optimize(int n, int *A)
cannam@95 44 {
cannam@95 45 int i, j, k, changed, cst, cstmax;
cannam@95 46
cannam@95 47 do {
cannam@95 48 changed = 0;
cannam@95 49 for (i = 0; i < n; ++i) {
cannam@95 50 k = i + i;
cannam@95 51 DO(i, i, k, sqcost);
cannam@95 52 }
cannam@95 53
cannam@95 54 for (i = 0; i < n; ++i) {
cannam@95 55 for (j = 0; j <= i; ++j) {
cannam@95 56 k = i + j;
cannam@95 57 DO(i, j, k, mulcost);
cannam@95 58 k = i - j;
cannam@95 59 DO(i, j, k, mulcost);
cannam@95 60
cannam@95 61 k = i + j;
cannam@95 62 DO3(i, j, i - j, k, reflcost);
cannam@95 63 }
cannam@95 64 }
cannam@95 65
cannam@95 66 } while (changed);
cannam@95 67
cannam@95 68 cst = cstmax = 0;
cannam@95 69 for (i = 0; i < n; ++i) {
cannam@95 70 cst += A[i];
cannam@95 71 if (A[i] > cstmax) cstmax = A[i];
cannam@95 72 }
cannam@95 73 /* return cstmax; */
cannam@95 74 return cst;
cannam@95 75 }
cannam@95 76
cannam@95 77 static void search(int n, int t, int *A, int *B, int depth)
cannam@95 78 {
cannam@95 79 if (depth == 0) {
cannam@95 80 int i, tc;
cannam@95 81 for (i = 0; i < n; ++i)
cannam@95 82 A[i] = INFTY;
cannam@95 83 A[0] = 0; /* always free */
cannam@95 84 for (i = 1; i <= t; ++i)
cannam@95 85 A[B[-i]] = ldcost;
cannam@95 86
cannam@95 87 tc = optimize(n, A);
cannam@95 88 if (tc < best_so_far) {
cannam@95 89 best_so_far = tc;
cannam@95 90 for (i = 1; i <= t; ++i)
cannam@95 91 answer[t - i] = B[-i];
cannam@95 92 if (verbose)
cannam@95 93 print_answer(n, t);
cannam@95 94 }
cannam@95 95 } else {
cannam@95 96 for (B[0] = B[-1] + 1; B[0] < n; ++B[0])
cannam@95 97 search(n, t, A, B + 1, depth - 1);
cannam@95 98 }
cannam@95 99 }
cannam@95 100
cannam@95 101 static void doit(int n, int t)
cannam@95 102 {
cannam@95 103 int *A;
cannam@95 104 int *B;
cannam@95 105
cannam@95 106 A = malloc(n * sizeof(int));
cannam@95 107 B = malloc((t + 1) * sizeof(int));
cannam@95 108 answer = malloc(t * sizeof(int));
cannam@95 109
cannam@95 110 B[0] = 0;
cannam@95 111 best_so_far = INFTY;
cannam@95 112 search(n, t, A, B + 1, t);
cannam@95 113
cannam@95 114 print_answer(n, t);
cannam@95 115
cannam@95 116 free(A); free(B); free(answer);
cannam@95 117 }
cannam@95 118
cannam@95 119 int main(int argc, char *argv[])
cannam@95 120 {
cannam@95 121 int n = 32;
cannam@95 122 int t = 3;
cannam@95 123 int all;
cannam@95 124 int ch;
cannam@95 125
cannam@95 126 verbose = 0;
cannam@95 127 all = 0;
cannam@95 128 while ((ch = getopt(argc, argv, "n:t:m:l:r:s:va")) != -1) {
cannam@95 129 switch (ch) {
cannam@95 130 case 'n':
cannam@95 131 n = atoi(optarg);
cannam@95 132 break;
cannam@95 133 case 't':
cannam@95 134 t = atoi(optarg);
cannam@95 135 break;
cannam@95 136 case 'm':
cannam@95 137 mulcost = atoi(optarg);
cannam@95 138 break;
cannam@95 139 case 'l':
cannam@95 140 ldcost = atoi(optarg);
cannam@95 141 break;
cannam@95 142 case 's':
cannam@95 143 sqcost = atoi(optarg);
cannam@95 144 break;
cannam@95 145 case 'r':
cannam@95 146 reflcost = atoi(optarg);
cannam@95 147 break;
cannam@95 148 case 'v':
cannam@95 149 ++verbose;
cannam@95 150 break;
cannam@95 151 case 'a':
cannam@95 152 ++all;
cannam@95 153 break;
cannam@95 154 case '?':
cannam@95 155 fprintf(stderr, "use the source\n");
cannam@95 156 exit(1);
cannam@95 157 }
cannam@95 158 }
cannam@95 159
cannam@95 160 if (all) {
cannam@95 161 for (n = 4; n <= 64; n *= 2) {
cannam@95 162 int n1 = n - 1; if (n1 > 7) n1 = 7;
cannam@95 163 for (t = 1; t <= n1; ++t)
cannam@95 164 doit(n, t);
cannam@95 165 }
cannam@95 166 } else {
cannam@95 167 doit(n, t);
cannam@95 168 }
cannam@95 169
cannam@95 170 return 0;
cannam@95 171 }