annotate src/fftw-3.3.5/support/addchain.c @ 148:b4bfdf10c4b3

Update Win64 capnp builds to v0.6
author Chris Cannam <cannam@all-day-breakfast.com>
date Mon, 22 May 2017 18:56:49 +0100
parents 7867fa7e1b6b
children
rev   line source
cannam@127 1 /* addition-chain optimizer */
cannam@127 2 #include <stdio.h>
cannam@127 3 #include <stdlib.h>
cannam@127 4 #include <unistd.h>
cannam@127 5
cannam@127 6 static int verbose; /* incremented once per -v; when nonzero, search() prints every improved solution as it is found */
cannam@127 7 static int mulcost = 18; /* cost added when entry i+j or i-j is formed from entries i and j (option -m) */
cannam@127 8 static int ldcost = 2; /* cost assigned to each of the t entries chosen by search() (option -l) */
cannam@127 9 static int sqcost = 10; /* cost added when entry 2i is formed from entry i (option -s) */
cannam@127 10 static int reflcost = 8; /* cost added when entry i+j is formed from entries i, j and i-j (option -r) */
cannam@127 11 #define INFTY 100000 /* cost of an entry that has not been derived yet; also the initial best_so_far */
cannam@127 12
cannam@127 13 static int *answer; /* the t chosen entries of the cheapest solution found so far; allocated and freed in doit() */
cannam@127 14 static int best_so_far; /* total cost of that solution; stays INFTY until search() finds something cheaper */
cannam@127 15
cannam@127 16 static void print_answer(int n, int t)
cannam@127 17 {
cannam@127 18 int i;
cannam@127 19 printf("| (%d, %d) -> [", n, t);
cannam@127 20 for (i = 0; i < t; ++i)
cannam@127 21 printf("%d;", answer[i]);
cannam@127 22 printf("] (* %d *)\n", best_so_far);
cannam@127 23 }
cannam@127 24
/*
 * DO(i, j, k, cst): try to lower the cost of entry k using entries i and j.
 *
 * If k < n and A[i] + A[j] + cst is smaller than A[k], store the smaller
 * value in A[k] and set `changed` to 1.  Entries with k >= n are ignored;
 * k must not be negative.
 *
 * The macro reads `n` and `A` and writes `changed` from the enclosing scope.
 * It is wrapped in do { } while (0) so that it behaves as a single statement
 * (safe in an unbraced if/else), and k is evaluated exactly once.
 */
#define DO(i, j, k, cst)                                  \
    do {                                                  \
        const int do_k = (k);                             \
        if (do_k < n) {                                   \
            const int do_c = A[(i)] + A[(j)] + (cst);     \
            if (do_c < A[do_k]) {                         \
                A[do_k] = do_c;                           \
                changed = 1;                              \
            }                                             \
        }                                                 \
    } while (0)
cannam@127 33
/*
 * DO3(i, j, l, k, cst): try to lower the cost of entry k using the three
 * entries i, j and l.
 *
 * If k < n and A[i] + A[j] + A[l] + cst is smaller than A[k], store the
 * smaller value in A[k] and set `changed` to 1.  Entries with k >= n are
 * ignored; k must not be negative.
 *
 * The macro reads `n` and `A` and writes `changed` from the enclosing scope.
 * It is wrapped in do { } while (0) so that it behaves as a single statement
 * (safe in an unbraced if/else), and k is evaluated exactly once.
 */
#define DO3(i, j, l, k, cst)                                        \
    do {                                                            \
        const int do3_k = (k);                                      \
        if (do3_k < n) {                                            \
            const int do3_c = A[(i)] + A[(j)] + A[(l)] + (cst);     \
            if (do3_c < A[do3_k]) {                                 \
                A[do3_k] = do3_c;                                   \
                changed = 1;                                        \
            }                                                       \
        }                                                           \
    } while (0)
cannam@127 42
cannam@127 43 static int optimize(int n, int *A)
cannam@127 44 {
cannam@127 45 int i, j, k, changed, cst, cstmax;
cannam@127 46
cannam@127 47 do {
cannam@127 48 changed = 0;
cannam@127 49 for (i = 0; i < n; ++i) {
cannam@127 50 k = i + i;
cannam@127 51 DO(i, i, k, sqcost);
cannam@127 52 }
cannam@127 53
cannam@127 54 for (i = 0; i < n; ++i) {
cannam@127 55 for (j = 0; j <= i; ++j) {
cannam@127 56 k = i + j;
cannam@127 57 DO(i, j, k, mulcost);
cannam@127 58 k = i - j;
cannam@127 59 DO(i, j, k, mulcost);
cannam@127 60
cannam@127 61 k = i + j;
cannam@127 62 DO3(i, j, i - j, k, reflcost);
cannam@127 63 }
cannam@127 64 }
cannam@127 65
cannam@127 66 } while (changed);
cannam@127 67
cannam@127 68 cst = cstmax = 0;
cannam@127 69 for (i = 0; i < n; ++i) {
cannam@127 70 cst += A[i];
cannam@127 71 if (A[i] > cstmax) cstmax = A[i];
cannam@127 72 }
cannam@127 73 /* return cstmax; */
cannam@127 74 return cst;
cannam@127 75 }
cannam@127 76
cannam@127 77 static void search(int n, int t, int *A, int *B, int depth)
cannam@127 78 {
cannam@127 79 if (depth == 0) {
cannam@127 80 int i, tc;
cannam@127 81 for (i = 0; i < n; ++i)
cannam@127 82 A[i] = INFTY;
cannam@127 83 A[0] = 0; /* always free */
cannam@127 84 for (i = 1; i <= t; ++i)
cannam@127 85 A[B[-i]] = ldcost;
cannam@127 86
cannam@127 87 tc = optimize(n, A);
cannam@127 88 if (tc < best_so_far) {
cannam@127 89 best_so_far = tc;
cannam@127 90 for (i = 1; i <= t; ++i)
cannam@127 91 answer[t - i] = B[-i];
cannam@127 92 if (verbose)
cannam@127 93 print_answer(n, t);
cannam@127 94 }
cannam@127 95 } else {
cannam@127 96 for (B[0] = B[-1] + 1; B[0] < n; ++B[0])
cannam@127 97 search(n, t, A, B + 1, depth - 1);
cannam@127 98 }
cannam@127 99 }
cannam@127 100
cannam@127 101 static void doit(int n, int t)
cannam@127 102 {
cannam@127 103 int *A;
cannam@127 104 int *B;
cannam@127 105
cannam@127 106 A = malloc(n * sizeof(int));
cannam@127 107 B = malloc((t + 1) * sizeof(int));
cannam@127 108 answer = malloc(t * sizeof(int));
cannam@127 109
cannam@127 110 B[0] = 0;
cannam@127 111 best_so_far = INFTY;
cannam@127 112 search(n, t, A, B + 1, t);
cannam@127 113
cannam@127 114 print_answer(n, t);
cannam@127 115
cannam@127 116 free(A); free(B); free(answer);
cannam@127 117 }
cannam@127 118
cannam@127 119 int main(int argc, char *argv[])
cannam@127 120 {
cannam@127 121 int n = 32;
cannam@127 122 int t = 3;
cannam@127 123 int all;
cannam@127 124 int ch;
cannam@127 125
cannam@127 126 verbose = 0;
cannam@127 127 all = 0;
cannam@127 128 while ((ch = getopt(argc, argv, "n:t:m:l:r:s:va")) != -1) {
cannam@127 129 switch (ch) {
cannam@127 130 case 'n':
cannam@127 131 n = atoi(optarg);
cannam@127 132 break;
cannam@127 133 case 't':
cannam@127 134 t = atoi(optarg);
cannam@127 135 break;
cannam@127 136 case 'm':
cannam@127 137 mulcost = atoi(optarg);
cannam@127 138 break;
cannam@127 139 case 'l':
cannam@127 140 ldcost = atoi(optarg);
cannam@127 141 break;
cannam@127 142 case 's':
cannam@127 143 sqcost = atoi(optarg);
cannam@127 144 break;
cannam@127 145 case 'r':
cannam@127 146 reflcost = atoi(optarg);
cannam@127 147 break;
cannam@127 148 case 'v':
cannam@127 149 ++verbose;
cannam@127 150 break;
cannam@127 151 case 'a':
cannam@127 152 ++all;
cannam@127 153 break;
cannam@127 154 case '?':
cannam@127 155 fprintf(stderr, "use the source\n");
cannam@127 156 exit(1);
cannam@127 157 }
cannam@127 158 }
cannam@127 159
cannam@127 160 if (all) {
cannam@127 161 for (n = 4; n <= 64; n *= 2) {
cannam@127 162 int n1 = n - 1; if (n1 > 7) n1 = 7;
cannam@127 163 for (t = 1; t <= n1; ++t)
cannam@127 164 doit(n, t);
cannam@127 165 }
cannam@127 166 } else {
cannam@127 167 doit(n, t);
cannam@127 168 }
cannam@127 169
cannam@127 170 return 0;
cannam@127 171 }