comparison src/fftw-3.3.8/simd-support/avx2.c @ 82:d0c2a83c1364

Add FFTW 3.3.8 source, and a Linux build
author Chris Cannam
date Tue, 19 Nov 2019 14:52:55 +0000
parents
children
comparison
equal deleted inserted replaced
81:7029a4916348 82:d0c2a83c1364
1 /*
2 * Copyright (c) 2003, 2007-14 Matteo Frigo
3 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License
16 * along with this program; if not, write to the Free Software
17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
18 *
19 */
20
21
22 #include "kernel/ifftw.h"
23
24 #if HAVE_AVX2
25
26 #if defined(__x86_64__) || defined(_M_X64) || defined(_M_AMD64)
27 # include "amd64-cpuid.h"
28 #else
29 # include "x86-cpuid.h"
30 #endif
31
32 int X(have_simd_avx2_128)(void)
33 {
34 static int init = 0, res;
35 int max_stdfn, eax, ebx, ecx, edx;
36
37 if (!init) {
38 cpuid_all(0,0,&eax,&ebx,&ecx,&edx);
39 max_stdfn = eax;
40 if (max_stdfn >= 0x1) {
41 /* have AVX and OSXSAVE? (implies XGETBV exists) */
42 cpuid_all(0x1, 0, &eax, &ebx, &ecx, &edx);
43 if ((ecx & 0x18000000) == 0x18000000) {
44 /* have AVX2? */
45 cpuid_all(7,0,&eax,&ebx,&ecx,&edx);
46 if (ebx & (1 << 5)) {
47 /* have OS support for XMM, YMM? */
48 res = ((xgetbv_eax(0) & 0x6) == 0x6);
49 }
50 }
51 }
52 init = 1;
53 }
54 return res;
55 }
56
57 int X(have_simd_avx2)(void)
58 {
59 /*
60 * For now 256-bit AVX2 support is identical to 128-bit.
61 * This might change in the future if AMD released AVX2-capable
62 * chips that work better with the 128-bit flavor, but since AMD
63 * might actually change it to implement 256-bit AVX2 efficiently
64 * by then we don't want to disable it before we know.
65 */
66 return X(have_simd_avx2_128)();
67 }
68 #endif