cannam@127: /* cannam@127: * Copyright (c) 2003, 2007-11 Matteo Frigo cannam@127: * Copyright (c) 2003, 2007-11 Massachusetts Institute of Technology cannam@127: * Copyright (c) 2012-2013 Romain Dolbeau cannam@127: * cannam@127: * Permission is hereby granted, free of charge, to any person obtaining a copy cannam@127: * of this software and associated documentation files (the "Software"), to deal cannam@127: * in the Software without restriction, including without limitation the rights cannam@127: * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell cannam@127: * copies of the Software, and to permit persons to whom the Software is cannam@127: * furnished to do so, subject to the following conditions: cannam@127: * cannam@127: * The above copyright notice and this permission notice shall be included in cannam@127: * all copies or substantial portions of the Software. cannam@127: * cannam@127: * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR cannam@127: * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, cannam@127: * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE cannam@127: * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER cannam@127: * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, cannam@127: * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN cannam@127: * THE SOFTWARE. cannam@127: * cannam@127: */ cannam@127: cannam@127: #include "ifftw.h" cannam@127: cannam@127: #if HAVE_AVX512 cannam@127: cannam@127: #if defined(__x86_64__) || defined(_M_X64) || defined(_M_AMD64) cannam@127: cannam@127: #include "amd64-cpuid.h" cannam@127: cannam@127: int X(have_simd_avx512)(void) cannam@127: { cannam@127: static int init = 0, res; cannam@127: int max_stdfn, eax, ebx, ecx, edx; cannam@127: cannam@127: /* NOTE: this code is a total guess. I don't have an avx512 cannam@127: machine available. The code contributed by Erik Lindahl would cannam@127: crash on a machine without XGETBV, so I had to guess a fix. */ cannam@127: if (!init) { cannam@127: cpuid_all(0,0,&eax,&ebx,&ecx,&edx); cannam@127: max_stdfn = eax; cannam@127: if (max_stdfn >= 0x1) { cannam@127: /* have OSXSAVE? (implies XGETBV exists) */ cannam@127: cpuid_all(0x1, 0, &eax, &ebx, &ecx, &edx); cannam@127: if ((ecx & 0x08000000) == 0x08000000) { cannam@127: /* have AVX512? */ cannam@127: cpuid_all(7,0,&eax,&ebx,&ecx,&edx); cannam@127: if (ebx & (1 << 16)) { cannam@127: /* have OS support for XMM, YMM, ZMM */ cannam@127: int zmm_ymm_xmm = (7 << 5) | (1 << 2) | (1 << 1); cannam@127: res = ((xgetbv_eax(0) & zmm_ymm_xmm) == zmm_ymm_xmm); cannam@127: } cannam@127: } cannam@127: } cannam@127: init = 1; cannam@127: } cannam@127: cannam@127: return res; cannam@127: } cannam@127: cannam@127: #else /* 32-bit code */ cannam@127: cannam@127: #error "Avx512 is 64 bits only" cannam@127: cannam@127: #endif cannam@127: cannam@127: #endif