annotate fft/fftw/fftw-3.3.4/simd-support/amd64-cpuid.h @ 40:223f770b5341 kissfft-double tip

Try a double-precision kissfft
author Chris Cannam
date Wed, 07 Sep 2016 10:40:32 +0100
parents 26056e866c29
children
rev   line source
Chris@19 1 /*
Chris@19 2 * Copyright (c) 2003, 2007-14 Matteo Frigo
Chris@19 3 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
Chris@19 4 *
Chris@19 5 * This program is free software; you can redistribute it and/or modify
Chris@19 6 * it under the terms of the GNU General Public License as published by
Chris@19 7 * the Free Software Foundation; either version 2 of the License, or
Chris@19 8 * (at your option) any later version.
Chris@19 9 *
Chris@19 10 * This program is distributed in the hope that it will be useful,
Chris@19 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Chris@19 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
Chris@19 13 * GNU General Public License for more details.
Chris@19 14 *
Chris@19 15 * You should have received a copy of the GNU General Public License
Chris@19 16 * along with this program; if not, write to the Free Software
Chris@19 17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Chris@19 18 *
Chris@19 19 */
Chris@19 20
Chris@19 21
Chris@19 22 #ifdef _MSC_VER
Chris@19 23 #ifndef inline
Chris@19 24 #define inline __inline
Chris@19 25 #endif
Chris@19 26 #endif
Chris@19 27
Chris@19 28 #ifdef _MSC_VER
Chris@19 29 #include <intrin.h>
Chris@19 30 #if (_MSC_VER >= 1600) && !defined(__INTEL_COMPILER)
Chris@19 31 #include <immintrin.h>
Chris@19 32 #endif
Chris@19 33 #endif
Chris@19 34
/*
 * Execute the CPUID instruction with EAX = op and ECX = 0 and return
 * the value the instruction leaves in ECX.
 *
 * op: CPUID leaf number to query.
 *
 * CPUID overwrites EAX, EBX, ECX and EDX.  Only ECX is returned; the
 * other three results are discarded.
 */
static inline int cpuid_ecx(int op)
{
#  ifdef _MSC_VER
#    ifdef __INTEL_COMPILER
     int result;

     /* rbx is saved and restored by hand around CPUID; ecx is zeroed
        so the sub-leaf selector is well defined. */
     _asm {
	  push rbx
	  mov eax,op
	  xor ecx,ecx
	  cpuid
	  mov result,ecx
	  pop rbx
     }
     return result;
#    else
     /* cpu_info receives EAX, EBX, ECX, EDX in that order, so index 2
        is ECX.  NOTE(review): Microsoft documents __cpuid as clearing
        ECX before executing CPUID; confirm against the toolchain in use. */
     int cpu_info[4];
     __cpuid(cpu_info,op);
     return cpu_info[2];
#    endif
#  else
     int eax, ebx, ecx, edx;

     /*
      * Declare EBX as an output so the compiler knows CPUID overwrites
      * it, instead of saving it with pushq/popq inside the asm.  A push
      * that the compiler does not know about can overwrite live data
      * in the red zone below %rsp once this function is inlined.
      *
      * ECX is passed as 0 so the sub-leaf selector is not left holding
      * whatever happened to be in the register.
      */
     __asm__("cpuid"
	     : "=a" (eax), "=b" (ebx), "=c" (ecx), "=d" (edx)
	     : "a" (op), "c" (0));
     return ecx;
#  endif
}
Chris@19 62
/*
 * Execute XGETBV with ECX = op and return the low 32 bits of the
 * result (the value left in EAX).  The high half (EDX) is discarded.
 *
 * op: index of the extended control register to read.
 *
 * NOTE(review): nothing here checks that XGETBV is available; callers
 * presumably test the CPUID OSXSAVE flag first -- confirm at call sites.
 */
static inline int xgetbv_eax(int op)
{
#if defined(_MSC_VER) && defined(__INTEL_COMPILER)
     /* Intel compiler in MSVC mode: inline assembly block. */
     int lo, hi;
     _asm {
	  mov ecx,op
	  xgetbv
	  mov lo,eax
	  mov hi,edx
     }
     return lo;
#elif defined(_MSC_VER) && (_MSC_VER >= 1600)
     /* Microsoft compiler: _xgetbv yields a 64-bit value; keep the
        low 32 bits. */
     return (int)(unsigned __int64)_xgetbv(op);
#elif defined(_MSC_VER)
#  error "Need at least Visual Studio 10 SP1 for AVX support"
#else
     /* GCC-style compilers: XGETBV is emitted as raw opcode bytes
        (0f 01 d0) rather than by mnemonic. */
     int lo, hi;
     __asm__ (".byte 0x0f, 0x01, 0xd0" : "=a"(lo), "=d"(hi) : "c" (op));
     return lo;
#endif
}