/**************************************************************************** * Copyright (C) 2014-2015 Intel Corporation. All Rights Reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice (including the next * paragraph) shall be included in all copies or substantial portions of the * Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS * IN THE SOFTWARE. ****************************************************************************/ #pragma once #include #include #include #include #include #include // Clang for Windows does supply an intrin.h with __cpuid intrinsics, however... // It seems to not realize that a write to "b" (ebx) will kill the value in rbx. // This attempts to use the "native" clang / gcc intrinsics instead of the windows // compatible ones. #if defined(_MSC_VER) && !defined(__clang__) #include #else #include #if !defined(__cpuid) #include #endif #endif class InstructionSet { public: InstructionSet() : CPU_Rep(){}; // getters std::string Vendor(void) { return CPU_Rep.vendor_; } std::string Brand(void) { return CPU_Rep.brand_; } bool SSE3(void) { return CPU_Rep.f_1_ECX_[0]; } bool PCLMULQDQ(void) { return CPU_Rep.f_1_ECX_[1]; } bool MONITOR(void) { return CPU_Rep.f_1_ECX_[3]; } bool SSSE3(void) { return CPU_Rep.f_1_ECX_[9]; } bool FMA(void) { return CPU_Rep.f_1_ECX_[12]; } bool CMPXCHG16B(void) { return CPU_Rep.f_1_ECX_[13]; } bool SSE41(void) { return CPU_Rep.f_1_ECX_[19]; } bool SSE42(void) { return CPU_Rep.f_1_ECX_[20]; } bool MOVBE(void) { return CPU_Rep.f_1_ECX_[22]; } bool POPCNT(void) { return CPU_Rep.f_1_ECX_[23]; } bool AES(void) { return CPU_Rep.f_1_ECX_[25]; } bool XSAVE(void) { return CPU_Rep.f_1_ECX_[26]; } bool OSXSAVE(void) { return CPU_Rep.f_1_ECX_[27]; } bool RDRAND(void) { return CPU_Rep.f_1_ECX_[30]; } bool MSR(void) { return CPU_Rep.f_1_EDX_[5]; } bool CX8(void) { return CPU_Rep.f_1_EDX_[8]; } bool SEP(void) { return CPU_Rep.f_1_EDX_[11]; } bool CMOV(void) { return CPU_Rep.f_1_EDX_[15]; } bool CLFSH(void) { return CPU_Rep.f_1_EDX_[19]; } bool MMX(void) { return CPU_Rep.f_1_EDX_[23]; } bool FXSR(void) { return CPU_Rep.f_1_EDX_[24]; } bool SSE(void) { return CPU_Rep.f_1_EDX_[25]; } bool SSE2(void) { return CPU_Rep.f_1_EDX_[26]; } bool FSGSBASE(void) { return CPU_Rep.f_7_EBX_[0]; } bool BMI1(void) { return CPU_Rep.f_7_EBX_[3]; } bool HLE(void) { return CPU_Rep.isIntel_ && CPU_Rep.f_7_EBX_[4]; } bool BMI2(void) { return CPU_Rep.f_7_EBX_[8]; } bool ERMS(void) { return CPU_Rep.f_7_EBX_[9]; } bool INVPCID(void) { return CPU_Rep.f_7_EBX_[10]; } bool RTM(void) { return CPU_Rep.isIntel_ && CPU_Rep.f_7_EBX_[11]; } bool RDSEED(void) { return CPU_Rep.f_7_EBX_[18]; } bool ADX(void) { return CPU_Rep.f_7_EBX_[19]; } bool SHA(void) { return CPU_Rep.f_7_EBX_[29]; } bool PREFETCHWT1(void) { return CPU_Rep.f_7_ECX_[0]; } bool LAHF(void) { return CPU_Rep.f_81_ECX_[0]; } bool LZCNT(void) { return CPU_Rep.isIntel_ && CPU_Rep.f_81_ECX_[5]; } bool ABM(void) { return CPU_Rep.isAMD_ && CPU_Rep.f_81_ECX_[5]; } bool SSE4a(void) { return CPU_Rep.isAMD_ && CPU_Rep.f_81_ECX_[6]; } bool XOP(void) { return CPU_Rep.isAMD_ && CPU_Rep.f_81_ECX_[11]; } bool TBM(void) { return CPU_Rep.isAMD_ && CPU_Rep.f_81_ECX_[21]; } bool SYSCALL(void) { return CPU_Rep.isIntel_ && CPU_Rep.f_81_EDX_[11]; } bool MMXEXT(void) { return CPU_Rep.isAMD_ && CPU_Rep.f_81_EDX_[22]; } bool RDTSCP(void) { return CPU_Rep.isIntel_ && CPU_Rep.f_81_EDX_[27]; } bool _3DNOWEXT(void) { return CPU_Rep.isAMD_ && CPU_Rep.f_81_EDX_[30]; } bool _3DNOW(void) { return CPU_Rep.isAMD_ && CPU_Rep.f_81_EDX_[31]; } bool AVX(void) { return CPU_Rep.f_1_ECX_[28]; } bool F16C(void) { return CPU_Rep.f_1_ECX_[29]; } bool AVX2(void) { return CPU_Rep.f_7_EBX_[5]; } bool AVX512F(void) { return CPU_Rep.f_7_EBX_[16]; } bool AVX512PF(void) { return CPU_Rep.f_7_EBX_[26]; } bool AVX512ER(void) { return CPU_Rep.f_7_EBX_[27]; } bool AVX512CD(void) { return CPU_Rep.f_7_EBX_[28]; } private: class InstructionSet_Internal { public: InstructionSet_Internal() : nIds_{0}, nExIds_{0}, isIntel_{false}, isAMD_{false}, f_1_ECX_{0}, f_1_EDX_{0}, f_7_EBX_{0}, f_7_ECX_{0}, f_81_ECX_{0}, f_81_EDX_{0}, data_{}, extdata_{} { // int cpuInfo[4] = {-1}; std::array cpui; // Calling __cpuid with 0x0 as the function_id argument // gets the number of the highest valid function ID. #if defined(_MSC_VER) && !defined(__clang__) __cpuid(cpui.data(), 0); nIds_ = cpui[0]; #else nIds_ = __get_cpuid_max(0, NULL); #endif for (int i = 0; i <= nIds_; ++i) { #if defined(_MSC_VER) && !defined(__clang__) __cpuidex(cpui.data(), i, 0); #else int* data = cpui.data(); __cpuid_count(i, 0, data[0], data[1], data[2], data[3]); #endif data_.push_back(cpui); } // Capture vendor string char vendor[0x20]; memset(vendor, 0, sizeof(vendor)); *reinterpret_cast(vendor) = data_[0][1]; *reinterpret_cast(vendor + 4) = data_[0][3]; *reinterpret_cast(vendor + 8) = data_[0][2]; vendor_ = vendor; if (vendor_ == "GenuineIntel") { isIntel_ = true; } else if (vendor_ == "AuthenticAMD") { isAMD_ = true; } // load bitset with flags for function 0x00000001 if (nIds_ >= 1) { f_1_ECX_ = data_[1][2]; f_1_EDX_ = data_[1][3]; } // load bitset with flags for function 0x00000007 if (nIds_ >= 7) { f_7_EBX_ = data_[7][1]; f_7_ECX_ = data_[7][2]; } // Calling __cpuid with 0x80000000 as the function_id argument // gets the number of the highest valid extended ID. #if defined(_MSC_VER) && !defined(__clang__) __cpuid(cpui.data(), 0x80000000); nExIds_ = cpui[0]; #else nExIds_ = __get_cpuid_max(0x80000000, NULL); #endif char brand[0x40]; memset(brand, 0, sizeof(brand)); for (unsigned i = 0x80000000; i <= nExIds_; ++i) { #if defined(_MSC_VER) && !defined(__clang__) __cpuidex(cpui.data(), i, 0); #else int* data = cpui.data(); __cpuid_count(i, 0, data[0], data[1], data[2], data[3]); #endif extdata_.push_back(cpui); } // load bitset with flags for function 0x80000001 if (nExIds_ >= 0x80000001) { f_81_ECX_ = extdata_[1][2]; f_81_EDX_ = extdata_[1][3]; } // Interpret CPU brand string if reported if (nExIds_ >= 0x80000004) { memcpy(brand, extdata_[2].data(), sizeof(cpui)); memcpy(brand + 16, extdata_[3].data(), sizeof(cpui)); memcpy(brand + 32, extdata_[4].data(), sizeof(cpui)); brand_ = brand; } }; int nIds_; unsigned nExIds_; std::string vendor_; std::string brand_; bool isIntel_; bool isAMD_; std::bitset<32> f_1_ECX_; std::bitset<32> f_1_EDX_; std::bitset<32> f_7_EBX_; std::bitset<32> f_7_ECX_; std::bitset<32> f_81_ECX_; std::bitset<32> f_81_EDX_; std::vector> data_; std::vector> extdata_; }; const InstructionSet_Internal CPU_Rep; };