// Copyright 2016 The SwiftShader Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include "CPUID.hpp" #if defined(_WIN32) # ifndef WIN32_LEAN_AND_MEAN # define WIN32_LEAN_AND_MEAN # endif # include # include # include #else # include # include # include #endif namespace rr { static void cpuid(int eax_ebx_ecx_edx[4], int eax, int ecx = 0) { #if defined(__i386__) || defined(__x86_64__) # if defined(_WIN32) __cpuidex(eax_ebx_ecx_edx, eax, ecx); # else __asm volatile("cpuid" : "=a"(eax_ebx_ecx_edx[0]), "=b"(eax_ebx_ecx_edx[1]), "=c"(eax_ebx_ecx_edx[2]), "=d"(eax_ebx_ecx_edx[3]) : "a"(eax), "c"(ecx)); # endif #else eax_ebx_ecx_edx[0] = 0; eax_ebx_ecx_edx[1] = 0; eax_ebx_ecx_edx[2] = 0; eax_ebx_ecx_edx[3] = 0; #endif } bool CPUID::supportsSSE4_1() { int eax_ebx_ecx_edx[4]; cpuid(eax_ebx_ecx_edx, 1); return (eax_ebx_ecx_edx[2] & 0x00080000) != 0; } bool CPUID::supportsAVX2() { int eax_ebx_ecx_edx[4]; cpuid(eax_ebx_ecx_edx, 1); // Test bits 12 (FMA), 27 (OSXSAVE), and 28 (AVX) of ECX bool osxsave_avx_fma = (eax_ebx_ecx_edx[2] & 0x18001000) == 0x18001000; // AVX is a prerequisite of AVX2 and must be checked for first according to the Intel Software Developer's Manual. // OSXSAVE ensures the operating system can save/restore ymm registers on context switches. // FMA support is often considered an integral part of AVX2. if(!osxsave_avx_fma) { return false; } cpuid(eax_ebx_ecx_edx, 7, 0); // Valid if AVX is supported return (eax_ebx_ecx_edx[1] & 0x00000020) != 0; } } // namespace rr