blob: b8a67cf98ad02a4ad3ba291ba64ba7eceb8df149 [file] [log] [blame]
// Copyright 2016 The SwiftShader Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#include "CPUID.hpp"
#if defined(_WIN32)
# ifndef WIN32_LEAN_AND_MEAN
# define WIN32_LEAN_AND_MEAN
# endif
# include <windows.h>
# include <intrin.h>
# include <float.h>
#else
# include <unistd.h>
# include <sched.h>
# include <sys/types.h>
#endif
namespace rr {
static void cpuid(int eax_ebx_ecx_edx[4], int eax, int ecx = 0)
{
#if defined(__i386__) || defined(__x86_64__)
# if defined(_WIN32)
__cpuidex(eax_ebx_ecx_edx, eax, ecx);
# else
__asm volatile("cpuid"
: "=a"(eax_ebx_ecx_edx[0]), "=b"(eax_ebx_ecx_edx[1]), "=c"(eax_ebx_ecx_edx[2]), "=d"(eax_ebx_ecx_edx[3])
: "a"(eax), "c"(ecx));
# endif
#else
eax_ebx_ecx_edx[0] = 0;
eax_ebx_ecx_edx[1] = 0;
eax_ebx_ecx_edx[2] = 0;
eax_ebx_ecx_edx[3] = 0;
#endif
}
bool CPUID::supportsSSE4_1()
{
int eax_ebx_ecx_edx[4];
cpuid(eax_ebx_ecx_edx, 1);
return (eax_ebx_ecx_edx[2] & 0x00080000) != 0;
}
bool CPUID::supportsAVX2()
{
int eax_ebx_ecx_edx[4];
cpuid(eax_ebx_ecx_edx, 1);
// Test bits 12 (FMA), 27 (OSXSAVE), and 28 (AVX) of ECX
bool osxsave_avx_fma = (eax_ebx_ecx_edx[2] & 0x18001000) == 0x18001000;
// AVX is a prerequisite of AVX2 and must be checked for first according to the Intel Software Developer's Manual.
// OSXSAVE ensures the operating system can save/restore ymm registers on context switches.
// FMA support is often considered an integral part of AVX2.
if(!osxsave_avx_fma)
{
return false;
}
cpuid(eax_ebx_ecx_edx, 7, 0); // Valid if AVX is supported
return (eax_ebx_ecx_edx[1] & 0x00000020) != 0;
}
} // namespace rr