2011-04-27 11:58:34 +00:00
|
|
|
/*
|
2013-08-18 14:16:15 +00:00
|
|
|
* Copyright 2011-2013 Blender Foundation
|
2011-04-27 11:58:34 +00:00
|
|
|
*
|
2013-08-18 14:16:15 +00:00
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
2011-04-27 11:58:34 +00:00
|
|
|
*
|
2013-08-18 14:16:15 +00:00
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
2011-04-27 11:58:34 +00:00
|
|
|
*
|
2013-08-18 14:16:15 +00:00
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License
|
2011-04-27 11:58:34 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
#include "util_system.h"
|
|
|
|
#include "util_types.h"
|
|
|
|
|
|
|
|
#ifdef _WIN32
|
2011-09-04 15:39:09 +00:00
|
|
|
#if(!defined(FREE_WINDOWS))
|
2011-04-27 11:58:34 +00:00
|
|
|
#include <intrin.h>
|
2011-09-04 15:39:09 +00:00
|
|
|
#endif
|
2011-04-27 11:58:34 +00:00
|
|
|
#include <windows.h>
|
|
|
|
#elif defined(__APPLE__)
|
|
|
|
#include <sys/sysctl.h>
|
|
|
|
#include <sys/types.h>
|
|
|
|
#else
|
|
|
|
#include <unistd.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
CCL_NAMESPACE_BEGIN
|
|
|
|
|
|
|
|
int system_cpu_thread_count()
|
|
|
|
{
|
|
|
|
static uint count = 0;
|
|
|
|
|
|
|
|
if(count > 0)
|
|
|
|
return count;
|
|
|
|
|
|
|
|
#ifdef _WIN32
|
|
|
|
SYSTEM_INFO info;
|
|
|
|
GetSystemInfo(&info);
|
|
|
|
count = (uint)info.dwNumberOfProcessors;
|
|
|
|
#elif defined(__APPLE__)
|
|
|
|
size_t len = sizeof(count);
|
|
|
|
int mib[2] = { CTL_HW, HW_NCPU };
|
|
|
|
|
|
|
|
sysctl(mib, 2, &count, &len, NULL, 0);
|
|
|
|
#else
|
|
|
|
count = (uint)sysconf(_SC_NPROCESSORS_ONLN);
|
|
|
|
#endif
|
|
|
|
|
|
|
|
if(count < 1)
|
|
|
|
count = 1;
|
|
|
|
|
|
|
|
return count;
|
|
|
|
}
|
|
|
|
|
2011-09-04 15:39:09 +00:00
|
|
|
#if !defined(_WIN32) || defined(FREE_WINDOWS)
|
2011-04-27 11:58:34 +00:00
|
|
|
static void __cpuid(int data[4], int selector)
|
|
|
|
{
|
2011-05-05 13:51:33 +00:00
|
|
|
#ifdef __x86_64__
|
2011-04-27 11:58:34 +00:00
|
|
|
asm("cpuid" : "=a" (data[0]), "=b" (data[1]), "=c" (data[2]), "=d" (data[3]) : "a"(selector));
|
2011-05-05 13:51:33 +00:00
|
|
|
#else
|
|
|
|
#ifdef __i386__
|
|
|
|
asm("pushl %%ebx \n\t"
|
|
|
|
"cpuid \n\t"
|
|
|
|
"movl %%ebx, %1 \n\t"
|
|
|
|
"popl %%ebx \n\t" : "=a" (data[0]), "=r" (data[1]), "=c" (data[2]), "=d" (data[3]) : "a"(selector));
|
|
|
|
#else
|
|
|
|
data[0] = data[1] = data[2] = data[3] = 0;
|
|
|
|
#endif
|
|
|
|
#endif
|
2011-04-27 11:58:34 +00:00
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
static void replace_string(string& haystack, const string& needle, const string& other)
|
|
|
|
{
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
while((i = haystack.find(needle)) != string::npos)
|
|
|
|
haystack.replace(i, needle.length(), other);
|
|
|
|
}
|
|
|
|
|
|
|
|
string system_cpu_brand_string()
|
|
|
|
{
|
|
|
|
char buf[48];
|
|
|
|
int result[4];
|
|
|
|
|
|
|
|
__cpuid(result, 0x80000000);
|
|
|
|
|
|
|
|
if(result[0] >= (int)0x80000004) {
|
|
|
|
__cpuid((int*)(buf+0), 0x80000002);
|
|
|
|
__cpuid((int*)(buf+16), 0x80000003);
|
|
|
|
__cpuid((int*)(buf+32), 0x80000004);
|
|
|
|
|
|
|
|
string brand = buf;
|
|
|
|
|
|
|
|
/* make it a bit more presentable */
|
|
|
|
replace_string(brand, "(TM)", "");
|
|
|
|
replace_string(brand, "(R)", "");
|
|
|
|
|
2013-12-07 01:29:53 +00:00
|
|
|
brand = string_strip(brand);
|
2011-04-27 11:58:34 +00:00
|
|
|
|
|
|
|
return brand;
|
|
|
|
}
|
|
|
|
|
|
|
|
return "Unknown CPU";
|
|
|
|
}
|
|
|
|
|
2011-09-08 18:58:07 +00:00
|
|
|
int system_cpu_bits()
|
|
|
|
{
|
|
|
|
return (sizeof(void*)*8);
|
|
|
|
}
|
|
|
|
|
2013-10-05 19:56:34 +00:00
|
|
|
#if defined(__x86_64__) || defined(_M_X64) || defined(i386) || defined(_M_IX86)
|
2011-11-15 15:13:38 +00:00
|
|
|
|
|
|
|
struct CPUCapabilities {
|
|
|
|
bool x64;
|
|
|
|
bool mmx;
|
|
|
|
bool sse;
|
|
|
|
bool sse2;
|
|
|
|
bool sse3;
|
|
|
|
bool ssse3;
|
|
|
|
bool sse41;
|
|
|
|
bool sse42;
|
|
|
|
bool sse4a;
|
|
|
|
bool avx;
|
2014-06-13 20:23:58 +00:00
|
|
|
bool avx2;
|
2011-11-15 15:13:38 +00:00
|
|
|
bool xop;
|
|
|
|
bool fma3;
|
|
|
|
bool fma4;
|
2014-06-13 20:23:58 +00:00
|
|
|
bool bmi1;
|
|
|
|
bool bmi2;
|
2011-11-15 15:13:38 +00:00
|
|
|
};
|
|
|
|
|
2013-02-04 16:12:37 +00:00
|
|
|
static CPUCapabilities& system_cpu_capabilities()
|
2011-11-15 15:13:38 +00:00
|
|
|
{
|
|
|
|
static CPUCapabilities caps;
|
|
|
|
static bool caps_init = false;
|
|
|
|
|
|
|
|
if(!caps_init) {
|
2011-12-02 14:26:28 +00:00
|
|
|
int result[4], num; //, num_ex;
|
2011-11-15 15:13:38 +00:00
|
|
|
|
|
|
|
memset(&caps, 0, sizeof(caps));
|
|
|
|
|
|
|
|
__cpuid(result, 0);
|
|
|
|
num = result[0];
|
|
|
|
|
2012-06-09 17:22:52 +00:00
|
|
|
#if 0
|
|
|
|
__cpuid(result, 0x80000000);
|
|
|
|
num_ex = result[0];
|
|
|
|
#endif
|
2011-11-15 15:13:38 +00:00
|
|
|
|
2012-06-06 22:38:39 +00:00
|
|
|
if(num >= 1) {
|
2011-11-15 15:13:38 +00:00
|
|
|
__cpuid(result, 0x00000001);
|
|
|
|
caps.mmx = (result[3] & ((int)1 << 23)) != 0;
|
|
|
|
caps.sse = (result[3] & ((int)1 << 25)) != 0;
|
|
|
|
caps.sse2 = (result[3] & ((int)1 << 26)) != 0;
|
|
|
|
caps.sse3 = (result[2] & ((int)1 << 0)) != 0;
|
|
|
|
|
|
|
|
caps.ssse3 = (result[2] & ((int)1 << 9)) != 0;
|
|
|
|
caps.sse41 = (result[2] & ((int)1 << 19)) != 0;
|
|
|
|
caps.sse42 = (result[2] & ((int)1 << 20)) != 0;
|
|
|
|
|
|
|
|
caps.fma3 = (result[2] & ((int)1 << 12)) != 0;
|
2014-02-25 16:57:05 +00:00
|
|
|
caps.avx = false;
|
2014-02-25 18:50:53 +00:00
|
|
|
bool os_uses_xsave_xrestore = (result[2] & ((int)1 << 27)) != 0;
|
2014-02-25 16:57:05 +00:00
|
|
|
bool cpu_avx_support = (result[2] & ((int)1 << 28)) != 0;
|
|
|
|
|
|
|
|
if( os_uses_xsave_xrestore && cpu_avx_support) {
|
|
|
|
// Check if the OS will save the YMM registers
|
|
|
|
uint32_t xcr_feature_mask;
|
2014-05-04 16:19:08 +00:00
|
|
|
#if defined(__GNUC__)
|
|
|
|
int edx; /* not used */
|
|
|
|
/* actual opcode for xgetbv */
|
|
|
|
__asm__ (".byte 0x0f, 0x01, 0xd0" : "=a" (xcr_feature_mask) , "=d" (edx) : "c" (0) );
|
|
|
|
#elif defined(_MSC_VER) && defined(_XCR_XFEATURE_ENABLED_MASK)
|
|
|
|
xcr_feature_mask = (uint32_t)_xgetbv(_XCR_XFEATURE_ENABLED_MASK); /* min VS2010 SP1 compiler is required */
|
|
|
|
#else
|
|
|
|
xcr_feature_mask = 0;
|
|
|
|
#endif
|
2014-02-25 16:57:05 +00:00
|
|
|
caps.avx = (xcr_feature_mask & 0x6) == 0x6;
|
|
|
|
}
|
2014-06-13 20:23:58 +00:00
|
|
|
|
|
|
|
__cpuid(result, 0x00000007);
|
|
|
|
caps.bmi1 = (result[1] & ((int)1 << 3)) != 0;
|
|
|
|
caps.bmi2 = (result[1] & ((int)1 << 8)) != 0;
|
|
|
|
caps.avx2 = (result[1] & ((int)1 << 5)) != 0;
|
2011-11-15 15:13:38 +00:00
|
|
|
}
|
|
|
|
|
2012-06-09 17:22:52 +00:00
|
|
|
#if 0
|
|
|
|
if(num_ex >= 0x80000001) {
|
2011-11-15 15:13:38 +00:00
|
|
|
__cpuid(result, 0x80000001);
|
|
|
|
caps.x64 = (result[3] & ((int)1 << 29)) != 0;
|
|
|
|
caps.sse4a = (result[2] & ((int)1 << 6)) != 0;
|
|
|
|
caps.fma4 = (result[2] & ((int)1 << 16)) != 0;
|
|
|
|
caps.xop = (result[2] & ((int)1 << 11)) != 0;
|
2012-06-09 17:22:52 +00:00
|
|
|
}
|
|
|
|
#endif
|
2011-11-15 15:13:38 +00:00
|
|
|
|
|
|
|
caps_init = true;
|
|
|
|
}
|
|
|
|
|
2013-02-04 16:12:37 +00:00
|
|
|
return caps;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool system_cpu_support_sse2()
|
|
|
|
{
|
|
|
|
CPUCapabilities& caps = system_cpu_capabilities();
|
|
|
|
return caps.sse && caps.sse2;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool system_cpu_support_sse3()
|
|
|
|
{
|
|
|
|
CPUCapabilities& caps = system_cpu_capabilities();
|
2013-06-18 16:52:02 +00:00
|
|
|
return caps.sse && caps.sse2 && caps.sse3 && caps.ssse3;
|
2011-11-15 15:13:38 +00:00
|
|
|
}
|
|
|
|
|
2013-11-22 13:16:47 +00:00
|
|
|
bool system_cpu_support_sse41()
|
|
|
|
{
|
|
|
|
CPUCapabilities& caps = system_cpu_capabilities();
|
|
|
|
return caps.sse && caps.sse2 && caps.sse3 && caps.ssse3 && caps.sse41;
|
|
|
|
}
|
2014-01-16 16:04:11 +00:00
|
|
|
|
|
|
|
bool system_cpu_support_avx()
|
|
|
|
{
|
|
|
|
CPUCapabilities& caps = system_cpu_capabilities();
|
|
|
|
return caps.sse && caps.sse2 && caps.sse3 && caps.ssse3 && caps.sse41 && caps.avx;
|
|
|
|
}
|
2014-06-13 20:23:58 +00:00
|
|
|
bool system_cpu_support_avx2()
|
|
|
|
{
|
|
|
|
CPUCapabilities& caps = system_cpu_capabilities();
|
|
|
|
return caps.sse && caps.sse2 && caps.sse3 && caps.ssse3 && caps.sse41 && caps.avx && caps.avx2 && caps.fma3 && caps.bmi1 && caps.bmi2;
|
|
|
|
}
|
2011-11-15 15:13:38 +00:00
|
|
|
#else
|
|
|
|
|
2013-06-04 11:21:13 +00:00
|
|
|
bool system_cpu_support_sse2()
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool system_cpu_support_sse3()
|
2011-11-15 15:13:38 +00:00
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2014-01-16 16:04:11 +00:00
|
|
|
bool system_cpu_support_sse41()
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool system_cpu_support_avx()
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
2014-06-13 20:23:58 +00:00
|
|
|
bool system_cpu_support_avx2()
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
2014-01-16 16:04:11 +00:00
|
|
|
|
2011-11-15 15:13:38 +00:00
|
|
|
#endif
|
|
|
|
|
2011-04-27 11:58:34 +00:00
|
|
|
CCL_NAMESPACE_END
|
|
|
|
|