2011-04-27 11:58:34 +00:00
|
|
|
/*
|
2013-08-18 14:16:15 +00:00
|
|
|
* Copyright 2011-2013 Blender Foundation
|
2011-04-27 11:58:34 +00:00
|
|
|
*
|
2013-08-18 14:16:15 +00:00
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
2011-04-27 11:58:34 +00:00
|
|
|
*
|
2013-08-18 14:16:15 +00:00
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
2011-04-27 11:58:34 +00:00
|
|
|
*
|
2013-08-18 14:16:15 +00:00
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
2014-12-25 01:50:24 +00:00
|
|
|
* limitations under the License.
|
2011-04-27 11:58:34 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
#include "util_system.h"
|
2016-06-03 23:29:13 +00:00
|
|
|
|
2016-01-12 11:00:48 +00:00
|
|
|
#include "util_debug.h"
|
2016-06-03 23:29:13 +00:00
|
|
|
#include "util_logging.h"
|
2011-04-27 11:58:34 +00:00
|
|
|
#include "util_types.h"
|
2015-05-21 21:43:18 +00:00
|
|
|
#include "util_string.h"
|
2011-04-27 11:58:34 +00:00
|
|
|
|
|
|
|
#ifdef _WIN32
|
2016-02-05 08:09:39 +00:00
|
|
|
# if(!defined(FREE_WINDOWS))
|
|
|
|
# include <intrin.h>
|
|
|
|
# endif
|
|
|
|
# include "util_windows.h"
|
2011-04-27 11:58:34 +00:00
|
|
|
#elif defined(__APPLE__)
|
2016-02-05 08:09:39 +00:00
|
|
|
# include <sys/sysctl.h>
|
|
|
|
# include <sys/types.h>
|
2011-04-27 11:58:34 +00:00
|
|
|
#else
|
2016-02-05 08:09:39 +00:00
|
|
|
# include <unistd.h>
|
2011-04-27 11:58:34 +00:00
|
|
|
#endif
|
|
|
|
|
|
|
|
CCL_NAMESPACE_BEGIN
|
|
|
|
|
2016-06-03 23:29:13 +00:00
|
|
|
int system_cpu_group_count()
|
2011-04-27 11:58:34 +00:00
|
|
|
{
|
2016-06-03 23:29:13 +00:00
|
|
|
#ifdef _WIN32
|
|
|
|
util_windows_init_numa_groups();
|
|
|
|
return GetActiveProcessorGroupCount();
|
|
|
|
#else
|
|
|
|
/* TODO(sergey): Need to adopt for other platforms. */
|
|
|
|
return 1;
|
|
|
|
#endif
|
|
|
|
}
|
2011-04-27 11:58:34 +00:00
|
|
|
|
2016-06-03 23:29:13 +00:00
|
|
|
int system_cpu_group_thread_count(int group)
|
|
|
|
{
|
|
|
|
/* TODO(sergey): Need make other platforms aware of groups. */
|
2011-04-27 11:58:34 +00:00
|
|
|
#ifdef _WIN32
|
2016-06-03 23:29:13 +00:00
|
|
|
util_windows_init_numa_groups();
|
|
|
|
return GetActiveProcessorCount(group);
|
2011-04-27 11:58:34 +00:00
|
|
|
#elif defined(__APPLE__)
|
2016-06-03 23:29:13 +00:00
|
|
|
(void)group;
|
2016-06-06 11:52:57 +00:00
|
|
|
int count;
|
2011-04-27 11:58:34 +00:00
|
|
|
size_t len = sizeof(count);
|
|
|
|
int mib[2] = { CTL_HW, HW_NCPU };
|
|
|
|
sysctl(mib, 2, &count, &len, NULL, 0);
|
2016-06-03 23:29:13 +00:00
|
|
|
return count;
|
2011-04-27 11:58:34 +00:00
|
|
|
#else
|
2016-06-03 23:29:13 +00:00
|
|
|
(void)group;
|
|
|
|
return sysconf(_SC_NPROCESSORS_ONLN);
|
2011-04-27 11:58:34 +00:00
|
|
|
#endif
|
2016-06-03 23:29:13 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
int system_cpu_thread_count()
|
|
|
|
{
|
|
|
|
static uint count = 0;
|
|
|
|
|
|
|
|
if(count > 0) {
|
|
|
|
return count;
|
|
|
|
}
|
|
|
|
|
|
|
|
int max_group = system_cpu_group_count();
|
|
|
|
VLOG(1) << "Detected " << max_group << " CPU groups.";
|
|
|
|
for(int group = 0; group < max_group; ++group) {
|
|
|
|
int num_threads = system_cpu_group_thread_count(group);
|
|
|
|
VLOG(1) << "Group " << group
|
|
|
|
<< " has " << num_threads << " threads.";
|
|
|
|
count += num_threads;
|
|
|
|
}
|
2011-04-27 11:58:34 +00:00
|
|
|
|
2016-06-03 23:29:13 +00:00
|
|
|
if(count < 1) {
|
2011-04-27 11:58:34 +00:00
|
|
|
count = 1;
|
2016-06-03 23:29:13 +00:00
|
|
|
}
|
2011-04-27 11:58:34 +00:00
|
|
|
|
|
|
|
return count;
|
|
|
|
}
|
|
|
|
|
2011-09-04 15:39:09 +00:00
|
|
|
#if !defined(_WIN32) || defined(FREE_WINDOWS)
|
2011-04-27 11:58:34 +00:00
|
|
|
static void __cpuid(int data[4], int selector)
|
|
|
|
{
|
2011-05-05 13:51:33 +00:00
|
|
|
#ifdef __x86_64__
|
2011-04-27 11:58:34 +00:00
|
|
|
asm("cpuid" : "=a" (data[0]), "=b" (data[1]), "=c" (data[2]), "=d" (data[3]) : "a"(selector));
|
2011-05-05 13:51:33 +00:00
|
|
|
#else
|
|
|
|
#ifdef __i386__
|
|
|
|
asm("pushl %%ebx \n\t"
|
|
|
|
"cpuid \n\t"
|
|
|
|
"movl %%ebx, %1 \n\t"
|
|
|
|
"popl %%ebx \n\t" : "=a" (data[0]), "=r" (data[1]), "=c" (data[2]), "=d" (data[3]) : "a"(selector));
|
|
|
|
#else
|
|
|
|
data[0] = data[1] = data[2] = data[3] = 0;
|
|
|
|
#endif
|
|
|
|
#endif
|
2011-04-27 11:58:34 +00:00
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
string system_cpu_brand_string()
|
|
|
|
{
|
|
|
|
char buf[48];
|
|
|
|
int result[4];
|
|
|
|
|
|
|
|
__cpuid(result, 0x80000000);
|
|
|
|
|
|
|
|
if(result[0] >= (int)0x80000004) {
|
|
|
|
__cpuid((int*)(buf+0), 0x80000002);
|
|
|
|
__cpuid((int*)(buf+16), 0x80000003);
|
|
|
|
__cpuid((int*)(buf+32), 0x80000004);
|
|
|
|
|
|
|
|
string brand = buf;
|
|
|
|
|
|
|
|
/* make it a bit more presentable */
|
2015-05-21 21:43:18 +00:00
|
|
|
brand = string_remove_trademark(brand);
|
2011-04-27 11:58:34 +00:00
|
|
|
|
|
|
|
return brand;
|
|
|
|
}
|
|
|
|
|
|
|
|
return "Unknown CPU";
|
|
|
|
}
|
|
|
|
|
2011-09-08 18:58:07 +00:00
|
|
|
int system_cpu_bits()
|
|
|
|
{
|
|
|
|
return (sizeof(void*)*8);
|
|
|
|
}
|
|
|
|
|
2013-10-05 19:56:34 +00:00
|
|
|
#if defined(__x86_64__) || defined(_M_X64) || defined(i386) || defined(_M_IX86)
|
2011-11-15 15:13:38 +00:00
|
|
|
|
|
|
|
struct CPUCapabilities {
|
|
|
|
bool x64;
|
|
|
|
bool mmx;
|
|
|
|
bool sse;
|
|
|
|
bool sse2;
|
|
|
|
bool sse3;
|
|
|
|
bool ssse3;
|
|
|
|
bool sse41;
|
|
|
|
bool sse42;
|
|
|
|
bool sse4a;
|
|
|
|
bool avx;
|
2015-05-11 15:49:36 +00:00
|
|
|
bool f16c;
|
2014-06-13 20:23:58 +00:00
|
|
|
bool avx2;
|
2011-11-15 15:13:38 +00:00
|
|
|
bool xop;
|
|
|
|
bool fma3;
|
|
|
|
bool fma4;
|
2014-06-13 20:23:58 +00:00
|
|
|
bool bmi1;
|
|
|
|
bool bmi2;
|
2011-11-15 15:13:38 +00:00
|
|
|
};
|
|
|
|
|
2013-02-04 16:12:37 +00:00
|
|
|
static CPUCapabilities& system_cpu_capabilities()
|
2011-11-15 15:13:38 +00:00
|
|
|
{
|
|
|
|
static CPUCapabilities caps;
|
|
|
|
static bool caps_init = false;
|
|
|
|
|
|
|
|
if(!caps_init) {
|
2015-02-11 10:28:42 +00:00
|
|
|
int result[4], num;
|
2011-11-15 15:13:38 +00:00
|
|
|
|
|
|
|
memset(&caps, 0, sizeof(caps));
|
|
|
|
|
|
|
|
__cpuid(result, 0);
|
|
|
|
num = result[0];
|
|
|
|
|
2012-06-06 22:38:39 +00:00
|
|
|
if(num >= 1) {
|
2011-11-15 15:13:38 +00:00
|
|
|
__cpuid(result, 0x00000001);
|
|
|
|
caps.mmx = (result[3] & ((int)1 << 23)) != 0;
|
|
|
|
caps.sse = (result[3] & ((int)1 << 25)) != 0;
|
|
|
|
caps.sse2 = (result[3] & ((int)1 << 26)) != 0;
|
|
|
|
caps.sse3 = (result[2] & ((int)1 << 0)) != 0;
|
|
|
|
|
|
|
|
caps.ssse3 = (result[2] & ((int)1 << 9)) != 0;
|
|
|
|
caps.sse41 = (result[2] & ((int)1 << 19)) != 0;
|
|
|
|
caps.sse42 = (result[2] & ((int)1 << 20)) != 0;
|
|
|
|
|
|
|
|
caps.fma3 = (result[2] & ((int)1 << 12)) != 0;
|
2014-02-25 16:57:05 +00:00
|
|
|
caps.avx = false;
|
2014-02-25 18:50:53 +00:00
|
|
|
bool os_uses_xsave_xrestore = (result[2] & ((int)1 << 27)) != 0;
|
2014-02-25 16:57:05 +00:00
|
|
|
bool cpu_avx_support = (result[2] & ((int)1 << 28)) != 0;
|
|
|
|
|
|
|
|
if( os_uses_xsave_xrestore && cpu_avx_support) {
|
|
|
|
// Check if the OS will save the YMM registers
|
|
|
|
uint32_t xcr_feature_mask;
|
2014-05-04 16:19:08 +00:00
|
|
|
#if defined(__GNUC__)
|
|
|
|
int edx; /* not used */
|
|
|
|
/* actual opcode for xgetbv */
|
|
|
|
__asm__ (".byte 0x0f, 0x01, 0xd0" : "=a" (xcr_feature_mask) , "=d" (edx) : "c" (0) );
|
|
|
|
#elif defined(_MSC_VER) && defined(_XCR_XFEATURE_ENABLED_MASK)
|
|
|
|
xcr_feature_mask = (uint32_t)_xgetbv(_XCR_XFEATURE_ENABLED_MASK); /* min VS2010 SP1 compiler is required */
|
|
|
|
#else
|
|
|
|
xcr_feature_mask = 0;
|
|
|
|
#endif
|
2014-02-25 16:57:05 +00:00
|
|
|
caps.avx = (xcr_feature_mask & 0x6) == 0x6;
|
|
|
|
}
|
2014-06-13 20:23:58 +00:00
|
|
|
|
2015-05-11 15:49:36 +00:00
|
|
|
caps.f16c = (result[2] & ((int)1 << 29)) != 0;
|
|
|
|
|
2014-06-13 20:23:58 +00:00
|
|
|
__cpuid(result, 0x00000007);
|
|
|
|
caps.bmi1 = (result[1] & ((int)1 << 3)) != 0;
|
|
|
|
caps.bmi2 = (result[1] & ((int)1 << 8)) != 0;
|
|
|
|
caps.avx2 = (result[1] & ((int)1 << 5)) != 0;
|
2011-11-15 15:13:38 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
caps_init = true;
|
|
|
|
}
|
|
|
|
|
2013-02-04 16:12:37 +00:00
|
|
|
return caps;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool system_cpu_support_sse2()
|
|
|
|
{
|
|
|
|
CPUCapabilities& caps = system_cpu_capabilities();
|
2016-01-12 11:00:48 +00:00
|
|
|
return DebugFlags().cpu.sse2 && caps.sse && caps.sse2;
|
2013-02-04 16:12:37 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
bool system_cpu_support_sse3()
|
|
|
|
{
|
|
|
|
CPUCapabilities& caps = system_cpu_capabilities();
|
2016-01-12 11:00:48 +00:00
|
|
|
return DebugFlags().cpu.sse3 &&
|
|
|
|
caps.sse && caps.sse2 && caps.sse3 && caps.ssse3;
|
2011-11-15 15:13:38 +00:00
|
|
|
}
|
|
|
|
|
2013-11-22 13:16:47 +00:00
|
|
|
bool system_cpu_support_sse41()
|
|
|
|
{
|
|
|
|
CPUCapabilities& caps = system_cpu_capabilities();
|
2016-01-12 11:00:48 +00:00
|
|
|
return DebugFlags().cpu.sse41 &&
|
|
|
|
caps.sse && caps.sse2 && caps.sse3 && caps.ssse3 && caps.sse41;
|
2013-11-22 13:16:47 +00:00
|
|
|
}
|
2014-01-16 16:04:11 +00:00
|
|
|
|
|
|
|
bool system_cpu_support_avx()
|
|
|
|
{
|
|
|
|
CPUCapabilities& caps = system_cpu_capabilities();
|
2016-01-12 11:00:48 +00:00
|
|
|
return DebugFlags().cpu.avx &&
|
|
|
|
caps.sse && caps.sse2 && caps.sse3 && caps.ssse3 && caps.sse41 && caps.avx;
|
2014-01-16 16:04:11 +00:00
|
|
|
}
|
2016-01-12 11:00:48 +00:00
|
|
|
|
2014-06-13 20:23:58 +00:00
|
|
|
bool system_cpu_support_avx2()
|
|
|
|
{
|
|
|
|
CPUCapabilities& caps = system_cpu_capabilities();
|
2016-01-12 11:00:48 +00:00
|
|
|
return DebugFlags().cpu.avx2 &&
|
|
|
|
caps.sse && caps.sse2 && caps.sse3 && caps.ssse3 && caps.sse41 && caps.avx && caps.f16c && caps.avx2 && caps.fma3 && caps.bmi1 && caps.bmi2;
|
2014-06-13 20:23:58 +00:00
|
|
|
}
|
2011-11-15 15:13:38 +00:00
|
|
|
#else
|
|
|
|
|
2013-06-04 11:21:13 +00:00
|
|
|
bool system_cpu_support_sse2()
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool system_cpu_support_sse3()
|
2011-11-15 15:13:38 +00:00
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2014-01-16 16:04:11 +00:00
|
|
|
bool system_cpu_support_sse41()
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool system_cpu_support_avx()
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
2014-06-13 20:23:58 +00:00
|
|
|
bool system_cpu_support_avx2()
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
2014-01-16 16:04:11 +00:00
|
|
|
|
2011-11-15 15:13:38 +00:00
|
|
|
#endif
|
|
|
|
|
2011-04-27 11:58:34 +00:00
|
|
|
CCL_NAMESPACE_END
|
|
|
|
|