X-Git-Url: https://git.sesse.net/?p=stockfish;a=blobdiff_plain;f=src%2Fmisc.cpp;h=2970ac3b49c30c6ceb0aeda94b95836919eab715;hp=d0616ca1865dc08d161f433b891f67ca1a6a9fb1;hb=47ee6d9fa4091aa05f6fedb62a2bb652b0422f08;hpb=a7fcdfd6bff8baa6278306dd9e4fa72d053bb8c9 diff --git a/src/misc.cpp b/src/misc.cpp index d0616ca1..2970ac3b 100644 --- a/src/misc.cpp +++ b/src/misc.cpp @@ -39,22 +39,26 @@ #endif +#if !defined(NO_PREFETCH) +# include <xmmintrin.h> +#endif + #include #include -#include <cstring> #include #include #include #include "bitcount.h" #include "misc.h" +#include "thread.h" using namespace std; /// Version number. If this is left empty, the current date (in the format /// YYMMDD) is used as a version number. -static const string EngineVersion = "1.7"; +static const string EngineVersion = ""; static const string AppName = "Stockfish"; static const string AppTag = ""; @@ -183,85 +187,39 @@ int get_system_time() { } -/// builtin_cpu_count() tries to detect the number of CPU cores, if -/// hyper-threading is enabled this is the number of logical processors. +/// cpu_count() tries to detect the number of CPU cores. 
#if !defined(_MSC_VER) # if defined(_SC_NPROCESSORS_ONLN) -static int builtin_cpu_count() { - return Min(sysconf(_SC_NPROCESSORS_ONLN), 8); +int cpu_count() { + return Min(sysconf(_SC_NPROCESSORS_ONLN), MAX_THREADS); } # elif defined(__hpux) -static int builtin_cpu_count() { +int cpu_count() { struct pst_dynamic psd; if (pstat_getdynamic(&psd, sizeof(psd), (size_t)1, 0) == -1) return 1; - return Min(psd.psd_proc_cnt, 8); + return Min(psd.psd_proc_cnt, MAX_THREADS); } # else -static int builtin_cpu_count() { +int cpu_count() { return 1; } # endif #else -static int builtin_cpu_count() { +int cpu_count() { SYSTEM_INFO s; GetSystemInfo(&s); - return Min(s.dwNumberOfProcessors, 8); + return Min(s.dwNumberOfProcessors, MAX_THREADS); } #endif -/// HT_enabled() returns true if hyper-threading is enabled on current machine - -static bool HT_enabled() { - - char CPUString[0x20]; - int CPUInfo[4] = {-1}; - int nIds, nLogicalCPU, nCores; - - // Detect CPU producer - __cpuid(CPUInfo, 0); - nIds = CPUInfo[0]; - - memset(CPUString, 0, sizeof(CPUString)); - memcpy(&CPUString[0], &CPUInfo[1], sizeof(int)); - memcpy(&CPUString[4], &CPUInfo[3], sizeof(int)); - memcpy(&CPUString[8], &CPUInfo[2], sizeof(int)); - - // Not an Intel CPU or CPUID.4 not supported - if (strcmp(CPUString, "GenuineIntel") || nIds < 4) - return false; - - // Detect if HT Technology is supported - __cpuid(CPUInfo, 1); - if (!((CPUInfo[3] >> 28) & 1)) - return false; - - nLogicalCPU = (CPUInfo[1] >> 16) & 0xFF; - - // Detect number of cores - __cpuid(CPUInfo, 4); - nCores = 1 + ((CPUInfo[0] >> 26) & 0x3F); - - return nLogicalCPU > nCores; -} - - -/// cpu_count() tries to detect the number of physical CPU cores taking -/// in account hyper-threading. - -int cpu_count() { - - return HT_enabled() ? builtin_cpu_count() / 2 : builtin_cpu_count(); -} - - /* From Beowulf, from Olithink */ @@ -333,4 +291,26 @@ int Bioskey() return 0; } } + +/// prefetch() preloads the given address in L1/L2 cache. 
This is a non +/// blocking function and does not stall the CPU waiting for data to be +/// loaded from RAM, which can be very slow. +#if defined(NO_PREFETCH) +void prefetch(char*) {} +#else + +void prefetch(char* addr) { + +#if defined(__INTEL_COMPILER) || defined(__ICL) + // This hack prevents prefetches from being optimized away by + // the Intel compiler. Both MSVC and gcc seem to be unaffected. + __asm__ (""); +#endif + + _mm_prefetch(addr, _MM_HINT_T2); + _mm_prefetch(addr+64, _MM_HINT_T2); // 64 bytes ahead +} + +#endif + #endif