# if defined(__INTEL_COMPILER) || defined(_MSC_VER)
_mm_prefetch(addr, _MM_HINT_T0);
- _mm_prefetch(addr+64, _MM_HINT_T0); // 64 bytes ahead
# else
__builtin_prefetch(addr);
- __builtin_prefetch(addr+64);
# endif
}
return;
hashMask = size - ClusterSize;
- delete [] table;
- table = new (std::nothrow) TTEntry[size];
+ free(mem);
+ mem = malloc(size * sizeof(TTEntry) + CACHE_LINE_SIZE - 1);
- if (!table)
+ if (!mem)
{
std::cerr << "Failed to allocate " << mbSize
<< "MB for transposition table." << std::endl;
exit(EXIT_FAILURE);
}
+ // Align table start address to a cache line
+ for (char* c = (char*)mem; unsigned(table = (TTEntry*)(c)) % CACHE_LINE_SIZE; c++) {}
clear(); // Operator new is not guaranteed to initialize memory to zero
}
static const unsigned ClusterSize = 4; // A cluster is 64 Bytes
public:
- ~TranspositionTable() { delete [] table; }
+ ~TranspositionTable() { free(mem); }
void new_search() { generation++; }
TTEntry* probe(const Key key) const;
private:
uint32_t hashMask;
TTEntry* table;
+ void* mem;
uint8_t generation; // Size must be not bigger then TTEntry::generation8
};
# include <xmmintrin.h> // Intel and Microsoft header for _mm_prefetch()
# endif
+#define CACHE_LINE_SIZE 64
#if defined(_MSC_VER) || defined(__INTEL_COMPILER)
-# define CACHE_LINE_ALIGNMENT __declspec(align(64))
+# define CACHE_LINE_ALIGNMENT __declspec(align(CACHE_LINE_SIZE))
#else
-# define CACHE_LINE_ALIGNMENT __attribute__ ((aligned(64)))
+# define CACHE_LINE_ALIGNMENT __attribute__ ((aligned(CACHE_LINE_SIZE)))
#endif
#if defined(_MSC_VER)