Use atomics instead of volatile

[stockfish] / src / thread.cpp
diff --git a/src/thread.cpp b/src/thread.cpp

index ba5d13d5666908e45b0ad8149a51e72b4365f54a..eb64f7ee372151ec5966d08477f9b9a040b3ef78 100644 (file)
--- a/src/thread.cpp
+++ b/src/thread.cpp
@@ -38,9 +38,9 @@ namespace {
   // when start_routine (and hence virtual idle_loop) is called and when joining.
  
   template<typename T> T* new_thread() {
-   T* th = new T();
-   th->nativeThread = std::thread(&ThreadBase::idle_loop, th); // Will go to sleep
-   return th;
+   std::thread* th = new T;
+   *th = std::thread(&T::idle_loop, (T*)th); // Will go to sleep
+   return (T*)th;
   }
  
   void delete_thread(ThreadBase* th) {
@@ -50,7 +50,7 @@ namespace {
     th->mutex.unlock();
  
     th->notify_one();
-   th->nativeThread.join(); // Wait for thread termination
+   th->join(); // Wait for thread termination
     delete th;
   }
  
@@ -61,179 +61,76 @@ namespace {
  
  void ThreadBase::notify_one() {
  
-  std::unique_lock<std::mutex>(this->mutex);
+  std::unique_lock<Mutex> lk(mutex);
    sleepCondition.notify_one();
  }
  
  
-// ThreadBase::wait_for() set the thread to sleep until 'condition' turns true
+// ThreadBase::wait() set the thread to sleep until 'condition' turns true
  
-void ThreadBase::wait_for(volatile const bool& condition) {
+void ThreadBase::wait(std::atomic<bool>& condition) {
  
-  std::unique_lock<std::mutex> lk(mutex);
-  sleepCondition.wait(lk, [&]{ return condition; });
+  std::unique_lock<Mutex> lk(mutex);
+  sleepCondition.wait(lk, [&]{ return bool(condition); });
+}
+
+
+// ThreadBase::wait_while() set the thread to sleep until 'condition' turns false
+void ThreadBase::wait_while(std::atomic<bool>& condition) {
+
+  std::unique_lock<Mutex> lk(mutex);
+  sleepCondition.wait(lk, [&]{ return !condition; });
  }
  
  
  // Thread c'tor makes some init but does not launch any execution thread that
  // will be started only when c'tor returns.
  
-Thread::Thread() /* : splitPoints() */ { // Initialization of non POD broken in MSVC
+Thread::Thread() {
  
    searching = false;
    maxPly = 0;
-  splitPointsSize = 0;
-  activeSplitPoint = nullptr;
-  activePosition = nullptr;
+  history.clear();
+  counterMoves.clear();
    idx = Threads.size(); // Starts from 0
  }
  
  
-// Thread::cutoff_occurred() checks whether a beta cutoff has occurred in the
-// current active split point, or in some ancestor of the split point.
-
-bool Thread::cutoff_occurred() const {
-
-  for (SplitPoint* sp = activeSplitPoint; sp; sp = sp->parentSplitPoint)
-      if (sp->cutoff)
-          return true;
-
-  return false;
-}
-
-
-// Thread::available_to() checks whether the thread is available to help the
-// thread 'master' at a split point. An obvious requirement is that thread must
-// be idle. With more than two threads, this is not sufficient: If the thread is
-// the master of some split point, it is only available as a slave to the slaves
-// which are busy searching the split point at the top of slave's split point
-// stack (the "helpful master concept" in YBWC terminology).
-
-bool Thread::available_to(const Thread* master) const {
+// TimerThread::idle_loop() is where the timer thread waits Resolution milliseconds
+// and then calls check_time(). When not searching, thread sleeps until it's woken up.
  
-  if (searching)
-      return false;
+void TimerThread::idle_loop() {
  
-  // Make a local copy to be sure it doesn't become zero under our feet while
-  // testing next condition and so leading to an out of bounds access.
-  const size_t size = splitPointsSize;
+  while (!exit)
+  {
+      std::unique_lock<Mutex> lk(mutex);
  
-  // No split points means that the thread is available as a slave for any
-  // other thread otherwise apply the "helpful master" concept if possible.
-  return !size || splitPoints[size - 1].slavesMask.test(master->idx);
-}
+      if (!exit)
+          sleepCondition.wait_for(lk, std::chrono::milliseconds(run ? Resolution : INT_MAX));
  
+      lk.unlock();
  
-// Thread::split() does the actual work of distributing the work at a node between
-// several available threads. If it does not succeed in splitting the node
-// (because no idle threads are available), the function immediately returns.
-// If splitting is possible, a SplitPoint object is initialized with all the
-// data that must be copied to the helper threads and then helper threads are
-// informed that they have been assigned work. This will cause them to instantly
-// leave their idle loops and call search(). When all threads have returned from
-// search() then split() returns.
-
-void Thread::split(Position& pos, Stack* ss, Value alpha, Value beta, Value* bestValue,
-                   Move* bestMove, Depth depth, int moveCount,
-                   MovePicker* movePicker, int nodeType, bool cutNode) {
-
-  assert(searching);
-  assert(-VALUE_INFINITE < *bestValue && *bestValue <= alpha && alpha < beta && beta <= VALUE_INFINITE);
-  assert(depth >= Threads.minimumSplitDepth);
-  assert(splitPointsSize < MAX_SPLITPOINTS_PER_THREAD);
-
-  // Pick and init the next available split point
-  SplitPoint& sp = splitPoints[splitPointsSize];
-
-  sp.master = this;
-  sp.parentSplitPoint = activeSplitPoint;
-  sp.slavesMask = 0, sp.slavesMask.set(idx);
-  sp.depth = depth;
-  sp.bestValue = *bestValue;
-  sp.bestMove = *bestMove;
-  sp.alpha = alpha;
-  sp.beta = beta;
-  sp.nodeType = nodeType;
-  sp.cutNode = cutNode;
-  sp.movePicker = movePicker;
-  sp.moveCount = moveCount;
-  sp.pos = &pos;
-  sp.nodes = 0;
-  sp.cutoff = false;
-  sp.ss = ss;
-
-  // Try to allocate available threads and ask them to start searching setting
-  // 'searching' flag. This must be done under lock protection to avoid concurrent
-  // allocation of the same slave by another master.
-  Threads.spinlock.acquire();
-  sp.spinlock.acquire();
-
-  sp.allSlavesSearching = true; // Must be set under lock protection
-  ++splitPointsSize;
-  activeSplitPoint = &sp;
-  activePosition = nullptr;
-
-  Thread* slave;
-
-  while (    sp.slavesMask.count() < MAX_SLAVES_PER_SPLITPOINT
-         && (slave = Threads.available_slave(this)) != nullptr)
-  {
-      sp.slavesMask.set(slave->idx);
-      slave->activeSplitPoint = &sp;
-      slave->searching = true; // Slave leaves idle_loop()
-      slave->notify_one(); // Could be sleeping
+      if (!exit && run)
+          check_time();
    }
-
-  // Everything is set up. The master thread enters the idle loop, from which
-  // it will instantly launch a search, because its 'searching' flag is set.
-  // The thread will return from the idle loop when all slaves have finished
-  // their work at this split point.
-  sp.spinlock.release();
-  Threads.spinlock.release();
-
-  Thread::idle_loop(); // Force a call to base class idle_loop()
-
-  // In the helpful master concept, a master can help only a sub-tree of its
-  // split point and because everything is finished here, it's not possible
-  // for the master to be booked.
-  assert(!searching);
-  assert(!activePosition);
-
-  // We have returned from the idle loop, which means that all threads are
-  // finished. Note that setting 'searching' and decreasing splitPointsSize must
-  // be done under lock protection to avoid a race with Thread::available_to().
-  Threads.spinlock.acquire();
-  sp.spinlock.acquire();
-
-  searching = true;
-  --splitPointsSize;
-  activeSplitPoint = sp.parentSplitPoint;
-  activePosition = &pos;
-  pos.set_nodes_searched(pos.nodes_searched() + sp.nodes);
-  *bestMove = sp.bestMove;
-  *bestValue = sp.bestValue;
-
-  sp.spinlock.release();
-  Threads.spinlock.release();
  }
  
  
-// TimerThread::idle_loop() is where the timer thread waits Resolution milliseconds
-// and then calls check_time(). When not searching, thread sleeps until it's woken up.
+// Thread::idle_loop() is where the thread is parked when it has no work to do
  
-void TimerThread::idle_loop() {
+void Thread::idle_loop() {
  
    while (!exit)
    {
-      std::unique_lock<std::mutex> lk(mutex);
+      std::unique_lock<Mutex> lk(mutex);
  
-      if (!exit)
-          sleepCondition.wait_for(lk, std::chrono::milliseconds(run ? Resolution : INT_MAX));
+      while (!searching && !exit)
+          sleepCondition.wait(lk);
  
        lk.unlock();
  
-      if (run)
-          check_time();
+      if (!exit && searching)
+          search();
    }
  }
  
@@ -245,29 +142,30 @@ void MainThread::idle_loop() {
  
    while (!exit)
    {
-      std::unique_lock<std::mutex> lk(mutex);
+      std::unique_lock<Mutex> lk(mutex);
  
        thinking = false;
  
        while (!thinking && !exit)
        {
-          Threads.sleepCondition.notify_one(); // Wake up the UI thread if needed
+          sleepCondition.notify_one(); // Wake up the UI thread if needed
            sleepCondition.wait(lk);
        }
  
        lk.unlock();
  
        if (!exit)
-      {
-          searching = true;
+          think();
+  }
+}
  
-          Search::think();
  
-          assert(searching);
+// MainThread::join() waits for main thread to finish thinking
  
-          searching = false;
-      }
-  }
+void MainThread::join() {
+
+  std::unique_lock<Mutex> lk(mutex);
+  sleepCondition.wait(lk, [&]{ return !thinking; });
  }
  
  
@@ -290,9 +188,12 @@ void ThreadPool::init() {
  void ThreadPool::exit() {
  
    delete_thread(timer); // As first because check_time() accesses threads data
+  timer = nullptr;
  
    for (Thread* th : *this)
        delete_thread(th);
+
+  clear(); // Get rid of stale pointers
  }
  
  
@@ -304,15 +205,10 @@ void ThreadPool::exit() {
  
  void ThreadPool::read_uci_options() {
  
-  minimumSplitDepth = Options["Min Split Depth"] * ONE_PLY;
    size_t requested  = Options["Threads"];
  
    assert(requested > 0);
  
-  // If zero (default) then set best minimum split depth automatically
-  if (!minimumSplitDepth)
-      minimumSplitDepth = requested < 8 ? 4 * ONE_PLY : 7 * ONE_PLY;
-
    while (size() < requested)
        push_back(new_thread<Thread>());
  
@@ -324,25 +220,14 @@ void ThreadPool::read_uci_options() {
  }
  
  
-// ThreadPool::available_slave() tries to find an idle thread which is available
-// as a slave for the thread 'master'.
+// ThreadPool::nodes_searched() returns the number of nodes searched
  
-Thread* ThreadPool::available_slave(const Thread* master) const {
+int64_t ThreadPool::nodes_searched() {
  
-  for (Thread* th : *this)
-      if (th->available_to(master))
-          return th;
-
-  return nullptr;
-}
-
-
-// ThreadPool::wait_for_think_finished() waits for main thread to finish the search
-
-void ThreadPool::wait_for_think_finished() {
-
-  std::unique_lock<std::mutex> lk(main()->mutex);
-  sleepCondition.wait(lk, [&]{ return !main()->thinking; });
+  int64_t nodes = 0;
+  for (Thread *th : *this)
+      nodes += th->rootPos.nodes_searched();
+  return nodes;
  }
  
  
@@ -351,15 +236,13 @@ void ThreadPool::wait_for_think_finished() {
  
  void ThreadPool::start_thinking(const Position& pos, const LimitsType& limits,
                                  StateStackPtr& states) {
-  wait_for_think_finished();
-
-  SearchTime = now(); // As early as possible
+  main()->join();
  
    Signals.stopOnPonderhit = Signals.firstRootMove = false;
    Signals.stop = Signals.failedLowAtRoot = false;
  
-  RootMoves.clear();
-  RootPos = pos;
+  main()->rootMoves.clear();
+  main()->rootPos = pos;
    Limits = limits;
    if (states.get()) // If we don't set a new position, preserve current state
    {
@@ -370,8 +253,8 @@ void ThreadPool::start_thinking(const Position& pos, const LimitsType& limits,
    for (const auto& m : MoveList<LEGAL>(pos))
        if (   limits.searchmoves.empty()
            || std::count(limits.searchmoves.begin(), limits.searchmoves.end(), m))
-          RootMoves.push_back(RootMove(m));
+          main()->rootMoves.push_back(RootMove(m));
  
    main()->thinking = true;
-  main()->notify_one(); // Starts main thread
+  main()->notify_one(); // Wake up main thread: 'thinking' must be already set
  }