LLVM 15.0.0git
ThreadPool.h
Go to the documentation of this file.
1 //===-- llvm/Support/ThreadPool.h - A ThreadPool implementation -*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file defines a crude C++11 based thread pool.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #ifndef LLVM_SUPPORT_THREADPOOL_H
14 #define LLVM_SUPPORT_THREADPOOL_H
15 
#include "llvm/ADT/DenseMap.h"
#include "llvm/Config/llvm-config.h"
#include "llvm/Support/RWMutex.h"
#include "llvm/Support/Threading.h"
#include "llvm/Support/thread.h"

#include <cassert>
#include <condition_variable>
#include <deque>
#include <functional>
#include <future>
#include <memory>
#include <mutex>
#include <utility>
#include <vector>
30 
31 namespace llvm {
32 
33 class ThreadPoolTaskGroup;
34 
35 /// A ThreadPool for asynchronous parallel execution on a defined number of
36 /// threads.
37 ///
38 /// The pool keeps a vector of threads alive, waiting on a condition variable
39 /// for some work to become available.
40 ///
41 /// It is possible to reuse one thread pool for different groups of tasks
42 /// by grouping tasks using ThreadPoolTaskGroup. All tasks are processed using
43 /// the same queue, but it is possible to wait only for a specific group of
44 /// tasks to finish.
45 ///
46 /// It is also possible for worker threads to submit new tasks and wait for
47 /// them. Note that this may result in a deadlock in cases such as when a task
48 /// (directly or indirectly) tries to wait for its own completion, or when all
49 /// available threads are used up by tasks waiting for a task that has no thread
50 /// left to run on (this includes waiting on the returned future). It should be
51 /// generally safe to wait() for a group as long as groups do not form a cycle.
52 class ThreadPool {
53 public:
54  /// Construct a pool using the hardware strategy \p S for mapping hardware
55  /// execution resources (threads, cores, CPUs)
56  /// Defaults to using the maximum execution resources in the system, but
57  /// accounting for the affinity mask.
59 
60  /// Blocking destructor: the pool will wait for all the threads to complete.
61  ~ThreadPool();
62 
63  /// Asynchronous submission of a task to the pool. The returned future can be
64  /// used to wait for the task to finish and is *non-blocking* on destruction.
65  template <typename Function, typename... Args>
66  auto async(Function &&F, Args &&...ArgList) {
67  auto Task =
68  std::bind(std::forward<Function>(F), std::forward<Args>(ArgList)...);
69  return async(std::move(Task));
70  }
71 
72  /// Overload, task will be in the given task group.
73  template <typename Function, typename... Args>
74  auto async(ThreadPoolTaskGroup &Group, Function &&F, Args &&...ArgList) {
75  auto Task =
76  std::bind(std::forward<Function>(F), std::forward<Args>(ArgList)...);
77  return async(Group, std::move(Task));
78  }
79 
80  /// Asynchronous submission of a task to the pool. The returned future can be
81  /// used to wait for the task to finish and is *non-blocking* on destruction.
82  template <typename Func>
83  auto async(Func &&F) -> std::shared_future<decltype(F())> {
84  return asyncImpl(std::function<decltype(F())()>(std::forward<Func>(F)),
85  nullptr);
86  }
87 
88  template <typename Func>
89  auto async(ThreadPoolTaskGroup &Group, Func &&F)
90  -> std::shared_future<decltype(F())> {
91  return asyncImpl(std::function<decltype(F())()>(std::forward<Func>(F)),
92  &Group);
93  }
94 
95  /// Blocking wait for all the threads to complete and the queue to be empty.
96  /// It is an error to try to add new tasks while blocking on this call.
97  /// Calling wait() from a task would deadlock waiting for itself.
98  void wait();
99 
100  /// Blocking wait for only all the threads in the given group to complete.
101  /// It is possible to wait even inside a task, but waiting (directly or
102  /// indirectly) on itself will deadlock. If called from a task running on a
103  /// worker thread, the call may process pending tasks while waiting in order
104  /// not to waste the thread.
105  void wait(ThreadPoolTaskGroup &Group);
106 
107  // TODO: misleading legacy name warning!
108  // Returns the maximum number of worker threads in the pool, not the current
109  // number of threads!
110  unsigned getThreadCount() const { return MaxThreadCount; }
111 
112  /// Returns true if the current thread is a worker thread of this thread pool.
113  bool isWorkerThread() const;
114 
115 private:
116  /// Helpers to create a promise and a callable wrapper of \p Task that sets
117  /// the result of the promise. Returns the callable and a future to access the
118  /// result.
119  template <typename ResTy>
120  static std::pair<std::function<void()>, std::future<ResTy>>
121  createTaskAndFuture(std::function<ResTy()> Task) {
122  std::shared_ptr<std::promise<ResTy>> Promise =
123  std::make_shared<std::promise<ResTy>>();
124  auto F = Promise->get_future();
125  return {
126  [Promise = std::move(Promise), Task]() { Promise->set_value(Task()); },
127  std::move(F)};
128  }
129  static std::pair<std::function<void()>, std::future<void>>
130  createTaskAndFuture(std::function<void()> Task) {
131  std::shared_ptr<std::promise<void>> Promise =
132  std::make_shared<std::promise<void>>();
133  auto F = Promise->get_future();
134  return {[Promise = std::move(Promise), Task]() {
135  Task();
136  Promise->set_value();
137  },
138  std::move(F)};
139  }
140 
141  /// Returns true if all tasks in the given group have finished (nullptr means
142  /// all tasks regardless of their group). QueueLock must be locked.
143  bool workCompletedUnlocked(ThreadPoolTaskGroup *Group) const;
144 
145  /// Asynchronous submission of a task to the pool. The returned future can be
146  /// used to wait for the task to finish and is *non-blocking* on destruction.
147  template <typename ResTy>
148  std::shared_future<ResTy> asyncImpl(std::function<ResTy()> Task,
149  ThreadPoolTaskGroup *Group) {
150 
151 #if LLVM_ENABLE_THREADS
152  /// Wrap the Task in a std::function<void()> that sets the result of the
153  /// corresponding future.
154  auto R = createTaskAndFuture(Task);
155 
156  int requestedThreads;
157  {
158  // Lock the queue and push the new task
159  std::unique_lock<std::mutex> LockGuard(QueueLock);
160 
161  // Don't allow enqueueing after disabling the pool
162  assert(EnableFlag && "Queuing a thread during ThreadPool destruction");
163  Tasks.emplace_back(std::make_pair(std::move(R.first), Group));
164  requestedThreads = ActiveThreads + Tasks.size();
165  }
166  QueueCondition.notify_one();
167  grow(requestedThreads);
168  return R.second.share();
169 
170 #else // LLVM_ENABLE_THREADS Disabled
171 
172  // Get a Future with launch::deferred execution using std::async
173  auto Future = std::async(std::launch::deferred, std::move(Task)).share();
174  // Wrap the future so that both ThreadPool::wait() can operate and the
175  // returned future can be sync'ed on.
176  Tasks.emplace_back(std::make_pair([Future]() { Future.get(); }, Group));
177  return Future;
178 #endif
179  }
180 
181 #if LLVM_ENABLE_THREADS
182  // Grow to ensure that we have at least `requested` Threads, but do not go
183  // over MaxThreadCount.
184  void grow(int requested);
185 
186  void processTasks(ThreadPoolTaskGroup *WaitingForGroup);
187 #endif
188 
189  /// Threads in flight
190  std::vector<llvm::thread> Threads;
191  /// Lock protecting access to the Threads vector.
192  mutable llvm::sys::RWMutex ThreadsLock;
193 
194  /// Tasks waiting for execution in the pool.
195  std::deque<std::pair<std::function<void()>, ThreadPoolTaskGroup *>> Tasks;
196 
197  /// Locking and signaling for accessing the Tasks queue.
198  std::mutex QueueLock;
199  std::condition_variable QueueCondition;
200 
201  /// Signaling for job completion (all tasks or all tasks in a group).
202  std::condition_variable CompletionCondition;
203 
204  /// Keep track of the number of thread actually busy
205  unsigned ActiveThreads = 0;
206  /// Number of threads active for tasks in the given group (only non-zero).
207  DenseMap<ThreadPoolTaskGroup *, unsigned> ActiveGroups;
208 
209 #if LLVM_ENABLE_THREADS // avoids warning for unused variable
210  /// Signal for the destruction of the pool, asking thread to exit.
211  bool EnableFlag = true;
212 #endif
213 
214  const ThreadPoolStrategy Strategy;
215 
216  /// Maximum number of threads to potentially grow this pool to.
217  const unsigned MaxThreadCount;
218 };
219 
220 /// A group of tasks to be run on a thread pool. Thread pool tasks in different
221 /// groups can run on the same threadpool but can be waited for separately.
222 /// It is even possible for tasks of one group to submit and wait for tasks
223 /// of another group, as long as this does not form a loop.
225 public:
226  /// The ThreadPool argument is the thread pool to forward calls to.
227  ThreadPoolTaskGroup(ThreadPool &Pool) : Pool(Pool) {}
228 
229  /// Blocking destructor: will wait for all the tasks in the group to complete
230  /// by calling ThreadPool::wait().
232 
233  /// Calls ThreadPool::async() for this group.
234  template <typename Function, typename... Args>
235  inline auto async(Function &&F, Args &&...ArgList) {
236  return Pool.async(*this, std::forward<Function>(F),
237  std::forward<Args>(ArgList)...);
238  }
239 
240  /// Calls ThreadPool::wait() for this group.
241  void wait() { Pool.wait(*this); }
242 
243 private:
244  ThreadPool &Pool;
245 };
246 
247 } // namespace llvm
248 
249 #endif // LLVM_SUPPORT_THREADPOOL_H
llvm::hardware_concurrency
ThreadPoolStrategy hardware_concurrency(unsigned ThreadCount=0)
Returns a default thread strategy where all available hardware resources are to be used,...
Definition: Threading.h:185
llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:17
llvm::ThreadPool
A ThreadPool for asynchronous parallel execution on a defined number of threads.
Definition: ThreadPool.h:52
llvm::Function
Definition: Function.h:60
RWMutex.h
llvm::ThreadPoolStrategy
This tells how a thread pool will be used.
Definition: Threading.h:116
llvm::ThreadPoolTaskGroup::ThreadPoolTaskGroup
ThreadPoolTaskGroup(ThreadPool &Pool)
The ThreadPool argument is the thread pool to forward calls to.
Definition: ThreadPool.h:227
llvm::ThreadPool::ThreadPool
ThreadPool(ThreadPoolStrategy S=hardware_concurrency())
Construct a pool using the hardware strategy S for mapping hardware execution resources (threads,...
Definition: ThreadPool.cpp:35
DenseMap.h
F
#define F(x, y, z)
Definition: MD5.cpp:55
llvm::RISCVFenceField::R
@ R
Definition: RISCVBaseInfo.h:240
llvm::ThreadPoolTaskGroup::~ThreadPoolTaskGroup
~ThreadPoolTaskGroup()
Blocking destructor: will wait for all the tasks in the group to complete by calling ThreadPool::wait...
Definition: ThreadPool.h:231
llvm::ThreadPool::getThreadCount
unsigned getThreadCount() const
Definition: ThreadPool.h:110
Threading.h
llvm::ThreadPoolTaskGroup
A group of tasks to be run on a thread pool.
Definition: ThreadPool.h:224
move
compiles ldr LCPI1_0 ldr ldr mov lsr tst moveq r1 ldr LCPI1_1 and r0 bx lr It would be better to do something like to fold the shift into the conditional move
Definition: README.txt:546
llvm::ThreadPool::isWorkerThread
bool isWorkerThread() const
Returns true if the current thread is a worker thread of this thread pool.
Definition: ThreadPool.cpp:168
llvm::ThreadPoolTaskGroup::wait
void wait()
Calls ThreadPool::wait() for this group.
Definition: ThreadPool.h:241
llvm::ThreadPool::~ThreadPool
~ThreadPool()
Blocking destructor: the pool will wait for all the threads to complete.
Definition: ThreadPool.cpp:178
assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
function
print Print MemDeps of function
Definition: MemDepPrinter.cpp:82
llvm::ThreadPool::async
auto async(ThreadPoolTaskGroup &Group, Func &&F) -> std::shared_future< decltype(F())>
Definition: ThreadPool.h:89
llvm::ThreadPool::async
auto async(Func &&F) -> std::shared_future< decltype(F())>
Asynchronous submission of a task to the pool.
Definition: ThreadPool.h:83
llvm::ThreadPool::async
auto async(Function &&F, Args &&...ArgList)
Asynchronous submission of a task to the pool.
Definition: ThreadPool.h:66
S
add sub stmia L5 ldr r0 bl L_printf $stub Instead of a and a wouldn t it be better to do three moves *Return an aggregate type is even return S
Definition: README.txt:210
llvm::ThreadPool::async
auto async(ThreadPoolTaskGroup &Group, Function &&F, Args &&...ArgList)
Overload, task will be in the given task group.
Definition: ThreadPool.h:74
llvm::ThreadPoolTaskGroup::async
auto async(Function &&F, Args &&...ArgList)
Calls ThreadPool::async() for this group.
Definition: ThreadPool.h:235
llvm::ThreadPool::wait
void wait()
Blocking wait for all the threads to complete and the queue to be empty.
Definition: ThreadPool.cpp:143
llvm::sys::SmartRWMutex< false >
thread.h
llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition: AMDGPUMetadata.h:394