doxygen/Threading_8h_source.html

//===-- llvm/Support/Threading.h - Control multithreading mode --*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file declares helper functions for running LLVM in a multi-threaded

// environment.

//

//===----------------------------------------------------------------------===//


#ifndef LLVM_SUPPORT_THREADING_H

#define LLVM_SUPPORT_THREADING_H


#include "llvm/ADT/BitVector.h"

#include "llvm/ADT/StringRef.h"

#include "llvm/Config/llvm-config.h" // for LLVM_ON_UNIX

#include "llvm/Support/Compiler.h"

#include <optional>


#if defined(_MSC_VER)

// MSVC's call_once implementation worked since VS 2015, which is the minimum

// supported version as of this writing.

#define LLVM_THREADING_USE_STD_CALL_ONCE 1

#elif defined(LLVM_ON_UNIX) &&                                                 \

    (defined(_LIBCPP_VERSION) ||                                               \

     !(defined(__NetBSD__) || defined(__OpenBSD__) || defined(__powerpc__)))

// std::call_once from libc++ is used on all Unix platforms. Other

// implementations like libstdc++ are known to have problems on NetBSD,

// OpenBSD and PowerPC.

#define LLVM_THREADING_USE_STD_CALL_ONCE 1

#elif defined(LLVM_ON_UNIX) &&                                                 \

    (defined(__powerpc__) && defined(__LITTLE_ENDIAN__))

// Little-endian PowerPC on Unix also uses std::call_once, even when the
// standard library is not libc++.
// NOTE(review): presumably the PowerPC problems mentioned above only affect
// big-endian targets -- confirm.
#define LLVM_THREADING_USE_STD_CALL_ONCE 1

#else

// Everything else uses the generic implementation in llvm::call_once that is
// built on llvm/Support/Atomic.h.
#define LLVM_THREADING_USE_STD_CALL_ONCE 0

#endif


#if LLVM_THREADING_USE_STD_CALL_ONCE

#include <mutex>

#else

#include "llvm/Support/Atomic.h"

#endif


namespace llvm {

class Twine;


/// Reports whether this build of LLVM was compiled with support for
/// multi-threading.
///
/// \returns the value of the LLVM_ENABLE_THREADS configuration macro,
/// converted to bool. The function is constexpr, so the result can be used in
/// constant expressions.
constexpr bool llvm_is_multithreaded() {
  return LLVM_ENABLE_THREADS;
}


#if LLVM_THREADING_USE_STD_CALL_ONCE


/// When std::call_once is used (LLVM_THREADING_USE_STD_CALL_ONCE is non-zero),
/// llvm::once_flag is simply an alias for std::once_flag.
using once_flag = std::once_flag;


#else


  /// States stored in the status word of the fallback once_flag and driven by
  /// llvm::call_once: Uninitialized is the initial value, Wait is installed by
  /// the compare-and-swap before the function is run, and Done is stored once
  /// the function has returned.
  enum InitStatus { Uninitialized = 0, Wait = 1, Done = 2 };


  /// The llvm::once_flag structure
  ///
  /// This type is modeled after std::once_flag to use with llvm::call_once.
  /// This structure must be used as an opaque object. It is a struct to force
  /// autoinitialization and behave like std::once_flag.
  struct once_flag {

    /// Holds one of the InitStatus values; starts out as Uninitialized and is
    /// updated by llvm::call_once.
    volatile sys::cas_flag status = Uninitialized;

  };


#endif


  /// Execute the function specified as a parameter once.
  ///
  /// Typical usage:
  /// \code
  ///   void foo() {...};
  ///   ...
  ///   static once_flag flag;
  ///   call_once(flag, foo);
  /// \endcode
  ///
  /// \param flag Flag used for tracking whether or not this has run.
  /// \param F Function to call once.
  /// \param ArgList Arguments that are perfectly forwarded to \p F when it is
  /// invoked.
  template <typename Function, typename... Args>


  void call_once(once_flag &flag, Function &&F, Args &&... ArgList) {

#if LLVM_THREADING_USE_STD_CALL_ONCE

    // once_flag is std::once_flag in this configuration, so simply defer to
    // the standard library.
    std::call_once(flag, std::forward<Function>(F),

                   std::forward<Args>(ArgList)...);

#else

    // For other platforms we use a generic (if brittle) version based on our
    // atomics.
    //
    // Ask CompareAndSwap to replace Uninitialized with Wait. A result of
    // Uninitialized is taken to mean that this call performed the transition
    // and is therefore the one that has to run F.
    sys::cas_flag old_val = sys::CompareAndSwap(&flag.status, Wait, Uninitialized);

    if (old_val == Uninitialized) {

      // NOTE(review): if F exits via an exception, status is never set to
      // Done and the waiters in the else-branch would spin forever -- confirm
      // this is acceptable for the configurations that use this fallback.
      std::forward<Function>(F)(std::forward<Args>(ArgList)...);

      // Fence between running F and marking the flag as Done.
      sys::MemoryFence();

      // The Tsan* macros come from llvm/Support/Compiler.h; presumably they
      // describe the store below to ThreadSanitizer -- see that header.
      TsanIgnoreWritesBegin();

      TsanHappensBefore(&flag.status);

      flag.status = Done;

      TsanIgnoreWritesEnd();

    } else {

      // Wait until any thread doing the call has finished.
      // This is a busy-wait: status is re-read, with a fence after every
      // read, until it equals Done.
      sys::cas_flag tmp = flag.status;

      sys::MemoryFence();

      while (tmp != Done) {

        tmp = flag.status;

        sys::MemoryFence();

      }

    }

    // Reached on both paths, i.e. by the caller that ran F and by callers that
    // waited for it.
    TsanHappensAfter(&flag.status);

#endif

  }


  /// This tells how a thread pool will be used: how many threads are
  /// requested, whether hyper threads may be used, whether the request is
  /// capped to the hardware, and whether a GNU Make jobserver is consulted.
  class ThreadPoolStrategy {

  public:

    /// The default value (0) means all available threads should be used,
    /// taking the affinity mask into account. If set, this value only
    /// represents a suggested high bound, the runtime might choose a lower
    /// value (not higher).
    unsigned ThreadsRequested = 0;

    /// If SMT is active, use hyper threads. If false, there will be only one
    /// std::thread per core.
    bool UseHyperThreads = true;

    /// If set, will constrain 'ThreadsRequested' to the number of hardware
    /// threads, or hardware cores.
    bool Limit = false;

    /// Retrieves the max available threads for the current strategy. This
    /// accounts for affinity masks and takes advantage of all CPU sockets.
    LLVM_ABI unsigned compute_thread_count() const;

    /// Assign the current thread to an ideal hardware CPU or NUMA node. In a
    /// multi-socket system, this ensures threads are assigned to all CPU
    /// sockets.
    ///
    /// \param ThreadPoolNum a number bounded by [0, compute_thread_count()).
    LLVM_ABI void apply_thread_strategy(unsigned ThreadPoolNum) const;

    /// Finds the CPU socket where a thread should go.
    ///
    /// \param ThreadPoolNum the number of the thread within the pool.
    /// \returns the socket, or 'std::nullopt' if the thread shall remain on
    /// the actual CPU socket.
    LLVM_ABI std::optional<unsigned>

    compute_cpu_socket(unsigned ThreadPoolNum) const;

    /// If true, the thread pool will attempt to coordinate with a GNU Make
    /// jobserver, acquiring a job slot before processing a task. If no
    /// jobserver is found in the environment, this is ignored.
    bool UseJobserver = false;

  };


  /// Build a strategy from a number of threads as a string provided in \p Num.
  /// When Num is above the max number of threads specified by the \p Default
  /// strategy, we attempt to equally allocate the threads on all CPU sockets.
  /// "0" or an empty string will return the \p Default strategy, and "all"
  /// requests the use of all hardware threads.

  LLVM_ABI std::optional<ThreadPoolStrategy>

  get_threadpool_strategy(StringRef Num, ThreadPoolStrategy Default = {});


  /// Builds a thread strategy for tasks requiring significant memory or other
  /// resources, to be used for workloads where hardware_concurrency() proves
  /// to be less efficient. Avoid this strategy if doing lots of I/O.
  ///
  /// The returned strategy has hyper threads disabled: it is currently based
  /// on physical cores, if available for the host system, and otherwise falls
  /// back to hardware_concurrency(). The resulting thread count is 1 when LLVM
  /// is configured with LLVM_ENABLE_THREADS = OFF.
  ///
  /// \param ThreadCount Value stored as the strategy's ThreadsRequested; the
  /// default of 0 requests all available threads.
  inline ThreadPoolStrategy
  heavyweight_hardware_concurrency(unsigned ThreadCount = 0) {
    ThreadPoolStrategy Strategy;
    Strategy.ThreadsRequested = ThreadCount;
    Strategy.UseHyperThreads = false;
    return Strategy;
  }


  /// String-driven variant of heavyweight_hardware_concurrency(unsigned).
  /// \p Num is interpreted according to the rules described for
  /// get_threadpool_strategy(), using the default heavyweight strategy as the
  /// baseline.
  ///
  /// \returns the strategy produced by get_threadpool_strategy(), or, if it
  /// yields none (\p Num is invalid), the default heavyweight strategy where
  /// one thread per hardware core is used.
  inline ThreadPoolStrategy heavyweight_hardware_concurrency(StringRef Num) {
    if (std::optional<ThreadPoolStrategy> Parsed =
            get_threadpool_strategy(Num, heavyweight_hardware_concurrency()))
      return *Parsed;
    return heavyweight_hardware_concurrency();
  }


  /// Builds the default thread strategy, where all available hardware
  /// resources are to be used, except for those initially excluded by an
  /// affinity mask (affinity is taken into consideration). The resulting
  /// thread count is 1 when LLVM is configured with LLVM_ENABLE_THREADS=OFF.
  ///
  /// \param ThreadCount Value stored as the strategy's ThreadsRequested; the
  /// default of 0 requests all available threads.
  inline ThreadPoolStrategy hardware_concurrency(unsigned ThreadCount = 0) {
    ThreadPoolStrategy Strategy;
    Strategy.ThreadsRequested = ThreadCount;
    return Strategy;
  }


  /// String-driven variant of hardware_concurrency(unsigned). \p Num is
  /// interpreted according to the rules described for
  /// get_threadpool_strategy(), using the default hardware_concurrency()
  /// strategy as the baseline.
  ///
  /// \returns the strategy produced by get_threadpool_strategy(), or, if it
  /// yields none (\p Num is invalid), the default hardware_concurrency()
  /// strategy, i.e. all available threads with hyper threads enabled.
  inline ThreadPoolStrategy hardware_concurrency(StringRef Num) {
    if (std::optional<ThreadPoolStrategy> Parsed =
            get_threadpool_strategy(Num, hardware_concurrency()))
      return *Parsed;
    return hardware_concurrency();
  }


  /// Builds a thread strategy suited to executing the specified amount of
  /// tasks. This strategy should prevent us from creating too many threads if
  /// we occasionally have an unexpectedly small amount of tasks.
  ///
  /// \param TaskCount Number of tasks; stored as the strategy's
  /// ThreadsRequested, with Limit enabled so that the request is constrained
  /// to the hardware.
  inline ThreadPoolStrategy optimal_concurrency(unsigned TaskCount = 0) {
    ThreadPoolStrategy Strategy;
    Strategy.ThreadsRequested = TaskCount;
    Strategy.Limit = true;
    return Strategy;
  }


  /// Builds a thread strategy that attempts to coordinate with a GNU Make
  /// jobserver. The number of active threads will be limited by the number of
  /// available job slots. If no jobserver is detected in the environment, this
  /// strategy falls back to the default hardware_concurrency() behavior.
  inline ThreadPoolStrategy jobserver_concurrency() {
    ThreadPoolStrategy Strategy;
    // 0 means 'use all available'. Requesting every thread is still fine:
    // they will simply block waiting for a job slot if the jobserver is the
    // limiting factor.
    Strategy.ThreadsRequested = 0;
    Strategy.UseJobserver = true;
    return Strategy;
  }


  /// Return the current thread id, as used in various OS system calls.

  /// Note that not all platforms guarantee that the value returned will be

  /// unique across the entire system, so portable code should not assume

  /// this.

  LLVM_ABI uint64_t get_threadid();


  /// Get the maximum length of a thread name on this platform.

  /// A value of 0 means there is no limit.

  LLVM_ABI uint32_t get_max_thread_name_length();


  /// Set the name of the current thread.  Setting a thread's name can

  /// be helpful for enabling useful diagnostics under a debugger or when

  /// logging.  The level of support for setting a thread's name varies

  /// wildly across operating systems, and we only make a best effort to

  /// perform the operation on supported platforms.  No indication of success

  /// or failure is returned.

  LLVM_ABI void set_thread_name(const Twine &Name);


  /// Get the name of the current thread.  The level of support for

  /// getting a thread's name varies wildly across operating systems, and it

  /// is not even guaranteed that if you can successfully set a thread's name

  /// that you can later get it back.  This function is intended for diagnostic

  /// purposes, and as with setting a thread's name no indication of whether

  /// the operation succeeded or failed is returned.

  LLVM_ABI void get_thread_name(SmallVectorImpl<char> &Name);


  /// Returns a mask describing the hardware threads, cores, CPUs or NUMA
  /// groups on which the calling thread can be executed. On Windows, threads
  /// cannot cross CPU socket boundaries.

  LLVM_ABI llvm::BitVector get_thread_affinity_mask();


  /// Returns how many physical CPUs or NUMA groups the system has.

  LLVM_ABI unsigned get_cpus();


  /// Returns the number of physical cores (as opposed to the logical cores
  /// returned from thread::hardware_concurrency(), which include
  /// hyperthreads). Returns -1 if unknown for the current host system.

  LLVM_ABI int get_physical_cores();


  /// Priority levels for the current thread, passed to set_thread_priority().
  enum class ThreadPriority {

    /// Lower the current thread's priority as much as possible. Can be used
    /// for long-running tasks that are not time critical; more energy-
    /// efficient than Low.
    Background = 0,


    /// Lower the current thread's priority such that it does not affect
    /// foreground tasks significantly. This is a good default for long-
    /// running, latency-insensitive tasks to make sure cpu is not hogged
    /// by this task.
    Low = 1,


    /// Restore the current thread's priority to default scheduling priority.
    Default = 2,

  };


  /// Result type returned by set_thread_priority().
  enum class SetThreadPriorityResult { FAILURE, SUCCESS };

  /// Requests the priority described by \p Priority (see ThreadPriority) for
  /// the current thread.
  ///
  /// \returns a SetThreadPriorityResult value.
  /// NOTE(review): presumably SUCCESS when the priority was applied and
  /// FAILURE otherwise -- the implementation is not visible here, confirm.
  LLVM_ABI SetThreadPriorityResult set_thread_priority(ThreadPriority Priority);

}


#endif

BitVector.h
This file implements the BitVector class.

Compiler.h

TsanHappensBefore
#define TsanHappensBefore(cv)
Definition Compiler.h:617

TsanHappensAfter
#define TsanHappensAfter(cv)
Definition Compiler.h:618

LLVM_ABI
#define LLVM_ABI
Definition Compiler.h:213

TsanIgnoreWritesEnd
#define TsanIgnoreWritesEnd()
Definition Compiler.h:620

TsanIgnoreWritesBegin
#define TsanIgnoreWritesBegin()
Definition Compiler.h:619

F
#define F(x, y, z)
Definition MD5.cpp:54

StringRef.h

Atomic.h

ThreadCount
static cl::opt< int > ThreadCount("threads", cl::init(0))

llvm::BitVector
Definition BitVector.h:101

llvm::Function
Definition Function.h:64

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55

llvm::ThreadPoolStrategy
This tells how a thread pool will be used.
Definition Threading.h:115

llvm::ThreadPoolStrategy::Limit
bool Limit
Definition Threading.h:129

llvm::ThreadPoolStrategy::ThreadsRequested
unsigned ThreadsRequested
Definition Threading.h:121

llvm::ThreadPoolStrategy::UseHyperThreads
bool UseHyperThreads
Definition Threading.h:125

llvm::ThreadPoolStrategy::apply_thread_strategy
LLVM_ABI void apply_thread_strategy(unsigned ThreadPoolNum) const
Assign the current thread to an ideal hardware CPU or NUMA node.

llvm::ThreadPoolStrategy::compute_cpu_socket
LLVM_ABI std::optional< unsigned > compute_cpu_socket(unsigned ThreadPoolNum) const
Finds the CPU socket where a thread should go.

llvm::ThreadPoolStrategy::compute_thread_count
LLVM_ABI unsigned compute_thread_count() const
Retrieves the max available threads for the current strategy.
Definition Threading.cpp:42

llvm::ThreadPoolStrategy::UseJobserver
bool UseJobserver
If true, the thread pool will attempt to coordinate with a GNU Make jobserver, acquiring a job slot b...
Definition Threading.h:149

uint32_t

uint64_t

llvm::sys::MemoryFence
LLVM_ABI void MemoryFence()
Definition Atomic.cpp:30

llvm::sys::cas_flag
uint32_t cas_flag
Definition Atomic.h:35

llvm::sys::CompareAndSwap
LLVM_ABI cas_flag CompareAndSwap(volatile cas_flag *ptr, cas_flag new_value, cas_flag old_value)
Definition Atomic.cpp:44

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition Types.h:26

llvm::hardware_concurrency
ThreadPoolStrategy hardware_concurrency(unsigned ThreadCount=0)
Returns a default thread strategy where all available hardware resources are to be used,...
Definition Threading.h:190

llvm::heavyweight_hardware_concurrency
ThreadPoolStrategy heavyweight_hardware_concurrency(unsigned ThreadCount=0)
Returns a thread strategy for tasks requiring significant memory or other resources.
Definition Threading.h:167

llvm::jobserver_concurrency
ThreadPoolStrategy jobserver_concurrency()
Returns a thread strategy that attempts to coordinate with a GNU Make jobserver.
Definition Threading.h:222

llvm::ThreadPriority
ThreadPriority
Definition Threading.h:270

llvm::ThreadPriority::Low
@ Low
Lower the current thread's priority such that it does not affect foreground tasks significantly.
Definition Threading.h:280

llvm::ThreadPriority::Background
@ Background
Lower the current thread's priority as much as possible.
Definition Threading.h:274

llvm::llvm_is_multithreaded
constexpr bool llvm_is_multithreaded()
Returns true if LLVM is compiled with support for multi-threading, and false otherwise.
Definition Threading.h:52

llvm::InitStatus
InitStatus
Definition Threading.h:60

llvm::Uninitialized
@ Uninitialized
Definition Threading.h:60

llvm::Wait
@ Wait
Definition Threading.h:60

llvm::Done
@ Done
Definition Threading.h:60

llvm::get_thread_affinity_mask
LLVM_ABI llvm::BitVector get_thread_affinity_mask()
Returns a mask that represents on which hardware thread, core, CPU, NUMA group, the calling thread ca...
Definition Threading.cpp:40

llvm::get_max_thread_name_length
LLVM_ABI uint32_t get_max_thread_name_length()
Get the maximum length of a thread name on this platform.
Definition Threading.cpp:34

llvm::set_thread_priority
LLVM_ABI SetThreadPriorityResult set_thread_priority(ThreadPriority Priority)

llvm::get_cpus
LLVM_ABI unsigned get_cpus()
Returns how many physical CPUs or NUMA groups the system has.

llvm::optimal_concurrency
ThreadPoolStrategy optimal_concurrency(unsigned TaskCount=0)
Returns an optimal thread strategy to execute specified amount of tasks.
Definition Threading.h:211

llvm::set_thread_name
LLVM_ABI void set_thread_name(const Twine &Name)
Set the name of the current thread.
Definition Threading.cpp:36

llvm::SetThreadPriorityResult
SetThreadPriorityResult
Definition Threading.h:285

llvm::SetThreadPriorityResult::FAILURE
@ FAILURE
Definition Threading.h:285

llvm::SetThreadPriorityResult::SUCCESS
@ SUCCESS
Definition Threading.h:285

llvm::get_thread_name
LLVM_ABI void get_thread_name(SmallVectorImpl< char > &Name)
Get the name of the current thread.
Definition Threading.cpp:38

llvm::get_physical_cores
LLVM_ABI int get_physical_cores()
Returns how many physical cores (as opposed to logical cores returned from thread::hardware_concurren...
Definition Threading.cpp:48

llvm::get_threadpool_strategy
LLVM_ABI std::optional< ThreadPoolStrategy > get_threadpool_strategy(StringRef Num, ThreadPoolStrategy Default={})
Build a strategy from a number of threads as a string provided in Num.
Definition Threading.cpp:102

llvm::get_threadid
LLVM_ABI uint64_t get_threadid()
Return the current thread id, as used in various OS system calls.
Definition Threading.cpp:32

llvm::call_once
void call_once(once_flag &flag, Function &&F, Args &&... ArgList)
Execute the function specified as a parameter once.
Definition Threading.h:86

llvm::InstructionUniformity::Default
@ Default
The result values are uniform if and only if all operands are uniform.
Definition Uniformity.h:20

llvm::once_flag
The llvm::once_flag structure.
Definition Threading.h:67

llvm::once_flag::status
volatile sys::cas_flag status
Definition Threading.h:68