include/marl/scheduler.h - SwiftShader - Git at Google

 // Copyright 2019 The Marl Authors.
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //     https://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.

 #ifndef marl_scheduler_h
 #define marl_scheduler_h

 #include "debug.h"
 #include "memory.h"
 #include "sal.h"

 #include <array>
 #include <atomic>
 #include <chrono>
 #include <condition_variable>
 #include <functional>
 #include <map>
 #include <mutex>
 #include <queue>
 #include <set>
 #include <thread>
 #include <unordered_map>
 #include <unordered_set>

 namespace marl {

 class OSFiber;

 // Task is a unit of work for the scheduler.
 using Task = std::function<void()>;

 // Scheduler asynchronously processes Tasks.
 // A scheduler can be bound to one or more threads using the bind() method.
 // Once bound to a thread, that thread can call marl::schedule() to enqueue
 // work tasks to be executed asynchronously.
 // All threads must be unbound with unbind() before the scheduler is destructed.
 // Scheduler are initially constructed in single-threaded mode.
 // Call setWorkerThreadCount() to spawn dedicated worker threads.
 class Scheduler {
   class Worker;

  public:
   using TimePoint = std::chrono::system_clock::time_point;
   using Predicate = std::function<bool()>;

   Scheduler(Allocator* allocator = Allocator::Default);

   // Destructor.
   // Ensure that all threads are unbound before calling - failure to do so may
   // result in leaked memory.
   ~Scheduler();

   // get() returns the scheduler bound to the current thread.
   static Scheduler* get();

   // bind() binds this scheduler to the current thread.
   // There must be no existing scheduler bound to the thread prior to calling.
   void bind();

   // unbind() unbinds the scheduler currently bound to the current thread.
   // There must be a existing scheduler bound to the thread prior to calling.
   // unbind() flushes any enqueued tasks on the single-threaded worker before
   // returning.
   static void unbind();

   // enqueue() queues the task for asynchronous execution.
   void enqueue(Task&& task);

   // setThreadInitializer() sets the worker thread initializer function which
   // will be called for each new worker thread spawned.
   // The initializer will only be called on newly created threads (call
   // setThreadInitializer() before setWorkerThreadCount()).
   void setThreadInitializer(const std::function<void()>& init);

   // getThreadInitializer() returns the thread initializer function set by
   // setThreadInitializer().
   const std::function<void()>& getThreadInitializer();

   // setWorkerThreadCount() adjusts the number of dedicated worker threads.
   // A count of 0 puts the scheduler into single-threaded mode.
   // Note: Currently the number of threads cannot be adjusted once tasks
   // have been enqueued. This restriction may be lifted at a later time.
   void setWorkerThreadCount(int count);

   // getWorkerThreadCount() returns the number of worker threads.
   int getWorkerThreadCount();

   // Fibers expose methods to perform cooperative multitasking and are
   // automatically created by the Scheduler.
   //
   // The currently executing Fiber can be obtained by calling Fiber::current().
   //
   // When execution becomes blocked, yield() can be called to suspend execution
   // of the fiber and start executing other pending work. Once the block has
   // been lifted, schedule() can be called to reschedule the Fiber on the same
   // thread that previously executed it.
   class Fiber {
    public:
     using Lock = std::unique_lock<std::mutex>;

     // current() returns the currently executing fiber, or nullptr if called
     // without a bound scheduler.
     static Fiber* current();

     // wait() suspends execution of this Fiber until the Fiber is woken up with
     // a call to notify() and the predicate pred returns true.
     // If the predicate pred does not return true when notify() is called, then
     // the Fiber is automatically re-suspended, and will need to be woken with
     // another call to notify().
     // While the Fiber is suspended, the scheduler thread may continue executing
     // other tasks.
     // lock must be locked before calling, and is unlocked by wait() just before
     // the Fiber is suspended, and re-locked before the fiber is resumed. lock
     // will be locked before wait() returns.
     // pred will be always be called with the lock held.
     // wait() must only be called on the currently executing fiber.
     _Requires_lock_held_(lock)
     void wait(Lock& lock, const Predicate& pred);

     // wait() suspends execution of this Fiber until the Fiber is woken up with
     // a call to notify() and the predicate pred returns true, or sometime after
     // the timeout is reached.
     // If the predicate pred does not return true when notify() is called, then
     // the Fiber is automatically re-suspended, and will need to be woken with
     // another call to notify() or will be woken sometime after the timeout is
     // reached.
     // While the Fiber is suspended, the scheduler thread may continue executing
     // other tasks.
     // lock must be locked before calling, and is unlocked by wait() just before
     // the Fiber is suspended, and re-locked before the fiber is resumed. lock
     // will be locked before wait() returns.
     // pred will be always be called with the lock held.
     // wait() must only be called on the currently executing fiber.
     _Requires_lock_held_(lock)
     template <typename Clock, typename Duration>
     inline bool wait(Lock& lock,
                      const std::chrono::time_point<Clock, Duration>& timeout,
                      const Predicate& pred);

     // notify() reschedules the suspended Fiber for execution.
     // notify() is usually only called when the predicate for one or more wait()
     // calls will likely return true.
     void notify();

     // id is the thread-unique identifier of the Fiber.
     uint32_t const id;

    private:
     friend class Allocator;
     friend class Scheduler;

     enum class State {
       // Idle: the Fiber is currently unused, and sits in Worker::idleFibers,
       // ready to be recycled.
       Idle,

       // Yielded: the Fiber is currently blocked on a wait() call with no
       // timeout.
       Yielded,

       // Waiting: the Fiber is currently blocked on a wait() call with a
       // timeout. The fiber is stilling in the Worker::Work::waiting queue.
       Waiting,

       // Queued: the Fiber is currently queued for execution in the
       // Worker::Work::fibers queue.
       Queued,

       // Running: the Fiber is currently executing.
       Running,
     };

     Fiber(Allocator::unique_ptr<OSFiber>&&, uint32_t id);

     // switchTo() switches execution to the given fiber.
     // switchTo() must only be called on the currently executing fiber.
     void switchTo(Fiber*);

     // create() constructs and returns a new fiber with the given identifier,
     // stack size that will executed func when switched to.
     static Allocator::unique_ptr<Fiber> create(
         Allocator* allocator,
         uint32_t id,
         size_t stackSize,
         const std::function<void()>& func);

     // createFromCurrentThread() constructs and returns a new fiber with the
     // given identifier for the current thread.
     static Allocator::unique_ptr<Fiber> createFromCurrentThread(
         Allocator* allocator,
         uint32_t id);

     // toString() returns a string representation of the given State.
     // Used for debugging.
     static const char* toString(State state);

     Allocator::unique_ptr<OSFiber> const impl;
     Worker* const worker;
     State state = State::Running;  // Guarded by Worker's work.mutex.
   };

  private:
   Scheduler(const Scheduler&) = delete;
   Scheduler(Scheduler&&) = delete;
   Scheduler& operator=(const Scheduler&) = delete;
   Scheduler& operator=(Scheduler&&) = delete;

   // Stack size in bytes of a new fiber.
   // TODO: Make configurable so the default size can be reduced.
   static constexpr size_t FiberStackSize = 1024 * 1024;

   // Maximum number of worker threads.
   static constexpr size_t MaxWorkerThreads = 256;

   // WaitingFibers holds all the fibers waiting on a timeout.
   struct WaitingFibers {
     // operator bool() returns true iff there are any wait fibers.
     inline operator bool() const;

     // take() returns the next fiber that has exceeded its timeout, or nullptr
     // if there are no fibers that have yet exceeded their timeouts.
     inline Fiber* take(const TimePoint& timepoint);

     // next() returns the timepoint of the next fiber to timeout.
     // next() can only be called if operator bool() returns true.
     inline TimePoint next() const;

     // add() adds another fiber and timeout to the list of waiting fibers.
     inline void add(const TimePoint& timeout, Fiber* fiber);

     // erase() removes the fiber from the waiting list.
     inline void erase(Fiber* fiber);

     // contains() returns true if fiber is waiting.
     inline bool contains(Fiber* fiber) const;

    private:
     struct Timeout {
       TimePoint timepoint;
       Fiber* fiber;
       inline bool operator<(const Timeout&) const;
     };
     std::set<Timeout> timeouts;
     std::unordered_map<Fiber*, TimePoint> fibers;
   };

   // TODO: Implement a queue that recycles elements to reduce number of
   // heap allocations.
   using TaskQueue = std::queue<Task>;
   using FiberQueue = std::queue<Fiber*>;
   using FiberSet = std::unordered_set<Fiber*>;

   // Workers executes Tasks on a single thread.
   // Once a task is started, it may yield to other tasks on the same Worker.
   // Tasks are always resumed by the same Worker.
   class Worker {
    public:
     enum class Mode {
       // Worker will spawn a background thread to process tasks.
       MultiThreaded,

       // Worker will execute tasks whenever it yields.
       SingleThreaded,
     };

     Worker(Scheduler* scheduler, Mode mode, uint32_t id);

     // start() begins execution of the worker.
     void start();

     // stop() ceases execution of the worker, blocking until all pending
     // tasks have fully finished.
     void stop();

     // wait() suspends execution of the current task until the predicate pred
     // returns true.
     // See Fiber::wait() for more information.
     _Requires_lock_held_(lock)
     bool wait(Fiber::Lock& lock,
               const TimePoint* timeout,
               const Predicate& pred);

     // suspend() suspends the currenetly executing Fiber until the fiber is
     // woken with a call to enqueue(Fiber*), or automatically sometime after the
     // optional timeout.
     _Requires_lock_held_(work.mutex)
     void suspend(const TimePoint* timeout);

     // enqueue(Fiber*) enqueues resuming of a suspended fiber.
     void enqueue(Fiber* fiber);

     // enqueue(Task&&) enqueues a new, unstarted task.
     void enqueue(Task&& task);

     // tryLock() attempts to lock the worker for task enqueing.
     // If the lock was successful then true is returned, and the caller must
     // call enqueueAndUnlock().
     _When_(return == true, _Acquires_lock_(work.mutex))
     bool tryLock();

     // enqueueAndUnlock() enqueues the task and unlocks the worker.
     // Must only be called after a call to tryLock() which returned true.
     _Requires_lock_held_(work.mutex)
     _Releases_lock_(work.mutex)
     void enqueueAndUnlock(Task&& task);

     // flush() processes all pending tasks before returning.
     void flush();

     // dequeue() attempts to take a Task from the worker. Returns true if
     // a task was taken and assigned to out, otherwise false.
     bool dequeue(Task& out);

     // getCurrent() returns the Worker currently bound to the current
     // thread.
     static inline Worker* getCurrent();

     // getCurrentFiber() returns the Fiber currently being executed.
     inline Fiber* getCurrentFiber() const;

     // Unique identifier of the Worker.
     const uint32_t id;

    private:
     // run() is the task processing function for the worker.
     // If the worker was constructed in Mode::MultiThreaded, run() will
     // continue to process tasks until stop() is called.
     // If the worker was constructed in Mode::SingleThreaded, run() call
     // flush() and return.
     void run();

     // createWorkerFiber() creates a new fiber that when executed calls
     // run().
     Fiber* createWorkerFiber();

     // switchToFiber() switches execution to the given fiber. The fiber
     // must belong to this worker.
     void switchToFiber(Fiber*);

     // runUntilIdle() executes all pending tasks and then returns.
     _Requires_lock_held_(work.mutex)
     void runUntilIdle();

     // waitForWork() blocks until new work is available, potentially calling
     // spinForWork().
     _Requires_lock_held_(work.mutex)
     void waitForWork();

     // spinForWork() attempts to steal work from another Worker, and keeps
     // the thread awake for a short duration. This reduces overheads of
     // frequently putting the thread to sleep and re-waking.
     void spinForWork();

     // enqueueFiberTimeouts() enqueues all the fibers that have finished
     // waiting.
     _Requires_lock_held_(work.mutex)
     void enqueueFiberTimeouts();

     _Requires_lock_held_(work.mutex)
     inline void changeFiberState(Fiber* fiber,
                                  Fiber::State from,
                                  Fiber::State to) const;

     _Requires_lock_held_(work.mutex)
     inline void setFiberState(Fiber* fiber, Fiber::State to) const;

     // numBlockedFibers() returns the number of fibers currently blocked and
     // held externally.
     inline size_t numBlockedFibers() const {
       return workerFibers.size() - idleFibers.size();
     }

     // Work holds tasks and fibers that are enqueued on the Worker.
     struct Work {
       std::atomic<uint64_t> num = {0};  // tasks.size() + fibers.size()
       _Guarded_by_(mutex) TaskQueue tasks;
       _Guarded_by_(mutex) FiberQueue fibers;
       _Guarded_by_(mutex) WaitingFibers waiting;
       std::condition_variable added;
       std::mutex mutex;
     };

     // https://en.wikipedia.org/wiki/Xorshift
     class FastRnd {
      public:
       inline uint64_t operator()() {
         x ^= x << 13;
         x ^= x >> 7;
         x ^= x << 17;
         return x;
       }

      private:
       uint64_t x = std::chrono::system_clock::now().time_since_epoch().count();
     };

     // The current worker bound to the current thread.
     static thread_local Worker* current;

     Mode const mode;
     Scheduler* const scheduler;
     Allocator::unique_ptr<Fiber> mainFiber;
     Fiber* currentFiber = nullptr;
     std::thread thread;
     Work work;
     FiberSet idleFibers;  // Fibers that have completed which can be reused.
     std::vector<Allocator::unique_ptr<Fiber>>
         workerFibers;  // All fibers created by this worker.
     FastRnd rng;
     std::atomic<bool> shutdown = {false};
   };

   // stealWork() attempts to steal a task from the worker with the given id.
   // Returns true if a task was stolen and assigned to out, otherwise false.
   bool stealWork(Worker* thief, uint64_t from, Task& out);

   // onBeginSpinning() is called when a Worker calls spinForWork().
   // The scheduler will prioritize this worker for new tasks to try to prevent
   // it going to sleep.
   void onBeginSpinning(int workerId);

   // The scheduler currently bound to the current thread.
   static thread_local Scheduler* bound;

   Allocator* const allocator;

   std::function<void()> threadInitFunc;
   std::mutex threadInitFuncMutex;

   std::array<std::atomic<int>, 8> spinningWorkers;
   std::atomic<unsigned int> nextSpinningWorkerIdx = {0x8000000};

   // TODO: Make this lot thread-safe so setWorkerThreadCount() can be called
   // during execution of tasks.
   std::atomic<unsigned int> nextEnqueueIndex = {0};
   unsigned int numWorkerThreads = 0;
   std::array<Worker*, MaxWorkerThreads> workerThreads;

   std::mutex singleThreadedWorkerMutex;
   std::unordered_map<std::thread::id, Allocator::unique_ptr<Worker>>
       singleThreadedWorkers;
 };

 _Requires_lock_held_(lock)
 template <typename Clock, typename Duration>
 bool Scheduler::Fiber::wait(
     Lock& lock,
     const std::chrono::time_point<Clock, Duration>& timeout,
     const Predicate& pred) {
   using ToDuration = typename TimePoint::duration;
   using ToClock = typename TimePoint::clock;
   auto tp = std::chrono::time_point_cast<ToDuration, ToClock>(timeout);
   return worker->wait(lock, &tp, pred);
 }

 Scheduler::Worker* Scheduler::Worker::getCurrent() {
   return Worker::current;
 }

 Scheduler::Fiber* Scheduler::Worker::getCurrentFiber() const {
   return currentFiber;
 }

 // schedule() schedules the function f to be asynchronously called with the
 // given arguments using the currently bound scheduler.
 template <typename Function, typename... Args>
 inline void schedule(Function&& f, Args&&... args) {
   MARL_ASSERT_HAS_BOUND_SCHEDULER("marl::schedule");
   auto scheduler = Scheduler::get();
   scheduler->enqueue(
       std::bind(std::forward<Function>(f), std::forward<Args>(args)...));
 }

 // schedule() schedules the function f to be asynchronously called using the
 // currently bound scheduler.
 template <typename Function>
 inline void schedule(Function&& f) {
   MARL_ASSERT_HAS_BOUND_SCHEDULER("marl::schedule");
   auto scheduler = Scheduler::get();
   scheduler->enqueue(std::forward<Function>(f));
 }

 }  // namespace marl

 #endif  // marl_scheduler_h
	// Copyright 2019 The Marl Authors.
	//
	// Licensed under the Apache License, Version 2.0 (the "License");
	// you may not use this file except in compliance with the License.
	// You may obtain a copy of the License at
	//
	// https://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing, software
	// distributed under the License is distributed on an "AS IS" BASIS,
	// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	// See the License for the specific language governing permissions and
	// limitations under the License.

	#ifndef marl_scheduler_h
	#define marl_scheduler_h

	#include "debug.h"
	#include "memory.h"
	#include "sal.h"

	#include <array>
	#include <atomic>
	#include <chrono>
	#include <condition_variable>
	#include <functional>
	#include <map>
	#include <mutex>
	#include <queue>
	#include <set>
	#include <thread>
	#include <unordered_map>
	#include <unordered_set>

	namespace marl {

	class OSFiber;

	// Task is a unit of work for the scheduler.
	using Task = std::function<void()>;

	// Scheduler asynchronously processes Tasks.
	// A scheduler can be bound to one or more threads using the bind() method.
	// Once bound to a thread, that thread can call marl::schedule() to enqueue
	// work tasks to be executed asynchronously.
	// All threads must be unbound with unbind() before the scheduler is destructed.
	// Scheduler are initially constructed in single-threaded mode.
	// Call setWorkerThreadCount() to spawn dedicated worker threads.
	class Scheduler {
	class Worker;

	public:
	using TimePoint = std::chrono::system_clock::time_point;
	using Predicate = std::function<bool()>;

	Scheduler(Allocator* allocator = Allocator::Default);

	// Destructor.
	// Ensure that all threads are unbound before calling - failure to do so may
	// result in leaked memory.
	~Scheduler();

	// get() returns the scheduler bound to the current thread.
	static Scheduler* get();

	// bind() binds this scheduler to the current thread.
	// There must be no existing scheduler bound to the thread prior to calling.
	void bind();

	// unbind() unbinds the scheduler currently bound to the current thread.
	// There must be a existing scheduler bound to the thread prior to calling.
	// unbind() flushes any enqueued tasks on the single-threaded worker before
	// returning.
	static void unbind();

	// enqueue() queues the task for asynchronous execution.
	void enqueue(Task&& task);

	// setThreadInitializer() sets the worker thread initializer function which
	// will be called for each new worker thread spawned.
	// The initializer will only be called on newly created threads (call
	// setThreadInitializer() before setWorkerThreadCount()).
	void setThreadInitializer(const std::function<void()>& init);

	// getThreadInitializer() returns the thread initializer function set by
	// setThreadInitializer().
	const std::function<void()>& getThreadInitializer();

	// setWorkerThreadCount() adjusts the number of dedicated worker threads.
	// A count of 0 puts the scheduler into single-threaded mode.
	// Note: Currently the number of threads cannot be adjusted once tasks
	// have been enqueued. This restriction may be lifted at a later time.
	void setWorkerThreadCount(int count);

	// getWorkerThreadCount() returns the number of worker threads.
	int getWorkerThreadCount();

	// Fibers expose methods to perform cooperative multitasking and are
	// automatically created by the Scheduler.
	//
	// The currently executing Fiber can be obtained by calling Fiber::current().
	//
	// When execution becomes blocked, yield() can be called to suspend execution
	// of the fiber and start executing other pending work. Once the block has
	// been lifted, schedule() can be called to reschedule the Fiber on the same
	// thread that previously executed it.
	class Fiber {
	public:
	using Lock = std::unique_lock<std::mutex>;

	// current() returns the currently executing fiber, or nullptr if called
	// without a bound scheduler.
	static Fiber* current();

	// wait() suspends execution of this Fiber until the Fiber is woken up with
	// a call to notify() and the predicate pred returns true.
	// If the predicate pred does not return true when notify() is called, then
	// the Fiber is automatically re-suspended, and will need to be woken with
	// another call to notify().
	// While the Fiber is suspended, the scheduler thread may continue executing
	// other tasks.
	// lock must be locked before calling, and is unlocked by wait() just before
	// the Fiber is suspended, and re-locked before the fiber is resumed. lock
	// will be locked before wait() returns.
	// pred will be always be called with the lock held.
	// wait() must only be called on the currently executing fiber.
	_Requires_lock_held_(lock)
	void wait(Lock& lock, const Predicate& pred);

	// wait() suspends execution of this Fiber until the Fiber is woken up with
	// a call to notify() and the predicate pred returns true, or sometime after
	// the timeout is reached.
	// If the predicate pred does not return true when notify() is called, then
	// the Fiber is automatically re-suspended, and will need to be woken with
	// another call to notify() or will be woken sometime after the timeout is
	// reached.
	// While the Fiber is suspended, the scheduler thread may continue executing
	// other tasks.
	// lock must be locked before calling, and is unlocked by wait() just before
	// the Fiber is suspended, and re-locked before the fiber is resumed. lock
	// will be locked before wait() returns.
	// pred will be always be called with the lock held.
	// wait() must only be called on the currently executing fiber.
	_Requires_lock_held_(lock)
	template <typename Clock, typename Duration>
	inline bool wait(Lock& lock,
	const std::chrono::time_point<Clock, Duration>& timeout,
	const Predicate& pred);

	// notify() reschedules the suspended Fiber for execution.
	// notify() is usually only called when the predicate for one or more wait()
	// calls will likely return true.
	void notify();

	// id is the thread-unique identifier of the Fiber.
	uint32_t const id;

	private:
	friend class Allocator;
	friend class Scheduler;

	enum class State {
	// Idle: the Fiber is currently unused, and sits in Worker::idleFibers,
	// ready to be recycled.
	Idle,

	// Yielded: the Fiber is currently blocked on a wait() call with no
	// timeout.
	Yielded,

	// Waiting: the Fiber is currently blocked on a wait() call with a
	// timeout. The fiber is stilling in the Worker::Work::waiting queue.
	Waiting,

	// Queued: the Fiber is currently queued for execution in the
	// Worker::Work::fibers queue.
	Queued,

	// Running: the Fiber is currently executing.
	Running,
	};

	Fiber(Allocator::unique_ptr<OSFiber>&&, uint32_t id);

	// switchTo() switches execution to the given fiber.
	// switchTo() must only be called on the currently executing fiber.
	void switchTo(Fiber*);

	// create() constructs and returns a new fiber with the given identifier,
	// stack size that will executed func when switched to.
	static Allocator::unique_ptr<Fiber> create(
	Allocator* allocator,
	uint32_t id,
	size_t stackSize,
	const std::function<void()>& func);

	// createFromCurrentThread() constructs and returns a new fiber with the
	// given identifier for the current thread.
	static Allocator::unique_ptr<Fiber> createFromCurrentThread(
	Allocator* allocator,
	uint32_t id);

	// toString() returns a string representation of the given State.
	// Used for debugging.
	static const char* toString(State state);

	Allocator::unique_ptr<OSFiber> const impl;
	Worker* const worker;
	State state = State::Running; // Guarded by Worker's work.mutex.
	};

	private:
	Scheduler(const Scheduler&) = delete;
	Scheduler(Scheduler&&) = delete;
	Scheduler& operator=(const Scheduler&) = delete;
	Scheduler& operator=(Scheduler&&) = delete;

	// Stack size in bytes of a new fiber.
	// TODO: Make configurable so the default size can be reduced.
	static constexpr size_t FiberStackSize = 1024 * 1024;

	// Maximum number of worker threads.
	static constexpr size_t MaxWorkerThreads = 256;

	// WaitingFibers holds all the fibers waiting on a timeout.
	struct WaitingFibers {
	// operator bool() returns true iff there are any wait fibers.
	inline operator bool() const;

	// take() returns the next fiber that has exceeded its timeout, or nullptr
	// if there are no fibers that have yet exceeded their timeouts.
	inline Fiber* take(const TimePoint& timepoint);

	// next() returns the timepoint of the next fiber to timeout.
	// next() can only be called if operator bool() returns true.
	inline TimePoint next() const;

	// add() adds another fiber and timeout to the list of waiting fibers.
	inline void add(const TimePoint& timeout, Fiber* fiber);

	// erase() removes the fiber from the waiting list.
	inline void erase(Fiber* fiber);

	// contains() returns true if fiber is waiting.
	inline bool contains(Fiber* fiber) const;

	private:
	struct Timeout {
	TimePoint timepoint;
	Fiber* fiber;
	inline bool operator<(const Timeout&) const;
	};
	std::set<Timeout> timeouts;
	std::unordered_map<Fiber*, TimePoint> fibers;
	};

	// TODO: Implement a queue that recycles elements to reduce number of
	// heap allocations.
	using TaskQueue = std::queue<Task>;
	using FiberQueue = std::queue<Fiber*>;
	using FiberSet = std::unordered_set<Fiber*>;

	// Workers executes Tasks on a single thread.
	// Once a task is started, it may yield to other tasks on the same Worker.
	// Tasks are always resumed by the same Worker.
	class Worker {
	public:
	enum class Mode {
	// Worker will spawn a background thread to process tasks.
	MultiThreaded,

	// Worker will execute tasks whenever it yields.
	SingleThreaded,
	};

	Worker(Scheduler* scheduler, Mode mode, uint32_t id);

	// start() begins execution of the worker.
	void start();

	// stop() ceases execution of the worker, blocking until all pending
	// tasks have fully finished.
	void stop();

	// wait() suspends execution of the current task until the predicate pred
	// returns true.
	// See Fiber::wait() for more information.
	_Requires_lock_held_(lock)
	bool wait(Fiber::Lock& lock,
	const TimePoint* timeout,
	const Predicate& pred);

	// suspend() suspends the currenetly executing Fiber until the fiber is
	// woken with a call to enqueue(Fiber*), or automatically sometime after the
	// optional timeout.
	_Requires_lock_held_(work.mutex)
	void suspend(const TimePoint* timeout);

	// enqueue(Fiber*) enqueues resuming of a suspended fiber.
	void enqueue(Fiber* fiber);

	// enqueue(Task&&) enqueues a new, unstarted task.
	void enqueue(Task&& task);

	// tryLock() attempts to lock the worker for task enqueing.
	// If the lock was successful then true is returned, and the caller must
	// call enqueueAndUnlock().
	_When_(return == true, _Acquires_lock_(work.mutex))
	bool tryLock();

	// enqueueAndUnlock() enqueues the task and unlocks the worker.
	// Must only be called after a call to tryLock() which returned true.
	_Requires_lock_held_(work.mutex)
	_Releases_lock_(work.mutex)
	void enqueueAndUnlock(Task&& task);

	// flush() processes all pending tasks before returning.
	void flush();

	// dequeue() attempts to take a Task from the worker. Returns true if
	// a task was taken and assigned to out, otherwise false.
	bool dequeue(Task& out);

	// getCurrent() returns the Worker currently bound to the current
	// thread.
	static inline Worker* getCurrent();

	// getCurrentFiber() returns the Fiber currently being executed.
	inline Fiber* getCurrentFiber() const;

	// Unique identifier of the Worker.
	const uint32_t id;

	private:
	// run() is the task processing function for the worker.
	// If the worker was constructed in Mode::MultiThreaded, run() will
	// continue to process tasks until stop() is called.
	// If the worker was constructed in Mode::SingleThreaded, run() call
	// flush() and return.
	void run();

	// createWorkerFiber() creates a new fiber that when executed calls
	// run().
	Fiber* createWorkerFiber();

	// switchToFiber() switches execution to the given fiber. The fiber
	// must belong to this worker.
	void switchToFiber(Fiber*);

	// runUntilIdle() executes all pending tasks and then returns.
	_Requires_lock_held_(work.mutex)
	void runUntilIdle();

	// waitForWork() blocks until new work is available, potentially calling
	// spinForWork().
	_Requires_lock_held_(work.mutex)
	void waitForWork();

	// spinForWork() attempts to steal work from another Worker, and keeps
	// the thread awake for a short duration. This reduces overheads of
	// frequently putting the thread to sleep and re-waking.
	void spinForWork();

	// enqueueFiberTimeouts() enqueues all the fibers that have finished
	// waiting.
	_Requires_lock_held_(work.mutex)
	void enqueueFiberTimeouts();

	_Requires_lock_held_(work.mutex)
	inline void changeFiberState(Fiber* fiber,
	Fiber::State from,
	Fiber::State to) const;

	_Requires_lock_held_(work.mutex)
	inline void setFiberState(Fiber* fiber, Fiber::State to) const;

	// numBlockedFibers() returns the number of fibers currently blocked and
	// held externally.
	inline size_t numBlockedFibers() const {
	return workerFibers.size() - idleFibers.size();
	}

	// Work holds tasks and fibers that are enqueued on the Worker.
	struct Work {
	std::atomic<uint64_t> num = {0}; // tasks.size() + fibers.size()
	_Guarded_by_(mutex) TaskQueue tasks;
	_Guarded_by_(mutex) FiberQueue fibers;
	_Guarded_by_(mutex) WaitingFibers waiting;
	std::condition_variable added;
	std::mutex mutex;
	};

	// https://en.wikipedia.org/wiki/Xorshift
	class FastRnd {
	public:
	inline uint64_t operator()() {
	x ^= x << 13;
	x ^= x >> 7;
	x ^= x << 17;
	return x;
	}

	private:
	uint64_t x = std::chrono::system_clock::now().time_since_epoch().count();
	};

	// The current worker bound to the current thread.
	static thread_local Worker* current;

	Mode const mode;
	Scheduler* const scheduler;
	Allocator::unique_ptr<Fiber> mainFiber;
	Fiber* currentFiber = nullptr;
	std::thread thread;
	Work work;
	FiberSet idleFibers; // Fibers that have completed which can be reused.
	std::vector<Allocator::unique_ptr<Fiber>>
	workerFibers; // All fibers created by this worker.
	FastRnd rng;
	std::atomic<bool> shutdown = {false};
	};

	// stealWork() attempts to steal a task from the worker with the given id.
	// Returns true if a task was stolen and assigned to out, otherwise false.
	bool stealWork(Worker* thief, uint64_t from, Task& out);

	// onBeginSpinning() is called when a Worker calls spinForWork().
	// The scheduler will prioritize this worker for new tasks to try to prevent
	// it going to sleep.
	void onBeginSpinning(int workerId);

	// The scheduler currently bound to the current thread.
	static thread_local Scheduler* bound;

	Allocator* const allocator;

	std::function<void()> threadInitFunc;
	std::mutex threadInitFuncMutex;

	std::array<std::atomic<int>, 8> spinningWorkers;
	std::atomic<unsigned int> nextSpinningWorkerIdx = {0x8000000};

	// TODO: Make this lot thread-safe so setWorkerThreadCount() can be called
	// during execution of tasks.
	std::atomic<unsigned int> nextEnqueueIndex = {0};
	unsigned int numWorkerThreads = 0;
	std::array<Worker*, MaxWorkerThreads> workerThreads;

	std::mutex singleThreadedWorkerMutex;
	std::unordered_map<std::thread::id, Allocator::unique_ptr<Worker>>
	singleThreadedWorkers;
	};

	_Requires_lock_held_(lock)
	template <typename Clock, typename Duration>
	bool Scheduler::Fiber::wait(
	Lock& lock,
	const std::chrono::time_point<Clock, Duration>& timeout,
	const Predicate& pred) {
	using ToDuration = typename TimePoint::duration;
	using ToClock = typename TimePoint::clock;
	auto tp = std::chrono::time_point_cast<ToDuration, ToClock>(timeout);
	return worker->wait(lock, &tp, pred);
	}

	Scheduler::Worker* Scheduler::Worker::getCurrent() {
	return Worker::current;
	}

	Scheduler::Fiber* Scheduler::Worker::getCurrentFiber() const {
	return currentFiber;
	}

	// schedule() schedules the function f to be asynchronously called with the
	// given arguments using the currently bound scheduler.
	template <typename Function, typename... Args>
	inline void schedule(Function&& f, Args&&... args) {
	MARL_ASSERT_HAS_BOUND_SCHEDULER("marl::schedule");
	auto scheduler = Scheduler::get();
	scheduler->enqueue(
	std::bind(std::forward<Function>(f), std::forward<Args>(args)...));
	}

	// schedule() schedules the function f to be asynchronously called using the
	// currently bound scheduler.
	template <typename Function>
	inline void schedule(Function&& f) {
	MARL_ASSERT_HAS_BOUND_SCHEDULER("marl::schedule");
	auto scheduler = Scheduler::get();
	scheduler->enqueue(std::forward<Function>(f));
	}

	} // namespace marl

	#endif // marl_scheduler_h