rpcs3/Utilities/cond.h

#pragma once

#include "types.h"
#include "util/atomic.hpp"
#include <shared_mutex>
#include "asm.h"

// Lightweight condition variable
class cond_variable
{
	// Internal waiter counter
	atomic_t<u32> m_value{0};

	enum : u32
	{
		c_waiter_mask = 0x1fff,
		c_signal_mask = 0xffffffff & ~c_waiter_mask,
	};

protected:
	// Increment waiter count
	u32 add_waiter() noexcept
	{
		return m_value.atomic_op([](u32& value) -> u32
		{
			if ((value & c_signal_mask) == c_signal_mask || (value & c_waiter_mask) == c_waiter_mask)
			{
				// Signal or waiter overflow, return immediately
				return 0;
			}

			value += c_waiter_mask & -c_waiter_mask;
			return value;
		});
	}

	// Internal waiting function
	void imp_wait(u32 _old, u64 _timeout) noexcept;

	// Try to notify up to _count threads
	void imp_wake(u32 _count) noexcept;

public:
	constexpr cond_variable() = default;

	// Intrusive wait algorithm for lockable objects
	template <typename T>
	void wait(T& object, u64 usec_timeout = -1) noexcept
	{
		const u32 _old = add_waiter();

		if (!_old)
		{
			return;
		}

		object.unlock();
		imp_wait(_old, usec_timeout);
		object.lock();
	}

	// Unlock all specified objects but don't lock them again
	template <typename... Locks>
	void wait_unlock(u64 usec_timeout, Locks&&... locks)
	{
		const u32 _old = add_waiter();
		(..., std::forward<Locks>(locks).unlock());

		if (!_old)
		{
			return;
		}

		imp_wait(_old, usec_timeout);
	}

	// Wake one thread
	void notify_one() noexcept
	{
		if (m_value)
		{
			imp_wake(1);
		}
	}

	// Wake all threads
	void notify_all() noexcept
	{
		if (m_value)
		{
			imp_wake(-1);
		}
	}

	static constexpr u64 max_timeout = UINT64_MAX / 1000;
};

// Condition variable fused with a pseudo-mutex supporting only reader locks (up to 32 readers).
// Each reader owns one "slot": bit N in the low 32-bit half plus bit N in the high
// 32-bit half of m_cvx32. A slot counts as used if either of its two bits is set.
class shared_cond
{
	// For information, shouldn't modify
	// (these are the bit patterns of slot 0; presumably other slots use the same
	// layout shifted left by the slot index - confirm against imp_wait/imp_notify)
	enum : u64
	{
		// Wait bit is aligned for compatibility with 32-bit futex.
		c_wait = 1,
		c_sig  = 1ull << 32,
		c_lock = 1ull << 32 | 1,
	};

	// Split in 32-bit parts for convenient bit combining
	atomic_t<u64> m_cvx32{0};

	// Scoped owner of one reader slot; releases the slot on destruction.
	// Converts to false when no slot could be obtained.
	class shared_lock
	{
		shared_cond* m_this;

		// Slot index in [0, 31], or 32 when no slot is held (failed or moved-from)
		u32 m_slot;

		friend class shared_cond;

	public:
		// Atomically reserve the lowest free slot of *_this
		shared_lock(shared_cond* _this) noexcept
			: m_this(_this)
		{
			// Lock and remember obtained slot index
			m_slot = m_this->m_cvx32.atomic_op([](u64& cvx32)
			{
				// Combine used bits and invert to find least significant bit unused.
				// The combined value fits in 32 bits, so the inverted value always has
				// its upper 32 bits set and the result cannot exceed 32.
				const u32 slot = static_cast<u32>(utils::cnttz64(~((cvx32 & 0xffffffff) | (cvx32 >> 32)), true));

				// Set lock bits (does nothing if all slots are used)
				// For slot == 32 the mask below evaluates to zero.
				const u64 bit = (1ull << slot) & 0xffffffff;
				cvx32 |= bit | (bit << 32);
				return slot;
			});
		}

		shared_lock(const shared_lock&) = delete;

		// Transfer slot ownership; rhs is left holding no slot.
		// Only copies a pointer and an integer, so it cannot throw: declared
		// noexcept for consistency with the rest of the class.
		shared_lock(shared_lock&& rhs) noexcept
			: m_this(rhs.m_this)
			, m_slot(rhs.m_slot)
		{
			// 32 marks "no slot", which turns rhs's destructor into a no-op clear
			rhs.m_slot = 32;
		}

		shared_lock& operator=(const shared_lock&) = delete;

		~shared_lock()
		{
			// Clear the slot (does nothing if all slots are used)
			// With m_slot == 32 the mask is zero, so no bits are cleared.
			const u64 bit = (1ull << m_slot) & 0xffffffff;
			m_this->m_cvx32 &= ~(bit | (bit << 32));
		}

		explicit operator bool() const noexcept
		{
			// Check success
			return m_slot < 32;
		}

		// Wait on the owning shared_cond using this lock's slot.
		// Returns the result of shared_cond::wait.
		bool wait(u64 usec_timeout = -1) const noexcept
		{
			return m_this->wait(*this, usec_timeout);
		}
	};

	// Out-of-line implementation details (defined elsewhere)
	bool imp_wait(u32 slot, u64 _timeout) noexcept;
	void imp_notify() noexcept;

public:
	constexpr shared_cond() = default;

	// Attempt to reserve a reader slot; test the returned object with
	// `explicit operator bool` to find out whether a slot was obtained.
	shared_lock try_shared_lock() noexcept
	{
		return shared_lock(this);
	}

	// Wait using the slot held by `lock`, which must have been created by this object.
	// Returns the result of imp_wait (NOTE(review): presumably true when notified
	// and false on timeout - confirm against the implementation).
	bool wait(shared_lock const& lock, u64 usec_timeout = -1) noexcept
	{
		AUDIT(lock.m_this == this);
		return imp_wait(lock.m_slot, usec_timeout);
	}

	// Notify through imp_notify, skipping the call when no bits are set at all
	void notify_all() noexcept
	{
		// Fast path: an all-zero state means no slot is currently in use
		if (LIKELY(!m_cvx32))
			return;

		imp_notify();
	}
};
New shared_mutex Experimental sync utils New semaphore<> New cond_variable New owned_mutex 2017-01-24 21:19:52 +01:00			`#pragma once`

			`#include "types.h"`
Implement waitable atomics Moved Atomic.h to util/atomic.hpp List source files in CMakeLists.txt 2019-07-27 00:34:10 +02:00			`#include "util/atomic.hpp"`
Add cond_variable::wait_unlock 2018-10-02 16:50:22 +02:00			`#include <shared_mutex>`
Implement class cond_x16 Use as reservation notifier Limited to 16 threads but allows more precise control of contention 2018-11-25 17:43:02 +01:00			`#include "asm.h"`
New shared_mutex Experimental sync utils New semaphore<> New cond_variable New owned_mutex 2017-01-24 21:19:52 +01:00
			`// Lightweight condition variable`
			`class cond_variable`
			`{`
			`// Internal waiter counter`
			`atomic_t<u32> m_value{0};`

Rewrite `cond_variable` to use waitable atomics Increase max_timeout and fix max_timeout usage 2019-09-09 10:09:30 +02:00			`enum : u32`
			`{`
			`c_waiter_mask = 0x1fff,`
			`c_signal_mask = 0xffffffff & ~c_waiter_mask,`
			`};`

New shared_mutex Experimental sync utils New semaphore<> New cond_variable New owned_mutex 2017-01-24 21:19:52 +01:00			`protected:`
Rewrite `cond_variable` to use waitable atomics Increase max_timeout and fix max_timeout usage 2019-09-09 10:09:30 +02:00			`// Increment waiter count`
			`u32 add_waiter() noexcept`
			`{`
			`return m_value.atomic_op([](u32& value) -> u32`
			`{`
			`if ((value & c_signal_mask) == c_signal_mask \|\| (value & c_waiter_mask) == c_waiter_mask)`
			`{`
			`// Signal or waiter overflow, return immediately`
			`return 0;`
			`}`

			`value += c_waiter_mask & -c_waiter_mask;`
			`return value;`
			`});`
			`}`

New shared_mutex Experimental sync utils New semaphore<> New cond_variable New owned_mutex 2017-01-24 21:19:52 +01:00			`// Internal waiting function`
Rewrite `cond_variable` to use waitable atomics Increase max_timeout and fix max_timeout usage 2019-09-09 10:09:30 +02:00			`void imp_wait(u32 _old, u64 _timeout) noexcept;`
New shared_mutex Experimental sync utils New semaphore<> New cond_variable New owned_mutex 2017-01-24 21:19:52 +01:00
			`// Try to notify up to _count threads`
			`void imp_wake(u32 _count) noexcept;`

			`public:`
			`constexpr cond_variable() = default;`

			`// Intrusive wait algorithm for lockable objects`
Thread.cpp refinement Hide thread mutex Safe notify() method Other refactoring 2016-09-07 00:38:52 +02:00			`template <typename T>`
Rewrite `cond_variable` to use waitable atomics Increase max_timeout and fix max_timeout usage 2019-09-09 10:09:30 +02:00			`void wait(T& object, u64 usec_timeout = -1) noexcept`
New shared_mutex Experimental sync utils New semaphore<> New cond_variable New owned_mutex 2017-01-24 21:19:52 +01:00			`{`
Rewrite `cond_variable` to use waitable atomics Increase max_timeout and fix max_timeout usage 2019-09-09 10:09:30 +02:00			`const u32 _old = add_waiter();`

			`if (!_old)`
			`{`
			`return;`
			`}`

Thread.cpp refinement Hide thread mutex Safe notify() method Other refactoring 2016-09-07 00:38:52 +02:00			`object.unlock();`
Rewrite `cond_variable` to use waitable atomics Increase max_timeout and fix max_timeout usage 2019-09-09 10:09:30 +02:00			`imp_wait(_old, usec_timeout);`
Thread.cpp refinement Hide thread mutex Safe notify() method Other refactoring 2016-09-07 00:38:52 +02:00			`object.lock();`
New shared_mutex Experimental sync utils New semaphore<> New cond_variable New owned_mutex 2017-01-24 21:19:52 +01:00			`}`

Add cond_variable::wait_unlock 2018-10-02 16:50:22 +02:00			`// Unlock all specified objects but don't lock them again`
			`template <typename... Locks>`
Rewrite `cond_variable` to use waitable atomics Increase max_timeout and fix max_timeout usage 2019-09-09 10:09:30 +02:00			`void wait_unlock(u64 usec_timeout, Locks&&... locks)`
Add cond_variable::wait_unlock 2018-10-02 16:50:22 +02:00			`{`
Rewrite `cond_variable` to use waitable atomics Increase max_timeout and fix max_timeout usage 2019-09-09 10:09:30 +02:00			`const u32 _old = add_waiter();`
Add cond_variable::wait_unlock 2018-10-02 16:50:22 +02:00			`(..., std::forward<Locks>(locks).unlock());`
Rewrite `cond_variable` to use waitable atomics Increase max_timeout and fix max_timeout usage 2019-09-09 10:09:30 +02:00
			`if (!_old)`
			`{`
			`return;`
			`}`

			`imp_wait(_old, usec_timeout);`
Add cond_variable::wait_unlock 2018-10-02 16:50:22 +02:00			`}`

New shared_mutex Experimental sync utils New semaphore<> New cond_variable New owned_mutex 2017-01-24 21:19:52 +01:00			`// Wake one thread`
			`void notify_one() noexcept`
			`{`
			`if (m_value)`
			`{`
			`imp_wake(1);`
			`}`
			`}`

			`// Wake all threads`
			`void notify_all() noexcept`
			`{`
			`if (m_value)`
			`{`
Rewrite `cond_variable` to use waitable atomics Increase max_timeout and fix max_timeout usage 2019-09-09 10:09:30 +02:00			`imp_wake(-1);`
New shared_mutex Experimental sync utils New semaphore<> New cond_variable New owned_mutex 2017-01-24 21:19:52 +01:00			`}`
			`}`
Fix cond_variable timeout Thanks @Farseer2 for debugging 2017-11-17 20:20:46 +01:00
Rewrite `cond_variable` to use waitable atomics Increase max_timeout and fix max_timeout usage 2019-09-09 10:09:30 +02:00			`static constexpr u64 max_timeout = UINT64_MAX / 1000;`
New shared_mutex Experimental sync utils New semaphore<> New cond_variable New owned_mutex 2017-01-24 21:19:52 +01:00			`};`
Revert "Remove `shared_cond` and simplify reservation waiting" This reverts commit 0a96497e135bc6564bdc686407f75706fe62c92e. 2019-09-13 22:54:43 +02:00
			`// Condition variable fused with a pseudo-mutex supporting only reader locks (up to 32 readers).`
			`class shared_cond`
			`{`
			`// For information, shouldn't modify`
			`enum : u64`
			`{`
			`// Wait bit is aligned for compatibility with 32-bit futex.`
			`c_wait = 1,`
			`c_sig = 1ull << 32,`
			`c_lock = 1ull << 32 \| 1,`
			`};`

			`// Split in 32-bit parts for convenient bit combining`
			`atomic_t<u64> m_cvx32{0};`

			`class shared_lock`
			`{`
			`shared_cond* m_this;`
			`u32 m_slot;`

			`friend class shared_cond;`

			`public:`
			`shared_lock(shared_cond* _this) noexcept`
			`: m_this(_this)`
			`{`
			`// Lock and remember obtained slot index`
			`m_slot = m_this->m_cvx32.atomic_op([](u64& cvx32)`
			`{`
			`// Combine used bits and invert to find least significant bit unused`
			`const u32 slot = static_cast<u32>(utils::cnttz64(~((cvx32 & 0xffffffff) \| (cvx32 >> 32)), true));`

			`// Set lock bits (does nothing if all slots are used)`
			`const u64 bit = (1ull << slot) & 0xffffffff;`
			`cvx32 \|= bit \| (bit << 32);`
			`return slot;`
			`});`
			`}`

			`shared_lock(const shared_lock&) = delete;`

			`shared_lock(shared_lock&& rhs)`
			`: m_this(rhs.m_this)`
			`, m_slot(rhs.m_slot)`
			`{`
			`rhs.m_slot = 32;`
			`}`

			`shared_lock& operator=(const shared_lock&) = delete;`

			`~shared_lock()`
			`{`
			`// Clear the slot (does nothing if all slots are used)`
			`const u64 bit = (1ull << m_slot) & 0xffffffff;`
			`m_this->m_cvx32 &= ~(bit \| (bit << 32));`
			`}`

			`explicit operator bool() const noexcept`
			`{`
			`// Check success`
			`return m_slot < 32;`
			`}`

			`bool wait(u64 usec_timeout = -1) const noexcept`
			`{`
			`return m_this->wait(*this, usec_timeout);`
			`}`
			`};`

			`bool imp_wait(u32 slot, u64 _timeout) noexcept;`
			`void imp_notify() noexcept;`

			`public:`
			`constexpr shared_cond() = default;`

			`shared_lock try_shared_lock() noexcept`
			`{`
			`return shared_lock(this);`
			`}`

			`bool wait(shared_lock const& lock, u64 usec_timeout = -1) noexcept`
			`{`
			`AUDIT(lock.m_this == this);`
			`return imp_wait(lock.m_slot, usec_timeout);`
			`}`

			`void notify_all() noexcept`
			`{`
			`if (LIKELY(!m_cvx32))`
			`return;`

			`imp_notify();`
			`}`
			`};`