From 59a0f810b92f578ea209007f262271a06247365a Mon Sep 17 00:00:00 2001 From: Nekotekina Date: Thu, 30 Jan 2020 03:04:44 +0300 Subject: [PATCH] Implement fat atomics Atomics with embedded mutex bit. --- rpcs3/util/atomic.hpp | 356 ++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 356 insertions(+) diff --git a/rpcs3/util/atomic.hpp b/rpcs3/util/atomic.hpp index 47e38eab95..8aa30ef81c 100644 --- a/rpcs3/util/atomic.hpp +++ b/rpcs3/util/atomic.hpp @@ -2,6 +2,7 @@ #include "Utilities/types.h" #include +#include #ifdef _MSC_VER #include @@ -1150,3 +1151,358 @@ public: atomic_storage_futex::notify_all(&m_data); } }; + +template +class atomic_with_lock_bit +{ + // Simply internal type + using type = std::conditional_t, std::uintptr_t, T>; + + // Check space for lock bit + static_assert(BitWidth < sizeof(T) * 8, "No space for lock bit"); + static_assert(sizeof(T) <= 8, "Not supported"); + static_assert(std::is_pointer_v == (BitWidth == 0), "BitWidth should be 0 for pointers"); + static_assert(!std::is_pointer_v || (alignof(std::remove_pointer_t) > 1), "Pointer type should have align 2 or more"); + + // Use the most significant bit as a mutex + atomic_t m_data; + +public: + using base_type = T; + + static bool is_locked(type old_val) + { + if constexpr (std::is_signed_v && BitWidth == sizeof(T) * 8 - 1) + { + return old_val < 0; + } + else if constexpr (std::is_pointer_v) + { + return (old_val & 1) != 0; + } + else + { + return (old_val & (type{1} << BitWidth)) != 0; + } + } + + static type clamp_value(type old_val) + { + if constexpr (std::is_signed_v) + { + return static_cast(static_cast>(old_val) << (sizeof(T) * 8 - BitWidth)) >> (sizeof(T) * 8 - BitWidth); + } + else if constexpr (std::is_pointer_v) + { + return old_val & 0xffff'ffff'ffff'fffeull; + } + else + { + return old_val & static_cast(0xffff'ffff'ffff'ffffull >> (64 - BitWidth)); + } + } + + // Define simple type + using simple_type = simple_t; + + atomic_with_lock_bit() noexcept = default; + + atomic_with_lock_bit(const atomic_with_lock_bit&) = delete; + + atomic_with_lock_bit& operator =(const atomic_with_lock_bit&) = delete; + + constexpr atomic_with_lock_bit(T value) noexcept + : m_data(clamp_value(reinterpret_cast(value))) + { + } + + // Unsafe read + type raw_load() const + { + return clamp_value(m_data.load()); + } + + // Unsafe write and unlock + void raw_release(type value) + { + m_data.release(clamp_value(value)); + m_data.notify_all(); + } + + void lock() + { + while (UNLIKELY(m_data.bts(BitWidth))) + { + type old_val = m_data.load(); + + if (is_locked(old_val)) + { + m_data.wait(old_val); + old_val = m_data.load(); + } + } + } + + bool try_lock() + { + return !m_data.bts(BitWidth); + } + + void unlock() + { + m_data.btr(BitWidth); + m_data.notify_all(); + } + + T load() + { + type old_val = m_data.load(); + + while (UNLIKELY(is_locked(old_val))) + { + m_data.wait(old_val); + old_val = m_data.load(); + } + + return reinterpret_cast(clamp_value(old_val)); + } + + void store(T value) + { + type old_val = m_data.load(); + + while (UNLIKELY(is_locked(old_val) || !m_data.compare_and_swap_test(old_val, clamp_value(reinterpret_cast(value))))) + { + m_data.wait(old_val); + old_val = m_data.load(); + } + } + + template > + RT atomic_op(F func) + { + type _new, old; + old.m_data = m_data.load(); + + while (true) + { + if (UNLIKELY(is_locked(old.m_data))) + { + m_data.wait(old.m_data); + old.m_data = m_data.load(); + continue; + } + + _new = old; + + if constexpr (std::is_void_v) + { + std::invoke(func, reinterpret_cast(_new)); + + if (LIKELY(atomic_storage::compare_exchange(m_data, old.m_data, clamp_value(_new.m_data)))) + { + return; + } + } + else + { + RT result = std::invoke(func, reinterpret_cast(_new)); + + if (LIKELY(atomic_storage::compare_exchange(m_data, old.m_data, clamp_value(_new.m_data)))) + { + return result; + } + } + } + } + + type fetch_add(const type& rhs) + { + return atomic_op([&](T& v) + { + return std::exchange(v, v += rhs); + }); + } + + auto operator +=(const type& rhs) + { + return atomic_op([&](T& v) + { + return v += rhs; + }); + } + + type fetch_sub(const type& rhs) + { + return atomic_op([&](T& v) + { + return std::exchange(v, v -= rhs); + }); + } + + auto operator -=(const type& rhs) + { + return atomic_op([&](T& v) + { + return v -= rhs; + }); + } + + type fetch_and(const type& rhs) + { + return atomic_op([&](T& v) + { + return std::exchange(v, v &= rhs); + }); + } + + auto operator &=(const type& rhs) + { + return atomic_op([&](T& v) + { + return v &= rhs; + }); + } + + type fetch_or(const type& rhs) + { + return atomic_op([&](T& v) + { + return std::exchange(v, v |= rhs); + }); + } + + auto operator |=(const type& rhs) + { + return atomic_op([&](T& v) + { + return v |= rhs; + }); + } + + type fetch_xor(const type& rhs) + { + return atomic_op([&](T& v) + { + return std::exchange(v, v ^= rhs); + }); + } + + auto operator ^=(const type& rhs) + { + return atomic_op([&](T& v) + { + return v ^= rhs; + }); + } + + auto operator ++() + { + return atomic_op([](T& v) + { + return ++v; + }); + } + + auto operator --() + { + return atomic_op([](T& v) + { + return --v; + }); + } + + auto operator ++(int) + { + return atomic_op([](T& v) + { + return v++; + }); + } + + auto operator --(int) + { + return atomic_op([](T& v) + { + return v--; + }); + } +}; + +using fat_atomic_u1 = atomic_with_lock_bit; +using fat_atomic_u7 = atomic_with_lock_bit; +using fat_atomic_s7 = atomic_with_lock_bit; +using fat_atomic_u8 = atomic_with_lock_bit; +using fat_atomic_s8 = atomic_with_lock_bit; + +using fat_atomic_u15 = atomic_with_lock_bit; +using fat_atomic_s15 = atomic_with_lock_bit; +using fat_atomic_u16 = atomic_with_lock_bit; +using fat_atomic_s16 = atomic_with_lock_bit; + +using fat_atomic_u31 = atomic_with_lock_bit; +using fat_atomic_s31 = atomic_with_lock_bit; +using fat_atomic_u32 = atomic_with_lock_bit; +using fat_atomic_s32 = atomic_with_lock_bit; +using fat_atomic_u63 = atomic_with_lock_bit; +using fat_atomic_s63 = atomic_with_lock_bit; + +template +using fat_atomic_ptr = atomic_with_lock_bit; + +namespace detail +{ + template + struct mao_func_t + { + template + using RT = typename mao_func_t::template RT; + }; + + template + struct mao_func_t + { + template + using RT = std::invoke_result_t&...>; + }; + + template + using mao_result = typename mao_func_t...>::template RT<>; + + template + RT multi_atomic_op(std::index_sequence, Args&&... args) + { + // Tie all arguments (function is the latest) + auto vars = std::tie(args...); + + // Lock all variables + std::lock(std::get(vars)...); + + // Load initial values + auto values = std::make_tuple(std::get(vars).raw_load()...); + + if constexpr (std::is_void_v) + { + std::invoke(std::get<(sizeof...(Args) - 1)>(vars), reinterpret_cast(vars))>::base_type&>(std::get(values))...); + + // Unlock and return + (std::get(vars).raw_release(std::get(values)), ...); + } + else + { + RT result = std::invoke(std::get<(sizeof...(Args) - 1)>(vars), reinterpret_cast(vars))>::base_type&>(std::get(values))...); + + // Unlock and return the result + (std::get(vars).raw_release(std::get(values)), ...); + + return result; + } + } +} + +// Atomic operation; returns function result value, function is the lambda +template > +RT multi_atomic_op(Args&&... args) +{ + return detail::multi_atomic_op(std::make_index_sequence<(sizeof...(Args) - 1)>(), std::forward(args)...); +}