#pragma once #include "vm.h" class cpu_thread; class shared_mutex; namespace vm { extern shared_mutex g_mutex; extern thread_local atomic_t* g_tls_locked; enum range_lock_flags : u64 { /* flags (3 bits) */ range_readable = 1ull << 32, range_writable = 2ull << 32, range_executable = 4ull << 32, range_full_mask = 7ull << 32, /* flag combinations with special meaning */ range_normal = 3ull << 32, // R+W, testing as mask for zero can check no access range_locked = 2ull << 32, // R+W as well, the only range flag that should block by address range_allocation = 0, // Allocation, no safe access, g_shareable may change at ANY location }; extern atomic_t g_range_lock; extern atomic_t g_shareable[]; // Register reader void passive_lock(cpu_thread& cpu); // Register range lock for further use atomic_t* alloc_range_lock(); void range_lock_internal(atomic_t* range_lock, u32 begin, u32 size); // Lock memory range FORCE_INLINE void range_lock(atomic_t* range_lock, u32 begin, u32 size) { const u64 lock_val = g_range_lock.load(); #ifndef _MSC_VER __asm__(""); // Tiny barrier #endif const u64 is_shared = g_shareable[begin >> 16].load(); const u64 lock_addr = static_cast(lock_val); // -> u64 const u32 lock_size = static_cast(lock_val >> 35); u64 addr = begin; // Optimization: if range_locked is not used, the addr check will always pass // Otherwise, g_shareable is unchanged and its value is reliable to read if (is_shared) { addr = addr & 0xffff; } if (addr + size <= lock_addr || addr >= lock_addr + lock_size || ((lock_val >> 32) ^ (range_locked >> 32)) & (range_full_mask >> 32)) [[likely]] { // Optimistic locking. // Note that we store the range we will be accessing, without any clamping. range_lock->store(begin | (u64{size} << 32)); const u64 new_lock_val = g_range_lock.load(); if (!new_lock_val || new_lock_val == lock_val) [[likely]] { return; } range_lock->store(0); } // Fallback to slow path range_lock_internal(range_lock, begin, size); } // Release it void free_range_lock(atomic_t*) noexcept; // Unregister reader void passive_unlock(cpu_thread& cpu); // Unregister reader (foreign thread) void cleanup_unlock(cpu_thread& cpu) noexcept; // Optimization (set cpu_flag::memory) void temporary_unlock(cpu_thread& cpu) noexcept; void temporary_unlock() noexcept; class reader_lock final { bool m_upgraded = false; public: reader_lock(const reader_lock&) = delete; reader_lock& operator=(const reader_lock&) = delete; reader_lock(); ~reader_lock(); void upgrade(); }; struct writer_lock final { writer_lock(const writer_lock&) = delete; writer_lock& operator=(const writer_lock&) = delete; writer_lock(u32 addr = 0); ~writer_lock(); }; } // namespace vm