src/memory.cpp - GCC Code Coverage Report

Directory:	./
Coverage:	low: ≥ 0% medium: ≥ 75.0% high: ≥ 90.0%
	Coverage	Exec / Excl / Total
Lines:	79.7%	459 / 0 / 576
Functions:	97.7%	42 / 0 / 43
Branches:	54.3%	266 / 0 / 490
    src/memory.cpp
    
        Line
        Branch
        Exec
        Source
      
        /**
      
         * @file memory.cpp
      
         * @brief Implementation of memory manipulation and validation utilities.
      
         *
      
         * Provides functions for checking memory readability and writability, writing bytes to memory,
      
         * and managing a memory region cache for performance optimization.
      
         * The cache uses sharded locks with SRWLOCK for high-concurrency read-heavy access.
      
         * Uses monotonic counter-keyed map for O(log n) LRU eviction instead of O(n) scan.
      
         * In-flight query coalescing prevents cache stampede under high concurrency.
      
         * On-demand cleanup handles expired entry removal to avoid polluting the miss path.
      
         * Epoch-based reader tracking prevents use-after-free during shutdown.
      
         */
      
        #include "DetourModKit/memory.hpp"
      
        #include "DetourModKit/format.hpp"
      
        #include "DetourModKit/logger.hpp"
      
        #include "platform.hpp"
      
        #include <windows.h>
      
        #include <shared_mutex>
      
        #include <unordered_map>
      
        #include <map>
      
        #include <vector>
      
        #include <chrono>
      
        #include <atomic>
      
        #include <cstdlib>
      
        #include <sstream>
      
        #include <iomanip>
      
        #include <algorithm>
      
        #include <stdexcept>
      
        #include <cstddef>
      
        #include <thread>
      
        #include <condition_variable>
      
        using namespace DetourModKit;
      
        // Page-protection masks shared by the read/write permission checks in this file.
        namespace CachePermissions
        {
            // A page is considered readable when any of these protection bits is present.
            constexpr DWORD READ_PERMISSION_FLAGS =
                PAGE_READONLY |
                PAGE_READWRITE |
                PAGE_WRITECOPY |
                PAGE_EXECUTE_READ |
                PAGE_EXECUTE_READWRITE |
                PAGE_EXECUTE_WRITECOPY;

            // A page is considered writable when any of these protection bits is present.
            constexpr DWORD WRITE_PERMISSION_FLAGS =
                PAGE_READWRITE |
                PAGE_WRITECOPY |
                PAGE_EXECUTE_READWRITE |
                PAGE_EXECUTE_WRITECOPY;

            // Bits that veto access regardless of the read/write bits above.
            constexpr DWORD NOACCESS_GUARD_FLAGS =
                PAGE_NOACCESS |
                PAGE_GUARD;
        }
      
        using DetourModKit::detail::is_loader_lock_held;
      
        using DetourModKit::detail::pin_current_module;
      
        // Anonymous namespace for internal helpers and storage
      
        namespace
      
        {
      
            /**
      
             * @class SrwSharedMutex
      
             * @brief Shared mutex backed by Windows SRWLOCK instead of pthread_rwlock_t.
      
             * @details MinGW/winpthreads' pthread_rwlock_t corrupts internal state under
      
             *          high reader contention, causing assertion failures in lock_shared().
      
             *          SRWLOCK is kernel-level, lock-free for uncontended cases, and does
      
             *          not suffer from this bug.
      
             */
      
            class SrwSharedMutex
      
            {
      
            public:
      
        2744
                SrwSharedMutex() noexcept { InitializeSRWLock(&srw_); }
      
                SrwSharedMutex(const SrwSharedMutex &) = delete;
      
                SrwSharedMutex &operator=(const SrwSharedMutex &) = delete;
      
        3279
                void lock() noexcept { AcquireSRWLockExclusive(&srw_); }
      
        51
                bool try_lock() noexcept { return TryAcquireSRWLockExclusive(&srw_) != 0; }
      
        3330
                void unlock() noexcept { ReleaseSRWLockExclusive(&srw_); }
      
        93678
                void lock_shared() noexcept { AcquireSRWLockShared(&srw_); }
      
        21
                bool try_lock_shared() noexcept { return TryAcquireSRWLockShared(&srw_) != 0; }
      
        102163
                void unlock_shared() noexcept { ReleaseSRWLockShared(&srw_); }
      
            private:
      
                SRWLOCK srw_;
      
            };
      
            /**
             * @struct CachedMemoryRegionInfo
             * @brief One cached memory-region record.
             * @details A default-constructed record is zeroed and flagged invalid; the
             *          fields are filled in when a queried region is stored in a shard.
             */
            struct CachedMemoryRegionInfo
            {
                uintptr_t baseAddress = 0;  // Region base address (also the key in the shard's entry map)
                size_t regionSize = 0;      // Region length in bytes
                DWORD protection = 0;       // Page-protection bits recorded for the region
                DWORD state = 0;            // Region state value recorded for the region
                uint64_t timestamp_ns = 0;  // Time the record was last refreshed, in nanoseconds
                uint64_t lru_key = 0;       // Key of this record inside the shard's LRU index
                bool valid = false;         // False until the record holds real data

                // All members are set by their default initializers above.
                CachedMemoryRegionInfo()
                {
                }
            };
      
            /**
      
             * @struct CacheShard
      
             * @brief Individual cache shard with O(1) address lookup and O(log n) LRU eviction.
      
             * @details Uses unordered_map keyed by region base address for fast lookup.
      
             *          std::map keyed by monotonic counter for efficient oldest-entry eviction.
      
             *          SrwSharedMutex allows multiple concurrent readers.
      
             *          in_flight flag prevents cache stampede by coalescing concurrent VirtualQuery calls.
      
             *          Mutex is stored separately to allow vector resize operations.
      
             */
      
            struct CacheShard
      
            {
      
                // Map from baseAddress -> CachedMemoryRegionInfo for O(1) lookup by address
      
                std::unordered_map<uintptr_t, CachedMemoryRegionInfo> entries;
      
                // Map from monotonic counter -> baseAddress for O(log n) oldest-entry lookup (LRU)
      
                // Monotonic counter guarantees insertion-order uniqueness for correct eviction
      
                std::map<uint64_t, uintptr_t> lru_index;
      
                // Sorted by base address for O(log n) containment lookup
      
                std::vector<std::pair<uintptr_t, uintptr_t>> sorted_ranges; // {base, base+size}
      
                uint64_t entry_counter{0};
      
                size_t capacity;
      
                size_t max_capacity;
      
        2744
                CacheShard() : capacity(0), max_capacity(0)
      
                {
      
          1/2✓ Branch 5 → 6 taken 2744 times.
✗ Branch 5 → 8 not taken.

        2744
                    entries.reserve(64);
      
          1/2✓ Branch 6 → 7 taken 2744 times.
✗ Branch 6 → 8 not taken.

        2744
                    sorted_ranges.reserve(64);
      
        2744
                }
      
            };
      
            /**
             * @brief Samples std::chrono::steady_clock and returns the reading in nanoseconds.
             * @return Nanoseconds elapsed since the steady clock's epoch.
             */
            inline uint64_t current_time_ns() noexcept
            {
                using std::chrono::duration_cast;
                using std::chrono::nanoseconds;
                using std::chrono::steady_clock;

                const auto since_epoch = steady_clock::now().time_since_epoch();
                return duration_cast<nanoseconds>(since_epoch).count();
            }
      
            /**
             * @brief Maps an address to the index of the shard responsible for it.
             * @param address The address to hash.
             * @param shard_count Total number of shards; must be non-zero.
             * @return An index in the range [0, shard_count).
             * @note The address is multiplied by the 64-bit golden-ratio constant and
             *       only the bits above bit 47 of the product are kept, so neighbouring
             *       addresses are spread across shards.
             */
            constexpr inline size_t compute_shard_index(uintptr_t address, size_t shard_count) noexcept
            {
                constexpr unsigned long long kGoldenRatio64 = 0x9E3779B97F4A7C15ULL;
                constexpr unsigned kDiscardedLowBits = 48;

                const auto mixed = address * kGoldenRatio64;
                const auto bucket_hash = static_cast<size_t>(mixed >> kDiscardedLowBits);
                return bucket_hash % shard_count;
            }
      
        }
      
        // Internal static variables and helper functions for memory cache.
      
        // Anonymous namespace ensures internal linkage, preventing ODR violations
      
        // if this translation unit's declarations were ever duplicated.
      
        namespace
      
        {
      
            // Cache partitions; an address is routed to one of them by hashing.
            std::vector<CacheShard> s_cacheShards;
      
            // Per-shard locks: s_shardMutexes[i] guards s_cacheShards[i].
            std::vector<std::unique_ptr<SrwSharedMutex>> s_shardMutexes;
      
            // NOTE(review): presumably one in-flight flag per shard used for query
            // coalescing (see file header); its use is not visible in this section.
            std::unique_ptr<std::atomic<char>[]> s_inFlight;
      
            // Number of shards currently configured; 0 is treated as "no cache" by cleanup.
            std::atomic<size_t> s_shardCount{0};
      
            // NOTE(review): presumably the configured per-shard entry limit - confirm at the init site.
            std::atomic<size_t> s_maxEntriesPerShard{0};
      
            // Entry lifetime in milliseconds; converted to nanoseconds before being compared with entry ages.
            std::atomic<unsigned int> s_configuredExpiryMs{0};
      
            // NOTE(review): presumably set once the cache has been initialized - confirm at the init site.
            std::atomic<bool> s_cacheInitialized{false};
      
            // Global cache state mutex to serialize init/clear/shutdown transitions
      
            // Protects against concurrent state changes that could leave vectors in invalid state
      
            std::mutex s_cacheStateMutex;
      
            // Epoch-based reader tracking to prevent use-after-free during shutdown.
      
            // Readers increment on entry to is_readable/is_writable and decrement on exit.
      
            // shutdown_cache waits for this to reach zero before destroying data structures.
      
            std::atomic<int32_t> s_activeReaders{0};
      
            /**
      
             * @class ActiveReaderGuard
      
             * @brief RAII guard that increments s_activeReaders on construction and
      
             *        decrements on destruction, ensuring correct pairing on all exit paths.
      
             */
      
            class ActiveReaderGuard
      
            {
      
            public:
      
        101138
                ActiveReaderGuard() noexcept
      
                {
      
                    s_activeReaders.fetch_add(1, std::memory_order_acq_rel);
      
        101138
                }
      
        107617
                ~ActiveReaderGuard() noexcept
      
                {
      
                    s_activeReaders.fetch_sub(1, std::memory_order_release);
      
        107617
                }
      
                ActiveReaderGuard(const ActiveReaderGuard &) = delete;
      
                ActiveReaderGuard &operator=(const ActiveReaderGuard &) = delete;
      
            };
      
            // Background cleanup thread.
      
            // Uses std::thread (not jthread) because these are namespace-scope statics:
      
            // jthread's auto-join destructor would run after s_cleanupCv/s_cleanupMutex
      
            // are destroyed (reverse declaration order), causing UB. Manual join in
      
            // shutdown_cache() avoids this. DMK_Shutdown() calls shutdown_cache()
      
            // which joins this thread before any other cleanup proceeds, ensuring
      
            // the thread is fully stopped before static destruction begins.
      
            // NOTE(review): presumably true while the background thread should keep running - confirm at the start/stop sites.
            std::atomic<bool> s_cleanupThreadRunning{false};
      
            // Handle of the background cleanup thread (joined manually, see above).
            std::thread s_cleanupThread;
      
            // Mutex paired with s_cleanupCv.
            std::mutex s_cleanupMutex;
      
            // NOTE(review): presumably used to wake the cleanup thread - confirm at the wait/notify sites.
            std::condition_variable s_cleanupCv;
      
            // NOTE(review): presumably a "cleanup wanted" flag consumed by the cleanup thread - confirm.
            std::atomic<bool> s_cleanupRequested{false};
      
            // On-demand cleanup fallback timer (used when background thread is disabled)
      
            std::atomic<uint64_t> s_lastCleanupTimeNs{0};
      
            constexpr uint64_t CLEANUP_INTERVAL_NS = 1'000'000'000ULL; // 1 second in nanoseconds
      
            // Always-available cache statistics
            // Every counter is an independent 64-bit atomic starting at zero. The
            // code that increments them is outside this section, so the per-counter
            // notes below are inferred from the names - TODO confirm at the call sites.
      
            struct CacheStats
      
            {
      
                // Presumably: lookups answered from the cache.
                std::atomic<uint64_t> cacheHits{0};
      
                // Presumably: lookups that had to query the OS.
                std::atomic<uint64_t> cacheMisses{0};
      
                // Presumably: explicit invalidations of cached data.
                std::atomic<uint64_t> invalidations{0};
      
                // Presumably: lookups that waited on another thread's in-flight query.
                std::atomic<uint64_t> coalescedQueries{0};
      
                // Presumably: cleanup passes triggered from the on-demand timer.
                std::atomic<uint64_t> onDemandCleanups{0};
      
            };
      
            // The single statistics instance for this translation unit.
            CacheStats s_stats;
      
            /**
      
             * @brief Checks if a cache entry covers the requested address range and is valid.
      
             * @param entry The cache entry to check.
      
             * @param address Start address of the query.
      
             * @param size Size of the query range.
      
             * @param current_time_ns Current timestamp in nanoseconds.
      
             * @param expiry_ns Expiry time in nanoseconds.
      
             * @return true if the entry is valid and covers the range.
      
             */
      
        100662
            constexpr inline bool is_entry_valid_and_covers(const CachedMemoryRegionInfo &entry,
      
                                                            uintptr_t address,
      
                                                            size_t size,
      
                                                            uint64_t current_time_ns,
      
                                                            uint64_t expiry_ns) noexcept
      
            {
      
          1/2✗ Branch 2 → 3 not taken.
✓ Branch 2 → 4 taken 100662 times.

        100662
                if (!entry.valid)
      
        ✗
                    return false;
      
        100662
                const uint64_t entry_age = current_time_ns - entry.timestamp_ns;
      
          2/2✓ Branch 4 → 5 taken 4 times.
✓ Branch 4 → 6 taken 100658 times.

        100662
                if (entry_age > expiry_ns)
      
        4
                    return false;
      
        100658
                const uintptr_t endAddress = address + size;
      
          2/2✓ Branch 6 → 7 taken 4 times.
✓ Branch 6 → 8 taken 100654 times.

        100658
                if (endAddress < address)
      
        4
                    return false;
      
        100654
                const uintptr_t entryEndAddress = entry.baseAddress + entry.regionSize;
      
          1/2✗ Branch 8 → 9 not taken.
✓ Branch 8 → 10 taken 100654 times.

        100654
                if (entryEndAddress < entry.baseAddress)
      
        ✗
                    return false;
      
          2/4✓ Branch 10 → 11 taken 102975 times.
✗ Branch 10 → 13 not taken.
✓ Branch 11 → 12 taken 103665 times.
✗ Branch 11 → 13 not taken.

        100654
                return address >= entry.baseAddress && endAddress <= entryEndAddress;
      
            }
      
            /**
      
             * @brief Checks protection flags for read permission.
      
             */
      
        100860
            constexpr inline bool check_read_permission(DWORD protection) noexcept
      
            {
      
          1/2✓ Branch 2 → 3 taken 101840 times.
✗ Branch 2 → 5 not taken.

        202700
                return (protection & CachePermissions::READ_PERMISSION_FLAGS) != 0 &&
      
          1/2✓ Branch 3 → 4 taken 102147 times.
✗ Branch 3 → 5 not taken.

        202700
                       (protection & CachePermissions::NOACCESS_GUARD_FLAGS) == 0;
      
            }
      
            /**
      
             * @brief Checks protection flags for write permission.
      
             */
      
        3786
            constexpr inline bool check_write_permission(DWORD protection) noexcept
      
            {
      
          1/2✓ Branch 2 → 3 taken 3802 times.
✗ Branch 2 → 5 not taken.

        7588
                return (protection & CachePermissions::WRITE_PERMISSION_FLAGS) != 0 &&
      
          2/2✓ Branch 3 → 4 taken 3777 times.
✓ Branch 3 → 5 taken 25 times.

        7588
                       (protection & CachePermissions::NOACCESS_GUARD_FLAGS) == 0;
      
            }
      
            /**
      
             * @brief Inserts a range into the shard's sorted auxiliary vector.
      
             * @note Must be called with shard mutex held (exclusive).
      
             */
      
        139
            void insert_sorted_range(CacheShard &shard, uintptr_t base_addr, size_t region_size) noexcept
      
            {
      
        139
                auto range = std::make_pair(base_addr, base_addr + region_size);
      
        139
                auto pos = std::lower_bound(shard.sorted_ranges.begin(),
      
                                             shard.sorted_ranges.end(), range);
      
        278
                shard.sorted_ranges.insert(pos, range);
      
        139
            }
      
            /**
      
             * @brief Removes a range from the shard's sorted auxiliary vector.
      
             * @note Must be called with shard mutex held (exclusive).
      
             */
      
        14
            void remove_sorted_range(CacheShard &shard, uintptr_t base_addr) noexcept
      
            {
      
        14
                auto it = std::lower_bound(shard.sorted_ranges.begin(),
      
                                            shard.sorted_ranges.end(),
      
        14
                                            std::make_pair(base_addr, uintptr_t{0}));
      
          3/6✓ Branch 13 → 14 taken 14 times.
✗ Branch 13 → 18 not taken.
✓ Branch 16 → 17 taken 14 times.
✗ Branch 16 → 18 not taken.
✓ Branch 19 → 20 taken 14 times.
✗ Branch 19 → 25 not taken.

        42
                if (it != shard.sorted_ranges.end() && it->first == base_addr)
      
        28
                    shard.sorted_ranges.erase(it);
      
        14
            }
      
            /**
      
             * @brief Finds and validates a cache entry in a shard by scanning for range containment.
      
             * @param shard The cache shard to search.
      
             * @param address Address to look up.
      
             * @param size Size of the query range.
      
             * @param current_time_ns Current timestamp in nanoseconds.
      
             * @param expiry_ns Expiry time in nanoseconds.
      
             * @return Pointer to the matching entry, or nullptr if not found or expired.
      
             * @note Must be called with shard mutex held (shared or exclusive).
      
             * @note First attempts direct lookup by page-aligned base address for O(1) fast path,
      
             *       then falls back to O(log n) binary search via sorted_ranges for addresses
      
             *       within larger regions.
      
             */
      
        107515
            CachedMemoryRegionInfo *find_in_shard(CacheShard &shard,
      
                                                  uintptr_t address,
      
                                                  size_t size,
      
                                                  uint64_t current_time_ns,
      
                                                  uint64_t expiry_ns) noexcept
      
            {
      
                // Fast path: direct lookup by page-aligned base address
      
        107515
                const uintptr_t base_addr = address & ~static_cast<uintptr_t>(0xFFF);
      
        107515
                auto it = shard.entries.find(base_addr);
      
          1/2✓ Branch 5 → 6 taken 103592 times.
✗ Branch 5 → 10 not taken.

        101532
                if (it != shard.entries.end())
      
                {
      
        103592
                    CachedMemoryRegionInfo &entry = it->second;
      
          1/2✓ Branch 8 → 9 taken 102628 times.
✗ Branch 8 → 10 not taken.

        102192
                    if (is_entry_valid_and_covers(entry, address, size, current_time_ns, expiry_ns))
      
                    {
      
        102628
                        return &entry;
      
                    }
      
                }
      
                // Slow path: O(log n) containment lookup via sorted ranges.
      
                // Finds the last range starting at or before the queried address,
      
                // then verifies containment and entry validity.
      
        159
                auto range_it = std::upper_bound(shard.sorted_ranges.begin(),
      
                                                  shard.sorted_ranges.end(),
      
        ✗
                                                  std::make_pair(address, UINTPTR_MAX));
      
          2/2✓ Branch 21 → 22 taken 34 times.
✓ Branch 21 → 44 taken 125 times.

        318
                if (range_it != shard.sorted_ranges.begin())
      
                {
      
                    --range_it;
      
          5/6✓ Branch 26 → 27 taken 34 times.
✗ Branch 26 → 31 not taken.
✓ Branch 29 → 30 taken 6 times.
✓ Branch 29 → 31 taken 28 times.
✓ Branch 32 → 33 taken 6 times.
✓ Branch 32 → 44 taken 28 times.

        68
                    if (address >= range_it->first && address < range_it->second)
      
                    {
      
        12
                        auto entry_it = shard.entries.find(range_it->first);
      
          1/2✓ Branch 38 → 39 taken 6 times.
✗ Branch 38 → 43 not taken.

        6
                        if (entry_it != shard.entries.end())
      
                        {
      
        6
                            CachedMemoryRegionInfo &entry = entry_it->second;
      
          2/2✓ Branch 41 → 42 taken 2 times.
✓ Branch 41 → 43 taken 4 times.

        6
                            if (is_entry_valid_and_covers(entry, address, size, current_time_ns, expiry_ns))
      
                            {
      
        2
                                return &entry;
      
                            }
      
                        }
      
                    }
      
                }
      
        157
                return nullptr;
      
            }
      
            /**
      
             * @brief Evicts the oldest entry from the shard using O(log n) LRU lookup.
      
             * @note Must be called with shard mutex held (exclusive).
      
             * @return true if an entry was evicted, false if shard is empty.
      
             */
      
        8
            bool evict_oldest_entry(CacheShard &shard) noexcept
      
            {
      
          1/2✗ Branch 3 → 4 not taken.
✓ Branch 3 → 5 taken 8 times.

        8
                if (shard.lru_index.empty())
      
        ✗
                    return false;
      
        8
                const auto lru_it = shard.lru_index.begin();
      
        8
                const uintptr_t oldest_base = lru_it->second;
      
        8
                shard.lru_index.erase(lru_it);
      
        8
                const auto entry_it = shard.entries.find(oldest_base);
      
          1/2✓ Branch 11 → 12 taken 8 times.
✗ Branch 11 → 15 not taken.

        8
                if (entry_it != shard.entries.end())
      
                {
      
        8
                    shard.entries.erase(entry_it);
      
        8
                    remove_sorted_range(shard, oldest_base);
      
        8
                    return true;
      
                }
      
        ✗
                return false;
      
            }
      
            /**
      
             * @brief Force-evicts entries until shard is at or below max_capacity.
      
             * @note Must be called with shard mutex held (exclusive).
      
             * @param shard The cache shard to trim.
      
             */
      
        36
            void trim_to_max_capacity(CacheShard &shard) noexcept
      
            {
      
          2/6✗ Branch 5 → 6 not taken.
✓ Branch 5 → 9 taken 36 times.
✗ Branch 7 → 8 not taken.
✗ Branch 7 → 9 not taken.
✗ Branch 10 → 3 not taken.
✓ Branch 10 → 11 taken 36 times.

        36
                while (shard.entries.size() > shard.max_capacity && !shard.lru_index.empty())
      
                {
      
        ✗
                    evict_oldest_entry(shard);
      
                }
      
        36
            }
      
            /**
      
             * @brief Updates or inserts a cache entry in a specific shard.
      
             * @param shard The cache shard to update.
      
             * @param mbi Memory basic information from VirtualQuery.
      
             * @param current_time_ns Current timestamp in nanoseconds.
      
             * @note Must be called with shard mutex held (exclusive).
      
             */
      
        143
            void update_shard_with_region(CacheShard &shard, const MEMORY_BASIC_INFORMATION &mbi, uint64_t current_time_ns) noexcept
      
            {
      
        143
                const uintptr_t base_addr = reinterpret_cast<uintptr_t>(mbi.BaseAddress);
      
        143
                auto it = shard.entries.find(base_addr);
      
          2/2✓ Branch 5 → 6 taken 4 times.
✓ Branch 5 → 22 taken 139 times.

        143
                if (it != shard.entries.end())
      
                {
      
                    // Remove old entry from LRU index using stored lru_key
      
        4
                    CachedMemoryRegionInfo &old_entry = it->second;
      
        4
                    const auto lru_it = shard.lru_index.find(old_entry.lru_key);
      
          3/6✓ Branch 10 → 11 taken 4 times.
✗ Branch 10 → 14 not taken.
✓ Branch 12 → 13 taken 4 times.
✗ Branch 12 → 14 not taken.
✓ Branch 15 → 16 taken 4 times.
✗ Branch 15 → 17 not taken.

        4
                    if (lru_it != shard.lru_index.end() && lru_it->second == base_addr)
      
                    {
      
        4
                        shard.lru_index.erase(lru_it);
      
                    }
      
                    // Update sorted range if region size changed
      
          1/2✗ Branch 17 → 18 not taken.
✓ Branch 17 → 20 taken 4 times.

        4
                    if (old_entry.regionSize != mbi.RegionSize)
      
                    {
      
        ✗
                        remove_sorted_range(shard, base_addr);
      
        ✗
                        insert_sorted_range(shard, base_addr, mbi.RegionSize);
      
                    }
      
                    // Update existing entry with new monotonic LRU key
      
        4
                    const uint64_t new_lru_key = shard.entry_counter++;
      
        4
                    old_entry.baseAddress = base_addr;
      
        4
                    old_entry.regionSize = mbi.RegionSize;
      
        4
                    old_entry.protection = mbi.Protect;
      
        4
                    old_entry.state = mbi.State;
      
        4
                    old_entry.timestamp_ns = current_time_ns;
      
        4
                    old_entry.lru_key = new_lru_key;
      
        4
                    old_entry.valid = true;
      
                    // Insert new composite key into LRU index
      
        4
                    shard.lru_index.emplace(new_lru_key, base_addr);
      
                }
      
                else
      
                {
      
                    // Evict oldest if at capacity - O(log n) via map
      
          2/2✓ Branch 23 → 24 taken 8 times.
✓ Branch 23 → 25 taken 131 times.

        139
                    if (shard.entries.size() >= shard.capacity)
      
                    {
      
        8
                        evict_oldest_entry(shard);
      
                    }
      
                    // Hard upper bound: trim if exceeding max_capacity
      
          1/2✗ Branch 26 → 27 not taken.
✓ Branch 26 → 28 taken 139 times.

        139
                    if (shard.entries.size() >= shard.max_capacity)
      
                    {
      
        ✗
                        trim_to_max_capacity(shard);
      
                    }
      
                    // Generate unique monotonic LRU key
      
        139
                    const uint64_t new_lru_key = shard.entry_counter++;
      
        139
                    CachedMemoryRegionInfo new_entry;
      
        139
                    new_entry.baseAddress = base_addr;
      
        139
                    new_entry.regionSize = mbi.RegionSize;
      
        139
                    new_entry.protection = mbi.Protect;
      
        139
                    new_entry.state = mbi.State;
      
        139
                    new_entry.timestamp_ns = current_time_ns;
      
        139
                    new_entry.lru_key = new_lru_key;
      
        139
                    new_entry.valid = true;
      
        278
                    shard.entries.insert_or_assign(base_addr, std::move(new_entry));
      
        139
                    shard.lru_index.emplace(new_lru_key, base_addr);
      
        139
                    insert_sorted_range(shard, base_addr, mbi.RegionSize);
      
                }
      
        143
            }
      
            /**
      
             * @brief Removes expired entries from a shard.
      
             * @note Must be called with shard mutex held (exclusive).
      
             * @return Number of entries removed from this shard.
      
             */
      
        36
            size_t cleanup_expired_entries_in_shard(CacheShard &shard,
      
                                                    uint64_t current_time_ns,
      
                                                    uint64_t expiry_ns) noexcept
      
            {
      
        36
                size_t removed = 0;
      
        36
                auto it = shard.entries.begin();
      
          2/2✓ Branch 25 → 4 taken 1 time.
✓ Branch 25 → 26 taken 36 times.

        37
                while (it != shard.entries.end())
      
                {
      
        1
                    const CachedMemoryRegionInfo &entry = it->second;
      
        1
                    const uint64_t entry_age = current_time_ns - entry.timestamp_ns;
      
          2/4✓ Branch 5 → 6 taken 1 time.
✗ Branch 5 → 7 not taken.
✓ Branch 6 → 7 taken 1 time.
✗ Branch 6 → 21 not taken.

        1
                    if (!entry.valid || entry_age > expiry_ns)
      
                    {
      
                        // Remove from LRU index using stored lru_key
      
        1
                        const auto lru_it = shard.lru_index.find(entry.lru_key);
      
          3/6✓ Branch 10 → 11 taken 1 time.
✗ Branch 10 → 15 not taken.
✓ Branch 13 → 14 taken 1 time.
✗ Branch 13 → 15 not taken.
✓ Branch 16 → 17 taken 1 time.
✗ Branch 16 → 18 not taken.

        1
                        if (lru_it != shard.lru_index.end() && lru_it->second == it->first)
      
                        {
      
        1
                            shard.lru_index.erase(lru_it);
      
                        }
      
        1
                        remove_sorted_range(shard, entry.baseAddress);
      
        1
                        it = shard.entries.erase(it);
      
        1
                        ++removed;
      
        1
                    }
      
                    else
      
                    {
      
        ✗
                        ++it;
      
                    }
      
                }
      
        36
                return removed;
      
            }
      
            /**
      
             * @brief Performs cleanup of expired cache entries across all shards.
      
             * @details Called by the background cleanup thread or on-demand timer.
      
             * @param force Force cleanup regardless of timing.
      
             */
      
        3
            void cleanup_expired_entries(bool force) noexcept
      
            {
      
                // Always hold state mutex to prevent racing with shutdown_cache()
      
                // which clears the shard vectors. try_lock for on-demand to avoid
      
                // blocking the hot path; forced cleanup blocks to guarantee progress.
      
        3
                std::unique_lock<std::mutex> lock(s_cacheStateMutex, std::defer_lock);
      
          1/2✓ Branch 3 → 4 taken 3 times.
✗ Branch 3 → 5 not taken.

        3
                if (force)
      
                {
      
        3
                    lock.lock();
      
                }
      
        ✗
                else if (!lock.try_lock())
      
                {
      
        ✗
                    return; // Shutdown or forced cleanup in progress, skip
      
                }
      
          1/2✗ Branch 9 → 10 not taken.
✓ Branch 9 → 11 taken 3 times.

        3
                if (s_cacheShards.empty())
      
        ✗
                    return;
      
        3
                const size_t shard_count = s_shardCount.load(std::memory_order_acquire);
      
          1/2✗ Branch 18 → 19 not taken.
✓ Branch 18 → 20 taken 3 times.

        3
                if (shard_count == 0)
      
        ✗
                    return;
      
        3
                const uint64_t current_ts = current_time_ns();
      
        3
                const uint64_t expiry_ns = static_cast<uint64_t>(s_configuredExpiryMs.load(std::memory_order_acquire)) * 1'000'000ULL;
      
          2/2✓ Branch 40 → 29 taken 36 times.
✓ Branch 40 → 41 taken 3 times.

        39
                for (size_t i = 0; i < shard_count; ++i)
      
                {
      
        36
                    std::unique_lock<SrwSharedMutex> shard_lock(*s_shardMutexes[i], std::try_to_lock);
      
          1/2✓ Branch 33 → 34 taken 36 times.
✗ Branch 33 → 38 not taken.

        36
                    if (shard_lock.owns_lock())
      
                    {
      
        36
                        cleanup_expired_entries_in_shard(s_cacheShards[i], current_ts, expiry_ns);
      
                        // Also trim to hard upper bound
      
        36
                        trim_to_max_capacity(s_cacheShards[i]);
      
                    }
      
        36
                }
      
          1/2✓ Branch 43 → 44 taken 3 times.
✗ Branch 43 → 46 not taken.

        3
            }
      
            /**
      
             * @brief Checks if on-demand cleanup should run based on elapsed time.
      
             * @return true if cleanup was performed, false otherwise.
      
             */
      
        ✗
            bool try_trigger_on_demand_cleanup() noexcept
      
            {
      
        ✗
                if (!s_cacheInitialized.load(std::memory_order_acquire))
      
        ✗
                    return false;
      
        ✗
                const uint64_t now_ns = current_time_ns();
      
        ✗
                const uint64_t last_cleanup = s_lastCleanupTimeNs.load(std::memory_order_acquire);
      
        ✗
                const uint64_t elapsed_ns = now_ns - last_cleanup;
      
        ✗
                if (elapsed_ns >= CLEANUP_INTERVAL_NS)
      
                {
      
                    // Atomically update last cleanup time to prevent multiple threads triggering
      
        ✗
                    uint64_t expected = last_cleanup;
      
        ✗
                    if (s_lastCleanupTimeNs.compare_exchange_strong(expected, now_ns, std::memory_order_acq_rel))
      
                    {
      
        ✗
                        cleanup_expired_entries(false);
      
                        s_stats.onDemandCleanups.fetch_add(1, std::memory_order_relaxed);
      
        ✗
                        return true;
      
                    }
      
                }
      
        ✗
                return false;
      
            }
      
            /**
      
             * @brief Background cleanup thread function.
      
             * @details Runs periodically to clean up expired entries without impacting the miss path.
      
             */
      
        191
            void cleanup_thread_func() noexcept
      
            {
      
          2/2✓ Branch 13 → 3 taken 16 times.
✓ Branch 13 → 14 taken 178 times.

        194
                while (s_cleanupThreadRunning.load(std::memory_order_acquire))
      
                {
      
                    {
      
        16
                        std::unique_lock<std::mutex> lock(s_cleanupMutex);
      
        16
                        s_cleanupCv.wait_for(lock, std::chrono::seconds(1), [&]()
      
          4/4✓ Branch 3 → 4 taken 28 times.
✓ Branch 3 → 6 taken 2 times.
✓ Branch 5 → 6 taken 13 times.
✓ Branch 5 → 7 taken 15 times.

        30
                                             { return s_cleanupRequested.load(std::memory_order_acquire) || !s_cleanupThreadRunning.load(std::memory_order_acquire); });
      
        16
                    }
      
          2/2✓ Branch 8 → 9 taken 13 times.
✓ Branch 8 → 10 taken 3 times.

        16
                    if (!s_cleanupThreadRunning.load(std::memory_order_acquire))
      
        13
                        break;
      
        3
                    cleanup_expired_entries(true); // force=true to hold state mutex during vector iteration
      
        3
                    s_cleanupRequested.store(false, std::memory_order_relaxed);
      
                }
      
        191
            }
      
            /**
      
             * @brief Signals the cleanup thread to run or triggers on-demand cleanup.
      
             */
      
        15
            void request_cleanup() noexcept
      
            {
      
          1/2✓ Branch 3 → 4 taken 15 times.
✗ Branch 3 → 6 not taken.

        15
                if (s_cleanupThreadRunning.load(std::memory_order_acquire))
      
                {
      
        15
                    s_cleanupRequested.store(true, std::memory_order_relaxed);
      
        15
                    s_cleanupCv.notify_one();
      
                }
      
                else
      
                {
      
                    // Background thread disabled (MinGW) - use on-demand timer-based cleanup
      
        ✗
                    try_trigger_on_demand_cleanup();
      
                }
      
        15
            }
      
            /**
      
             * @brief Invalidates cache entries in shards that overlap with the given range.
      
             * @details Only invalidates specific entries that overlap, not entire shards.
      
             *          Uses retry loop to handle locked shards gracefully.
      
             */
      
        15
            void invalidate_range_internal(uintptr_t address, size_t size) noexcept
      
            {
      
          3/6✓ Branch 3 → 4 taken 15 times.
✗ Branch 3 → 5 not taken.
✗ Branch 4 → 5 not taken.
✓ Branch 4 → 6 taken 15 times.
✗ Branch 7 → 8 not taken.
✓ Branch 7 → 9 taken 15 times.

        15
                if (s_cacheShards.empty() || size == 0)
      
        ✗
                    return;
      
                // Guard against address + size wrapping around the address space
      
          2/2✓ Branch 9 → 10 taken 14 times.
✓ Branch 9 → 11 taken 1 time.

        15
                const uintptr_t endAddress = (address + size < address) ? UINTPTR_MAX : address + size;
      
        15
                const size_t shard_count = s_shardCount.load(std::memory_order_acquire);
      
        15
                const uintptr_t start_page = address >> 12;
      
          1/2✓ Branch 19 → 20 taken 15 times.
✗ Branch 19 → 21 not taken.

        15
                const uintptr_t end_page = (endAddress == 0 ? address : endAddress - 1) >> 12;
      
        15
                constexpr size_t MAX_INVALIDATION_RETRIES = 3;
      
          1/2✓ Branch 74 → 23 taken 15 times.
✗ Branch 74 → 75 not taken.

        15
                for (uintptr_t page = start_page; page <= end_page; ++page)
      
                {
      
        15
                    const size_t shard_idx = compute_shard_index(page << 12, shard_count);
      
        15
                    bool invalidated = false;
      
          3/4✓ Branch 69 → 70 taken 30 times.
✗ Branch 69 → 71 not taken.
✓ Branch 70 → 25 taken 15 times.
✓ Branch 70 → 71 taken 15 times.

        30
                    for (size_t retry = 0; retry < MAX_INVALIDATION_RETRIES && !invalidated; ++retry)
      
                    {
      
        15
                        std::unique_lock<SrwSharedMutex> lock(*s_shardMutexes[shard_idx], std::try_to_lock);
      
          1/2✗ Branch 29 → 30 not taken.
✓ Branch 29 → 33 taken 15 times.

        15
                        if (!lock.owns_lock())
      
                        {
      
                            // Shard is locked by another writer - yield and retry
      
        ✗
                            if (retry < MAX_INVALIDATION_RETRIES - 1)
      
                            {
      
        ✗
                                std::this_thread::yield();
      
                            }
      
        ✗
                            continue;
      
                        }
      
        15
                        CacheShard &shard = s_cacheShards[shard_idx];
      
        15
                        const uintptr_t page_base = page << 12;
      
        15
                        auto it = shard.entries.find(page_base);
      
          2/2✓ Branch 37 → 38 taken 5 times.
✓ Branch 37 → 61 taken 10 times.

        15
                        if (it != shard.entries.end())
      
                        {
      
        5
                            CachedMemoryRegionInfo &entry = it->second;
      
          1/2✗ Branch 39 → 40 not taken.
✓ Branch 39 → 41 taken 5 times.

        5
                            if (!entry.valid)
      
                            {
      
        ✗
                                invalidated = true;
      
        ✗
                                continue;
      
                            }
      
        5
                            const uintptr_t entryEndAddress = entry.baseAddress + entry.regionSize;
      
          2/4✓ Branch 41 → 42 taken 5 times.
✗ Branch 41 → 44 not taken.
✓ Branch 42 → 43 taken 5 times.
✗ Branch 42 → 44 not taken.

        5
                            const bool overlaps = address < entryEndAddress && endAddress > entry.baseAddress;
      
          1/2✓ Branch 45 → 46 taken 5 times.
✗ Branch 45 → 62 not taken.

        5
                            if (overlaps)
      
                            {
      
                                // Remove from LRU index using stored lru_key to avoid tombstone accumulation
      
        5
                                const auto lru_it = shard.lru_index.find(entry.lru_key);
      
          3/6✓ Branch 49 → 50 taken 5 times.
✗ Branch 49 → 53 not taken.
✓ Branch 51 → 52 taken 5 times.
✗ Branch 51 → 53 not taken.
✓ Branch 54 → 55 taken 5 times.
✗ Branch 54 → 56 not taken.

        5
                                if (lru_it != shard.lru_index.end() && lru_it->second == page_base)
      
                                {
      
        5
                                    shard.lru_index.erase(lru_it);
      
                                }
      
                                // Erase entry immediately instead of leaving tombstone
      
        5
                                remove_sorted_range(shard, entry.baseAddress);
      
        5
                                shard.entries.erase(it);
      
                                s_stats.invalidations.fetch_add(1, std::memory_order_relaxed);
      
        5
                                invalidated = true;
      
                            }
      
                        }
      
                        else
      
                        {
      
        10
                            invalidated = true;
      
                        }
      
          1/2✓ Branch 64 → 65 taken 15 times.
✗ Branch 64 → 67 not taken.

        15
                    }
      
          1/2✓ Branch 71 → 72 taken 15 times.
✗ Branch 71 → 73 not taken.

        15
                    if (start_page == end_page)
      
        15
                        break;
      
                }
      
            }
      
            /**
      
             * @brief Performs one-time cache initialization.
      
             */
      
        191
            bool perform_cache_initialization(size_t cache_size, unsigned int expiry_ms, size_t shard_count)
      
            {
      
          1/2✗ Branch 2 → 3 not taken.
✓ Branch 2 → 4 taken 191 times.

        191
                if (cache_size == 0)
      
        ✗
                    cache_size = 1;
      
          1/2✗ Branch 4 → 5 not taken.
✓ Branch 4 → 6 taken 191 times.

        191
                if (shard_count == 0)
      
        ✗
                    shard_count = 1;
      
        191
                const size_t entries_per_shard = (cache_size + shard_count - 1) / shard_count;
      
        191
                const size_t hard_max_per_shard = entries_per_shard * 2; // Hard upper bound: 2x capacity
      
                try
      
                {
      
          1/2✓ Branch 6 → 7 taken 191 times.
✗ Branch 6 → 73 not taken.

        191
                    s_cacheShards.resize(shard_count);
      
          1/2✓ Branch 7 → 8 taken 191 times.
✗ Branch 7 → 73 not taken.

        191
                    s_shardMutexes.resize(shard_count);
      
          1/2✓ Branch 8 → 9 taken 191 times.
✗ Branch 8 → 71 not taken.

        191
                    s_inFlight = std::make_unique<std::atomic<char>[]>(shard_count);
      
          2/2✓ Branch 32 → 12 taken 2744 times.
✓ Branch 32 → 33 taken 191 times.

        2935
                    for (size_t i = 0; i < shard_count; ++i)
      
                    {
      
          1/2✓ Branch 13 → 14 taken 2744 times.
✗ Branch 13 → 73 not taken.

        2744
                        s_cacheShards[i].entries.reserve(entries_per_shard * 2);
      
          1/2✓ Branch 15 → 16 taken 2744 times.
✗ Branch 15 → 73 not taken.

        2744
                        s_cacheShards[i].sorted_ranges.reserve(entries_per_shard * 2);
      
        2744
                        s_cacheShards[i].capacity = entries_per_shard;
      
        2744
                        s_cacheShards[i].max_capacity = hard_max_per_shard;
      
          1/2✓ Branch 18 → 19 taken 2744 times.
✗ Branch 18 → 72 not taken.

        2744
                        s_shardMutexes[i] = std::make_unique<SrwSharedMutex>();
      
        2744
                        s_inFlight[i].store(0, std::memory_order_relaxed);
      
                    }
      
                }
      
        ✗
                catch (const std::bad_alloc &)
      
                {
      
        ✗
                    Logger::get_instance().error("MemoryCache: Failed to allocate memory for cache shards.");
      
        ✗
                    s_cacheShards.clear();
      
        ✗
                    s_shardMutexes.clear();
      
        ✗
                    s_inFlight.reset();
      
                    // Reset initialization flag so retry can work
      
        ✗
                    s_cacheInitialized.store(false, std::memory_order_relaxed);
      
        ✗
                    return false;
      
        ✗
                }
      
        191
                s_shardCount.store(shard_count, std::memory_order_release);
      
        191
                s_maxEntriesPerShard.store(entries_per_shard, std::memory_order_release);
      
        191
                s_configuredExpiryMs.store(expiry_ms, std::memory_order_release);
      
        191
                s_lastCleanupTimeNs.store(current_time_ns(), std::memory_order_release);
      
          2/4✓ Branch 66 → 67 taken 191 times.
✗ Branch 66 → 87 not taken.
✓ Branch 67 → 68 taken 191 times.
✗ Branch 67 → 86 not taken.

        191
                Logger::get_instance().debug("MemoryCache: Initialized with {} shards ({} entries/shard, {}ms expiry, {} max).",
      
                                             shard_count, entries_per_shard, expiry_ms, hard_max_per_shard);
      
        191
                return true;
      
            }
      
            /**
      
             * @brief Performs VirtualQuery and updates cache with coalescing support.
      
             * @param shard_idx Index of the shard to update.
      
             * @param address Address to query.
      
             * @param mbi_out Output buffer for VirtualQuery result.
      
             * @return true if VirtualQuery succeeded.
      
             */
      
        143
            bool query_and_update_cache(size_t shard_idx, LPCVOID address, MEMORY_BASIC_INFORMATION &mbi_out) noexcept
      
            {
      
        143
                CacheShard &shard = s_cacheShards[shard_idx];
      
                // Try to claim in-flight status (stampede coalescing)
      
        143
                char expected = 0;
      
          1/2✓ Branch 12 → 13 taken 143 times.
✗ Branch 12 → 32 not taken.

        286
                if (s_inFlight[shard_idx].compare_exchange_strong(expected, 1, std::memory_order_acq_rel))
      
                {
      
                    // We are the leader - perform VirtualQuery
      
        143
                    const bool result = VirtualQuery(address, &mbi_out, sizeof(mbi_out)) != 0;
      
        143
                    const uint64_t now_ns = current_time_ns();
      
          1/2✓ Branch 15 → 16 taken 143 times.
✗ Branch 15 → 22 not taken.

        143
                    if (result)
      
                    {
      
        143
                        std::unique_lock<SrwSharedMutex> lock(*s_shardMutexes[shard_idx]);
      
        143
                        update_shard_with_region(shard, mbi_out, now_ns);
      
        143
                    }
      
                    // Release in-flight status
      
        143
                    s_inFlight[shard_idx].store(0, std::memory_order_release);
      
        143
                    return result;
      
                }
      
                else
      
                {
      
                    // We are a follower - VirtualQuery already in progress by another thread.
      
                    // Bounded wait to avoid stalling game threads on render-critical paths.
      
        ✗
                    const uint64_t expiry_ns = static_cast<uint64_t>(s_configuredExpiryMs.load(std::memory_order_acquire)) * 1'000'000ULL;
      
        ✗
                    constexpr size_t MAX_FOLLOWER_YIELDS = 8;
      
        ✗
                    for (size_t yield_count = 0; yield_count < MAX_FOLLOWER_YIELDS; ++yield_count)
      
                    {
      
        ✗
                        if (s_inFlight[shard_idx].load(std::memory_order_acquire) == 0)
      
                        {
      
                            // Query completed, check cache
      
        ✗
                            const uintptr_t addr_val = reinterpret_cast<uintptr_t>(address);
      
        ✗
                            std::shared_lock<SrwSharedMutex> lock(*s_shardMutexes[shard_idx]);
      
        ✗
                            CachedMemoryRegionInfo *cached = find_in_shard(shard, addr_val, 1, current_time_ns(), expiry_ns);
      
        ✗
                            if (cached)
      
                            {
      
                                s_stats.coalescedQueries.fetch_add(1, std::memory_order_relaxed);
      
                                // Copy cached info to output for consistency
      
        ✗
                                mbi_out.BaseAddress = reinterpret_cast<PVOID>(cached->baseAddress);
      
        ✗
                                mbi_out.RegionSize = cached->regionSize;
      
        ✗
                                mbi_out.Protect = cached->protection;
      
        ✗
                                mbi_out.State = cached->state;
      
        ✗
                                return true;
      
                            }
      
                            // Cache not populated, break to retry as leader
      
        ✗
                            break;
      
        ✗
                        }
      
                        // Yield to allow the leader thread to complete
      
        ✗
                        std::this_thread::yield();
      
                    }
      
                    // Retry as leader if follower wait timed out
      
        ✗
                    expected = 0;
      
        ✗
                    if (s_inFlight[shard_idx].compare_exchange_strong(expected, 1, std::memory_order_acq_rel))
      
                    {
      
        ✗
                        const bool result = VirtualQuery(address, &mbi_out, sizeof(mbi_out)) != 0;
      
        ✗
                        if (result)
      
                        {
      
        ✗
                            std::unique_lock<SrwSharedMutex> lock(*s_shardMutexes[shard_idx]);
      
        ✗
                            const uint64_t now_ns = current_time_ns();
      
        ✗
                            update_shard_with_region(shard, mbi_out, now_ns);
      
        ✗
                        }
      
        ✗
                        s_inFlight[shard_idx].store(0, std::memory_order_release);
      
        ✗
                        return result;
      
                    }
      
                    // Last resort: just do VirtualQuery without cache update
      
        ✗
                    return VirtualQuery(address, &mbi_out, sizeof(mbi_out)) != 0;
      
                }
      
            }
      
        } // anonymous namespace (cache internals)
      
        193
        bool DetourModKit::Memory::init_cache(size_t cache_size, unsigned int expiry_ms, size_t shard_count)
      
        {
      
            // Hold state mutex to prevent concurrent clear_cache or shutdown_cache
      
            // This serializes init/clear/shutdown transitions to ensure vectors are not accessed while being resized or cleared
      
          1/2✓ Branch 2 → 3 taken 193 times.
✗ Branch 2 → 38 not taken.

        193
            std::lock_guard<std::mutex> state_lock(s_cacheStateMutex);
      
            // Fast path: already initialized
      
          2/2✓ Branch 4 → 5 taken 2 times.
✓ Branch 4 → 6 taken 191 times.

        193
            if (s_cacheInitialized.load(std::memory_order_acquire))
      
        2
                return true;
      
            // Try to initialize
      
        191
            bool expected = false;
      
          1/2✓ Branch 7 → 8 taken 191 times.
✗ Branch 7 → 21 not taken.

        191
            if (s_cacheInitialized.compare_exchange_strong(expected, true, std::memory_order_acq_rel))
      
            {
      
          2/4✓ Branch 8 → 9 taken 191 times.
✗ Branch 8 → 36 not taken.
✗ Branch 9 → 10 not taken.
✓ Branch 9 → 11 taken 191 times.

        191
                if (!perform_cache_initialization(cache_size, expiry_ms, shard_count))
      
                {
      
                    // Initialization failed - s_cacheInitialized already reset to false in perform_cache_initialization
      
        ✗
                    return false;
      
                }
      
                // Try to start background cleanup thread (may fail silently on MinGW)
      
        191
                s_cleanupThreadRunning.store(true, std::memory_order_release);
      
                try
      
                {
      
          1/2✓ Branch 12 → 13 taken 191 times.
✗ Branch 12 → 25 not taken.

        191
                    s_cleanupThread = std::thread(cleanup_thread_func);
      
                }
      
        ✗
                catch (const std::system_error &)
      
                {
      
                    // Background thread creation failed (MinGW pthreads issue) - use on-demand cleanup
      
        ✗
                    s_cleanupThreadRunning.store(false, std::memory_order_release);
      
        ✗
                    Logger::get_instance().debug("MemoryCache: Background cleanup thread unavailable, using on-demand cleanup.");
      
        ✗
                }
      
                // Register atexit handler as a last-resort safety net in case the
      
                // consumer forgets to call shutdown_cache() / DMK_Shutdown().
      
                // Prevents std::terminate from the joinable std::thread destructor.
      
                // The handler detects loader-lock context (FreeLibrary) and skips
      
                // the thread join to avoid deadlock.
      
                static bool atexit_registered = false;
      
          2/2✓ Branch 16 → 17 taken 1 time.
✓ Branch 16 → 20 taken 190 times.

        191
                if (!atexit_registered)
      
                {
      
        1
                    std::atexit([]()
      
                                {
      
          1/2✗ Branch 3 → 4 not taken.
✓ Branch 3 → 15 taken 1 time.

        1
                        if (s_cacheInitialized.load(std::memory_order_acquire))
      
                        {
      
        ✗
                            if (is_loader_lock_held())
      
                            {
      
                                // Under loader lock (FreeLibrary path): pin the module
      
                                // so code pages remain valid for the detached thread,
      
                                // then signal it to stop and detach.
      
        ✗
                                s_cleanupThreadRunning.store(false, std::memory_order_release);
      
        ✗
                                s_cleanupCv.notify_one();
      
        ✗
                                if (s_cleanupThread.joinable())
      
                                {
      
        ✗
                                    pin_current_module();
      
        ✗
                                    s_cleanupThread.detach();
      
                                }
      
        ✗
                                s_cacheInitialized.store(false, std::memory_order_release);
      
        ✗
                                return;
      
                            }
      
        ✗
                            Memory::shutdown_cache();
      
                        } });
      
        1
                    atexit_registered = true;
      
                }
      
        191
                return true;
      
            }
      
            // Another thread initialized while we were waiting
      
        ✗
            return true;
      
        193
        }
      
        26
        void DetourModKit::Memory::clear_cache()
      
        {
      
            // Hold state mutex to serialize with shutdown and cleanup thread
      
          1/2✓ Branch 2 → 3 taken 26 times.
✗ Branch 2 → 102 not taken.

        26
            std::lock_guard<std::mutex> state_lock(s_cacheStateMutex);
      
          1/2✗ Branch 4 → 5 not taken.
✓ Branch 4 → 6 taken 26 times.

        26
            if (!s_cacheInitialized.load(std::memory_order_acquire))
      
        ✗
                return;
      
        26
            const size_t shard_count = s_shardCount.load(std::memory_order_acquire);
      
          1/2✗ Branch 13 → 14 not taken.
✓ Branch 13 → 15 taken 26 times.

        26
            if (shard_count == 0)
      
        ✗
                return;
      
            // Acquire exclusive lock on each shard and clear entries.
      
            // Uses blocking lock to guarantee all entries are cleared.
      
            // The background cleanup thread uses try_to_lock on shard mutexes,
      
            // so it will skip shards we hold without deadlocking.
      
          2/2✓ Branch 39 → 16 taken 392 times.
✓ Branch 39 → 40 taken 26 times.

        418
            for (size_t i = 0; i < shard_count; ++i)
      
            {
      
        392
                auto &mutex_ptr = s_shardMutexes[i];
      
          1/2✓ Branch 18 → 19 taken 392 times.
✗ Branch 18 → 38 not taken.

        392
                if (mutex_ptr)
      
                {
      
          1/2✓ Branch 20 → 21 taken 392 times.
✗ Branch 20 → 98 not taken.

        392
                    std::unique_lock<SrwSharedMutex> shard_lock(*mutex_ptr);
      
        392
                    s_cacheShards[i].entries.clear();
      
        392
                    s_cacheShards[i].lru_index.clear();
      
        392
                    s_cacheShards[i].sorted_ranges.clear();
      
        392
                    s_inFlight[i].store(0, std::memory_order_relaxed);
      
        392
                }
      
            }
      
            s_stats.cacheHits.store(0, std::memory_order_relaxed);
      
            s_stats.cacheMisses.store(0, std::memory_order_relaxed);
      
            s_stats.invalidations.store(0, std::memory_order_relaxed);
      
            s_stats.coalescedQueries.store(0, std::memory_order_relaxed);
      
            s_stats.onDemandCleanups.store(0, std::memory_order_relaxed);
      
        26
            s_lastCleanupTimeNs.store(current_time_ns(), std::memory_order_relaxed);
      
          2/4✓ Branch 89 → 90 taken 26 times.
✗ Branch 89 → 100 not taken.
✓ Branch 90 → 91 taken 26 times.
✗ Branch 90 → 99 not taken.

        26
            Logger::get_instance().debug("MemoryCache: All entries cleared.");
      
          1/2✓ Branch 93 → 94 taken 26 times.
✗ Branch 93 → 96 not taken.

        26
        }
      
        213
        void DetourModKit::Memory::shutdown_cache()
      
        {
      
            // Signal and join cleanup thread BEFORE acquiring state mutex.
      
            // The cleanup thread acquires s_cacheStateMutex in cleanup_expired_entries(force=true),
      
            // so joining while holding the state mutex would deadlock.
      
        213
            s_cleanupThreadRunning.store(false, std::memory_order_release);
      
        213
            s_cleanupCv.notify_one();
      
          2/2✓ Branch 5 → 6 taken 191 times.
✓ Branch 5 → 11 taken 22 times.

        213
            if (s_cleanupThread.joinable())
      
            {
      
          1/2✗ Branch 7 → 8 not taken.
✓ Branch 7 → 10 taken 191 times.

        191
                if (is_loader_lock_held())
      
                {
      
                    // Under loader lock (DllMain / FreeLibrary): thread join would
      
                    // deadlock because the cleanup thread cannot exit while the
      
                    // loader lock is held. Pin the module so code and static data
      
                    // remain valid, then detach. The thread will observe the stop
      
                    // flag and exit on its own.
      
        ✗
                    pin_current_module();
      
        ✗
                    s_cleanupThread.detach();
      
                }
      
                else
      
                {
      
          1/2✓ Branch 10 → 11 taken 191 times.
✗ Branch 10 → 132 not taken.

        191
                    s_cleanupThread.join();
      
                }
      
            }
      
            // Acquire state mutex to serialize with clear_cache and protect data teardown
      
          1/2✓ Branch 11 → 12 taken 213 times.
✗ Branch 11 → 132 not taken.

        213
            std::lock_guard<std::mutex> state_lock(s_cacheStateMutex);
      
            // Mark as not initialized and zero shard count.
      
            // This prevents new readers from entering the critical section.
      
            // acquire/release is sufficient here because the state mutex provides the
      
            // cross-thread ordering guarantee. Readers that observe shard_count == 0
      
            // immediately exit without touching data structures.
      
        213
            s_cacheInitialized.store(false, std::memory_order_release);
      
            s_shardCount.store(0, std::memory_order_release);
      
            // Wait for in-flight readers to finish before destroying data structures.
      
            // Readers increment s_activeReaders on entry and decrement on exit.
      
            // ActiveReaderGuard is RAII so readers always decrement; this loop is
      
            // bounded by the maximum time a single cache lookup can take.
      
            // Escalate from yield to sleep to avoid burning CPU if a reader is
      
            // preempted by the OS scheduler.
      
        213
            constexpr int yield_spins = 4096;
      
        213
            int spins = 0;
      
          1/2✗ Branch 35 → 22 not taken.
✓ Branch 35 → 36 taken 213 times.

        426
            while (s_activeReaders.load(std::memory_order_acquire) > 0)
      
            {
      
        ✗
                if (spins < yield_spins)
      
                {
      
        ✗
                    std::this_thread::yield();
      
                }
      
                else
      
                {
      
        ✗
                    std::this_thread::sleep_for(std::chrono::microseconds(100));
      
                }
      
        ✗
                ++spins;
      
            }
      
            // All readers have exited - safe to destroy data structures
      
        213
            const size_t shard_count = s_cacheShards.size();
      
          2/2✓ Branch 53 → 38 taken 2744 times.
✓ Branch 53 → 54 taken 213 times.

        2957
            for (size_t i = 0; i < shard_count; ++i)
      
            {
      
          1/2✓ Branch 40 → 41 taken 2744 times.
✗ Branch 40 → 52 not taken.

        2744
                if (s_shardMutexes[i])
      
                {
      
          1/2✓ Branch 43 → 44 taken 2744 times.
✗ Branch 43 → 128 not taken.

        2744
                    std::unique_lock<SrwSharedMutex> shard_lock(*s_shardMutexes[i]);
      
        2744
                    s_cacheShards[i].entries.clear();
      
        2744
                    s_cacheShards[i].lru_index.clear();
      
        2744
                    s_cacheShards[i].sorted_ranges.clear();
      
        2744
                }
      
            }
      
        213
            s_cacheShards.clear();
      
        213
            s_shardMutexes.clear();
      
        213
            s_inFlight.reset();
      
            // Reset all stats and config so a subsequent init_cache starts from a clean state
      
            s_stats.cacheHits.store(0, std::memory_order_relaxed);
      
            s_stats.cacheMisses.store(0, std::memory_order_relaxed);
      
            s_stats.invalidations.store(0, std::memory_order_relaxed);
      
            s_stats.coalescedQueries.store(0, std::memory_order_relaxed);
      
            s_stats.onDemandCleanups.store(0, std::memory_order_relaxed);
      
            s_lastCleanupTimeNs.store(0, std::memory_order_relaxed);
      
            s_configuredExpiryMs.store(0, std::memory_order_relaxed);
      
            s_maxEntriesPerShard.store(0, std::memory_order_relaxed);
      
        213
            s_cleanupRequested.store(false, std::memory_order_relaxed);
      
          2/4✓ Branch 122 → 123 taken 213 times.
✗ Branch 122 → 130 not taken.
✓ Branch 123 → 124 taken 213 times.
✗ Branch 123 → 129 not taken.

        213
            Logger::get_instance().debug("MemoryCache: Shutdown complete.");
      
        213
        }
      
        22
        std::string DetourModKit::Memory::get_cache_stats()
      
        {
      
        22
            const uint64_t hits = s_stats.cacheHits.load(std::memory_order_relaxed);
      
        22
            const uint64_t misses = s_stats.cacheMisses.load(std::memory_order_relaxed);
      
        22
            const uint64_t invalidations = s_stats.invalidations.load(std::memory_order_relaxed);
      
        22
            const uint64_t coalesced = s_stats.coalescedQueries.load(std::memory_order_relaxed);
      
        22
            const uint64_t on_demand_cleanups = s_stats.onDemandCleanups.load(std::memory_order_relaxed);
      
        22
            const uint64_t total_queries = hits + misses;
      
        22
            const size_t shard_count = s_shardCount.load(std::memory_order_acquire);
      
        22
            const size_t max_entries_per_shard = s_maxEntriesPerShard.load(std::memory_order_acquire);
      
        22
            const unsigned int expiry_ms = s_configuredExpiryMs.load(std::memory_order_acquire);
      
            // Calculate total entries and hard max with reader guard
      
        22
            size_t total_entries = 0;
      
        22
            size_t total_hard_max = 0;
      
            {
      
        22
                ActiveReaderGuard reader_guard;
      
        22
                const size_t active_shard_count = s_shardCount.load(std::memory_order_acquire);
      
          2/2✓ Branch 78 → 67 taken 115 times.
✓ Branch 78 → 79 taken 22 times.

        137
                for (size_t i = 0; i < active_shard_count; ++i)
      
                {
      
        115
                    auto &mutex_ptr = s_shardMutexes[i];
      
          1/2✓ Branch 69 → 70 taken 115 times.
✗ Branch 69 → 77 not taken.

        115
                    if (mutex_ptr)
      
                    {
      
        115
                        std::shared_lock<SrwSharedMutex> shard_lock(*mutex_ptr);
      
        115
                        total_entries += s_cacheShards[i].entries.size();
      
        115
                        total_hard_max += s_cacheShards[i].max_capacity;
      
        115
                    }
      
                }
      
        22
            }
      
          1/2✓ Branch 80 → 81 taken 22 times.
✗ Branch 80 → 120 not taken.

        22
            std::ostringstream oss;
      
          2/4✓ Branch 81 → 82 taken 22 times.
✗ Branch 81 → 118 not taken.
✓ Branch 82 → 83 taken 22 times.
✗ Branch 82 → 118 not taken.

        22
            oss << "MemoryCache Stats (Shards: " << shard_count
      
          2/4✓ Branch 83 → 84 taken 22 times.
✗ Branch 83 → 118 not taken.
✓ Branch 84 → 85 taken 22 times.
✗ Branch 84 → 118 not taken.

        22
                << ", Entries/Shard: " << max_entries_per_shard
      
          3/6✓ Branch 85 → 86 taken 22 times.
✗ Branch 85 → 118 not taken.
✓ Branch 86 → 87 taken 22 times.
✗ Branch 86 → 88 not taken.
✓ Branch 89 → 90 taken 22 times.
✗ Branch 89 → 118 not taken.

        22
                << ", HardMax/Shard: " << (shard_count > 0 ? total_hard_max / shard_count : 0)
      
          2/4✓ Branch 90 → 91 taken 22 times.
✗ Branch 90 → 118 not taken.
✓ Branch 91 → 92 taken 22 times.
✗ Branch 91 → 118 not taken.

        22
                << ", Expiry: " << expiry_ms << "ms) - "
      
          5/10✓ Branch 92 → 93 taken 22 times.
✗ Branch 92 → 118 not taken.
✓ Branch 93 → 94 taken 22 times.
✗ Branch 93 → 118 not taken.
✓ Branch 94 → 95 taken 22 times.
✗ Branch 94 → 118 not taken.
✓ Branch 95 → 96 taken 22 times.
✗ Branch 95 → 118 not taken.
✓ Branch 96 → 97 taken 22 times.
✗ Branch 96 → 118 not taken.

        22
                << "Hits: " << hits << ", Misses: " << misses
      
          2/4✓ Branch 97 → 98 taken 22 times.
✗ Branch 97 → 118 not taken.
✓ Branch 98 → 99 taken 22 times.
✗ Branch 98 → 118 not taken.

        22
                << ", Invalidations: " << invalidations
      
          2/4✓ Branch 99 → 100 taken 22 times.
✗ Branch 99 → 118 not taken.
✓ Branch 100 → 101 taken 22 times.
✗ Branch 100 → 118 not taken.

        22
                << ", Coalesced: " << coalesced
      
          2/4✓ Branch 101 → 102 taken 22 times.
✗ Branch 101 → 118 not taken.
✓ Branch 102 → 103 taken 22 times.
✗ Branch 102 → 118 not taken.

        22
                << ", OnDemandCleanups: " << on_demand_cleanups
      
          2/4✓ Branch 103 → 104 taken 22 times.
✗ Branch 103 → 118 not taken.
✓ Branch 104 → 105 taken 22 times.
✗ Branch 104 → 118 not taken.

        22
                << ", TotalEntries: " << total_entries;
      
          2/2✓ Branch 105 → 106 taken 16 times.
✓ Branch 105 → 112 taken 6 times.

        22
            if (total_queries > 0)
      
            {
      
        16
                const double hit_rate_percent = (static_cast<double>(hits) / static_cast<double>(total_queries)) * 100.0;
      
          4/8✓ Branch 106 → 107 taken 16 times.
✗ Branch 106 → 118 not taken.
✓ Branch 107 → 108 taken 16 times.
✗ Branch 107 → 118 not taken.
✓ Branch 110 → 111 taken 16 times.
✗ Branch 110 → 118 not taken.
✓ Branch 111 → 113 taken 16 times.
✗ Branch 111 → 118 not taken.

        16
                oss << ", Hit Rate: " << std::fixed << std::setprecision(2) << hit_rate_percent << "%";
      
            }
      
            else
      
            {
      
          1/2✓ Branch 112 → 113 taken 6 times.
✗ Branch 112 → 118 not taken.

        6
                oss << ", Hit Rate: N/A (no queries tracked)";
      
            }
      
          1/2✓ Branch 113 → 114 taken 22 times.
✗ Branch 113 → 118 not taken.

        44
            return oss.str();
      
        22
        }
      
        17
        void DetourModKit::Memory::invalidate_range(const void *address, size_t size)
      
        {
      
          4/4✓ Branch 2 → 3 taken 16 times.
✓ Branch 2 → 4 taken 1 time.
✓ Branch 3 → 4 taken 1 time.
✓ Branch 3 → 5 taken 15 times.

        17
            if (!address || size == 0)
      
        2
                return;
      
            // Construct reader guard BEFORE checking s_cacheInitialized to prevent
      
            // shutdown_cache from destroying data structures between the check and access.
      
        15
            ActiveReaderGuard reader_guard;
      
          1/2✗ Branch 7 → 8 not taken.
✓ Branch 7 → 9 taken 15 times.

        15
            if (!s_cacheInitialized.load(std::memory_order_acquire))
      
        ✗
                return;
      
        15
            const size_t shard_count = s_shardCount.load(std::memory_order_acquire);
      
          1/2✗ Branch 16 → 17 not taken.
✓ Branch 16 → 18 taken 15 times.

        15
            if (shard_count == 0)
      
        ✗
                return;
      
        15
            const uintptr_t addr_val = reinterpret_cast<uintptr_t>(address);
      
        15
            invalidate_range_internal(addr_val, size);
      
            // request_cleanup may trigger on-demand cleanup_expired_entries(force=false)
      
            // which iterates shards without s_cacheStateMutex. Keep s_activeReaders > 0
      
            // so shutdown_cache cannot destroy shards during the cleanup pass.
      
        15
            request_cleanup();
      
          1/2✓ Branch 22 → 23 taken 15 times.
✗ Branch 22 → 25 not taken.

        15
        }
      
        namespace
      
        {
      
            /**
      
             * @brief Unified permission check for is_readable/is_writable.
      
             * @details Parameterized by permission checker to avoid duplicating the
      
             *          cache lookup, VirtualQuery fallback, and range validation logic.
      
             * @param address Starting address of the memory region.
      
             * @param size Number of bytes in the memory region to check.
      
             * @param check_permission Function that validates protection flags.
      
             * @return true if the entire region has the requested permission.
      
             */
      
        100063
            bool check_memory_permission(const void *address, size_t size,
      
                                         bool (*check_permission)(DWORD) noexcept) noexcept
      
            {
      
          2/4✓ Branch 2 → 3 taken 102266 times.
✗ Branch 2 → 4 not taken.
✗ Branch 3 → 4 not taken.
✓ Branch 3 → 5 taken 103178 times.

        100063
                if (!address || size == 0)
      
        ✗
                    return false;
      
                // Construct reader guard BEFORE checking s_cacheInitialized to prevent
      
                // shutdown_cache from destroying data structures between the check and access.
      
        103178
                ActiveReaderGuard reader_guard;
      
          2/2✓ Branch 7 → 8 taken 118 times.
✓ Branch 7 → 24 taken 103285 times.

        110510
                if (!s_cacheInitialized.load(std::memory_order_acquire))
      
                {
      
                    // Cache not initialized -- fall back to direct VirtualQuery
      
                    MEMORY_BASIC_INFORMATION mbi;
      
          1/2✗ Branch 9 → 10 not taken.
✓ Branch 9 → 11 taken 118 times.

        118
                    if (!VirtualQuery(address, &mbi, sizeof(mbi)))
      
        ✗
                        return false;
      
          2/2✓ Branch 11 → 12 taken 3 times.
✓ Branch 11 → 13 taken 115 times.

        118
                    if (mbi.State != MEM_COMMIT)
      
        3
                        return false;
      
          2/2✓ Branch 14 → 15 taken 3 times.
✓ Branch 14 → 16 taken 112 times.

        115
                    if (!check_permission(mbi.Protect))
      
        3
                        return false;
      
        112
                    const uintptr_t query_addr_val = reinterpret_cast<uintptr_t>(address);
      
        112
                    const uintptr_t region_start = reinterpret_cast<uintptr_t>(mbi.BaseAddress);
      
        112
                    const uintptr_t query_end = query_addr_val + size;
      
          2/2✓ Branch 16 → 17 taken 3 times.
✓ Branch 16 → 18 taken 109 times.

        112
                    if (query_end < query_addr_val)
      
        3
                        return false;
      
          2/4✓ Branch 18 → 19 taken 109 times.
✗ Branch 18 → 21 not taken.
✓ Branch 19 → 20 taken 109 times.
✗ Branch 19 → 21 not taken.

        109
                    return query_addr_val >= region_start && query_end <= region_start + mbi.RegionSize;
      
                }
      
                // Reader guard already active -- safe to access cache data structures
      
        100223
                const size_t shard_count = s_shardCount.load(std::memory_order_acquire);
      
          1/2✗ Branch 31 → 32 not taken.
✓ Branch 31 → 33 taken 100223 times.

        100223
                if (shard_count == 0)
      
        ✗
                    return false;
      
        100223
                const uintptr_t query_addr_val = reinterpret_cast<uintptr_t>(address);
      
        100223
                const size_t shard_idx = compute_shard_index(query_addr_val, shard_count);
      
        98317
                const uint64_t now_ns = current_time_ns();
      
        100317
                const uint64_t expiry_ns = static_cast<uint64_t>(s_configuredExpiryMs.load(std::memory_order_acquire)) * 1'000'000ULL;
      
                // Fast path: blocking shared lock for concurrent read access (multiple readers allowed)
      
                {
      
        100317
                    std::shared_lock<SrwSharedMutex> lock(*s_shardMutexes[shard_idx]);
      
        108597
                    CachedMemoryRegionInfo *cached_info = find_in_shard(
      
        112546
                        s_cacheShards[shard_idx],
      
                        query_addr_val, size, now_ns, expiry_ns);
      
          2/2✓ Branch 47 → 48 taken 106199 times.
✓ Branch 47 → 52 taken 143 times.

        106342
                    if (cached_info)
      
                    {
      
                        s_stats.cacheHits.fetch_add(1, std::memory_order_relaxed);
      
        106199
                        return check_permission(cached_info->protection);
      
                    }
      
          2/2✓ Branch 54 → 55 taken 143 times.
✓ Branch 54 → 60 taken 108819 times.

        103999
                }
      
                s_stats.cacheMisses.fetch_add(1, std::memory_order_relaxed);
      
                // Cache miss: call VirtualQuery with stampede coalescing
      
                MEMORY_BASIC_INFORMATION mbi;
      
          1/2✗ Branch 59 → 61 not taken.
✓ Branch 59 → 62 taken 143 times.

        143
                if (!query_and_update_cache(shard_idx, address, mbi))
      
        ✗
                    return false;
      
          2/2✓ Branch 62 → 63 taken 4 times.
✓ Branch 62 → 64 taken 139 times.

        143
                if (mbi.State != MEM_COMMIT)
      
        4
                    return false;
      
          2/2✓ Branch 65 → 66 taken 8 times.
✓ Branch 65 → 67 taken 131 times.

        139
                if (!check_permission(mbi.Protect))
      
        8
                    return false;
      
        131
                const uintptr_t region_start_addr = reinterpret_cast<uintptr_t>(mbi.BaseAddress);
      
        131
                const uintptr_t region_end_addr = region_start_addr + mbi.RegionSize;
      
        131
                const uintptr_t query_end_addr = query_addr_val + size;
      
          2/2✓ Branch 67 → 68 taken 4 times.
✓ Branch 67 → 69 taken 127 times.

        131
                if (query_end_addr < query_addr_val)
      
        4
                    return false;
      
          3/4✓ Branch 69 → 70 taken 127 times.
✗ Branch 69 → 72 not taken.
✓ Branch 70 → 71 taken 126 times.
✓ Branch 70 → 72 taken 1 time.

        127
                return query_addr_val >= region_start_addr && query_end_addr <= region_end_addr;
      
        109080
            }
      
        } // anonymous namespace
      
        99840
        bool DetourModKit::Memory::is_readable(const void *address, size_t size)
      
        {
      
        99840
            return check_memory_permission(address, size, check_read_permission);
      
        }
      
        3755
        bool DetourModKit::Memory::is_writable(void *address, size_t size)
      
        {
      
        3755
            return check_memory_permission(address, size, check_write_permission);
      
        }
      
        16
        /**
         * @brief Copies bytes into a target address, temporarily making the pages writable.
         * @details The target range is switched to PAGE_EXECUTE_READWRITE, the bytes are copied,
         *          and the previous protection is restored. Once the copy has happened the
         *          instruction cache is flushed and the region cache is invalidated regardless of
         *          whether the protection restore succeeds, because the memory contents (and
         *          possibly the protection) have already changed at that point.
         * @param targetAddress Destination of the write; must not be null.
         * @param sourceBytes Bytes to copy; may be null only when numBytes is zero.
         * @param numBytes Number of bytes to copy; zero is a logged no-op that succeeds.
         * @return Empty expected on success, otherwise:
         *         - MemoryError::NullTargetAddress if targetAddress is null,
         *         - MemoryError::NullSourceBytes if sourceBytes is null and numBytes > 0,
         *         - MemoryError::SizeTooLarge if numBytes exceeds MAX_WRITE_SIZE,
         *         - MemoryError::ProtectionChangeFailed if the pages could not be made writable
         *           (nothing was written),
         *         - MemoryError::ProtectionRestoreFailed if the original protection could not be
         *           restored (the bytes WERE written).
         */
        std::expected<void, MemoryError> DetourModKit::Memory::write_bytes(std::byte *targetAddress, const std::byte *sourceBytes, size_t numBytes)
        {
            auto &logger = Logger::get_instance();

            if (!targetAddress)
            {
                logger.error("write_bytes: Target address is null.");
                return std::unexpected(MemoryError::NullTargetAddress);
            }
            if (!sourceBytes && numBytes > 0)
            {
                logger.error("write_bytes: Source bytes pointer is null for non-zero numBytes.");
                return std::unexpected(MemoryError::NullSourceBytes);
            }
            if (numBytes == 0)
            {
                logger.warning("write_bytes: Number of bytes to write is zero. Operation has no effect.");
                return {};
            }
            if (numBytes > MAX_WRITE_SIZE)
            {
                logger.error("write_bytes: Requested size {} exceeds MAX_WRITE_SIZE ({}).", numBytes, MAX_WRITE_SIZE);
                return std::unexpected(MemoryError::SizeTooLarge);
            }

            DWORD old_protection_flags;
            if (!VirtualProtect(reinterpret_cast<LPVOID>(targetAddress), numBytes, PAGE_EXECUTE_READWRITE, &old_protection_flags))
            {
                // Capture the error code before any other call (formatting, logging) can
                // overwrite the thread's last-error value.
                const DWORD last_error = GetLastError();
                logger.error("write_bytes: VirtualProtect failed to set PAGE_EXECUTE_READWRITE at address {}. Windows Error: {}",
                             DetourModKit::Format::format_address(reinterpret_cast<uintptr_t>(targetAddress)), last_error);
                return std::unexpected(MemoryError::ProtectionChangeFailed);
            }

            memcpy(reinterpret_cast<void *>(targetAddress), reinterpret_cast<const void *>(sourceBytes), numBytes);

            DWORD temp_old_protect;
            const bool protection_restored =
                VirtualProtect(reinterpret_cast<LPVOID>(targetAddress), numBytes, old_protection_flags, &temp_old_protect) != 0;
            if (!protection_restored)
            {
                const DWORD last_error = GetLastError();
                logger.error("write_bytes: VirtualProtect failed to restore original protection ({}) at address {}. Windows Error: {}. Memory may remain writable!",
                             DetourModKit::Format::format_hex(static_cast<int>(old_protection_flags)),
                             DetourModKit::Format::format_address(reinterpret_cast<uintptr_t>(targetAddress)), last_error);
                // Do not return yet: the bytes are already in place, so the instruction cache
                // and the region cache must still be brought up to date below.
            }

            if (!FlushInstructionCache(GetCurrentProcess(), reinterpret_cast<LPCVOID>(targetAddress), numBytes))
            {
                const DWORD last_error = GetLastError();
                logger.warning("write_bytes: FlushInstructionCache failed for address {}. Windows Error: {}",
                               DetourModKit::Format::format_address(reinterpret_cast<uintptr_t>(targetAddress)), last_error);
            }

            // Cached protection data for this range may no longer match reality.
            Memory::invalidate_range(targetAddress, numBytes);

            if (!protection_restored)
                return std::unexpected(MemoryError::ProtectionRestoreFailed);

            logger.debug("write_bytes: Successfully wrote {} bytes to address {}.",
                         numBytes, DetourModKit::Format::format_address(reinterpret_cast<uintptr_t>(targetAddress)));
            return {};
        }
      
        14
        Memory::ReadableStatus DetourModKit::Memory::is_readable_nonblocking(const void *address, size_t size)
      
        {
      
          4/4✓ Branch 2 → 3 taken 13 times.
✓ Branch 2 → 4 taken 1 time.
✓ Branch 3 → 4 taken 1 time.
✓ Branch 3 → 5 taken 12 times.

        14
            if (!address || size == 0)
      
        2
                return ReadableStatus::NotReadable;
      
        12
            ActiveReaderGuard reader_guard;
      
          2/2✓ Branch 7 → 8 taken 2 times.
✓ Branch 7 → 23 taken 10 times.

        12
            if (!s_cacheInitialized.load(std::memory_order_acquire))
      
            {
      
                // Cache not initialized - fall back to direct VirtualQuery (blocking)
      
                MEMORY_BASIC_INFORMATION mbi;
      
          2/4✓ Branch 8 → 9 taken 2 times.
✗ Branch 8 → 62 not taken.
✗ Branch 9 → 10 not taken.
✓ Branch 9 → 11 taken 2 times.

        2
                if (!VirtualQuery(address, &mbi, sizeof(mbi)))
      
        ✗
                    return ReadableStatus::NotReadable;
      
          2/2✓ Branch 11 → 12 taken 1 time.
✓ Branch 11 → 13 taken 1 time.

        2
                if (mbi.State != MEM_COMMIT)
      
        1
                    return ReadableStatus::NotReadable;
      
          1/2✗ Branch 14 → 15 not taken.
✓ Branch 14 → 16 taken 1 time.

        1
                if (!check_read_permission(mbi.Protect))
      
        ✗
                    return ReadableStatus::NotReadable;
      
        1
                const uintptr_t query_addr_val = reinterpret_cast<uintptr_t>(address);
      
        1
                const uintptr_t region_start = reinterpret_cast<uintptr_t>(mbi.BaseAddress);
      
        1
                const uintptr_t query_end = query_addr_val + size;
      
          1/2✗ Branch 16 → 17 not taken.
✓ Branch 16 → 18 taken 1 time.

        1
                if (query_end < query_addr_val)
      
        ✗
                    return ReadableStatus::NotReadable;
      
          2/4✓ Branch 18 → 19 taken 1 time.
✗ Branch 18 → 21 not taken.
✓ Branch 19 → 20 taken 1 time.
✗ Branch 19 → 21 not taken.

        1
                if (query_addr_val >= region_start && query_end <= region_start + mbi.RegionSize)
      
        1
                    return ReadableStatus::Readable;
      
        ✗
                return ReadableStatus::NotReadable;
      
            }
      
        10
            const size_t shard_count = s_shardCount.load(std::memory_order_acquire);
      
          1/2✗ Branch 30 → 31 not taken.
✓ Branch 30 → 32 taken 10 times.

        10
            if (shard_count == 0)
      
        ✗
                return ReadableStatus::Unknown;
      
        10
            const uintptr_t query_addr_val = reinterpret_cast<uintptr_t>(address);
      
        10
            const size_t shard_idx = compute_shard_index(query_addr_val, shard_count);
      
        10
            const uint64_t now_ns = current_time_ns();
      
        10
            const uint64_t expiry_ns = static_cast<uint64_t>(s_configuredExpiryMs.load(std::memory_order_acquire)) * 1'000'000ULL;
      
            // Non-blocking: try_lock_shared to avoid stalling latency-sensitive threads
      
        10
            std::shared_lock<SrwSharedMutex> lock(*s_shardMutexes[shard_idx], std::try_to_lock);
      
          1/2✗ Branch 45 → 46 not taken.
✓ Branch 45 → 47 taken 10 times.

        10
            if (!lock.owns_lock())
      
        ✗
                return ReadableStatus::Unknown;
      
        10
            CachedMemoryRegionInfo *cached_info = find_in_shard(
      
        10
                s_cacheShards[shard_idx],
      
                query_addr_val, size, now_ns, expiry_ns);
      
          2/2✓ Branch 49 → 50 taken 6 times.
✓ Branch 49 → 57 taken 4 times.

        10
            if (cached_info)
      
            {
      
                s_stats.cacheHits.fetch_add(1, std::memory_order_relaxed);
      
        6
                return check_read_permission(cached_info->protection)
      
          2/2✓ Branch 53 → 54 taken 3 times.
✓ Branch 53 → 55 taken 3 times.

        6
                           ? ReadableStatus::Readable
      
        6
                           : ReadableStatus::NotReadable;
      
            }
      
            // Cache miss with non-blocking semantics: return Unknown rather than issuing VirtualQuery
      
        4
            return ReadableStatus::Unknown;
      
        12
        }
      
        11
        uintptr_t DetourModKit::Memory::read_ptr_unsafe(uintptr_t base, ptrdiff_t offset) noexcept
      
        {
      
        #ifdef _MSC_VER
      
            __try
      
            {
      
                return *reinterpret_cast<const uintptr_t *>(base + offset);
      
            }
      
            __except ((GetExceptionCode() == EXCEPTION_ACCESS_VIOLATION ||
      
                       GetExceptionCode() == STATUS_GUARD_PAGE_VIOLATION)
      
                          ? EXCEPTION_EXECUTE_HANDLER
      
                          : EXCEPTION_CONTINUE_SEARCH)
      
            {
      
                return 0;
      
            }
      
        #else
      
            // MinGW/GCC lacks __try/__except. Probe the cache with a trylock
      
            // to avoid a VirtualQuery syscall when the region is already cached.
      
            // Falls back to VirtualQuery on cache miss or when cache is off.
      
            // ActiveReaderGuard is required to prevent shutdown_cache() from
      
            // destroying shard vectors between our check and access.
      
        11
            const auto src = base + static_cast<uintptr_t>(offset);
      
            {
      
        11
                ActiveReaderGuard reader_guard;
      
          1/2✓ Branch 4 → 5 taken 11 times.
✗ Branch 4 → 40 not taken.

        11
                if (s_cacheInitialized.load(std::memory_order_acquire))
      
                {
      
        11
                    const size_t shard_count = s_shardCount.load(std::memory_order_acquire);
      
          1/2✓ Branch 12 → 13 taken 11 times.
✗ Branch 12 → 40 not taken.

        11
                    if (shard_count != 0)
      
                    {
      
        11
                        const size_t shard_idx = compute_shard_index(src, shard_count);
      
        11
                        std::shared_lock<SrwSharedMutex> lock(*s_shardMutexes[shard_idx], std::try_to_lock);
      
          1/2✓ Branch 18 → 19 taken 11 times.
✗ Branch 18 → 34 not taken.

        11
                        if (lock.owns_lock())
      
                        {
      
        11
                            const uint64_t now_ns = current_time_ns();
      
        11
                            const uint64_t expiry_ns = static_cast<uint64_t>(
      
        11
                                s_configuredExpiryMs.load(std::memory_order_acquire)) * 1'000'000ULL;
      
        11
                            CachedMemoryRegionInfo *cached = find_in_shard(
      
        11
                                s_cacheShards[shard_idx],
      
                                src, sizeof(uintptr_t), now_ns, expiry_ns);
      
          2/2✓ Branch 29 → 30 taken 1 time.
✓ Branch 29 → 34 taken 10 times.

        11
                            if (cached)
      
                            {
      
          1/2✓ Branch 31 → 32 taken 1 time.
✗ Branch 31 → 33 not taken.

        1
                                if (check_read_permission(cached->protection))
      
        1
                                    return *reinterpret_cast<const uintptr_t *>(src);
      
        ✗
                                return 0;
      
                            }
      
                        }
      
          2/2✓ Branch 36 → 37 taken 10 times.
✓ Branch 36 → 39 taken 1 time.

        11
                    }
      
                }
      
          2/2✓ Branch 42 → 43 taken 10 times.
✓ Branch 42 → 46 taken 1 time.

        11
            }
      
            // Cache miss, lock contention, or cache not initialized
      
            MEMORY_BASIC_INFORMATION mbi;
      
          1/2✗ Branch 45 → 47 not taken.
✓ Branch 45 → 48 taken 10 times.

        10
            if (!VirtualQuery(reinterpret_cast<const void *>(src), &mbi, sizeof(mbi)))
      
        ✗
                return 0;
      
          2/2✓ Branch 48 → 49 taken 3 times.
✓ Branch 48 → 50 taken 7 times.

        10
            if (mbi.State != MEM_COMMIT)
      
        3
                return 0;
      
          2/2✓ Branch 50 → 51 taken 6 times.
✓ Branch 50 → 52 taken 1 time.

        7
            if ((mbi.Protect & CachePermissions::READ_PERMISSION_FLAGS) == 0 ||
      
          2/2✓ Branch 51 → 52 taken 1 time.
✓ Branch 51 → 53 taken 5 times.

        6
                (mbi.Protect & CachePermissions::NOACCESS_GUARD_FLAGS) != 0)
      
        2
                return 0;
      
            // Verify the full read fits within the committed region (overflow-safe)
      
        5
            const uintptr_t region_start = reinterpret_cast<uintptr_t>(mbi.BaseAddress);
      
        5
            const uintptr_t region_end = region_start + mbi.RegionSize;
      
        5
            const uintptr_t read_end = src + sizeof(uintptr_t);
      
          3/6✓ Branch 53 → 54 taken 5 times.
✗ Branch 53 → 56 not taken.
✓ Branch 54 → 55 taken 5 times.
✗ Branch 54 → 56 not taken.
✗ Branch 55 → 56 not taken.
✓ Branch 55 → 57 taken 5 times.

        5
            if (read_end < src || src < region_start || read_end > region_end)
      
        ✗
                return 0;
      
        5
            return *reinterpret_cast<const uintptr_t *>(src);
      
        #endif
      
        }