// Source: root/src/core/core_timing.cpp (blob ac117161c0e3ccaec4c12d92bee243ef6159e964)

                                                               
 
                    
                

                 
 
                                
                          
                             
                                  
                                     
 
                        
 
                                      
 



                                                                                    
                          
             
                   
                             
                                  
 




                                                                                             
 



                                                                                             
 

                                                                                             
 
                                    
 
                                                    


                                              
                                                                       

                              
                               
 
 
                                                                      
                                                
                      
                          
              
                                                                                      
                                                               
                       




                                                                              
     

 
                             
                     
                         
     
                                                




                                         
     
                           
                         
                        

 
                                         
                                            










                                                                     
 
 
                                             
                                            
                                                                     
               
     













                                                                                                    
         
     


                                    
                                                         


                                           
                                            
                                

 
                                                                       

                                                                            
 
                                            


                                                                                       
 



                                                                             
     

 

                                                                              
                                            
                                                                                                 
                                                                                   
       
 


                                                                                
                                                                                 
     

 

                                             
                                         

 

                               
                                                             
                                                                                           


                                 






                                 

 
                                     



                                     

 
                                       



                                         


                                       
                                            


                        
                                                                            
                                            



                                                                                                 
 


                                                                                
                                                                                 
     

 
                                          
                                             
 
                                            

                                                                              
                                                                                
                               
                             
 
                                                     
                                                   

                                                                                            

         
                           
                                                 
     
 
                               
                                                                      

                         
                            
     

 
                               
                                                                                

                            
                                              

                                             

                                                                                                 
                                                            
                                                                          
                 
                    
                                                        
                                                    
             
         
                                                










                                                                                      
     
 
 
                                                              


                                  
                             

 
                                                               


                                  
                             

 
                           
// SPDX-FileCopyrightText: Copyright 2020 yuzu Emulator Project
// SPDX-License-Identifier: GPL-2.0-or-later

#include <algorithm>
#include <mutex>
#include <string>
#include <tuple>

#include "common/microprofile.h"
#include "common/thread.h"
#include "core/core_timing.h"
#include "core/core_timing_util.h"
#include "core/hardware_properties.h"

namespace Core::Timing {

// Value that CoreTiming::ResetTicks() loads into `downcount`.
// NOTE(review): presumably expressed in emulated CPU ticks -- confirm against the users of downcount.
constexpr s64 MAX_SLICE_LENGTH = 4000;

std::shared_ptr<EventType> CreateEvent(std::string name, TimedCallback&& callback) {
    return std::make_shared<EventType>(std::move(callback), std::move(name));
}

/// A single entry of the pending-event queue.
struct CoreTiming::Event {
    /// Absolute deadline, in nanoseconds of global time.
    u64 time;
    /// Insertion sequence number; breaks ties between events sharing a deadline.
    u64 fifo_order;
    /// Opaque value handed back to the callback.
    std::uintptr_t user_data;
    /// Weak link to the event type; the entry does not keep the type alive.
    std::weak_ptr<EventType> type;

    // Ordering is by deadline first; events with equal deadlines are ordered
    // by the sequence in which they were queued.
    friend bool operator>(const Event& left, const Event& right) {
        if (left.time != right.time) {
            return left.time > right.time;
        }
        return left.fifo_order > right.fifo_order;
    }

    friend bool operator<(const Event& left, const Event& right) {
        if (left.time != right.time) {
            return left.time < right.time;
        }
        return left.fifo_order < right.fifo_order;
    }
};

/// Constructs the timing core and creates its clock from the hardware base
/// clock rate and counter frequency constants.
CoreTiming::CoreTiming()
    : clock{Common::CreateBestMatchingClock(Hardware::BASE_CLOCK_RATE, Hardware::CNTFREQ)} {}

// Defaulted out of line.
// NOTE(review): presumably defined here because some member types (e.g. Event) are only
// complete in this translation unit -- confirm against the header.
CoreTiming::~CoreTiming() = default;

/// Entry point of a host timing worker thread.
/// Registers the thread with the profiler, names it, raises its priority,
/// runs the user-supplied init hook and then services events until ThreadLoop() returns.
void CoreTiming::ThreadEntry(CoreTiming& instance) {
    constexpr char thread_name[] = "yuzu:HostTiming";

    // Per-thread setup.
    MicroProfileOnThreadCreate(thread_name);
    Common::SetCurrentThreadName(thread_name);
    Common::SetCurrentThreadPriority(Common::ThreadPriority::Critical);

    // Hook installed through Initialize(), followed by the actual work loop.
    instance.on_thread_init();
    instance.ThreadLoop();

    MicroProfileOnThreadExit();
}

/// Resets the timing state and, in multicore mode, starts the worker threads.
/// @param on_thread_init_ Hook each worker thread invokes before entering its loop.
void CoreTiming::Initialize(std::function<void()>&& on_thread_init_) {
    on_thread_init = std::move(on_thread_init_);

    // Start from a clean slate.
    event_fifo_id = 0;
    shutting_down = false;
    ticks = 0;

    // Placeholder event type whose callback does nothing.
    ev_lost = CreateEvent("_lost_event", [](std::uintptr_t, std::chrono::nanoseconds) {});

    if (!is_multicore) {
        return;
    }

    // One worker is always started; a second one is added when the host
    // reports more than 8 hardware threads.
    const auto host_thread_count = std::thread::hardware_concurrency();
    worker_threads.emplace_back(ThreadEntry, std::ref(*this));
    if (host_thread_count > 8) {
        worker_threads.emplace_back(ThreadEntry, std::ref(*this));
    }
}

/// Stops all worker threads, waits for them to exit and drops every pending event.
void CoreTiming::Shutdown() {
    // Raise both flags first so that woken workers observe them.
    is_paused = true;
    shutting_down = true;

    {
        // Wake workers blocked on either condition variable while holding the queue lock.
        std::scoped_lock wake_guard(event_mutex);
        event_cv.notify_all();
        wait_pause_cv.notify_all();
    }

    std::for_each(worker_threads.begin(), worker_threads.end(),
                  [](auto& worker) { worker.join(); });
    worker_threads.clear();

    ClearPendingEvents();
    has_started = false;
}

/// Requests a pause or resume without waiting for the worker threads to react.
/// Does nothing when the requested state equals the recorded one.
void CoreTiming::Pause(bool is_paused_) {
    std::scoped_lock state_guard(event_mutex);

    const bool recorded_state = paused_state.load(std::memory_order_relaxed);
    if (recorded_state == is_paused_) {
        return;
    }

    if (is_multicore) {
        is_paused = is_paused_;
        // Kick workers out of their event wait so they re-check the flag.
        event_cv.notify_all();
        if (!is_paused_) {
            // Resuming: release workers parked on the pause condition.
            wait_pause_cv.notify_all();
        }
    }

    paused_state.store(is_paused_, std::memory_order_relaxed);
}

/// Requests a pause or resume and, in multicore mode, blocks until every
/// worker thread has parked (pause) or left the parked state (resume).
/// Does nothing when the requested state equals the recorded one.
void CoreTiming::SyncPause(bool is_paused_) {
    std::unique_lock main_lock(event_mutex);

    const bool recorded_state = paused_state.load(std::memory_order_relaxed);
    if (recorded_state == is_paused_) {
        return;
    }

    // Single-core mode has no workers to signal or wait for.
    if (!is_multicore) {
        paused_state.store(is_paused_, std::memory_order_relaxed);
        return;
    }

    is_paused = is_paused_;
    event_cv.notify_all();
    if (!is_paused_) {
        wait_pause_cv.notify_all();
    }
    paused_state.store(is_paused_, std::memory_order_relaxed);

    // Wait for the workers to acknowledge through pause_count.
    if (is_paused_) {
        wait_signal_cv.wait(main_lock, [this] { return pause_count == worker_threads.size(); });
        return;
    }
    wait_signal_cv.wait(main_lock, [this] { return pause_count == 0; });
}

/// Reports whether the recorded pause state is currently "not paused".
bool CoreTiming::IsRunning() const {
    const bool currently_paused = paused_state.load(std::memory_order_acquire);
    return !currently_paused;
}

/// Returns true when at least one event is queued. Takes the queue lock.
bool CoreTiming::HasPendingEvents() const {
    std::scoped_lock queue_guard(event_mutex);
    const bool queue_is_empty = event_queue.empty();
    return !queue_is_empty;
}

void CoreTiming::ScheduleEvent(std::chrono::nanoseconds ns_into_future,
                               const std::shared_ptr<EventType>& event_type,
                               std::uintptr_t user_data) {

    std::unique_lock main_lock(event_mutex);
    const u64 timeout = static_cast<u64>((GetGlobalTimeNs() + ns_into_future).count());

    event_queue.emplace_back(Event{timeout, event_fifo_id++, user_data, event_type});

    std::push_heap(event_queue.begin(), event_queue.end(), std::greater<>());

    if (is_multicore) {
        event_cv.notify_one();
    }
}

/// Removes every queued event that refers to `event_type` and carries `user_data`.
void CoreTiming::UnscheduleEvent(const std::shared_ptr<EventType>& event_type,
                                 std::uintptr_t user_data) {
    std::scoped_lock queue_guard(event_mutex);

    const auto is_target = [&](const Event& queued) {
        const auto queued_type = queued.type.lock();
        return queued_type.get() == event_type.get() && queued.user_data == user_data;
    };
    const auto first_removed = std::remove_if(event_queue.begin(), event_queue.end(), is_target);

    // Nothing matched: the heap is untouched.
    if (first_removed == event_queue.end()) {
        return;
    }

    // Dropping arbitrary entries destroys the heap ordering, so rebuild it.
    event_queue.erase(first_removed, event_queue.end());
    std::make_heap(event_queue.begin(), event_queue.end(), std::greater<>());
}

/// Advances the emulated tick counter and consumes the same amount from the
/// current slice budget.
/// @param ticks_to_add Number of ticks that have just elapsed.
void CoreTiming::AddTicks(u64 ticks_to_add) {
    ticks += ticks_to_add;
    // Charge only the ticks that were just added. Subtracting the running
    // total `ticks` would drain the budget set by ResetTicks() after the
    // first call instead of after MAX_SLICE_LENGTH ticks.
    downcount -= static_cast<s64>(ticks_to_add);
}

void CoreTiming::Idle() {
    if (!event_queue.empty()) {
        const u64 next_event_time = event_queue.front().time;
        const u64 next_ticks = nsToCycles(std::chrono::nanoseconds(next_event_time)) + 10U;
        if (next_ticks > ticks) {
            ticks = next_ticks;
        }
        return;
    }
    ticks += 1000U;
}

/// Reloads `downcount` with MAX_SLICE_LENGTH.
void CoreTiming::ResetTicks() {
    downcount = MAX_SLICE_LENGTH;
}

/// Returns the CPU tick count: the internal tick counter in single-core mode,
/// the clock's CPU cycle count in multicore mode.
u64 CoreTiming::GetCPUTicks() const {
    if (!is_multicore) {
        return ticks;
    }
    return clock->GetCPUCycles();
}

/// Returns the clock tick count: the internal tick counter converted with
/// CpuCyclesToClockCycles() in single-core mode, the clock's own cycle count
/// in multicore mode.
u64 CoreTiming::GetClockTicks() const {
    if (!is_multicore) {
        return CpuCyclesToClockCycles(ticks);
    }
    return clock->GetClockCycles();
}

/// Discards every queued event while holding the queue lock.
void CoreTiming::ClearPendingEvents() {
    std::scoped_lock queue_guard(event_mutex);
    event_queue.clear();
}

/// Removes every queued event that refers to `event_type`, regardless of its user data.
void CoreTiming::RemoveEvent(const std::shared_ptr<EventType>& event_type) {
    std::scoped_lock queue_guard(event_mutex);

    const auto is_target = [&](const Event& queued) {
        const auto queued_type = queued.type.lock();
        return queued_type.get() == event_type.get();
    };
    const auto first_removed = std::remove_if(event_queue.begin(), event_queue.end(), is_target);

    // Nothing matched: the heap is untouched.
    if (first_removed == event_queue.end()) {
        return;
    }

    // Dropping arbitrary entries destroys the heap ordering, so rebuild it.
    event_queue.erase(first_removed, event_queue.end());
    std::make_heap(event_queue.begin(), event_queue.end(), std::greater<>());
}

/// Runs the callback of every queued event whose deadline has been reached.
///
/// Callbacks are invoked with the queue lock released (so they may schedule or
/// unschedule events) and with the event type's own guard held.
///
/// @return Nanoseconds from the last sampled global time until the earliest
///         remaining event, or std::nullopt when the queue is empty.
std::optional<s64> CoreTiming::Advance() {
    std::unique_lock main_lock(event_mutex);

    // Sampled under the lock: more than one worker thread can run Advance(),
    // and global_timer is shared between them.
    global_timer = GetGlobalTimeNs().count();

    while (!event_queue.empty() && event_queue.front().time <= global_timer) {
        // Detach the earliest event from the heap before running it.
        Event evt = std::move(event_queue.front());
        std::pop_heap(event_queue.begin(), event_queue.end(), std::greater<>());
        event_queue.pop_back();

        // Release through the guard (not the raw mutex) so the guard's ownership
        // state stays accurate if the callback throws.
        main_lock.unlock();

        // Skip events whose type has been destroyed since they were scheduled.
        if (const auto event_type{evt.type.lock()}) {
            std::unique_lock lk(event_type->guard);
            // The second argument is how late the event fires relative to its deadline.
            event_type->callback(evt.user_data, std::chrono::nanoseconds{static_cast<s64>(
                                                    GetGlobalTimeNs().count() - evt.time)});
        }

        main_lock.lock();
        global_timer = GetGlobalTimeNs().count();
    }

    if (event_queue.empty()) {
        return std::nullopt;
    }

    const s64 next_time = event_queue.front().time - global_timer;
    return next_time;
}

/// Body of a worker thread: services events while running and parks while paused.
///
/// While neither paused nor shutting down, the thread repeatedly calls Advance()
/// and then waits on event_cv. Once paused it registers itself in pause_count and
/// blocks on wait_pause_cv until it is resumed or shut down.
void CoreTiming::ThreadLoop() {
    // Wake-up condition for the event waits below: something is queued, or a pause was requested.
    const auto predicate = [this] { return !event_queue.empty() || is_paused; };
    has_started = true;
    // NOTE(review): is_paused and shutting_down are read here without holding event_mutex;
    // whether that is safe depends on their declared types, which are not visible in this file.
    while (!shutting_down) {
        while (!is_paused && !shutting_down) {
            const auto next_time = Advance();
            if (next_time) {
                // Events remain; next_time is the delay until the earliest one.
                if (*next_time > 0) {
                    std::chrono::nanoseconds next_time_ns = std::chrono::nanoseconds(*next_time);
                    std::unique_lock main_lock(event_mutex);
                    // NOTE(review): Advance() only returns a value when the queue was non-empty,
                    // so unless the queue was drained in between, `predicate` is already true and
                    // wait_for returns without blocking, i.e. this loop spins until the event is
                    // due. Confirm whether busy-waiting is intended here.
                    event_cv.wait_for(main_lock, next_time_ns, predicate);
                }
            } else {
                // Queue is empty: block until an event is scheduled or a pause is requested.
                std::unique_lock main_lock(event_mutex);
                event_cv.wait(main_lock, predicate);
            }
        }
        std::unique_lock main_lock(event_mutex);
        // Register this thread as parked; the last thread to park pauses the clock and
        // signals wait_signal_cv (which SyncPause(true) waits on).
        pause_count++;
        if (pause_count == worker_threads.size()) {
            clock->Pause(true);
            wait_signal_cv.notify_all();
        }
        // Stay parked until resumed or shut down.
        wait_pause_cv.wait(main_lock, [this] { return !is_paused || shutting_down; });
        // The last thread to leave the parked state resumes the clock and signals
        // wait_signal_cv (which SyncPause(false) waits on).
        pause_count--;
        if (pause_count == 0) {
            clock->Pause(false);
            wait_signal_cv.notify_all();
        }
    }
}

/// Returns the current global time in nanoseconds: derived from the internal
/// tick counter in single-core mode, read from the clock in multicore mode.
std::chrono::nanoseconds CoreTiming::GetGlobalTimeNs() const {
    if (!is_multicore) {
        return CyclesToNs(ticks);
    }
    return clock->GetTimeNS();
}

/// Returns the current global time in microseconds: derived from the internal
/// tick counter in single-core mode, read from the clock in multicore mode.
std::chrono::microseconds CoreTiming::GetGlobalTimeUs() const {
    if (!is_multicore) {
        return CyclesToUs(ticks);
    }
    return clock->GetTimeUS();
}

} // namespace Core::Timing