Debugging: Add minimalist PPC profiler

This commit is contained in:
Exzap 2023-06-25 08:38:25 +02:00
parent 45072fccb2
commit 9499870cc9
7 changed files with 281 additions and 43 deletions

View File

@ -83,6 +83,20 @@ RPLStoredSymbol* rplSymbolStorage_getByAddress(MPTR address)
return rplSymbolStorage.map_symbolByAddress[address]; return rplSymbolStorage.map_symbolByAddress[address];
} }
RPLStoredSymbol* rplSymbolStorage_getByClosestAddress(MPTR address)
{
// highly inefficient but doesn't matter for now
std::unique_lock<std::mutex> lck(rplSymbolStorage.m_symbolStorageMutex);
for(uint32 i=0; i<4096; i++)
{
RPLStoredSymbol* symbol = rplSymbolStorage.map_symbolByAddress[address];
if(symbol)
return symbol;
address -= 4;
}
return nullptr;
}
void rplSymbolStorage_remove(RPLStoredSymbol* storedSymbol) void rplSymbolStorage_remove(RPLStoredSymbol* storedSymbol)
{ {
std::unique_lock<std::mutex> lck(rplSymbolStorage.m_symbolStorageMutex); std::unique_lock<std::mutex> lck(rplSymbolStorage.m_symbolStorageMutex);

View File

@ -12,6 +12,7 @@ RPLStoredSymbol* rplSymbolStorage_store(const char* libName, const char* symbolN
void rplSymbolStorage_remove(RPLStoredSymbol* storedSymbol); void rplSymbolStorage_remove(RPLStoredSymbol* storedSymbol);
void rplSymbolStorage_removeRange(MPTR address, sint32 length); void rplSymbolStorage_removeRange(MPTR address, sint32 length);
RPLStoredSymbol* rplSymbolStorage_getByAddress(MPTR address); RPLStoredSymbol* rplSymbolStorage_getByAddress(MPTR address);
RPLStoredSymbol* rplSymbolStorage_getByClosestAddress(MPTR address);
void rplSymbolStorage_createJumpProxySymbol(MPTR jumpAddress, MPTR destAddress); void rplSymbolStorage_createJumpProxySymbol(MPTR jumpAddress, MPTR destAddress);
std::unordered_map<uint32, RPLStoredSymbol*>& rplSymbolStorage_lockSymbolMap(); std::unordered_map<uint32, RPLStoredSymbol*>& rplSymbolStorage_lockSymbolMap();

View File

@ -812,17 +812,21 @@ namespace coreinit
return suspendCounter > 0; return suspendCounter > 0;
} }
bool OSIsThreadRunningNoLock(OSThread_t* thread)
{
cemu_assert_debug(__OSHasSchedulerLock());
return thread->state == OSThread_t::THREAD_STATE::STATE_RUNNING;
}
bool OSIsThreadRunning(OSThread_t* thread) bool OSIsThreadRunning(OSThread_t* thread)
{ {
bool isRunning = false; bool isRunning = false;
__OSLockScheduler(); __OSLockScheduler();
if (thread->state == OSThread_t::THREAD_STATE::STATE_RUNNING) isRunning = OSIsThreadRunningNoLock(thread);
isRunning = true;
__OSUnlockScheduler(); __OSUnlockScheduler();
return isRunning; return isRunning;
} }
void OSCancelThread(OSThread_t* thread) void OSCancelThread(OSThread_t* thread)
{ {
__OSLockScheduler(); __OSLockScheduler();

View File

@ -538,6 +538,7 @@ namespace coreinit
bool OSIsThreadTerminated(OSThread_t* thread); bool OSIsThreadTerminated(OSThread_t* thread);
bool OSIsThreadSuspended(OSThread_t* thread); bool OSIsThreadSuspended(OSThread_t* thread);
bool OSIsThreadRunningNoLock(OSThread_t* thread);
bool OSIsThreadRunning(OSThread_t* thread); bool OSIsThreadRunning(OSThread_t* thread);
// OSThreadQueue // OSThreadQueue
@ -603,6 +604,8 @@ namespace coreinit
void __OSAddReadyThreadToRunQueue(OSThread_t* thread); void __OSAddReadyThreadToRunQueue(OSThread_t* thread);
bool __OSCoreShouldSwitchToThread(OSThread_t* currentThread, OSThread_t* newThread); bool __OSCoreShouldSwitchToThread(OSThread_t* currentThread, OSThread_t* newThread);
void __OSQueueThreadDeallocation(OSThread_t* thread); void __OSQueueThreadDeallocation(OSThread_t* thread);
bool __OSIsThreadActive(OSThread_t* thread);
} }
#pragma pack() #pragma pack()

View File

@ -0,0 +1,118 @@
#pragma once
#include <wx/event.h>
#include <wx/progdlg.h>
#include <wx/thread.h>
#include "util/helpers/Semaphore.h"
wxDEFINE_EVENT(wxEVT_CREATE_PROGRESS_DIALOG, wxThreadEvent);
wxDEFINE_EVENT(wxEVT_DESTROY_PROGRESS_DIALOG, wxThreadEvent);
wxDEFINE_EVENT(wxEVT_UPDATE_PROGRESS_DIALOG, wxThreadEvent);
// wrapper for wxGenericProgressDialog which can be used from any thread
class wxProgressDialogManager : public wxEvtHandler
{
public:
wxProgressDialogManager(wxWindow* parent) : m_parent(parent), m_dialog(nullptr)
{
Bind(wxEVT_CREATE_PROGRESS_DIALOG, &wxProgressDialogManager::OnCreateProgressDialog, this);
Bind(wxEVT_DESTROY_PROGRESS_DIALOG, &wxProgressDialogManager::OnDestroyProgressDialog, this);
Bind(wxEVT_UPDATE_PROGRESS_DIALOG, &wxProgressDialogManager::OnUpdateProgressDialog, this);
}
~wxProgressDialogManager()
{
if (m_dialog)
Destroy();
}
void Create(const wxString& title, const wxString& message, int maximum, int style = wxPD_APP_MODAL | wxPD_ELAPSED_TIME | wxPD_REMAINING_TIME)
{
m_instanceSemaphore.increment();
m_isCancelled = false;
m_isSkipped = false;
wxThreadEvent event(wxEVT_CREATE_PROGRESS_DIALOG);
event.SetString(title);
event.SetInt(maximum);
event.SetExtraLong(style);
wxQueueEvent(this, event.Clone());
}
void Destroy()
{
wxThreadEvent event(wxEVT_DESTROY_PROGRESS_DIALOG);
wxQueueEvent(this, event.Clone());
m_instanceSemaphore.waitUntilZero(); // wait until destruction is complete
}
// this also updates the cancel and skip state
void Update(int value, const wxString& newmsg = wxEmptyString)
{
wxThreadEvent event(wxEVT_UPDATE_PROGRESS_DIALOG);
event.SetInt(value);
event.SetString(newmsg);
wxQueueEvent(this, event.Clone());
}
bool IsCancelled() const
{
return m_isCancelled;
}
bool IsSkipped() const
{
return m_isSkipped;
}
bool IsCancelledOrSkipped() const
{
return m_isCancelled || m_isSkipped;
}
private:
void OnCreateProgressDialog(wxThreadEvent& event)
{
if (m_dialog)
{
m_dialog->Destroy();
m_instanceSemaphore.waitUntilZero();
}
m_maximum = event.GetInt();
m_dialog = new wxGenericProgressDialog(event.GetString(), "Please wait...", m_maximum, m_parent, event.GetExtraLong());
}
void OnDestroyProgressDialog(wxThreadEvent& event)
{
if (m_dialog)
{
m_dialog->Destroy();
m_dialog = nullptr;
m_instanceSemaphore.decrement();
}
}
void OnUpdateProgressDialog(wxThreadEvent& event)
{
if (m_dialog)
{
// make sure that progress is never >= maximum
// because wxGenericProgressDialog seems to become crashy on destruction otherwise
int progress = event.GetInt();
if(progress >= m_maximum)
progress = m_maximum - 1;
bool wasSkipped = false;
bool r = m_dialog->Update(progress, event.GetString(), &wasSkipped);
if(!r)
m_isCancelled = true;
if(wasSkipped)
m_isSkipped = true;
}
}
wxWindow* m_parent;
wxGenericProgressDialog* m_dialog;
bool m_isCancelled{false};
bool m_isSkipped{false};
int m_maximum{0};
CounterSemaphore m_instanceSemaphore; // used to synchronize destruction of the dialog
};

View File

@ -5,6 +5,8 @@
#include "Cafe/OS/RPL/rpl.h" #include "Cafe/OS/RPL/rpl.h"
#include "Cafe/OS/RPL/rpl_symbol_storage.h" #include "Cafe/OS/RPL/rpl_symbol_storage.h"
#include "gui/components/wxProgressDialogManager.h"
#include <cinttypes> #include <cinttypes>
enum enum
@ -23,17 +25,18 @@ enum
THREADLIST_MENU_SUSPEND, THREADLIST_MENU_SUSPEND,
THREADLIST_MENU_RESUME, THREADLIST_MENU_RESUME,
THREADLIST_MENU_DUMP_STACK_TRACE, THREADLIST_MENU_DUMP_STACK_TRACE,
THREADLIST_MENU_PROFILE_THREAD,
}; };
wxBEGIN_EVENT_TABLE(DebugPPCThreadsWindow, wxFrame) wxBEGIN_EVENT_TABLE(DebugPPCThreadsWindow, wxFrame)
EVT_BUTTON(CLOSE_ID,DebugPPCThreadsWindow::OnCloseButton) EVT_BUTTON(CLOSE_ID, DebugPPCThreadsWindow::OnCloseButton)
EVT_BUTTON(REFRESH_ID,DebugPPCThreadsWindow::OnRefreshButton) EVT_BUTTON(REFRESH_ID, DebugPPCThreadsWindow::OnRefreshButton)
EVT_CLOSE(DebugPPCThreadsWindow::OnClose) EVT_CLOSE(DebugPPCThreadsWindow::OnClose)
wxEND_EVENT_TABLE() wxEND_EVENT_TABLE()
DebugPPCThreadsWindow::DebugPPCThreadsWindow(wxFrame& parent) DebugPPCThreadsWindow::DebugPPCThreadsWindow(wxFrame& parent)
: wxFrame(&parent, wxID_ANY, _("PPC threads"), wxDefaultPosition, wxSize(930, 280), wxCLOSE_BOX | wxCLIP_CHILDREN | wxCAPTION | wxRESIZE_BORDER) : wxFrame(&parent, wxID_ANY, _("PPC threads"), wxDefaultPosition, wxSize(930, 280),
wxCLOSE_BOX | wxCLIP_CHILDREN | wxCAPTION | wxRESIZE_BORDER)
{ {
wxFrame::SetBackgroundColour(*wxWHITE); wxFrame::SetBackgroundColour(*wxWHITE);
@ -158,7 +161,6 @@ void DebugPPCThreadsWindow::OnTimer(wxTimerEvent& event)
RefreshThreadList(); RefreshThreadList();
} }
#define _r(__idx) _swapEndianU32(cafeThread->context.gpr[__idx]) #define _r(__idx) _swapEndianU32(cafeThread->context.gpr[__idx])
void DebugPPCThreadsWindow::RefreshThreadList() void DebugPPCThreadsWindow::RefreshThreadList()
@ -278,30 +280,126 @@ void DebugLogStackTrace(OSThread_t* thread, MPTR sp);
void DebugPPCThreadsWindow::DumpStackTrace(OSThread_t* thread) void DebugPPCThreadsWindow::DumpStackTrace(OSThread_t* thread)
{ {
cemuLog_log(LogType::Force, fmt::format("Dumping stack trace for thread {0:08x} LR: {1:08x}", memory_getVirtualOffsetFromPointer(thread), _swapEndianU32(thread->context.lr))); cemuLog_log(LogType::Force, fmt::format("Dumping stack trace for thread {0:08x} LR: {1:08x}",
memory_getVirtualOffsetFromPointer(thread),
_swapEndianU32(thread->context.lr)));
DebugLogStackTrace(thread, _swapEndianU32(thread->context.gpr[1])); DebugLogStackTrace(thread, _swapEndianU32(thread->context.gpr[1]));
} }
void DebugPPCThreadsWindow::PresentProfileResults(OSThread_t* thread, const std::unordered_map<VAddr, uint32>& samples)
{
std::vector<std::pair<VAddr, uint32>> sortedSamples;
// count samples
uint32 totalSampleCount = 0;
for (auto& sample : samples)
totalSampleCount += sample.second;
cemuLog_log(LogType::Force, "--- Thread {:08x} profile results with {:} samples captured ---",
MEMPTR<OSThread_t>(thread).GetMPTR(), totalSampleCount);
cemuLog_log(LogType::Force, "Exclusive time, grouped by function:");
// print samples grouped by function
sortedSamples.clear();
for (auto& sample : samples)
{
RPLStoredSymbol* symbol = rplSymbolStorage_getByClosestAddress(sample.first);
VAddr sampleAddr = sample.first;
if (symbol)
sampleAddr = symbol->address;
auto it = std::find_if(sortedSamples.begin(), sortedSamples.end(),
[sampleAddr](const std::pair<VAddr, uint32>& a) { return a.first == sampleAddr; });
if (it != sortedSamples.end())
it->second += sample.second;
else
sortedSamples.push_back(std::make_pair(sampleAddr, sample.second));
}
std::sort(sortedSamples.begin(), sortedSamples.end(),
[](const std::pair<VAddr, uint32>& a, const std::pair<VAddr, uint32>& b) { return a.second > b.second; });
for (auto& sample : sortedSamples)
{
if (sample.second < 3)
continue;
VAddr sampleAddr = sample.first;
RPLStoredSymbol* symbol = rplSymbolStorage_getByClosestAddress(sample.first);
std::string strName;
if (symbol)
{
strName = fmt::format("{}.{}+0x{:x}", (const char*)symbol->libName, (const char*)symbol->symbolName,
sampleAddr - symbol->address);
}
else
strName = "Unknown";
cemuLog_log(LogType::Force, "[{:08x}] {:8.2f}% (Samples: {:5}) Symbol: {}", sample.first,
(double)(sample.second * 100) / (double)totalSampleCount, sample.second, strName);
}
}
void DebugPPCThreadsWindow::ProfileThreadWorker(OSThread_t* thread)
{
wxProgressDialogManager progressDialog(this);
progressDialog.Create("Profiling thread",
_("Capturing samples..."),
1000, // range
wxPD_CAN_SKIP);
std::unordered_map<VAddr, uint32> samples;
// loop for one minute
uint64 startTime = std::chrono::duration_cast<std::chrono::milliseconds>(
std::chrono::system_clock::now().time_since_epoch())
.count();
uint32 totalSampleCount = 0;
while (true)
{
// suspend thread
coreinit::OSSuspendThread(thread);
// wait until thread is not running anymore
__OSLockScheduler();
while (coreinit::OSIsThreadRunningNoLock(thread))
{
__OSUnlockScheduler();
std::this_thread::sleep_for(std::chrono::milliseconds(1));
__OSLockScheduler();
}
uint32 sampleIP = thread->context.srr0;
__OSUnlockScheduler();
coreinit::OSResumeThread(thread);
// count sample
samples[sampleIP]++;
totalSampleCount++;
if ((totalSampleCount % 50) == 0)
{
wxString msg = fmt::format("Capturing samples... ({:})\nResults will be written to log.txt\n",
totalSampleCount);
if (totalSampleCount < 30000)
msg.Append(_("Click Skip button for early results with lower accuracy"));
else
msg.Append(_("Click Skip button to finish"));
progressDialog.Update(totalSampleCount * 1000 / 30000, msg);
if (progressDialog.IsCancelledOrSkipped())
break;
}
std::this_thread::sleep_for(std::chrono::milliseconds(1));
}
PresentProfileResults(thread, samples);
progressDialog.Destroy();
}
void DebugPPCThreadsWindow::ProfileThread(OSThread_t* thread)
{
std::thread profileThread(&DebugPPCThreadsWindow::ProfileThreadWorker, this, thread);
profileThread.detach();
}
void DebugPPCThreadsWindow::OnThreadListPopupClick(wxCommandEvent& evt) void DebugPPCThreadsWindow::OnThreadListPopupClick(wxCommandEvent& evt)
{ {
MPTR threadMPTR = (MPTR)(size_t)static_cast<wxMenu *>(evt.GetEventObject())->GetClientData(); MPTR threadMPTR = (MPTR)(size_t) static_cast<wxMenu*>(evt.GetEventObject())->GetClientData();
// check if thread is still active
bool threadIsActive = false;
srwlock_activeThreadList.LockWrite();
for (sint32 i = 0; i < activeThreadCount; i++)
{
MPTR threadItrMPTR = activeThread[i];
if (threadItrMPTR == threadMPTR)
{
threadIsActive = true;
break;
}
}
srwlock_activeThreadList.UnlockWrite();
if (threadIsActive == false)
return;
// handle command
OSThread_t* osThread = (OSThread_t*)memory_getPointerFromVirtualOffset(threadMPTR); OSThread_t* osThread = (OSThread_t*)memory_getPointerFromVirtualOffset(threadMPTR);
__OSLockScheduler();
if (!coreinit::__OSIsThreadActive(osThread))
{
__OSUnlockScheduler();
return;
}
__OSUnlockScheduler();
// handle command
switch (evt.GetId()) switch (evt.GetId())
{ {
case THREADLIST_MENU_BOOST_PRIO_5: case THREADLIST_MENU_BOOST_PRIO_5:
@ -325,6 +423,9 @@ void DebugPPCThreadsWindow::OnThreadListPopupClick(wxCommandEvent& evt)
case THREADLIST_MENU_DUMP_STACK_TRACE: case THREADLIST_MENU_DUMP_STACK_TRACE:
DumpStackTrace(osThread); DumpStackTrace(osThread);
break; break;
case THREADLIST_MENU_PROFILE_THREAD:
ProfileThread(osThread);
break;
} }
coreinit::__OSUpdateThreadEffectivePriority(osThread); coreinit::__OSUpdateThreadEffectivePriority(osThread);
// update thread list // update thread list
@ -347,20 +448,13 @@ void DebugPPCThreadsWindow::OnThreadListRightClick(wxMouseEvent& event)
m_thread_list->SetItemState(itemIndex, wxLIST_STATE_SELECTED, wxLIST_STATE_SELECTED); m_thread_list->SetItemState(itemIndex, wxLIST_STATE_SELECTED, wxLIST_STATE_SELECTED);
// check if thread is still on the list of active threads // check if thread is still on the list of active threads
MPTR threadMPTR = (MPTR)m_thread_list->GetItemData(itemIndex); MPTR threadMPTR = (MPTR)m_thread_list->GetItemData(itemIndex);
bool threadIsActive = false; __OSLockScheduler();
srwlock_activeThreadList.LockWrite(); if (!coreinit::__OSIsThreadActive(MEMPTR<OSThread_t>(threadMPTR)))
for (sint32 i = 0; i < activeThreadCount; i++)
{ {
MPTR threadItrMPTR = activeThread[i]; __OSUnlockScheduler();
if (threadItrMPTR == threadMPTR)
{
threadIsActive = true;
break;
}
}
srwlock_activeThreadList.UnlockWrite();
if (threadIsActive == false)
return; return;
}
__OSUnlockScheduler();
// create menu entry // create menu entry
wxMenu menu; wxMenu menu;
menu.SetClientData((void*)(size_t)threadMPTR); menu.SetClientData((void*)(size_t)threadMPTR);
@ -374,6 +468,7 @@ void DebugPPCThreadsWindow::OnThreadListRightClick(wxMouseEvent& event)
menu.Append(THREADLIST_MENU_SUSPEND, _("Suspend")); menu.Append(THREADLIST_MENU_SUSPEND, _("Suspend"));
menu.AppendSeparator(); menu.AppendSeparator();
menu.Append(THREADLIST_MENU_DUMP_STACK_TRACE, _("Write stack trace to log")); menu.Append(THREADLIST_MENU_DUMP_STACK_TRACE, _("Write stack trace to log"));
menu.Append(THREADLIST_MENU_PROFILE_THREAD, _("Profile thread"));
menu.Connect(wxEVT_COMMAND_MENU_SELECTED, wxCommandEventHandler(DebugPPCThreadsWindow::OnThreadListPopupClick), nullptr, this); menu.Connect(wxEVT_COMMAND_MENU_SELECTED, wxCommandEventHandler(DebugPPCThreadsWindow::OnThreadListPopupClick), nullptr, this);
PopupMenu(&menu); PopupMenu(&menu);
} }

View File

@ -15,11 +15,14 @@ public:
void OnThreadListPopupClick(wxCommandEvent &evt); void OnThreadListPopupClick(wxCommandEvent &evt);
void OnThreadListRightClick(wxMouseEvent& event); void OnThreadListRightClick(wxMouseEvent& event);
void DumpStackTrace(struct OSThread_t* thread);
void Close(); void Close();
private: private:
void ProfileThread(struct OSThread_t* thread);
void ProfileThreadWorker(OSThread_t* thread);
void PresentProfileResults(OSThread_t* thread, const std::unordered_map<VAddr, uint32>& samples);
void DumpStackTrace(struct OSThread_t* thread);
wxListCtrl* m_thread_list; wxListCtrl* m_thread_list;
wxCheckBox* m_auto_refresh; wxCheckBox* m_auto_refresh;
wxTimer* m_timer; wxTimer* m_timer;