forked from dolphin-emu/dolphin
This introduces speculative constants, allowing FIFO writes to be optimized in more places. It also clarifies the guarantees of the FIFO optimization, changing the location of some of the checks and potentially avoiding redundant checks.
295 lines
7.2 KiB
C++
295 lines
7.2 KiB
C++
// Copyright 2013 Dolphin Emulator Project
|
|
// Licensed under GPLv2+
|
|
// Refer to the license.txt file included.
|
|
|
|
#include <algorithm>
|
|
#include <cinttypes>
|
|
#include <string>
|
|
|
|
#ifdef _WIN32
|
|
#include <windows.h>
|
|
#else
|
|
#include "Common/PerformanceCounter.h"
|
|
#endif
|
|
|
|
#include "Core/ConfigManager.h"
|
|
#include "Core/Core.h"
|
|
#include "Core/PowerPC/CachedInterpreter.h"
|
|
#include "Core/PowerPC/JitCommon/JitBase.h"
|
|
#include "Core/PowerPC/JitInterface.h"
|
|
#include "Core/PowerPC/PPCSymbolDB.h"
|
|
#include "Core/PowerPC/PowerPC.h"
|
|
#include "Core/PowerPC/Profiler.h"
|
|
|
|
#if _M_X86
|
|
#include "Core/PowerPC/Jit64/Jit.h"
|
|
#include "Core/PowerPC/Jit64/Jit64_Tables.h"
|
|
#include "Core/PowerPC/Jit64IL/JitIL.h"
|
|
#include "Core/PowerPC/Jit64IL/JitIL_Tables.h"
|
|
#endif
|
|
|
|
#if _M_ARM_64
|
|
#include "Core/PowerPC/JitArm64/Jit.h"
|
|
#include "Core/PowerPC/JitArm64/JitArm64_Tables.h"
|
|
#endif
|
|
|
|
namespace JitInterface
|
|
{
|
|
void DoState(PointerWrap& p)
|
|
{
|
|
if (jit && p.GetMode() == PointerWrap::MODE_READ)
|
|
jit->ClearCache();
|
|
}
|
|
CPUCoreBase* InitJitCore(int core)
|
|
{
|
|
CPUCoreBase* ptr = nullptr;
|
|
switch (core)
|
|
{
|
|
#if _M_X86
|
|
case PowerPC::CORE_JIT64:
|
|
ptr = new Jit64();
|
|
break;
|
|
case PowerPC::CORE_JITIL64:
|
|
ptr = new JitIL();
|
|
break;
|
|
#endif
|
|
#if _M_ARM_64
|
|
case PowerPC::CORE_JITARM64:
|
|
ptr = new JitArm64();
|
|
break;
|
|
#endif
|
|
case PowerPC::CORE_CACHEDINTERPRETER:
|
|
ptr = new CachedInterpreter();
|
|
break;
|
|
|
|
default:
|
|
PanicAlert("Unrecognizable cpu_core: %d", core);
|
|
jit = nullptr;
|
|
return nullptr;
|
|
}
|
|
jit = static_cast<JitBase*>(ptr);
|
|
jit->Init();
|
|
return ptr;
|
|
}
|
|
void InitTables(int core)
|
|
{
|
|
switch (core)
|
|
{
|
|
#if _M_X86
|
|
case PowerPC::CORE_JIT64:
|
|
Jit64Tables::InitTables();
|
|
break;
|
|
case PowerPC::CORE_JITIL64:
|
|
JitILTables::InitTables();
|
|
break;
|
|
#endif
|
|
#if _M_ARM_64
|
|
case PowerPC::CORE_JITARM64:
|
|
JitArm64Tables::InitTables();
|
|
break;
|
|
#endif
|
|
case PowerPC::CORE_CACHEDINTERPRETER:
|
|
// has no tables
|
|
break;
|
|
default:
|
|
PanicAlert("Unrecognizable cpu_core: %d", core);
|
|
break;
|
|
}
|
|
}
|
|
CPUCoreBase* GetCore()
|
|
{
|
|
return jit;
|
|
}
|
|
|
|
void WriteProfileResults(const std::string& filename)
|
|
{
|
|
ProfileStats prof_stats;
|
|
GetProfileResults(&prof_stats);
|
|
|
|
File::IOFile f(filename, "w");
|
|
if (!f)
|
|
{
|
|
PanicAlert("Failed to open %s", filename.c_str());
|
|
return;
|
|
}
|
|
fprintf(f.GetHandle(), "origAddr\tblkName\trunCount\tcost\ttimeCost\tpercent\ttimePercent\tOvAlli"
|
|
"nBlkTime(ms)\tblkCodeSize\n");
|
|
for (auto& stat : prof_stats.block_stats)
|
|
{
|
|
std::string name = g_symbolDB.GetDescription(stat.addr);
|
|
double percent = 100.0 * (double)stat.cost / (double)prof_stats.cost_sum;
|
|
double timePercent = 100.0 * (double)stat.tick_counter / (double)prof_stats.timecost_sum;
|
|
fprintf(f.GetHandle(),
|
|
"%08x\t%s\t%" PRIu64 "\t%" PRIu64 "\t%" PRIu64 "\t%.2f\t%.2f\t%.2f\t%i\n", stat.addr,
|
|
name.c_str(), stat.run_count, stat.cost, stat.tick_counter, percent, timePercent,
|
|
(double)stat.tick_counter * 1000.0 / (double)prof_stats.countsPerSec, stat.block_size);
|
|
}
|
|
}
|
|
|
|
void GetProfileResults(ProfileStats* prof_stats)
|
|
{
|
|
// Can't really do this with no jit core available
|
|
if (!jit)
|
|
return;
|
|
|
|
prof_stats->cost_sum = 0;
|
|
prof_stats->timecost_sum = 0;
|
|
prof_stats->block_stats.clear();
|
|
prof_stats->block_stats.reserve(jit->GetBlockCache()->GetNumBlocks());
|
|
|
|
Core::EState old_state = Core::GetState();
|
|
if (old_state == Core::CORE_RUN)
|
|
Core::SetState(Core::CORE_PAUSE);
|
|
|
|
QueryPerformanceFrequency((LARGE_INTEGER*)&prof_stats->countsPerSec);
|
|
for (int i = 0; i < jit->GetBlockCache()->GetNumBlocks(); i++)
|
|
{
|
|
const JitBlock* block = jit->GetBlockCache()->GetBlock(i);
|
|
// Rough heuristic. Mem instructions should cost more.
|
|
u64 cost = block->originalSize * (block->runCount / 4);
|
|
u64 timecost = block->ticCounter;
|
|
// Todo: tweak.
|
|
if (block->runCount >= 1)
|
|
prof_stats->block_stats.emplace_back(i, block->effectiveAddress, cost, timecost,
|
|
block->runCount, block->codeSize);
|
|
prof_stats->cost_sum += cost;
|
|
prof_stats->timecost_sum += timecost;
|
|
}
|
|
|
|
sort(prof_stats->block_stats.begin(), prof_stats->block_stats.end());
|
|
if (old_state == Core::CORE_RUN)
|
|
Core::SetState(Core::CORE_RUN);
|
|
}
|
|
|
|
int GetHostCode(u32* address, const u8** code, u32* code_size)
|
|
{
|
|
if (!jit)
|
|
{
|
|
*code_size = 0;
|
|
return 1;
|
|
}
|
|
|
|
int block_num = jit->GetBlockCache()->GetBlockNumberFromStartAddress(*address, MSR);
|
|
if (block_num < 0)
|
|
{
|
|
for (int i = 0; i < 500; i++)
|
|
{
|
|
block_num = jit->GetBlockCache()->GetBlockNumberFromStartAddress(*address - 4 * i, MSR);
|
|
if (block_num >= 0)
|
|
break;
|
|
}
|
|
|
|
if (block_num >= 0)
|
|
{
|
|
JitBlock* block = jit->GetBlockCache()->GetBlock(block_num);
|
|
if (!(block->effectiveAddress <= *address &&
|
|
block->originalSize + block->effectiveAddress >= *address))
|
|
block_num = -1;
|
|
}
|
|
|
|
// Do not merge this "if" with the above - block_num changes inside it.
|
|
if (block_num < 0)
|
|
{
|
|
*code_size = 0;
|
|
return 2;
|
|
}
|
|
}
|
|
|
|
JitBlock* block = jit->GetBlockCache()->GetBlock(block_num);
|
|
|
|
*code = block->checkedEntry;
|
|
*code_size = block->codeSize;
|
|
*address = block->effectiveAddress;
|
|
return 0;
|
|
}
|
|
|
|
bool HandleFault(uintptr_t access_address, SContext* ctx)
|
|
{
|
|
// Prevent nullptr dereference on a crash with no JIT present
|
|
if (!jit)
|
|
{
|
|
return false;
|
|
}
|
|
|
|
return jit->HandleFault(access_address, ctx);
|
|
}
|
|
|
|
bool HandleStackFault()
|
|
{
|
|
if (!jit)
|
|
{
|
|
return false;
|
|
}
|
|
|
|
return jit->HandleStackFault();
|
|
}
|
|
|
|
void ClearCache()
|
|
{
|
|
if (jit)
|
|
jit->ClearCache();
|
|
}
|
|
void ClearSafe()
|
|
{
|
|
// This clear is "safe" in the sense that it's okay to run from
|
|
// inside a JIT'ed block: it clears the instruction cache, but not
|
|
// the JIT'ed code.
|
|
// TODO: There's probably a better way to handle this situation.
|
|
if (jit)
|
|
jit->GetBlockCache()->Clear();
|
|
}
|
|
|
|
void InvalidateICache(u32 address, u32 size, bool forced)
|
|
{
|
|
if (jit)
|
|
jit->GetBlockCache()->InvalidateICache(address, size, forced);
|
|
}
|
|
|
|
void CompileExceptionCheck(ExceptionType type)
|
|
{
|
|
if (!jit)
|
|
return;
|
|
|
|
std::unordered_set<u32>* exception_addresses = nullptr;
|
|
|
|
switch (type)
|
|
{
|
|
case ExceptionType::EXCEPTIONS_FIFO_WRITE:
|
|
exception_addresses = &jit->js.fifoWriteAddresses;
|
|
break;
|
|
case ExceptionType::EXCEPTIONS_PAIRED_QUANTIZE:
|
|
exception_addresses = &jit->js.pairedQuantizeAddresses;
|
|
break;
|
|
case ExceptionType::EXCEPTIONS_SPECULATIVE_CONSTANTS:
|
|
exception_addresses = &jit->js.noSpeculativeConstantsAddresses;
|
|
break;
|
|
}
|
|
|
|
if (PC != 0 && (exception_addresses->find(PC)) == (exception_addresses->end()))
|
|
{
|
|
if (type == ExceptionType::EXCEPTIONS_FIFO_WRITE)
|
|
{
|
|
// Check in case the code has been replaced since: do we need to do this?
|
|
int optype = GetOpInfo(PowerPC::HostRead_U32(PC))->type;
|
|
if (optype != OPTYPE_STORE && optype != OPTYPE_STOREFP && (optype != OPTYPE_STOREPS))
|
|
return;
|
|
}
|
|
exception_addresses->insert(PC);
|
|
|
|
// Invalidate the JIT block so that it gets recompiled with the external exception check
|
|
// included.
|
|
jit->GetBlockCache()->InvalidateICache(PC, 4, true);
|
|
}
|
|
}
|
|
|
|
void Shutdown()
|
|
{
|
|
if (jit)
|
|
{
|
|
jit->Shutdown();
|
|
delete jit;
|
|
jit = nullptr;
|
|
}
|
|
}
|
|
}
|