Merge pull request #8188 from merryhime/jit-race-page-table-changed

dynarmic: Fix race when switching page tables
This commit is contained in:
bunnei 2022-04-16 00:24:53 -07:00 committed by GitHub
commit a29a8c6f78
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
4 changed files with 84 additions and 57 deletions

View File

@ -88,7 +88,7 @@ public:
void CallSVC(u32 swi) override { void CallSVC(u32 swi) override {
parent.svc_swi = swi; parent.svc_swi = swi;
parent.jit->HaltExecution(svc_call); parent.jit.load()->HaltExecution(svc_call);
} }
void AddTicks(u64 ticks) override { void AddTicks(u64 ticks) override {
@ -151,6 +151,13 @@ std::shared_ptr<Dynarmic::A32::Jit> ARM_Dynarmic_32::MakeJit(Common::PageTable*
config.code_cache_size = 512_MiB; config.code_cache_size = 512_MiB;
config.far_code_offset = 400_MiB; config.far_code_offset = 400_MiB;
// null_jit
if (!page_table) {
// Don't waste too much memory on null_jit
config.code_cache_size = 8_MiB;
config.far_code_offset = 4_MiB;
}
// Safe optimizations // Safe optimizations
if (Settings::values.cpu_debug_mode) { if (Settings::values.cpu_debug_mode) {
if (!Settings::values.cpuopt_page_tables) { if (!Settings::values.cpuopt_page_tables) {
@ -228,7 +235,7 @@ std::shared_ptr<Dynarmic::A32::Jit> ARM_Dynarmic_32::MakeJit(Common::PageTable*
void ARM_Dynarmic_32::Run() { void ARM_Dynarmic_32::Run() {
while (true) { while (true) {
const auto hr = jit->Run(); const auto hr = jit.load()->Run();
if (Has(hr, svc_call)) { if (Has(hr, svc_call)) {
Kernel::Svc::Call(system, svc_swi); Kernel::Svc::Call(system, svc_swi);
} }
@ -239,7 +246,7 @@ void ARM_Dynarmic_32::Run() {
} }
void ARM_Dynarmic_32::Step() { void ARM_Dynarmic_32::Step() {
jit->Step(); jit.load()->Step();
} }
ARM_Dynarmic_32::ARM_Dynarmic_32(System& system_, CPUInterrupts& interrupt_handlers_, ARM_Dynarmic_32::ARM_Dynarmic_32(System& system_, CPUInterrupts& interrupt_handlers_,
@ -249,24 +256,24 @@ ARM_Dynarmic_32::ARM_Dynarmic_32(System& system_, CPUInterrupts& interrupt_handl
cb(std::make_unique<DynarmicCallbacks32>(*this)), cb(std::make_unique<DynarmicCallbacks32>(*this)),
cp15(std::make_shared<DynarmicCP15>(*this)), core_index{core_index_}, cp15(std::make_shared<DynarmicCP15>(*this)), core_index{core_index_},
exclusive_monitor{dynamic_cast<DynarmicExclusiveMonitor&>(exclusive_monitor_)}, exclusive_monitor{dynamic_cast<DynarmicExclusiveMonitor&>(exclusive_monitor_)},
jit(MakeJit(nullptr)) {} null_jit{MakeJit(nullptr)}, jit{null_jit.get()} {}
ARM_Dynarmic_32::~ARM_Dynarmic_32() = default; ARM_Dynarmic_32::~ARM_Dynarmic_32() = default;
void ARM_Dynarmic_32::SetPC(u64 pc) { void ARM_Dynarmic_32::SetPC(u64 pc) {
jit->Regs()[15] = static_cast<u32>(pc); jit.load()->Regs()[15] = static_cast<u32>(pc);
} }
u64 ARM_Dynarmic_32::GetPC() const { u64 ARM_Dynarmic_32::GetPC() const {
return jit->Regs()[15]; return jit.load()->Regs()[15];
} }
u64 ARM_Dynarmic_32::GetReg(int index) const { u64 ARM_Dynarmic_32::GetReg(int index) const {
return jit->Regs()[index]; return jit.load()->Regs()[index];
} }
void ARM_Dynarmic_32::SetReg(int index, u64 value) { void ARM_Dynarmic_32::SetReg(int index, u64 value) {
jit->Regs()[index] = static_cast<u32>(value); jit.load()->Regs()[index] = static_cast<u32>(value);
} }
u128 ARM_Dynarmic_32::GetVectorReg(int index) const { u128 ARM_Dynarmic_32::GetVectorReg(int index) const {
@ -276,11 +283,11 @@ u128 ARM_Dynarmic_32::GetVectorReg(int index) const {
void ARM_Dynarmic_32::SetVectorReg(int index, u128 value) {} void ARM_Dynarmic_32::SetVectorReg(int index, u128 value) {}
u32 ARM_Dynarmic_32::GetPSTATE() const { u32 ARM_Dynarmic_32::GetPSTATE() const {
return jit->Cpsr(); return jit.load()->Cpsr();
} }
void ARM_Dynarmic_32::SetPSTATE(u32 cpsr) { void ARM_Dynarmic_32::SetPSTATE(u32 cpsr) {
jit->SetCpsr(cpsr); jit.load()->SetCpsr(cpsr);
} }
u64 ARM_Dynarmic_32::GetTlsAddress() const { u64 ARM_Dynarmic_32::GetTlsAddress() const {
@ -301,7 +308,7 @@ void ARM_Dynarmic_32::SetTPIDR_EL0(u64 value) {
void ARM_Dynarmic_32::SaveContext(ThreadContext32& ctx) { void ARM_Dynarmic_32::SaveContext(ThreadContext32& ctx) {
Dynarmic::A32::Context context; Dynarmic::A32::Context context;
jit->SaveContext(context); jit.load()->SaveContext(context);
ctx.cpu_registers = context.Regs(); ctx.cpu_registers = context.Regs();
ctx.extension_registers = context.ExtRegs(); ctx.extension_registers = context.ExtRegs();
ctx.cpsr = context.Cpsr(); ctx.cpsr = context.Cpsr();
@ -314,27 +321,27 @@ void ARM_Dynarmic_32::LoadContext(const ThreadContext32& ctx) {
context.ExtRegs() = ctx.extension_registers; context.ExtRegs() = ctx.extension_registers;
context.SetCpsr(ctx.cpsr); context.SetCpsr(ctx.cpsr);
context.SetFpscr(ctx.fpscr); context.SetFpscr(ctx.fpscr);
jit->LoadContext(context); jit.load()->LoadContext(context);
} }
void ARM_Dynarmic_32::PrepareReschedule() { void ARM_Dynarmic_32::PrepareReschedule() {
jit->HaltExecution(break_loop); jit.load()->HaltExecution(break_loop);
} }
void ARM_Dynarmic_32::SignalInterrupt() { void ARM_Dynarmic_32::SignalInterrupt() {
jit->HaltExecution(break_loop); jit.load()->HaltExecution(break_loop);
} }
void ARM_Dynarmic_32::ClearInstructionCache() { void ARM_Dynarmic_32::ClearInstructionCache() {
jit->ClearCache(); jit.load()->ClearCache();
} }
void ARM_Dynarmic_32::InvalidateCacheRange(VAddr addr, std::size_t size) { void ARM_Dynarmic_32::InvalidateCacheRange(VAddr addr, std::size_t size) {
jit->InvalidateCacheRange(static_cast<u32>(addr), size); jit.load()->InvalidateCacheRange(static_cast<u32>(addr), size);
} }
void ARM_Dynarmic_32::ClearExclusiveState() { void ARM_Dynarmic_32::ClearExclusiveState() {
jit->ClearExclusiveState(); jit.load()->ClearExclusiveState();
} }
void ARM_Dynarmic_32::PageTableChanged(Common::PageTable& page_table, void ARM_Dynarmic_32::PageTableChanged(Common::PageTable& page_table,
@ -345,13 +352,14 @@ void ARM_Dynarmic_32::PageTableChanged(Common::PageTable& page_table,
auto key = std::make_pair(&page_table, new_address_space_size_in_bits); auto key = std::make_pair(&page_table, new_address_space_size_in_bits);
auto iter = jit_cache.find(key); auto iter = jit_cache.find(key);
if (iter != jit_cache.end()) { if (iter != jit_cache.end()) {
jit = iter->second; jit.store(iter->second.get());
LoadContext(ctx); LoadContext(ctx);
return; return;
} }
jit = MakeJit(&page_table); std::shared_ptr new_jit = MakeJit(&page_table);
jit.store(new_jit.get());
LoadContext(ctx); LoadContext(ctx);
jit_cache.emplace(key, jit); jit_cache.emplace(key, std::move(new_jit));
} }
} // namespace Core } // namespace Core

View File

@ -4,6 +4,7 @@
#pragma once #pragma once
#include <atomic>
#include <memory> #include <memory>
#include <unordered_map> #include <unordered_map>
@ -80,7 +81,11 @@ private:
std::shared_ptr<DynarmicCP15> cp15; std::shared_ptr<DynarmicCP15> cp15;
std::size_t core_index; std::size_t core_index;
DynarmicExclusiveMonitor& exclusive_monitor; DynarmicExclusiveMonitor& exclusive_monitor;
std::shared_ptr<Dynarmic::A32::Jit> jit;
std::shared_ptr<Dynarmic::A32::Jit> null_jit;
// A raw pointer here is fine; we never delete Jit instances.
std::atomic<Dynarmic::A32::Jit*> jit;
// SVC callback // SVC callback
u32 svc_swi{}; u32 svc_swi{};

View File

@ -109,7 +109,7 @@ public:
break; break;
} }
parent.jit->HaltExecution(Dynarmic::HaltReason::CacheInvalidation); parent.jit.load()->HaltExecution(Dynarmic::HaltReason::CacheInvalidation);
} }
void ExceptionRaised(u64 pc, Dynarmic::A64::Exception exception) override { void ExceptionRaised(u64 pc, Dynarmic::A64::Exception exception) override {
@ -130,7 +130,7 @@ public:
void CallSVC(u32 swi) override { void CallSVC(u32 swi) override {
parent.svc_swi = swi; parent.svc_swi = swi;
parent.jit->HaltExecution(svc_call); parent.jit.load()->HaltExecution(svc_call);
} }
void AddTicks(u64 ticks) override { void AddTicks(u64 ticks) override {
@ -212,6 +212,13 @@ std::shared_ptr<Dynarmic::A64::Jit> ARM_Dynarmic_64::MakeJit(Common::PageTable*
config.code_cache_size = 512_MiB; config.code_cache_size = 512_MiB;
config.far_code_offset = 400_MiB; config.far_code_offset = 400_MiB;
// null_jit
if (!page_table) {
// Don't waste too much memory on null_jit
config.code_cache_size = 8_MiB;
config.far_code_offset = 4_MiB;
}
// Safe optimizations // Safe optimizations
if (Settings::values.cpu_debug_mode) { if (Settings::values.cpu_debug_mode) {
if (!Settings::values.cpuopt_page_tables) { if (!Settings::values.cpuopt_page_tables) {
@ -289,7 +296,7 @@ std::shared_ptr<Dynarmic::A64::Jit> ARM_Dynarmic_64::MakeJit(Common::PageTable*
void ARM_Dynarmic_64::Run() { void ARM_Dynarmic_64::Run() {
while (true) { while (true) {
const auto hr = jit->Run(); const auto hr = jit.load()->Run();
if (Has(hr, svc_call)) { if (Has(hr, svc_call)) {
Kernel::Svc::Call(system, svc_swi); Kernel::Svc::Call(system, svc_swi);
} }
@ -300,7 +307,7 @@ void ARM_Dynarmic_64::Run() {
} }
void ARM_Dynarmic_64::Step() { void ARM_Dynarmic_64::Step() {
jit->Step(); jit.load()->Step();
} }
ARM_Dynarmic_64::ARM_Dynarmic_64(System& system_, CPUInterrupts& interrupt_handlers_, ARM_Dynarmic_64::ARM_Dynarmic_64(System& system_, CPUInterrupts& interrupt_handlers_,
@ -309,40 +316,40 @@ ARM_Dynarmic_64::ARM_Dynarmic_64(System& system_, CPUInterrupts& interrupt_handl
: ARM_Interface{system_, interrupt_handlers_, uses_wall_clock_}, : ARM_Interface{system_, interrupt_handlers_, uses_wall_clock_},
cb(std::make_unique<DynarmicCallbacks64>(*this)), core_index{core_index_}, cb(std::make_unique<DynarmicCallbacks64>(*this)), core_index{core_index_},
exclusive_monitor{dynamic_cast<DynarmicExclusiveMonitor&>(exclusive_monitor_)}, exclusive_monitor{dynamic_cast<DynarmicExclusiveMonitor&>(exclusive_monitor_)},
jit(MakeJit(nullptr, 48)) {} null_jit{MakeJit(nullptr, 48)}, jit{null_jit.get()} {}
ARM_Dynarmic_64::~ARM_Dynarmic_64() = default; ARM_Dynarmic_64::~ARM_Dynarmic_64() = default;
void ARM_Dynarmic_64::SetPC(u64 pc) { void ARM_Dynarmic_64::SetPC(u64 pc) {
jit->SetPC(pc); jit.load()->SetPC(pc);
} }
u64 ARM_Dynarmic_64::GetPC() const { u64 ARM_Dynarmic_64::GetPC() const {
return jit->GetPC(); return jit.load()->GetPC();
} }
u64 ARM_Dynarmic_64::GetReg(int index) const { u64 ARM_Dynarmic_64::GetReg(int index) const {
return jit->GetRegister(index); return jit.load()->GetRegister(index);
} }
void ARM_Dynarmic_64::SetReg(int index, u64 value) { void ARM_Dynarmic_64::SetReg(int index, u64 value) {
jit->SetRegister(index, value); jit.load()->SetRegister(index, value);
} }
u128 ARM_Dynarmic_64::GetVectorReg(int index) const { u128 ARM_Dynarmic_64::GetVectorReg(int index) const {
return jit->GetVector(index); return jit.load()->GetVector(index);
} }
void ARM_Dynarmic_64::SetVectorReg(int index, u128 value) { void ARM_Dynarmic_64::SetVectorReg(int index, u128 value) {
jit->SetVector(index, value); jit.load()->SetVector(index, value);
} }
u32 ARM_Dynarmic_64::GetPSTATE() const { u32 ARM_Dynarmic_64::GetPSTATE() const {
return jit->GetPstate(); return jit.load()->GetPstate();
} }
void ARM_Dynarmic_64::SetPSTATE(u32 pstate) { void ARM_Dynarmic_64::SetPSTATE(u32 pstate) {
jit->SetPstate(pstate); jit.load()->SetPstate(pstate);
} }
u64 ARM_Dynarmic_64::GetTlsAddress() const { u64 ARM_Dynarmic_64::GetTlsAddress() const {
@ -362,45 +369,47 @@ void ARM_Dynarmic_64::SetTPIDR_EL0(u64 value) {
} }
void ARM_Dynarmic_64::SaveContext(ThreadContext64& ctx) { void ARM_Dynarmic_64::SaveContext(ThreadContext64& ctx) {
ctx.cpu_registers = jit->GetRegisters(); Dynarmic::A64::Jit* j = jit.load();
ctx.sp = jit->GetSP(); ctx.cpu_registers = j->GetRegisters();
ctx.pc = jit->GetPC(); ctx.sp = j->GetSP();
ctx.pstate = jit->GetPstate(); ctx.pc = j->GetPC();
ctx.vector_registers = jit->GetVectors(); ctx.pstate = j->GetPstate();
ctx.fpcr = jit->GetFpcr(); ctx.vector_registers = j->GetVectors();
ctx.fpsr = jit->GetFpsr(); ctx.fpcr = j->GetFpcr();
ctx.fpsr = j->GetFpsr();
ctx.tpidr = cb->tpidr_el0; ctx.tpidr = cb->tpidr_el0;
} }
void ARM_Dynarmic_64::LoadContext(const ThreadContext64& ctx) { void ARM_Dynarmic_64::LoadContext(const ThreadContext64& ctx) {
jit->SetRegisters(ctx.cpu_registers); Dynarmic::A64::Jit* j = jit.load();
jit->SetSP(ctx.sp); j->SetRegisters(ctx.cpu_registers);
jit->SetPC(ctx.pc); j->SetSP(ctx.sp);
jit->SetPstate(ctx.pstate); j->SetPC(ctx.pc);
jit->SetVectors(ctx.vector_registers); j->SetPstate(ctx.pstate);
jit->SetFpcr(ctx.fpcr); j->SetVectors(ctx.vector_registers);
jit->SetFpsr(ctx.fpsr); j->SetFpcr(ctx.fpcr);
j->SetFpsr(ctx.fpsr);
SetTPIDR_EL0(ctx.tpidr); SetTPIDR_EL0(ctx.tpidr);
} }
void ARM_Dynarmic_64::PrepareReschedule() { void ARM_Dynarmic_64::PrepareReschedule() {
jit->HaltExecution(break_loop); jit.load()->HaltExecution(break_loop);
} }
void ARM_Dynarmic_64::SignalInterrupt() { void ARM_Dynarmic_64::SignalInterrupt() {
jit->HaltExecution(break_loop); jit.load()->HaltExecution(break_loop);
} }
void ARM_Dynarmic_64::ClearInstructionCache() { void ARM_Dynarmic_64::ClearInstructionCache() {
jit->ClearCache(); jit.load()->ClearCache();
} }
void ARM_Dynarmic_64::InvalidateCacheRange(VAddr addr, std::size_t size) { void ARM_Dynarmic_64::InvalidateCacheRange(VAddr addr, std::size_t size) {
jit->InvalidateCacheRange(addr, size); jit.load()->InvalidateCacheRange(addr, size);
} }
void ARM_Dynarmic_64::ClearExclusiveState() { void ARM_Dynarmic_64::ClearExclusiveState() {
jit->ClearExclusiveState(); jit.load()->ClearExclusiveState();
} }
void ARM_Dynarmic_64::PageTableChanged(Common::PageTable& page_table, void ARM_Dynarmic_64::PageTableChanged(Common::PageTable& page_table,
@ -411,13 +420,14 @@ void ARM_Dynarmic_64::PageTableChanged(Common::PageTable& page_table,
auto key = std::make_pair(&page_table, new_address_space_size_in_bits); auto key = std::make_pair(&page_table, new_address_space_size_in_bits);
auto iter = jit_cache.find(key); auto iter = jit_cache.find(key);
if (iter != jit_cache.end()) { if (iter != jit_cache.end()) {
jit = iter->second; jit.store(iter->second.get());
LoadContext(ctx); LoadContext(ctx);
return; return;
} }
jit = MakeJit(&page_table, new_address_space_size_in_bits); std::shared_ptr new_jit = MakeJit(&page_table, new_address_space_size_in_bits);
jit.store(new_jit.get());
LoadContext(ctx); LoadContext(ctx);
jit_cache.emplace(key, jit); jit_cache.emplace(key, std::move(new_jit));
} }
} // namespace Core } // namespace Core

View File

@ -4,6 +4,7 @@
#pragma once #pragma once
#include <atomic>
#include <memory> #include <memory>
#include <unordered_map> #include <unordered_map>
@ -74,7 +75,10 @@ private:
std::size_t core_index; std::size_t core_index;
DynarmicExclusiveMonitor& exclusive_monitor; DynarmicExclusiveMonitor& exclusive_monitor;
std::shared_ptr<Dynarmic::A64::Jit> jit; std::shared_ptr<Dynarmic::A64::Jit> null_jit;
// A raw pointer here is fine; we never delete Jit instances.
std::atomic<Dynarmic::A64::Jit*> jit;
// SVC callback // SVC callback
u32 svc_swi{}; u32 svc_swi{};