2018-01-13 13:22:39 -08:00
|
|
|
// Copyright 2018 yuzu emulator team
|
2016-09-01 20:07:14 -07:00
|
|
|
// Licensed under GPLv2 or any later version
|
|
|
|
// Refer to the license.txt file included.
|
|
|
|
|
2018-01-13 14:34:15 -08:00
|
|
|
#include <cinttypes>
|
2018-01-09 13:33:46 -08:00
|
|
|
#include <memory>
|
|
|
|
#include <dynarmic/A64/a64.h>
|
|
|
|
#include <dynarmic/A64/config.h>
|
2018-02-21 12:48:22 -08:00
|
|
|
#include "common/logging/log.h"
|
2018-09-04 02:02:59 -07:00
|
|
|
#include "common/microprofile.h"
|
2016-09-20 23:52:38 -07:00
|
|
|
#include "core/arm/dynarmic/arm_dynarmic.h"
|
2018-03-13 14:49:59 -07:00
|
|
|
#include "core/core.h"
|
2018-08-31 09:21:34 -07:00
|
|
|
#include "core/core_cpu.h"
|
2018-01-09 13:33:46 -08:00
|
|
|
#include "core/core_timing.h"
|
2019-02-15 09:15:28 -08:00
|
|
|
#include "core/core_timing_util.h"
|
2018-09-19 12:40:31 -07:00
|
|
|
#include "core/gdbstub/gdbstub.h"
|
2018-07-31 05:06:09 -07:00
|
|
|
#include "core/hle/kernel/process.h"
|
2018-01-09 13:33:46 -08:00
|
|
|
#include "core/hle/kernel/svc.h"
|
2018-09-20 16:28:48 -07:00
|
|
|
#include "core/hle/kernel/vm_manager.h"
|
2018-01-09 13:33:46 -08:00
|
|
|
#include "core/memory.h"
|
|
|
|
|
2018-08-24 18:43:32 -07:00
|
|
|
namespace Core {
|
|
|
|
|
2018-02-08 16:04:05 -08:00
|
|
|
using Vector = Dynarmic::A64::Vector;
|
|
|
|
|
2018-01-09 13:33:46 -08:00
|
|
|
class ARM_Dynarmic_Callbacks : public Dynarmic::A64::UserCallbacks {
|
|
|
|
public:
|
|
|
|
explicit ARM_Dynarmic_Callbacks(ARM_Dynarmic& parent) : parent(parent) {}
|
|
|
|
|
2018-01-13 14:34:15 -08:00
|
|
|
u8 MemoryRead8(u64 vaddr) override {
|
2018-01-09 13:33:46 -08:00
|
|
|
return Memory::Read8(vaddr);
|
|
|
|
}
|
2018-01-13 14:34:15 -08:00
|
|
|
u16 MemoryRead16(u64 vaddr) override {
|
2018-01-09 13:33:46 -08:00
|
|
|
return Memory::Read16(vaddr);
|
|
|
|
}
|
2018-01-13 14:34:15 -08:00
|
|
|
u32 MemoryRead32(u64 vaddr) override {
|
2018-01-09 13:33:46 -08:00
|
|
|
return Memory::Read32(vaddr);
|
|
|
|
}
|
2018-01-13 14:34:15 -08:00
|
|
|
u64 MemoryRead64(u64 vaddr) override {
|
2018-01-09 13:33:46 -08:00
|
|
|
return Memory::Read64(vaddr);
|
|
|
|
}
|
2018-02-08 16:04:05 -08:00
|
|
|
Vector MemoryRead128(u64 vaddr) override {
|
|
|
|
return {Memory::Read64(vaddr), Memory::Read64(vaddr + 8)};
|
|
|
|
}
|
2018-01-09 13:33:46 -08:00
|
|
|
|
2018-01-13 14:34:15 -08:00
|
|
|
void MemoryWrite8(u64 vaddr, u8 value) override {
|
2018-01-09 13:33:46 -08:00
|
|
|
Memory::Write8(vaddr, value);
|
|
|
|
}
|
2018-01-13 14:34:15 -08:00
|
|
|
void MemoryWrite16(u64 vaddr, u16 value) override {
|
2018-01-09 13:33:46 -08:00
|
|
|
Memory::Write16(vaddr, value);
|
|
|
|
}
|
2018-01-13 14:34:15 -08:00
|
|
|
void MemoryWrite32(u64 vaddr, u32 value) override {
|
2018-01-09 13:33:46 -08:00
|
|
|
Memory::Write32(vaddr, value);
|
|
|
|
}
|
2018-01-13 14:34:15 -08:00
|
|
|
void MemoryWrite64(u64 vaddr, u64 value) override {
|
2018-01-09 13:33:46 -08:00
|
|
|
Memory::Write64(vaddr, value);
|
|
|
|
}
|
2018-02-08 16:04:05 -08:00
|
|
|
void MemoryWrite128(u64 vaddr, Vector value) override {
|
|
|
|
Memory::Write64(vaddr, value[0]);
|
|
|
|
Memory::Write64(vaddr + 8, value[1]);
|
|
|
|
}
|
2018-01-09 13:33:46 -08:00
|
|
|
|
2018-09-15 06:21:06 -07:00
|
|
|
void InterpreterFallback(u64 pc, std::size_t num_instructions) override {
|
2018-07-02 09:13:26 -07:00
|
|
|
LOG_INFO(Core_ARM, "Unicorn fallback @ 0x{:X} for {} instructions (instr = {:08X})", pc,
|
2018-07-02 09:20:50 -07:00
|
|
|
num_instructions, MemoryReadCode(pc));
|
2018-02-21 12:48:22 -08:00
|
|
|
|
2018-01-09 13:33:46 -08:00
|
|
|
ARM_Interface::ThreadContext ctx;
|
|
|
|
parent.SaveContext(ctx);
|
|
|
|
parent.inner_unicorn.LoadContext(ctx);
|
2018-01-19 15:01:41 -08:00
|
|
|
parent.inner_unicorn.ExecuteInstructions(static_cast<int>(num_instructions));
|
2018-01-09 13:33:46 -08:00
|
|
|
parent.inner_unicorn.SaveContext(ctx);
|
|
|
|
parent.LoadContext(ctx);
|
|
|
|
num_interpreted_instructions += num_instructions;
|
|
|
|
}
|
|
|
|
|
2018-02-08 16:04:05 -08:00
|
|
|
void ExceptionRaised(u64 pc, Dynarmic::A64::Exception exception) override {
|
dynarmic: Update to 6b4c6b0
6b4c6b0 impl: Update PC when raising exception
7a1313a A64: Implement FDIV (vector)
b2d781d system: Raise exception for YIELD, WFE, WFI, SEV, SEVL
b277bf5 Correct FPSR and FPCR
7673933 A64: Implement USHL
8d0e558 A64: Implement UCVTF (vector, integer), scalar variant
da9a4f8 A64: Partially implement FCVTZU (scalar, fixed-point) and FCVTZS (scalar, fixed-point)
7479684 A64: Implement system register TPIDR_EL0
0fd75fd A64: Implement system registers FPCR and FPSR
31e370c A64: Implement system register CNTPCT_EL0
9a88fd3 A64: Implement system register CTR_EL0
1d16896 A64: Implement NEG (vector)
3184edf IR: Add IR instruction ZeroVector
31f8fbc emit_x64_floating_point: Add maybe_unused to preprocess parameter
567eb1a A64: Implement FMINNM (scalar)
c6d8fa1 A64: Implement FMAXNM (scalar)
616056d constant_pool: Add frame parameter
a3747cb A64: Implement ADDP (scalar)
5cd5d9f reg_alloc: Only exchange GPRs
dd0452a A64: Implement DUP (element), scalar variant
e5732ea emit_x64_floating_point: Correct FP{Max,Min}{32,64} implementations for -0/+0
40eb9c3 A64: Implement FMAX (scalar), FMIN (scalar)
7cef39b fuzz_with_unicorn: QEMU's implementation of FCVT is incorrect
826dce2 travis: Switch unicorn repository
9605f28 a64/config: Allow NaN emulation accuracy to be set
e9435bc a64_emit_x64: Add conf to A64EmitContext
30b596d fuzz_with_unicorn: Explicitly test floating point instructions
be292a8 A64: Implement FSQRT (scalar)
3c42d48 backend_x64: Accurately handle NaNs
4aefed0 fuzz_with_unicorn: Print AArch64 disassembly
2018-02-21 12:51:54 -08:00
|
|
|
switch (exception) {
|
|
|
|
case Dynarmic::A64::Exception::WaitForInterrupt:
|
|
|
|
case Dynarmic::A64::Exception::WaitForEvent:
|
|
|
|
case Dynarmic::A64::Exception::SendEvent:
|
|
|
|
case Dynarmic::A64::Exception::SendEventLocal:
|
|
|
|
case Dynarmic::A64::Exception::Yield:
|
|
|
|
return;
|
2018-09-19 12:40:31 -07:00
|
|
|
case Dynarmic::A64::Exception::Breakpoint:
|
|
|
|
if (GDBStub::IsServerEnabled()) {
|
2018-09-20 11:12:42 -07:00
|
|
|
parent.jit->HaltExecution();
|
2018-09-19 12:40:31 -07:00
|
|
|
parent.SetPC(pc);
|
|
|
|
Kernel::Thread* thread = Kernel::GetCurrentThread();
|
2018-10-03 15:47:57 -07:00
|
|
|
parent.SaveContext(thread->GetContext());
|
2018-09-19 12:40:31 -07:00
|
|
|
GDBStub::Break();
|
|
|
|
GDBStub::SendTrap(thread, 5);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
[[fallthrough]];
|
dynarmic: Update to 6b4c6b0
6b4c6b0 impl: Update PC when raising exception
7a1313a A64: Implement FDIV (vector)
b2d781d system: Raise exception for YIELD, WFE, WFI, SEV, SEVL
b277bf5 Correct FPSR and FPCR
7673933 A64: Implement USHL
8d0e558 A64: Implement UCVTF (vector, integer), scalar variant
da9a4f8 A64: Partially implement FCVTZU (scalar, fixed-point) and FCVTZS (scalar, fixed-point)
7479684 A64: Implement system register TPIDR_EL0
0fd75fd A64: Implement system registers FPCR and FPSR
31e370c A64: Implement system register CNTPCT_EL0
9a88fd3 A64: Implement system register CTR_EL0
1d16896 A64: Implement NEG (vector)
3184edf IR: Add IR instruction ZeroVector
31f8fbc emit_x64_floating_point: Add maybe_unused to preprocess parameter
567eb1a A64: Implement FMINNM (scalar)
c6d8fa1 A64: Implement FMAXNM (scalar)
616056d constant_pool: Add frame parameter
a3747cb A64: Implement ADDP (scalar)
5cd5d9f reg_alloc: Only exchange GPRs
dd0452a A64: Implement DUP (element), scalar variant
e5732ea emit_x64_floating_point: Correct FP{Max,Min}{32,64} implementations for -0/+0
40eb9c3 A64: Implement FMAX (scalar), FMIN (scalar)
7cef39b fuzz_with_unicorn: QEMU's implementation of FCVT is incorrect
826dce2 travis: Switch unicorn repository
9605f28 a64/config: Allow NaN emulation accuracy to be set
e9435bc a64_emit_x64: Add conf to A64EmitContext
30b596d fuzz_with_unicorn: Explicitly test floating point instructions
be292a8 A64: Implement FSQRT (scalar)
3c42d48 backend_x64: Accurately handle NaNs
4aefed0 fuzz_with_unicorn: Print AArch64 disassembly
2018-02-21 12:51:54 -08:00
|
|
|
default:
|
2018-04-27 04:54:05 -07:00
|
|
|
ASSERT_MSG(false, "ExceptionRaised(exception = {}, pc = {:X})",
|
2018-09-15 06:21:06 -07:00
|
|
|
static_cast<std::size_t>(exception), pc);
|
dynarmic: Update to 6b4c6b0
6b4c6b0 impl: Update PC when raising exception
7a1313a A64: Implement FDIV (vector)
b2d781d system: Raise exception for YIELD, WFE, WFI, SEV, SEVL
b277bf5 Correct FPSR and FPCR
7673933 A64: Implement USHL
8d0e558 A64: Implement UCVTF (vector, integer), scalar variant
da9a4f8 A64: Partially implement FCVTZU (scalar, fixed-point) and FCVTZS (scalar, fixed-point)
7479684 A64: Implement system register TPIDR_EL0
0fd75fd A64: Implement system registers FPCR and FPSR
31e370c A64: Implement system register CNTPCT_EL0
9a88fd3 A64: Implement system register CTR_EL0
1d16896 A64: Implement NEG (vector)
3184edf IR: Add IR instruction ZeroVector
31f8fbc emit_x64_floating_point: Add maybe_unused to preprocess parameter
567eb1a A64: Implement FMINNM (scalar)
c6d8fa1 A64: Implement FMAXNM (scalar)
616056d constant_pool: Add frame parameter
a3747cb A64: Implement ADDP (scalar)
5cd5d9f reg_alloc: Only exchange GPRs
dd0452a A64: Implement DUP (element), scalar variant
e5732ea emit_x64_floating_point: Correct FP{Max,Min}{32,64} implementations for -0/+0
40eb9c3 A64: Implement FMAX (scalar), FMIN (scalar)
7cef39b fuzz_with_unicorn: QEMU's implementation of FCVT is incorrect
826dce2 travis: Switch unicorn repository
9605f28 a64/config: Allow NaN emulation accuracy to be set
e9435bc a64_emit_x64: Add conf to A64EmitContext
30b596d fuzz_with_unicorn: Explicitly test floating point instructions
be292a8 A64: Implement FSQRT (scalar)
3c42d48 backend_x64: Accurately handle NaNs
4aefed0 fuzz_with_unicorn: Print AArch64 disassembly
2018-02-21 12:51:54 -08:00
|
|
|
}
|
2018-01-13 14:34:15 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
void CallSVC(u32 swi) override {
|
2019-04-06 15:46:18 -07:00
|
|
|
Kernel::CallSVC(parent.system, swi);
|
2018-01-09 13:33:46 -08:00
|
|
|
}
|
|
|
|
|
2018-01-13 14:34:15 -08:00
|
|
|
void AddTicks(u64 ticks) override {
|
2018-08-12 18:41:28 -07:00
|
|
|
// Divide the number of ticks by the amount of CPU cores. TODO(Subv): This yields only a
|
|
|
|
// rough approximation of the amount of executed ticks in the system, it may be thrown off
|
|
|
|
// if not all cores are doing a similar amount of work. Instead of doing this, we should
|
|
|
|
// device a way so that timing is consistent across all cores without increasing the ticks 4
|
|
|
|
// times.
|
|
|
|
u64 amortized_ticks = (ticks - num_interpreted_instructions) / Core::NUM_CPU_CORES;
|
|
|
|
// Always execute at least one tick.
|
|
|
|
amortized_ticks = std::max<u64>(amortized_ticks, 1);
|
|
|
|
|
2019-04-06 15:46:18 -07:00
|
|
|
parent.system.CoreTiming().AddTicks(amortized_ticks);
|
2018-03-24 02:02:19 -07:00
|
|
|
num_interpreted_instructions = 0;
|
2018-01-09 13:33:46 -08:00
|
|
|
}
|
2018-01-13 14:34:15 -08:00
|
|
|
u64 GetTicksRemaining() override {
|
2019-04-06 15:46:18 -07:00
|
|
|
return std::max(parent.system.CoreTiming().GetDowncount(), 0);
|
2018-01-09 13:33:46 -08:00
|
|
|
}
|
dynarmic: Update to 6b4c6b0
6b4c6b0 impl: Update PC when raising exception
7a1313a A64: Implement FDIV (vector)
b2d781d system: Raise exception for YIELD, WFE, WFI, SEV, SEVL
b277bf5 Correct FPSR and FPCR
7673933 A64: Implement USHL
8d0e558 A64: Implement UCVTF (vector, integer), scalar variant
da9a4f8 A64: Partially implement FCVTZU (scalar, fixed-point) and FCVTZS (scalar, fixed-point)
7479684 A64: Implement system register TPIDR_EL0
0fd75fd A64: Implement system registers FPCR and FPSR
31e370c A64: Implement system register CNTPCT_EL0
9a88fd3 A64: Implement system register CTR_EL0
1d16896 A64: Implement NEG (vector)
3184edf IR: Add IR instruction ZeroVector
31f8fbc emit_x64_floating_point: Add maybe_unused to preprocess parameter
567eb1a A64: Implement FMINNM (scalar)
c6d8fa1 A64: Implement FMAXNM (scalar)
616056d constant_pool: Add frame parameter
a3747cb A64: Implement ADDP (scalar)
5cd5d9f reg_alloc: Only exchange GPRs
dd0452a A64: Implement DUP (element), scalar variant
e5732ea emit_x64_floating_point: Correct FP{Max,Min}{32,64} implementations for -0/+0
40eb9c3 A64: Implement FMAX (scalar), FMIN (scalar)
7cef39b fuzz_with_unicorn: QEMU's implementation of FCVT is incorrect
826dce2 travis: Switch unicorn repository
9605f28 a64/config: Allow NaN emulation accuracy to be set
e9435bc a64_emit_x64: Add conf to A64EmitContext
30b596d fuzz_with_unicorn: Explicitly test floating point instructions
be292a8 A64: Implement FSQRT (scalar)
3c42d48 backend_x64: Accurately handle NaNs
4aefed0 fuzz_with_unicorn: Print AArch64 disassembly
2018-02-21 12:51:54 -08:00
|
|
|
u64 GetCNTPCT() override {
|
2019-04-06 15:46:18 -07:00
|
|
|
return Timing::CpuCyclesToClockCycles(parent.system.CoreTiming().GetTicks());
|
dynarmic: Update to 6b4c6b0
6b4c6b0 impl: Update PC when raising exception
7a1313a A64: Implement FDIV (vector)
b2d781d system: Raise exception for YIELD, WFE, WFI, SEV, SEVL
b277bf5 Correct FPSR and FPCR
7673933 A64: Implement USHL
8d0e558 A64: Implement UCVTF (vector, integer), scalar variant
da9a4f8 A64: Partially implement FCVTZU (scalar, fixed-point) and FCVTZS (scalar, fixed-point)
7479684 A64: Implement system register TPIDR_EL0
0fd75fd A64: Implement system registers FPCR and FPSR
31e370c A64: Implement system register CNTPCT_EL0
9a88fd3 A64: Implement system register CTR_EL0
1d16896 A64: Implement NEG (vector)
3184edf IR: Add IR instruction ZeroVector
31f8fbc emit_x64_floating_point: Add maybe_unused to preprocess parameter
567eb1a A64: Implement FMINNM (scalar)
c6d8fa1 A64: Implement FMAXNM (scalar)
616056d constant_pool: Add frame parameter
a3747cb A64: Implement ADDP (scalar)
5cd5d9f reg_alloc: Only exchange GPRs
dd0452a A64: Implement DUP (element), scalar variant
e5732ea emit_x64_floating_point: Correct FP{Max,Min}{32,64} implementations for -0/+0
40eb9c3 A64: Implement FMAX (scalar), FMIN (scalar)
7cef39b fuzz_with_unicorn: QEMU's implementation of FCVT is incorrect
826dce2 travis: Switch unicorn repository
9605f28 a64/config: Allow NaN emulation accuracy to be set
e9435bc a64_emit_x64: Add conf to A64EmitContext
30b596d fuzz_with_unicorn: Explicitly test floating point instructions
be292a8 A64: Implement FSQRT (scalar)
3c42d48 backend_x64: Accurately handle NaNs
4aefed0 fuzz_with_unicorn: Print AArch64 disassembly
2018-02-21 12:51:54 -08:00
|
|
|
}
|
2018-01-09 13:33:46 -08:00
|
|
|
|
|
|
|
ARM_Dynarmic& parent;
|
2018-09-15 06:21:06 -07:00
|
|
|
std::size_t num_interpreted_instructions = 0;
|
2018-02-12 13:53:32 -08:00
|
|
|
u64 tpidrro_el0 = 0;
|
dynarmic: Update to 6b4c6b0
6b4c6b0 impl: Update PC when raising exception
7a1313a A64: Implement FDIV (vector)
b2d781d system: Raise exception for YIELD, WFE, WFI, SEV, SEVL
b277bf5 Correct FPSR and FPCR
7673933 A64: Implement USHL
8d0e558 A64: Implement UCVTF (vector, integer), scalar variant
da9a4f8 A64: Partially implement FCVTZU (scalar, fixed-point) and FCVTZS (scalar, fixed-point)
7479684 A64: Implement system register TPIDR_EL0
0fd75fd A64: Implement system registers FPCR and FPSR
31e370c A64: Implement system register CNTPCT_EL0
9a88fd3 A64: Implement system register CTR_EL0
1d16896 A64: Implement NEG (vector)
3184edf IR: Add IR instruction ZeroVector
31f8fbc emit_x64_floating_point: Add maybe_unused to preprocess parameter
567eb1a A64: Implement FMINNM (scalar)
c6d8fa1 A64: Implement FMAXNM (scalar)
616056d constant_pool: Add frame parameter
a3747cb A64: Implement ADDP (scalar)
5cd5d9f reg_alloc: Only exchange GPRs
dd0452a A64: Implement DUP (element), scalar variant
e5732ea emit_x64_floating_point: Correct FP{Max,Min}{32,64} implementations for -0/+0
40eb9c3 A64: Implement FMAX (scalar), FMIN (scalar)
7cef39b fuzz_with_unicorn: QEMU's implementation of FCVT is incorrect
826dce2 travis: Switch unicorn repository
9605f28 a64/config: Allow NaN emulation accuracy to be set
e9435bc a64_emit_x64: Add conf to A64EmitContext
30b596d fuzz_with_unicorn: Explicitly test floating point instructions
be292a8 A64: Implement FSQRT (scalar)
3c42d48 backend_x64: Accurately handle NaNs
4aefed0 fuzz_with_unicorn: Print AArch64 disassembly
2018-02-21 12:51:54 -08:00
|
|
|
u64 tpidr_el0 = 0;
|
2018-01-09 13:33:46 -08:00
|
|
|
};
|
|
|
|
|
core/cpu_core_manager: Create threads separately from initialization.
Our initialization process is a little wonky than one would expect when
it comes to code flow. We initialize the CPU last, as opposed to
hardware, where the CPU obviously needs to be first, otherwise nothing
else would work, and we have code that adds checks to get around this.
For example, in the page table setting code, we check to see if the
system is turned on before we even notify the CPU instances of a page
table switch. This results in dead code (at the moment), because the
only time a page table switch will occur is when the system is *not*
running, preventing the emulated CPU instances from being notified of a
page table switch in a convenient manner (technically the code path
could be taken, but we don't emulate the process creation svc handlers
yet).
This moves the threads creation into its own member function of the core
manager and restores a little order (and predictability) to our
initialization process.
Previously, in the multi-threaded cases, we'd kick off several threads
before even the main kernel process was created and ready to execute (gross!).
Now the initialization process is like so:
Initialization:
1. Timers
2. CPU
3. Kernel
4. Filesystem stuff (kind of gross, but can be amended trivially)
5. Applet stuff (ditto in terms of being kind of gross)
6. Main process (will be moved into the loading step in a following
change)
7. Telemetry (this should be initialized last in the future).
8. Services (4 and 5 should ideally be alongside this).
9. GDB (gross. Uses namespace scope state. Needs to be refactored into a
class or booted altogether).
10. Renderer
11. GPU (will also have its threads created in a separate step in a
following change).
Which... isn't *ideal* per-se, however getting rid of the wonky
intertwining of CPU state initialization out of this mix gets rid of
most of the footguns when it comes to our initialization process.
2019-04-09 10:25:54 -07:00
|
|
|
std::unique_ptr<Dynarmic::A64::Jit> ARM_Dynarmic::MakeJit(Common::PageTable& page_table,
|
|
|
|
std::size_t address_space_bits) const {
|
2018-02-12 13:53:32 -08:00
|
|
|
Dynarmic::A64::UserConfig config;
|
2018-07-03 06:28:46 -07:00
|
|
|
|
|
|
|
// Callbacks
|
2018-02-12 13:53:32 -08:00
|
|
|
config.callbacks = cb.get();
|
2018-07-03 06:28:46 -07:00
|
|
|
|
|
|
|
// Memory
|
core/cpu_core_manager: Create threads separately from initialization.
Our initialization process is a little wonky than one would expect when
it comes to code flow. We initialize the CPU last, as opposed to
hardware, where the CPU obviously needs to be first, otherwise nothing
else would work, and we have code that adds checks to get around this.
For example, in the page table setting code, we check to see if the
system is turned on before we even notify the CPU instances of a page
table switch. This results in dead code (at the moment), because the
only time a page table switch will occur is when the system is *not*
running, preventing the emulated CPU instances from being notified of a
page table switch in a convenient manner (technically the code path
could be taken, but we don't emulate the process creation svc handlers
yet).
This moves the threads creation into its own member function of the core
manager and restores a little order (and predictability) to our
initialization process.
Previously, in the multi-threaded cases, we'd kick off several threads
before even the main kernel process was created and ready to execute (gross!).
Now the initialization process is like so:
Initialization:
1. Timers
2. CPU
3. Kernel
4. Filesystem stuff (kind of gross, but can be amended trivially)
5. Applet stuff (ditto in terms of being kind of gross)
6. Main process (will be moved into the loading step in a following
change)
7. Telemetry (this should be initialized last in the future).
8. Services (4 and 5 should ideally be alongside this).
9. GDB (gross. Uses namespace scope state. Needs to be refactored into a
class or booted altogether).
10. Renderer
11. GPU (will also have its threads created in a separate step in a
following change).
Which... isn't *ideal* per-se, however getting rid of the wonky
intertwining of CPU state initialization out of this mix gets rid of
most of the footguns when it comes to our initialization process.
2019-04-09 10:25:54 -07:00
|
|
|
config.page_table = reinterpret_cast<void**>(page_table.pointers.data());
|
|
|
|
config.page_table_address_space_bits = address_space_bits;
|
2018-07-03 06:28:46 -07:00
|
|
|
config.silently_mirror_page_table = false;
|
|
|
|
|
|
|
|
// Multi-process state
|
|
|
|
config.processor_id = core_index;
|
2018-10-15 05:53:01 -07:00
|
|
|
config.global_monitor = &exclusive_monitor.monitor;
|
2018-07-03 06:28:46 -07:00
|
|
|
|
|
|
|
// System registers
|
2018-02-12 13:53:32 -08:00
|
|
|
config.tpidrro_el0 = &cb->tpidrro_el0;
|
dynarmic: Update to 6b4c6b0
6b4c6b0 impl: Update PC when raising exception
7a1313a A64: Implement FDIV (vector)
b2d781d system: Raise exception for YIELD, WFE, WFI, SEV, SEVL
b277bf5 Correct FPSR and FPCR
7673933 A64: Implement USHL
8d0e558 A64: Implement UCVTF (vector, integer), scalar variant
da9a4f8 A64: Partially implement FCVTZU (scalar, fixed-point) and FCVTZS (scalar, fixed-point)
7479684 A64: Implement system register TPIDR_EL0
0fd75fd A64: Implement system registers FPCR and FPSR
31e370c A64: Implement system register CNTPCT_EL0
9a88fd3 A64: Implement system register CTR_EL0
1d16896 A64: Implement NEG (vector)
3184edf IR: Add IR instruction ZeroVector
31f8fbc emit_x64_floating_point: Add maybe_unused to preprocess parameter
567eb1a A64: Implement FMINNM (scalar)
c6d8fa1 A64: Implement FMAXNM (scalar)
616056d constant_pool: Add frame parameter
a3747cb A64: Implement ADDP (scalar)
5cd5d9f reg_alloc: Only exchange GPRs
dd0452a A64: Implement DUP (element), scalar variant
e5732ea emit_x64_floating_point: Correct FP{Max,Min}{32,64} implementations for -0/+0
40eb9c3 A64: Implement FMAX (scalar), FMIN (scalar)
7cef39b fuzz_with_unicorn: QEMU's implementation of FCVT is incorrect
826dce2 travis: Switch unicorn repository
9605f28 a64/config: Allow NaN emulation accuracy to be set
e9435bc a64_emit_x64: Add conf to A64EmitContext
30b596d fuzz_with_unicorn: Explicitly test floating point instructions
be292a8 A64: Implement FSQRT (scalar)
3c42d48 backend_x64: Accurately handle NaNs
4aefed0 fuzz_with_unicorn: Print AArch64 disassembly
2018-02-21 12:51:54 -08:00
|
|
|
config.tpidr_el0 = &cb->tpidr_el0;
|
2018-02-12 13:53:32 -08:00
|
|
|
config.dczid_el0 = 4;
|
dynarmic: Update to 6b4c6b0
6b4c6b0 impl: Update PC when raising exception
7a1313a A64: Implement FDIV (vector)
b2d781d system: Raise exception for YIELD, WFE, WFI, SEV, SEVL
b277bf5 Correct FPSR and FPCR
7673933 A64: Implement USHL
8d0e558 A64: Implement UCVTF (vector, integer), scalar variant
da9a4f8 A64: Partially implement FCVTZU (scalar, fixed-point) and FCVTZS (scalar, fixed-point)
7479684 A64: Implement system register TPIDR_EL0
0fd75fd A64: Implement system registers FPCR and FPSR
31e370c A64: Implement system register CNTPCT_EL0
9a88fd3 A64: Implement system register CTR_EL0
1d16896 A64: Implement NEG (vector)
3184edf IR: Add IR instruction ZeroVector
31f8fbc emit_x64_floating_point: Add maybe_unused to preprocess parameter
567eb1a A64: Implement FMINNM (scalar)
c6d8fa1 A64: Implement FMAXNM (scalar)
616056d constant_pool: Add frame parameter
a3747cb A64: Implement ADDP (scalar)
5cd5d9f reg_alloc: Only exchange GPRs
dd0452a A64: Implement DUP (element), scalar variant
e5732ea emit_x64_floating_point: Correct FP{Max,Min}{32,64} implementations for -0/+0
40eb9c3 A64: Implement FMAX (scalar), FMIN (scalar)
7cef39b fuzz_with_unicorn: QEMU's implementation of FCVT is incorrect
826dce2 travis: Switch unicorn repository
9605f28 a64/config: Allow NaN emulation accuracy to be set
e9435bc a64_emit_x64: Add conf to A64EmitContext
30b596d fuzz_with_unicorn: Explicitly test floating point instructions
be292a8 A64: Implement FSQRT (scalar)
3c42d48 backend_x64: Accurately handle NaNs
4aefed0 fuzz_with_unicorn: Print AArch64 disassembly
2018-02-21 12:51:54 -08:00
|
|
|
config.ctr_el0 = 0x8444c004;
|
2019-02-16 12:52:24 -08:00
|
|
|
config.cntfrq_el0 = Timing::CNTFREQ;
|
dynarmic: Update to 6b4c6b0
6b4c6b0 impl: Update PC when raising exception
7a1313a A64: Implement FDIV (vector)
b2d781d system: Raise exception for YIELD, WFE, WFI, SEV, SEVL
b277bf5 Correct FPSR and FPCR
7673933 A64: Implement USHL
8d0e558 A64: Implement UCVTF (vector, integer), scalar variant
da9a4f8 A64: Partially implement FCVTZU (scalar, fixed-point) and FCVTZS (scalar, fixed-point)
7479684 A64: Implement system register TPIDR_EL0
0fd75fd A64: Implement system registers FPCR and FPSR
31e370c A64: Implement system register CNTPCT_EL0
9a88fd3 A64: Implement system register CTR_EL0
1d16896 A64: Implement NEG (vector)
3184edf IR: Add IR instruction ZeroVector
31f8fbc emit_x64_floating_point: Add maybe_unused to preprocess parameter
567eb1a A64: Implement FMINNM (scalar)
c6d8fa1 A64: Implement FMAXNM (scalar)
616056d constant_pool: Add frame parameter
a3747cb A64: Implement ADDP (scalar)
5cd5d9f reg_alloc: Only exchange GPRs
dd0452a A64: Implement DUP (element), scalar variant
e5732ea emit_x64_floating_point: Correct FP{Max,Min}{32,64} implementations for -0/+0
40eb9c3 A64: Implement FMAX (scalar), FMIN (scalar)
7cef39b fuzz_with_unicorn: QEMU's implementation of FCVT is incorrect
826dce2 travis: Switch unicorn repository
9605f28 a64/config: Allow NaN emulation accuracy to be set
e9435bc a64_emit_x64: Add conf to A64EmitContext
30b596d fuzz_with_unicorn: Explicitly test floating point instructions
be292a8 A64: Implement FSQRT (scalar)
3c42d48 backend_x64: Accurately handle NaNs
4aefed0 fuzz_with_unicorn: Print AArch64 disassembly
2018-02-21 12:51:54 -08:00
|
|
|
|
2018-08-16 02:12:20 -07:00
|
|
|
// Unpredictable instructions
|
|
|
|
config.define_unpredictable_behaviour = true;
|
|
|
|
|
2018-02-08 16:04:05 -08:00
|
|
|
return std::make_unique<Dynarmic::A64::Jit>(config);
|
|
|
|
}
|
|
|
|
|
2018-09-04 02:02:59 -07:00
|
|
|
MICROPROFILE_DEFINE(ARM_Jit_Dynarmic, "ARM JIT", "Dynarmic", MP_RGB(255, 64, 64));
|
|
|
|
|
2018-02-14 09:47:48 -08:00
|
|
|
void ARM_Dynarmic::Run() {
|
2018-09-04 02:02:59 -07:00
|
|
|
MICROPROFILE_SCOPE(ARM_Jit_Dynarmic);
|
2018-02-14 09:47:48 -08:00
|
|
|
|
|
|
|
jit->Run();
|
|
|
|
}
|
|
|
|
|
|
|
|
void ARM_Dynarmic::Step() {
|
|
|
|
cb->InterpreterFallback(jit->GetPC(), 1);
|
|
|
|
}
|
|
|
|
|
2019-04-06 15:46:18 -07:00
|
|
|
ARM_Dynarmic::ARM_Dynarmic(System& system, ExclusiveMonitor& exclusive_monitor,
|
2019-02-14 09:42:58 -08:00
|
|
|
std::size_t core_index)
|
2019-04-06 15:46:18 -07:00
|
|
|
: cb(std::make_unique<ARM_Dynarmic_Callbacks>(*this)), inner_unicorn{system},
|
|
|
|
core_index{core_index}, system{system},
|
core/cpu_core_manager: Create threads separately from initialization.
Our initialization process is a little wonky than one would expect when
it comes to code flow. We initialize the CPU last, as opposed to
hardware, where the CPU obviously needs to be first, otherwise nothing
else would work, and we have code that adds checks to get around this.
For example, in the page table setting code, we check to see if the
system is turned on before we even notify the CPU instances of a page
table switch. This results in dead code (at the moment), because the
only time a page table switch will occur is when the system is *not*
running, preventing the emulated CPU instances from being notified of a
page table switch in a convenient manner (technically the code path
could be taken, but we don't emulate the process creation svc handlers
yet).
This moves the threads creation into its own member function of the core
manager and restores a little order (and predictability) to our
initialization process.
Previously, in the multi-threaded cases, we'd kick off several threads
before even the main kernel process was created and ready to execute (gross!).
Now the initialization process is like so:
Initialization:
1. Timers
2. CPU
3. Kernel
4. Filesystem stuff (kind of gross, but can be amended trivially)
5. Applet stuff (ditto in terms of being kind of gross)
6. Main process (will be moved into the loading step in a following
change)
7. Telemetry (this should be initialized last in the future).
8. Services (4 and 5 should ideally be alongside this).
9. GDB (gross. Uses namespace scope state. Needs to be refactored into a
class or booted altogether).
10. Renderer
11. GPU (will also have its threads created in a separate step in a
following change).
Which... isn't *ideal* per-se, however getting rid of the wonky
intertwining of CPU state initialization out of this mix gets rid of
most of the footguns when it comes to our initialization process.
2019-04-09 10:25:54 -07:00
|
|
|
exclusive_monitor{dynamic_cast<DynarmicExclusiveMonitor&>(exclusive_monitor)} {}
|
2018-01-09 13:33:46 -08:00
|
|
|
|
|
|
|
ARM_Dynarmic::~ARM_Dynarmic() = default;
|
|
|
|
|
|
|
|
void ARM_Dynarmic::SetPC(u64 pc) {
|
2018-02-08 16:04:05 -08:00
|
|
|
jit->SetPC(pc);
|
2016-09-01 20:07:14 -07:00
|
|
|
}
|
|
|
|
|
2017-08-28 18:09:42 -07:00
|
|
|
u64 ARM_Dynarmic::GetPC() const {
|
2018-02-08 16:04:05 -08:00
|
|
|
return jit->GetPC();
|
2016-09-01 20:07:14 -07:00
|
|
|
}
|
|
|
|
|
2018-01-09 13:33:46 -08:00
|
|
|
u64 ARM_Dynarmic::GetReg(int index) const {
|
2018-02-08 16:04:05 -08:00
|
|
|
return jit->GetRegister(index);
|
2016-09-01 20:07:14 -07:00
|
|
|
}
|
|
|
|
|
2018-01-09 13:33:46 -08:00
|
|
|
void ARM_Dynarmic::SetReg(int index, u64 value) {
|
2018-02-08 16:04:05 -08:00
|
|
|
jit->SetRegister(index, value);
|
2016-09-01 20:07:14 -07:00
|
|
|
}
|
|
|
|
|
2018-09-17 23:49:40 -07:00
|
|
|
u128 ARM_Dynarmic::GetVectorReg(int index) const {
|
2018-02-08 16:04:05 -08:00
|
|
|
return jit->GetVector(index);
|
2016-09-01 20:07:14 -07:00
|
|
|
}
|
|
|
|
|
2018-09-17 23:49:40 -07:00
|
|
|
void ARM_Dynarmic::SetVectorReg(int index, u128 value) {
|
2018-02-08 16:04:05 -08:00
|
|
|
jit->SetVector(index, value);
|
2016-09-01 20:07:14 -07:00
|
|
|
}
|
|
|
|
|
2018-09-17 23:49:40 -07:00
|
|
|
u32 ARM_Dynarmic::GetPSTATE() const {
|
2018-02-08 16:04:05 -08:00
|
|
|
return jit->GetPstate();
|
2016-09-01 20:07:14 -07:00
|
|
|
}
|
|
|
|
|
2018-09-17 23:49:40 -07:00
|
|
|
void ARM_Dynarmic::SetPSTATE(u32 pstate) {
|
|
|
|
jit->SetPstate(pstate);
|
2016-09-01 20:07:14 -07:00
|
|
|
}
|
|
|
|
|
2018-01-09 13:33:46 -08:00
|
|
|
u64 ARM_Dynarmic::GetTlsAddress() const {
|
2018-02-12 13:53:32 -08:00
|
|
|
return cb->tpidrro_el0;
|
2017-09-30 11:16:39 -07:00
|
|
|
}
|
|
|
|
|
2018-07-31 04:58:24 -07:00
|
|
|
void ARM_Dynarmic::SetTlsAddress(VAddr address) {
|
2018-02-12 13:53:32 -08:00
|
|
|
cb->tpidrro_el0 = address;
|
2017-09-30 11:16:39 -07:00
|
|
|
}
|
|
|
|
|
2018-07-20 17:57:45 -07:00
|
|
|
u64 ARM_Dynarmic::GetTPIDR_EL0() const {
|
|
|
|
return cb->tpidr_el0;
|
|
|
|
}
|
|
|
|
|
|
|
|
void ARM_Dynarmic::SetTPIDR_EL0(u64 value) {
|
|
|
|
cb->tpidr_el0 = value;
|
|
|
|
}
|
|
|
|
|
2018-07-31 04:56:57 -07:00
|
|
|
void ARM_Dynarmic::SaveContext(ThreadContext& ctx) {
|
2018-02-08 16:04:05 -08:00
|
|
|
ctx.cpu_registers = jit->GetRegisters();
|
|
|
|
ctx.sp = jit->GetSP();
|
|
|
|
ctx.pc = jit->GetPC();
|
2018-09-17 23:49:40 -07:00
|
|
|
ctx.pstate = jit->GetPstate();
|
|
|
|
ctx.vector_registers = jit->GetVectors();
|
|
|
|
ctx.fpcr = jit->GetFpcr();
|
2018-09-29 14:58:26 -07:00
|
|
|
ctx.fpsr = jit->GetFpsr();
|
|
|
|
ctx.tpidr = cb->tpidr_el0;
|
2016-09-01 20:07:14 -07:00
|
|
|
}
|
|
|
|
|
2018-07-31 04:56:57 -07:00
|
|
|
void ARM_Dynarmic::LoadContext(const ThreadContext& ctx) {
|
2018-02-08 16:04:05 -08:00
|
|
|
jit->SetRegisters(ctx.cpu_registers);
|
|
|
|
jit->SetSP(ctx.sp);
|
|
|
|
jit->SetPC(ctx.pc);
|
2018-09-29 14:58:26 -07:00
|
|
|
jit->SetPstate(ctx.pstate);
|
2018-09-17 23:49:40 -07:00
|
|
|
jit->SetVectors(ctx.vector_registers);
|
2018-09-29 14:58:26 -07:00
|
|
|
jit->SetFpcr(ctx.fpcr);
|
|
|
|
jit->SetFpsr(ctx.fpsr);
|
|
|
|
SetTPIDR_EL0(ctx.tpidr);
|
2016-09-01 20:07:14 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
void ARM_Dynarmic::PrepareReschedule() {
|
2018-08-13 05:59:01 -07:00
|
|
|
jit->HaltExecution();
|
2016-09-01 20:07:14 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
void ARM_Dynarmic::ClearInstructionCache() {
|
2018-02-08 16:04:05 -08:00
|
|
|
jit->ClearCache();
|
2016-09-01 20:07:14 -07:00
|
|
|
}
|
2017-09-24 14:44:13 -07:00
|
|
|
|
2018-07-16 03:24:00 -07:00
|
|
|
void ARM_Dynarmic::ClearExclusiveState() {
|
|
|
|
jit->ClearExclusiveState();
|
|
|
|
}
|
|
|
|
|
core/cpu_core_manager: Create threads separately from initialization.
Our initialization process is a little wonky than one would expect when
it comes to code flow. We initialize the CPU last, as opposed to
hardware, where the CPU obviously needs to be first, otherwise nothing
else would work, and we have code that adds checks to get around this.
For example, in the page table setting code, we check to see if the
system is turned on before we even notify the CPU instances of a page
table switch. This results in dead code (at the moment), because the
only time a page table switch will occur is when the system is *not*
running, preventing the emulated CPU instances from being notified of a
page table switch in a convenient manner (technically the code path
could be taken, but we don't emulate the process creation svc handlers
yet).
This moves the threads creation into its own member function of the core
manager and restores a little order (and predictability) to our
initialization process.
Previously, in the multi-threaded cases, we'd kick off several threads
before even the main kernel process was created and ready to execute (gross!).
Now the initialization process is like so:
Initialization:
1. Timers
2. CPU
3. Kernel
4. Filesystem stuff (kind of gross, but can be amended trivially)
5. Applet stuff (ditto in terms of being kind of gross)
6. Main process (will be moved into the loading step in a following
change)
7. Telemetry (this should be initialized last in the future).
8. Services (4 and 5 should ideally be alongside this).
9. GDB (gross. Uses namespace scope state. Needs to be refactored into a
class or booted altogether).
10. Renderer
11. GPU (will also have its threads created in a separate step in a
following change).
Which... isn't *ideal* per-se, however getting rid of the wonky
intertwining of CPU state initialization out of this mix gets rid of
most of the footguns when it comes to our initialization process.
2019-04-09 10:25:54 -07:00
|
|
|
void ARM_Dynarmic::PageTableChanged(Common::PageTable& page_table,
|
|
|
|
std::size_t new_address_space_size_in_bits) {
|
|
|
|
jit = MakeJit(page_table, new_address_space_size_in_bits);
|
2017-09-24 14:44:13 -07:00
|
|
|
}
|
2018-07-03 06:28:46 -07:00
|
|
|
|
2018-09-15 06:21:06 -07:00
|
|
|
DynarmicExclusiveMonitor::DynarmicExclusiveMonitor(std::size_t core_count) : monitor(core_count) {}
|
2018-07-03 06:28:46 -07:00
|
|
|
DynarmicExclusiveMonitor::~DynarmicExclusiveMonitor() = default;
|
|
|
|
|
2018-09-15 06:21:06 -07:00
|
|
|
void DynarmicExclusiveMonitor::SetExclusive(std::size_t core_index, VAddr addr) {
|
2018-07-03 06:28:46 -07:00
|
|
|
// Size doesn't actually matter.
|
|
|
|
monitor.Mark(core_index, addr, 16);
|
|
|
|
}
|
|
|
|
|
|
|
|
void DynarmicExclusiveMonitor::ClearExclusive() {
|
|
|
|
monitor.Clear();
|
|
|
|
}
|
|
|
|
|
2018-09-15 06:21:06 -07:00
|
|
|
bool DynarmicExclusiveMonitor::ExclusiveWrite8(std::size_t core_index, VAddr vaddr, u8 value) {
|
2018-07-03 06:28:46 -07:00
|
|
|
return monitor.DoExclusiveOperation(core_index, vaddr, 1,
|
|
|
|
[&] { Memory::Write8(vaddr, value); });
|
|
|
|
}
|
|
|
|
|
2018-09-15 06:21:06 -07:00
|
|
|
bool DynarmicExclusiveMonitor::ExclusiveWrite16(std::size_t core_index, VAddr vaddr, u16 value) {
|
2018-07-03 06:28:46 -07:00
|
|
|
return monitor.DoExclusiveOperation(core_index, vaddr, 2,
|
|
|
|
[&] { Memory::Write16(vaddr, value); });
|
|
|
|
}
|
|
|
|
|
2018-09-15 06:21:06 -07:00
|
|
|
bool DynarmicExclusiveMonitor::ExclusiveWrite32(std::size_t core_index, VAddr vaddr, u32 value) {
|
2018-07-03 06:28:46 -07:00
|
|
|
return monitor.DoExclusiveOperation(core_index, vaddr, 4,
|
|
|
|
[&] { Memory::Write32(vaddr, value); });
|
|
|
|
}
|
|
|
|
|
2018-09-15 06:21:06 -07:00
|
|
|
bool DynarmicExclusiveMonitor::ExclusiveWrite64(std::size_t core_index, VAddr vaddr, u64 value) {
|
2018-07-03 06:28:46 -07:00
|
|
|
return monitor.DoExclusiveOperation(core_index, vaddr, 8,
|
|
|
|
[&] { Memory::Write64(vaddr, value); });
|
|
|
|
}
|
|
|
|
|
2018-09-15 06:21:06 -07:00
|
|
|
bool DynarmicExclusiveMonitor::ExclusiveWrite128(std::size_t core_index, VAddr vaddr, u128 value) {
|
2018-07-03 06:28:46 -07:00
|
|
|
return monitor.DoExclusiveOperation(core_index, vaddr, 16, [&] {
|
2018-09-18 00:54:05 -07:00
|
|
|
Memory::Write64(vaddr + 0, value[0]);
|
|
|
|
Memory::Write64(vaddr + 8, value[1]);
|
2018-07-03 06:28:46 -07:00
|
|
|
});
|
|
|
|
}
|
2018-08-24 18:43:32 -07:00
|
|
|
|
|
|
|
} // namespace Core
|