diff options
| author | 2020-06-16 23:44:48 -0400 | |
|---|---|---|
| committer | 2020-06-16 23:44:48 -0400 | |
| commit | b660ef6c8a524eaacfbf607cc4cae8eeddf88131 (patch) | |
| tree | 82266bbfd000c1a29e2888f3be2503a5677292e4 /src | |
| parent | Merge pull request #3976 from Neodyblue/qdarkstyle_fix_prop (diff) | |
| parent | macro_jit_x64: Remove NEXT_PARAMETER (diff) | |
| download | yuzu-b660ef6c8a524eaacfbf607cc4cae8eeddf88131.tar.gz yuzu-b660ef6c8a524eaacfbf607cc4cae8eeddf88131.tar.xz yuzu-b660ef6c8a524eaacfbf607cc4cae8eeddf88131.zip | |
Merge pull request #4089 from MerryMage/macrojit-cleanup-1
macro_jit_x64: Cleanup
Diffstat (limited to '')
| -rw-r--r-- | src/video_core/macro/macro_jit_x64.cpp | 64 | ||||
| -rw-r--r-- | src/video_core/macro/macro_jit_x64.h | 5 |
2 files changed, 18 insertions, 51 deletions
diff --git a/src/video_core/macro/macro_jit_x64.cpp b/src/video_core/macro/macro_jit_x64.cpp index 11c1cc3be..2eb98173d 100644 --- a/src/video_core/macro/macro_jit_x64.cpp +++ b/src/video_core/macro/macro_jit_x64.cpp | |||
| @@ -14,22 +14,16 @@ MICROPROFILE_DEFINE(MacroJitCompile, "GPU", "Compile macro JIT", MP_RGB(173, 255 | |||
| 14 | MICROPROFILE_DEFINE(MacroJitExecute, "GPU", "Execute macro JIT", MP_RGB(255, 255, 0)); | 14 | MICROPROFILE_DEFINE(MacroJitExecute, "GPU", "Execute macro JIT", MP_RGB(255, 255, 0)); |
| 15 | 15 | ||
| 16 | namespace Tegra { | 16 | namespace Tegra { |
| 17 | static const Xbyak::Reg64 PARAMETERS = Xbyak::util::r9; | 17 | static const Xbyak::Reg64 STATE = Xbyak::util::rbx; |
| 18 | static const Xbyak::Reg64 REGISTERS = Xbyak::util::r10; | 18 | static const Xbyak::Reg32 RESULT = Xbyak::util::ebp; |
| 19 | static const Xbyak::Reg64 STATE = Xbyak::util::r11; | 19 | static const Xbyak::Reg64 PARAMETERS = Xbyak::util::r12; |
| 20 | static const Xbyak::Reg64 NEXT_PARAMETER = Xbyak::util::r12; | ||
| 21 | static const Xbyak::Reg32 RESULT = Xbyak::util::r13d; | ||
| 22 | static const Xbyak::Reg64 RESULT_64 = Xbyak::util::r13; | ||
| 23 | static const Xbyak::Reg32 METHOD_ADDRESS = Xbyak::util::r14d; | 20 | static const Xbyak::Reg32 METHOD_ADDRESS = Xbyak::util::r14d; |
| 24 | static const Xbyak::Reg64 METHOD_ADDRESS_64 = Xbyak::util::r14; | ||
| 25 | static const Xbyak::Reg64 BRANCH_HOLDER = Xbyak::util::r15; | 21 | static const Xbyak::Reg64 BRANCH_HOLDER = Xbyak::util::r15; |
| 26 | 22 | ||
| 27 | static const std::bitset<32> PERSISTENT_REGISTERS = Common::X64::BuildRegSet({ | 23 | static const std::bitset<32> PERSISTENT_REGISTERS = Common::X64::BuildRegSet({ |
| 28 | PARAMETERS, | ||
| 29 | REGISTERS, | ||
| 30 | STATE, | 24 | STATE, |
| 31 | NEXT_PARAMETER, | ||
| 32 | RESULT, | 25 | RESULT, |
| 26 | PARAMETERS, | ||
| 33 | METHOD_ADDRESS, | 27 | METHOD_ADDRESS, |
| 34 | BRANCH_HOLDER, | 28 | BRANCH_HOLDER, |
| 35 | }); | 29 | }); |
| @@ -53,8 +47,7 @@ void MacroJITx64Impl::Execute(const std::vector<u32>& parameters, u32 method) { | |||
| 53 | JITState state{}; | 47 | JITState state{}; |
| 54 | state.maxwell3d = &maxwell3d; | 48 | state.maxwell3d = &maxwell3d; |
| 55 | state.registers = {}; | 49 | state.registers = {}; |
| 56 | state.parameters = parameters.data(); | 50 | program(&state, parameters.data()); |
| 57 | program(&state); | ||
| 58 | } | 51 | } |
| 59 | 52 | ||
| 60 | void MacroJITx64Impl::Compile_ALU(Macro::Opcode opcode) { | 53 | void MacroJITx64Impl::Compile_ALU(Macro::Opcode opcode) { |
| @@ -64,18 +57,18 @@ void MacroJITx64Impl::Compile_ALU(Macro::Opcode opcode) { | |||
| 64 | const bool is_move_operation = !is_a_zero && is_b_zero; | 57 | const bool is_move_operation = !is_a_zero && is_b_zero; |
| 65 | const bool has_zero_register = is_a_zero || is_b_zero; | 58 | const bool has_zero_register = is_a_zero || is_b_zero; |
| 66 | 59 | ||
| 67 | Xbyak::Reg64 src_a; | 60 | Xbyak::Reg32 src_a; |
| 68 | Xbyak::Reg32 src_b; | 61 | Xbyak::Reg32 src_b; |
| 69 | 62 | ||
| 70 | if (!optimizer.zero_reg_skip) { | 63 | if (!optimizer.zero_reg_skip) { |
| 71 | src_a = Compile_GetRegister(opcode.src_a, RESULT_64); | 64 | src_a = Compile_GetRegister(opcode.src_a, RESULT); |
| 72 | src_b = Compile_GetRegister(opcode.src_b, ebx); | 65 | src_b = Compile_GetRegister(opcode.src_b, eax); |
| 73 | } else { | 66 | } else { |
| 74 | if (!is_a_zero) { | 67 | if (!is_a_zero) { |
| 75 | src_a = Compile_GetRegister(opcode.src_a, RESULT_64); | 68 | src_a = Compile_GetRegister(opcode.src_a, RESULT); |
| 76 | } | 69 | } |
| 77 | if (!is_b_zero) { | 70 | if (!is_b_zero) { |
| 78 | src_b = Compile_GetRegister(opcode.src_b, ebx); | 71 | src_b = Compile_GetRegister(opcode.src_b, eax); |
| 79 | } | 72 | } |
| 80 | } | 73 | } |
| 81 | Xbyak::Label skip_carry{}; | 74 | Xbyak::Label skip_carry{}; |
| @@ -329,7 +322,7 @@ void Tegra::MacroJITx64Impl::Compile_Send(Xbyak::Reg32 value) { | |||
| 329 | and_(METHOD_ADDRESS, 0xfff); | 322 | and_(METHOD_ADDRESS, 0xfff); |
| 330 | shr(ecx, 12); | 323 | shr(ecx, 12); |
| 331 | and_(ecx, 0x3f); | 324 | and_(ecx, 0x3f); |
| 332 | lea(eax, ptr[rcx + METHOD_ADDRESS_64]); | 325 | lea(eax, ptr[rcx + METHOD_ADDRESS.cvt64()]); |
| 333 | sal(ecx, 12); | 326 | sal(ecx, 12); |
| 334 | or_(eax, ecx); | 327 | or_(eax, ecx); |
| 335 | 328 | ||
| @@ -424,16 +417,12 @@ void MacroJITx64Impl::Compile() { | |||
| 424 | Common::X64::ABI_PushRegistersAndAdjustStackGPS(*this, Common::X64::ABI_ALL_CALLEE_SAVED, 8); | 417 | Common::X64::ABI_PushRegistersAndAdjustStackGPS(*this, Common::X64::ABI_ALL_CALLEE_SAVED, 8); |
| 425 | // JIT state | 418 | // JIT state |
| 426 | mov(STATE, Common::X64::ABI_PARAM1); | 419 | mov(STATE, Common::X64::ABI_PARAM1); |
| 427 | mov(PARAMETERS, qword[Common::X64::ABI_PARAM1 + | 420 | mov(PARAMETERS, Common::X64::ABI_PARAM2); |
| 428 | static_cast<Xbyak::uint32>(offsetof(JITState, parameters))]); | ||
| 429 | mov(REGISTERS, Common::X64::ABI_PARAM1); | ||
| 430 | add(REGISTERS, static_cast<Xbyak::uint32>(offsetof(JITState, registers))); | ||
| 431 | xor_(RESULT, RESULT); | 421 | xor_(RESULT, RESULT); |
| 432 | xor_(METHOD_ADDRESS, METHOD_ADDRESS); | 422 | xor_(METHOD_ADDRESS, METHOD_ADDRESS); |
| 433 | xor_(NEXT_PARAMETER, NEXT_PARAMETER); | ||
| 434 | xor_(BRANCH_HOLDER, BRANCH_HOLDER); | 423 | xor_(BRANCH_HOLDER, BRANCH_HOLDER); |
| 435 | 424 | ||
| 436 | mov(dword[REGISTERS + 4], Compile_FetchParameter()); | 425 | mov(dword[STATE + offsetof(JITState, registers) + 4], Compile_FetchParameter()); |
| 437 | 426 | ||
| 438 | // Track get register for zero registers and mark it as no-op | 427 | // Track get register for zero registers and mark it as no-op |
| 439 | optimizer.zero_reg_skip = true; | 428 | optimizer.zero_reg_skip = true; |
| @@ -537,8 +526,8 @@ bool MacroJITx64Impl::Compile_NextInstruction() { | |||
| 537 | } | 526 | } |
| 538 | 527 | ||
| 539 | Xbyak::Reg32 Tegra::MacroJITx64Impl::Compile_FetchParameter() { | 528 | Xbyak::Reg32 Tegra::MacroJITx64Impl::Compile_FetchParameter() { |
| 540 | mov(eax, dword[PARAMETERS + NEXT_PARAMETER * sizeof(u32)]); | 529 | mov(eax, dword[PARAMETERS]); |
| 541 | inc(NEXT_PARAMETER); | 530 | add(PARAMETERS, sizeof(u32)); |
| 542 | return eax; | 531 | return eax; |
| 543 | } | 532 | } |
| 544 | 533 | ||
| @@ -547,31 +536,12 @@ Xbyak::Reg32 MacroJITx64Impl::Compile_GetRegister(u32 index, Xbyak::Reg32 dst) { | |||
| 547 | // Register 0 is always zero | 536 | // Register 0 is always zero |
| 548 | xor_(dst, dst); | 537 | xor_(dst, dst); |
| 549 | } else { | 538 | } else { |
| 550 | mov(dst, dword[REGISTERS + index * sizeof(u32)]); | 539 | mov(dst, dword[STATE + offsetof(JITState, registers) + index * sizeof(u32)]); |
| 551 | } | 540 | } |
| 552 | 541 | ||
| 553 | return dst; | 542 | return dst; |
| 554 | } | 543 | } |
| 555 | 544 | ||
| 556 | Xbyak::Reg64 Tegra::MacroJITx64Impl::Compile_GetRegister(u32 index, Xbyak::Reg64 dst) { | ||
| 557 | if (index == 0) { | ||
| 558 | // Register 0 is always zero | ||
| 559 | xor_(dst, dst); | ||
| 560 | } else { | ||
| 561 | mov(dst, dword[REGISTERS + index * sizeof(u32)]); | ||
| 562 | } | ||
| 563 | |||
| 564 | return dst; | ||
| 565 | } | ||
| 566 | |||
| 567 | void Tegra::MacroJITx64Impl::Compile_WriteCarry(Xbyak::Reg64 dst) { | ||
| 568 | Xbyak::Label zero{}, end{}; | ||
| 569 | xor_(ecx, ecx); | ||
| 570 | shr(dst, 32); | ||
| 571 | setne(cl); | ||
| 572 | mov(dword[STATE + offsetof(JITState, carry_flag)], ecx); | ||
| 573 | } | ||
| 574 | |||
| 575 | void MacroJITx64Impl::Compile_ProcessResult(Macro::ResultOperation operation, u32 reg) { | 545 | void MacroJITx64Impl::Compile_ProcessResult(Macro::ResultOperation operation, u32 reg) { |
| 576 | auto SetRegister = [=](u32 reg, Xbyak::Reg32 result) { | 546 | auto SetRegister = [=](u32 reg, Xbyak::Reg32 result) { |
| 577 | // Register 0 is supposed to always return 0. NOP is implemented as a store to the zero | 547 | // Register 0 is supposed to always return 0. NOP is implemented as a store to the zero |
| @@ -579,7 +549,7 @@ void MacroJITx64Impl::Compile_ProcessResult(Macro::ResultOperation operation, u3 | |||
| 579 | if (reg == 0) { | 549 | if (reg == 0) { |
| 580 | return; | 550 | return; |
| 581 | } | 551 | } |
| 582 | mov(dword[REGISTERS + reg * sizeof(u32)], result); | 552 | mov(dword[STATE + offsetof(JITState, registers) + reg * sizeof(u32)], result); |
| 583 | }; | 553 | }; |
| 584 | auto SetMethodAddress = [=](Xbyak::Reg32 reg) { mov(METHOD_ADDRESS, reg); }; | 554 | auto SetMethodAddress = [=](Xbyak::Reg32 reg) { mov(METHOD_ADDRESS, reg); }; |
| 585 | 555 | ||
diff --git a/src/video_core/macro/macro_jit_x64.h b/src/video_core/macro/macro_jit_x64.h index 71f738b9a..51ec090b8 100644 --- a/src/video_core/macro/macro_jit_x64.h +++ b/src/video_core/macro/macro_jit_x64.h | |||
| @@ -55,8 +55,6 @@ private: | |||
| 55 | 55 | ||
| 56 | Xbyak::Reg32 Compile_FetchParameter(); | 56 | Xbyak::Reg32 Compile_FetchParameter(); |
| 57 | Xbyak::Reg32 Compile_GetRegister(u32 index, Xbyak::Reg32 dst); | 57 | Xbyak::Reg32 Compile_GetRegister(u32 index, Xbyak::Reg32 dst); |
| 58 | Xbyak::Reg64 Compile_GetRegister(u32 index, Xbyak::Reg64 dst); | ||
| 59 | void Compile_WriteCarry(Xbyak::Reg64 dst); | ||
| 60 | 58 | ||
| 61 | void Compile_ProcessResult(Macro::ResultOperation operation, u32 reg); | 59 | void Compile_ProcessResult(Macro::ResultOperation operation, u32 reg); |
| 62 | void Compile_Send(Xbyak::Reg32 value); | 60 | void Compile_Send(Xbyak::Reg32 value); |
| @@ -67,11 +65,10 @@ private: | |||
| 67 | struct JITState { | 65 | struct JITState { |
| 68 | Engines::Maxwell3D* maxwell3d{}; | 66 | Engines::Maxwell3D* maxwell3d{}; |
| 69 | std::array<u32, Macro::NUM_MACRO_REGISTERS> registers{}; | 67 | std::array<u32, Macro::NUM_MACRO_REGISTERS> registers{}; |
| 70 | const u32* parameters{}; | ||
| 71 | u32 carry_flag{}; | 68 | u32 carry_flag{}; |
| 72 | }; | 69 | }; |
| 73 | static_assert(offsetof(JITState, maxwell3d) == 0, "Maxwell3D is not at 0x0"); | 70 | static_assert(offsetof(JITState, maxwell3d) == 0, "Maxwell3D is not at 0x0"); |
| 74 | using ProgramType = void (*)(JITState*); | 71 | using ProgramType = void (*)(JITState*, const u32*); |
| 75 | 72 | ||
| 76 | struct OptimizerState { | 73 | struct OptimizerState { |
| 77 | bool can_skip_carry{}; | 74 | bool can_skip_carry{}; |