JIT: update some rather outdated comments

2025-07-26 23:59:54 -06:00 · 2014-09-16 23:10:56 -07:00
parent 978a855d3f
commit 76c8bb40e8
2 changed files with 15 additions and 52 deletions
--- a/Source/Core/Core/PowerPC/Jit64/Jit.cpp
+++ b/Source/Core/Core/PowerPC/Jit64/Jit.cpp
@ -27,10 +27,9 @@
 using namespace Gen;
 using namespace PowerPC;
-// Dolphin's PowerPC->x86 JIT dynamic recompiler
+// Dolphin's PowerPC->x86_64 JIT dynamic recompiler
-// (Nearly) all code by ector (hrydgard)
+// Written mostly by ector (hrydgard)
 // Features:
 // * x86 & x64 support, lots of shared code.
 // * Basic block linking
 // * Fast dispatcher
@ -50,10 +49,6 @@ using namespace PowerPC;
 // Other considerations
 //
 // Many instructions have shorter forms for EAX. However, I believe their performance boost
 // will be as small to be negligible, so I haven't dirtied up the code with that. AMD recommends it in their
 // optimization manuals, though.
 //
 // We support block linking. Reserve space at the exits of every block for a full 5-byte jmp. Save 16-bit offsets
 // from the starts of each block, marking the exits so that they can be nicely patched at any time.
 //
@ -88,48 +83,16 @@ using namespace PowerPC;
    CR2-CR4 are non-volatile, rest of CR is volatile -> dropped on blr.
 	R5-R12 are volatile -> dropped on blr.
  * classic inlining across calls.
-
+  * Track which registers a block clobbers without using, then take advantage of this knowledge
-Low hanging fruit:
+    when compiling a block that links to that block.
-stfd -- guaranteed in memory
+  * Track more dependencies between instructions, e.g. avoiding PPC_FP code, single/double
-cmpl
+    conversion, movddup on non-paired singles, etc where possible.
-mulli
+  * Support loads/stores directly from xmm registers in jit_util and the backpatcher; this might
-stfs
+    help AMD a lot since gpr/xmm transfers are slower there.
-stwu
+  * Smarter register allocation in general; maybe learn to drop values once we know they won't be
-lb/stzx
+    used again before being overwritten?
-
+  * More flexible reordering; there's limits to how far we can go because of exception handling
-bcx - optimize!
+    and such, but it's currently limited to integer ops only. This can definitely be made better.
 bcctr
 stfs
 psq_st
 addx
 orx
 rlwimix
 fcmpo
 DSP_UpdateARAMDMA
 lfd
 stwu
 cntlzwx
 bcctrx
 WriteBigEData
 TODO
 lha
 srawx
 addic_rc
 addex
 subfcx
 subfex
 fmaddx
 fmulx
 faddx
 fnegx
 frspx
 frsqrtex
 ps_sum0
 ps_muls0
 ps_adds1
 */
 void Jit64::Init()
--- a/Source/Core/Core/PowerPC/Jit64/Jit_Branch.cpp
+++ b/Source/Core/Core/PowerPC/Jit64/Jit_Branch.cpp
@ -223,7 +223,7 @@ void Jit64::bclrx(UGeckoInstruction inst)
 	}
 	// This below line can be used to prove that blr "eats flags" in practice.
-		// This observation will let us do a lot of fun observations.
+	// This observation could let us do some useful optimizations.
 #ifdef ACID_TEST
 	AND(32, PPCSTATE(cr), Imm32(~(0xFF000000)));
 #endif