Merge pull request #8027 from MerryMage/MOVAPS

Jit64: Prefer MOVAPS where possible
2025-07-25 07:09:48 -06:00 · 2019-05-22 15:05:17 +10:00
parent 57fbf1cd6e e06111e86f
commit 68877c52d1
2 changed files with 18 additions and 8 deletions
--- a/Source/Core/Common/x64Emitter.cpp
+++ b/Source/Core/Common/x64Emitter.cpp
@@ -2180,7 +2180,11 @@ void XEmitter::MOVAPS(X64Reg regOp, const OpArg& arg)
 }
 void XEmitter::MOVAPD(X64Reg regOp, const OpArg& arg)
 {
-  WriteSSEOp(0x66, sseMOVAPfromRM, regOp, arg);
+  // Prefer MOVAPS to MOVAPD as there is no reason to use MOVAPD over MOVAPS:
+  // - They have equivalent functionality.
+  // - There has never been a microarchitecture with separate single and double domains.
+  // - MOVAPD is one byte longer than MOVAPS.
+  MOVAPS(regOp, arg);
 }
 void XEmitter::MOVAPS(const OpArg& arg, X64Reg regOp)
 {
@@ -2188,7 +2192,7 @@ void XEmitter::MOVAPS(const OpArg& arg, X64Reg regOp)
 }
 void XEmitter::MOVAPD(const OpArg& arg, X64Reg regOp)
 {
-  WriteSSEOp(0x66, sseMOVAPtoRM, regOp, arg);
+  MOVAPS(arg, regOp);
 }
 void XEmitter::MOVUPS(X64Reg regOp, const OpArg& arg)
@@ -2425,8 +2429,14 @@ void XEmitter::MOVDDUP(X64Reg regOp, const OpArg& arg)
  }
  else
  {
-    if (!arg.IsSimpleReg(regOp))
+    if (!arg.IsSimpleReg())
+    {
      MOVSD(regOp, arg);
+    }
+    else if (regOp != arg.GetSimpleReg())
+    {
+      MOVAPD(regOp, arg);
+    }
    UNPCKLPD(regOp, R(regOp));
  }
 }
--- a/Source/Core/Core/PowerPC/Jit64Common/EmuCodeBlock.cpp
+++ b/Source/Core/Core/PowerPC/Jit64Common/EmuCodeBlock.cpp
@@ -894,7 +894,7 @@ alignas(16) static const __m128i double_qnan_bit = _mm_set_epi64x(0xffffffffffff
 // unless the exponent is in the range of 874 to 896.
 void EmuCodeBlock::ConvertDoubleToSingle(X64Reg dst, X64Reg src)
 {
-  MOVSD(XMM1, R(src));
+  MOVAPD(XMM1, R(src));
  // Grab Exponent
  PAND(XMM1, MConst(double_exponent));
@@ -914,7 +914,7 @@ void EmuCodeBlock::ConvertDoubleToSingle(X64Reg dst, X64Reg src)
  PSUBQ(XMM0, R(XMM1));
  // xmm1 = fraction | 0x0010000000000000
-  MOVSD(XMM1, R(src));
+  MOVAPD(XMM1, R(src));
  PAND(XMM1, MConst(double_fraction));
  POR(XMM1, MConst(double_explicit_top_bit));
@@ -922,7 +922,7 @@ void EmuCodeBlock::ConvertDoubleToSingle(X64Reg dst, X64Reg src)
  PSRLQ(XMM1, R(XMM0));
  // OR the sign bit in.
-  MOVSD(XMM0, R(src));
+  MOVAPD(XMM0, R(src));
  PAND(XMM0, MConst(double_sign_bit));
  PSRLQ(XMM0, 32);
  POR(XMM1, R(XMM0));
@@ -934,12 +934,12 @@ void EmuCodeBlock::ConvertDoubleToSingle(X64Reg dst, X64Reg src)
  // Don't Denormalize
  // We want bits 0, 1
-  MOVSD(XMM1, R(src));
+  MOVAPD(XMM1, R(src));
  PAND(XMM1, MConst(double_top_two_bits));
  PSRLQ(XMM1, 32);
  // And 5 through to 34
-  MOVSD(XMM0, R(src));
+  MOVAPD(XMM0, R(src));
  PAND(XMM0, MConst(double_bottom_bits));
  PSRLQ(XMM0, 29);