emit_x64_vector: Changes to VectorSignedSaturatedDoublingMultiply

* Return both the upper and lower parts of the multiply if required.
* SSE2 does not support the pmuldq instruction, so apply a sign correction to an unsigned result instead.
* Improve port utilisation where possible (punpck instructions were a bottleneck).
2026-01-03 21:24:38 +01:00 · 2018-09-15 09:04:19 +01:00 · 2018-09-15 09:04:19 +01:00 · 06b31448aa
commit 06b31448aa
parent 08c0e017a5
8 changed files with 233 additions and 70 deletions
--- a/src/frontend/ir/microinstruction.cpp
+++ b/src/frontend/ir/microinstruction.cpp
@@ -361,8 +361,6 @@ bool Inst::WritesToFPSRCumulativeSaturationBit() const {
    case Opcode::VectorSignedSaturatedNarrowToUnsigned16:
    case Opcode::VectorSignedSaturatedNarrowToUnsigned32:
    case Opcode::VectorSignedSaturatedNarrowToUnsigned64:
-    case Opcode::VectorSignedSaturatedDoublingMultiplyReturnHigh16:
-    case Opcode::VectorSignedSaturatedDoublingMultiplyReturnHigh32:
    case Opcode::VectorSignedSaturatedNeg8:
    case Opcode::VectorSignedSaturatedNeg16:
    case Opcode::VectorSignedSaturatedNeg32: