mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-02 07:32:52 +00:00
Use movaps / movapd (instead of movss / movsd) to do FR32 / FR64 reg to reg
transfer. According to the Intel P4 Optimization Manual: Moves that write a portion of a register can introduce unwanted dependences. The movsd reg, reg instruction writes only the bottom 64 bits of a register, not all 128 bits. This introduces a dependence on the preceding instruction that produces the upper 64 bits (even if those bits are no longer wanted). The dependence inhibits register renaming, and thereby reduces parallelism. Not to mention movaps is shorter than movss. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@26226 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
f17c42d409
commit
d51425a82d
@ -106,9 +106,9 @@ void X86RegisterInfo::copyRegToReg(MachineBasicBlock &MBB,
|
||||
} else if (RC == &X86::RFPRegClass || RC == &X86::RSTRegClass) {
|
||||
Opc = X86::FpMOV;
|
||||
} else if (RC == &X86::FR32RegClass || RC == &X86::V4F4RegClass) {
|
||||
Opc = X86::MOVSSrr;
|
||||
Opc = X86::MOVAPSrr;
|
||||
} else if (RC == &X86::FR64RegClass || RC == &X86::V2F8RegClass) {
|
||||
Opc = X86::MOVSDrr;
|
||||
Opc = X86::MOVAPDrr;
|
||||
} else {
|
||||
assert(0 && "Unknown regclass");
|
||||
abort();
|
||||
|
Loading…
Reference in New Issue
Block a user