mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-05-29 07:39:27 +00:00
Revert "X86 memcpy lowering: use "rep movs" even when esi is used as base pointer" (r204174)
> For functions where esi is used as base pointer, we would previously fall ba > from lowering memcpy with "rep movs" because that clobbers esi. > > With this patch, we just store esi in another physical register, and restore > it afterwards. This adds a little bit of register preassure, but the more > efficient memcpy should be worth it. > > Differential Revision: http://llvm-reviews.chandlerc.com/D2968 This didn't work. I was ending up with code like this: lea edi,[esi+38h] mov ecx,0Fh mov edx,esi mov esi,ebx rep movs dword ptr es:[edi],dword ptr [esi] lea ecx,[esi+74h] <-- Ooops, we're now using esi before restoring it from edx. add ebx,3Ch mov esi,edx I guess if we want to do this we need stronger glue or something, or doing the expansion much later. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@204829 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
7363d2223e
commit
b82f8a28e8
@ -200,11 +200,13 @@ X86SelectionDAGInfo::EmitTargetCodeForMemcpy(SelectionDAG &DAG, SDLoc dl,
|
|||||||
SrcPtrInfo.getAddrSpace() >= 256)
|
SrcPtrInfo.getAddrSpace() >= 256)
|
||||||
return SDValue();
|
return SDValue();
|
||||||
|
|
||||||
// If ESI is used as a base pointer, we must preserve it when doing rep movs.
|
// ESI might be used as a base pointer, in that case we can't simply overwrite
|
||||||
|
// the register. Fall back to generic code.
|
||||||
const X86RegisterInfo *TRI =
|
const X86RegisterInfo *TRI =
|
||||||
static_cast<const X86RegisterInfo *>(DAG.getTarget().getRegisterInfo());
|
static_cast<const X86RegisterInfo *>(DAG.getTarget().getRegisterInfo());
|
||||||
bool PreserveESI = TRI->hasBasePointer(DAG.getMachineFunction()) &&
|
if (TRI->hasBasePointer(DAG.getMachineFunction()) &&
|
||||||
TRI->getBaseRegister() == X86::ESI;
|
TRI->getBaseRegister() == X86::ESI)
|
||||||
|
return SDValue();
|
||||||
|
|
||||||
MVT AVT;
|
MVT AVT;
|
||||||
if (Align & 1)
|
if (Align & 1)
|
||||||
@ -223,45 +225,27 @@ X86SelectionDAGInfo::EmitTargetCodeForMemcpy(SelectionDAG &DAG, SDLoc dl,
|
|||||||
SDValue Count = DAG.getIntPtrConstant(CountVal);
|
SDValue Count = DAG.getIntPtrConstant(CountVal);
|
||||||
unsigned BytesLeft = SizeVal % UBytes;
|
unsigned BytesLeft = SizeVal % UBytes;
|
||||||
|
|
||||||
|
SDValue InFlag(0, 0);
|
||||||
if (PreserveESI) {
|
|
||||||
// Save ESI to a physical register. (We cannot use a virtual register
|
|
||||||
// because if it is spilled we wouldn't be able to reload it.)
|
|
||||||
// We don't glue this because the register dependencies are explicit.
|
|
||||||
Chain = DAG.getCopyToReg(Chain, dl, X86::EDX,
|
|
||||||
DAG.getRegister(X86::ESI, MVT::i32));
|
|
||||||
}
|
|
||||||
|
|
||||||
SDValue InGlue(0, 0);
|
|
||||||
Chain = DAG.getCopyToReg(Chain, dl, Subtarget->is64Bit() ? X86::RCX :
|
Chain = DAG.getCopyToReg(Chain, dl, Subtarget->is64Bit() ? X86::RCX :
|
||||||
X86::ECX,
|
X86::ECX,
|
||||||
Count, InGlue);
|
Count, InFlag);
|
||||||
InGlue = Chain.getValue(1);
|
InFlag = Chain.getValue(1);
|
||||||
Chain = DAG.getCopyToReg(Chain, dl, Subtarget->is64Bit() ? X86::RDI :
|
Chain = DAG.getCopyToReg(Chain, dl, Subtarget->is64Bit() ? X86::RDI :
|
||||||
X86::EDI,
|
X86::EDI,
|
||||||
Dst, InGlue);
|
Dst, InFlag);
|
||||||
InGlue = Chain.getValue(1);
|
InFlag = Chain.getValue(1);
|
||||||
Chain = DAG.getCopyToReg(Chain, dl, Subtarget->is64Bit() ? X86::RSI :
|
Chain = DAG.getCopyToReg(Chain, dl, Subtarget->is64Bit() ? X86::RSI :
|
||||||
X86::ESI,
|
X86::ESI,
|
||||||
Src, InGlue);
|
Src, InFlag);
|
||||||
InGlue = Chain.getValue(1);
|
InFlag = Chain.getValue(1);
|
||||||
|
|
||||||
SDVTList Tys = DAG.getVTList(MVT::Other, MVT::Glue);
|
SDVTList Tys = DAG.getVTList(MVT::Other, MVT::Glue);
|
||||||
SDValue Ops[] = { Chain, DAG.getValueType(AVT), InGlue };
|
SDValue Ops[] = { Chain, DAG.getValueType(AVT), InFlag };
|
||||||
// FIXME: Make X86rep_movs explicitly use FCX, RDI, RSI instead of glue.
|
|
||||||
SDValue RepMovs = DAG.getNode(X86ISD::REP_MOVS, dl, Tys, Ops,
|
SDValue RepMovs = DAG.getNode(X86ISD::REP_MOVS, dl, Tys, Ops,
|
||||||
array_lengthof(Ops));
|
array_lengthof(Ops));
|
||||||
|
|
||||||
if (PreserveESI) {
|
|
||||||
InGlue = RepMovs.getValue(1);
|
|
||||||
RepMovs = DAG.getCopyToReg(RepMovs, dl, X86::ESI,
|
|
||||||
DAG.getRegister(X86::EDX, MVT::i32), InGlue);
|
|
||||||
}
|
|
||||||
|
|
||||||
SmallVector<SDValue, 4> Results;
|
SmallVector<SDValue, 4> Results;
|
||||||
Results.push_back(RepMovs);
|
Results.push_back(RepMovs);
|
||||||
|
|
||||||
|
|
||||||
if (BytesLeft) {
|
if (BytesLeft) {
|
||||||
// Handle the last 1 - 7 bytes.
|
// Handle the last 1 - 7 bytes.
|
||||||
unsigned Offset = SizeVal - BytesLeft;
|
unsigned Offset = SizeVal - BytesLeft;
|
||||||
|
@ -13,7 +13,5 @@ define void @test1(%struct.foo* nocapture %x, i32 %y, i8* %z) nounwind {
|
|||||||
|
|
||||||
; CHECK-LABEL: test1:
|
; CHECK-LABEL: test1:
|
||||||
; CHECK: movl %esp, %esi
|
; CHECK: movl %esp, %esi
|
||||||
; CHECK: movl %esi, %edx
|
; CHECK-NOT: rep;movsl
|
||||||
; CHECK: rep;movsl
|
|
||||||
; CHECK: movl %edx, %esi
|
|
||||||
}
|
}
|
||||||
|
@ -15,9 +15,7 @@ define void @test1(%struct.foo* nocapture %x, i32 %y) nounwind {
|
|||||||
; CHECK-LABEL: test1:
|
; CHECK-LABEL: test1:
|
||||||
; CHECK: andl $-16, %esp
|
; CHECK: andl $-16, %esp
|
||||||
; CHECK: movl %esp, %esi
|
; CHECK: movl %esp, %esi
|
||||||
; CHECK: movl %esi, %edx
|
; CHECK-NOT: rep;movsl
|
||||||
; CHECK: rep;movsl
|
|
||||||
; CHECK: movl %edx, %esi
|
|
||||||
}
|
}
|
||||||
|
|
||||||
; PR19012
|
; PR19012
|
||||||
@ -30,9 +28,7 @@ define void @test2(%struct.foo* nocapture %x, i32 %y, i8* %z) nounwind {
|
|||||||
|
|
||||||
; CHECK-LABEL: test2:
|
; CHECK-LABEL: test2:
|
||||||
; CHECK: movl %esp, %esi
|
; CHECK: movl %esp, %esi
|
||||||
; CHECK: movl %esi, %edx
|
; CHECK-NOT: rep;movsl
|
||||||
; CHECK: rep;movsl
|
|
||||||
; CHECK: movl %edx, %esi
|
|
||||||
}
|
}
|
||||||
|
|
||||||
; Check that we do use rep movs if we make the alloca static.
|
; Check that we do use rep movs if we make the alloca static.
|
||||||
@ -43,6 +39,5 @@ define void @test3(%struct.foo* nocapture %x, i32 %y, i8* %z) nounwind {
|
|||||||
ret void
|
ret void
|
||||||
|
|
||||||
; CHECK-LABEL: test3:
|
; CHECK-LABEL: test3:
|
||||||
; CHECK-NOT: movl %esi, %edx
|
|
||||||
; CHECK: rep;movsl
|
; CHECK: rep;movsl
|
||||||
}
|
}
|
||||||
|
Loading…
x
Reference in New Issue
Block a user