mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-14 00:32:55 +00:00
[mips][msa] Correct the behaviour of the COPY_FW pseudo on lanes 2 and 3.
Summary: Previously, attempting to extract lanes 2 and 3 would actually extract lane 1. The MSA CodeGen tests only covered lanes 0 and 1. Differential Revision: http://llvm-reviews.chandlerc.com/D2935 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@202848 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
80a59df0e7
commit
e06bec47d6
@ -2755,7 +2755,7 @@ emitCOPY_FW(MachineInstr *MI, MachineBasicBlock *BB) const{
|
||||
else {
|
||||
unsigned Wt = RegInfo.createVirtualRegister(&Mips::MSA128WRegClass);
|
||||
|
||||
BuildMI(*BB, MI, DL, TII->get(Mips::SPLATI_W), Wt).addReg(Ws).addImm(1);
|
||||
BuildMI(*BB, MI, DL, TII->get(Mips::SPLATI_W), Wt).addReg(Ws).addImm(Lane);
|
||||
BuildMI(*BB, MI, DL, TII->get(Mips::COPY), Fd).addReg(Wt, 0, Mips::sub_lo);
|
||||
}
|
||||
|
||||
|
@ -137,6 +137,24 @@ define float @extract_v4f32_elt0() nounwind {
|
||||
; MIPS32: .size extract_v4f32_elt0
|
||||
}
|
||||
|
||||
define float @extract_v4f32_elt2() nounwind {
|
||||
; MIPS32: extract_v4f32_elt2:
|
||||
|
||||
%1 = load <4 x float>* @v4f32
|
||||
; MIPS32-DAG: ld.w [[R1:\$w[0-9]+]],
|
||||
|
||||
%2 = fadd <4 x float> %1, %1
|
||||
; MIPS32-DAG: fadd.w [[R2:\$w[0-9]+]], [[R1]], [[R1]]
|
||||
|
||||
%3 = extractelement <4 x float> %2, i32 2
|
||||
; Element 2 can be obtained by splatting it across the vector and extracting
|
||||
; $w0:sub_lo
|
||||
; MIPS32-DAG: splati.w $w0, [[R1]][2]
|
||||
|
||||
ret float %3
|
||||
; MIPS32: .size extract_v4f32_elt2
|
||||
}
|
||||
|
||||
define double @extract_v2f64() nounwind {
|
||||
; MIPS32: extract_v2f64:
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user