mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-14 16:33:28 +00:00
9a1aaeb012
Changes to MIPS SelectionDAG: * Added nodes VEXTRACT_[SZ]EXT_ELT to represent extract and extend in a single operation and implemented the DAG combines necessary to fold sign/zero extends into the extract. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@191199 91177308-0d34-0410-b5e6-96231b3b80d8
347 lines
9.8 KiB
LLVM
347 lines
9.8 KiB
LLVM
; RUN: llc -march=mips -mattr=+msa < %s | FileCheck -check-prefix=MIPS32 %s
|
|
|
|
@v16i8 = global <16 x i8> <i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0>
|
|
@v8i16 = global <8 x i16> <i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0>
|
|
@v4i32 = global <4 x i32> <i32 0, i32 0, i32 0, i32 0>
|
|
@v2i64 = global <2 x i64> <i64 0, i64 0>
|
|
@i64 = global i64 0
|
|
|
|
define void @const_v16i8() nounwind {
|
|
; MIPS32: const_v16i8:
|
|
|
|
store volatile <16 x i8> <i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0>, <16 x i8>*@v16i8
|
|
; MIPS32: ldi.b [[R1:\$w[0-9]+]], 0
|
|
|
|
store volatile <16 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>, <16 x i8>*@v16i8
|
|
; MIPS32: ldi.b [[R1:\$w[0-9]+]], 1
|
|
|
|
store volatile <16 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 31>, <16 x i8>*@v16i8
|
|
; MIPS32: ld.b [[R1:\$w[0-9]+]], %lo(
|
|
|
|
store volatile <16 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 9, i8 0, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6>, <16 x i8>*@v16i8
|
|
; MIPS32: ld.b [[R1:\$w[0-9]+]], %lo(
|
|
|
|
store volatile <16 x i8> <i8 1, i8 2, i8 1, i8 2, i8 1, i8 2, i8 1, i8 2, i8 1, i8 2, i8 1, i8 2, i8 1, i8 2, i8 1, i8 2>, <16 x i8>*@v16i8
|
|
; MIPS32: ldi.h [[R1:\$w[0-9]+]], 258
|
|
|
|
store volatile <16 x i8> <i8 1, i8 2, i8 3, i8 4, i8 1, i8 2, i8 3, i8 4, i8 1, i8 2, i8 3, i8 4, i8 1, i8 2, i8 3, i8 4>, <16 x i8>*@v16i8
|
|
; MIPS32-DAG: lui [[R2:\$[0-9]+]], 258
|
|
; MIPS32-DAG: ori [[R2]], [[R2]], 772
|
|
; MIPS32-DAG: fill.w [[R1:\$w[0-9]+]], [[R2]]
|
|
|
|
store volatile <16 x i8> <i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8>, <16 x i8>*@v16i8
|
|
; MIPS32: ld.b [[R1:\$w[0-9]+]], %lo(
|
|
|
|
ret void
|
|
; MIPS32: .size const_v16i8
|
|
}
|
|
|
|
define void @const_v8i16() nounwind {
|
|
; MIPS32: const_v8i16:
|
|
|
|
store volatile <8 x i16> <i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0>, <8 x i16>*@v8i16
|
|
; MIPS32: ldi.b [[R1:\$w[0-9]+]], 0
|
|
|
|
store volatile <8 x i16> <i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1, i16 1>, <8 x i16>*@v8i16
|
|
; MIPS32: ldi.h [[R1:\$w[0-9]+]], 1
|
|
|
|
store volatile <8 x i16> <i16 1, i16 1, i16 1, i16 2, i16 1, i16 1, i16 1, i16 31>, <8 x i16>*@v8i16
|
|
; MIPS32: ld.h [[R1:\$w[0-9]+]], %lo(
|
|
|
|
store volatile <8 x i16> <i16 1028, i16 1028, i16 1028, i16 1028, i16 1028, i16 1028, i16 1028, i16 1028>, <8 x i16>*@v8i16
|
|
; MIPS32: ldi.b [[R1:\$w[0-9]+]], 4
|
|
|
|
store volatile <8 x i16> <i16 1, i16 2, i16 1, i16 2, i16 1, i16 2, i16 1, i16 2>, <8 x i16>*@v8i16
|
|
; MIPS32-DAG: lui [[R2:\$[0-9]+]], 1
|
|
; MIPS32-DAG: ori [[R2]], [[R2]], 2
|
|
; MIPS32-DAG: fill.w [[R1:\$w[0-9]+]], [[R2]]
|
|
|
|
store volatile <8 x i16> <i16 1, i16 2, i16 3, i16 4, i16 1, i16 2, i16 3, i16 4>, <8 x i16>*@v8i16
|
|
; MIPS32: ld.h [[R1:\$w[0-9]+]], %lo(
|
|
|
|
ret void
|
|
; MIPS32: .size const_v8i16
|
|
}
|
|
|
|
define void @const_v4i32() nounwind {
|
|
; MIPS32: const_v4i32:
|
|
|
|
store volatile <4 x i32> <i32 0, i32 0, i32 0, i32 0>, <4 x i32>*@v4i32
|
|
; MIPS32: ldi.b [[R1:\$w[0-9]+]], 0
|
|
|
|
store volatile <4 x i32> <i32 1, i32 1, i32 1, i32 1>, <4 x i32>*@v4i32
|
|
; MIPS32: ldi.w [[R1:\$w[0-9]+]], 1
|
|
|
|
store volatile <4 x i32> <i32 1, i32 1, i32 1, i32 31>, <4 x i32>*@v4i32
|
|
; MIPS32: ld.w [[R1:\$w[0-9]+]], %lo(
|
|
|
|
store volatile <4 x i32> <i32 16843009, i32 16843009, i32 16843009, i32 16843009>, <4 x i32>*@v4i32
|
|
; MIPS32: ldi.b [[R1:\$w[0-9]+]], 1
|
|
|
|
store volatile <4 x i32> <i32 65537, i32 65537, i32 65537, i32 65537>, <4 x i32>*@v4i32
|
|
; MIPS32: ldi.h [[R1:\$w[0-9]+]], 1
|
|
|
|
store volatile <4 x i32> <i32 1, i32 2, i32 1, i32 2>, <4 x i32>*@v4i32
|
|
; MIPS32: ld.w [[R1:\$w[0-9]+]], %lo(
|
|
|
|
store volatile <4 x i32> <i32 3, i32 4, i32 5, i32 6>, <4 x i32>*@v4i32
|
|
; MIPS32: ld.w [[R1:\$w[0-9]+]], %lo(
|
|
|
|
ret void
|
|
; MIPS32: .size const_v4i32
|
|
}
|
|
|
|
define void @const_v2i64() nounwind {
|
|
; MIPS32: const_v2i64:
|
|
|
|
store volatile <2 x i64> <i64 0, i64 0>, <2 x i64>*@v2i64
|
|
; MIPS32: ldi.b [[R1:\$w[0-9]+]], 0
|
|
|
|
store volatile <2 x i64> <i64 72340172838076673, i64 72340172838076673>, <2 x i64>*@v2i64
|
|
; MIPS32: ldi.b [[R1:\$w[0-9]+]], 1
|
|
|
|
store volatile <2 x i64> <i64 281479271743489, i64 281479271743489>, <2 x i64>*@v2i64
|
|
; MIPS32: ldi.h [[R1:\$w[0-9]+]], 1
|
|
|
|
store volatile <2 x i64> <i64 4294967297, i64 4294967297>, <2 x i64>*@v2i64
|
|
; MIPS32: ldi.w [[R1:\$w[0-9]+]], 1
|
|
|
|
store volatile <2 x i64> <i64 1, i64 1>, <2 x i64>*@v2i64
|
|
; MIPS32: ldi.d [[R1:\$w[0-9]+]], 1
|
|
|
|
store volatile <2 x i64> <i64 1, i64 31>, <2 x i64>*@v2i64
|
|
; MIPS32: ld.w [[R1:\$w[0-9]+]], %lo(
|
|
|
|
store volatile <2 x i64> <i64 3, i64 4>, <2 x i64>*@v2i64
|
|
; MIPS32: ld.w [[R1:\$w[0-9]+]], %lo(
|
|
|
|
ret void
|
|
; MIPS32: .size const_v2i64
|
|
}
|
|
|
|
define i32 @extract_sext_v16i8() nounwind {
|
|
; MIPS32: extract_sext_v16i8:
|
|
|
|
%1 = load <16 x i8>* @v16i8
|
|
; MIPS32-DAG: ld.b [[R1:\$w[0-9]+]],
|
|
|
|
%2 = add <16 x i8> %1, %1
|
|
; MIPS32-DAG: addv.b [[R2:\$w[0-9]+]], [[R1]], [[R1]]
|
|
|
|
%3 = extractelement <16 x i8> %2, i32 1
|
|
%4 = sext i8 %3 to i32
|
|
; MIPS32-DAG: copy_s.b [[R3:\$[0-9]+]], [[R1]][1]
|
|
; MIPS32-NOT: sll
|
|
; MIPS32-NOT: sra
|
|
|
|
ret i32 %4
|
|
; MIPS32: .size extract_sext_v16i8
|
|
}
|
|
|
|
define i32 @extract_sext_v8i16() nounwind {
|
|
; MIPS32: extract_sext_v8i16:
|
|
|
|
%1 = load <8 x i16>* @v8i16
|
|
; MIPS32-DAG: ld.h [[R1:\$w[0-9]+]],
|
|
|
|
%2 = add <8 x i16> %1, %1
|
|
; MIPS32-DAG: addv.h [[R2:\$w[0-9]+]], [[R1]], [[R1]]
|
|
|
|
%3 = extractelement <8 x i16> %2, i32 1
|
|
%4 = sext i16 %3 to i32
|
|
; MIPS32-DAG: copy_s.h [[R3:\$[0-9]+]], [[R1]][1]
|
|
; MIPS32-NOT: sll
|
|
; MIPS32-NOT: sra
|
|
|
|
ret i32 %4
|
|
; MIPS32: .size extract_sext_v8i16
|
|
}
|
|
|
|
define i32 @extract_sext_v4i32() nounwind {
|
|
; MIPS32: extract_sext_v4i32:
|
|
|
|
%1 = load <4 x i32>* @v4i32
|
|
; MIPS32-DAG: ld.w [[R1:\$w[0-9]+]],
|
|
|
|
%2 = add <4 x i32> %1, %1
|
|
; MIPS32-DAG: addv.w [[R2:\$w[0-9]+]], [[R1]], [[R1]]
|
|
|
|
%3 = extractelement <4 x i32> %2, i32 1
|
|
; MIPS32-DAG: copy_s.w [[R3:\$[0-9]+]], [[R1]][1]
|
|
|
|
ret i32 %3
|
|
; MIPS32: .size extract_sext_v4i32
|
|
}
|
|
|
|
define i64 @extract_sext_v2i64() nounwind {
|
|
; MIPS32: extract_sext_v2i64:
|
|
|
|
%1 = load <2 x i64>* @v2i64
|
|
; MIPS32-DAG: ld.d [[R1:\$w[0-9]+]],
|
|
|
|
%2 = add <2 x i64> %1, %1
|
|
; MIPS32-DAG: addv.d [[R2:\$w[0-9]+]], [[R1]], [[R1]]
|
|
|
|
%3 = extractelement <2 x i64> %2, i32 1
|
|
; MIPS32-DAG: copy_s.w [[R3:\$[0-9]+]], [[R1]][2]
|
|
; MIPS32-DAG: copy_s.w [[R4:\$[0-9]+]], [[R1]][3]
|
|
; MIPS32-NOT: sll
|
|
; MIPS32-NOT: sra
|
|
|
|
ret i64 %3
|
|
; MIPS32: .size extract_sext_v2i64
|
|
}
|
|
|
|
define i32 @extract_zext_v16i8() nounwind {
|
|
; MIPS32: extract_zext_v16i8:
|
|
|
|
%1 = load <16 x i8>* @v16i8
|
|
; MIPS32-DAG: ld.b [[R1:\$w[0-9]+]],
|
|
|
|
%2 = add <16 x i8> %1, %1
|
|
; MIPS32-DAG: addv.b [[R2:\$w[0-9]+]], [[R1]], [[R1]]
|
|
|
|
%3 = extractelement <16 x i8> %2, i32 1
|
|
%4 = zext i8 %3 to i32
|
|
; MIPS32-DAG: copy_u.b [[R3:\$[0-9]+]], [[R1]][1]
|
|
; MIPS32-NOT: andi
|
|
|
|
ret i32 %4
|
|
; MIPS32: .size extract_zext_v16i8
|
|
}
|
|
|
|
define i32 @extract_zext_v8i16() nounwind {
|
|
; MIPS32: extract_zext_v8i16:
|
|
|
|
%1 = load <8 x i16>* @v8i16
|
|
; MIPS32-DAG: ld.h [[R1:\$w[0-9]+]],
|
|
|
|
%2 = add <8 x i16> %1, %1
|
|
; MIPS32-DAG: addv.h [[R2:\$w[0-9]+]], [[R1]], [[R1]]
|
|
|
|
%3 = extractelement <8 x i16> %2, i32 1
|
|
%4 = zext i16 %3 to i32
|
|
; MIPS32-DAG: copy_u.h [[R3:\$[0-9]+]], [[R1]][1]
|
|
; MIPS32-NOT: andi
|
|
|
|
ret i32 %4
|
|
; MIPS32: .size extract_zext_v8i16
|
|
}
|
|
|
|
define i32 @extract_zext_v4i32() nounwind {
|
|
; MIPS32: extract_zext_v4i32:
|
|
|
|
%1 = load <4 x i32>* @v4i32
|
|
; MIPS32-DAG: ld.w [[R1:\$w[0-9]+]],
|
|
|
|
%2 = add <4 x i32> %1, %1
|
|
; MIPS32-DAG: addv.w [[R2:\$w[0-9]+]], [[R1]], [[R1]]
|
|
|
|
%3 = extractelement <4 x i32> %2, i32 1
|
|
; MIPS32-DAG: copy_{{[su]}}.w [[R3:\$[0-9]+]], [[R1]][1]
|
|
|
|
ret i32 %3
|
|
; MIPS32: .size extract_zext_v4i32
|
|
}
|
|
|
|
define i64 @extract_zext_v2i64() nounwind {
|
|
; MIPS32: extract_zext_v2i64:
|
|
|
|
%1 = load <2 x i64>* @v2i64
|
|
; MIPS32-DAG: ld.d [[R1:\$w[0-9]+]],
|
|
|
|
%2 = add <2 x i64> %1, %1
|
|
; MIPS32-DAG: addv.d [[R2:\$w[0-9]+]], [[R1]], [[R1]]
|
|
|
|
%3 = extractelement <2 x i64> %2, i32 1
|
|
; MIPS32-DAG: copy_{{[su]}}.w [[R3:\$[0-9]+]], [[R1]][2]
|
|
; MIPS32-DAG: copy_{{[su]}}.w [[R4:\$[0-9]+]], [[R1]][3]
|
|
; MIPS32-NOT: andi
|
|
|
|
ret i64 %3
|
|
; MIPS32: .size extract_zext_v2i64
|
|
}
|
|
|
|
define void @insert_v16i8(i32 %a) nounwind {
|
|
; MIPS32: insert_v16i8:
|
|
|
|
%1 = load <16 x i8>* @v16i8
|
|
; MIPS32-DAG: ld.b [[R1:\$w[0-9]+]],
|
|
|
|
%a2 = trunc i32 %a to i8
|
|
%a3 = sext i8 %a2 to i32
|
|
%a4 = trunc i32 %a3 to i8
|
|
; MIPS32-NOT: andi
|
|
; MIPS32-NOT: sra
|
|
|
|
%2 = insertelement <16 x i8> %1, i8 %a4, i32 1
|
|
; MIPS32-DAG: insert.b [[R1]][1], $4
|
|
|
|
store <16 x i8> %2, <16 x i8>* @v16i8
|
|
; MIPS32-DAG: st.b [[R1]]
|
|
|
|
ret void
|
|
; MIPS32: .size insert_v16i8
|
|
}
|
|
|
|
define void @insert_v8i16(i32 %a) nounwind {
|
|
; MIPS32: insert_v8i16:
|
|
|
|
%1 = load <8 x i16>* @v8i16
|
|
; MIPS32-DAG: ld.h [[R1:\$w[0-9]+]],
|
|
|
|
%a2 = trunc i32 %a to i16
|
|
%a3 = sext i16 %a2 to i32
|
|
%a4 = trunc i32 %a3 to i16
|
|
; MIPS32-NOT: andi
|
|
; MIPS32-NOT: sra
|
|
|
|
%2 = insertelement <8 x i16> %1, i16 %a4, i32 1
|
|
; MIPS32-DAG: insert.h [[R1]][1], $4
|
|
|
|
store <8 x i16> %2, <8 x i16>* @v8i16
|
|
; MIPS32-DAG: st.h [[R1]]
|
|
|
|
ret void
|
|
; MIPS32: .size insert_v8i16
|
|
}
|
|
|
|
define void @insert_v4i32(i32 %a) nounwind {
|
|
; MIPS32: insert_v4i32:
|
|
|
|
%1 = load <4 x i32>* @v4i32
|
|
; MIPS32-DAG: ld.w [[R1:\$w[0-9]+]],
|
|
|
|
; MIPS32-NOT: andi
|
|
; MIPS32-NOT: sra
|
|
|
|
%2 = insertelement <4 x i32> %1, i32 %a, i32 1
|
|
; MIPS32-DAG: insert.w [[R1]][1], $4
|
|
|
|
store <4 x i32> %2, <4 x i32>* @v4i32
|
|
; MIPS32-DAG: st.w [[R1]]
|
|
|
|
ret void
|
|
; MIPS32: .size insert_v4i32
|
|
}
|
|
|
|
define void @insert_v2i64(i64 %a) nounwind {
|
|
; MIPS32: insert_v2i64:
|
|
|
|
%1 = load <2 x i64>* @v2i64
|
|
; MIPS32-DAG: ld.w [[R1:\$w[0-9]+]],
|
|
|
|
; MIPS32-NOT: andi
|
|
; MIPS32-NOT: sra
|
|
|
|
%2 = insertelement <2 x i64> %1, i64 %a, i32 1
|
|
; MIPS32-DAG: insert.w [[R1]][2], $4
|
|
; MIPS32-DAG: insert.w [[R1]][3], $5
|
|
|
|
store <2 x i64> %2, <2 x i64>* @v2i64
|
|
; MIPS32-DAG: st.w [[R1]]
|
|
|
|
ret void
|
|
; MIPS32: .size insert_v2i64
|
|
}
|