mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2024-12-26 21:32:10 +00:00
ea28aafa83
Summary: When getConstant() is called for an expanded vector type, it is split into multiple scalar constants which are then combined using appropriate build_vector and bitcast operations. In addition to the usual big/little endian differences, the case where the element-order of the vector does not have the same endianness as the elements themselves is also accounted for. For example, for v4i32 on big-endian MIPS, the byte-order of the vector is <3210,7654,BA98,FEDC>. For little-endian, it is <0123,4567,89AB,CDEF>. Handling this case turns out to be a nop since getConstant() returns a splatted vector (so reversing the element order doesn't change the value) This fixes a number of cases in MIPS MSA where calling getConstant() during operation legalization introduces illegal types (e.g. to legalize v2i64 UNDEF into a v2i64 BUILD_VECTOR of illegal i64 zeros). It should also handle bigger differences between illegal and legal types such as legalizing v2i64 into v8i16. lowerMSASplatImm() in the MIPS backend no longer needs to avoid calling getConstant() so this function has been updated in the same patch. For the sake of transparency, the steps I've taken since the review are: * Added 'virtual' to isVectorEltOrderLittleEndian() as requested. This revealed that the MIPS tests were falsely passing because a polymorphic function was not actually polymorphic in the reviewed patch. * Fixed the tests that were now failing. This involved deleting the code to handle the MIPS MSA element-order (which was previously doing an byte-order swap instead of an element-order swap). This left isVectorEltOrderLittleEndian() unused and it was deleted. * Fixed build failures caused by rebasing beyond r194467-r194472. These build failures involved the bset, bneg, and bclr instructions added in these commits using lowerMSASplatImm() in a way that was no longer valid after this patch. Some of these were fixed by calling SelectionDAG::getConstant() instead, others were fixed by a new function getBuildVectorSplat() that provided the removed functionality of lowerMSASplatImm() in a more sensible way. Reviewers: bkramer Reviewed By: bkramer CC: llvm-commits Differential Revision: http://llvm-reviews.chandlerc.com/D1973 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@194811 91177308-0d34-0410-b5e6-96231b3b80d8
495 lines
20 KiB
LLVM
495 lines
20 KiB
LLVM
; Test the MSA intrinsics that are encoded with the 3R instruction format.
|
|
; There are lots of these so this covers those beginning with 'b'
|
|
|
|
; RUN: llc -march=mips -mattr=+msa,+fp64 < %s | FileCheck %s
|
|
; RUN: llc -march=mipsel -mattr=+msa,+fp64 < %s | FileCheck %s
|
|
|
|
@llvm_mips_bclr_b_ARG1 = global <16 x i8> <i8 0, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 9, i8 10, i8 11, i8 12, i8 13, i8 14, i8 15>, align 16
|
|
@llvm_mips_bclr_b_ARG2 = global <16 x i8> <i8 16, i8 17, i8 18, i8 19, i8 20, i8 21, i8 22, i8 23, i8 24, i8 25, i8 26, i8 27, i8 28, i8 29, i8 30, i8 31>, align 16
|
|
@llvm_mips_bclr_b_RES = global <16 x i8> <i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0>, align 16
|
|
|
|
define void @llvm_mips_bclr_b_test() nounwind {
|
|
entry:
|
|
%0 = load <16 x i8>* @llvm_mips_bclr_b_ARG1
|
|
%1 = load <16 x i8>* @llvm_mips_bclr_b_ARG2
|
|
%2 = tail call <16 x i8> @llvm.mips.bclr.b(<16 x i8> %0, <16 x i8> %1)
|
|
store <16 x i8> %2, <16 x i8>* @llvm_mips_bclr_b_RES
|
|
ret void
|
|
}
|
|
|
|
declare <16 x i8> @llvm.mips.bclr.b(<16 x i8>, <16 x i8>) nounwind
|
|
|
|
; CHECK: llvm_mips_bclr_b_test:
|
|
; CHECK: ld.b
|
|
; CHECK: ld.b
|
|
; CHECK: bclr.b
|
|
; CHECK: st.b
|
|
; CHECK: .size llvm_mips_bclr_b_test
|
|
;
|
|
@llvm_mips_bclr_h_ARG1 = global <8 x i16> <i16 0, i16 1, i16 2, i16 3, i16 4, i16 5, i16 6, i16 7>, align 16
|
|
@llvm_mips_bclr_h_ARG2 = global <8 x i16> <i16 8, i16 9, i16 10, i16 11, i16 12, i16 13, i16 14, i16 15>, align 16
|
|
@llvm_mips_bclr_h_RES = global <8 x i16> <i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0>, align 16
|
|
|
|
define void @llvm_mips_bclr_h_test() nounwind {
|
|
entry:
|
|
%0 = load <8 x i16>* @llvm_mips_bclr_h_ARG1
|
|
%1 = load <8 x i16>* @llvm_mips_bclr_h_ARG2
|
|
%2 = tail call <8 x i16> @llvm.mips.bclr.h(<8 x i16> %0, <8 x i16> %1)
|
|
store <8 x i16> %2, <8 x i16>* @llvm_mips_bclr_h_RES
|
|
ret void
|
|
}
|
|
|
|
declare <8 x i16> @llvm.mips.bclr.h(<8 x i16>, <8 x i16>) nounwind
|
|
|
|
; CHECK: llvm_mips_bclr_h_test:
|
|
; CHECK: ld.h
|
|
; CHECK: ld.h
|
|
; CHECK: bclr.h
|
|
; CHECK: st.h
|
|
; CHECK: .size llvm_mips_bclr_h_test
|
|
;
|
|
@llvm_mips_bclr_w_ARG1 = global <4 x i32> <i32 0, i32 1, i32 2, i32 3>, align 16
|
|
@llvm_mips_bclr_w_ARG2 = global <4 x i32> <i32 4, i32 5, i32 6, i32 7>, align 16
|
|
@llvm_mips_bclr_w_RES = global <4 x i32> <i32 0, i32 0, i32 0, i32 0>, align 16
|
|
|
|
define void @llvm_mips_bclr_w_test() nounwind {
|
|
entry:
|
|
%0 = load <4 x i32>* @llvm_mips_bclr_w_ARG1
|
|
%1 = load <4 x i32>* @llvm_mips_bclr_w_ARG2
|
|
%2 = tail call <4 x i32> @llvm.mips.bclr.w(<4 x i32> %0, <4 x i32> %1)
|
|
store <4 x i32> %2, <4 x i32>* @llvm_mips_bclr_w_RES
|
|
ret void
|
|
}
|
|
|
|
declare <4 x i32> @llvm.mips.bclr.w(<4 x i32>, <4 x i32>) nounwind
|
|
|
|
; CHECK: llvm_mips_bclr_w_test:
|
|
; CHECK: ld.w
|
|
; CHECK: ld.w
|
|
; CHECK: bclr.w
|
|
; CHECK: st.w
|
|
; CHECK: .size llvm_mips_bclr_w_test
|
|
;
|
|
@llvm_mips_bclr_d_ARG1 = global <2 x i64> <i64 0, i64 1>, align 16
|
|
@llvm_mips_bclr_d_ARG2 = global <2 x i64> <i64 2, i64 3>, align 16
|
|
@llvm_mips_bclr_d_RES = global <2 x i64> <i64 0, i64 0>, align 16
|
|
|
|
define void @llvm_mips_bclr_d_test() nounwind {
|
|
entry:
|
|
%0 = load <2 x i64>* @llvm_mips_bclr_d_ARG1
|
|
%1 = load <2 x i64>* @llvm_mips_bclr_d_ARG2
|
|
%2 = tail call <2 x i64> @llvm.mips.bclr.d(<2 x i64> %0, <2 x i64> %1)
|
|
store <2 x i64> %2, <2 x i64>* @llvm_mips_bclr_d_RES
|
|
ret void
|
|
}
|
|
|
|
declare <2 x i64> @llvm.mips.bclr.d(<2 x i64>, <2 x i64>) nounwind
|
|
|
|
; CHECK: llvm_mips_bclr_d_test:
|
|
; CHECK: ld.d
|
|
; CHECK: ld.d
|
|
; CHECK: bclr.d
|
|
; CHECK: st.d
|
|
; CHECK: .size llvm_mips_bclr_d_test
|
|
|
|
@llvm_mips_binsl_b_ARG1 = global <16 x i8> <i8 0, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 9, i8 10, i8 11, i8 12, i8 13, i8 14, i8 15>, align 16
|
|
@llvm_mips_binsl_b_ARG2 = global <16 x i8> <i8 0, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 9, i8 10, i8 11, i8 12, i8 13, i8 14, i8 15>, align 16
|
|
@llvm_mips_binsl_b_ARG3 = global <16 x i8> <i8 16, i8 17, i8 18, i8 19, i8 20, i8 21, i8 22, i8 23, i8 24, i8 25, i8 26, i8 27, i8 28, i8 29, i8 30, i8 31>, align 16
|
|
@llvm_mips_binsl_b_RES = global <16 x i8> <i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0>, align 16
|
|
|
|
define void @llvm_mips_binsl_b_test() nounwind {
|
|
entry:
|
|
%0 = load <16 x i8>* @llvm_mips_binsl_b_ARG1
|
|
%1 = load <16 x i8>* @llvm_mips_binsl_b_ARG2
|
|
%2 = load <16 x i8>* @llvm_mips_binsl_b_ARG3
|
|
%3 = tail call <16 x i8> @llvm.mips.binsl.b(<16 x i8> %0, <16 x i8> %1, <16 x i8> %2)
|
|
store <16 x i8> %3, <16 x i8>* @llvm_mips_binsl_b_RES
|
|
ret void
|
|
}
|
|
|
|
declare <16 x i8> @llvm.mips.binsl.b(<16 x i8>, <16 x i8>, <16 x i8>) nounwind
|
|
|
|
; CHECK: llvm_mips_binsl_b_test:
|
|
; CHECK-DAG: lw [[R1:\$[0-9]+]], %got(llvm_mips_binsl_b_ARG1)(
|
|
; CHECK-DAG: lw [[R2:\$[0-9]+]], %got(llvm_mips_binsl_b_ARG2)(
|
|
; CHECK-DAG: lw [[R3:\$[0-9]+]], %got(llvm_mips_binsl_b_ARG3)(
|
|
; CHECK-DAG: ld.b [[R4:\$w[0-9]+]], 0([[R1]])
|
|
; CHECK-DAG: ld.b [[R5:\$w[0-9]+]], 0([[R2]])
|
|
; CHECK-DAG: ld.b [[R6:\$w[0-9]+]], 0([[R3]])
|
|
; CHECK-DAG: binsl.b [[R4]], [[R5]], [[R6]]
|
|
; CHECK-DAG: st.b [[R4]], 0(
|
|
; CHECK: .size llvm_mips_binsl_b_test
|
|
|
|
@llvm_mips_binsl_h_ARG1 = global <8 x i16> <i16 0, i16 1, i16 2, i16 3, i16 4, i16 5, i16 6, i16 7>, align 16
|
|
@llvm_mips_binsl_h_ARG2 = global <8 x i16> <i16 0, i16 1, i16 2, i16 3, i16 4, i16 5, i16 6, i16 7>, align 16
|
|
@llvm_mips_binsl_h_ARG3 = global <8 x i16> <i16 8, i16 9, i16 10, i16 11, i16 12, i16 13, i16 14, i16 15>, align 16
|
|
@llvm_mips_binsl_h_RES = global <8 x i16> <i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0>, align 16
|
|
|
|
define void @llvm_mips_binsl_h_test() nounwind {
|
|
entry:
|
|
%0 = load <8 x i16>* @llvm_mips_binsl_h_ARG1
|
|
%1 = load <8 x i16>* @llvm_mips_binsl_h_ARG2
|
|
%2 = load <8 x i16>* @llvm_mips_binsl_h_ARG3
|
|
%3 = tail call <8 x i16> @llvm.mips.binsl.h(<8 x i16> %0, <8 x i16> %1, <8 x i16> %2)
|
|
store <8 x i16> %3, <8 x i16>* @llvm_mips_binsl_h_RES
|
|
ret void
|
|
}
|
|
|
|
declare <8 x i16> @llvm.mips.binsl.h(<8 x i16>, <8 x i16>, <8 x i16>) nounwind
|
|
|
|
; CHECK: llvm_mips_binsl_h_test:
|
|
; CHECK-DAG: lw [[R1:\$[0-9]+]], %got(llvm_mips_binsl_h_ARG1)(
|
|
; CHECK-DAG: lw [[R2:\$[0-9]+]], %got(llvm_mips_binsl_h_ARG2)(
|
|
; CHECK-DAG: lw [[R3:\$[0-9]+]], %got(llvm_mips_binsl_h_ARG3)(
|
|
; CHECK-DAG: ld.h [[R4:\$w[0-9]+]], 0([[R1]])
|
|
; CHECK-DAG: ld.h [[R5:\$w[0-9]+]], 0([[R2]])
|
|
; CHECK-DAG: ld.h [[R6:\$w[0-9]+]], 0([[R3]])
|
|
; CHECK-DAG: binsl.h [[R4]], [[R5]], [[R6]]
|
|
; CHECK-DAG: st.h [[R4]], 0(
|
|
; CHECK: .size llvm_mips_binsl_h_test
|
|
|
|
@llvm_mips_binsl_w_ARG1 = global <4 x i32> <i32 0, i32 1, i32 2, i32 3>, align 16
|
|
@llvm_mips_binsl_w_ARG2 = global <4 x i32> <i32 0, i32 1, i32 2, i32 3>, align 16
|
|
@llvm_mips_binsl_w_ARG3 = global <4 x i32> <i32 4, i32 5, i32 6, i32 7>, align 16
|
|
@llvm_mips_binsl_w_RES = global <4 x i32> <i32 0, i32 0, i32 0, i32 0>, align 16
|
|
|
|
define void @llvm_mips_binsl_w_test() nounwind {
|
|
entry:
|
|
%0 = load <4 x i32>* @llvm_mips_binsl_w_ARG1
|
|
%1 = load <4 x i32>* @llvm_mips_binsl_w_ARG2
|
|
%2 = load <4 x i32>* @llvm_mips_binsl_w_ARG3
|
|
%3 = tail call <4 x i32> @llvm.mips.binsl.w(<4 x i32> %0, <4 x i32> %1, <4 x i32> %2)
|
|
store <4 x i32> %3, <4 x i32>* @llvm_mips_binsl_w_RES
|
|
ret void
|
|
}
|
|
|
|
declare <4 x i32> @llvm.mips.binsl.w(<4 x i32>, <4 x i32>, <4 x i32>) nounwind
|
|
|
|
; CHECK: llvm_mips_binsl_w_test:
|
|
; CHECK-DAG: lw [[R1:\$[0-9]+]], %got(llvm_mips_binsl_w_ARG1)(
|
|
; CHECK-DAG: lw [[R2:\$[0-9]+]], %got(llvm_mips_binsl_w_ARG2)(
|
|
; CHECK-DAG: lw [[R3:\$[0-9]+]], %got(llvm_mips_binsl_w_ARG3)(
|
|
; CHECK-DAG: ld.w [[R4:\$w[0-9]+]], 0([[R1]])
|
|
; CHECK-DAG: ld.w [[R5:\$w[0-9]+]], 0([[R2]])
|
|
; CHECK-DAG: ld.w [[R6:\$w[0-9]+]], 0([[R3]])
|
|
; CHECK-DAG: binsl.w [[R4]], [[R5]], [[R6]]
|
|
; CHECK-DAG: st.w [[R4]], 0(
|
|
; CHECK: .size llvm_mips_binsl_w_test
|
|
|
|
@llvm_mips_binsl_d_ARG1 = global <2 x i64> <i64 0, i64 1>, align 16
|
|
@llvm_mips_binsl_d_ARG2 = global <2 x i64> <i64 0, i64 1>, align 16
|
|
@llvm_mips_binsl_d_ARG3 = global <2 x i64> <i64 2, i64 3>, align 16
|
|
@llvm_mips_binsl_d_RES = global <2 x i64> <i64 0, i64 0>, align 16
|
|
|
|
define void @llvm_mips_binsl_d_test() nounwind {
|
|
entry:
|
|
%0 = load <2 x i64>* @llvm_mips_binsl_d_ARG1
|
|
%1 = load <2 x i64>* @llvm_mips_binsl_d_ARG2
|
|
%2 = load <2 x i64>* @llvm_mips_binsl_d_ARG3
|
|
%3 = tail call <2 x i64> @llvm.mips.binsl.d(<2 x i64> %0, <2 x i64> %1, <2 x i64> %2)
|
|
store <2 x i64> %3, <2 x i64>* @llvm_mips_binsl_d_RES
|
|
ret void
|
|
}
|
|
|
|
declare <2 x i64> @llvm.mips.binsl.d(<2 x i64>, <2 x i64>, <2 x i64>) nounwind
|
|
|
|
; CHECK: llvm_mips_binsl_d_test:
|
|
; CHECK-DAG: lw [[R1:\$[0-9]+]], %got(llvm_mips_binsl_d_ARG1)(
|
|
; CHECK-DAG: lw [[R2:\$[0-9]+]], %got(llvm_mips_binsl_d_ARG2)(
|
|
; CHECK-DAG: lw [[R3:\$[0-9]+]], %got(llvm_mips_binsl_d_ARG3)(
|
|
; CHECK-DAG: ld.d [[R4:\$w[0-9]+]], 0([[R1]])
|
|
; CHECK-DAG: ld.d [[R5:\$w[0-9]+]], 0([[R2]])
|
|
; CHECK-DAG: ld.d [[R6:\$w[0-9]+]], 0([[R3]])
|
|
; CHECK-DAG: binsl.d [[R4]], [[R5]], [[R6]]
|
|
; CHECK-DAG: st.d [[R4]], 0(
|
|
; CHECK: .size llvm_mips_binsl_d_test
|
|
|
|
@llvm_mips_binsr_b_ARG1 = global <16 x i8> <i8 0, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 9, i8 10, i8 11, i8 12, i8 13, i8 14, i8 15>, align 16
|
|
@llvm_mips_binsr_b_ARG2 = global <16 x i8> <i8 0, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 9, i8 10, i8 11, i8 12, i8 13, i8 14, i8 15>, align 16
|
|
@llvm_mips_binsr_b_ARG3 = global <16 x i8> <i8 16, i8 17, i8 18, i8 19, i8 20, i8 21, i8 22, i8 23, i8 24, i8 25, i8 26, i8 27, i8 28, i8 29, i8 30, i8 31>, align 16
|
|
@llvm_mips_binsr_b_RES = global <16 x i8> <i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0>, align 16
|
|
|
|
define void @llvm_mips_binsr_b_test() nounwind {
|
|
entry:
|
|
%0 = load <16 x i8>* @llvm_mips_binsr_b_ARG1
|
|
%1 = load <16 x i8>* @llvm_mips_binsr_b_ARG2
|
|
%2 = load <16 x i8>* @llvm_mips_binsr_b_ARG3
|
|
%3 = tail call <16 x i8> @llvm.mips.binsr.b(<16 x i8> %0, <16 x i8> %1, <16 x i8> %2)
|
|
store <16 x i8> %3, <16 x i8>* @llvm_mips_binsr_b_RES
|
|
ret void
|
|
}
|
|
|
|
declare <16 x i8> @llvm.mips.binsr.b(<16 x i8>, <16 x i8>, <16 x i8>) nounwind
|
|
|
|
; CHECK: llvm_mips_binsr_b_test:
|
|
; CHECK-DAG: lw [[R1:\$[0-9]+]], %got(llvm_mips_binsr_b_ARG1)(
|
|
; CHECK-DAG: lw [[R2:\$[0-9]+]], %got(llvm_mips_binsr_b_ARG2)(
|
|
; CHECK-DAG: lw [[R3:\$[0-9]+]], %got(llvm_mips_binsr_b_ARG3)(
|
|
; CHECK-DAG: ld.b [[R4:\$w[0-9]+]], 0([[R1]])
|
|
; CHECK-DAG: ld.b [[R5:\$w[0-9]+]], 0([[R2]])
|
|
; CHECK-DAG: ld.b [[R6:\$w[0-9]+]], 0([[R3]])
|
|
; CHECK-DAG: binsr.b [[R4]], [[R5]], [[R6]]
|
|
; CHECK-DAG: st.b [[R4]], 0(
|
|
; CHECK: .size llvm_mips_binsr_b_test
|
|
|
|
@llvm_mips_binsr_h_ARG1 = global <8 x i16> <i16 0, i16 1, i16 2, i16 3, i16 4, i16 5, i16 6, i16 7>, align 16
|
|
@llvm_mips_binsr_h_ARG2 = global <8 x i16> <i16 0, i16 1, i16 2, i16 3, i16 4, i16 5, i16 6, i16 7>, align 16
|
|
@llvm_mips_binsr_h_ARG3 = global <8 x i16> <i16 8, i16 9, i16 10, i16 11, i16 12, i16 13, i16 14, i16 15>, align 16
|
|
@llvm_mips_binsr_h_RES = global <8 x i16> <i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0>, align 16
|
|
|
|
define void @llvm_mips_binsr_h_test() nounwind {
|
|
entry:
|
|
%0 = load <8 x i16>* @llvm_mips_binsr_h_ARG1
|
|
%1 = load <8 x i16>* @llvm_mips_binsr_h_ARG2
|
|
%2 = load <8 x i16>* @llvm_mips_binsr_h_ARG3
|
|
%3 = tail call <8 x i16> @llvm.mips.binsr.h(<8 x i16> %0, <8 x i16> %1, <8 x i16> %2)
|
|
store <8 x i16> %3, <8 x i16>* @llvm_mips_binsr_h_RES
|
|
ret void
|
|
}
|
|
|
|
declare <8 x i16> @llvm.mips.binsr.h(<8 x i16>, <8 x i16>, <8 x i16>) nounwind
|
|
|
|
; CHECK: llvm_mips_binsr_h_test:
|
|
; CHECK-DAG: lw [[R1:\$[0-9]+]], %got(llvm_mips_binsr_h_ARG1)(
|
|
; CHECK-DAG: lw [[R2:\$[0-9]+]], %got(llvm_mips_binsr_h_ARG2)(
|
|
; CHECK-DAG: lw [[R3:\$[0-9]+]], %got(llvm_mips_binsr_h_ARG3)(
|
|
; CHECK-DAG: ld.h [[R4:\$w[0-9]+]], 0([[R1]])
|
|
; CHECK-DAG: ld.h [[R5:\$w[0-9]+]], 0([[R2]])
|
|
; CHECK-DAG: ld.h [[R6:\$w[0-9]+]], 0([[R3]])
|
|
; CHECK-DAG: binsr.h [[R4]], [[R5]], [[R6]]
|
|
; CHECK-DAG: st.h [[R4]], 0(
|
|
; CHECK: .size llvm_mips_binsr_h_test
|
|
|
|
@llvm_mips_binsr_w_ARG1 = global <4 x i32> <i32 0, i32 1, i32 2, i32 3>, align 16
|
|
@llvm_mips_binsr_w_ARG2 = global <4 x i32> <i32 0, i32 1, i32 2, i32 3>, align 16
|
|
@llvm_mips_binsr_w_ARG3 = global <4 x i32> <i32 4, i32 5, i32 6, i32 7>, align 16
|
|
@llvm_mips_binsr_w_RES = global <4 x i32> <i32 0, i32 0, i32 0, i32 0>, align 16
|
|
|
|
define void @llvm_mips_binsr_w_test() nounwind {
|
|
entry:
|
|
%0 = load <4 x i32>* @llvm_mips_binsr_w_ARG1
|
|
%1 = load <4 x i32>* @llvm_mips_binsr_w_ARG2
|
|
%2 = load <4 x i32>* @llvm_mips_binsr_w_ARG3
|
|
%3 = tail call <4 x i32> @llvm.mips.binsr.w(<4 x i32> %0, <4 x i32> %1, <4 x i32> %2)
|
|
store <4 x i32> %3, <4 x i32>* @llvm_mips_binsr_w_RES
|
|
ret void
|
|
}
|
|
|
|
declare <4 x i32> @llvm.mips.binsr.w(<4 x i32>, <4 x i32>, <4 x i32>) nounwind
|
|
|
|
; CHECK: llvm_mips_binsr_w_test:
|
|
; CHECK-DAG: lw [[R1:\$[0-9]+]], %got(llvm_mips_binsr_w_ARG1)(
|
|
; CHECK-DAG: lw [[R2:\$[0-9]+]], %got(llvm_mips_binsr_w_ARG2)(
|
|
; CHECK-DAG: lw [[R3:\$[0-9]+]], %got(llvm_mips_binsr_w_ARG3)(
|
|
; CHECK-DAG: ld.w [[R4:\$w[0-9]+]], 0([[R1]])
|
|
; CHECK-DAG: ld.w [[R5:\$w[0-9]+]], 0([[R2]])
|
|
; CHECK-DAG: ld.w [[R6:\$w[0-9]+]], 0([[R3]])
|
|
; CHECK-DAG: binsr.w [[R4]], [[R5]], [[R6]]
|
|
; CHECK-DAG: st.w [[R4]], 0(
|
|
; CHECK: .size llvm_mips_binsr_w_test
|
|
|
|
@llvm_mips_binsr_d_ARG1 = global <2 x i64> <i64 0, i64 1>, align 16
|
|
@llvm_mips_binsr_d_ARG2 = global <2 x i64> <i64 0, i64 1>, align 16
|
|
@llvm_mips_binsr_d_ARG3 = global <2 x i64> <i64 2, i64 3>, align 16
|
|
@llvm_mips_binsr_d_RES = global <2 x i64> <i64 0, i64 0>, align 16
|
|
|
|
define void @llvm_mips_binsr_d_test() nounwind {
|
|
entry:
|
|
%0 = load <2 x i64>* @llvm_mips_binsr_d_ARG1
|
|
%1 = load <2 x i64>* @llvm_mips_binsr_d_ARG2
|
|
%2 = load <2 x i64>* @llvm_mips_binsr_d_ARG3
|
|
%3 = tail call <2 x i64> @llvm.mips.binsr.d(<2 x i64> %0, <2 x i64> %1, <2 x i64> %2)
|
|
store <2 x i64> %3, <2 x i64>* @llvm_mips_binsr_d_RES
|
|
ret void
|
|
}
|
|
|
|
declare <2 x i64> @llvm.mips.binsr.d(<2 x i64>, <2 x i64>, <2 x i64>) nounwind
|
|
|
|
; CHECK: llvm_mips_binsr_d_test:
|
|
; CHECK-DAG: lw [[R1:\$[0-9]+]], %got(llvm_mips_binsr_d_ARG1)(
|
|
; CHECK-DAG: lw [[R2:\$[0-9]+]], %got(llvm_mips_binsr_d_ARG2)(
|
|
; CHECK-DAG: lw [[R3:\$[0-9]+]], %got(llvm_mips_binsr_d_ARG3)(
|
|
; CHECK-DAG: ld.d [[R4:\$w[0-9]+]], 0([[R1]])
|
|
; CHECK-DAG: ld.d [[R5:\$w[0-9]+]], 0([[R2]])
|
|
; CHECK-DAG: ld.d [[R6:\$w[0-9]+]], 0([[R3]])
|
|
; CHECK-DAG: binsr.d [[R4]], [[R5]], [[R6]]
|
|
; CHECK-DAG: st.d [[R4]], 0(
|
|
; CHECK: .size llvm_mips_binsr_d_test
|
|
|
|
@llvm_mips_bneg_b_ARG1 = global <16 x i8> <i8 0, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 9, i8 10, i8 11, i8 12, i8 13, i8 14, i8 15>, align 16
|
|
@llvm_mips_bneg_b_ARG2 = global <16 x i8> <i8 16, i8 17, i8 18, i8 19, i8 20, i8 21, i8 22, i8 23, i8 24, i8 25, i8 26, i8 27, i8 28, i8 29, i8 30, i8 31>, align 16
|
|
@llvm_mips_bneg_b_RES = global <16 x i8> <i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0>, align 16
|
|
|
|
define void @llvm_mips_bneg_b_test() nounwind {
|
|
entry:
|
|
%0 = load <16 x i8>* @llvm_mips_bneg_b_ARG1
|
|
%1 = load <16 x i8>* @llvm_mips_bneg_b_ARG2
|
|
%2 = tail call <16 x i8> @llvm.mips.bneg.b(<16 x i8> %0, <16 x i8> %1)
|
|
store <16 x i8> %2, <16 x i8>* @llvm_mips_bneg_b_RES
|
|
ret void
|
|
}
|
|
|
|
declare <16 x i8> @llvm.mips.bneg.b(<16 x i8>, <16 x i8>) nounwind
|
|
|
|
; CHECK: llvm_mips_bneg_b_test:
|
|
; CHECK: ld.b
|
|
; CHECK: ld.b
|
|
; CHECK: bneg.b
|
|
; CHECK: st.b
|
|
; CHECK: .size llvm_mips_bneg_b_test
|
|
;
|
|
@llvm_mips_bneg_h_ARG1 = global <8 x i16> <i16 0, i16 1, i16 2, i16 3, i16 4, i16 5, i16 6, i16 7>, align 16
|
|
@llvm_mips_bneg_h_ARG2 = global <8 x i16> <i16 8, i16 9, i16 10, i16 11, i16 12, i16 13, i16 14, i16 15>, align 16
|
|
@llvm_mips_bneg_h_RES = global <8 x i16> <i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0>, align 16
|
|
|
|
define void @llvm_mips_bneg_h_test() nounwind {
|
|
entry:
|
|
%0 = load <8 x i16>* @llvm_mips_bneg_h_ARG1
|
|
%1 = load <8 x i16>* @llvm_mips_bneg_h_ARG2
|
|
%2 = tail call <8 x i16> @llvm.mips.bneg.h(<8 x i16> %0, <8 x i16> %1)
|
|
store <8 x i16> %2, <8 x i16>* @llvm_mips_bneg_h_RES
|
|
ret void
|
|
}
|
|
|
|
declare <8 x i16> @llvm.mips.bneg.h(<8 x i16>, <8 x i16>) nounwind
|
|
|
|
; CHECK: llvm_mips_bneg_h_test:
|
|
; CHECK: ld.h
|
|
; CHECK: ld.h
|
|
; CHECK: bneg.h
|
|
; CHECK: st.h
|
|
; CHECK: .size llvm_mips_bneg_h_test
|
|
;
|
|
@llvm_mips_bneg_w_ARG1 = global <4 x i32> <i32 0, i32 1, i32 2, i32 3>, align 16
|
|
@llvm_mips_bneg_w_ARG2 = global <4 x i32> <i32 4, i32 5, i32 6, i32 7>, align 16
|
|
@llvm_mips_bneg_w_RES = global <4 x i32> <i32 0, i32 0, i32 0, i32 0>, align 16
|
|
|
|
define void @llvm_mips_bneg_w_test() nounwind {
|
|
entry:
|
|
%0 = load <4 x i32>* @llvm_mips_bneg_w_ARG1
|
|
%1 = load <4 x i32>* @llvm_mips_bneg_w_ARG2
|
|
%2 = tail call <4 x i32> @llvm.mips.bneg.w(<4 x i32> %0, <4 x i32> %1)
|
|
store <4 x i32> %2, <4 x i32>* @llvm_mips_bneg_w_RES
|
|
ret void
|
|
}
|
|
|
|
declare <4 x i32> @llvm.mips.bneg.w(<4 x i32>, <4 x i32>) nounwind
|
|
|
|
; CHECK: llvm_mips_bneg_w_test:
|
|
; CHECK: ld.w
|
|
; CHECK: ld.w
|
|
; CHECK: bneg.w
|
|
; CHECK: st.w
|
|
; CHECK: .size llvm_mips_bneg_w_test
|
|
;
|
|
@llvm_mips_bneg_d_ARG1 = global <2 x i64> <i64 0, i64 1>, align 16
|
|
@llvm_mips_bneg_d_ARG2 = global <2 x i64> <i64 2, i64 3>, align 16
|
|
@llvm_mips_bneg_d_RES = global <2 x i64> <i64 0, i64 0>, align 16
|
|
|
|
define void @llvm_mips_bneg_d_test() nounwind {
|
|
entry:
|
|
%0 = load <2 x i64>* @llvm_mips_bneg_d_ARG1
|
|
%1 = load <2 x i64>* @llvm_mips_bneg_d_ARG2
|
|
%2 = tail call <2 x i64> @llvm.mips.bneg.d(<2 x i64> %0, <2 x i64> %1)
|
|
store <2 x i64> %2, <2 x i64>* @llvm_mips_bneg_d_RES
|
|
ret void
|
|
}
|
|
|
|
declare <2 x i64> @llvm.mips.bneg.d(<2 x i64>, <2 x i64>) nounwind
|
|
|
|
; CHECK: llvm_mips_bneg_d_test:
|
|
; CHECK: ld.d
|
|
; CHECK: ld.d
|
|
; CHECK: bneg.d
|
|
; CHECK: st.d
|
|
; CHECK: .size llvm_mips_bneg_d_test
|
|
;
|
|
@llvm_mips_bset_b_ARG1 = global <16 x i8> <i8 0, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 9, i8 10, i8 11, i8 12, i8 13, i8 14, i8 15>, align 16
|
|
@llvm_mips_bset_b_ARG2 = global <16 x i8> <i8 16, i8 17, i8 18, i8 19, i8 20, i8 21, i8 22, i8 23, i8 24, i8 25, i8 26, i8 27, i8 28, i8 29, i8 30, i8 31>, align 16
|
|
@llvm_mips_bset_b_RES = global <16 x i8> <i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0>, align 16
|
|
|
|
define void @llvm_mips_bset_b_test() nounwind {
|
|
entry:
|
|
%0 = load <16 x i8>* @llvm_mips_bset_b_ARG1
|
|
%1 = load <16 x i8>* @llvm_mips_bset_b_ARG2
|
|
%2 = tail call <16 x i8> @llvm.mips.bset.b(<16 x i8> %0, <16 x i8> %1)
|
|
store <16 x i8> %2, <16 x i8>* @llvm_mips_bset_b_RES
|
|
ret void
|
|
}
|
|
|
|
declare <16 x i8> @llvm.mips.bset.b(<16 x i8>, <16 x i8>) nounwind
|
|
|
|
; CHECK: llvm_mips_bset_b_test:
|
|
; CHECK: ld.b
|
|
; CHECK: ld.b
|
|
; CHECK: bset.b
|
|
; CHECK: st.b
|
|
; CHECK: .size llvm_mips_bset_b_test
|
|
;
|
|
@llvm_mips_bset_h_ARG1 = global <8 x i16> <i16 0, i16 1, i16 2, i16 3, i16 4, i16 5, i16 6, i16 7>, align 16
|
|
@llvm_mips_bset_h_ARG2 = global <8 x i16> <i16 8, i16 9, i16 10, i16 11, i16 12, i16 13, i16 14, i16 15>, align 16
|
|
@llvm_mips_bset_h_RES = global <8 x i16> <i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0, i16 0>, align 16
|
|
|
|
define void @llvm_mips_bset_h_test() nounwind {
|
|
entry:
|
|
%0 = load <8 x i16>* @llvm_mips_bset_h_ARG1
|
|
%1 = load <8 x i16>* @llvm_mips_bset_h_ARG2
|
|
%2 = tail call <8 x i16> @llvm.mips.bset.h(<8 x i16> %0, <8 x i16> %1)
|
|
store <8 x i16> %2, <8 x i16>* @llvm_mips_bset_h_RES
|
|
ret void
|
|
}
|
|
|
|
declare <8 x i16> @llvm.mips.bset.h(<8 x i16>, <8 x i16>) nounwind
|
|
|
|
; CHECK: llvm_mips_bset_h_test:
|
|
; CHECK: ld.h
|
|
; CHECK: ld.h
|
|
; CHECK: bset.h
|
|
; CHECK: st.h
|
|
; CHECK: .size llvm_mips_bset_h_test
|
|
;
|
|
@llvm_mips_bset_w_ARG1 = global <4 x i32> <i32 0, i32 1, i32 2, i32 3>, align 16
|
|
@llvm_mips_bset_w_ARG2 = global <4 x i32> <i32 4, i32 5, i32 6, i32 7>, align 16
|
|
@llvm_mips_bset_w_RES = global <4 x i32> <i32 0, i32 0, i32 0, i32 0>, align 16
|
|
|
|
define void @llvm_mips_bset_w_test() nounwind {
|
|
entry:
|
|
%0 = load <4 x i32>* @llvm_mips_bset_w_ARG1
|
|
%1 = load <4 x i32>* @llvm_mips_bset_w_ARG2
|
|
%2 = tail call <4 x i32> @llvm.mips.bset.w(<4 x i32> %0, <4 x i32> %1)
|
|
store <4 x i32> %2, <4 x i32>* @llvm_mips_bset_w_RES
|
|
ret void
|
|
}
|
|
|
|
declare <4 x i32> @llvm.mips.bset.w(<4 x i32>, <4 x i32>) nounwind
|
|
|
|
; CHECK: llvm_mips_bset_w_test:
|
|
; CHECK: ld.w
|
|
; CHECK: ld.w
|
|
; CHECK: bset.w
|
|
; CHECK: st.w
|
|
; CHECK: .size llvm_mips_bset_w_test
|
|
;
|
|
@llvm_mips_bset_d_ARG1 = global <2 x i64> <i64 0, i64 1>, align 16
|
|
@llvm_mips_bset_d_ARG2 = global <2 x i64> <i64 2, i64 3>, align 16
|
|
@llvm_mips_bset_d_RES = global <2 x i64> <i64 0, i64 0>, align 16
|
|
|
|
define void @llvm_mips_bset_d_test() nounwind {
|
|
entry:
|
|
%0 = load <2 x i64>* @llvm_mips_bset_d_ARG1
|
|
%1 = load <2 x i64>* @llvm_mips_bset_d_ARG2
|
|
%2 = tail call <2 x i64> @llvm.mips.bset.d(<2 x i64> %0, <2 x i64> %1)
|
|
store <2 x i64> %2, <2 x i64>* @llvm_mips_bset_d_RES
|
|
ret void
|
|
}
|
|
|
|
declare <2 x i64> @llvm.mips.bset.d(<2 x i64>, <2 x i64>) nounwind
|
|
|
|
; CHECK: llvm_mips_bset_d_test:
|
|
; CHECK: ld.d
|
|
; CHECK: ld.d
|
|
; CHECK: bset.d
|
|
; CHECK: st.d
|
|
; CHECK: .size llvm_mips_bset_d_test
|
|
;
|