mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-08 03:30:22 +00:00
c2ebfd454c
This speeds up selected test cases by up to 5%; no slowdowns were observed. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@120286 91177308-0d34-0410-b5e6-96231b3b80d8
68 lines
1.9 KiB
LLVM
68 lines
1.9 KiB
LLVM
; RUN: llc -O1 --march=cellspu < %s | FileCheck %s
;
; Code-generation test for vector shuffles and element insertion.
; The command above compiles this file with llc at -O1 for the cellspu target
; and pipes the emitted assembly into FileCheck, which matches it against the
; directives embedded in the functions below, in the order they appear.
|
|
|
|
; Two-input shuffle with mask <4, 1, 2, 3>: mask index 4 addresses the first
; element of the second operand (%param2); indices 1-3 pick from %param1.
; The directives expect a cwd against 0($sp) followed by a shufb whose middle
; operands are $4 and $3; the remaining registers are left as wildcards.
define <4 x float> @shuffle(<4 x float> %param1, <4 x float> %param2) {
; CHECK: cwd {{\$.}}, 0($sp)
; CHECK: shufb {{\$., \$4, \$3, \$.}}
  %mixed = shufflevector <4 x float> %param1, <4 x float> %param2,
                         <4 x i32> <i32 4, i32 1, i32 2, i32 3>
  ret <4 x float> %mixed
}
|
|
|
|
; Broadcast of a scalar: %param1 is placed in a one-element vector, and an
; all-zero shuffle mask then replicates that element into all four result lanes.
; The directives expect, in order, an lqa, a shufb writing $3, and a bi.
define <4 x float> @splat(float %param1) {
; CHECK: lqa
; CHECK: shufb $3
; CHECK: bi
  %single = insertelement <1 x float> undef, float %param1, i32 0
  %bcast = shufflevector <1 x float> %single, <1 x float> undef,
                         <4 x i32> <i32 0, i32 0, i32 0, i32 0>
  ret <4 x float> %bcast
}
|
|
|
|
; Builds a <2 x float> from two scalars and stores it through %ptr:
; %val1 goes into lane 0 of a zero vector, then %val2 into lane 1.
; All FileCheck directives are gathered ahead of the IR; FileCheck matches them
; in the order written, independent of where the IR instructions sit.
define void @test_insert(<2 x float>* %ptr, float %val1, float %val2) {
;CHECK: lqa $6,
;CHECK: shufb $4, $4, $5, $6
;CHECK: cdd $5, 0($3)
;CHECK: lqd $6, 0($3)
;CHECK: shufb $4, $4, $6, $5
;CHECK: stqd $4, 0($3)
;CHECK: bi $lr
  ; lane 0 <- %val1, starting from an all-zero vector
  %lane0_set = insertelement <2 x float> zeroinitializer, float %val1, i32 0
  ; lane 1 <- %val2
  %both_set = insertelement <2 x float> %lane0_set, float %val2, i32 1
  store <2 x float> %both_set, <2 x float>* %ptr
  ret void
}
|
|
|
|
; Replaces element 1 of %vparam with %eltparam and returns the vector.
; The directives expect a cwd with offset 4 off $sp (presumably the byte offset
; of element 1 for 4-byte floats -- confirm against the SPU ISA), one shufb
; into $3, and then bi $lr.
define <4 x float> @test_insert_1(<4 x float> %vparam, float %eltparam) {
;CHECK: cwd $5, 4($sp)
;CHECK: shufb $3, $4, $3, $5
;CHECK: bi $lr
  %updated = insertelement <4 x float> %vparam, float %eltparam, i32 1
  ret <4 x float> %updated
}
|
|
|
|
; Extracts elements 1 and 2 of a <4 x i32> into a <2 x i32> result.
; The directives expect this to come out as one rotqbyi of $3 with an
; immediate of 4, followed by bi $lr.
define <2 x i32> @test_v2i32(<4 x i32> %vec) {
;CHECK: rotqbyi $3, $3, 4
;CHECK: bi $lr
  %pair = shufflevector <4 x i32> %vec, <4 x i32> undef, <2 x i32> <i32 1, i32 2>
  ret <2 x i32> %pair
}
|
|
|
|
; Single-input shuffle with mask <2, 3, 0, 1>: the two halves of %vec swap places.
; The directives expect one rotqbyi of $3 with an immediate of 8 (two 4-byte
; elements), followed by bi $lr.
define <4 x i32> @test_v4i32_rot8(<4 x i32> %vec) {
;CHECK: rotqbyi $3, $3, 8
;CHECK: bi $lr
  %rotated = shufflevector <4 x i32> %vec, <4 x i32> undef, <4 x i32> <i32 2, i32 3, i32 0, i32 1>
  ret <4 x i32> %rotated
}
|
|
|
|
; Single-input shuffle with mask <1, 2, 3, 0>: every element moves down one
; position and element 0 wraps around to the last lane.
; The directives expect one rotqbyi of $3 with an immediate of 4 (one 4-byte
; element), followed by bi $lr.
define <4 x i32> @test_v4i32_rot4(<4 x i32> %vec) {
;CHECK: rotqbyi $3, $3, 4
;CHECK: bi $lr
  %rotated = shufflevector <4 x i32> %vec, <4 x i32> undef, <4 x i32> <i32 1, i32 2, i32 3, i32 0>
  ret <4 x i32> %rotated
}
|
|
|