mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-02-23 20:29:30 +00:00
- FP_EXTEND only support extending from vectors with matching elements. This results in the scalarization of extending to v2f64 from v2f32, which will be legalized to v4f32 not matching with v2f64. - add X86-specific VFPEXT supproting extending from v4f32 to v2f64. - add BUILD_VECTOR lowering helper to recover back the original extending from v4f32 to v2f64. - test case is enhanced to include different vector width. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@161894 91177308-0d34-0410-b5e6-96231b3b80d8
57 lines
1.3 KiB
LLVM
57 lines
1.3 KiB
LLVM
; RUN: llc < %s -mtriple=x86_64-pc-linux -mcpu=corei7 | FileCheck %s
|
|
; RUN: llc < %s -mtriple=x86_64-pc-linux -mcpu=core-avx-i | FileCheck %s --check-prefix=AVX
|
|
|
|
define <2 x double> @v2f2d_ext_vec(<2 x float> %v1) nounwind {
|
|
entry:
|
|
; CHECK: v2f2d_ext_vec
|
|
; CHECK: cvtps2pd
|
|
; AVX: v2f2d_ext_vec
|
|
; AVX: vcvtps2pd
|
|
%f1 = fpext <2 x float> %v1 to <2 x double>
|
|
ret <2 x double> %f1
|
|
}
|
|
|
|
define <3 x double> @v3f2d_ext_vec(<3 x float> %v1) nounwind {
|
|
entry:
|
|
; CHECK: v3f2d_ext_vec
|
|
; CHECK: cvtps2pd
|
|
; CHECK: movhlps
|
|
; CHECK: cvtps2pd
|
|
; AVX: v3f2d_ext_vec
|
|
; AVX: vcvtps2pd
|
|
; AVX: ret
|
|
%f1 = fpext <3 x float> %v1 to <3 x double>
|
|
ret <3 x double> %f1
|
|
}
|
|
|
|
define <4 x double> @v4f2d_ext_vec(<4 x float> %v1) nounwind {
|
|
entry:
|
|
; CHECK: v4f2d_ext_vec
|
|
; CHECK: cvtps2pd
|
|
; CHECK: movhlps
|
|
; CHECK: cvtps2pd
|
|
; AVX: v4f2d_ext_vec
|
|
; AVX: vcvtps2pd
|
|
; AVX: ret
|
|
%f1 = fpext <4 x float> %v1 to <4 x double>
|
|
ret <4 x double> %f1
|
|
}
|
|
|
|
define <8 x double> @v8f2d_ext_vec(<8 x float> %v1) nounwind {
|
|
entry:
|
|
; CHECK: v8f2d_ext_vec
|
|
; CHECK: cvtps2pd
|
|
; CHECK: cvtps2pd
|
|
; CHECK: movhlps
|
|
; CHECK: cvtps2pd
|
|
; CHECK: movhlps
|
|
; CHECK: cvtps2pd
|
|
; AVX: v8f2d_ext_vec
|
|
; AVX: vcvtps2pd
|
|
; AVX: vextractf128
|
|
; AVX: vcvtps2pd
|
|
; AVX: ret
|
|
%f1 = fpext <8 x float> %v1 to <8 x double>
|
|
ret <8 x double> %f1
|
|
}
|