2010-07-05 05:52:56 +00:00
|
|
|
; RUN: llc < %s -march=x86-64 -mcpu=penryn -asm-verbose=0 -o - | FileCheck %s -check-prefix=X64
|
2010-07-05 03:56:55 +00:00
|
|
|
; RUN: llc < %s -mcpu=yonah -march=x86 -asm-verbose=0 -o - | FileCheck %s -check-prefix=X32
|
2010-07-04 22:57:10 +00:00
|
|
|
|
|
|
|
; PR7518
|
|
|
|
; Scalar add of the two lanes of a <2 x float> argument.
; The body extracts elements 0 and 1 of %Q, adds them with fadd, and stores
; the float result through %P2.
; The 64-bit patterns inside this function expect, directly after the label,
; an addss of %xmm1 into %xmm0, a movss store to (%rdi), and ret.
; The 32-bit patterns expect the two operands to be read from 4(%esp) and
; 8(%esp), the pointer to be loaded from 12(%esp), then the movss store and ret.
; Every pattern after the label uses the -NEXT form, so the instructions must
; appear on consecutive output lines with nothing in between.
define void @test1(<2 x float> %Q, float *%P2) nounwind {
|
|
|
|
%a = extractelement <2 x float> %Q, i32 0
|
|
|
|
%b = extractelement <2 x float> %Q, i32 1
|
|
|
|
%c = fadd float %a, %b
|
|
|
|
|
|
|
|
store float %c, float* %P2
|
|
|
|
ret void
|
Just rip v2f32 support completely out of the X86 backend. In
the example in the testcase, we now generate:
_test1: ## @test1
movss 4(%esp), %xmm0
addss 8(%esp), %xmm0
movl 12(%esp), %eax
movss %xmm0, (%eax)
ret
instead of:
_test1: ## @test1
subl $20, %esp
movl 24(%esp), %eax
movq %mm0, (%esp)
movq %mm0, 8(%esp)
movss (%esp), %xmm0
addss 12(%esp), %xmm0
movss %xmm0, (%eax)
addl $20, %esp
ret
v2f32 support did not work reliably because most of the X86
backend didn't know it was legal. It was apparently only added
to support returning source-level v2f32 values in MMX registers
in x86-32 mode. If ABI compatibility is important on this
GCC-extended-vector type for some reason, then the frontend
should generate IR that returns v2i32 instead of v2f32. However,
we generally don't try very hard to be abi compatible on gcc
extended vectors.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@107601 91177308-0d34-0410-b5e6-96231b3b80d8
2010-07-04 23:07:25 +00:00
|
|
|
; X64: test1:
|
|
|
|
; X64-NEXT: addss %xmm1, %xmm0
|
|
|
|
; X64-NEXT: movss %xmm0, (%rdi)
|
|
|
|
; X64-NEXT: ret
|
|
|
|
|
|
|
|
; X32: test1:
|
|
|
|
; X32-NEXT: movss 4(%esp), %xmm0
|
|
|
|
; X32-NEXT: addss 8(%esp), %xmm0
|
|
|
|
; X32-NEXT: movl 12(%esp), %eax
|
|
|
|
; X32-NEXT: movss %xmm0, (%eax)
|
|
|
|
; X32-NEXT: ret
|
2010-07-04 22:57:10 +00:00
|
|
|
}
|
|
|
|
|
2010-07-05 05:52:56 +00:00
|
|
|
|
|
|
|
; Vector add of two <2 x float> arguments, with the sum returned by value.
; %P is declared in the signature but is not referenced in the body.
; The 64-bit patterns inside this function expect, directly after the label:
; four insertps instructions with immediates $0, $16, $0, $16 in that order,
; then addps, movaps, pshufd, and ret, each on consecutive output lines
; (-NEXT form). Operands are deliberately left unmatched after the mnemonic
; or immediate. No 32-bit patterns for this function are visible in this
; part of the file.
define <2 x float> @test2(<2 x float> %Q, <2 x float> %R, <2 x float> *%P) nounwind {
|
|
|
|
%Z = fadd <2 x float> %Q, %R
|
|
|
|
ret <2 x float> %Z
|
|
|
|
|
|
|
|
; X64: test2:
|
|
|
|
; X64-NEXT: insertps $0
|
|
|
|
; X64-NEXT: insertps $16
|
|
|
|
; X64-NEXT: insertps $0
|
|
|
|
; X64-NEXT: insertps $16
|
|
|
|
; X64-NEXT: addps
|
|
|
|
; X64-NEXT: movaps
|
|
|
|
; X64-NEXT: pshufd
|
|
|
|
; X64-NEXT: ret
|
|
|
|
}
|