mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-10-25 10:27:04 +00:00
R600/SI: Make more unordered comparisons legal
This saves a second compare and an and / or by using the unordered comparison instructions. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@224066 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
@@ -1,7 +1,7 @@
|
||||
; RUN: llc < %s -march=r600 -mcpu=tahiti -verify-machineinstrs | FileCheck %s
|
||||
|
||||
; CHECK-LABEL: {{^}}flt_f64:
|
||||
; CHECK: v_cmp_lt_f64_e64 {{s[[0-9]+:[0-9]+], v[[0-9]+:[0-9]+], v[[0-9]+:[0-9]+]}}
|
||||
; CHECK: v_cmp_nge_f64_e32 vcc, {{v[[0-9]+:[0-9]+], v[[0-9]+:[0-9]+]}}
|
||||
define void @flt_f64(i32 addrspace(1)* %out, double addrspace(1)* %in1,
|
||||
double addrspace(1)* %in2) {
|
||||
%r0 = load double addrspace(1)* %in1
|
||||
@@ -13,7 +13,7 @@ define void @flt_f64(i32 addrspace(1)* %out, double addrspace(1)* %in1,
|
||||
}
|
||||
|
||||
; CHECK-LABEL: {{^}}fle_f64:
|
||||
; CHECK: v_cmp_le_f64_e64 {{s[[0-9]+:[0-9]+], v[[0-9]+:[0-9]+], v[[0-9]+:[0-9]+]}}
|
||||
; CHECK: v_cmp_ngt_f64_e32 vcc, {{v[[0-9]+:[0-9]+], v[[0-9]+:[0-9]+]}}
|
||||
define void @fle_f64(i32 addrspace(1)* %out, double addrspace(1)* %in1,
|
||||
double addrspace(1)* %in2) {
|
||||
%r0 = load double addrspace(1)* %in1
|
||||
@@ -25,7 +25,7 @@ define void @fle_f64(i32 addrspace(1)* %out, double addrspace(1)* %in1,
|
||||
}
|
||||
|
||||
; CHECK-LABEL: {{^}}fgt_f64:
|
||||
; CHECK: v_cmp_gt_f64_e64 {{s[[0-9]+:[0-9]+], v[[0-9]+:[0-9]+], v[[0-9]+:[0-9]+]}}
|
||||
; CHECK: v_cmp_nle_f64_e32 vcc, {{v[[0-9]+:[0-9]+], v[[0-9]+:[0-9]+]}}
|
||||
define void @fgt_f64(i32 addrspace(1)* %out, double addrspace(1)* %in1,
|
||||
double addrspace(1)* %in2) {
|
||||
%r0 = load double addrspace(1)* %in1
|
||||
@@ -37,7 +37,7 @@ define void @fgt_f64(i32 addrspace(1)* %out, double addrspace(1)* %in1,
|
||||
}
|
||||
|
||||
; CHECK-LABEL: {{^}}fge_f64:
|
||||
; CHECK: v_cmp_ge_f64_e64 {{s[[0-9]+:[0-9]+], v[[0-9]+:[0-9]+], v[[0-9]+:[0-9]+]}}
|
||||
; CHECK: v_cmp_nlt_f64_e32 vcc, {{v[[0-9]+:[0-9]+], v[[0-9]+:[0-9]+]}}
|
||||
define void @fge_f64(i32 addrspace(1)* %out, double addrspace(1)* %in1,
|
||||
double addrspace(1)* %in2) {
|
||||
%r0 = load double addrspace(1)* %in1
|
||||
|
||||
@@ -145,10 +145,8 @@ entry:
|
||||
; FUNC-LABEL: {{^}}f32_ugt:
|
||||
; R600: SETGE
|
||||
; R600: SETE_DX10
|
||||
; SI: v_cmp_u_f32
|
||||
; SI: v_cmp_gt_f32
|
||||
; SI: s_or_b64
|
||||
; SI: v_cndmask_b32
|
||||
; SI: v_cmp_nle_f32_e32 vcc
|
||||
; SI-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
|
||||
define void @f32_ugt(i32 addrspace(1)* %out, float %a, float %b) {
|
||||
entry:
|
||||
%0 = fcmp ugt float %a, %b
|
||||
@@ -160,10 +158,9 @@ entry:
|
||||
; FUNC-LABEL: {{^}}f32_uge:
|
||||
; R600: SETGT
|
||||
; R600: SETE_DX10
|
||||
; SI: v_cmp_u_f32
|
||||
; SI: v_cmp_ge_f32
|
||||
; SI: s_or_b64
|
||||
; SI: v_cndmask_b32
|
||||
|
||||
; SI: v_cmp_nlt_f32_e32 vcc
|
||||
; SI-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
|
||||
define void @f32_uge(i32 addrspace(1)* %out, float %a, float %b) {
|
||||
entry:
|
||||
%0 = fcmp uge float %a, %b
|
||||
@@ -175,10 +172,9 @@ entry:
|
||||
; FUNC-LABEL: {{^}}f32_ult:
|
||||
; R600: SETGE
|
||||
; R600: SETE_DX10
|
||||
; SI: v_cmp_u_f32
|
||||
; SI: v_cmp_lt_f32
|
||||
; SI: s_or_b64
|
||||
; SI: v_cndmask_b32
|
||||
|
||||
; SI: v_cmp_nge_f32_e32 vcc
|
||||
; SI-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
|
||||
define void @f32_ult(i32 addrspace(1)* %out, float %a, float %b) {
|
||||
entry:
|
||||
%0 = fcmp ult float %a, %b
|
||||
@@ -190,10 +186,9 @@ entry:
|
||||
; FUNC-LABEL: {{^}}f32_ule:
|
||||
; R600: SETGT
|
||||
; R600: SETE_DX10
|
||||
; SI: v_cmp_u_f32
|
||||
; SI: v_cmp_le_f32
|
||||
; SI: s_or_b64
|
||||
; SI: v_cndmask_b32
|
||||
|
||||
; SI: v_cmp_ngt_f32_e32 vcc
|
||||
; SI-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
|
||||
define void @f32_ule(i32 addrspace(1)* %out, float %a, float %b) {
|
||||
entry:
|
||||
%0 = fcmp ule float %a, %b
|
||||
|
||||
@@ -91,10 +91,9 @@ entry:
|
||||
}
|
||||
|
||||
; FUNC-LABEL: {{^}}f64_ugt:
|
||||
; SI: v_cmp_u_f64
|
||||
; SI: v_cmp_gt_f64
|
||||
; SI: s_or_b64
|
||||
; SI: v_cndmask_b32
|
||||
|
||||
; SI: v_cmp_nle_f64_e32 vcc
|
||||
; SI-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
|
||||
define void @f64_ugt(i32 addrspace(1)* %out, double %a, double %b) {
|
||||
entry:
|
||||
%0 = fcmp ugt double %a, %b
|
||||
@@ -104,10 +103,8 @@ entry:
|
||||
}
|
||||
|
||||
; FUNC-LABEL: {{^}}f64_uge:
|
||||
; SI: v_cmp_u_f64
|
||||
; SI: v_cmp_ge_f64
|
||||
; SI: s_or_b64
|
||||
; SI: v_cndmask_b32
|
||||
; SI: v_cmp_nlt_f64_e32 vcc
|
||||
; SI-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
|
||||
define void @f64_uge(i32 addrspace(1)* %out, double %a, double %b) {
|
||||
entry:
|
||||
%0 = fcmp uge double %a, %b
|
||||
@@ -117,10 +114,8 @@ entry:
|
||||
}
|
||||
|
||||
; FUNC-LABEL: {{^}}f64_ult:
|
||||
; SI: v_cmp_u_f64
|
||||
; SI: v_cmp_lt_f64
|
||||
; SI: s_or_b64
|
||||
; SI: v_cndmask_b32
|
||||
; SI: v_cmp_nge_f64_e32 vcc
|
||||
; SI-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
|
||||
define void @f64_ult(i32 addrspace(1)* %out, double %a, double %b) {
|
||||
entry:
|
||||
%0 = fcmp ult double %a, %b
|
||||
@@ -130,10 +125,8 @@ entry:
|
||||
}
|
||||
|
||||
; FUNC-LABEL: {{^}}f64_ule:
|
||||
; SI: v_cmp_u_f64
|
||||
; SI: v_cmp_le_f64
|
||||
; SI: s_or_b64
|
||||
; SI: v_cndmask_b32
|
||||
; SI: v_cmp_ngt_f64_e32 vcc
|
||||
; SI-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
|
||||
define void @f64_ule(i32 addrspace(1)* %out, double %a, double %b) {
|
||||
entry:
|
||||
%0 = fcmp ule double %a, %b
|
||||
|
||||
Reference in New Issue
Block a user