mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-07-24 22:24:54 +00:00
Refine fix to bug 15041.
Thanks to help from Nadav and Hal, I have a more reasonable (and even correct!) approach. This specifically penalizes the insertelement and extractelement operations for the performance hit that will occur on PowerPC processors.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@174725 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
16
test/Analysis/CostModel/PowerPC/insert_extract.ll
Normal file
16
test/Analysis/CostModel/PowerPC/insert_extract.ll
Normal file
@@ -0,0 +1,16 @@
|
||||
; RUN: opt < %s -cost-model -analyze -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 | FileCheck %s
; Cost-model regression test for vector element insertion and extraction on a
; 64-bit PowerPC (pwr7) target. Each function below carries one FileCheck
; expectation that is matched against the printed cost-model analysis.
target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-f128:128:128-v128:128:128-n32:64"
target triple = "powerpc64-unknown-linux-gnu"
|
||||
|
||||
; Inserts the scalar %arg into lane 0 of an undef <4 x i32> vector. The
; resulting vector %x is intentionally left unused and the function returns
; undef: only the reported cost of the insertelement instruction is examined.
; The expectation inside the body requires that cost to be 13.
define i32 @insert(i32 %arg) {
  ; CHECK: cost of 13 {{.*}} insertelement
  %x = insertelement <4 x i32> undef, i32 %arg, i32 0
  ret i32 undef
}
|
||||
|
||||
; Extracts lane 0 of the <4 x i32> argument and returns it. The expectation
; inside the body requires the cost-model analysis to report a cost of 13 for
; the extractelement instruction.
define i32 @extract(<4 x i32> %arg) {
  ; CHECK: cost of 13 {{.*}} extractelement
  %x = extractelement <4 x i32> %arg, i32 0
  ret i32 %x
}
|
||||
|
Reference in New Issue
Block a user