Dan Gohman 74feef261a Define patterns for shld and shrd that match immediate
shift counts, and patterns that match dynamic shift counts
when the subtract is obscured by a truncate node.

Add DAGCombiner support for recognizing rotate patterns
when the shift counts are defined by truncate nodes.

Fix and simplify the code for commuting shld and shrd
instructions to work even when the given instruction doesn't
have a parent, and when the caller needs a new instruction.

These changes allow LLVM to use the shld, shrd, rol, and ror
instructions on x86 to replace equivalent code using two
shifts and an or in many more cases.


git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@57662 91177308-0d34-0410-b5e6-96231b3b80d8
2008-10-17 01:23:35 +00:00

74 lines
1.4 KiB
LLVM

; RUN: llvm-as < %s | llc -march=x86 > %t
; RUN: grep rol %t | count 3
; RUN: grep ror %t | count 1
; RUN: grep shld %t | count 2
; RUN: grep shrd %t | count 2
define i16 @foo(i16 %x, i16 %y, i16 %z) nounwind readnone {
entry:
%0 = shl i16 %x, %z
%1 = sub i16 16, %z
%2 = lshr i16 %x, %1
%3 = or i16 %2, %0
ret i16 %3
}
define i16 @bar(i16 %x, i16 %y, i16 %z) nounwind readnone {
entry:
%0 = shl i16 %y, %z
%1 = sub i16 16, %z
%2 = lshr i16 %x, %1
%3 = or i16 %2, %0
ret i16 %3
}
define i16 @un(i16 %x, i16 %y, i16 %z) nounwind readnone {
entry:
%0 = lshr i16 %x, %z
%1 = sub i16 16, %z
%2 = shl i16 %x, %1
%3 = or i16 %2, %0
ret i16 %3
}
define i16 @bu(i16 %x, i16 %y, i16 %z) nounwind readnone {
entry:
%0 = lshr i16 %y, %z
%1 = sub i16 16, %z
%2 = shl i16 %x, %1
%3 = or i16 %2, %0
ret i16 %3
}
define i16 @xfoo(i16 %x, i16 %y, i16 %z) nounwind readnone {
entry:
%0 = lshr i16 %x, 11
%1 = shl i16 %x, 5
%2 = or i16 %0, %1
ret i16 %2
}
define i16 @xbar(i16 %x, i16 %y, i16 %z) nounwind readnone {
entry:
%0 = shl i16 %y, 5
%1 = lshr i16 %x, 11
%2 = or i16 %0, %1
ret i16 %2
}
define i16 @xun(i16 %x, i16 %y, i16 %z) nounwind readnone {
entry:
%0 = lshr i16 %x, 5
%1 = shl i16 %x, 11
%2 = or i16 %0, %1
ret i16 %2
}
define i16 @xbu(i16 %x, i16 %y, i16 %z) nounwind readnone {
entry:
%0 = lshr i16 %y, 5
%1 = shl i16 %x, 11
%2 = or i16 %0, %1
ret i16 %2
}