llvm-6502/test/CodeGen/X86/bswap.ll

; Check x86 and x86-64 code generation for the llvm.bswap intrinsics, and for
; shift/or idioms that should (or should not) be turned into a bswap.

; RUN: llc < %s -march=x86 -mcpu=i686 | FileCheck %s
; RUN: llc < %s -march=x86-64 | FileCheck %s --check-prefix=CHECK64

; Byte-swap intrinsics for 16-, 32- and 64-bit integers; they are called by
; @W, @X and @Y respectively.
declare i16 @llvm.bswap.i16(i16)

declare i32 @llvm.bswap.i32(i32)

declare i64 @llvm.bswap.i64(i64)

; 16-bit byte swap of a non-constant argument through llvm.bswap.i16.
; Both configurations expect a 16-bit rotate by 8 (rolw $8). The 32-bit checks
; pin the register to %ax; the 64-bit checks accept any register.
define i16 @W(i16 %A) {
; CHECK-LABEL: W:
; CHECK: rolw $8, %ax

; CHECK64-LABEL: W:
; CHECK64: rolw $8, %
        %Z = call i16 @llvm.bswap.i16( i16 %A )         ; <i16> [#uses=1]
        ret i16 %Z
}

; 32-bit byte swap of a non-constant argument through llvm.bswap.i32.
; Both configurations expect a single bswapl. The 32-bit checks pin the
; register to %eax; the 64-bit checks accept any register.
define i32 @X(i32 %A) {
; CHECK-LABEL: X:
; CHECK: bswapl %eax

; CHECK64-LABEL: X:
; CHECK64: bswapl %
        %Z = call i32 @llvm.bswap.i32( i32 %A )         ; <i32> [#uses=1]
        ret i32 %Z
}

; 64-bit byte swap of a non-constant argument through llvm.bswap.i64.
; The 32-bit configuration expects two 32-bit swaps, first on %eax and then on
; %edx (presumably the two halves of the i64 value). The 64-bit configuration
; expects a single bswapq on any register.
define i64 @Y(i64 %A) {
; CHECK-LABEL: Y:
; CHECK: bswapl %eax
; CHECK: bswapl %edx

; CHECK64-LABEL: Y:
; CHECK64: bswapq %
        %Z = call i64 @llvm.bswap.i64( i64 %A )         ; <i64> [#uses=1]
        ret i64 %Z
}

; rdar://9164521
; Halfword byte swap spelled out with shifts and masks:
;   ((a >> 8) & 0xff) | ((a << 8) & 0xff00)
; Both configurations expect a 32-bit bswap followed by a logical right shift
; by 16 of the same register.
; Note: the value names do not describe their defining instructions (%and is
; produced by lshr, %shr3 by and, %and2 by shl, %shl by and).
define i32 @test1(i32 %a) nounwind readnone {
entry:
; CHECK-LABEL: test1:
; CHECK: bswapl [[REG:%.*]]
; CHECK: shrl $16, [[REG]]

; CHECK64-LABEL: test1:
; CHECK64: bswapl [[REG:%.*]]
; CHECK64: shrl $16, [[REG]]
  %and = lshr i32 %a, 8
  %shr3 = and i32 %and, 255
  %and2 = shl i32 %a, 8
  %shl = and i32 %and2, 65280
  %or = or i32 %shr3, %shl
  ret i32 %or
}

; Halfword byte swap followed by a sign extension of the low 16 bits:
;   or     = ((a >> 8) & 0xff) | (a << 8)
;   result = (or << 16) >> 16        ; arithmetic shift right
; The left shift is not masked here; the shl by 16 that follows discards
; everything above bit 15. Both configurations expect a 32-bit bswap followed
; by an arithmetic right shift by 16 of the same register.
; Note: as in @test1, the value names do not describe their defining
; instructions (%and is produced by lshr, %shr4 by and, %and2 by shl).
define i32 @test2(i32 %a) nounwind readnone {
entry:
; CHECK-LABEL: test2:
; CHECK: bswapl [[REG:%.*]]
; CHECK: sarl $16, [[REG]]

; CHECK64-LABEL: test2:
; CHECK64: bswapl [[REG:%.*]]
; CHECK64: sarl $16, [[REG]]
  %and = lshr i32 %a, 8
  %shr4 = and i32 %and, 255
  %and2 = shl i32 %a, 8
  %or = or i32 %shr4, %and2
  %sext = shl i32 %or, 16
  %conv3 = ashr exact i32 %sext, 16
  ret i32 %conv3
}

; Zero-initialized globals used as inputs by the i64 tests below: each test
; loads one of them and zero-extends the i8/i16 value to i64.
@var8 = global i8 0
@var16 = global i16 0

; The "shl" below can move bits into the high parts of the value, so the
; operation is not a "bswap, shr" pair.
;
; %big is a zero-extended i16, and the unmasked "shl" by 8 moves its upper
; byte into bits 16-23 of the result; a byte swap followed by a right shift
; would leave those bits zero.
;
; The x86-64 negative check rejects both the 32-bit and the 64-bit form of the
; instruction, so a wrongly formed bswapl is caught as well as a bswapq. The
; pattern keeps the l/q suffix instead of matching plain "bswap" because the
; name of this function itself contains that text.

; rdar://problem/14814049
define i64 @not_bswap() {
; CHECK-LABEL: not_bswap:
; CHECK-NOT: bswapl
; CHECK: ret

; CHECK64-LABEL: not_bswap:
; CHECK64-NOT: bswap{{[lq]}}
; CHECK64: ret
  %init = load i16* @var16
  %big = zext i16 %init to i64

  %hishifted = lshr i64 %big, 8
  %loshifted = shl i64 %big, 8

  %notswapped = or i64 %hishifted, %loshifted

  ret i64 %notswapped
}

; This time, the lshr (and subsequent or) is completely useless. While it's
; technically correct to convert this into a "bswap, shr", it's suboptimal. A
; simple shl works better.
;
; %big is a zero-extended i8, so shifting it right by 8 always yields zero and
; only the "shl" contributes to the result.
;
; The x86-64 negative check rejects both the 32-bit and the 64-bit form of the
; instruction, so an unwanted bswapl is caught as well as a bswapq. The
; pattern keeps the l/q suffix instead of matching plain "bswap" because the
; name of this function itself contains that text.

define i64 @not_useful_bswap() {
; CHECK-LABEL: not_useful_bswap:
; CHECK-NOT: bswapl
; CHECK: ret

; CHECK64-LABEL: not_useful_bswap:
; CHECK64-NOT: bswap{{[lq]}}
; CHECK64: ret

  %init = load i8* @var8
  %big = zext i8 %init to i64

  %hishifted = lshr i64 %big, 8
  %loshifted = shl i64 %big, 8

  %notswapped = or i64 %hishifted, %loshifted

  ret i64 %notswapped
}

; Finally, it *is* OK to just mask off the shl if we know that the value is zero
; beyond 16 bits anyway. This is a legitimate bswap.
;
; %big is a zero-extended i16. Only the left-shifted half is masked (with 255)
; before the shift; the right-shifted half needs no mask because the bits of
; %big above bit 15 are already zero.
; Expected code: the 32-bit configuration checks for a bswapl followed by a
; shrl by 16 of the same register; the 64-bit configuration checks for a
; bswapq followed by a shrq by 48 of the same register.

define i64 @finally_useful_bswap() {
; CHECK-LABEL: finally_useful_bswap:
; CHECK: bswapl [[REG:%.*]]
; CHECK: shrl $16, [[REG]]
; CHECK: ret

; CHECK64-LABEL: finally_useful_bswap:
; CHECK64: bswapq [[REG:%.*]]
; CHECK64: shrq $48, [[REG]]
; CHECK64: ret

  %init = load i16* @var16
  %big = zext i16 %init to i64

  %hishifted = lshr i64 %big, 8
  %lomasked = and i64 %big, 255
  %loshifted = shl i64 %lomasked, 8

  %swapped = or i64 %hishifted, %loshifted

  ret i64 %swapped
}
bswap implementation git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@25312 91177308-0d34-0410-b5e6-96231b3b80d8 2006-01-14 03:14:10 +00:00			`; bswap should be constant folded when it is passed a constant argument`

Force CPU type on test so it doesn't accidentally emit movbe instead of bswap on Intel Atom CPUs. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@141863 91177308-0d34-0410-b5e6-96231b3b80d8 2011-10-13 14:27:54 +00:00			`; RUN: llc < %s -march=x86 -mcpu=i686 \| FileCheck %s`
DAGCombiner: make sure or/shl/srl really has zero high bits before forming bswap We want to convert code like (or (srl N, 8), (shl N, 8)) into (srl (bswap N), const), but this is only valid if the bits above 16 on the source pattern are 0, the checks we were doing on this were slightly wrong before. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@189348 91177308-0d34-0410-b5e6-96231b3b80d8 2013-08-27 13:46:45 +00:00			`; RUN: llc < %s -march=x86-64 \| FileCheck %s --check-prefix=CHECK64`
bswap implementation git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@25312 91177308-0d34-0410-b5e6-96231b3b80d8 2006-01-14 03:14:10 +00:00
Remove llvm-upgrade and update tests. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@47432 91177308-0d34-0410-b5e6-96231b3b80d8 2008-02-21 07:42:26 +00:00			`declare i16 @llvm.bswap.i16(i16)`
bswap implementation git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@25312 91177308-0d34-0410-b5e6-96231b3b80d8 2006-01-14 03:14:10 +00:00
Remove llvm-upgrade and update tests. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@47432 91177308-0d34-0410-b5e6-96231b3b80d8 2008-02-21 07:42:26 +00:00			`declare i32 @llvm.bswap.i32(i32)`

			`declare i64 @llvm.bswap.i64(i64)`

			`define i16 @W(i16 %A) {`
Mass update to CodeGen tests to use CHECK-LABEL for labels corresponding to function definitions for more informative error messages. No functionality change and all updated tests passed locally. This update was done with the following bash script: find test/CodeGen -name ".ll" \| \ while read NAME; do echo "$NAME" if ! grep -q "^; RUN: llc.debug" $NAME; then TEMP=`mktemp -t temp` cp $NAME $TEMP sed -n "s/^define [^@]@\([A-Za-z0-9_]\)(.$/\1/p" < $NAME \| \ while read FUNC; do sed -i '' "s/;\(.\)\([A-Za-z0-9_-]\):\( \)$FUNC: \$/;\1\2-LABEL:\3$FUNC:/g" $TEMP done sed -i '' "s/;\(.\)-LABEL-LABEL:/;\1-LABEL:/" $TEMP sed -i '' "s/;\(.\)-NEXT-LABEL:/;\1-NEXT:/" $TEMP sed -i '' "s/;\(.\)-NOT-LABEL:/;\1-NOT:/" $TEMP sed -i '' "s/;\(.*\)-DAG-LABEL:/;\1-DAG:/" $TEMP mv $TEMP $NAME fi done git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@186280 91177308-0d34-0410-b5e6-96231b3b80d8 2013-07-14 06:24:09 +00:00			`; CHECK-LABEL: W:`
Teach dag combine to match halfword byteswap patterns. 1. (((x) & 0xFF00) >> 8) \| (((x) & 0x00FF) << 8) => (bswap x) >> 16 2. ((x&0xff)<<8)\|((x&0xff00)>>8)\|((x&0xff000000)>>8)\|((x&0x00ff0000)<<8)) => (rotl (bswap x) 16) This allows us to eliminate most of the def : Pat patterns for ARM rev16 revsh instructions. It catches many more cases for ARM and x86. rdar://9609108 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@133503 91177308-0d34-0410-b5e6-96231b3b80d8 2011-06-21 06:01:08 +00:00			`; CHECK: rolw $8, %ax`
DAGCombiner: make sure or/shl/srl really has zero high bits before forming bswap We want to convert code like (or (srl N, 8), (shl N, 8)) into (srl (bswap N), const), but this is only valid if the bits above 16 on the source pattern are 0, the checks we were doing on this were slightly wrong before. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@189348 91177308-0d34-0410-b5e6-96231b3b80d8 2013-08-27 13:46:45 +00:00
			`; CHECK64-LABEL: W:`
			`; CHECK64: rolw $8, %`
Remove llvm-upgrade and update tests. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@47432 91177308-0d34-0410-b5e6-96231b3b80d8 2008-02-21 07:42:26 +00:00			`%Z = call i16 @llvm.bswap.i16( i16 %A ) ; <i16> [#uses=1]`
			`ret i16 %Z`
bswap implementation git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@25312 91177308-0d34-0410-b5e6-96231b3b80d8 2006-01-14 03:14:10 +00:00			`}`

Remove llvm-upgrade and update tests. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@47432 91177308-0d34-0410-b5e6-96231b3b80d8 2008-02-21 07:42:26 +00:00			`define i32 @X(i32 %A) {`
Mass update to CodeGen tests to use CHECK-LABEL for labels corresponding to function definitions for more informative error messages. No functionality change and all updated tests passed locally. This update was done with the following bash script: find test/CodeGen -name ".ll" \| \ while read NAME; do echo "$NAME" if ! grep -q "^; RUN: llc.debug" $NAME; then TEMP=`mktemp -t temp` cp $NAME $TEMP sed -n "s/^define [^@]@\([A-Za-z0-9_]\)(.$/\1/p" < $NAME \| \ while read FUNC; do sed -i '' "s/;\(.\)\([A-Za-z0-9_-]\):\( \)$FUNC: \$/;\1\2-LABEL:\3$FUNC:/g" $TEMP done sed -i '' "s/;\(.\)-LABEL-LABEL:/;\1-LABEL:/" $TEMP sed -i '' "s/;\(.\)-NEXT-LABEL:/;\1-NEXT:/" $TEMP sed -i '' "s/;\(.\)-NOT-LABEL:/;\1-NOT:/" $TEMP sed -i '' "s/;\(.*\)-DAG-LABEL:/;\1-DAG:/" $TEMP mv $TEMP $NAME fi done git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@186280 91177308-0d34-0410-b5e6-96231b3b80d8 2013-07-14 06:24:09 +00:00			`; CHECK-LABEL: X:`
Teach dag combine to match halfword byteswap patterns. 1. (((x) & 0xFF00) >> 8) \| (((x) & 0x00FF) << 8) => (bswap x) >> 16 2. ((x&0xff)<<8)\|((x&0xff00)>>8)\|((x&0xff000000)>>8)\|((x&0x00ff0000)<<8)) => (rotl (bswap x) 16) This allows us to eliminate most of the def : Pat patterns for ARM rev16 revsh instructions. It catches many more cases for ARM and x86. rdar://9609108 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@133503 91177308-0d34-0410-b5e6-96231b3b80d8 2011-06-21 06:01:08 +00:00			`; CHECK: bswapl %eax`
DAGCombiner: make sure or/shl/srl really has zero high bits before forming bswap We want to convert code like (or (srl N, 8), (shl N, 8)) into (srl (bswap N), const), but this is only valid if the bits above 16 on the source pattern are 0, the checks we were doing on this were slightly wrong before. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@189348 91177308-0d34-0410-b5e6-96231b3b80d8 2013-08-27 13:46:45 +00:00
			`; CHECK64-LABEL: X:`
			`; CHECK64: bswapl %`
Remove llvm-upgrade and update tests. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@47432 91177308-0d34-0410-b5e6-96231b3b80d8 2008-02-21 07:42:26 +00:00			`%Z = call i32 @llvm.bswap.i32( i32 %A ) ; <i32> [#uses=1]`
			`ret i32 %Z`
bswap implementation git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@25312 91177308-0d34-0410-b5e6-96231b3b80d8 2006-01-14 03:14:10 +00:00			`}`

Remove llvm-upgrade and update tests. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@47432 91177308-0d34-0410-b5e6-96231b3b80d8 2008-02-21 07:42:26 +00:00			`define i64 @Y(i64 %A) {`
Mass update to CodeGen tests to use CHECK-LABEL for labels corresponding to function definitions for more informative error messages. No functionality change and all updated tests passed locally. This update was done with the following bash script: find test/CodeGen -name ".ll" \| \ while read NAME; do echo "$NAME" if ! grep -q "^; RUN: llc.debug" $NAME; then TEMP=`mktemp -t temp` cp $NAME $TEMP sed -n "s/^define [^@]@\([A-Za-z0-9_]\)(.$/\1/p" < $NAME \| \ while read FUNC; do sed -i '' "s/;\(.\)\([A-Za-z0-9_-]\):\( \)$FUNC: \$/;\1\2-LABEL:\3$FUNC:/g" $TEMP done sed -i '' "s/;\(.\)-LABEL-LABEL:/;\1-LABEL:/" $TEMP sed -i '' "s/;\(.\)-NEXT-LABEL:/;\1-NEXT:/" $TEMP sed -i '' "s/;\(.\)-NOT-LABEL:/;\1-NOT:/" $TEMP sed -i '' "s/;\(.*\)-DAG-LABEL:/;\1-DAG:/" $TEMP mv $TEMP $NAME fi done git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@186280 91177308-0d34-0410-b5e6-96231b3b80d8 2013-07-14 06:24:09 +00:00			`; CHECK-LABEL: Y:`
Teach dag combine to match halfword byteswap patterns. 1. (((x) & 0xFF00) >> 8) \| (((x) & 0x00FF) << 8) => (bswap x) >> 16 2. ((x&0xff)<<8)\|((x&0xff00)>>8)\|((x&0xff000000)>>8)\|((x&0x00ff0000)<<8)) => (rotl (bswap x) 16) This allows us to eliminate most of the def : Pat patterns for ARM rev16 revsh instructions. It catches many more cases for ARM and x86. rdar://9609108 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@133503 91177308-0d34-0410-b5e6-96231b3b80d8 2011-06-21 06:01:08 +00:00			`; CHECK: bswapl %eax`
			`; CHECK: bswapl %edx`
DAGCombiner: make sure or/shl/srl really has zero high bits before forming bswap We want to convert code like (or (srl N, 8), (shl N, 8)) into (srl (bswap N), const), but this is only valid if the bits above 16 on the source pattern are 0, the checks we were doing on this were slightly wrong before. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@189348 91177308-0d34-0410-b5e6-96231b3b80d8 2013-08-27 13:46:45 +00:00
			`; CHECK64-LABEL: Y:`
			`; CHECK64: bswapq %`
Remove llvm-upgrade and update tests. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@47432 91177308-0d34-0410-b5e6-96231b3b80d8 2008-02-21 07:42:26 +00:00			`%Z = call i64 @llvm.bswap.i64( i64 %A ) ; <i64> [#uses=1]`
			`ret i64 %Z`
bswap implementation git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@25312 91177308-0d34-0410-b5e6-96231b3b80d8 2006-01-14 03:14:10 +00:00			`}`
Remove llvm-upgrade and update tests. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@47432 91177308-0d34-0410-b5e6-96231b3b80d8 2008-02-21 07:42:26 +00:00
Teach dag combine to match halfword byteswap patterns. 1. (((x) & 0xFF00) >> 8) \| (((x) & 0x00FF) << 8) => (bswap x) >> 16 2. ((x&0xff)<<8)\|((x&0xff00)>>8)\|((x&0xff000000)>>8)\|((x&0x00ff0000)<<8)) => (rotl (bswap x) 16) This allows us to eliminate most of the def : Pat patterns for ARM rev16 revsh instructions. It catches many more cases for ARM and x86. rdar://9609108 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@133503 91177308-0d34-0410-b5e6-96231b3b80d8 2011-06-21 06:01:08 +00:00			`; rdar://9164521`
			`define i32 @test1(i32 %a) nounwind readnone {`
			`entry:`
DAGCombiner: make sure or/shl/srl really has zero high bits before forming bswap We want to convert code like (or (srl N, 8), (shl N, 8)) into (srl (bswap N), const), but this is only valid if the bits above 16 on the source pattern are 0, the checks we were doing on this were slightly wrong before. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@189348 91177308-0d34-0410-b5e6-96231b3b80d8 2013-08-27 13:46:45 +00:00			`; CHECK-LABEL: test1:`
			`; CHECK: bswapl [[REG:%.*]]`
			`; CHECK: shrl $16, [[REG]]`

			`; CHECK64-LABEL: test1:`
			`; CHECK64: bswapl [[REG:%.*]]`
			`; CHECK64: shrl $16, [[REG]]`
Teach dag combine to match halfword byteswap patterns. 1. (((x) & 0xFF00) >> 8) \| (((x) & 0x00FF) << 8) => (bswap x) >> 16 2. ((x&0xff)<<8)\|((x&0xff00)>>8)\|((x&0xff000000)>>8)\|((x&0x00ff0000)<<8)) => (rotl (bswap x) 16) This allows us to eliminate most of the def : Pat patterns for ARM rev16 revsh instructions. It catches many more cases for ARM and x86. rdar://9609108 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@133503 91177308-0d34-0410-b5e6-96231b3b80d8 2011-06-21 06:01:08 +00:00			`%and = lshr i32 %a, 8`
			`%shr3 = and i32 %and, 255`
			`%and2 = shl i32 %a, 8`
			`%shl = and i32 %and2, 65280`
			`%or = or i32 %shr3, %shl`
			`ret i32 %or`
			`}`

			`define i32 @test2(i32 %a) nounwind readnone {`
			`entry:`
DAGCombiner: make sure or/shl/srl really has zero high bits before forming bswap We want to convert code like (or (srl N, 8), (shl N, 8)) into (srl (bswap N), const), but this is only valid if the bits above 16 on the source pattern are 0, the checks we were doing on this were slightly wrong before. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@189348 91177308-0d34-0410-b5e6-96231b3b80d8 2013-08-27 13:46:45 +00:00			`; CHECK-LABEL: test2:`
			`; CHECK: bswapl [[REG:%.*]]`
			`; CHECK: sarl $16, [[REG]]`

			`; CHECK64-LABEL: test2:`
			`; CHECK64: bswapl [[REG:%.*]]`
			`; CHECK64: sarl $16, [[REG]]`
Teach dag combine to match halfword byteswap patterns. 1. (((x) & 0xFF00) >> 8) \| (((x) & 0x00FF) << 8) => (bswap x) >> 16 2. ((x&0xff)<<8)\|((x&0xff00)>>8)\|((x&0xff000000)>>8)\|((x&0x00ff0000)<<8)) => (rotl (bswap x) 16) This allows us to eliminate most of the def : Pat patterns for ARM rev16 revsh instructions. It catches many more cases for ARM and x86. rdar://9609108 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@133503 91177308-0d34-0410-b5e6-96231b3b80d8 2011-06-21 06:01:08 +00:00			`%and = lshr i32 %a, 8`
			`%shr4 = and i32 %and, 255`
			`%and2 = shl i32 %a, 8`
			`%or = or i32 %shr4, %and2`
			`%sext = shl i32 %or, 16`
			`%conv3 = ashr exact i32 %sext, 16`
			`ret i32 %conv3`
			`}`
DAGCombiner: make sure or/shl/srl really has zero high bits before forming bswap We want to convert code like (or (srl N, 8), (shl N, 8)) into (srl (bswap N), const), but this is only valid if the bits above 16 on the source pattern are 0, the checks we were doing on this were slightly wrong before. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@189348 91177308-0d34-0410-b5e6-96231b3b80d8 2013-08-27 13:46:45 +00:00
			`@var8 = global i8 0`
			`@var16 = global i16 0`

			`; The "shl" below can move bits into the high parts of the value, so the`
			`; operation is not a "bswap, shr" pair.`

			`; rdar://problem/14814049`
			`define i64 @not_bswap() {`
			`; CHECK-LABEL: not_bswap:`
			`; CHECK-NOT: bswapl`
			`; CHECK: ret`

			`; CHECK64-LABEL: not_bswap:`
			`; CHECK64-NOT: bswapq`
			`; CHECK64: ret`
			`%init = load i16* @var16`
			`%big = zext i16 %init to i64`

			`%hishifted = lshr i64 %big, 8`
			`%loshifted = shl i64 %big, 8`

			`%notswapped = or i64 %hishifted, %loshifted`

			`ret i64 %notswapped`
			`}`

			`; This time, the lshr (and subsequent or) is completely useless. While it's`
			`; technically correct to convert this into a "bswap, shr", it's suboptimal. A`
			`; simple shl works better.`

			`define i64 @not_useful_bswap() {`
			`; CHECK-LABEL: not_useful_bswap:`
			`; CHECK-NOT: bswapl`
			`; CHECK: ret`

			`; CHECK64-LABEL: not_useful_bswap:`
			`; CHECK64-NOT: bswapq`
			`; CHECK64: ret`

			`%init = load i8* @var8`
			`%big = zext i8 %init to i64`

			`%hishifted = lshr i64 %big, 8`
			`%loshifted = shl i64 %big, 8`

			`%notswapped = or i64 %hishifted, %loshifted`

			`ret i64 %notswapped`
			`}`

			`; Finally, it is OK to just mask off the shl if we know that the value is zero`
			`; beyond 16 bits anyway. This is a legitimate bswap.`

			`define i64 @finally_useful_bswap() {`
			`; CHECK-LABEL: finally_useful_bswap:`
			`; CHECK: bswapl [[REG:%.*]]`
			`; CHECK: shrl $16, [[REG]]`
			`; CHECK: ret`

			`; CHECK64-LABEL: finally_useful_bswap:`
			`; CHECK64: bswapq [[REG:%.*]]`
			`; CHECK64: shrq $48, [[REG]]`
			`; CHECK64: ret`

			`%init = load i16* @var16`
			`%big = zext i16 %init to i64`

			`%hishifted = lshr i64 %big, 8`
			`%lomasked = and i64 %big, 255`
			`%loshifted = shl i64 %lomasked, 8`

			`%swapped = or i64 %hishifted, %loshifted`

			`ret i64 %swapped`
			`}`