diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp index 951d3ded99d..07c83e8b294 100644 --- a/lib/Target/X86/X86ISelLowering.cpp +++ b/lib/Target/X86/X86ISelLowering.cpp @@ -505,7 +505,9 @@ void X86TargetLowering::resetOperationActions() { } setOperationAction(ISD::READCYCLECOUNTER , MVT::i64 , Custom); - setOperationAction(ISD::BSWAP , MVT::i16 , Expand); + + if (!Subtarget->hasMOVBE()) + setOperationAction(ISD::BSWAP , MVT::i16 , Expand); // These should be promoted to a larger select which is supported. setOperationAction(ISD::SELECT , MVT::i1 , Promote); diff --git a/lib/Target/X86/X86InstrCompiler.td b/lib/Target/X86/X86InstrCompiler.td index 8446c2cfb90..a8aff44d06c 100644 --- a/lib/Target/X86/X86InstrCompiler.td +++ b/lib/Target/X86/X86InstrCompiler.td @@ -1839,3 +1839,9 @@ def : Pat<(cttz_zero_undef GR64:$src), (BSF64rr GR64:$src)>; def : Pat<(cttz_zero_undef (loadi16 addr:$src)), (BSF16rm addr:$src)>; def : Pat<(cttz_zero_undef (loadi32 addr:$src)), (BSF32rm addr:$src)>; def : Pat<(cttz_zero_undef (loadi64 addr:$src)), (BSF64rm addr:$src)>; + +// When HasMOVBE is enabled it is possible to get a non-legalized +// register-register 16 bit bswap. This maps it to a ROL instruction. +let Predicates = [HasMOVBE] in { + def : Pat<(bswap GR16:$src), (ROL16ri GR16:$src, (i8 8))>; +} diff --git a/test/CodeGen/X86/movbe.ll b/test/CodeGen/X86/movbe.ll index 3f459be70d2..e248410b202 100644 --- a/test/CodeGen/X86/movbe.ll +++ b/test/CodeGen/X86/movbe.ll @@ -1,45 +1,66 @@ ; RUN: llc -mtriple=x86_64-linux -mcpu=atom < %s | FileCheck %s ; RUN: llc -mtriple=x86_64-linux -mcpu=slm < %s | FileCheck %s -check-prefix=SLM +declare i16 @llvm.bswap.i16(i16) nounwind readnone declare i32 @llvm.bswap.i32(i32) nounwind readnone declare i64 @llvm.bswap.i64(i64) nounwind readnone -define void @test1(i32* nocapture %x, i32 %y) nounwind { +define void @test1(i16* nocapture %x, i16 %y) nounwind { + %bswap = call i16 @llvm.bswap.i16(i16 %y) + store i16 %bswap, i16* %x, align 2 + ret void +; CHECK-LABEL: test1: +; CHECK: movbew %si, (%rdi) +; SLM-LABEL: test1: +; SLM: movbew %si, (%rdi) +} + +define i16 @test2(i16* %x) nounwind { + %load = load i16* %x, align 2 + %bswap = call i16 @llvm.bswap.i16(i16 %load) + ret i16 %bswap +; CHECK-LABEL: test2: +; CHECK: movbew (%rdi), %ax +; SLM-LABEL: test2: +; SLM: movbew (%rdi), %ax +} + +define void @test3(i32* nocapture %x, i32 %y) nounwind { %bswap = call i32 @llvm.bswap.i32(i32 %y) store i32 %bswap, i32* %x, align 4 ret void -; CHECK-LABEL: test1: +; CHECK-LABEL: test3: ; CHECK: movbel %esi, (%rdi) -; SLM-LABEL: test1: +; SLM-LABEL: test3: ; SLM: movbel %esi, (%rdi) } -define i32 @test2(i32* %x) nounwind { +define i32 @test4(i32* %x) nounwind { %load = load i32* %x, align 4 %bswap = call i32 @llvm.bswap.i32(i32 %load) ret i32 %bswap -; CHECK-LABEL: test2: +; CHECK-LABEL: test4: ; CHECK: movbel (%rdi), %eax -; SLM-LABEL: test2: +; SLM-LABEL: test4: ; SLM: movbel (%rdi), %eax } -define void @test3(i64* %x, i64 %y) nounwind { +define void @test5(i64* %x, i64 %y) nounwind { %bswap = call i64 @llvm.bswap.i64(i64 %y) store i64 %bswap, i64* %x, align 8 ret void -; CHECK-LABEL: test3: +; CHECK-LABEL: test5: ; CHECK: movbeq %rsi, (%rdi) -; SLM-LABEL: test3: +; SLM-LABEL: test5: ; SLM: movbeq %rsi, (%rdi) } -define i64 @test4(i64* %x) nounwind { +define i64 @test6(i64* %x) nounwind { %load = load i64* %x, align 8 %bswap = call i64 @llvm.bswap.i64(i64 %load) ret i64 %bswap -; CHECK-LABEL: test4: +; CHECK-LABEL: test6: ; CHECK: movbeq (%rdi), %rax -; SLM-LABEL: test4: +; SLM-LABEL: test6: ; SLM: movbeq (%rdi), %rax }