[llvm] r322828 - A new test to demostrate the current SHLD/SHRD code generation.

Andrew V. Tischenko via llvm-commits llvm-commits at lists.llvm.org
Thu Jan 18 02:40:48 PST 2018


Author: avt77
Date: Thu Jan 18 02:40:48 2018
New Revision: 322828

URL: http://llvm.org/viewvc/llvm-project?rev=322828&view=rev
Log:
A new test to demostrate the current SHLD/SHRD code generation.

Added:
    llvm/trunk/test/CodeGen/X86/schedule-x86-64-shld.ll

Added: llvm/trunk/test/CodeGen/X86/schedule-x86-64-shld.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/X86/schedule-x86-64-shld.ll?rev=322828&view=auto
==============================================================================
--- llvm/trunk/test/CodeGen/X86/schedule-x86-64-shld.ll (added)
+++ llvm/trunk/test/CodeGen/X86/schedule-x86-64-shld.ll Thu Jan 18 02:40:48 2018
@@ -0,0 +1,464 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc < %s -mtriple=x86_64-unknown-unknown -print-schedule -mcpu=x86-64 | FileCheck %s --check-prefix=CHECK --check-prefix=GENERIC
+; RUN: llc < %s -mtriple=x86_64-unknown-unknown -print-schedule -mcpu=btver2 | FileCheck %s --check-prefix=CHECK --check-prefix=BTVER2
+; RUN: llc < %s -mtriple=x86_64-unknown-unknown -print-schedule -mcpu=bdver1 | FileCheck %s --check-prefix=CHECK --check-prefix=BDVER1
+
+
+; uint64_t lshift10(uint64_t a, uint64_t b)
+; {
+;     return (a << 10) | (b >> 54);
+; }
+
+define i64 @lshift10_optsize(i64 %a, i64 %b) nounwind readnone optsize {
+; GENERIC-LABEL: lshift10_optsize:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    shldq $10, %rsi, %rdi # sched: [2:0.67]
+; GENERIC-NEXT:    movq %rdi, %rax # sched: [1:0.33]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: lshift10_optsize:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    shldq $10, %rsi, %rdi # sched: [3:3.00]
+; BTVER2-NEXT:    movq %rdi, %rax # sched: [1:0.50]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: lshift10_optsize:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    shldq $10, %rsi, %rdi
+; BDVER1-NEXT:    movq %rdi, %rax
+; BDVER1-NEXT:    retq
+entry:
+  %shl = shl i64 %a, 10
+  %shr = lshr i64 %b, 54
+  %or = or i64 %shr, %shl
+  ret i64 %or
+}
+
+define i64 @lshift10(i64 %a, i64 %b) nounwind readnone {
+; GENERIC-LABEL: lshift10:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    shldq $10, %rsi, %rdi # sched: [2:0.67]
+; GENERIC-NEXT:    movq %rdi, %rax # sched: [1:0.33]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: lshift10:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    shlq $10, %rdi # sched: [1:0.50]
+; BTVER2-NEXT:    shrq $54, %rsi # sched: [1:0.50]
+; BTVER2-NEXT:    leaq (%rsi,%rdi), %rax # sched: [1:0.50]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: lshift10:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    shlq $10, %rdi
+; BDVER1-NEXT:    shrq $54, %rsi
+; BDVER1-NEXT:    leaq (%rsi,%rdi), %rax
+; BDVER1-NEXT:    retq
+entry:
+  %shl = shl i64 %a, 10
+  %shr = lshr i64 %b, 54
+  %or = or i64 %shr, %shl
+  ret i64 %or
+}
+
+; uint64_t rshift10(uint64_t a, uint64_t b)
+; {
+;     return (a >> 62) | (b << 2);
+; }
+
+; Should be done via shld
+define i64 @rshift10_optsize(i64 %a, i64 %b) nounwind readnone optsize {
+; GENERIC-LABEL: rshift10_optsize:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    shrdq $62, %rsi, %rdi # sched: [2:0.67]
+; GENERIC-NEXT:    movq %rdi, %rax # sched: [1:0.33]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: rshift10_optsize:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    shrdq $62, %rsi, %rdi # sched: [3:3.00]
+; BTVER2-NEXT:    movq %rdi, %rax # sched: [1:0.50]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: rshift10_optsize:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    shrdq $62, %rsi, %rdi
+; BDVER1-NEXT:    movq %rdi, %rax
+; BDVER1-NEXT:    retq
+entry:
+  %shl = lshr i64 %a, 62
+  %shr = shl i64 %b, 2
+  %or = or i64 %shr, %shl
+  ret i64 %or
+}
+
+; Should be done via lea (x,y,4),z
+define i64 @rshift10(i64 %a, i64 %b) nounwind readnone {
+; GENERIC-LABEL: rshift10:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    shrdq $62, %rsi, %rdi # sched: [2:0.67]
+; GENERIC-NEXT:    movq %rdi, %rax # sched: [1:0.33]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: rshift10:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    shrq $62, %rdi # sched: [1:0.50]
+; BTVER2-NEXT:    leaq (%rdi,%rsi,4), %rax # sched: [1:0.50]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: rshift10:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    shrq $62, %rdi
+; BDVER1-NEXT:    leaq (%rdi,%rsi,4), %rax
+; BDVER1-NEXT:    retq
+entry:
+  %shl = lshr i64 %a, 62
+  %shr = shl i64 %b, 2
+  %or = or i64 %shr, %shl
+  ret i64 %or
+}
+
+;uint64_t lshift(uint64_t a, uint64_t b, uint64_t c)
+;{
+;    return (a << c) | (b >> (64-c));
+;}
+
+define i64 @lshift_cl_optsize(i64 %a, i64 %b, i64 %c) nounwind readnone optsize {
+; GENERIC-LABEL: lshift_cl_optsize:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    movl %edx, %ecx # sched: [1:0.33]
+; GENERIC-NEXT:    shldq %cl, %rsi, %rdi # sched: [4:1.50]
+; GENERIC-NEXT:    movq %rdi, %rax # sched: [1:0.33]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: lshift_cl_optsize:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    movl %edx, %ecx # sched: [1:0.50]
+; BTVER2-NEXT:    shldq %cl, %rsi, %rdi # sched: [4:4.00]
+; BTVER2-NEXT:    movq %rdi, %rax # sched: [1:0.50]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: lshift_cl_optsize:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    movl %edx, %ecx
+; BDVER1-NEXT:    shldq %cl, %rsi, %rdi
+; BDVER1-NEXT:    movq %rdi, %rax
+; BDVER1-NEXT:    retq
+entry:
+  %shl = shl i64 %a, %c
+  %sub = sub nsw i64 64, %c
+  %shr = lshr i64 %b, %sub
+  %or = or i64 %shr, %shl
+  ret i64 %or
+}
+
+define i64 @lshift_cl(i64 %a, i64 %b, i64 %c) nounwind readnone {
+; GENERIC-LABEL: lshift_cl:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    movl %edx, %ecx # sched: [1:0.33]
+; GENERIC-NEXT:    shldq %cl, %rsi, %rdi # sched: [4:1.50]
+; GENERIC-NEXT:    movq %rdi, %rax # sched: [1:0.33]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: lshift_cl:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    movl %edx, %ecx # sched: [1:0.50]
+; BTVER2-NEXT:    shlq %cl, %rdi # sched: [1:0.50]
+; BTVER2-NEXT:    movl $64, %ecx # sched: [1:0.50]
+; BTVER2-NEXT:    subl %edx, %ecx # sched: [1:0.50]
+; BTVER2-NEXT:    # kill: def %cl killed %cl killed %ecx
+; BTVER2-NEXT:    shrq %cl, %rsi # sched: [1:0.50]
+; BTVER2-NEXT:    orq %rdi, %rsi # sched: [1:0.50]
+; BTVER2-NEXT:    movq %rsi, %rax # sched: [1:0.50]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: lshift_cl:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    movl %edx, %ecx
+; BDVER1-NEXT:    shlq %cl, %rdi
+; BDVER1-NEXT:    movl $64, %ecx
+; BDVER1-NEXT:    subl %edx, %ecx
+; BDVER1-NEXT:    # kill: def %cl killed %cl killed %ecx
+; BDVER1-NEXT:    shrq %cl, %rsi
+; BDVER1-NEXT:    orq %rdi, %rsi
+; BDVER1-NEXT:    movq %rsi, %rax
+; BDVER1-NEXT:    retq
+entry:
+  %shl = shl i64 %a, %c
+  %sub = sub nsw i64 64, %c
+  %shr = lshr i64 %b, %sub
+  %or = or i64 %shr, %shl
+  ret i64 %or
+}
+
+
+;uint64_t rshift(uint64_t a, uint64_t b, int c)
+;{
+;    return (a >> c) | (b << (64-c));
+;}
+
+define i64 @rshift_cl_optsize(i64 %a, i64 %b, i64 %c) nounwind readnone optsize {
+; GENERIC-LABEL: rshift_cl_optsize:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    movl %edx, %ecx # sched: [1:0.33]
+; GENERIC-NEXT:    shrdq %cl, %rsi, %rdi # sched: [4:1.50]
+; GENERIC-NEXT:    movq %rdi, %rax # sched: [1:0.33]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: rshift_cl_optsize:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    movl %edx, %ecx # sched: [1:0.50]
+; BTVER2-NEXT:    shrdq %cl, %rsi, %rdi # sched: [4:4.00]
+; BTVER2-NEXT:    movq %rdi, %rax # sched: [1:0.50]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: rshift_cl_optsize:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    movl %edx, %ecx
+; BDVER1-NEXT:    shrdq %cl, %rsi, %rdi
+; BDVER1-NEXT:    movq %rdi, %rax
+; BDVER1-NEXT:    retq
+entry:
+  %shr = lshr i64 %a, %c
+  %sub = sub nsw i64 64, %c
+  %shl = shl i64 %b, %sub
+  %or = or i64 %shr, %shl
+  ret i64 %or
+}
+
+define i64 @rshift_cl(i64 %a, i64 %b, i64 %c) nounwind readnone {
+; GENERIC-LABEL: rshift_cl:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    movl %edx, %ecx # sched: [1:0.33]
+; GENERIC-NEXT:    shrdq %cl, %rsi, %rdi # sched: [4:1.50]
+; GENERIC-NEXT:    movq %rdi, %rax # sched: [1:0.33]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: rshift_cl:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    movl %edx, %ecx # sched: [1:0.50]
+; BTVER2-NEXT:    shrq %cl, %rdi # sched: [1:0.50]
+; BTVER2-NEXT:    movl $64, %ecx # sched: [1:0.50]
+; BTVER2-NEXT:    subl %edx, %ecx # sched: [1:0.50]
+; BTVER2-NEXT:    # kill: def %cl killed %cl killed %ecx
+; BTVER2-NEXT:    shlq %cl, %rsi # sched: [1:0.50]
+; BTVER2-NEXT:    orq %rdi, %rsi # sched: [1:0.50]
+; BTVER2-NEXT:    movq %rsi, %rax # sched: [1:0.50]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: rshift_cl:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    movl %edx, %ecx
+; BDVER1-NEXT:    shrq %cl, %rdi
+; BDVER1-NEXT:    movl $64, %ecx
+; BDVER1-NEXT:    subl %edx, %ecx
+; BDVER1-NEXT:    # kill: def %cl killed %cl killed %ecx
+; BDVER1-NEXT:    shlq %cl, %rsi
+; BDVER1-NEXT:    orq %rdi, %rsi
+; BDVER1-NEXT:    movq %rsi, %rax
+; BDVER1-NEXT:    retq
+entry:
+  %shr = lshr i64 %a, %c
+  %sub = sub nsw i64 64, %c
+  %shl = shl i64 %b, %sub
+  %or = or i64 %shr, %shl
+  ret i64 %or
+}
+
+; extern uint64_t x;
+;void lshift(uint64_t a, uint64_t b, uint_64_t c)
+;{
+;    x = (x << c) | (a >> (64-c));
+;}
+ at x = global i64 0, align 4
+
+define void @lshift_mem_cl_optsize(i64 %a, i64 %c) nounwind readnone optsize {
+; GENERIC-LABEL: lshift_mem_cl_optsize:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    movl %esi, %ecx # sched: [1:0.33]
+; GENERIC-NEXT:    shldq %cl, %rdi, {{.*}}(%rip) # sched: [10:1.50]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: lshift_mem_cl_optsize:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    movl %esi, %ecx # sched: [1:0.50]
+; BTVER2-NEXT:    shldq %cl, %rdi, {{.*}}(%rip) # sched: [9:11.00]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: lshift_mem_cl_optsize:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    movl %esi, %ecx
+; BDVER1-NEXT:    shldq %cl, %rdi, {{.*}}(%rip)
+; BDVER1-NEXT:    retq
+entry:
+  %b = load i64, i64* @x
+  %shl = shl i64 %b, %c
+  %sub = sub nsw i64 64, %c
+  %shr = lshr i64 %a, %sub
+  %or = or i64 %shl, %shr
+  store i64 %or, i64* @x
+  ret void
+}
+
+define void @lshift_mem_cl(i64 %a, i64 %c) nounwind readnone {
+; GENERIC-LABEL: lshift_mem_cl:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    movl %esi, %ecx # sched: [1:0.33]
+; GENERIC-NEXT:    shldq %cl, %rdi, {{.*}}(%rip) # sched: [10:1.50]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: lshift_mem_cl:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    movq {{.*}}(%rip), %rax # sched: [5:1.00]
+; BTVER2-NEXT:    movl %esi, %ecx # sched: [1:0.50]
+; BTVER2-NEXT:    shlq %cl, %rax # sched: [1:0.50]
+; BTVER2-NEXT:    movl $64, %ecx # sched: [1:0.50]
+; BTVER2-NEXT:    subl %esi, %ecx # sched: [1:0.50]
+; BTVER2-NEXT:    # kill: def %cl killed %cl killed %ecx
+; BTVER2-NEXT:    shrq %cl, %rdi # sched: [1:0.50]
+; BTVER2-NEXT:    orq %rax, %rdi # sched: [1:0.50]
+; BTVER2-NEXT:    movq %rdi, {{.*}}(%rip) # sched: [1:1.00]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: lshift_mem_cl:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    movq {{.*}}(%rip), %rax
+; BDVER1-NEXT:    movl %esi, %ecx
+; BDVER1-NEXT:    shlq %cl, %rax
+; BDVER1-NEXT:    movl $64, %ecx
+; BDVER1-NEXT:    subl %esi, %ecx
+; BDVER1-NEXT:    # kill: def %cl killed %cl killed %ecx
+; BDVER1-NEXT:    shrq %cl, %rdi
+; BDVER1-NEXT:    orq %rax, %rdi
+; BDVER1-NEXT:    movq %rdi, {{.*}}(%rip)
+; BDVER1-NEXT:    retq
+entry:
+  %b = load i64, i64* @x
+  %shl = shl i64 %b, %c
+  %sub = sub nsw i64 64, %c
+  %shr = lshr i64 %a, %sub
+  %or = or i64 %shl, %shr
+  store i64 %or, i64* @x
+  ret void
+}
+
+define void @lshift_mem(i64 %a) nounwind readnone {
+; GENERIC-LABEL: lshift_mem:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    shldq $10, %rdi, {{.*}}(%rip) # sched: [8:1.00]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: lshift_mem:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    movq {{.*}}(%rip), %rax # sched: [5:1.00]
+; BTVER2-NEXT:    shrq $54, %rdi # sched: [1:0.50]
+; BTVER2-NEXT:    shlq $10, %rax # sched: [1:0.50]
+; BTVER2-NEXT:    orq %rax, %rdi # sched: [1:0.50]
+; BTVER2-NEXT:    movq %rdi, {{.*}}(%rip) # sched: [1:1.00]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: lshift_mem:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    movq {{.*}}(%rip), %rax
+; BDVER1-NEXT:    shlq $10, %rax
+; BDVER1-NEXT:    shrq $54, %rdi
+; BDVER1-NEXT:    orq %rax, %rdi
+; BDVER1-NEXT:    movq %rdi, {{.*}}(%rip)
+; BDVER1-NEXT:    retq
+entry:
+  %b = load i64, i64* @x
+  %shl = shl i64 %b, 10
+  %shr = lshr i64 %a, 54
+  %or = or i64 %shr, %shl
+  store i64 %or, i64* @x
+  ret void
+}
+
+define void @lshift_mem_optsize(i64 %a) nounwind readnone optsize {
+; GENERIC-LABEL: lshift_mem_optsize:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    shldq $10, %rdi, {{.*}}(%rip) # sched: [8:1.00]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: lshift_mem_optsize:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    shldq $10, %rdi, {{.*}}(%rip) # sched: [9:11.00]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: lshift_mem_optsize:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    shldq $10, %rdi, {{.*}}(%rip)
+; BDVER1-NEXT:    retq
+entry:
+  %b = load i64, i64* @x
+  %shl = shl i64 %b, 10
+  %shr = lshr i64 %a, 54
+  %or = or i64 %shr, %shl
+  store i64 %or, i64* @x
+  ret void
+}
+
+define void @lshift_mem_b(i64 %b) nounwind readnone {
+; GENERIC-LABEL: lshift_mem_b:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    movq {{.*}}(%rip), %rax # sched: [5:0.50]
+; GENERIC-NEXT:    shrdq $54, %rdi, %rax # sched: [2:0.67]
+; GENERIC-NEXT:    movq %rax, {{.*}}(%rip) # sched: [5:1.00]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: lshift_mem_b:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    movq {{.*}}(%rip), %rax # sched: [5:1.00]
+; BTVER2-NEXT:    shlq $10, %rdi # sched: [1:0.50]
+; BTVER2-NEXT:    shrq $54, %rax # sched: [1:0.50]
+; BTVER2-NEXT:    orq %rdi, %rax # sched: [1:0.50]
+; BTVER2-NEXT:    movq %rax, {{.*}}(%rip) # sched: [1:1.00]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: lshift_mem_b:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    movq {{.*}}(%rip), %rax
+; BDVER1-NEXT:    shlq $10, %rdi
+; BDVER1-NEXT:    shrq $54, %rax
+; BDVER1-NEXT:    orq %rdi, %rax
+; BDVER1-NEXT:    movq %rax, {{.*}}(%rip)
+; BDVER1-NEXT:    retq
+entry:
+  %a = load i64, i64* @x
+  %shl = shl i64 %b, 10
+  %shr = lshr i64 %a, 54
+  %or = or i64 %shr, %shl
+  store i64 %or, i64* @x
+  ret void
+}
+
+define void @lshift_mem_b_optsize(i64 %b) nounwind readnone optsize {
+; GENERIC-LABEL: lshift_mem_b_optsize:
+; GENERIC:       # %bb.0: # %entry
+; GENERIC-NEXT:    movq {{.*}}(%rip), %rax # sched: [5:0.50]
+; GENERIC-NEXT:    shrdq $54, %rdi, %rax # sched: [2:0.67]
+; GENERIC-NEXT:    movq %rax, {{.*}}(%rip) # sched: [5:1.00]
+; GENERIC-NEXT:    retq # sched: [1:1.00]
+;
+; BTVER2-LABEL: lshift_mem_b_optsize:
+; BTVER2:       # %bb.0: # %entry
+; BTVER2-NEXT:    movq {{.*}}(%rip), %rax # sched: [5:1.00]
+; BTVER2-NEXT:    shrdq $54, %rdi, %rax # sched: [3:3.00]
+; BTVER2-NEXT:    movq %rax, {{.*}}(%rip) # sched: [1:1.00]
+; BTVER2-NEXT:    retq # sched: [4:1.00]
+;
+; BDVER1-LABEL: lshift_mem_b_optsize:
+; BDVER1:       # %bb.0: # %entry
+; BDVER1-NEXT:    movq {{.*}}(%rip), %rax
+; BDVER1-NEXT:    shrdq $54, %rdi, %rax
+; BDVER1-NEXT:    movq %rax, {{.*}}(%rip)
+; BDVER1-NEXT:    retq
+entry:
+  %a = load i64, i64* @x
+  %shl = shl i64 %b, 10
+  %shr = lshr i64 %a, 54
+  %or = or i64 %shr, %shl
+  store i64 %or, i64* @x
+  ret void
+}
+




More information about the llvm-commits mailing list