; tail-dup-partial.ll
; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu  -O3 | FileCheck %s

; Function Attrs: uwtable
; When tail-duplicating during placement, we work backward from blocks with
; multiple successors. In this case, the block dup1 gets duplicated into dup2
; and if.then64, and then the block dup2 only gets duplicated into land.lhs.true.

define void @partial_tail_dup(i1 %a1, i1 %a2, i32* %a4, i32* %a5, i8* %a6, i32 %a7) #0 align 2  !prof !1 {
; CHECK-LABEL: partial_tail_dup:
; CHECK:        # %bb.0: # %entry
; CHECK-NEXT:   .p2align 4, 0x90
; CHECK-NEXT:   .LBB0_1: # %for.cond
; CHECK-NEXT:   # =>This Inner Loop Header: Depth=1
; CHECK-NEXT:	  testb	$1, %dil
; CHECK-NEXT:	  je	.LBB0_3
; CHECK-NEXT:   # %bb.2: # %land.lhs.true
; CHECK-NEXT:   # in Loop: Header=BB0_1 Depth=1
; CHECK-NEXT:	  movl	$10, (%rdx)
; CHECK-NEXT:	  movl	$2, (%rcx)
; CHECK-NEXT:	  testl	%r9d, %r9d
; CHECK-NEXT:	  je	.LBB0_1
; CHECK-NEXT:	  jmp	.LBB0_8
; CHECK-NEXT:	  .p2align	4, 0x90
; CHECK-NEXT:   .LBB0_6: # %dup2
; CHECK-NEXT:   # in Loop: Header=BB0_1 Depth=1
; CHECK-NEXT:	  movl	$2, (%rcx)
; CHECK-NEXT:	  testl	%r9d, %r9d
; CHECK-NEXT:	  je	.LBB0_1
; CHECK-NEXT:	  jmp	.LBB0_8
; CHECK-NEXT:    .p2align 4, 0x90
; CHECK-NEXT:  .LBB0_3: # %if.end56
; CHECK-NEXT:    # in Loop: Header=BB0_1 Depth=1
; CHECK-NEXT:    testb $1, %sil
; CHECK-NEXT:    je .LBB0_5
; CHECK-NEXT:  # %bb.4: # %if.then64
; CHECK-NEXT:    # in Loop: Header=BB0_1 Depth=1
; CHECK-NEXT:    movb $1, (%r8)
; CHECK-NEXT:    testl %r9d, %r9d
; CHECK-NEXT:    je .LBB0_1
; CHECK-NEXT:    jmp .LBB0_8
; CHECK-NEXT:  .LBB0_5: # %if.end70
; CHECK-NEXT:    # in Loop: Header=BB0_1 Depth=1
; CHECK-NEXT:    movl $12, (%rdx)
; CHECK-NEXT:    jne .LBB0_6  
; CHECK-NEXT:  .LBB0_8: # %for.end
; CHECK-NEXT:    retq
entry:
  br label %for.cond

for.cond:                                      
  br i1 %a1, label %land.lhs.true, label %if.end56

land.lhs.true:                                   
  store i32 10, i32* %a4, align 8
  br label %dup2

if.end56:                                        
  br i1 %a2, label %if.then64, label %if.end70, !prof !2

if.then64:                                       
  store i8 1, i8* %a6, align 1
  br label %dup1

if.end70:                                        
  store i32 12, i32* %a4, align 8
  br i1 %a2, label %dup2, label %for.end

dup2:                                            
  store i32 2, i32* %a5, align 4
  br label %dup1

dup1:                                            
  %val = load i32, i32* %a4, align 8
  %switch = icmp ult i32 %a7, 1
  br i1 %switch, label %for.cond, label %for.end, !prof !3

for.end:                                         
  ret void
}

; Attribute group #0, referenced by the definition of @partial_tail_dup.
attributes #0 = { uwtable }

; !1: !prof node on @partial_tail_dup -- function entry count of 2.
!1 = !{!"function_entry_count", i64 2}
; !2: branch weights for the conditional branch in %if.end56
;     (5 for the %if.then64 edge, 1 for the %if.end70 edge).
!2 = !{!"branch_weights", i32 5, i32 1}
; !3: branch weights for the conditional branch in %dup1
;     (5 for the back edge to %for.cond, 1 for the exit edge to %for.end).
!3 = !{!"branch_weights", i32 5, i32 1}