; stack-align-memcpy.ll (9.26 KB)
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -stackrealign -mtriple i386-apple-darwin -mcpu=i486 | FileCheck %s

; 88-byte aggregate (22 dwords) that the tests in this file pass byval.
%struct.foo = type { [88 x i8] }

; External callee taking a pointer and a 4-byte-aligned byval %struct.foo.
declare void @bar(i8* nocapture, %struct.foo* align 4 byval) nounwind
; External callee taking a single pointer; test2 and test3 hand it the
; address of their alloca.
declare void @baz(i8*) nounwind

; PR15249
; The function combines a dynamic alloca with -stackrealign (see the RUN
; line), and the expected output sets up %esi as the base pointer
; (`movl %esp, %esi`) and addresses its spill slots through it.
; We can't use rep;movsl here because it clobbers the base pointer in %esi.
; Instead, the 88-byte byval copy is expected to be expanded into individual
; movl loads followed by 22 pushl instructions, plus one push for %dynalloc.
define void @test1(%struct.foo* nocapture %x, i32 %y) nounwind {
; CHECK-LABEL: test1:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    pushl %ebp
; CHECK-NEXT:    movl %esp, %ebp
; CHECK-NEXT:    pushl %ebx
; CHECK-NEXT:    pushl %edi
; CHECK-NEXT:    pushl %esi
; CHECK-NEXT:    andl $-16, %esp
; CHECK-NEXT:    subl $80, %esp
; CHECK-NEXT:    movl %esp, %esi
; CHECK-NEXT:    movl 8(%ebp), %ecx
; CHECK-NEXT:    movl 12(%ebp), %edx
; CHECK-NEXT:    movl %esp, %eax
; CHECK-NEXT:    addl $15, %edx
; CHECK-NEXT:    andl $-16, %edx
; CHECK-NEXT:    subl %edx, %eax
; CHECK-NEXT:    movl %eax, %esp
; CHECK-NEXT:    subl $4, %esp
; CHECK-NEXT:    movl 84(%ecx), %edx
; CHECK-NEXT:    movl %edx, 68(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 80(%ecx), %edi
; CHECK-NEXT:    movl 76(%ecx), %ebx
; CHECK-NEXT:    movl 72(%ecx), %edx
; CHECK-NEXT:    movl %edx, 64(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 68(%ecx), %edx
; CHECK-NEXT:    movl %edx, 60(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 64(%ecx), %edx
; CHECK-NEXT:    movl %edx, 56(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 60(%ecx), %edx
; CHECK-NEXT:    movl %edx, 52(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 56(%ecx), %edx
; CHECK-NEXT:    movl %edx, 48(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 52(%ecx), %edx
; CHECK-NEXT:    movl %edx, 44(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 48(%ecx), %edx
; CHECK-NEXT:    movl %edx, 40(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 44(%ecx), %edx
; CHECK-NEXT:    movl %edx, 36(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 40(%ecx), %edx
; CHECK-NEXT:    movl %edx, 32(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 36(%ecx), %edx
; CHECK-NEXT:    movl %edx, 28(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 32(%ecx), %edx
; CHECK-NEXT:    movl %edx, 24(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 28(%ecx), %edx
; CHECK-NEXT:    movl %edx, 20(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 24(%ecx), %edx
; CHECK-NEXT:    movl %edx, 16(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 20(%ecx), %edx
; CHECK-NEXT:    movl %edx, 12(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 16(%ecx), %edx
; CHECK-NEXT:    movl %edx, 8(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 12(%ecx), %edx
; CHECK-NEXT:    movl %edx, 4(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 8(%ecx), %edx
; CHECK-NEXT:    movl %edx, (%esi) ## 4-byte Spill
; CHECK-NEXT:    movl (%ecx), %edx
; CHECK-NEXT:    movl %edx, 72(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 4(%ecx), %ecx
; CHECK-NEXT:    pushl 68(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl %edi
; CHECK-NEXT:    pushl %ebx
; CHECK-NEXT:    pushl 64(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 60(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 56(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 52(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 48(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 44(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 40(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 36(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 32(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 28(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 24(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 20(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 16(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 12(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 8(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 4(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl (%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl %ecx
; CHECK-NEXT:    pushl 72(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl %eax
; CHECK-NEXT:    calll _bar
; CHECK-NEXT:    leal -12(%ebp), %esp
; CHECK-NEXT:    popl %esi
; CHECK-NEXT:    popl %edi
; CHECK-NEXT:    popl %ebx
; CHECK-NEXT:    popl %ebp
; CHECK-NEXT:    retl
  ; Variable-sized alloca of %y bytes, placed before the byval call.
  %dynalloc = alloca i8, i32 %y, align 1
  ; %x is passed byval, so the 88-byte struct has to be copied for the call.
  call void @bar(i8* %dynalloc, %struct.foo* align 4 byval %x)
  ret void
}

; PR19012
; Also don't clobber %esi if the dynamic alloca comes after the memcpy.
; The byval call to @bar comes first and the dynamic alloca only afterwards,
; yet the expected prologue still sets up %esi as the base pointer
; (`movl %esp, %esi`). The 88-byte copy is therefore expected to be expanded
; into movl loads and 22 pushl instructions rather than rep;movsl.
define void @test2(%struct.foo* nocapture %x, i32 %y, i8* %z) nounwind {
; CHECK-LABEL: test2:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    pushl %ebp
; CHECK-NEXT:    movl %esp, %ebp
; CHECK-NEXT:    pushl %ebx
; CHECK-NEXT:    pushl %edi
; CHECK-NEXT:    pushl %esi
; CHECK-NEXT:    andl $-16, %esp
; CHECK-NEXT:    subl $80, %esp
; CHECK-NEXT:    movl %esp, %esi
; CHECK-NEXT:    movl 12(%ebp), %edi
; CHECK-NEXT:    movl 8(%ebp), %eax
; CHECK-NEXT:    subl $4, %esp
; CHECK-NEXT:    movl 84(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 68(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 80(%eax), %edx
; CHECK-NEXT:    movl 76(%eax), %ebx
; CHECK-NEXT:    movl 72(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 64(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 68(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 60(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 64(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 56(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 60(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 52(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 56(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 48(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 52(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 44(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 48(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 40(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 44(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 36(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 40(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 32(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 36(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 28(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 32(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 24(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 28(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 20(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 24(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 16(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 20(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 12(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 16(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 8(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 12(%eax), %ecx
; CHECK-NEXT:    movl %ecx, 4(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 8(%eax), %ecx
; CHECK-NEXT:    movl %ecx, (%esi) ## 4-byte Spill
; CHECK-NEXT:    movl (%eax), %ecx
; CHECK-NEXT:    movl %ecx, 72(%esi) ## 4-byte Spill
; CHECK-NEXT:    movl 4(%eax), %eax
; CHECK-NEXT:    pushl 68(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl %edx
; CHECK-NEXT:    pushl %ebx
; CHECK-NEXT:    pushl 64(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 60(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 56(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 52(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 48(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 44(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 40(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 36(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 32(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 28(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 24(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 20(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 16(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 12(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 8(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 4(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl (%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl %eax
; CHECK-NEXT:    pushl 72(%esi) ## 4-byte Folded Reload
; CHECK-NEXT:    pushl 16(%ebp)
; CHECK-NEXT:    calll _bar
; CHECK-NEXT:    addl $96, %esp
; CHECK-NEXT:    movl %esp, %eax
; CHECK-NEXT:    addl $15, %edi
; CHECK-NEXT:    andl $-16, %edi
; CHECK-NEXT:    subl %edi, %eax
; CHECK-NEXT:    movl %eax, %esp
; CHECK-NEXT:    subl $12, %esp
; CHECK-NEXT:    pushl %eax
; CHECK-NEXT:    calll _baz
; CHECK-NEXT:    leal -12(%ebp), %esp
; CHECK-NEXT:    popl %esi
; CHECK-NEXT:    popl %edi
; CHECK-NEXT:    popl %ebx
; CHECK-NEXT:    popl %ebp
; CHECK-NEXT:    retl
  ; The byval copy of %x happens first, before any dynamic allocation.
  call void @bar(i8* %z, %struct.foo* align 4 byval %x)
  ; Variable-sized alloca of %y bytes, placed after the byval call.
  %dynalloc = alloca i8, i32 %y, align 1
  call void @baz(i8* %dynalloc)
  ret void
}

; Check that we do use rep movs if we make the alloca static.
; Same shape as test2, but the alloca has a constant size of 8 bytes. The
; expected output does not set up %esi as a base pointer and addresses its
; slots off %esp, so %esi is free to serve as the rep;movsl source. The copy
; is 22 dwords (`movl $22, %ecx`), i.e. the 88 bytes of %struct.foo.
define void @test3(%struct.foo* nocapture %x, i32 %y, i8* %z) nounwind {
; CHECK-LABEL: test3:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    pushl %ebp
; CHECK-NEXT:    movl %esp, %ebp
; CHECK-NEXT:    pushl %edi
; CHECK-NEXT:    pushl %esi
; CHECK-NEXT:    andl $-16, %esp
; CHECK-NEXT:    subl $112, %esp
; CHECK-NEXT:    movl 16(%ebp), %eax
; CHECK-NEXT:    movl 8(%ebp), %esi
; CHECK-NEXT:    leal {{[0-9]+}}(%esp), %edi
; CHECK-NEXT:    movl $22, %ecx
; CHECK-NEXT:    rep;movsl (%esi), %es:(%edi)
; CHECK-NEXT:    movl %eax, (%esp)
; CHECK-NEXT:    calll _bar
; CHECK-NEXT:    leal {{[0-9]+}}(%esp), %eax
; CHECK-NEXT:    movl %eax, (%esp)
; CHECK-NEXT:    calll _baz
; CHECK-NEXT:    leal -8(%ebp), %esp
; CHECK-NEXT:    popl %esi
; CHECK-NEXT:    popl %edi
; CHECK-NEXT:    popl %ebp
; CHECK-NEXT:    retl
  ; The byval copy of %x is the memcpy under test.
  call void @bar(i8* %z, %struct.foo* align 4 byval %x)
  ; Constant-size (8-byte) alloca; %y is intentionally unused here.
  %statalloc = alloca i8, i32 8, align 1
  call void @baz(i8* %statalloc)
  ret void
}