ppc64-align-long-double.ll 2.3 KB
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -verify-machineinstrs -mcpu=pwr7 -O2 -fast-isel=false -mattr=-vsx < %s | FileCheck %s
; RUN: llc -verify-machineinstrs -mcpu=pwr7 -O2 -fast-isel=false -mattr=+vsx < %s | FileCheck -check-prefix=CHECK-VSX %s
; RUN: llc -verify-machineinstrs -mcpu=pwr9 -O2 -fast-isel=false -mattr=+vsx < %s | FileCheck -check-prefix=CHECK-P9 %s

; Verify internal alignment of long double in a struct.  The double
; argument comes in GPR3; GPR4 is skipped; GPRs 5 and 6 contain
; the long double.  Check that these are stored to proper locations
; in the parameter save area and loaded from there for return in FPR1/2.

target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-f128:128:128-v128:128:128-n32:64"
target triple = "powerpc64-unknown-linux-gnu"

%struct.S = type { double, ppc_fp128 }

; The additional stores are caused because we forward the value in the
; store->load->bitcast path to make a store and bitcast of the same
; value. Since the target does bitcast through memory and we no longer
; remember the address we need to do the store in a fresh local
; address.
define ppc_fp128 @test(%struct.S* byval %x) nounwind {
; CHECK-LABEL: test:
; CHECK:       # %bb.0: # %entry
; CHECK-NEXT:    std 5, -16(1)
; CHECK-NEXT:    std 6, -8(1)
; CHECK-NEXT:    lfd 1, -16(1)
; CHECK-NEXT:    lfd 2, -8(1)
; CHECK-NEXT:    std 6, 72(1)
; CHECK-NEXT:    std 5, 64(1)
; CHECK-NEXT:    std 3, 48(1)
; CHECK-NEXT:    std 4, 56(1)
; CHECK-NEXT:    blr
;
; CHECK-VSX-LABEL: test:
; CHECK-VSX:       # %bb.0: # %entry
; CHECK-VSX-NEXT:    std 3, 48(1)
; CHECK-VSX-NEXT:    std 6, 72(1)
; CHECK-VSX-NEXT:    std 5, 64(1)
; CHECK-VSX-NEXT:    std 4, 56(1)
; CHECK-VSX-NEXT:    std 5, -16(1)
; CHECK-VSX-NEXT:    std 6, -8(1)
; CHECK-VSX-NEXT:    lfd 1, -16(1)
; CHECK-VSX-NEXT:    lfd 2, -8(1)
; CHECK-VSX-NEXT:    blr
;
; CHECK-P9-LABEL: test:
; CHECK-P9:       # %bb.0: # %entry
; CHECK-P9-NEXT:    mtfprd 1, 5
; CHECK-P9-NEXT:    mtfprd 2, 6
; CHECK-P9-NEXT:    std 6, 72(1)
; CHECK-P9-NEXT:    std 5, 64(1)
; CHECK-P9-NEXT:    std 3, 48(1)
; CHECK-P9-NEXT:    std 4, 56(1)
; CHECK-P9-NEXT:    blr
entry:
  %b = getelementptr inbounds %struct.S, %struct.S* %x, i32 0, i32 1
  %0 = load ppc_fp128, ppc_fp128* %b, align 16
  ret ppc_fp128 %0
}