; pr27078.ll
; RUN: llc -verify-machineinstrs -mtriple=powerpc64-linux-gnu -mcpu=pwr8 -mattr=+vsx < %s | FileCheck %s
; @bar reinterprets %p and %q as pointers to <12 x float>, loads both vectors
; with 16-byte alignment, subtracts the %p vector from the %q vector, and
; returns lanes 0, 3, 6 and 9 of the difference as a <4 x float>.
define <4 x float> @bar(float* %p, float* %q) {
  ; View each scalar pointer as a pointer to a 12-element float vector.
  %p.vec.ptr = bitcast float* %p to <12 x float>*
  %q.vec.ptr = bitcast float* %q to <12 x float>*

  ; Load the two wide vectors (%p first, then %q).
  %p.vec = load <12 x float>, <12 x float>* %p.vec.ptr, align 16
  %q.vec = load <12 x float>, <12 x float>* %q.vec.ptr, align 16

  ; Element-wise q - p.
  %diff = fsub <12 x float> %q.vec, %p.vec

  ; Keep every third lane (0, 3, 6, 9); the second shuffle operand is unused.
  %every.third = shufflevector <12 x float> %diff, <12 x float> undef, <4 x i32> <i32 0, i32 3, i32 6, i32 9>
  ret <4 x float> %every.third

; Expected instruction sequence: one xxsldwi, then vmrghw and vmrglw in either
; order, then three consecutive xxsldwi immediately followed by the return.
; CHECK: xxsldwi
; CHECK-DAG: vmrghw
; CHECK-DAG: vmrglw
; CHECK-NEXT: xxsldwi
; CHECK-NEXT: xxsldwi
; CHECK-NEXT: xxsldwi
; CHECK-NEXT: blr
}