prof-early-if.ll
3.02 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
; RUN: llc -O2 -march=hexagon < %s | FileCheck %s
; Rely on the basic-block name comments generated by llc. Check that the
; conditionally executed store block (b3 below; the "if.then" of the original
; source) was not predicated.
; CHECK: b5
; CHECK: b2
; CHECK-NOT: if{{.*}}memd
; Aggregate types. @f0 only uses them to form GEP addresses: it indexes an
; array of ten %s.0 records and reads fields 12 and 13 of the selected record.
; %s.0 is a struct of i32 arrays plus one array of eight %s.1 records.
%s.0 = type { [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [24 x i32], [3 x i32], [24 x i32], [8 x %s.1], [5 x i32] }
; %s.1 is a pair of i32 values.
%s.1 = type { i32, i32 }
; Globals touched by @f0:
;   @g0 - i64, written once in the exit block b6.
;   @g1 - i32, loaded in b1.
;   @g2 - i32, loaded in b1.
;   @g3 - i8, loaded in b2; its low bit selects between b3 and b4.
@g0 = global i64 0
@g1 = global i32 0
@g2 = global i32 0
@g3 = global i8 0
; Hexagon intrinsics called from @f0. All of them carry attribute group #0.
; S2.cl0 and S2.setbit.r are used in b2 to step the inner-loop value %v7.
declare i32 @llvm.hexagon.S2.cl0(i32) #0
declare i32 @llvm.hexagon.S2.setbit.r(i32, i32) #0
; M2.vmpy2s.s0 and M2.vmac2s.s0 produce the i64 value %v16 in b2.
declare i64 @llvm.hexagon.M2.vmpy2s.s0(i32, i32) #0
declare i64 @llvm.hexagon.M2.vmac2s.s0(i64, i32, i32) #0
; A2.vaddws is called in b3 and A2.vsubws in b4, both on i64 operands.
declare i64 @llvm.hexagon.A2.vaddws(i64, i64) #0
declare i64 @llvm.hexagon.A2.vsubws(i64, i64) #0
; A4.modwrapu is called in b5 with the constant 10 as its second operand.
declare i32 @llvm.hexagon.A4.modwrapu(i32, i32) #0
; @f0 - two nested loops with a conditionally executed i64 store, used as the
; llc input for this test.
;   %a0 - the outer-loop counter %v26 is compared against this value in b5;
;         the function leaves the loop when they are equal.
;   %a1 - i64 pointer; b3 stores the vaddws result through it.
; Control flow:
;   b0 -> b1 (outer loop header) -> b2 (inner loop header)
;   b2 -> b3 or b4; b3 -> b4
;   b4 -> b5 or back to b2
;   b5 -> b6 or back to b1
;   b6 returns.
; NOTE(review): the FileCheck directives at the top of this file match the
; labels b5 and b2 in the llc output, so the block names must not be changed.
define void @f0(i32 %a0, i64* %a1) #1 {
b0:
br label %b1
; Outer loop header.
b1: ; preds = %b5, %b0
; %v0 counts outer iterations starting at 0 (next value %v26 from b5).
%v0 = phi i32 [ 0, %b0 ], [ %v26, %b5 ]
; %v1 is the record index, starting at 0 (next value %v25 from b5).
%v1 = phi i32 [ 0, %b0 ], [ %v25, %b5 ]
%v2 = load i32, i32* @g1, align 4
; NOTE(review): this load claims align 8 although @g2 is declared without an
; explicit alignment - confirm that this is intended.
%v3 = load i32, i32* @g2, align 8
; Initial inner-loop value: bitwise AND of the two globals.
%v4 = and i32 %v3, %v2
br label %b2
; Inner loop header.
b2: ; preds = %b4, %b1
; %v5 and %v6 are i64 values carried around the inner loop, both starting at 0.
%v5 = phi i64 [ %v21, %b4 ], [ 0, %b1 ]
%v6 = phi i64 [ %v22, %b4 ], [ 0, %b1 ]
; %v7 starts at %v4 and is replaced by %v9 on every inner iteration.
%v7 = phi i32 [ %v9, %b4 ], [ %v4, %b1 ]
%v8 = tail call i32 @llvm.hexagon.S2.cl0(i32 %v7)
%v9 = tail call i32 @llvm.hexagon.S2.setbit.r(i32 %v7, i32 %v8)
; Address of record %v1 in a [10 x %s.0] array located at a constant address.
%v10 = getelementptr [10 x %s.0], [10 x %s.0]* inttoptr (i32 -121502345 to [10 x %s.0]*), i32 0, i32 %v1
; Element %v8 of field 12 of that record, multiplied with itself.
%v11 = getelementptr %s.0, %s.0* %v10, i32 0, i32 12, i32 %v8
%v12 = load i32, i32* %v11, align 4
%v13 = tail call i64 @llvm.hexagon.M2.vmpy2s.s0(i32 %v12, i32 %v12)
; Element %v8 of field 13 of that record, fed to vmac2s together with %v13.
%v14 = getelementptr %s.0, %s.0* %v10, i32 0, i32 13, i32 %v8
%v15 = load i32, i32* %v14, align 4
%v16 = tail call i64 @llvm.hexagon.M2.vmac2s.s0(i64 %v13, i32 %v15, i32 %v15)
; Branch on the low bit of @g3: bit clear -> b3 (store), bit set -> b4.
; The !prof !0 weights are 99 for b3 and 1 for b4.
%v17 = load i8, i8* @g3, align 1
%v18 = and i8 %v17, 1
%v19 = icmp eq i8 %v18, 0
br i1 %v19, label %b3, label %b4, !prof !0
; Conditionally executed block: contains the only store inside the loops.
; This is the i64 store the test expects llc not to predicate.
b3: ; preds = %b2
%v20 = tail call i64 @llvm.hexagon.A2.vaddws(i64 %v5, i64 %v16)
store i64 %v20, i64* %a1, align 8
br label %b4
; Join block and inner loop latch.
b4: ; preds = %b3, %b2
; %v21 is %v20 when b3 ran, otherwise the unchanged %v5.
%v21 = phi i64 [ %v20, %b3 ], [ %v5, %b2 ]
; %v22 is only consumed by the %v6 phi in b2.
%v22 = tail call i64 @llvm.hexagon.A2.vsubws(i64 %v6, i64 %v16)
; Leave the inner loop when %v9 is 0; !prof !1 gives weight 10 to the exit
; (b5) and 90 to the back edge (b2).
%v23 = icmp eq i32 %v9, 0
br i1 %v23, label %b5, label %b2, !prof !1
; Outer loop latch.
b5: ; preds = %b4
; Next record index: %v1 + 1 passed through modwrapu with the constant 10.
%v24 = add i32 %v1, 1
%v25 = tail call i32 @llvm.hexagon.A4.modwrapu(i32 %v24, i32 10) #0
; Leave the outer loop when the incremented counter equals %a0; !prof !1 gives
; weight 10 to the exit (b6) and 90 to the back edge (b1).
%v26 = add i32 %v0, 1
%v27 = icmp eq i32 %v26, %a0
br i1 %v27, label %b6, label %b1, !prof !1
; Exit block: store the last %v16 computed in b2 to @g0 and return.
b6: ; preds = %b5
store i64 %v16, i64* @g0, align 8
ret void
}
; Attribute group #0 is attached to every intrinsic declaration in this file
; and to the modwrapu call site in b5.
attributes #0 = { nounwind readnone }
; Attribute group #1 is attached to the definition of @f0.
attributes #1 = { nounwind }
; Branch weights, listed in the order of the branch's successors.
; !0 annotates the branch in b2: weight 99 for b3, weight 1 for b4.
!0 = !{!"branch_weights", i32 99, i32 1}
; !1 annotates the loop branches in b4 and b5: weight 10 for the first
; successor (loop exit), weight 90 for the second (back edge).
!1 = !{!"branch_weights", i32 10, i32 90}