PartialInlineHighCost.ll
3.51 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
; The outlined region has high frequency and the outlining
; call sequence is expensive (input, output, multiple exit etc)
; RUN: opt < %s -partial-inliner -max-num-inline-blocks=2 -S | FileCheck %s
; RUN: opt < %s -passes=partial-inliner -max-num-inline-blocks=2 -S | FileCheck %s
; RUN: opt < %s -partial-inliner -skip-partial-inlining-cost-analysis -max-num-inline-blocks=2 -S | FileCheck --check-prefix=NOCOST %s
; RUN: opt < %s -passes=partial-inliner -skip-partial-inlining-cost-analysis -max-num-inline-blocks=2 -S | FileCheck --check-prefix=NOCOST %s
; Function Attrs: nounwind
define i32 @bar_hot_outline_region(i32 %arg) local_unnamed_addr #0 {
bb:
%tmp = icmp slt i32 %arg, 0
br i1 %tmp, label %bb1, label %bb16, !prof !1
bb1: ; preds = %bb
%tmp2 = tail call i32 (...) @foo() #0
%tmp3 = tail call i32 (...) @foo() #0
%tmp4 = tail call i32 (...) @foo() #0
%tmp5 = tail call i32 (...) @foo() #0
%tmp6 = tail call i32 (...) @foo() #0
%tmp7 = tail call i32 (...) @foo() #0
%tmp8 = add nsw i32 %arg, 1
%tmp9 = tail call i32 @goo(i32 %tmp8) #0
%tmp10 = tail call i32 (...) @foo() #0
%tmp11 = icmp eq i32 %tmp10, 0
br i1 %tmp11, label %bb12, label %bb16
bb12: ; preds = %bb1
%tmp13 = tail call i32 (...) @foo() #0
%tmp14 = icmp eq i32 %tmp13, 0
%tmp15 = select i1 %tmp14, i32 0, i32 3
br label %bb16
bb16: ; preds = %bb12, %bb1, %bb
%tmp17 = phi i32 [ 2, %bb1 ], [ %tmp15, %bb12 ], [ 0, %bb ]
ret i32 %tmp17
}
define i32 @bar_cold_outline_region(i32 %arg) local_unnamed_addr #0 {
bb:
%tmp = icmp slt i32 %arg, 0
br i1 %tmp, label %bb1, label %bb16, !prof !2
bb1: ; preds = %bb
%tmp2 = tail call i32 (...) @foo() #0
%tmp3 = tail call i32 (...) @foo() #0
%tmp4 = tail call i32 (...) @foo() #0
%tmp5 = tail call i32 (...) @foo() #0
%tmp6 = tail call i32 (...) @foo() #0
%tmp7 = tail call i32 (...) @foo() #0
%tmp8 = add nsw i32 %arg, 1
%tmp9 = tail call i32 @goo(i32 %tmp8) #0
%tmp10 = tail call i32 (...) @foo() #0
%tmp11 = icmp eq i32 %tmp10, 0
br i1 %tmp11, label %bb12, label %bb16
bb12: ; preds = %bb1
%tmp13 = tail call i32 (...) @foo() #0
%tmp14 = icmp eq i32 %tmp13, 0
%tmp15 = select i1 %tmp14, i32 0, i32 3
br label %bb16
bb16: ; preds = %bb12, %bb1, %bb
%tmp17 = phi i32 [ 2, %bb1 ], [ %tmp15, %bb12 ], [ 0, %bb ]
ret i32 %tmp17
}
; Function Attrs: nounwind
declare i32 @foo(...) local_unnamed_addr #0
; Function Attrs: nounwind
declare i32 @goo(i32) local_unnamed_addr #0
; Function Attrs: nounwind
define i32 @dummy_caller(i32 %arg) local_unnamed_addr #0 {
bb:
; CHECK-LABEL: @dummy_caller
; CHECK-NOT: br i1
; CHECK-NOT: call{{.*}}bar_hot_outline_region.
; NOCOST-LABEL: @dummy_caller
; NOCOST: br i1
; NOCOST: call{{.*}}bar_hot_outline_region.
%tmp = tail call i32 @bar_hot_outline_region(i32 %arg)
ret i32 %tmp
}
define i32 @dummy_caller2(i32 %arg) local_unnamed_addr #0 {
bb:
; CHECK-LABEL: @dummy_caller2
; CHECK: br i1
; CHECK: call{{.*}}bar_cold_outline_region.
; NOCOST-LABEL: @dummy_caller2
; NOCOST: br i1
; NOCOST: call{{.*}}bar_cold_outline_region.
%tmp = tail call i32 @bar_cold_outline_region(i32 %arg)
ret i32 %tmp
}
attributes #0 = { nounwind }
!llvm.ident = !{!0}
!0 = !{!"clang version 5.0.0 (trunk 301898)"}
!1 = !{!"branch_weights", i32 2000, i32 1}
!2 = !{!"branch_weights", i32 1, i32 100}