; nary-gep.ll
; The two run lines below exercise the same input two ways: once with the
; -nary-reassociate and -early-cse flags in a single opt process, and once
; with -passes='nary-reassociate' piped into a separate opt -early-cse.
; Both outputs are verified against the same FileCheck patterns in this file.
; RUN: opt < %s -nary-reassociate -early-cse -earlycse-debug-hash -S | FileCheck %s
; RUN: opt < %s -passes='nary-reassociate' -S | opt -early-cse -S | FileCheck %s
; Module-wide target settings; the triple names a 64-bit NVPTX target.
target datalayout = "e-i64:64-v16:16-v32:32-n16:32:64"
target triple = "nvptx64-unknown-unknown"
; External function with no body here; every test passes its GEP results to
; it so that each computed pointer has a visible use.
declare void @foo(float*)
; Basic case: two GEPs off the same base %a, one indexed by %i and one by
; %i + %j (both i64). The patterns below expect the second GEP to be re-based
; on the first GEP's result, with %j as its only index.
;
; foo(&a[i]);
; foo(&a[i + j]);
; =>
; t = &a[i];
; foo(t);
; foo(t + j);
define void @reassociate_gep(float* %a, i64 %i, i64 %j) {
; CHECK-LABEL: @reassociate_gep(
; %1 = i + j; in the input it is used only as the index of the second GEP (%3).
%1 = add i64 %i, %j
; &a[i]: expected to survive unchanged and be captured as t1.
%2 = getelementptr float, float* %a, i64 %i
; CHECK: [[t1:[^ ]+]] = getelementptr float, float* %a, i64 %i
call void @foo(float* %2)
; CHECK: call void @foo(float* [[t1]])
; &a[i + j] as written; expected to come out as a GEP off t1 indexed by %j.
%3 = getelementptr float, float* %a, i64 %1
; CHECK: [[t2:[^ ]+]] = getelementptr float, float* [[t1]], i64 %j
call void @foo(float* %3)
; CHECK: call void @foo(float* [[t2]])
ret void
}
; Indexes here are i32 values that are sign-extended to i64 before being used
; in a GEP, and both i32 adds carry the nsw flag. The patterns expect each
; later GEP to be chained off the previous one using sext(i) as the index.
;
; foo(&a[sext(j)]);
; foo(&a[sext(i +nsw j)]);
; foo(&a[sext((i +nsw j) +nsw i)]);
; =>
; t1 = &a[sext(j)];
; foo(t1);
; t2 = t1 + sext(i);
; foo(t2);
; t3 = t2 + sext(i); // sext(i) should be GVN'ed.
; foo(t3);
define void @reassociate_gep_nsw(float* %a, i32 %i, i32 %j) {
; CHECK-LABEL: @reassociate_gep_nsw(
; sext(j); the value name %idxprom.j is matched literally by the pattern below,
; so it must not be renamed.
%idxprom.j = sext i32 %j to i64
%1 = getelementptr float, float* %a, i64 %idxprom.j
; CHECK: [[t1:[^ ]+]] = getelementptr float, float* %a, i64 %idxprom.j
call void @foo(float* %1)
; CHECK: call void @foo(float* [[t1]])
; %2 = i +nsw j, then sign-extended and used to index %a directly.
%2 = add nsw i32 %i, %j
%idxprom.2 = sext i32 %2 to i64
%3 = getelementptr float, float* %a, i64 %idxprom.2
; Expected output: a fresh sext of %i (captured as sexti) and a GEP off t1.
; CHECK: [[sexti:[^ ]+]] = sext i32 %i to i64
; CHECK: [[t2:[^ ]+]] = getelementptr float, float* [[t1]], i64 [[sexti]]
call void @foo(float* %3)
; CHECK: call void @foo(float* [[t2]])
; %4 = (i +nsw j) +nsw i, again sign-extended before indexing %a.
%4 = add nsw i32 %2, %i
%idxprom.4 = sext i32 %4 to i64
%5 = getelementptr float, float* %a, i64 %idxprom.4
; The pattern reuses the sexti capture, so the output must reuse the same
; sext of %i rather than emit a second one.
; CHECK: [[t3:[^ ]+]] = getelementptr float, float* [[t2]], i64 [[sexti]]
call void @foo(float* %5)
; CHECK: call void @foo(float* [[t3]])
ret void
}
; Variant where the indexes are zero-extended and the i32 add has no nsw
; flag; instead, llvm.assume calls state that j and i + j are non-negative.
; The patterns still expect the second GEP to be chained off the first one
; with sext(i) as the index.
; NOTE(review): presumably the assumes are what make the zext indexes
; splittable here - confirm against the pass implementation.
;
; assume(j >= 0);
; foo(&a[zext(j)]);
; assume(i + j >= 0);
; foo(&a[zext(i + j)]);
; =>
; t1 = &a[zext(j)];
; foo(t1);
; t2 = t1 + sext(i);
; foo(t2);
define void @reassociate_gep_assume(float* %a, i32 %i, i32 %j) {
; CHECK-LABEL: @reassociate_gep_assume(
; assume(j >= 0)
; (written as the signed comparison j > -1)
%cmp = icmp sgt i32 %j, -1
call void @llvm.assume(i1 %cmp)
; %1 = i + j with no wrap flags, followed by assume(i + j >= 0) in the same
; j > -1 form as above.
%1 = add i32 %i, %j
%cmp2 = icmp sgt i32 %1, -1
call void @llvm.assume(i1 %cmp2)
; zext(j); the name %idxprom.j is matched literally by the pattern below.
%idxprom.j = zext i32 %j to i64
%2 = getelementptr float, float* %a, i64 %idxprom.j
; CHECK: [[t1:[^ ]+]] = getelementptr float, float* %a, i64 %idxprom.j
call void @foo(float* %2)
; CHECK: call void @foo(float* [[t1]])
; zext(i + j) used to index %a directly in the input.
%idxprom.1 = zext i32 %1 to i64
%3 = getelementptr float, float* %a, i64 %idxprom.1
; Expected output: %i is sign-extended (not zero-extended) and added to t1.
; CHECK: [[sexti:[^ ]+]] = sext i32 %i to i64
; CHECK: [[t2:[^ ]+]] = getelementptr float, float* [[t1]], i64 [[sexti]]
call void @foo(float* %3)
; CHECK: call void @foo(float* [[t2]])
ret void
}
; Negative test: the i32 add below has no nsw flag and there are no assumes,
; and the GEPs take the i32 values directly as indexes. The patterns expect
; both GEPs to remain based on %a with their original indexes.
; Do not split the second GEP because sext(i + j) != sext(i) + sext(j).
define void @reassociate_gep_no_nsw(float* %a, i32 %i, i32 %j) {
; CHECK-LABEL: @reassociate_gep_no_nsw(
; %1 = i + j, without any wrap flags.
%1 = add i32 %i, %j
%2 = getelementptr float, float* %a, i32 %j
; CHECK: getelementptr float, float* %a, i32 %j
call void @foo(float* %2)
; The pattern below names %1 literally, so the second GEP must keep indexing
; %a by the unsplit sum.
%3 = getelementptr float, float* %a, i32 %1
; CHECK: getelementptr float, float* %a, i32 %1
call void @foo(float* %3)
ret void
}
; Same shape as @reassociate_gep, but with i128 indexes. The patterns expect
; the first GEP to keep its i128 index %i, and the second GEP to be rebuilt
; off the first one using %j truncated to i64 as the index.
define void @reassociate_gep_128(float* %a, i128 %i, i128 %j) {
; CHECK-LABEL: @reassociate_gep_128(
; %1 = i + j as a 128-bit add; it only feeds the second GEP (%3).
%1 = add i128 %i, %j
%2 = getelementptr float, float* %a, i128 %i
; CHECK: [[t1:[^ ]+]] = getelementptr float, float* %a, i128 %i
call void @foo(float* %2)
; CHECK: call void @foo(float* [[t1]])
%3 = getelementptr float, float* %a, i128 %1
; Expected output: an explicit trunc of %j to i64 feeding a GEP off t1.
; CHECK: [[truncj:[^ ]+]] = trunc i128 %j to i64
; CHECK: [[t2:[^ ]+]] = getelementptr float, float* [[t1]], i64 [[truncj]]
call void @foo(float* %3)
; CHECK: call void @foo(float* [[t2]])
ret void
}
; A struct of two floats, plus an external consumer of pointers to it.
%struct.complex = type { float, float }
declare void @bar(%struct.complex*)
; The two GEPs here produce different pointer types: %t1 is a
; %struct.complex* for element i, while %t2 is a float* to field 0 of element
; i + 5. The patterns expect %t2 to be rebuilt from %t1 via a bitcast to
; float* followed by a GEP of 10 floats, which is consistent with 5 structs
; of two floats each.
define void @different_types(%struct.complex* %input, i64 %i) {
; CHECK-LABEL: @different_types(
; &input[i]; the name %t1 is matched literally by the bitcast pattern below.
%t1 = getelementptr %struct.complex, %struct.complex* %input, i64 %i
call void @bar(%struct.complex* %t1)
%j = add i64 %i, 5
; &input[i + 5].field0, yielding a float*.
%t2 = getelementptr %struct.complex, %struct.complex* %input, i64 %j, i32 0
; The three patterns below must match consecutive output lines: the cast, the
; rewritten %t2, and the call that consumes it.
; CHECK: [[cast:[^ ]+]] = bitcast %struct.complex* %t1 to float*
; CHECK-NEXT: %t2 = getelementptr float, float* [[cast]], i64 10
; CHECK-NEXT: call void @foo(float* %t2)
call void @foo(float* %t2)
ret void
}
; Declaration of the assume intrinsic called in @reassociate_gep_assume to
; state that %j and %i + %j are greater than -1.
declare void @llvm.assume(i1)