multidim_fold_constant_dim.ll
4.77 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
; RUN: opt %loadPolly -polly-scops -analyze -S < %s | FileCheck %s
;
; struct com {
; double Real;
; double Img;
; };
;
; void foo(long n, struct com A[][n]) {
; for (long i = 0; i < 100; i++)
; for (long j = 0; j < 1000; j++)
; A[i][j].Real += A[i][j].Img;
; }
;
; int main() {
; struct com A[100][1000];
; foo(1000, A);
; }
; CHECK: Arrays {
; CHECK-NEXT: double MemRef_A[*][(2 * %n)]; // Element size 8
; CHECK-NEXT: }
; CHECK: Stmt_for_body3
; CHECK-NEXT: Domain :=
; CHECK-NEXT: [n] -> { Stmt_for_body3[i0, i1] : 0 <= i0 <= 99 and 0 <= i1 <= 999 };
; CHECK-NEXT: Schedule :=
; CHECK-NEXT: [n] -> { Stmt_for_body3[i0, i1] -> [i0, i1] };
; CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 0]
; CHECK-NEXT: [n] -> { Stmt_for_body3[i0, i1] -> MemRef_A[i0, 1 + 2i1] };
; CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 0]
; CHECK-NEXT: [n] -> { Stmt_for_body3[i0, i1] -> MemRef_A[i0, 2i1] };
; CHECK-NEXT: MustWriteAccess := [Reduction Type: NONE] [Scalar: 0]
; CHECK-NEXT: [n] -> { Stmt_for_body3[i0, i1] -> MemRef_A[i0, 2i1] };
source_filename = "/tmp/test.c"
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
%struct.com = type { double, double }
%struct.com2 = type { [20000000000 x double] }
define void @foo(i64 %n, %struct.com* %A) {
entry:
br label %for.cond
for.cond: ; preds = %for.inc7, %entry
%i.0 = phi i64 [ 0, %entry ], [ %inc8, %for.inc7 ]
%exitcond1 = icmp ne i64 %i.0, 100
br i1 %exitcond1, label %for.body, label %for.end9
for.body: ; preds = %for.cond
br label %for.cond1
for.cond1: ; preds = %for.inc, %for.body
%j.0 = phi i64 [ 0, %for.body ], [ %inc, %for.inc ]
%exitcond = icmp ne i64 %j.0, 1000
br i1 %exitcond, label %for.body3, label %for.end
for.body3: ; preds = %for.cond1
%tmp = mul nsw i64 %i.0, %n
%arrayidx = getelementptr inbounds %struct.com, %struct.com* %A, i64 %tmp
%arrayidx4 = getelementptr inbounds %struct.com, %struct.com* %arrayidx, i64 %j.0
%Img = getelementptr inbounds %struct.com, %struct.com* %arrayidx4, i64 0, i32 1
%tmp2 = load double, double* %Img, align 8
%tmp3 = mul nsw i64 %i.0, %n
%arrayidx5 = getelementptr inbounds %struct.com, %struct.com* %A, i64 %tmp3
%arrayidx6 = getelementptr inbounds %struct.com, %struct.com* %arrayidx5, i64 %j.0
%Real = getelementptr inbounds %struct.com, %struct.com* %arrayidx6, i64 0, i32 0
%tmp4 = load double, double* %Real, align 8
%add = fadd double %tmp4, %tmp2
store double %add, double* %Real, align 8
br label %for.inc
for.inc: ; preds = %for.body3
%inc = add nuw nsw i64 %j.0, 1
br label %for.cond1
for.end: ; preds = %for.cond1
br label %for.inc7
for.inc7: ; preds = %for.end
%inc8 = add nuw nsw i64 %i.0, 1
br label %for.cond
for.end9: ; preds = %for.cond
ret void
}
; CHECK: Arrays {
; CHECK-NEXT: double MemRef_O[*][%n]; // Element size 8
; CHECK-NEXT: }
define void @foo_overflow(i64 %n, %struct.com2* nocapture %O) local_unnamed_addr #0 {
entry:
br label %for.body
for.cond.cleanup: ; preds = %for.cond.cleanup3
ret void
for.body: ; preds = %for.cond.cleanup3, %entry
%i.024 = phi i64 [ 0, %entry ], [ %inc12, %for.cond.cleanup3 ]
%0 = mul nsw i64 %i.024, %n
%arrayidx = getelementptr inbounds %struct.com2, %struct.com2* %O, i64 %0
br label %for.body4
for.cond.cleanup3: ; preds = %for.body4
%inc12 = add nuw nsw i64 %i.024, 1
%exitcond25 = icmp eq i64 %inc12, 100
br i1 %exitcond25, label %for.cond.cleanup, label %for.body
for.body4: ; preds = %for.body4, %for.body
%j.023 = phi i64 [ 0, %for.body ], [ %inc, %for.body4 ]
%arrayidx5 = getelementptr inbounds %struct.com2, %struct.com2* %arrayidx, i64 %j.023
%Real = getelementptr inbounds %struct.com2, %struct.com2* %arrayidx5, i64 0, i32 0
%arrayidx6 = getelementptr inbounds [20000000000 x double], [20000000000 x double]* %Real, i64 0, i64 1
%1 = load double, double* %arrayidx6, align 8
%arrayidx10 = getelementptr inbounds [20000000000 x double], [20000000000 x double]* %Real, i64 0, i64 0
%2 = load double, double* %arrayidx10, align 8
%add = fadd double %1, %2
store double %add, double* %arrayidx10, align 8
%inc = add nuw nsw i64 %j.023, 1
%exitcond = icmp eq i64 %inc, 1000
br i1 %exitcond, label %for.cond.cleanup3, label %for.body4
}