falkor-hwpf-fix.ll
1.94 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
; RUN: llc < %s -mtriple aarch64 -mcpu=falkor -disable-post-ra | FileCheck %s
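; Check that strided load tag collisions are avoided on Falkor: in the expected
; output below, each `mov` copies a load's base register so that the following
; paired load addresses memory through a different base register.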
; CHECK-LABEL: hwpf1:
; CHECK: ldp {{w[0-9]+}}, {{w[0-9]+}}, [x[[BASE:[0-9]+]], #-16]
; CHECK: mov x[[BASE2:[0-9]+]], x[[BASE]]
; CHECK: ldp {{w[0-9]+}}, {{w[0-9]+}}, [x[[BASE2]], #-8]
; CHECK: ldp {{w[0-9]+}}, {{w[0-9]+}}, [x[[BASE3:[0-9]+]]]
; CHECK: mov x[[BASE4:[0-9]+]], x[[BASE3]]
; CHECK: ldp {{w[0-9]+}}, {{w[0-9]+}}, [x[[BASE4]], #8]
; hwpf1: walks %p in steps of eight i32 elements. On every trip it reads the
; eight consecutive elements starting at the current index, sums them as four
; adjacent pairs, and writes the four sums to %sp, %sp2, %sp3 and %sp4 at the
; current index. The exit test runs after the body, so the loop keeps going
; until the advanced index is >= 1024 (unsigned compare).
define void @hwpf1(i32* %p, i32* %sp, i32* %sp2, i32* %sp3, i32* %sp4) {
entry:
  br label %loop

loop:
  ; Induction variable: 0 on entry, advanced by 8 at the bottom of the loop.
  %idx = phi i32 [ 0, %entry ], [ %idx.next, %loop ]

  ; Every load below is addressed relative to %base = &p[idx].
  %base = getelementptr inbounds i32, i32* %p, i32 %idx

  ; Pair 0: p[idx + 0] + p[idx + 1] -> sp[idx]
  %v0 = load i32, i32* %base
  %addr1 = getelementptr inbounds i32, i32* %base, i32 1
  %v1 = load i32, i32* %addr1
  %sum01 = add i32 %v0, %v1
  %dst0 = getelementptr inbounds i32, i32* %sp, i32 %idx
  store i32 %sum01, i32* %dst0

  ; Pair 1: p[idx + 2] + p[idx + 3] -> sp2[idx]
  %addr2 = getelementptr inbounds i32, i32* %base, i32 2
  %v2 = load i32, i32* %addr2
  %addr3 = getelementptr inbounds i32, i32* %base, i32 3
  %v3 = load i32, i32* %addr3
  %sum23 = add i32 %v2, %v3
  %dst1 = getelementptr inbounds i32, i32* %sp2, i32 %idx
  store i32 %sum23, i32* %dst1

  ; Pair 2: p[idx + 4] + p[idx + 5] -> sp3[idx]
  %addr4 = getelementptr inbounds i32, i32* %base, i32 4
  %v4 = load i32, i32* %addr4
  %addr5 = getelementptr inbounds i32, i32* %base, i32 5
  %v5 = load i32, i32* %addr5
  %sum45 = add i32 %v4, %v5
  %dst2 = getelementptr inbounds i32, i32* %sp3, i32 %idx
  store i32 %sum45, i32* %dst2

  ; Pair 3: p[idx + 6] + p[idx + 7] -> sp4[idx]
  %addr6 = getelementptr inbounds i32, i32* %base, i32 6
  %v6 = load i32, i32* %addr6
  %addr7 = getelementptr inbounds i32, i32* %base, i32 7
  %v7 = load i32, i32* %addr7
  %sum67 = add i32 %v6, %v7
  %dst3 = getelementptr inbounds i32, i32* %sp4, i32 %idx
  store i32 %sum67, i32* %dst3

  ; Advance by the eight elements consumed and leave once 1024 is reached.
  %idx.next = add i32 %idx, 8
  %done = icmp uge i32 %idx.next, 1024
  br i1 %done, label %exit, label %loop

exit:
  ret void
}