1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
|
; RUN: opt %s -disable-output -analyze -lda | FileCheck %s
; Two zero-initialized arrays of 256 i32 elements each. Every function in this
; file loads from @x and @y and stores back into @x.
@x = common global [256 x i32] zeroinitializer, align 4
@y = common global [256 x i32] zeroinitializer, align 4
;; C equivalent:
;;   for (i = 0; i < 256; i++)
;;     x[i] = x[i] + y[i];
;;
;; The load from @x and the store to @x share one address (%x.ptr), i.e. the
;; same subscript %iv. The trailing "; N" notes number the memory instructions
;; in program order; the pairs in the CHECK lines presumably use that numbering.
define void @f1(...) nounwind {
entry:
  br label %for.body

for.body:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %for.body ]
  %x.ptr = getelementptr [256 x i32]* @x, i64 0, i64 %iv
  %y.ptr = getelementptr [256 x i32]* @y, i64 0, i64 %iv
  %x.val = load i32* %x.ptr                 ; 0
  %y.val = load i32* %y.ptr                 ; 1
  %sum = add i32 %y.val, %x.val
  store i32 %sum, i32* %x.ptr               ; 2
; CHECK: 0,2: dep
; CHECK: 1,2: ind
  %iv.next = add i64 %iv, 1
  %done = icmp eq i64 %iv.next, 256
  br i1 %done, label %for.end, label %for.body

for.end:
  ret void
}
;; C equivalent:
;;   for (i = 0; i < 256; i++)
;;     x[i+1] = x[i] + y[i];
;;
;; The store subscript (%iv.next) is exactly one ahead of the load subscript
;; (%iv). %iv.next doubles as the loop increment, so it is computed before the
;; addresses rather than at the bottom of the loop.
;;
;; NOTE(review): on the last iteration (%iv = 255) the store subscript is 256,
;; one past the end of the 256-element @x. The function is only fed to the
;; analysis here, but confirm that this is intentional.
define void @f2(...) nounwind {
entry:
  br label %for.body

for.body:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %for.body ]
  %iv.next = add i64 %iv, 1
  %x.src = getelementptr [256 x i32]* @x, i64 0, i64 %iv
  %y.src = getelementptr [256 x i32]* @y, i64 0, i64 %iv
  %x.dst = getelementptr [256 x i32]* @x, i64 0, i64 %iv.next
  %x.val = load i32* %x.src                 ; 0
  %y.val = load i32* %y.src                 ; 1
  %sum = add i32 %y.val, %x.val
  store i32 %sum, i32* %x.dst               ; 2
; CHECK: 0,2: dep
; CHECK: 1,2: ind
  %done = icmp eq i64 %iv.next, 256
  br i1 %done, label %for.end, label %for.body

for.end:
  ret void
}
;; C equivalent:
;;   for (i = 0; i < 10; i++)
;;     x[i+20] = x[i] + y[i];
;;
;; The store subscript is the load subscript plus a constant 20, while the loop
;; runs only 10 iterations.
;;
;; NOTE(review): the loads touch x[0..9] and the stores touch x[20..29], so the
;; two ranges never overlap. The expected "0,2: dep" therefore looks like a
;; conservative answer from the analysis -- confirm before tightening it.
define void @f3(...) nounwind {
entry:
  br label %for.body

for.body:
  %iv = phi i64 [ 0, %entry ], [ %iv.next, %for.body ]
  %iv.plus20 = add i64 %iv, 20
  %x.src = getelementptr [256 x i32]* @x, i64 0, i64 %iv
  %y.src = getelementptr [256 x i32]* @y, i64 0, i64 %iv
  %x.dst = getelementptr [256 x i32]* @x, i64 0, i64 %iv.plus20
  %x.val = load i32* %x.src                 ; 0
  %y.val = load i32* %y.src                 ; 1
  %sum = add i32 %y.val, %x.val
  store i32 %sum, i32* %x.dst               ; 2
; CHECK: 0,2: dep
; CHECK: 1,2: ind
  %iv.next = add i64 %iv, 1
  %done = icmp eq i64 %iv.next, 10
  br i1 %done, label %for.end, label %for.body

for.end:
  ret void
}
;; C equivalent:
;;   for (i = 0; i < 10; i++)
;;     x[10*i+1] = x[10*i] + y[i];
;;
;; Both @x subscripts scale the induction variable by 10; the store subscript
;; adds a constant 1 on top. @y is indexed by the plain induction variable, as
;; the C loop states.
;;
;; NOTE(review): 10*i+1 is never a multiple of 10, so the stored elements
;; (x[1], x[11], ..., x[91]) never coincide with the loaded ones (x[0], x[10],
;; ..., x[90]). The expected "0,2: dep" therefore looks like a conservative
;; answer from the analysis -- confirm before tightening it.
define void @f4(...) nounwind {
entry:
  br label %for.body

for.body:
  %i = phi i64 [ 0, %entry ], [ %i.next, %for.body ]
  %i.10 = mul i64 %i, 10
  %y.ld.addr = getelementptr [256 x i32]* @y, i64 0, i64 %i
  %x.ld.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.10
  %i.10.1 = add i64 %i.10, 1
  %x.st.addr = getelementptr [256 x i32]* @x, i64 0, i64 %i.10.1
  %x = load i32* %x.ld.addr                 ; 0
  %y = load i32* %y.ld.addr                 ; 1
  %r = add i32 %y, %x
  store i32 %r, i32* %x.st.addr             ; 2
; CHECK: 0,2: dep
; CHECK: 1,2: ind
  %i.next = add i64 %i, 1
  %exitcond = icmp eq i64 %i.next, 10
  br i1 %exitcond, label %for.end, label %for.body

for.end:
  ret void
}
|