1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
; RUN: opt %loadPolly -analyze -polly-scops \
; RUN: -polly-invariant-load-hoisting=true < %s | FileCheck %s
; RUN: opt %loadPolly -S -polly-codegen \
; RUN: -polly-invariant-load-hoisting=true < %s | FileCheck %s --check-prefix=IR
;
; void f(long *A, long *B, long *ptr, long val) {
; for (long i = 0; i < 100; i++) {
; long ptrV = ((long)(ptr + 1)) + 1;
; long valP = (long)(((long *)(val + 1)) + 1);
; A[ptrV] += B[valP];
; }
; }
;
; CHECK: ReadAccess := [Reduction Type: NONE] [Scalar: 0]
; CHECK-NEXT: [val, ptr] -> { Stmt_for_body[i0] -> MemRef_B[9 + val] };
; CHECK-NEXT: Execution Context: [val, ptr] -> { : val <= 32766 }
;
; CHECK: ReadAccess := [Reduction Type: +] [Scalar: 0]
; CHECK-NEXT: [val, ptr] -> { Stmt_for_body[i0] -> MemRef_A[9 + ptr] };
; CHECK-NEXT: MustWriteAccess := [Reduction Type: +] [Scalar: 0]
; CHECK-NEXT: [val, ptr] -> { Stmt_for_body[i0] -> MemRef_A[9 + ptr] };
;
; IR: polly.stmt.for.body:
; IR-NEXT: %p_tmp = ptrtoint i64* %scevgep to i16
; IR-NEXT: %p_add = add nsw i16 %p_tmp, 1
; IR-NEXT: %p_arrayidx3 = getelementptr inbounds i64, i64* %A, i16 %p_add
; IR-NEXT: %tmp4_p_scalar_ = load i64, i64* %p_arrayidx3
; IR-NEXT: %p_add4 = add nsw i64 %tmp4_p_scalar_, %polly.preload.tmp3.merge
; IR-NEXT: store i64 %p_add4, i64* %p_arrayidx3
;
; IR: polly.loop_preheader:
; IR-NEXT: %scevgep = getelementptr i64, i64* %ptr, i16 1
; IR-NEXT: %35 = add i16 %val, 1
; IR-NEXT: br label %polly.loop_header
;
;
; Data layout for this test: little-endian ("e") with "p:16:16:16", i.e.
; pointers that are 16 bits wide with 16-bit ABI and preferred alignment.
; This matches the i16 type used by the ptrtoint/inttoptr conversions in @f.
target datalayout = "e-p:16:16:16-m:e-i64:64-f80:128-n8:16:16:64-S128"
; Test kernel: a loop that performs A[idxA] += B[idxB], where both indices
; come from pointer <-> integer conversions. The loop body never reads the
; induction variable %i.0, so neither index changes between iterations.
;   %A   - i64 array that is loaded from and stored back to
;   %B   - i64 array that is only loaded from
;   %ptr - pointer whose address (as an i16 integer) yields the index into %A
;   %val - i16 integer that is converted to a pointer and back to index %B
define void @f(i64* %A, i64* %B, i64* %ptr, i16 %val) {
entry:
br label %for.cond
; Loop header: %i.0 is 0 on entry and %inc on the back edge; the loop
; continues while %i.0 != 100.
for.cond: ; preds = %for.inc, %entry
%i.0 = phi i64 [ 0, %entry ], [ %inc, %for.inc ]
%exitcond = icmp ne i64 %i.0, 100
br i1 %exitcond, label %for.body, label %for.end
for.body: ; preds = %for.cond
; Index into A: step %ptr forward by one i64 element, reinterpret the
; resulting address as an i16 integer, then add 1 (nsw).
%add.ptr = getelementptr inbounds i64, i64* %ptr, i64 1
%tmp = ptrtoint i64* %add.ptr to i16
%add = add nsw i16 %tmp, 1
; Index into B: add 1 (nsw) to %val, reinterpret the sum as a pointer, step
; it forward by one i64 element, and convert the address back to i16.
%add1 = add nsw i16 %val, 1
%tmp1 = inttoptr i16 %add1 to i64*
%add.ptr2 = getelementptr inbounds i64, i64* %tmp1, i64 1
%tmp2 = ptrtoint i64* %add.ptr2 to i16
; Load the B element selected by %tmp2.
%arrayidx = getelementptr inbounds i64, i64* %B, i16 %tmp2
%tmp3 = load i64, i64* %arrayidx
; Read-modify-write of the A element selected by %add: load it, add the
; value loaded from B, and store the sum back through the same address.
%arrayidx3 = getelementptr inbounds i64, i64* %A, i16 %add
%tmp4 = load i64, i64* %arrayidx3
%add4 = add nsw i64 %tmp4, %tmp3
store i64 %add4, i64* %arrayidx3
br label %for.inc
; Latch: advance the induction variable by one and return to the header.
for.inc: ; preds = %for.body
%inc = add nuw nsw i64 %i.0, 1
br label %for.cond
for.end: ; preds = %for.cond
ret void
}
|