1 ; RUN: opt %loadPolly -polly-detect-unprofitable -polly-parallel -polly-ast -analyze < %s | FileCheck %s -check-prefix=AST
2 ; RUN: opt %loadPolly -polly-detect-unprofitable -polly-parallel -polly-codegen-isl -S < %s | FileCheck %s -check-prefix=IR
7 ; void loop_references_outer_ids(long n) {
8 ; for (long i = 0; i < 100; i++)
9 ; for (long j = 0; j < 100; j++)
10 ; for (long k = 0; k < n + i; k++)
14 ; In this test case we verify that the j-loop is generated as an OpenMP parallel
15 ; loop and that the values of 'i' and 'n', needed in the loop bounds of the
16 ; k-loop, are correctly passed to the subfunction.
18 ; AST: #pragma minimal dependence distance: 1
19 ; AST: for (int c0 = max(0, -n + 1); c0 <= 99; c0 += 1)
20 ; AST: #pragma omp parallel for
21 ; AST: for (int c1 = 0; c1 <= 99; c1 += 1)
22 ; AST: #pragma minimal dependence distance: 1
23 ; AST: for (int c2 = 0; c2 < n + c0; c2 += 1)
24 ; AST: Stmt_for_body6(c0, c1, c2);
26 ; IR: %polly.par.userContext = alloca { i64, i64 }
27 ; IR: %[[R0:[0-9]+]] = bitcast { i64, i64 }* %polly.par.userContext to i8*
28 ; IR-NEXT: call void @llvm.lifetime.start(i64 16, i8* %[[R0]])
29 ; IR-NEXT: %[[R1:[0-9]+]] = getelementptr inbounds { i64, i64 }, { i64, i64 }* %polly.par.userContext, i32 0, i32 0
30 ; IR-NEXT: store i64 %n, i64* %[[R1]]
31 ; IR-NEXT: %[[R2:[0-9]+]] = getelementptr inbounds { i64, i64 }, { i64, i64 }* %polly.par.userContext, i32 0, i32 1
32 ; IR-NEXT: store i64 %polly.indvar, i64* %[[R2]]
33 ; IR-NEXT: %polly.par.userContext1 = bitcast { i64, i64 }* %polly.par.userContext to i8*
35 ; IR-LABEL: @loop_references_outer_ids.polly.subfn(i8* %polly.par.userContext)
36 ; IR: %polly.par.userContext1 = bitcast i8* %polly.par.userContext to { i64, i64 }*
37 ; IR-NEXT: %[[R3:[0-9]+]] = getelementptr inbounds { i64, i64 }, { i64, i64 }* %polly.par.userContext1, i32 0, i32 0
38 ; IR-NEXT: %[[R4:[0-9]+]] = load i64* %[[R3]]
39 ; IR-NEXT: %[[R5:[0-9]+]] = getelementptr inbounds { i64, i64 }, { i64, i64 }* %polly.par.userContext1, i32 0, i32 1
40 ; IR-NEXT: %[[R6:[0-9]+]] = load i64* %[[R5]]
; Data layout for this module: little-endian ("e"), ELF name mangling ("m:e"),
; i64 aligned to 64 bits, f80 aligned to 128 bits, native integer widths of
; 8/16/32/64 bits, and a 128-bit natural stack alignment ("S128").
42 target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
; Global array of 100 floats. Block for.body6 loads element %j.0, adds a value
; derived from i + j + k, and stores the result back to the same element.
44 @A = common global [100 x float] zeroinitializer, align 16
46 define void @loop_references_outer_ids(i64 %n) {
50 for.cond: ; preds = %for.inc03, %entry
51 %i.0 = phi i64 [ 0, %entry ], [ %inc04, %for.inc03 ]
52 %exitcond1 = icmp ne i64 %i.0, 100
53 br i1 %exitcond1, label %for.body, label %for.end15
55 for.body: ; preds = %for.cond
58 for.cond1: ; preds = %for.inc00, %for.body
59 %j.0 = phi i64 [ 0, %for.body ], [ %inc01, %for.inc00 ]
60 %exitcond = icmp ne i64 %j.0, 100
61 br i1 %exitcond, label %for.body3, label %for.end12
63 for.body3: ; preds = %for.cond1
66 for.cond4: ; preds = %for.inc, %for.body3
67 %k.0 = phi i64 [ 0, %for.body3 ], [ %inc, %for.inc ]
68 %add = add nsw i64 %i.0, %n
69 %cmp5 = icmp slt i64 %k.0, %add
70 br i1 %cmp5, label %for.body6, label %for.end
72 for.body6: ; preds = %for.cond4
73 %add7 = add nsw i64 %i.0, %j.0
74 %add8 = add nsw i64 %add7, %k.0
75 %conv = sitofp i64 %add8 to float
76 %arrayidx = getelementptr inbounds [100 x float], [100 x float]* @A, i64 0, i64 %j.0
77 %tmp = load float* %arrayidx, align 4
78 %add9 = fadd float %tmp, %conv
79 store float %add9, float* %arrayidx, align 4
82 for.inc: ; preds = %for.body6
83 %inc = add nsw i64 %k.0, 1
86 for.end: ; preds = %for.cond4
89 for.inc00: ; preds = %for.end
90 %inc01 = add nsw i64 %j.0, 1
93 for.end12: ; preds = %for.cond1
96 for.inc03: ; preds = %for.end12
97 %inc04 = add nsw i64 %i.0, 1
100 for.end15: ; preds = %for.cond