Skip to content

Commit f729a6c

Browse files
committed
[DA] use NSW arithmetic
DA uses SCEV to solve linear constraints. When it generates SCEVs with negative strides, i.e., {0,+,-1}, make sure the SCEVs are marked as non wrap arithmetic. This patch fixes #51512
1 parent 0755bb4 commit f729a6c

File tree

2 files changed

+36
-2
lines changed

2 files changed

+36
-2
lines changed

llvm/lib/Analysis/DependenceAnalysis.cpp

+2-2
Original file line numberDiff line numberDiff line change
@@ -3166,7 +3166,7 @@ const SCEV *DependenceInfo::addToCoefficient(const SCEV *Expr,
31663166
return SE->getAddRecExpr(Expr,
31673167
Value,
31683168
TargetLoop,
3169-
SCEV::FlagAnyWrap); // Worst case, with no info.
3169+
SCEV::FlagNSW); // Worst case, with no info.
31703170
if (AddRec->getLoop() == TargetLoop) {
31713171
const SCEV *Sum = SE->getAddExpr(AddRec->getStepRecurrence(*SE), Value);
31723172
if (Sum->isZero())
@@ -3177,7 +3177,7 @@ const SCEV *DependenceInfo::addToCoefficient(const SCEV *Expr,
31773177
AddRec->getNoWrapFlags());
31783178
}
31793179
if (SE->isLoopInvariant(AddRec, TargetLoop))
3180-
return SE->getAddRecExpr(AddRec, Value, TargetLoop, SCEV::FlagAnyWrap);
3180+
return SE->getAddRecExpr(AddRec, Value, TargetLoop, SCEV::FlagNSW);
31813181
return SE->getAddRecExpr(
31823182
addToCoefficient(AddRec->getStart(), TargetLoop, Value),
31833183
AddRec->getStepRecurrence(*SE), AddRec->getLoop(),
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,34 @@
1+
; RUN: opt < %s -disable-output "-passes=print<da>" -aa-pipeline=basic-aa
2+
3+
; Check that the testcase does not crash the compiler.
4+
; https://github.com/llvm/llvm-project/issues/51512
5+
6+
define void @func_1() {
7+
entry:
8+
%l_83.i.i = alloca [2 x [5 x i32]], align 1
9+
br label %for.cond857.preheader.i.i
10+
11+
for.cond857.preheader.i.i: ; preds = %cleanup.cont1138.i.i, %entry
12+
%l_89.08.i.i = phi i32 [ 0, %entry ], [ %add1140.i.i, %cleanup.cont1138.i.i ]
13+
%0 = trunc i32 %l_89.08.i.i to i16
14+
%1 = add i16 %0, 3
15+
%arrayidx916.i.i = getelementptr inbounds [2 x [5 x i32]], [2 x [5 x i32]]* %l_83.i.i, i16 0, i16 %0, i16 %1
16+
br label %for.body860.i.i
17+
18+
for.body860.i.i: ; preds = %for.body860.i.i, %for.cond857.preheader.i.i
19+
%l_74.07.i.i = phi i32 [ 0, %for.cond857.preheader.i.i ], [ %add964.i.i, %for.body860.i.i ]
20+
store i32 undef, i32* %arrayidx916.i.i, align 1
21+
%2 = trunc i32 %l_74.07.i.i to i16
22+
%arrayidx962.i.i = getelementptr inbounds [2 x [5 x i32]], [2 x [5 x i32]]* %l_83.i.i, i16 0, i16 %2, i16 %1
23+
store i32 0, i32* %arrayidx962.i.i, align 1
24+
%add964.i.i = add nuw nsw i32 %l_74.07.i.i, 1
25+
br i1 false, label %for.body860.i.i, label %cleanup.cont1138.i.i
26+
27+
cleanup.cont1138.i.i: ; preds = %for.body860.i.i
28+
%add1140.i.i = add nuw nsw i32 %l_89.08.i.i, 1
29+
%cmp602.i.i = icmp eq i32 %l_89.08.i.i, 0
30+
br i1 %cmp602.i.i, label %for.cond857.preheader.i.i, label %for.cond1480.i.i.preheader
31+
32+
for.cond1480.i.i.preheader: ; preds = %cleanup.cont1138.i.i
33+
unreachable
34+
}

0 commit comments

Comments
 (0)