54 lines
1.9 KiB
LLVM
54 lines
1.9 KiB
LLVM
; RUN: opt -loop-reduce -S < %s | FileCheck %s
|
|
;
|
|
; Test LSR's intelligence regarding phi reuse.
|
|
; Verify that scaled GEPs are not reused. rdar://5064068
|
|
|
|
target triple = "x86-apple-darwin"
|
|
|
|
; CHECK: @test
|
|
; multiplies are hoisted out of the loop
|
|
; CHECK: while.body.lr.ph:
|
|
; CHECK: mul i64
|
|
; CHECK: mul i64
|
|
; GEPs are ugly
|
|
; CHECK: while.body:
|
|
; CHECK: phi
|
|
; CHECK: phi
|
|
; CHECK: phi
|
|
; CHECK: phi
|
|
; CHECK-NOT: phi
|
|
; CHECK: bitcast float* {{.*}} to i8*
|
|
; CHECK: bitcast float* {{.*}} to i8*
|
|
; CHECK: getelementptr i8*
|
|
; CHECK: getelementptr i8*
|
|
|
|
define float @test(float* nocapture %A, float* nocapture %B, i32 %N, i32 %IA, i32 %IB) nounwind uwtable readonly ssp {
|
|
entry:
|
|
%cmp1 = icmp sgt i32 %N, 0
|
|
br i1 %cmp1, label %while.body.lr.ph, label %while.end
|
|
|
|
while.body.lr.ph: ; preds = %entry
|
|
%idx.ext = sext i32 %IA to i64
|
|
%idx.ext2 = sext i32 %IB to i64
|
|
br label %while.body
|
|
|
|
while.body: ; preds = %while.body.lr.ph, %while.body
|
|
%A.addr.05 = phi float* [ %A, %while.body.lr.ph ], [ %add.ptr, %while.body ]
|
|
%B.addr.04 = phi float* [ %B, %while.body.lr.ph ], [ %add.ptr3, %while.body ]
|
|
%N.addr.03 = phi i32 [ %N, %while.body.lr.ph ], [ %sub, %while.body ]
|
|
%Sum0.02 = phi float [ 0.000000e+00, %while.body.lr.ph ], [ %add, %while.body ]
|
|
%0 = load float* %A.addr.05, align 4
|
|
%1 = load float* %B.addr.04, align 4
|
|
%mul = fmul float %0, %1
|
|
%add = fadd float %Sum0.02, %mul
|
|
%add.ptr = getelementptr inbounds float* %A.addr.05, i64 %idx.ext
|
|
%add.ptr3 = getelementptr inbounds float* %B.addr.04, i64 %idx.ext2
|
|
%sub = add nsw i32 %N.addr.03, -1
|
|
%cmp = icmp sgt i32 %sub, 0
|
|
br i1 %cmp, label %while.body, label %while.end
|
|
|
|
while.end: ; preds = %while.body, %entry
|
|
%Sum0.0.lcssa = phi float [ 0.000000e+00, %entry ], [ %add, %while.body ]
|
|
ret float %Sum0.0.lcssa
|
|
}
|