| ; RUN: opt -hardware-loops -force-hardware-loops=true -hardware-loop-decrement=1 -hardware-loop-counter-bitwidth=32 -S %s -o - | FileCheck %s |
| ; RUN: opt -hardware-loops -force-hardware-loops=true -hardware-loop-decrement=1 -hardware-loop-counter-bitwidth=32 -force-hardware-loop-phi=true -S %s -o - | FileCheck %s |
| ; RUN: opt -hardware-loops -force-hardware-loops=true -hardware-loop-decrement=1 -hardware-loop-counter-bitwidth=32 -force-nested-hardware-loop=true -S %s -o - | FileCheck %s |
| |
| ; CHECK-LABEL: float_counter |
| ; CHECK-NOT: set.loop.iterations |
| ; CHECK-NOT: loop.decrement |
| define void @float_counter(i32* nocapture %A, float %N) { |
| entry: |
| %cmp6 = fcmp ogt float %N, 0.000000e+00 |
| br i1 %cmp6, label %while.body, label %while.end |
| |
| while.body: |
| %i.07 = phi i32 [ %inc, %while.body ], [ 0, %entry ] |
| %arrayidx = getelementptr inbounds i32, i32* %A, i32 %i.07 |
| store i32 %i.07, i32* %arrayidx, align 4 |
| %inc = add i32 %i.07, 1 |
| %conv = uitofp i32 %inc to float |
| %cmp = fcmp olt float %conv, %N |
| br i1 %cmp, label %while.body, label %while.end |
| |
| while.end: |
| ret void |
| } |
| |
| ; CHECK-LABEL: variant_counter |
| ; CHECK-NOT: set.loop.iterations |
| ; CHECK-NOT: loop.decrement |
| define void @variant_counter(i32* nocapture %A, i32* nocapture readonly %B) { |
| entry: |
| %0 = load i32, i32* %B, align 4 |
| %cmp7 = icmp eq i32 %0, 0 |
| br i1 %cmp7, label %while.end, label %while.body |
| |
| while.body: |
| %i.08 = phi i32 [ %inc, %while.body ], [ 0, %entry ] |
| %arrayidx1 = getelementptr inbounds i32, i32* %A, i32 %i.08 |
| store i32 %i.08, i32* %arrayidx1, align 4 |
| %inc = add nuw i32 %i.08, 1 |
| %arrayidx = getelementptr inbounds i32, i32* %B, i32 %inc |
| %1 = load i32, i32* %arrayidx, align 4 |
| %cmp = icmp ult i32 %inc, %1 |
| br i1 %cmp, label %while.body, label %while.end |
| |
| while.end: |
| ret void |
| } |
| |
| ; CHECK-LABEL: variant_counter2 |
| ; CHECK-NOT: set.loop.iterations |
| ; CHECK-NOT: loop.decrement |
| define void @variant_counter2(i8*, i8*, i64*) { |
| %4 = icmp eq i8* %0, %1 |
| br i1 %4, label %9, label %5 |
| |
| 5: ; preds = %3 |
| %6 = getelementptr inbounds i64, i64* %2, i64 1 |
| %7 = load i64, i64* %6, align 8 |
| br label %10 |
| |
| 8: ; preds = %10 |
| store i64 %14, i64* %6, align 8 |
| br label %9 |
| |
| 9: ; preds = %8, %3 |
| ret void |
| |
| 10: ; preds = %5, %10 |
| %11 = phi i64 [ %7, %5 ], [ %14, %10 ] |
| %12 = phi i32 [ 0, %5 ], [ %15, %10 ] |
| %13 = phi i8* [ %0, %5 ], [ %16, %10 ] |
| %14 = shl nsw i64 %11, 4 |
| %15 = add nuw nsw i32 %12, 1 |
| %16 = getelementptr inbounds i8, i8* %13, i64 1 |
| %17 = icmp ugt i32 %12, 14 |
| %18 = icmp eq i8* %16, %1 |
| %19 = or i1 %18, %17 |
| br i1 %19, label %8, label %10 |
| } |