blob: 0ef6ad15d4eb0f112c6e68880aaf05584edc8c8c [file] [log] [blame] [edit]
// RUN: mlir-opt %s --test-loop-unrolling="unroll-factor=3" -split-input-file -canonicalize | FileCheck %s
// RUN: mlir-opt %s --test-loop-unrolling="unroll-factor=1" -split-input-file -canonicalize | FileCheck %s --check-prefix UNROLL-BY-1
// RUN: mlir-opt %s --test-loop-unrolling="unroll-full=true" -split-input-file -canonicalize | FileCheck %s --check-prefix UNROLL-FULL
// CHECK-LABEL: scf_loop_unroll_single
func.func @scf_loop_unroll_single(%arg0 : f32, %arg1 : f32) -> f32 {
%from = arith.constant 0 : index
%to = arith.constant 10 : index
%step = arith.constant 1 : index
%sum = scf.for %iv = %from to %to step %step iter_args(%sum_iter = %arg0) -> (f32) {
%next = arith.addf %sum_iter, %arg1 : f32
scf.yield %next : f32
}
// CHECK: %[[SUM:.*]] = scf.for %{{.*}} = %{{.*}} to %{{.*}} step %{{.*}} iter_args(%[[V0:.*]] =
// CHECK-NEXT: %[[V1:.*]] = arith.addf %[[V0]]
// CHECK-NEXT: %[[V2:.*]] = arith.addf %[[V1]]
// CHECK-NEXT: %[[V3:.*]] = arith.addf %[[V2]]
// CHECK-NEXT: scf.yield %[[V3]]
// CHECK-NEXT: }
// CHECK-NEXT: %[[RES:.*]] = arith.addf %[[SUM]],
// CHECK-NEXT: return %[[RES]]
return %sum : f32
}
// CHECK-LABEL: scf_loop_unroll_double_symbolic_ub
// CHECK-SAME: (%{{.*}}: f32, %{{.*}}: f32, %[[N:.*]]: index)
func.func @scf_loop_unroll_double_symbolic_ub(%arg0 : f32, %arg1 : f32, %n : index) -> (f32,f32) {
%from = arith.constant 0 : index
%step = arith.constant 1 : index
%sum:2 = scf.for %iv = %from to %n step %step iter_args(%i0 = %arg0, %i1 = %arg1) -> (f32, f32) {
%sum0 = arith.addf %i0, %arg0 : f32
%sum1 = arith.addf %i1, %arg1 : f32
scf.yield %sum0, %sum1 : f32, f32
}
return %sum#0, %sum#1 : f32, f32
// CHECK-DAG: %[[C0:.*]] = arith.constant 0 : index
// CHECK-DAG: %[[C1:.*]] = arith.constant 1 : index
// CHECK-DAG: %[[C3:.*]] = arith.constant 3 : index
// CHECK-NEXT: %[[REM:.*]] = arith.remsi %[[N]], %[[C3]]
// CHECK-NEXT: %[[UB:.*]] = arith.subi %[[N]], %[[REM]]
// CHECK-NEXT: %[[SUM:.*]]:2 = scf.for {{.*}} = %[[C0]] to %[[UB]] step %[[C3]] iter_args
// CHECK: }
// CHECK-NEXT: %[[SUM1:.*]]:2 = scf.for {{.*}} = %[[UB]] to %[[N]] step %[[C1]] iter_args(%[[V1:.*]] = %[[SUM]]#0, %[[V2:.*]] = %[[SUM]]#1)
// CHECK: }
// CHECK-NEXT: return %[[SUM1]]#0, %[[SUM1]]#1
}
// UNROLL-BY-1-LABEL: scf_loop_unroll_factor_1_promote
func.func @scf_loop_unroll_factor_1_promote() -> () {
%step = arith.constant 1 : index
%lo = arith.constant 0 : index
%hi = arith.constant 1 : index
scf.for %i = %lo to %hi step %step {
%x = "test.foo"(%i) : (index) -> i32
}
return
// UNROLL-BY-1-NEXT: %[[C0:.*]] = arith.constant 0 : index
// UNROLL-BY-1-NEXT: %{{.*}} = "test.foo"(%[[C0]]) : (index) -> i32
}
// UNROLL-FULL-LABEL: func @scf_loop_unroll_full_single
// UNROLL-FULL-SAME: %[[ARG:.*]]: index)
func.func @scf_loop_unroll_full_single(%arg : index) -> index {
%0 = arith.constant 0 : index
%1 = arith.constant 1 : index
%2 = arith.constant 4 : index
%4 = scf.for %iv = %0 to %2 step %1 iter_args(%arg1 = %1) -> index {
%3 = arith.addi %arg1, %arg : index
scf.yield %3 : index
}
return %4 : index
// UNROLL-FULL: %[[C1:.*]] = arith.constant 1 : index
// UNROLL-FULL: %[[V0:.*]] = arith.addi %[[ARG]], %[[C1]] : index
// UNROLL-FULL: %[[V1:.*]] = arith.addi %[[V0]], %[[ARG]] : index
// UNROLL-FULL: %[[V2:.*]] = arith.addi %[[V1]], %[[ARG]] : index
// UNROLL-FULL: %[[V3:.*]] = arith.addi %[[V2]], %[[ARG]] : index
// UNROLL-FULL: return %[[V3]] : index
}
// UNROLL-FULL-LABEL: func @scf_loop_unroll_full_outter_loops
// UNROLL-FULL-SAME: %[[ARG:.*]]: vector<4x4xindex>)
func.func @scf_loop_unroll_full_outter_loops(%arg0: vector<4x4xindex>) -> index {
%0 = arith.constant 0 : index
%1 = arith.constant 1 : index
%2 = arith.constant 4 : index
%6 = scf.for %arg1 = %0 to %2 step %1 iter_args(%it0 = %0) -> index {
%5 = scf.for %arg2 = %0 to %2 step %1 iter_args(%it1 = %it0) -> index {
%3 = vector.extract %arg0[%arg1, %arg2] : index from vector<4x4xindex>
%4 = arith.addi %3, %it1 : index
scf.yield %3 : index
}
scf.yield %5 : index
}
return %6 : index
// UNROLL-FULL: %[[C0:.*]] = arith.constant 0 : index
// UNROLL-FULL: %[[C1:.*]] = arith.constant 1 : index
// UNROLL-FULL: %[[C4:.*]] = arith.constant 4 : index
// UNROLL-FULL: %[[SUM0:.*]] = scf.for %[[IV:.*]] = %[[C0]] to %[[C4]] step %[[C1]] iter_args(%{{.*}} = %[[C0]])
// UNROLL-FULL: %[[VAL:.*]] = vector.extract %[[ARG]][0, %[[IV]]] : index from vector<4x4xindex>
// UNROLL-FULL: scf.yield %[[VAL]] : index
// UNROLL-FULL: }
// UNROLL-FULL: %[[SUM1:.*]] = scf.for %[[IV:.*]] = %[[C0]] to %[[C4]] step %[[C1]] iter_args(%{{.*}} = %[[SUM0]])
// UNROLL-FULL: %[[VAL:.*]] = vector.extract %[[ARG]][1, %[[IV]]] : index from vector<4x4xindex>
// UNROLL-FULL: scf.yield %[[VAL]] : index
// UNROLL-FULL: }
// UNROLL-FULL: %[[SUM2:.*]] = scf.for %[[IV:.*]] = %[[C0]] to %[[C4]] step %[[C1]] iter_args(%{{.*}} = %[[SUM1]])
// UNROLL-FULL: %[[VAL:.*]] = vector.extract %[[ARG]][2, %[[IV]]] : index from vector<4x4xindex>
// UNROLL-FULL: scf.yield %[[VAL]] : index
// UNROLL-FULL: }
// UNROLL-FULL: %[[SUM3:.*]] = scf.for %[[IV:.*]] = %[[C0]] to %[[C4]] step %[[C1]] iter_args(%{{.*}} = %[[SUM2]])
// UNROLL-FULL: %[[VAL:.*]] = vector.extract %[[ARG]][3, %[[IV]]] : index from vector<4x4xindex>
// UNROLL-FULL: scf.yield %[[VAL]] : index
// UNROLL-FULL: }
// UNROLL-FULL: return %[[SUM3]] : index
}