| # RUN: %PYTHON %s | FileCheck %s |
| |
| from mlir.ir import * |
| from mlir.dialects import func |
| from mlir.dialects import arith |
| from mlir.dialects import memref |
| from mlir.dialects import affine |
| import mlir.extras.types as T |
| |
| |
| def constructAndPrintInModule(f): |
| print("\nTEST:", f.__name__) |
| with Context(), Location.unknown(): |
| module = Module.create() |
| with InsertionPoint(module.body): |
| f() |
| print(module) |
| return f |
| |
| |
| # CHECK-LABEL: TEST: testAffineStoreOp |
| @constructAndPrintInModule |
| def testAffineStoreOp(): |
| f32 = F32Type.get() |
| index_type = IndexType.get() |
| memref_type_out = MemRefType.get([12, 12], f32) |
| |
| # CHECK: func.func @affine_store_test(%[[ARG0:.*]]: index) -> memref<12x12xf32> { |
| @func.FuncOp.from_py_func(index_type) |
| def affine_store_test(arg0): |
| # CHECK: %[[O_VAR:.*]] = memref.alloc() : memref<12x12xf32> |
| mem = memref.AllocOp(memref_type_out, [], []).result |
| |
| d0 = AffineDimExpr.get(0) |
| s0 = AffineSymbolExpr.get(0) |
| map = AffineMap.get(1, 1, [s0 * 3, d0 + s0 + 1]) |
| |
| # CHECK: %[[A1:.*]] = arith.constant 2.100000e+00 : f32 |
| a1 = arith.ConstantOp(f32, 2.1) |
| |
| # CHECK: affine.store %[[A1]], %alloc[symbol(%[[ARG0]]) * 3, %[[ARG0]] + symbol(%[[ARG0]]) + 1] : memref<12x12xf32> |
| affine.AffineStoreOp(a1, mem, indices=[arg0, arg0], map=map) |
| |
| return mem |
| |
| |
| # CHECK-LABEL: TEST: testAffineDelinearizeInfer |
| @constructAndPrintInModule |
| def testAffineDelinearizeInfer(): |
| # CHECK: %[[C0:.*]] = arith.constant 0 : index |
| c0 = arith.ConstantOp(T.index(), 0) |
| # CHECK: %[[C1:.*]] = arith.constant 1 : index |
| c1 = arith.ConstantOp(T.index(), 1) |
| # CHECK: %{{.*}}:2 = affine.delinearize_index %[[C1:.*]] into (%[[C1:.*]], %[[C0:.*]]) : index, index |
| two_indices = affine.AffineDelinearizeIndexOp(c1, [c1, c0]) |
| |
| |
| # CHECK-LABEL: TEST: testAffineLoadOp |
| @constructAndPrintInModule |
| def testAffineLoadOp(): |
| f32 = F32Type.get() |
| index_type = IndexType.get() |
| memref_type_in = MemRefType.get([10, 10], f32) |
| |
| # CHECK: func.func @affine_load_test(%[[I_VAR:.*]]: memref<10x10xf32>, %[[ARG0:.*]]: index) -> f32 { |
| @func.FuncOp.from_py_func(memref_type_in, index_type) |
| def affine_load_test(I, arg0): |
| d0 = AffineDimExpr.get(0) |
| s0 = AffineSymbolExpr.get(0) |
| map = AffineMap.get(1, 1, [s0 * 3, d0 + s0 + 1]) |
| |
| # CHECK: {{.*}} = affine.load %[[I_VAR]][symbol(%[[ARG0]]) * 3, %[[ARG0]] + symbol(%[[ARG0]]) + 1] : memref<10x10xf32> |
| a1 = affine.AffineLoadOp(f32, I, indices=[arg0, arg0], map=map) |
| |
| return a1 |
| |
| |
| # CHECK-LABEL: TEST: testAffineForOp |
| @constructAndPrintInModule |
| def testAffineForOp(): |
| f32 = F32Type.get() |
| index_type = IndexType.get() |
| memref_type = MemRefType.get([1024], f32) |
| |
| # CHECK: #[[MAP0:.*]] = affine_map<(d0)[s0] -> (0, d0 + s0)> |
| # CHECK: #[[MAP1:.*]] = affine_map<(d0, d1) -> (d0 - 2, d1 * 32)> |
| # CHECK: func.func @affine_for_op_test(%[[BUFFER:.*]]: memref<1024xf32>) { |
| @func.FuncOp.from_py_func(memref_type) |
| def affine_for_op_test(buffer): |
| # CHECK: %[[C1:.*]] = arith.constant 1 : index |
| c1 = arith.ConstantOp(index_type, 1) |
| # CHECK: %[[C2:.*]] = arith.constant 2 : index |
| c2 = arith.ConstantOp(index_type, 2) |
| # CHECK: %[[C3:.*]] = arith.constant 3 : index |
| c3 = arith.ConstantOp(index_type, 3) |
| # CHECK: %[[C9:.*]] = arith.constant 9 : index |
| c9 = arith.ConstantOp(index_type, 9) |
| # CHECK: %[[AC0:.*]] = arith.constant 0.000000e+00 : f32 |
| ac0 = AffineConstantExpr.get(0) |
| |
| d0 = AffineDimExpr.get(0) |
| d1 = AffineDimExpr.get(1) |
| s0 = AffineSymbolExpr.get(0) |
| lb = AffineMap.get(1, 1, [ac0, d0 + s0]) |
| ub = AffineMap.get(2, 0, [d0 - 2, 32 * d1]) |
| sum_0 = arith.ConstantOp(f32, 0.0) |
| |
| # CHECK: %0 = affine.for %[[INDVAR:.*]] = max #[[MAP0]](%[[C2]])[%[[C3]]] to min #[[MAP1]](%[[C9]], %[[C1]]) step 2 iter_args(%[[SUM0:.*]] = %[[AC0]]) -> (f32) { |
| sum = affine.AffineForOp( |
| lb, |
| ub, |
| 2, |
| iter_args=[sum_0], |
| lower_bound_operands=[c2, c3], |
| upper_bound_operands=[c9, c1], |
| ) |
| |
| with InsertionPoint(sum.body): |
| # CHECK: %[[TMP:.*]] = memref.load %[[BUFFER]][%[[INDVAR]]] : memref<1024xf32> |
| tmp = memref.LoadOp(buffer, [sum.induction_variable]) |
| sum_next = arith.AddFOp(sum.inner_iter_args[0], tmp) |
| affine.AffineYieldOp([sum_next]) |
| |
| |
| # CHECK-LABEL: TEST: testAffineForOpErrors |
| @constructAndPrintInModule |
| def testAffineForOpErrors(): |
| c1 = arith.ConstantOp(T.index(), 1) |
| c2 = arith.ConstantOp(T.index(), 2) |
| c3 = arith.ConstantOp(T.index(), 3) |
| d0 = AffineDimExpr.get(0) |
| |
| try: |
| affine.AffineForOp( |
| c1, |
| c2, |
| 1, |
| lower_bound_operands=[c3], |
| upper_bound_operands=[], |
| ) |
| except ValueError as e: |
| assert ( |
| e.args[0] |
| == "Either a concrete lower bound or an AffineMap in combination with lower bound operands, but not both, is supported." |
| ) |
| |
| try: |
| affine.AffineForOp( |
| AffineMap.get_constant(1), |
| c2, |
| 1, |
| lower_bound_operands=[c3, c3], |
| upper_bound_operands=[], |
| ) |
| except ValueError as e: |
| assert ( |
| e.args[0] |
| == "Wrong number of lower bound operands passed to AffineForOp; Expected 0, got 2." |
| ) |
| |
| try: |
| two_indices = affine.AffineDelinearizeIndexOp(c1, [c1, c1]) |
| affine.AffineForOp( |
| two_indices, |
| c2, |
| 1, |
| lower_bound_operands=[], |
| upper_bound_operands=[], |
| ) |
| except ValueError as e: |
| assert e.args[0] == "Only a single concrete value is supported for lower bound." |
| |
| try: |
| affine.AffineForOp( |
| 1.0, |
| c2, |
| 1, |
| lower_bound_operands=[], |
| upper_bound_operands=[], |
| ) |
| except ValueError as e: |
| assert e.args[0] == "lower bound must be int | ResultValueT | AffineMap." |
| |
| |
| @constructAndPrintInModule |
| def testForSugar(): |
| memref_t = T.memref(10, T.index()) |
| range = affine.for_ |
| |
| # CHECK: #[[$ATTR_2:.+]] = affine_map<(d0) -> (d0)> |
| |
| # CHECK-LABEL: func.func @range_loop_1( |
| # CHECK-SAME: %[[VAL_0:.*]]: index, %[[VAL_1:.*]]: index, %[[VAL_2:.*]]: memref<10xindex>) { |
| # CHECK: affine.for %[[VAL_3:.*]] = #[[$ATTR_2]](%[[VAL_0]]) to #[[$ATTR_2]](%[[VAL_1]]) { |
| # CHECK: %[[VAL_4:.*]] = arith.addi %[[VAL_3]], %[[VAL_3]] : index |
| # CHECK: memref.store %[[VAL_4]], %[[VAL_2]]{{\[}}%[[VAL_3]]] : memref<10xindex> |
| # CHECK: } |
| # CHECK: return |
| # CHECK: } |
| @func.FuncOp.from_py_func(T.index(), T.index(), memref_t) |
| def range_loop_1(lb, ub, memref_v): |
| for i in range(lb, ub, step=1): |
| add = arith.addi(i, i) |
| memref.store(add, memref_v, [i]) |
| |
| affine.yield_([]) |
| |
| # CHECK-LABEL: func.func @range_loop_2( |
| # CHECK-SAME: %[[VAL_0:.*]]: index, %[[VAL_1:.*]]: index, %[[VAL_2:.*]]: memref<10xindex>) { |
| # CHECK: affine.for %[[VAL_3:.*]] = #[[$ATTR_2]](%[[VAL_0]]) to 10 { |
| # CHECK: %[[VAL_4:.*]] = arith.addi %[[VAL_3]], %[[VAL_3]] : index |
| # CHECK: memref.store %[[VAL_4]], %[[VAL_2]]{{\[}}%[[VAL_3]]] : memref<10xindex> |
| # CHECK: } |
| # CHECK: return |
| # CHECK: } |
| @func.FuncOp.from_py_func(T.index(), T.index(), memref_t) |
| def range_loop_2(lb, ub, memref_v): |
| for i in range(lb, 10, step=1): |
| add = arith.addi(i, i) |
| memref.store(add, memref_v, [i]) |
| affine.yield_([]) |
| |
| # CHECK-LABEL: func.func @range_loop_3( |
| # CHECK-SAME: %[[VAL_0:.*]]: index, %[[VAL_1:.*]]: index, %[[VAL_2:.*]]: memref<10xindex>) { |
| # CHECK: affine.for %[[VAL_3:.*]] = 0 to #[[$ATTR_2]](%[[VAL_1]]) { |
| # CHECK: %[[VAL_4:.*]] = arith.addi %[[VAL_3]], %[[VAL_3]] : index |
| # CHECK: memref.store %[[VAL_4]], %[[VAL_2]]{{\[}}%[[VAL_3]]] : memref<10xindex> |
| # CHECK: } |
| # CHECK: return |
| # CHECK: } |
| @func.FuncOp.from_py_func(T.index(), T.index(), memref_t) |
| def range_loop_3(lb, ub, memref_v): |
| for i in range(0, ub, step=1): |
| add = arith.addi(i, i) |
| memref.store(add, memref_v, [i]) |
| affine.yield_([]) |
| |
| # CHECK-LABEL: func.func @range_loop_4( |
| # CHECK-SAME: %[[VAL_0:.*]]: index, %[[VAL_1:.*]]: index, %[[VAL_2:.*]]: memref<10xindex>) { |
| # CHECK: affine.for %[[VAL_3:.*]] = 0 to 10 { |
| # CHECK: %[[VAL_4:.*]] = arith.addi %[[VAL_3]], %[[VAL_3]] : index |
| # CHECK: memref.store %[[VAL_4]], %[[VAL_2]]{{\[}}%[[VAL_3]]] : memref<10xindex> |
| # CHECK: } |
| # CHECK: return |
| # CHECK: } |
| @func.FuncOp.from_py_func(T.index(), T.index(), memref_t) |
| def range_loop_4(lb, ub, memref_v): |
| for i in range(0, 10, step=1): |
| add = arith.addi(i, i) |
| memref.store(add, memref_v, [i]) |
| affine.yield_([]) |
| |
| # CHECK-LABEL: func.func @range_loop_8( |
| # CHECK-SAME: %[[VAL_0:.*]]: index, %[[VAL_1:.*]]: index, %[[VAL_2:.*]]: memref<10xindex>) { |
| # CHECK: %[[VAL_3:.*]] = affine.for %[[VAL_4:.*]] = 0 to 10 iter_args(%[[VAL_5:.*]] = %[[VAL_2]]) -> (memref<10xindex>) { |
| # CHECK: %[[VAL_6:.*]] = arith.addi %[[VAL_4]], %[[VAL_4]] : index |
| # CHECK: memref.store %[[VAL_6]], %[[VAL_5]]{{\[}}%[[VAL_4]]] : memref<10xindex> |
| # CHECK: affine.yield %[[VAL_5]] : memref<10xindex> |
| # CHECK: } |
| # CHECK: return |
| # CHECK: } |
| @func.FuncOp.from_py_func(T.index(), T.index(), memref_t) |
| def range_loop_8(lb, ub, memref_v): |
| for i, it in range(0, 10, iter_args=[memref_v]): |
| add = arith.addi(i, i) |
| memref.store(add, it, [i]) |
| affine.yield_([it]) |