[mlir][affine] If the operands of a Pure operation are valid dimensional identifiers, then its results are valid dimensional identifiers. #123542
Conversation
@llvm/pr-subscribers-mlir @llvm/pr-subscribers-mlir-affine
Author: lonely eagle (linuxlonelyeagle)
Changes: as title.
Full diff: https://github.com/llvm/llvm-project/pull/123542.diff
5 Files Affected:
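In effect, IR like the following becomes valid (adapted from the test this PR adds to ops.mlir; the function name here is illustrative): the result of the Pure arith.addi, whose only operand is the induction variable %x, is accepted as a dimension id for the affine.parallel bound.

func.func @pure_result_as_dim() {
  affine.for %x = 0 to 7 {
    // arith.addi is Pure and %x is a valid dim (an affine.for induction
    // variable), so %y is now accepted as a dimension identifier.
    %y = arith.addi %x, %x : index
    affine.parallel (%i, %j) = (0, 0) to (%y, 100) step (10, 10) {
    }
  }
  return
}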
diff --git a/mlir/docs/Dialects/Affine.md b/mlir/docs/Dialects/Affine.md
index 0b6d7747e8a6f9..94f23af699ca46 100644
--- a/mlir/docs/Dialects/Affine.md
+++ b/mlir/docs/Dialects/Affine.md
@@ -83,9 +83,8 @@ location of the SSA use. Dimensions may be bound not only to anything that a
symbol is bound to, but also to induction variables of enclosing
[`affine.for`](#affinefor-mliraffineforop) and
[`affine.parallel`](#affineparallel-mliraffineparallelop) operations, and the result
-of an [`affine.apply` operation](#affineapply-mliraffineapplyop) (which recursively
-may use other dimensions and symbols).
-
+of a `Pure` operation whose operands are valid dimensional identifiers
+(which recursively may use other dimensions and symbols).
### Affine Expressions
Syntax:
diff --git a/mlir/lib/Dialect/Affine/IR/AffineOps.cpp b/mlir/lib/Dialect/Affine/IR/AffineOps.cpp
index 147f5dd7a24b62..053f8e0bb4f2c8 100644
--- a/mlir/lib/Dialect/Affine/IR/AffineOps.cpp
+++ b/mlir/lib/Dialect/Affine/IR/AffineOps.cpp
@@ -274,7 +274,8 @@ Region *mlir::affine::getAffineScope(Operation *op) {
// conditions:
// *) It is valid as a symbol.
// *) It is an induction variable.
-// *) It is the result of affine apply operation with dimension id arguments.
+// *) It is the result of a `Pure` operation whose operands are valid
+// dimensional identifiers.
bool mlir::affine::isValidDim(Value value) {
// The value must be an index type.
if (!value.getType().isIndex())
@@ -304,8 +305,8 @@ bool mlir::affine::isValidDim(Value value, Region *region) {
if (isValidSymbol(value, region))
return true;
- auto *op = value.getDefiningOp();
- if (!op) {
+ auto *defOp = value.getDefiningOp();
+ if (!defOp) {
// This value has to be a block argument for an affine.for or an
// affine.parallel.
auto *parentOp = llvm::cast<BlockArgument>(value).getOwner()->getParentOp();
@@ -313,11 +314,15 @@ bool mlir::affine::isValidDim(Value value, Region *region) {
}
// Affine apply operation is ok if all of its operands are ok.
- if (auto applyOp = dyn_cast<AffineApplyOp>(op))
- return applyOp.isValidDim(region);
+ if (isPure(defOp) && llvm::all_of(defOp->getOperands(), [&](Value operand) {
+ return affine::isValidDim(operand, region);
+ })) {
+ return true;
+ }
+
// The dim op is okay if its operand memref/tensor is defined at the top
// level.
- if (auto dimOp = dyn_cast<ShapedDimOpInterface>(op))
+ if (auto dimOp = dyn_cast<ShapedDimOpInterface>(defOp))
return isTopLevelValue(dimOp.getShapedValue());
return false;
}
diff --git a/mlir/test/Dialect/Affine/invalid.mlir b/mlir/test/Dialect/Affine/invalid.mlir
index 44e484b9ba5982..b3b2ec5552482a 100644
--- a/mlir/test/Dialect/Affine/invalid.mlir
+++ b/mlir/test/Dialect/Affine/invalid.mlir
@@ -225,18 +225,6 @@ func.func @affine_parallel(%arg0 : index, %arg1 : index, %arg2 : index) {
// -----
-func.func @affine_parallel(%arg0 : index, %arg1 : index, %arg2 : index) {
- affine.for %x = 0 to 7 {
- %y = arith.addi %x, %x : index
- // expected-error@+1 {{operand cannot be used as a dimension id}}
- affine.parallel (%i, %j) = (0, 0) to (%y, 100) step (10, 10) {
- }
- }
- return
-}
-
-// -----
-
func.func @affine_parallel(%arg0 : index, %arg1 : index, %arg2 : index) {
affine.for %x = 0 to 7 {
%y = arith.addi %x, %x : index
diff --git a/mlir/test/Dialect/Affine/load-store-invalid.mlir b/mlir/test/Dialect/Affine/load-store-invalid.mlir
index 01d6b25dee695b..d8eac141cc52ae 100644
--- a/mlir/test/Dialect/Affine/load-store-invalid.mlir
+++ b/mlir/test/Dialect/Affine/load-store-invalid.mlir
@@ -33,31 +33,6 @@ func.func @store_too_few_subscripts_map(%arg0: memref<?x?xf32>, %arg1: index, %v
// -----
-func.func @load_non_affine_index(%arg0 : index) {
- %0 = memref.alloc() : memref<10xf32>
- affine.for %i0 = 0 to 10 {
- %1 = arith.muli %i0, %arg0 : index
- // expected-error@+1 {{op index must be a valid dimension or symbol identifier}}
- %v = affine.load %0[%1] : memref<10xf32>
- }
- return
-}
-
-// -----
-
-func.func @store_non_affine_index(%arg0 : index) {
- %0 = memref.alloc() : memref<10xf32>
- %1 = arith.constant 11.0 : f32
- affine.for %i0 = 0 to 10 {
- %2 = arith.muli %i0, %arg0 : index
- // expected-error@+1 {{op index must be a valid dimension or symbol identifier}}
- affine.store %1, %0[%2] : memref<10xf32>
- }
- return
-}
-
-// -----
-
func.func @invalid_prefetch_rw(%i : index) {
%0 = memref.alloc() : memref<10xf32>
// expected-error@+1 {{rw specifier has to be 'read' or 'write'}}
@@ -73,70 +48,3 @@ func.func @invalid_prefetch_cache_type(%i : index) {
affine.prefetch %0[%i], read, locality<0>, false : memref<10xf32>
return
}
-
-// -----
-
-func.func @dma_start_non_affine_src_index(%arg0 : index) {
- %0 = memref.alloc() : memref<100xf32>
- %1 = memref.alloc() : memref<100xf32, 2>
- %2 = memref.alloc() : memref<1xi32, 4>
- %c0 = arith.constant 0 : index
- %c64 = arith.constant 64 : index
- affine.for %i0 = 0 to 10 {
- %3 = arith.muli %i0, %arg0 : index
- // expected-error@+1 {{op src index must be a valid dimension or symbol identifier}}
- affine.dma_start %0[%3], %1[%i0], %2[%c0], %c64
- : memref<100xf32>, memref<100xf32, 2>, memref<1xi32, 4>
- }
- return
-}
-
-// -----
-
-func.func @dma_start_non_affine_dst_index(%arg0 : index) {
- %0 = memref.alloc() : memref<100xf32>
- %1 = memref.alloc() : memref<100xf32, 2>
- %2 = memref.alloc() : memref<1xi32, 4>
- %c0 = arith.constant 0 : index
- %c64 = arith.constant 64 : index
- affine.for %i0 = 0 to 10 {
- %3 = arith.muli %i0, %arg0 : index
- // expected-error@+1 {{op dst index must be a valid dimension or symbol identifier}}
- affine.dma_start %0[%i0], %1[%3], %2[%c0], %c64
- : memref<100xf32>, memref<100xf32, 2>, memref<1xi32, 4>
- }
- return
-}
-
-// -----
-
-func.func @dma_start_non_affine_tag_index(%arg0 : index) {
- %0 = memref.alloc() : memref<100xf32>
- %1 = memref.alloc() : memref<100xf32, 2>
- %2 = memref.alloc() : memref<1xi32, 4>
- %c0 = arith.constant 0 : index
- %c64 = arith.constant 64 : index
- affine.for %i0 = 0 to 10 {
- %3 = arith.muli %i0, %arg0 : index
- // expected-error@+1 {{op tag index must be a valid dimension or symbol identifier}}
- affine.dma_start %0[%i0], %1[%arg0], %2[%3], %c64
- : memref<100xf32>, memref<100xf32, 2>, memref<1xi32, 4>
- }
- return
-}
-
-// -----
-
-func.func @dma_wait_non_affine_tag_index(%arg0 : index) {
- %0 = memref.alloc() : memref<100xf32>
- %1 = memref.alloc() : memref<100xf32, 2>
- %2 = memref.alloc() : memref<1xi32, 4>
- %c0 = arith.constant 0 : index
- %c64 = arith.constant 64 : index
- affine.for %i0 = 0 to 10 {
- %3 = arith.muli %i0, %arg0 : index
- // expected-error@+1 {{op index must be a valid dimension or symbol identifier}}
- affine.dma_wait %2[%3], %c64 : memref<1xi32, 4>
- }
- return
-}
diff --git a/mlir/test/Dialect/Affine/ops.mlir b/mlir/test/Dialect/Affine/ops.mlir
index e3721806989bb9..74ba098ce27487 100644
--- a/mlir/test/Dialect/Affine/ops.mlir
+++ b/mlir/test/Dialect/Affine/ops.mlir
@@ -409,3 +409,177 @@ func.func @arith_add_vaild_symbol_lower_bound(%arg : index) {
// CHECK: affine.for %[[VAL_3:.*]] = #[[$ATTR_0]](%[[VAL_2]]){{\[}}%[[VAL_0]]] to 7 {
// CHECK: }
// CHECK: }
+
+// -----
+
+// CHECK-LABEL: func @affine_parallel
+
+func.func @affine_parallel(%arg0 : index, %arg1 : index, %arg2 : index) {
+ affine.for %x = 0 to 7 {
+ %y = arith.addi %x, %x : index
+ affine.parallel (%i, %j) = (0, 0) to (%y, 100) step (10, 10) {
+ }
+ }
+ return
+}
+
+// CHECK-NEXT: affine.for
+// CHECK-SAME: %[[VAL_0:.*]] = 0 to 7 {
+// CHECK: %[[VAL_1:.*]] = arith.addi %[[VAL_0]], %[[VAL_0]] : index
+// CHECK: affine.parallel (%{{.*}}, %{{.*}}) = (0, 0) to (%[[VAL_1]], 100) step (10, 10) {
+// CHECK: }
+// CHECK: }
+
+// -----
+
+func.func @load_non_affine_index(%arg0 : index) {
+ %0 = memref.alloc() : memref<10xf32>
+ affine.for %i0 = 0 to 10 {
+ %1 = arith.muli %i0, %arg0 : index
+ %v = affine.load %0[%1] : memref<10xf32>
+ }
+ return
+}
+
+// CHECK-LABEL: func @load_non_affine_index
+// CHECK-SAME: %[[VAL_0:.*]]: index) {
+// CHECK: %[[VAL_1:.*]] = memref.alloc() : memref<10xf32>
+// CHECK: affine.for %[[VAL_2:.*]] = 0 to 10 {
+// CHECK: %[[VAL_3:.*]] = arith.muli %[[VAL_2]], %[[VAL_0]] : index
+// CHECK: %{{.*}} = affine.load %[[VAL_1]]{{\[}}%[[VAL_3]]] : memref<10xf32>
+// CHECK: }
+
+// -----
+
+func.func @store_non_affine_index(%arg0 : index) {
+ %0 = memref.alloc() : memref<10xf32>
+ %1 = arith.constant 11.0 : f32
+ affine.for %i0 = 0 to 10 {
+ %2 = arith.muli %i0, %arg0 : index
+ affine.store %1, %0[%2] : memref<10xf32>
+ }
+ return
+}
+
+// CHECK-LABEL: func @store_non_affine_index
+// CHECK-SAME: %[[VAL_0:.*]]: index) {
+// CHECK: %[[VAL_1:.*]] = memref.alloc() : memref<10xf32>
+// CHECK: %[[VAL_2:.*]] = arith.constant 1.100000e+01 : f32
+// CHECK: affine.for %[[VAL_3:.*]] = 0 to 10 {
+// CHECK: %[[VAL_4:.*]] = arith.muli %[[VAL_3]], %[[VAL_0]] : index
+// CHECK: affine.store %[[VAL_2]], %[[VAL_1]]{{\[}}%[[VAL_4]]] : memref<10xf32>
+// CHECK: }
+
+// -----
+
+func.func @dma_start_non_affine_src_index(%arg0 : index) {
+ %0 = memref.alloc() : memref<100xf32>
+ %1 = memref.alloc() : memref<100xf32, 2>
+ %2 = memref.alloc() : memref<1xi32, 4>
+ %c0 = arith.constant 0 : index
+ %c64 = arith.constant 64 : index
+ affine.for %i0 = 0 to 10 {
+ %3 = arith.muli %i0, %arg0 : index
+ affine.dma_start %0[%3], %1[%i0], %2[%c0], %c64
+ : memref<100xf32>, memref<100xf32, 2>, memref<1xi32, 4>
+ }
+ return
+}
+
+// CHECK-LABEL: func @dma_start_non_affine_src_index
+// CHECK-SAME: %[[VAL_0:.*]]: index) {
+// CHECK: %[[VAL_1:.*]] = memref.alloc() : memref<100xf32>
+// CHECK: %[[VAL_2:.*]] = memref.alloc() : memref<100xf32, 2>
+// CHECK: %[[VAL_3:.*]] = memref.alloc() : memref<1xi32, 4>
+// CHECK: %[[VAL_4:.*]] = arith.constant 0 : index
+// CHECK: %[[VAL_5:.*]] = arith.constant 64 : index
+// CHECK: affine.for %[[VAL_6:.*]] = 0 to 10 {
+// CHECK: %[[VAL_7:.*]] = arith.muli %[[VAL_6]], %[[VAL_0]] : index
+// CHECK: affine.dma_start %[[VAL_1]]{{\[}}%[[VAL_7]]], %[[VAL_2]]{{\[}}%[[VAL_6]]], %[[VAL_3]]{{\[}}%[[VAL_4]]], %[[VAL_5]]
+// CHECK-SAME: : memref<100xf32>, memref<100xf32, 2>, memref<1xi32, 4>
+// CHECK: }
+
+// -----
+
+func.func @dma_start_non_affine_dst_index(%arg0 : index) {
+ %0 = memref.alloc() : memref<100xf32>
+ %1 = memref.alloc() : memref<100xf32, 2>
+ %2 = memref.alloc() : memref<1xi32, 4>
+ %c0 = arith.constant 0 : index
+ %c64 = arith.constant 64 : index
+ affine.for %i0 = 0 to 10 {
+ %3 = arith.muli %i0, %arg0 : index
+ affine.dma_start %0[%i0], %1[%3], %2[%c0], %c64
+ : memref<100xf32>, memref<100xf32, 2>, memref<1xi32, 4>
+ }
+ return
+}
+
+// CHECK-LABEL: func @dma_start_non_affine_dst_index
+// CHECK-SAME: %[[VAL_0:.*]]: index) {
+// CHECK: %[[VAL_1:.*]] = memref.alloc() : memref<100xf32>
+// CHECK: %[[VAL_2:.*]] = memref.alloc() : memref<100xf32, 2>
+// CHECK: %[[VAL_3:.*]] = memref.alloc() : memref<1xi32, 4>
+// CHECK: %[[VAL_4:.*]] = arith.constant 0 : index
+// CHECK: %[[VAL_5:.*]] = arith.constant 64 : index
+// CHECK: affine.for %[[VAL_6:.*]] = 0 to 10 {
+// CHECK: %[[VAL_7:.*]] = arith.muli %[[VAL_6]], %[[VAL_0]] : index
+// CHECK: affine.dma_start %[[VAL_1]]{{\[}}%[[VAL_6]]], %[[VAL_2]]{{\[}}%[[VAL_7]]], %[[VAL_3]]{{\[}}%[[VAL_4]]], %[[VAL_5]]
+// CHECK-SAME: : memref<100xf32>, memref<100xf32, 2>, memref<1xi32, 4>
+// CHECK: }
+
+// -----
+
+func.func @dma_start_non_affine_tag_index(%arg0 : index) {
+ %0 = memref.alloc() : memref<100xf32>
+ %1 = memref.alloc() : memref<100xf32, 2>
+ %2 = memref.alloc() : memref<1xi32, 4>
+ %c0 = arith.constant 0 : index
+ %c64 = arith.constant 64 : index
+ affine.for %i0 = 0 to 10 {
+ %3 = arith.muli %i0, %arg0 : index
+ affine.dma_start %0[%i0], %1[%arg0], %2[%3], %c64
+ : memref<100xf32>, memref<100xf32, 2>, memref<1xi32, 4>
+ }
+ return
+}
+
+// CHECK-LABEL: func @dma_start_non_affine_tag_index
+// CHECK-SAME: %[[VAL_0:.*]]: index) {
+// CHECK: %[[VAL_1:.*]] = memref.alloc() : memref<100xf32>
+// CHECK: %[[VAL_2:.*]] = memref.alloc() : memref<100xf32, 2>
+// CHECK: %[[VAL_3:.*]] = memref.alloc() : memref<1xi32, 4>
+// CHECK: %{{.*}} = arith.constant 0 : index
+// CHECK: %[[VAL_4:.*]] = arith.constant 64 : index
+// CHECK: affine.for %[[VAL_5:.*]] = 0 to 10 {
+// CHECK: %[[VAL_6:.*]] = arith.muli %[[VAL_5]], %[[VAL_0]] : index
+// CHECK: affine.dma_start %[[VAL_1]]{{\[}}%[[VAL_5]]], %[[VAL_2]]{{\[}}%[[VAL_0]]], %[[VAL_3]]{{\[}}%[[VAL_6]]], %[[VAL_4]]
+// CHECK-SAME: : memref<100xf32>, memref<100xf32, 2>, memref<1xi32, 4>
+// CHECK: }
+
+// -----
+
+func.func @dma_wait_non_affine_tag_index(%arg0 : index) {
+ %0 = memref.alloc() : memref<100xf32>
+ %1 = memref.alloc() : memref<100xf32, 2>
+ %2 = memref.alloc() : memref<1xi32, 4>
+ %c0 = arith.constant 0 : index
+ %c64 = arith.constant 64 : index
+ affine.for %i0 = 0 to 10 {
+ %3 = arith.muli %i0, %arg0 : index
+ affine.dma_wait %2[%3], %c64 : memref<1xi32, 4>
+ }
+ return
+}
+
+// CHECK-LABEL: func @dma_wait_non_affine_tag_index
+// CHECK-SAME: %[[VAL_0:.*]]: index) {
+// CHECK: %{{.*}} = memref.alloc() : memref<100xf32>
+// CHECK: %{{.*}} = memref.alloc() : memref<100xf32, 2>
+// CHECK: %[[VAL_1:.*]] = memref.alloc() : memref<1xi32, 4>
+// CHECK: %{{.*}} = arith.constant 0 : index
+// CHECK: %[[VAL_2:.*]] = arith.constant 64 : index
+// CHECK: affine.for %[[VAL_3:.*]] = 0 to 10 {
+// CHECK: %[[VAL_4:.*]] = arith.muli %[[VAL_3]], %[[VAL_0]] : index
+// CHECK: affine.dma_wait %[[VAL_1]]{{\[}}%[[VAL_4]]], %[[VAL_2]] : memref<1xi32, 4>
+// CHECK: }
Ping @bondhugula, I think this PR needs your review.
Please don't remove valid tests.
Also, this change to the nature of the affine restrictions looks substantial enough that it deserves a forum post.
func.func @affine_parallel(%arg0 : index, %arg1 : index, %arg2 : index) {
  affine.for %x = 0 to 7 {
    %y = arith.addi %x, %x : index
    // expected-error@+1 {{operand cannot be used as a dimension id}}
    affine.parallel (%i, %j) = (0, 0) to (%y, 100) step (10, 10) {
    }
  }
  return
}

// -----
We shouldn't just remove these tests. They are still valid. They should be updated to still emit the message, e.g., by using another operation instead of addi that is not Pure.
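A minimal sketch of such an updated test, assuming memref.load as the substitute operation (it has a memory read effect, so it is not Pure); the function name and the 0-d memref here are illustrative, not from the PR:

func.func @affine_parallel_non_pure(%m : memref<index>) {
  affine.for %x = 0 to 7 {
    // memref.load reads memory, so it is not Pure; its result is still
    // rejected as a dimension id even after this PR.
    %y = memref.load %m[] : memref<index>
    // expected-error@+1 {{operand cannot be used as a dimension id}}
    affine.parallel (%i, %j) = (0, 0) to (%y, 100) step (10, 10) {
    }
  }
  return
}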
I didn't delete the tests; I moved them to the positive tests. You can look at Affine/ops.mlir.
arith.addi is Pure; you can see below and at https://mlir.llvm.org/docs/Dialects/ArithOps/#arithandi-arithandiop
def Pure : TraitList<[AlwaysSpeculatable, NoMemoryEffect]>;
// arith.addi
Traits: AlwaysSpeculatableImplTrait, Commutative, Elementwise, Idempotent, SameOperandsAndResultType, Scalarizable, Tensorizable, Vectorizable
Interfaces: ConditionallySpeculatable, InferIntRangeInterface, InferTypeOpInterface, NoMemoryEffect (MemoryEffectOpInterface), VectorUnrollOpInterface
Effects: MemoryEffects::Effect{}
This would make a loop like the following valid, right?

affine.for %i = 0 to 100 {
  %i2 = arith.muli %i, %i : index
  affine.load[%i2]
}

But in reality, this loop isn't affine anymore. My understanding is that the result of affine.apply with only dimensional identifiers is always a valid dimension for an affine loop, because the operation restricts what it can do. Allowing any Pure operation breaks this. You can see it happening in the tests that you removed: those loops aren't always affine, depending on the actual value of %arg0.
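For reference, a condensed copy of one of the removed negative tests being discussed (load_non_affine_index from load-store-invalid.mlir, which this PR turns into a positive test in ops.mlir):

func.func @load_non_affine_index(%arg0 : index) {
  %0 = memref.alloc() : memref<10xf32>
  affine.for %i0 = 0 to 10 {
    // Treating both operands as dimension ids makes the subscript
    // d0 * d1, which is not an affine expression.
    %1 = arith.muli %i0, %arg0 : index
    // expected-error@+1 {{op index must be a valid dimension or symbol identifier}}
    %v = affine.load %0[%1] : memref<10xf32>
  }
  return
}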
I do get your point; my understanding is that the IR you gave is actually generated from the following IR. I think this is correct.
I didn't look at the test very carefully, OK, but I think it is missing some checks.
Thanks for pointing that out.
No, the IR in that loop is:

#map = affine_map<(d0, d1) -> (d0 * d1)>
affine.for %i = 0 to 100 {
  %i2 = affine.apply #map (%i, %i)
  affine.load[%i2]
}

This will fail the affine map verifier, because the map is not affine: https://mlir.llvm.org/docs/Dialects/Affine/#affine-expressions (you cannot multiply dimensions). The error:

error: non-affine expression: at least one of the multiply operands has to be either a constant or symbolic
#map = affine_map<(d0, d1) -> (d0 * d1)>
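For contrast, a minimal sketch of a multiplication the verifier does accept: one multiply operand must be a constant or a symbol, so binding %arg0 as a symbol makes the equivalent map legal (function and value names here are illustrative):

#map = affine_map<(d0)[s0] -> (d0 * s0)>
func.func @mul_by_symbol(%arg0 : index, %mem : memref<100xf32>) {
  affine.for %i = 0 to 100 {
    // d0 * s0 is affine because s0 is symbolic; d0 * d1 is not.
    %i2 = affine.apply #map (%i)[%arg0]
    %v = affine.load %mem[%i2] : memref<100xf32>
  }
  return
}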
Thanks, I think I've learned something new. Maybe I should read more about affine optimization to understand why it is defined that way; I'm very interested in this area. I'll close it.
I think it would be worth making a post on Discourse about what you were trying to do with this optimization. You might get good alternatives that solve your problem.
The feature I want to support is already handled by the PR linked in the description, but that change is similar to this one, so I thought it should be synchronized here as well.
It's been a wonderful journey, from that PR to this one, and I think I've learned a lot.
As title. See the comment at #118478 (comment).