transformations: convert type_offsets in ptr to arith.constant #3394

Open · wants to merge 2 commits into main
79 changes: 79 additions & 0 deletions tests/filecheck/mlir-conversion/with-mlir/ptr_loop_folding.mlir
@@ -0,0 +1,79 @@
// RUN: xdsl-opt -p convert-memref-to-ptr,convert-ptr-type-offsets,mlir-opt[scf-for-loop-canonicalization,scf-for-loop-range-folding,scf-for-loop-canonicalization],scf-for-loop-flatten,mlir-opt[scf-for-loop-canonicalization,scf-for-loop-range-folding,scf-for-loop-canonicalization] --split-input-file %s | filecheck %s
Member:

How much are we missing in xDSL from the mlir-opt pipeline here? If it's not a lot, I'd much rather have this logic in xDSL.

Collaborator (Author):

I believe both scf-for-loop-canonicalization and scf-for-loop-range-folding are missing. Do you think it's worth porting them?

Member:

Yep, definitely. I'd love to keep the Snitch compilation flow working entirely without MLIR, both for environments like WASM and for when we start the work on schedule exploration; whatever hackery we need to make it fast will be much easier to play with in a single environment.

Member:

scf-for-loop-range-folding is already in, and it was less buggy than the MLIR one until recently, when I upstreamed a bug fix to MLIR after noticing the difference with xDSL :)

Collaborator (Author):

How about we benchmark it first? I'm curious to see whether it actually makes an improvement; if there's no speedup, the port may not be worth it.

Collaborator (Author):

Oh, right, there is. But I think it's only for the riscv loops. Do we want a general scf version?

Member:

I can guarantee speed improvements, and register-pressure improvements in the final assembly, if that's what you mean.

Member:

Yep, I think it would be worth having an scf version of this.

Collaborator (Author):

OK, I'll port them to xDSL.

Member:

Do we now have everything we need?


func.func @fill(%m: memref<10xi32>) {
  %c0 = arith.constant 0 : index
  %end = arith.constant 10 : index
  %c1 = arith.constant 1 : index
  %val = arith.constant 100 : i32
  scf.for %i = %c0 to %end step %c1 {
    memref.store %val, %m[%i] : memref<10xi32>
  }
  return
}

// CHECK: func.func @fill(%arg4 : memref<10xi32>) {
// CHECK-NEXT: %0 = arith.constant 0 : index
// CHECK-NEXT: %1 = arith.constant 100 : i32
// CHECK-NEXT: %2 = arith.constant 40 : index
// CHECK-NEXT: %3 = arith.constant 4 : index
// CHECK-NEXT: scf.for %arg5 = %0 to %2 step %3 {
// CHECK-NEXT: %4 = ptr_xdsl.to_ptr %arg4 : memref<10xi32> -> !ptr_xdsl.ptr
// CHECK-NEXT: %5 = ptr_xdsl.ptradd %4, %arg5 : (!ptr_xdsl.ptr, index) -> !ptr_xdsl.ptr
// CHECK-NEXT: ptr_xdsl.store %1, %5 : i32, !ptr_xdsl.ptr
// CHECK-NEXT: }
// CHECK-NEXT: func.return
// CHECK-NEXT: }

func.func @fill2d(%m: memref<10x10xi32>) {
  %c0 = arith.constant 0 : index
  %end = arith.constant 10 : index
  %c1 = arith.constant 1 : index
  %val = arith.constant 100 : i32
  scf.for %i = %c0 to %end step %c1 {
    scf.for %j = %c0 to %end step %c1 {
      memref.store %val, %m[%i, %j] : memref<10x10xi32>
    }
  }
  return
}

// CHECK-NEXT: func.func @fill2d(%arg2 : memref<10x10xi32>) {
// CHECK-NEXT: %0 = arith.constant 0 : index
// CHECK-NEXT: %1 = arith.constant 100 : i32
// CHECK-NEXT: %2 = arith.constant 400 : index
// CHECK-NEXT: %3 = arith.constant 4 : index
// CHECK-NEXT: scf.for %arg3 = %0 to %2 step %3 {
// CHECK-NEXT: %4 = ptr_xdsl.to_ptr %arg2 : memref<10x10xi32> -> !ptr_xdsl.ptr
// CHECK-NEXT: %5 = ptr_xdsl.ptradd %4, %arg3 : (!ptr_xdsl.ptr, index) -> !ptr_xdsl.ptr
// CHECK-NEXT: ptr_xdsl.store %1, %5 : i32, !ptr_xdsl.ptr
// CHECK-NEXT: }
// CHECK-NEXT: func.return
// CHECK-NEXT: }

func.func @fill3d(%m: memref<10x10x10xi32>) {
  %c0 = arith.constant 0 : index
  %end = arith.constant 10 : index
  %c1 = arith.constant 1 : index
  %val = arith.constant 100 : i32
  scf.for %i = %c0 to %end step %c1 {
    scf.for %j = %c0 to %end step %c1 {
      scf.for %k = %c0 to %end step %c1 {
        memref.store %val, %m[%i, %j, %k] : memref<10x10x10xi32>
      }
    }
  }
  return
}

// CHECK-NEXT: func.func @fill3d(%arg0 : memref<10x10x10xi32>) {
// CHECK-NEXT: %0 = arith.constant 0 : index
// CHECK-NEXT: %1 = arith.constant 100 : i32
// CHECK-NEXT: %2 = arith.constant 4000 : index
// CHECK-NEXT: %3 = arith.constant 4 : index
// CHECK-NEXT: scf.for %arg1 = %0 to %2 step %3 {
// CHECK-NEXT: %4 = ptr_xdsl.to_ptr %arg0 : memref<10x10x10xi32> -> !ptr_xdsl.ptr
// CHECK-NEXT: %5 = ptr_xdsl.ptradd %4, %arg1 : (!ptr_xdsl.ptr, index) -> !ptr_xdsl.ptr
// CHECK-NEXT: ptr_xdsl.store %1, %5 : i32, !ptr_xdsl.ptr
// CHECK-NEXT: }
// CHECK-NEXT: func.return
// CHECK-NEXT: }
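
The flattened bounds in the CHECK lines above follow from collapsing each loop nest into a single loop over byte offsets. The small sketch below (plain Python, not part of the PR) reproduces the expected constants:

# Reproduce the flattened loop bounds seen in the CHECK lines: each nest
# collapses to one loop over byte offsets, stepping by sizeof(i32) = 4.
elem_bytes = 4  # byte size of i32, as produced by convert-ptr-type-offsets
for shape in [(10,), (10, 10), (10, 10, 10)]:
    trip_count = 1
    for dim in shape:
        trip_count *= dim
    upper = trip_count * elem_bytes  # 40, 400, 4000 respectively
    print(f"memref<{'x'.join(map(str, shape))}xi32>: scf.for 0 to {upper} step {elem_bytes}")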
12 changes: 12 additions & 0 deletions tests/filecheck/transforms/convert_ptr_type_offsets.mlir
@@ -0,0 +1,12 @@
// RUN: xdsl-opt -p convert-ptr-type-offsets --split-input-file --verify-diagnostics %s | filecheck %s

%a1 = ptr_xdsl.type_offset i32 : index
// CHECK: %a1 = arith.constant 4 : index

%a2 = ptr_xdsl.type_offset f128 : index
// CHECK-NEXT: %a2 = arith.constant 16 : index

// -----

%a3 = ptr_xdsl.type_offset tensor<4xi32> : index
// CHECK: Type offset is currently only supported for fixed size types
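
The expected constants follow directly from the element bitwidths, while tensor<4xi32> is rejected because it is not a FixedBitwidthType. A hypothetical sketch of the byte-size rule (assuming xdsl's FixedBitwidthType reports its size as the bitwidth rounded up to whole bytes):

# Assumed rule: byte size = ceil(bitwidth / 8); matches the CHECK lines above.
def byte_size(bitwidth: int) -> int:
    return -(-bitwidth // 8)  # ceiling division

assert byte_size(32) == 4    # i32  -> arith.constant 4 : index
assert byte_size(128) == 16  # f128 -> arith.constant 16 : index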
6 changes: 6 additions & 0 deletions xdsl/transforms/__init__.py
@@ -333,6 +333,11 @@ def get_convert_print_format_to_riscv_debug():

    return convert_print_format_to_riscv_debug.ConvertPrintFormatToRiscvDebugPass

def get_convert_ptr_type_offsets():
    from xdsl.transforms import convert_ptr_type_offsets

    return convert_ptr_type_offsets.ConvertPtrTypeOffsetsPass

def get_convert_qref_to_qssa():
    from xdsl.transforms import convert_qref_to_qssa

@@ -468,6 +473,7 @@ def get_varith_fuse_repeated_operands():
"convert-scf-to-openmp": get_convert_scf_to_openmp,
"convert-scf-to-riscv-scf": get_convert_scf_to_riscv_scf,
"convert-snitch-stream-to-snitch": get_convert_snitch_stream_to_snitch,
"convert-ptr-type-offsets": get_convert_ptr_type_offsets,
"convert-stencil-to-csl-stencil": get_convert_stencil_to_csl_stencil,
"inline-snrt": get_convert_snrt_to_riscv,
"convert-stencil-to-ll-mlir": get_convert_stencil_to_ll_mlir,
38 changes: 38 additions & 0 deletions xdsl/transforms/convert_ptr_type_offsets.py
@@ -0,0 +1,38 @@
from dataclasses import dataclass

from xdsl.context import MLContext
from xdsl.dialects import arith, ptr
from xdsl.dialects.builtin import FixedBitwidthType, IndexType, ModuleOp
from xdsl.passes import ModulePass
from xdsl.pattern_rewriter import (
    GreedyRewritePatternApplier,
    PatternRewriter,
    PatternRewriteWalker,
    RewritePattern,
    op_type_rewrite_pattern,
)
from xdsl.utils.exceptions import DiagnosticException


@dataclass
class ConvertTypeOffsetOp(RewritePattern):
    @op_type_rewrite_pattern
    def match_and_rewrite(self, op: ptr.TypeOffsetOp, rewriter: PatternRewriter, /):
        # Only types with a known, fixed bitwidth have a static byte size.
        if not isinstance(op.elem_type, FixedBitwidthType):
            raise DiagnosticException(
                "Type offset is currently only supported for fixed size types"
            )
        # Materialize the offset as its concrete byte size, e.g.
        # `ptr_xdsl.type_offset i32` becomes `arith.constant 4 : index`.
        rewriter.replace_matched_op(
            arith.Constant.from_int_and_width(op.elem_type.size, IndexType())
        )


class ConvertPtrTypeOffsetsPass(ModulePass):
    name = "convert-ptr-type-offsets"

    def apply(self, ctx: MLContext, op: ModuleOp) -> None:
        PatternRewriteWalker(
            GreedyRewritePatternApplier([ConvertTypeOffsetOp()]),
        ).rewrite_module(op)
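
A minimal sketch of driving the new pass from Python rather than via xdsl-opt. The pass API is as defined in this PR; the Parser and dialect-loading details are assumptions and may differ between xdsl versions:

# Parse a one-op module, run the pass, and print the folded result.
from xdsl.context import MLContext
from xdsl.dialects import arith, ptr
from xdsl.dialects.builtin import Builtin
from xdsl.parser import Parser
from xdsl.transforms.convert_ptr_type_offsets import ConvertPtrTypeOffsetsPass

ctx = MLContext()
ctx.load_dialect(Builtin)
ctx.load_dialect(arith.Arith)
ctx.load_dialect(ptr.Ptr)

module = Parser(ctx, "%o = ptr_xdsl.type_offset i32 : index").parse_module()
ConvertPtrTypeOffsetsPass().apply(ctx, module)
print(module)  # the type_offset is now: %o = arith.constant 4 : index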