[eudsl-python-extras] better handle callable generics: mangle by __name__, deep-copy generics

makslevental · makslevental · commit a32cf7296652 · 2025-11-19T16:08:47.000-08:00
diff --git a/projects/eudsl-python-extras/mlir/extras/dialects/func.py b/projects/eudsl-python-extras/mlir/extras/dialects/func.py
@@ -179,7 +179,7 @@ def __init__(
         self.call_op_ctor = call_op_ctor
         self.arg_attrs = arg_attrs
         self.res_attrs = res_attrs
-        self.generics = generics
+        self.generics = copy.deepcopy(generics)
         self.loc = loc
         self.ip = ip
         self._func_op = None
@@ -379,18 +379,21 @@ def maybe_eval_type_data_closure_vals(unevaled_type_data: _Ptr[PyObject]):
                 )
                 body_builder.__closure__[free_i].cell_contents = r.val
 
+        name_mangled_generics = []
+        for r in reified_type_params:
+            t, v = r.type, r.val
+            if callable(v):
+                v = v.__name__
+            name_mangled_generics.append(f"{t}_{v}")
+
         return FuncBase(
             body_builder,
             self.func_op_ctor,
             self.return_op_ctor,
             self.call_op_ctor,
             return_types=self.return_types,
             sym_visibility=self.sym_visibility,
-            sym_name=(
-                self.func_name
-                + "_"
-                + "_".join([f"{r.type}_{r.val}" for r in reified_type_params])
-            ),
+            sym_name=(self.func_name + "_" + "_".join(name_mangled_generics)),
             arg_attrs=self.arg_attrs,
             res_attrs=self.res_attrs,
             func_attrs=self.func_attrs,
diff --git a/projects/eudsl-python-extras/tests/dialect/test_func.py b/projects/eudsl-python-extras/tests/dialect/test_func.py
@@ -205,11 +205,52 @@ def mat_product_kernel(
         one = arith.constant(1, dtype)
 
     mat_product_kernel[32, 32, 32, T.i32()].emit()
+    mat_product_kernel[32, 32, 32, T.f32()].emit()
 
     # CHECK:  func.func @mat_product_kernel_int_32_int_32_int_32_type_i32(%[[VAL_0:.*]]: memref<32x32xi32>, %[[VAL_1:.*]]: memref<32x32xi32>, %[[VAL_2:.*]]: memref<32x32xi32>) {
     # CHECK:    %[[VAL_3:.*]] = arith.constant 1 : i32
     # CHECK:    return
     # CHECK:  }
+    # CHECK:  func.func @mat_product_kernel_int_32_int_32_int_32_type_f32(%arg0: memref<32x32xf32>, %arg1: memref<32x32xf32>, %arg2: memref<32x32xf32>) {
+    # CHECK:    %cst = arith.constant 1.000000e+00 : f32
+    # CHECK:    return
+    # CHECK:  }
+
+    filecheck_with_comments(ctx.module)
+
+
+def test_generics_callable(ctx: MLIRContext):
+    _op = TypeVar("_op")
+
+    @func(generics=[_op])
+    def mat_product_kernel1():
+        one = arith.constant(1, T.f32())
+        two = _op(one, one)
+
+    @func(generics=[_op])
+    def mat_product_kernel2():
+        one = arith.constant(1, T.f32())
+        two = _op(one, one)
+
+    mat_product_kernel1[arith.maximumf,].emit()
+    mat_product_kernel2[arith.minimumf,].emit()
+    mat_product_kernel2[arith.maximumf,].emit()
+
+    # CHECK:  func.func @mat_product_kernel1_function_maximumf() {
+    # CHECK:    %cst = arith.constant 1.000000e+00 : f32
+    # CHECK:    %0 = arith.maximumf %cst, %cst : f32
+    # CHECK:    return
+    # CHECK:  }
+    # CHECK:  func.func @mat_product_kernel2_function_minimumf() {
+    # CHECK:    %cst = arith.constant 1.000000e+00 : f32
+    # CHECK:    %0 = arith.minimumf %cst, %cst : f32
+    # CHECK:    return
+    # CHECK:  }
+    # CHECK:  func.func @mat_product_kernel2_function_maximumf() {
+    # CHECK:    %cst = arith.constant 1.000000e+00 : f32
+    # CHECK:    %0 = arith.maximumf %cst, %cst : f32
+    # CHECK:    return
+    # CHECK:  }
 
     filecheck_with_comments(ctx.module)
 
diff --git a/projects/eudsl-python-extras/tests/dialect/test_linalg.py b/projects/eudsl-python-extras/tests/dialect/test_linalg.py
@@ -18,6 +18,7 @@
     filecheck_with_comments,
     mlir_ctx as ctx,
 )
+from mlir.extras.runtime.passes import Pipeline, run_pipeline
 
 # needed since the fix isn't defined here nor conftest.py
 pytest.mark.usefixtures("ctx")
@@ -134,3 +135,118 @@ def maxpool3d(
     # CHECK:   return
     # CHECK: }
     filecheck_with_comments(maxpool3d_k)
+
+
+def test_pooling_ncdhw_max_parallel(ctx: MLIRContext):
+    S = ShapedType.get_dynamic_size()
+
+    generics = (
+        kernel_size_0,
+        kernel_size_1,
+        kernel_size_2,
+        stride_0,
+        stride_1,
+        stride_2,
+        dilation_0,
+        dilation_1,
+        dilation_2,
+    ) = list(
+        map(
+            TypeVar,
+            [
+                "kernel_size_0",
+                "kernel_size_1",
+                "kernel_size_2",
+                "stride_0",
+                "stride_1",
+                "stride_2",
+                "dilation_0",
+                "dilation_1",
+                "dilation_2",
+            ],
+        )
+    )
+
+    @func(
+        generics=(
+            kernel_size_0,
+            kernel_size_1,
+            kernel_size_2,
+            stride_0,
+            stride_1,
+            stride_2,
+            dilation_0,
+            dilation_1,
+            dilation_2,
+        )
+    )
+    def maxpool3d(
+        input: T.memref(S, S, S, S, S, T.f32()),
+        output: T.memref(S, S, S, S, S, T.f32()),
+    ):
+        kernel_shape_surrogate = memref.alloca(
+            (kernel_size_0, kernel_size_1, kernel_size_2),
+            T.f32(),
+        )
+
+        linalg.pooling_ncdhw_max(
+            input,
+            kernel_shape_surrogate,
+            output,
+            strides=[stride_0, stride_1, stride_2],
+            dilations=[dilation_0, dilation_1, dilation_2],
+        )
+
+    kernel_sizes = [1, 2, 3]
+    strides = [4, 5, 6]
+    dilations = [7, 8, 9]
+    maxpool3d_k = maxpool3d[
+        kernel_sizes[0],
+        kernel_sizes[1],
+        kernel_sizes[2],
+        strides[0],
+        strides[1],
+        strides[2],
+        dilations[0],
+        dilations[1],
+        dilations[2],
+    ].emit()
+    module = run_pipeline(
+        ctx.module,
+        Pipeline().bufferize().Func(Pipeline().convert_linalg_to_parallel_loops()),
+    )
+    # CHECK: #map = affine_map<(d0, d1) -> (d0 * 4 + d1 * 7)>
+    # CHECK: #map1 = affine_map<(d0, d1) -> (d0 * 5 + d1 * 8)>
+    # CHECK: #map2 = affine_map<(d0, d1) -> (d0 * 6 + d1 * 9)>
+    # CHECK: module {
+    # CHECK:   func.func @maxpool3d_int_1_int_2_int_3_int_4_int_5_int_6_int_7_int_8_int_9(%arg0: memref<?x?x?x?x?xf32>, %arg1: memref<?x?x?x?x?xf32>) {
+    # CHECK:     %c4 = arith.constant 4 : index
+    # CHECK:     %c3 = arith.constant 3 : index
+    # CHECK:     %c2 = arith.constant 2 : index
+    # CHECK:     %c1 = arith.constant 1 : index
+    # CHECK:     %c0 = arith.constant 0 : index
+    # CHECK:     %dim = memref.dim %arg0, %c0 : memref<?x?x?x?x?xf32>
+    # CHECK:     %dim_0 = memref.dim %arg0, %c1 : memref<?x?x?x?x?xf32>
+    # CHECK:     %dim_1 = memref.dim %arg1, %c2 : memref<?x?x?x?x?xf32>
+    # CHECK:     %dim_2 = memref.dim %arg1, %c3 : memref<?x?x?x?x?xf32>
+    # CHECK:     %dim_3 = memref.dim %arg1, %c4 : memref<?x?x?x?x?xf32>
+    # CHECK:     scf.parallel (%arg2, %arg3, %arg4, %arg5, %arg6) = (%c0, %c0, %c0, %c0, %c0) to (%dim, %dim_0, %dim_1, %dim_2, %dim_3) step (%c1, %c1, %c1, %c1, %c1) {
+    # CHECK:       scf.for %arg7 = %c0 to %c1 step %c1 {
+    # CHECK:         scf.for %arg8 = %c0 to %c2 step %c1 {
+    # CHECK:           scf.for %arg9 = %c0 to %c3 step %c1 {
+    # CHECK:             %0 = affine.apply #map(%arg4, %arg7)
+    # CHECK:             %1 = affine.apply #map1(%arg5, %arg8)
+    # CHECK:             %2 = affine.apply #map2(%arg6, %arg9)
+    # CHECK:             %3 = memref.load %arg0[%arg2, %arg3, %0, %1, %2] : memref<?x?x?x?x?xf32>
+    # CHECK:             %4 = memref.load %arg1[%arg2, %arg3, %arg4, %arg5, %arg6] : memref<?x?x?x?x?xf32>
+    # CHECK:             %5 = arith.maximumf %3, %4 : f32
+    # CHECK:             memref.store %5, %arg1[%arg2, %arg3, %arg4, %arg5, %arg6] : memref<?x?x?x?x?xf32>
+    # CHECK:           }
+    # CHECK:         }
+    # CHECK:       }
+    # CHECK:       scf.reduce
+    # CHECK:     }
+    # CHECK:     return
+    # CHECK:   }
+    # CHECK: }
+    filecheck_with_comments(module)