from pytensor.tensor.blockwise import Blockwise
from pytensor.tensor.signal.conv import Conv1d

-import numpy as np

def blockwise_conv1d(op, node, **kwargs):
-    # if op.core_op.mode != "valid":
-    #     raise NotImplementedError("Only 'valid' mode is supported for conv1d")
-
-    # def inner_f(x, kernel):
-    #     B, T = x.shape
-    #     Bk, K = kernel.shape
-    #     if B != Bk:
-    #         raise ValueError(f"Batch mismatch: x has {B}, kernels has {Bk}")
-
-    #     # 1) Flip each kernel for true convolution
-    #     kernels_flipped = kernel[:, ::-1]  # shape (B, K)
-
-    #     # 2) Reshape input into (N=1, H=T, C_in=B)
-    #     x_in = x.T[None, :, :]
-
-    #     # 3) Build weight tensor of shape (C_out=B, H_f=K, C_in=1)
-    #     w = kernels_flipped[:, :, None]
-
-    #     # 4) Convolve with one group per channel → valid mode
-    #     y = mx.conv1d(
-    #         x_in, w,
-    #         stride=1,
-    #         padding=0,
-    #         dilation=1,
-    #         groups=B
-    #     )
-    #     # y: (1, T-K+1, B) → drop batch and transpose to (B, T-K+1)
-    #     return y[0].T
-
+    """
+    Custom implementation of Blockwise.conv1d for MLX.
+    """
+
    def batched_conv1d(
-        x: mx.array,
-        kernels: mx.array,
-        mode: str = op.core_op.mode,
-        stride: int = 1,
-        dilation: int = 1) -> mx.array:
+        x: mx.array,
+        kernels: mx.array,
+        mode: str = op.core_op.mode,
+        stride: int = 1,
+        dilation: int = 1,
+    ) -> mx.array:
        """
        Apply B separate 1D convolutions (full or valid) to B sequences in parallel.

@@ -53,14 +28,14 @@ def batched_conv1d(
            B kernels of length K.
        mode : {"valid", "full"}
            "valid" → no padding, output length = T - K + 1
-            "full" → zero‑pad so output length = T + K - 1
+            "full" → zero-pad so output length = T + K - 1
        stride : int, convolution stride (default=1)
        dilation : int, convolution dilation (default=1)

        Returns
        -------
        out : array of shape (B, L)
-            where L =
+            where L =
              - T - K + 1 if mode="valid"
              - T + K - 1 if mode="full"
        """
@@ -89,20 +64,15 @@ def batched_conv1d(
        w = kernels_flipped[:, :, None]

        # --- 5) run grouped conv1d ---
-        y = mx.conv1d(
-            x_in, w,
-            stride=stride,
-            padding=pad,
-            dilation=dilation,
-            groups=B
-        )
+        y = mx.conv1d(x_in, w, stride=stride, padding=pad, dilation=dilation, groups=B)
        # y shape: (1, H_out, B)

        # --- 6) return shape (B, H_out) ---
        return y[0].T

    return batched_conv1d

+
@mlx_funcify.register(Blockwise)
def funcify_Blockwise(op: Blockwise, node, **kwargs):
    # 1) If it's a Conv1d Blockwise, use the custom implementation
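
A quick equivalence check for the grouped-conv trick used above (a sketch, not part of this commit; it assumes MLX's conv1d takes (N, H, C_in) inputs and (C_out, H_f, C_in/groups) weights, and uses NumPy's convolve as the reference):

    import mlx.core as mx
    import numpy as np

    B, T, K = 3, 10, 4
    xs = np.random.randn(B, T).astype(np.float32)
    ks = np.random.randn(B, K).astype(np.float32)

    # Same steps as batched_conv1d in "valid" mode:
    x_in = mx.array(xs.T[None, :, :])  # (1, T, B): one "image" with B channels
    ks_flipped = np.ascontiguousarray(ks[:, ::-1])  # flip for true convolution
    w = mx.array(ks_flipped[:, :, None])  # (B, K, 1): one kernel per group
    y = mx.conv1d(x_in, w, stride=1, padding=0, dilation=1, groups=B)
    out = np.array(y[0].T)  # (B, T - K + 1)

    # Reference: one true convolution per (sequence, kernel) pair
    expected = np.stack([np.convolve(xs[i], ks[i], mode="valid") for i in range(B)])
    assert np.allclose(out, expected, atol=1e-5)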