@@ -2310,7 +2310,7 @@ def sub(x, y):
     return x + (-y)
 
 
-class MulSS(Op):
+class SparseSparseMultiply(Op):
     # mul(sparse, sparse)
     # See the doc of mul() for more detail
     __props__ = ()
@@ -2343,12 +2343,15 @@ def infer_shape(self, fgraph, node, shapes):
         return [shapes[0]]
 
 
-mul_s_s = MulSS()
+mul_s_s = SparseSparseMultiply()
 
 
-class MulSD(Op):
+class SparseDenseMultiply(Op):
     # mul(sparse, dense)
     # See the doc of mul() for more detail
+
+    # We make a needless copy of indices and indptr here; they should be reused.
+    # However, PyTensor doesn't support one output -> multiple views...
     __props__ = ()
 
     def make_node(self, x, y):
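The new comment above refers to the fact that only the output's data buffer really needs to be fresh; the indices/indptr structure arrays could in principle be shared with the input. A minimal SciPy-only sketch of what such reuse looks like (illustrative only, not part of this change):

    import numpy as np
    import scipy.sparse as sp

    x = sp.random(4, 5, density=0.3, format="csr")

    # Build a result that shares `indices`/`indptr` with `x`; only `data` is new.
    z = sp.csr_matrix((x.data * 2.0, x.indices, x.indptr), shape=x.shape, copy=False)
    assert np.shares_memory(z.indices, x.indices)
    assert np.shares_memory(z.indptr, x.indptr)
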
@@ -2364,64 +2367,42 @@ def make_node(self, x, y):
         # Broadcasting of the sparse matrix is not supported.
         # We support nd == 0 used by grad of SpSum()
         assert y.type.ndim in (0, 2)
-        out = SparseTensorType(dtype=dtype, format=x.type.format)()
+        out = SparseTensorType(dtype=dtype, format=x.type.format, shape=x.type.shape)()
         return Apply(self, [x, y], [out])
 
     def perform(self, node, inputs, outputs):
         (x, y) = inputs
         (out,) = outputs
+        out_dtype = node.outputs[0].dtype
         assert _is_sparse(x) and _is_dense(y)
-        if len(y.shape) == 0:
-            out_dtype = node.outputs[0].dtype
-            if x.dtype == out_dtype:
-                z = x.copy()
-            else:
-                z = x.astype(out_dtype)
-            out[0] = z
-            out[0].data *= y
-        elif len(y.shape) == 1:
-            raise NotImplementedError()  # RowScale / ColScale
-        elif len(y.shape) == 2:
+
+        if x.dtype == out_dtype:
+            z = x.copy()
+        else:
+            z = x.astype(out_dtype)
+        out[0] = z
+        z_data = z.data
+
+        if y.ndim == 0:
+            z_data *= y
+        else:  # y.ndim == 2
             # if we have enough memory to fit y, maybe we can fit x.asarray()
             # too?
             # TODO: change runtime from O(M*N) to O(nonzeros)
             M, N = x.shape
             assert x.shape == y.shape
-            out_dtype = node.outputs[0].dtype
-
+            indices = x.indices
+            indptr = x.indptr
             if x.format == "csc":
-                indices = x.indices
-                indptr = x.indptr
-                if x.dtype == out_dtype:
-                    z = x.copy()
-                else:
-                    z = x.astype(out_dtype)
-                z_data = z.data
-
                 for j in range(0, N):
                     for i_idx in range(indptr[j], indptr[j + 1]):
                         i = indices[i_idx]
                         z_data[i_idx] *= y[i, j]
-                out[0] = z
             elif x.format == "csr":
-                indices = x.indices
-                indptr = x.indptr
-                if x.dtype == out_dtype:
-                    z = x.copy()
-                else:
-                    z = x.astype(out_dtype)
-                z_data = z.data
-
                 for i in range(0, M):
                     for j_idx in range(indptr[i], indptr[i + 1]):
                         j = indices[j_idx]
                         z_data[j_idx] *= y[i, j]
-                out[0] = z
-            else:
-                warn(
-                    "This implementation of MulSD is deficient: {x.format}",
-                )
-                out[0] = type(x)(x.toarray() * y)
 
     def grad(self, inputs, gout):
         (x, y) = inputs
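For reference, the CSR branch of the rewritten perform() can be exercised in isolation with plain SciPy. This sketch (illustrative, not the Op itself) runs the same loop over the stored entries and checks it against the dense product:

    import numpy as np
    import scipy.sparse as sp

    x = sp.random(3, 4, density=0.5, format="csr", dtype=np.float64)
    y = np.arange(12.0).reshape(3, 4)

    z = x.copy()
    z_data, indices, indptr = z.data, z.indices, z.indptr
    M, N = x.shape
    for i in range(M):                                  # each CSR row
        for j_idx in range(indptr[i], indptr[i + 1]):   # stored entries of row i
            j = indices[j_idx]                          # column of that entry
            z_data[j_idx] *= y[i, j]                    # scale by the dense value

    np.testing.assert_allclose(z.toarray(), x.toarray() * y)
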
@@ -2434,12 +2415,14 @@ def infer_shape(self, fgraph, node, shapes):
         return [shapes[0]]
 
 
-mul_s_d = MulSD()
+mul_s_d = SparseDenseMultiply()
 
 
-class MulSV(Op):
+class SparseDenseVectorMultiply(Op):
     """Element-wise multiplication of sparse matrix by a broadcasted dense vector element wise.
 
+    TODO: Merge with the SparseDenseMultiply Op
+
     Notes
     -----
     The grad implemented is regular, i.e. not structured.
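In NumPy terms, the "broadcasted dense vector" is a 1-D operand whose length matches the number of columns, so it scales each row of the sparse matrix elementwise. A small SciPy illustration of the intended result (not the Op's implementation):

    import numpy as np
    import scipy.sparse as sp

    x = sp.random(3, 4, density=0.5, format="csc")
    v = np.array([1.0, 2.0, 3.0, 4.0])   # length == number of columns

    # Standard NumPy broadcasting: v multiplies every row elementwise.
    expected = x.toarray() * v
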
@@ -2500,7 +2483,7 @@ def infer_shape(self, fgraph, node, ins_shapes):
         return [ins_shapes[0]]
 
 
-mul_s_v = MulSV()
+mul_s_v = SparseDenseVectorMultiply()
 
 
 def mul(x, y):
@@ -2539,16 +2522,17 @@ def mul(x, y):
         # mul_s_s is not implemented if the types differ
         if y.dtype == "float64" and x.dtype == "float32":
             x = x.astype("float64")
-
         return mul_s_s(x, y)
-    elif x_is_sparse_variable and not y_is_sparse_variable:
+    elif x_is_sparse_variable or y_is_sparse_variable:
+        if y_is_sparse_variable:
+            x, y = y, x
         # mul is unimplemented if the dtypes differ
         if y.dtype == "float64" and x.dtype == "float32":
             x = x.astype("float64")
-
-        return mul_s_d(x, y)
-    elif y_is_sparse_variable and not x_is_sparse_variable:
-        return mul_s_d(y, x)
+        if y.ndim == 1:
+            return mul_s_v(x, y)
+        else:
+            return mul_s_d(x, y)
     else:
         raise NotImplementedError()
 
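A rough usage sketch of the reworked dispatch, assuming the renamed Ops above and the existing pytensor.sparse helpers (mul, csr_matrix): argument order no longer matters for sparse-by-dense, and a 1-D dense operand now routes to mul_s_v instead of raising:

    import pytensor.tensor as pt
    from pytensor import sparse

    x = sparse.csr_matrix("x", dtype="float64")   # sparse operand
    m = pt.matrix("m", dtype="float64")           # dense 2-D operand
    v = pt.vector("v", dtype="float64")           # dense 1-D operand

    s_d = sparse.mul(x, m)   # -> mul_s_d (SparseDenseMultiply)
    d_s = sparse.mul(m, x)   # same Op: arguments are swapped inside mul()
    s_v = sparse.mul(x, v)   # 1-D dense operand -> mul_s_v (SparseDenseVectorMultiply)

    print(s_d.owner.op, d_s.owner.op, s_v.owner.op)
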