
Commit 0dc2a1e

Simplify graph returned by Subtensor.infer_shape
1 parent a56e3a5 commit 0dc2a1e

File tree

2 files changed: +198 -52 lines changed


pytensor/tensor/subtensor.py

Lines changed: 130 additions & 31 deletions
@@ -33,14 +33,16 @@
     alloc,
     get_scalar_constant_value,
     nonzero,
+    switch,
 )
 from pytensor.tensor.basic import (
     constant as tensor_constant,
 )
 from pytensor.tensor.blockwise import vectorize_node_fallback
 from pytensor.tensor.elemwise import DimShuffle
 from pytensor.tensor.exceptions import AdvancedIndexingError, NotScalarConstantError
-from pytensor.tensor.math import clip
+from pytensor.tensor.math import abs as pt_abs
+from pytensor.tensor.math import clip, eq, ge, lt, maximum, minimum, sign
 from pytensor.tensor.shape import Reshape, Shape_i, specify_broadcastable
 from pytensor.tensor.type import (
     TensorType,
@@ -55,6 +57,7 @@
     lscalar,
     tensor,
     ubscalar,
+    uint_dtypes,
     uiscalar,
     ulscalar,
     uwscalar,
@@ -254,6 +257,25 @@ def get_idx_list(inputs, idx_list):
     return indices_from_subtensor(inputs[1:], idx_list)
 
 
+def undo_scalarization(x):
+    """Undo scalarization of a variable.
+
+    PyTensor Basic index operations use ScalarVariables for the indices/slice arguments.
+    But reasoning symbolically about the result of multiple indexing operations, we usually
+    want to work on TensorVariables, since rewrites work on those and not ScalarVariables.
+
+    This function undoes ScalarFromTensor operation or converts ScalarConstants to TensorConstants.
+    """
+    if isinstance(x, ScalarVariable):
+        if isinstance(x, ScalarConstant):
+            return tensor_constant(x.data, dtype=x.dtype)
+        elif x.owner is not None and isinstance(x.owner.op, ScalarFromTensor):
+            return x.owner.inputs[0]
+        else:
+            return as_tensor_variable(x)
+    return x
+
+
 @overload
 def get_canonical_form_slice(
     theslice: slice,
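As context for the helper added above: a minimal usage sketch (not part of the commit) of how undo_scalarization behaves, assuming the module-level helper this commit adds and the as_scalar converter from pytensor.scalar.basic:

    import pytensor.tensor as pt
    from pytensor.scalar.basic import as_scalar
    from pytensor.tensor.subtensor import undo_scalarization

    i = pt.lscalar("i")        # 0-d TensorVariable, as used for a symbolic index
    s = as_scalar(i)           # wrapped into a ScalarVariable via ScalarFromTensor

    assert undo_scalarization(s) is i   # unwraps ScalarFromTensor back to the TensorVariable
    assert undo_scalarization(i) is i   # anything that is not a ScalarVariable passes through

ScalarConstants follow the third branch and come back as TensorConstants, so downstream rewrites only ever see tensor variables.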
@@ -296,25 +318,6 @@ def get_canonical_form_slice(
     direction
         Direction to iterate the resulting elements in. (-1 or 1). May be symbolic.
     """
-    from pytensor.tensor import ge, lt, sign, switch
-
-    def undo_scalarization(x):
-        """Undo scalarization of a variable.
-
-        PyTensor Basic index operations use ScalarVariables for the indices/slice arguments.
-        But reasoning symbolically about the result of multiple indexing operations, we usually
-        want to work on TensorVariables, since rewrites work on those and not ScalarVariables.
-
-        This function undoes ScalarFromTensor operation or converts ScalarConstants to TensorConstants.
-        """
-        if isinstance(x, ScalarVariable):
-            if isinstance(x, ScalarConstant):
-                return tensor_constant(x.data, dtype=x.dtype)
-            elif x.owner is not None and isinstance(x.owner.op, ScalarFromTensor):
-                return x.owner.inputs[0]
-            else:
-                return as_tensor_variable(x)
-        return x
 
     def analyze(x):
         try:
@@ -845,6 +848,17 @@ def as_nontensor_scalar(a: Variable) -> ps.ScalarVariable:
     return ps.as_scalar(a)
 
 
+def _eager_switch(
+    cond: TensorVariable | bool, a: TensorVariable, b: TensorVariable
+) -> TensorVariable:
+    # Do not create a switch if cond is True/False
+    # We need this because uint types cannot be negative and creating the lazy switch could upcast everything to float64
+    # It also simplifies immediately the graph that's returned
+    if isinstance(cond, bool):
+        return a if cond else b
+    return cast(TensorVariable, switch(cond, a, b))
+
+
 class Subtensor(COp):
     """Basic NumPy indexing operator."""
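The comments above carry the main rationale for this helper. A rough sketch (not from the commit) of both points, assuming standard PyTensor/NumPy type promotion:

    import pytensor.tensor as pt

    xl = pt.lscalar("xl")
    zero = pt.constant(0, dtype="int64")
    b = pt.scalar("b", dtype="uint64")
    neg_one = pt.constant(-1, dtype="int64")

    # A lazy switch whose branches mix uint64 and int64 promotes the result to float64,
    # which is the upcast the comment warns about for unsigned index dtypes:
    print(pt.switch(b >= 0, b, neg_one).dtype)   # float64

    # With a Python bool condition, _eager_switch simply returns the chosen branch,
    # so the shape graph never contains a Switch node for that decision:
    assert (zero if True else xl) is zero        # what _eager_switch(True, zero, xl) reduces to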

@@ -956,27 +970,112 @@ def infer_shape(self, fgraph, node, shapes):
         padded = actual_idx_list + [slice(None, None, None)] * (
             len(xshp) - len(self.idx_list)
         )
+
+        zero = tensor_constant(np.array(0, dtype="int64"))
+        one = tensor_constant(np.array(1, dtype="int64"))
         i = 0
         for idx, xl in zip(padded, xshp, strict=True):
             if isinstance(idx, slice):
-                # If it is the default (None, None, None) slice, or a variant,
-                # the shape will be xl
+                a, b, step = idx.start, idx.stop, idx.step
                 if (
-                    (idx.start in [None, 0])
-                    and (idx.stop in [None, sys.maxsize])
-                    and (idx.step is None or idx.step == 1)
+                    a is None
+                    and b is None
+                    and step is not None
+                    and get_scalar_constant_value(step, raise_not_constant=False) == -1
                 ):
+                    # Shortcut for x[::-1]
                     outshp.append(xl)
+
                 else:
-                    cnf = get_canonical_form_slice(idx, xl)[0]
-                    if cnf.step == 1:
-                        length = cnf.stop - cnf.start
+                    if step is None:
+                        step_pos = True
+                        unit_step = True
+                        abs_step = one
+                    else:
+                        step = undo_scalarization(step)
+                        if step.dtype in uint_dtypes:
+                            step_pos = True
+                            abs_step = step.astype("int64")
+                        else:
+                            step_pos = ge(step, zero)
+                            abs_step = pt_abs(step)
+                        unit_step = eq(abs_step, one)
+
+                    if a is None:
+                        a_pos = True
+                        a = _eager_switch(step_pos, zero, xl)
                     else:
-                        length = (cnf.stop - cnf.start - 1) // cnf.step + 1
-                    outshp.append(length)
+                        a = undo_scalarization(a)
+                        if a.dtype in uint_dtypes:
+                            a_pos = True
+                            a = a.astype("int64")
+                        else:
+                            a_pos = ge(a, zero)
+
+                    if b is None:
+                        # For negative steps there is no numerical equivalent for stop=None.
+                        # The formulas below work if we set it to -1 and consider `b_pos=True`
+                        b_pos = True
+                        b = _eager_switch(step_pos, xl, -one)
+                    else:
+                        b = undo_scalarization(b)
+                        if b.dtype in uint_dtypes:
+                            b = b.astype("int64")
+                            b_pos = True
+                        else:
+                            b_pos = ge(b, zero)
+
+                    slice_length_pos_step = _eager_switch(
+                        a_pos,
+                        _eager_switch(
+                            b_pos,
+                            minimum(b - a, xl - a),  # [a: b]
+                            ((xl + b) - a),  # [a: -b]
+                        ),
+                        _eager_switch(
+                            b_pos,
+                            # The [-a: b] is peculiar, the slice length actually decreases for larger arrays
+                            # The branch -a is useless when b - a / 2 <= -a. Similar for the branch b
+                            minimum(minimum(xl, b - a - xl), minimum(-a, b)),  # [-a: b]
+                            minimum(b - a, xl + b),  # [-a: -b]
+                        ),
+                    )
+
+                    slice_length_neg_step = _eager_switch(
+                        a_pos,
+                        _eager_switch(
+                            b_pos,
+                            minimum(a - b, xl - b - one),  # [a: b]
+                            minimum(
+                                minimum(xl, a - (xl + b)), minimum(a + one, -b - one)
+                            ),  # [a: -b]
+                        ),
+                        _eager_switch(
+                            b_pos,
+                            ((xl + a) - b),  # [-a: b]
+                            minimum(a - b, xl + a + one),  # [-a: -b]
+                        ),
+                    )
+
+                    slice_length = _eager_switch(
+                        step_pos,
+                        slice_length_pos_step,
+                        slice_length_neg_step,
+                    )
+
+                    # Incorporate step size
+                    slice_length = _eager_switch(
+                        unit_step,
+                        slice_length,
+                        (slice_length - one) // abs_step + one,
+                    )
+                    # Catch negative sizes
+                    slice_length = maximum(zero, slice_length)
+                    outshp.append(slice_length)
+
                 i += 1
             else:
-                # That dimension is dropped
+                # That dimension is dropped by integer indexing
                 pass
         assert i == node.outputs[0].ndim
         assert len(outshp) == node.outputs[0].ndim
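To make the sign case analysis above concrete: a pure-Python cross-check (not part of the commit) of the positive-step formulas against Python's own slice semantics, with a, b, xl as plain integers standing in for the symbolic variables:

    def slice_len_pos_step(a, b, xl):
        # Mirrors slice_length_pos_step plus the final maximum(zero, ...) clamp.
        a_pos, b_pos = a >= 0, b >= 0
        if a_pos:
            raw = min(b - a, xl - a) if b_pos else (xl + b) - a                # [a: b] / [a: -b]
        else:
            raw = min(xl, b - a - xl, -a, b) if b_pos else min(b - a, xl + b)  # [-a: b] / [-a: -b]
        return max(0, raw)

    for xl in range(25):
        for a in range(-30, 30):
            for b in range(-30, 30):
                assert slice_len_pos_step(a, b, xl) == len(range(*slice(a, b, 1).indices(xl)))

The negative-step branch follows the same pattern with the roles of start and stop reversed; the step size is folded in afterwards via (slice_length - one) // abs_step + one.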

tests/tensor/test_subtensor.py

Lines changed: 68 additions & 21 deletions
@@ -15,10 +15,10 @@
 from pytensor.compile.mode import Mode
 from pytensor.configdefaults import config
 from pytensor.gradient import grad
-from pytensor.graph import Constant
+from pytensor.graph import Constant, FunctionGraph
 from pytensor.graph.basic import equal_computations
 from pytensor.graph.op import get_test_value
-from pytensor.graph.rewriting.utils import is_same_graph
+from pytensor.graph.rewriting.utils import is_same_graph, rewrite_graph
 from pytensor.printing import pprint
 from pytensor.scalar.basic import as_scalar, int16
 from pytensor.tensor import as_tensor, get_vector_length, vectorize
@@ -71,6 +71,7 @@
     lscalar,
     lvector,
     matrix,
+    scalar,
     tensor,
     tensor3,
     tensor4,
@@ -1055,26 +1056,8 @@ def test_adv_sub1_idx_broadcast(self):
         assert np.allclose(g_0[0], 1)
         assert np.allclose(g_0[1:], 0)
 
-    @pytest.mark.slow
-    def test_shape_i_const(self):
-        # Each axis is treated independently by shape_i/shape operators
-
-        mode_opt = self.mode
-        data = self.shared(np.array(np.arange(5), dtype=self.dtype))
-        for start in [None, -8, -5, -1, 0, 1, 5, 8]:
-            outs = []
-            shapes = []
-            for stop in [None, -8, -5, -1, 0, 1, 5, 8]:
-                for step in [None, -3, -1, 2]:
-                    outs += [data[start:stop:step].shape]
-                    shapes += [data.get_value(borrow=True)[start:stop:step].shape]
-            f = self.function([], outs, mode=mode_opt, op=subtensor_ops, N=0)
-            t_shapes = f()
-            for t_shape, shape in zip(t_shapes, shapes, strict=True):
-                assert np.all(t_shape == shape)
-            assert Subtensor not in [x.op for x in f.maker.fgraph.toposort()]
-
     def test_shape_i_scalar(self):
+        # TODO: Move this to infer_shape
         # Each axis is treated independently by shape_i/shape operators
 
         mode_opt = self.mode
@@ -1466,6 +1449,70 @@ def test_adv1_inc_sub_notlastdim_1_2dval_no_broadcast(self):
         assert np.allclose(m2_val, m2_ref), (m2_val, m2_ref)
 
 
+class TestSubtensorInferShape:
+    _NO_OPT_MODE = Mode(linker="py", optimizer=None)
+
+    @pytest.mark.parametrize(
+        "b", [None, 0, 1, 7, 13, -1, -7, -13], ids=lambda x: f"b={x}"
+    )
+    @pytest.mark.parametrize(
+        "a", [None, 0, 1, 7, 13, -1, -7, -13], ids=lambda x: f"a={x}"
+    )
+    @pytest.mark.parametrize("step", [None, 1, 3, -1, -4], ids=lambda x: f"step={x}")
+    def test_constant_params(self, a, b, step):
+        x = vector("x", dtype="int64")
+        y = x[a:b:step].shape[0]
+
+        fg = FunctionGraph(outputs=[y], clone=False)
+        rewrite_graph(fg, include=("ShapeOpt", "canonicalize"), clone=False)
+        assert not any(isinstance(node.op, Subtensor) for node in fg.apply_nodes)
+        assert len(fg.apply_nodes) <= 9
+
+        fn = pytensor.function(
+            [x],
+            fg.outputs[0],
+            trust_input=True,
+            mode=self._NO_OPT_MODE,
+            on_unused_input="ignore",
+        )
+        x_full = np.arange(20)
+        for n in range(0, 20):
+            x_test = x_full[:n]
+            assert fn(x_test) == x_test[a:b:step].shape[0], f"failed with {n=}"
+
+    @pytest.mark.parametrize("a_dtype", (None, "int64", "uint64"))
+    @pytest.mark.parametrize("b_dtype", (None, "int64", "uint64"))
+    @pytest.mark.parametrize("step_dtype", (None, "int64", "uint64"))
+    def test_uint(self, a_dtype, b_dtype, step_dtype):
+        a = None if a_dtype is None else scalar(dtype=a_dtype)
+        b = None if b_dtype is None else scalar(dtype=b_dtype)
+        step = None if step_dtype is None else scalar(dtype=step_dtype)
+        x = vector("x", dtype="int64")
+
+        y = x[a:b:step].shape[0]
+
+        final_y = rewrite_graph(y, include=("ShapeOpt", "canonicalize"), clone=False)
+        assert final_y.dtype == "int64"
+
+        test_a = None if a is None else 1 if a_dtype.startswith("u") else -1
+        test_b = None if b is None else 10 if b_dtype.startswith("u") else -2
+        test_step = None if step is None else 2 if step_dtype.startswith("u") else -2
+        test_x = np.arange(20)
+
+        test_dict = {x: test_x}
+        if a is not None:
+            test_dict[a] = test_a
+        if b is not None:
+            test_dict[b] = test_b
+        if step is not None:
+            test_dict[step] = test_step
+
+        final_y_eval = final_y.eval(
+            test_dict, mode=self._NO_OPT_MODE, on_unused_input="ignore"
+        )
+        assert final_y_eval == test_x[test_a:test_b:test_step].shape[0]
+
+
 def test_take_basic():
     with pytest.raises(TypeError):
         take(matrix(), lvector(), axis=lscalar())
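The new TestSubtensorInferShape class checks both numerical correctness and graph size (no Subtensor node and at most 9 apply nodes after rewriting). A small interactive sketch (not part of the commit) of how the simplified shape graph can be inspected, using the same rewrite passes the test applies:

    import pytensor
    import pytensor.tensor as pt
    from pytensor.graph.rewriting.utils import rewrite_graph

    x = pt.vector("x", dtype="int64")
    a = pt.scalar("a", dtype="int64")
    b = pt.scalar("b", dtype="int64")

    y = x[a:b].shape[0]
    simplified = rewrite_graph(y, include=("ShapeOpt", "canonicalize"))
    pytensor.dprint(simplified)  # a small graph of switch/minimum/maximum arithmetic, no Subtensor node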
