
Commit 9a9fbbc

Don't apply local_upcast_elemwise_constant_inputs when all inputs are constant

1 parent aaecd79
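
For context, here is a minimal sketch of the case this commit now skips (hypothetical usage, not part of the commit): when every input of an Elemwise node is a Constant, ordinary constant folding can evaluate the node outright, so explicitly upcasting the constants first is wasted work.

import numpy as np
import pytensor.tensor as pt

# Every input is a Constant, so the true-division node below can be
# constant-folded as a whole; after this commit the upcast rewrite
# returns early instead of rebuilding it with upcast constants.
a = pt.constant(np.int8(1))
b = pt.constant(np.int64(2))
c = a / b  # Elemwise node with only constant inputs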

File tree: 1 file changed (+54 −54 lines)

pytensor/tensor/rewriting/elemwise.py (+54 −54)

@@ -493,65 +493,65 @@ def local_upcast_elemwise_constant_inputs(fgraph, node):
     """
     if len(node.outputs) > 1:
         return
-    try:
-        shape_i = fgraph.shape_feature.shape_i
-    except AttributeError:
-        shape_i = None
-    if isinstance(node.op, Elemwise):
-        scalar_op = node.op.scalar_op
-        # print "aa", scalar_op.output_types_preference
-        if getattr(scalar_op, "output_types_preference", None) in (
-            ps.upgrade_to_float,
-            ps.upcast_out,
-        ):
-            # this is the kind of op that we can screw with the input
-            # dtypes by upcasting explicitly
-            output_dtype = node.outputs[0].type.dtype
-            new_inputs = []
-            for i in node.inputs:
-                if i.type.dtype == output_dtype:
-                    new_inputs.append(i)
-                else:
-                    try:
-                        cval_i = get_underlying_scalar_constant_value(
-                            i, only_process_constants=True
+
+    if all(isinstance(i, Constant) for i in node.inputs):
+        # If all inputs are constant, constant_fold will take care of it
+        return
+
+    if getattr(node.op.scalar_op, "output_types_preference", None) in (
+        ps.upgrade_to_float,
+        ps.upcast_out,
+    ):
+        # this is the kind of op that we can screw with the input
+        # dtypes by upcasting explicitly
+        output_dtype = node.outputs[0].type.dtype
+        new_inputs = []
+        for i in node.inputs:
+            if i.type.dtype == output_dtype:
+                new_inputs.append(i)
+            else:
+                try:
+                    cval_i = get_underlying_scalar_constant_value(
+                        i, only_process_constants=True
+                    )
+                    if all(i.broadcastable):
+                        new_inputs.append(
+                            shape_padleft(cast(cval_i, output_dtype), i.ndim)
                         )
-                        if all(i.broadcastable):
-                            new_inputs.append(
-                                shape_padleft(cast(cval_i, output_dtype), i.ndim)
-                            )
-                        else:
-                            if shape_i is None:
-                                return
-                            new_inputs.append(
-                                alloc(
-                                    cast(cval_i, output_dtype),
-                                    *[shape_i(d)(i) for d in range(i.ndim)],
-                                )
+                    else:
+                        try:
+                            shape_i = fgraph.shape_feature.shape_i
+                        except AttributeError:
+                            return
+                        new_inputs.append(
+                            alloc(
+                                cast(cval_i, output_dtype),
+                                *[shape_i(d)(i) for d in range(i.ndim)],
                             )
-                        # print >> sys.stderr, "AAA",
-                        # *[Shape_i(d)(i) for d in range(i.ndim)]
-                    except NotScalarConstantError:
-                        # for the case of a non-scalar
-                        if isinstance(i, TensorConstant):
-                            new_inputs.append(cast(i, output_dtype))
-                        else:
-                            new_inputs.append(i)
+                        )
+                    # print >> sys.stderr, "AAA",
+                    # *[Shape_i(d)(i) for d in range(i.ndim)]
+                except NotScalarConstantError:
+                    # for the case of a non-scalar
+                    if isinstance(i, TensorConstant):
+                        new_inputs.append(cast(i, output_dtype))
+                    else:
+                        new_inputs.append(i)
 
-            if new_inputs != node.inputs:
-                rval = [node.op(*new_inputs)]
-                if not node.outputs[0].type.is_super(rval[0].type):
-                    # This can happen for example when floatX=float32
-                    # and we do the true division between and int64
-                    # and a constant that will get typed as int8.
+        if new_inputs != node.inputs:
+            rval = [node.op(*new_inputs)]
+            if not node.outputs[0].type.is_super(rval[0].type):
+                # This can happen for example when floatX=float32
+                # and we do the true division between and int64
+                # and a constant that will get typed as int8.
 
-                    # As this is just to allow merging more case, if
-                    # the upcast don't work, we can just skip it.
-                    return
+                # As this is just to allow merging more case, if
+                # the upcast don't work, we can just skip it.
+                return
 
-                # Copy over output stacktrace from before upcasting
-                copy_stack_trace(node.outputs[0], rval)
-                return rval
+            # Copy over output stacktrace from before upcasting
+            copy_stack_trace(node.outputs[0], rval)
+            return rval
 
 
 @node_rewriter([Elemwise])
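
By contrast, a rough sketch of the case the rewrite still targets (assumed example, not from the commit): a node mixing a symbolic input with a constant whose dtype is narrower than the output dtype gets its constant explicitly upcast, which helps later rewrites merge graphs that differ only in how the constant was typed.

import pytensor.tensor as pt

x = pt.vector("x", dtype="float64")
# The literal 1 is stored as an int8 constant while the output is
# float64; the rewrite swaps in a float64 constant, so (1 - x) and
# (1.0 - x) canonicalize to the same graph and can be merged.
y = 1 - x
z = 1.0 - x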
