import builtins
import dataclasses
import inspect
import sys
import weakref
from collections import defaultdict
from typing import Any, Callable, Dict, List, Optional, Set, Tuple, TYPE_CHECKING, Union

import torch
from torch.utils._pytree import (
    _get_node_type,
    BUILTIN_TYPES,
    SUPPORTED_NODES,
    tree_flatten,
    tree_map,
)

from .exported_program import ExportedProgram

if TYPE_CHECKING:
    from sympy import Symbol

    from torch._guards import Source

    from ..fx.experimental.symbolic_shapes import ShapeEnv, StrictMinMaxConstraint

__all__ = [
    "Constraint",
    "Dim",
    "dims",
    "dynamic_dim",
    "refine_dynamic_shapes_from_suggested_fixes",
]


class _Dim(type):
    """
    Metaclass for :func:`Dim` types.
    """

    @staticmethod
    def readable(name, min_, max_):
        if min_ == 2:
            min_ = None
        if max_ == sys.maxsize - 1:
            max_ = None
        if min_ is None and max_ is None:
            return f"Dim('{name}')"
        if min_ is None:
            return f"Dim('{name}', max={max_})"
        if max_ is None:
            return f"Dim('{name}', min={min_})"
        return f"Dim('{name}', min={min_}, max={max_})"

    def __add__(cls, other):
        # e.g., dim + 1
        if type(other) is not int:
            raise NotImplementedError(
                f"Attempted to add {other} to {cls.__name__}, where an integer was expected. "
                "(Only increasing linear operations with integer coefficients are supported.)"
            )
        return cls._derive(lambda x: x + other)

    def __radd__(cls, other):
        return cls + other

    def __sub__(cls, other):
        # e.g., dim - 1
        if type(other) is not int:
            raise NotImplementedError(
                f"Attempted to subtract {other} from {cls.__name__}, where an integer was expected. "
                "(Only increasing linear operations with integer coefficients are supported.)"
            )
        return cls._derive(lambda x: x - other)

    def __rsub__(cls, other):
        raise NotImplementedError(
            f"Attempted to negate {cls.__name__}. "
            "(Only increasing linear operations with integer coefficients are supported.)"
        )

    def __mul__(cls, other):
        # e.g., dim * 2; only positive integer multipliers keep the expression increasing
        if type(other) is not int or other <= 0:
            raise NotImplementedError(
                f"Attempted to multiply {other} with {cls.__name__}, where a positive integer was expected. "
                "(Only increasing linear operations with integer coefficients are supported.)"
            )
        return cls._derive(lambda x: x * other)

    def __rmul__(cls, other):
        return cls * other

    def _derived_name(cls, fn):
        from sympy import sympify

        return str(fn(sympify(cls.__name__)))

    def _derive(cls, fn):
        return _DerivedDim(cls._derived_name(fn), (int,), {"root": cls, "fn": fn})


class _StaticDim(_Dim):
    """
    Metaclass for static :func:`Dim` types.

    This class is only for setting and checking static dim constraints,
    and the user should never interact with it.
    """

    @property
    def min(self):
        return self.value

    @property
    def max(self):
        return self.value


class _DerivedDim(_Dim):
    """
    Metaclass for derived :func:`Dim` types.

    Currently we only support increasing linear expressions with integer coefficients.
    In other words, a derived Dim can always be written in the form Ax + B, where
    x is a regular Dim (i.e., non-derived Dim), A and B are integers, and A is positive.
    (In particular, the latter ensures that x < y => Ax + B < Ay + B.)
    These restrictions on the form of derived Dims make the metatheory simpler: e.g.,
    they simplify computing ranges for derived Dims, solving for underlying regular Dims,
    deciding equalities between derived Dims, and so on.

    The function lambda x: Ax + B is expressed by `fn`, where x is a regular Dim, `root`.
    The range of a derived Dim is computed by mapping `fn` over the range of its `root`.
    """

    @property
    def min(self):
        # Since `fn` is increasing, the min of a derived Dim is `fn` applied to
        # the min of its root.
        from sympy import Integer

        _min_symint = self.fn(Integer(self.root.min))
        root = self.root
        assert _min_symint >= 0, (
            f"Expected derived min value of {self.__name__} to be >= 0. "
            f"Please specify an appropriate min value for {root.__name__} "
            f"(currently {root.min})."
        )
        return int(_min_symint)

    @property
    def max(self):
        # Similarly, the max of a derived Dim is `fn` applied to the max of its root.
        from sympy import Integer

        _max_symint = self.fn(Integer(self.root.max))
        root = self.root
        assert _max_symint <= sys.maxsize - 1, (
            f"Expected derived max value of {self.__name__} to be <= {sys.maxsize - 1}. "
            f"Please specify an appropriate max value for {root.__name__} "
            f"(currently {root.max})."
        )
        return int(_max_symint)

    def _derive(self, fn):
        # Deriving from a derived Dim composes the two linear functions; the new
        # derived Dim keeps the original (regular) root.
        return _DerivedDim(
            self._derived_name(fn),
            (int,),
            {"root": self.root, "fn": lambda x: fn(self.fn(x))},
        )
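

# Illustrative sketch (documentation only, not part of the module API): how arithmetic
# on a Dim produces derived Dims of the form A*x + B. The helper name and the values
# below are hypothetical; `Dim` is defined just after this and is only referenced when
# the helper is called, never at import time.
def _example_derived_dim():
    dx = Dim("dx", min=1, max=512)
    dy = 2 * dx + 1  # increasing linear expression in dx (A=2, B=1)
    # dy's range is fn mapped over dx's range: dy.min == 3, dy.max == 1025
    return dx, dy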


def Dim(name: str, *, min: Optional[int] = None, max: Optional[int] = None):
    """
    :func:`Dim` constructs a type analogous to a named symbolic integer with a range.
    It can be used to describe multiple possible values of a dynamic tensor dimension.
    Note that different dynamic dimensions of the same tensor, or of different tensors,
    can be described by the same type.

    Args:
        name (str): Human-readable name for debugging.
        min (Optional[int]): Minimum possible value of given symbol (inclusive)
        max (Optional[int]): Maximum possible value of given symbol (inclusive)

    Returns:
        A type that can be used in dynamic shape specifications for tensors.
    """
    _min = 0 if min is None else min
    _max = sys.maxsize - 1 if max is None else builtins.min(max, sys.maxsize - 1)
    assert _max > _min, f"Cannot create Dim with inconsistent min={min}, max={max}"
    dim = _Dim(name, (int,), {"min": _min, "max": _max})
    dim.__module__ = getattr(
        inspect.getmodule(inspect.stack()[1][0]), "__name__", "__main__"
    )
    return dim


def dims(*names: str, min: Optional[int] = None, max: Optional[int] = None):
    """
    Util to create multiple :func:`Dim` types.
    """
    return tuple(Dim(name, min=min, max=max) for name in names)
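

# Illustrative sketch (documentation only): building a dynamic_shapes spec out of
# Dim/dims for use with torch.export.export. The helper name, the "pixels" key, and
# the chosen bounds are hypothetical, not part of this module's API.
def _example_dim_spec():
    batch = Dim("batch", max=1024)
    height, width = dims("height", "width", min=16)
    # For a model whose forward takes a rank-4 argument named `pixels`:
    # dim 0 may vary up to 1024, dims 2 and 3 may vary with a minimum of 16,
    # and dim 1 (channels) stays static.
    return {"pixels": {0: batch, 2: height, 3: width}}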


@dataclasses.dataclass
class _ConstraintTarget:
    """
    This represents input tensor dimensions. Don't create this
    class directly; instead, use :func:`dynamic_dim`.
    """

    w_tensor: Any  # weakref to the tensor
    t_id: int  # id() of the tensor
    dim: int  # index of the dimension


class _ConstraintFactory(type):
    """
    Metaclass that ensures a private constructor for :class:`_Constraint`
    """

    def __call__(cls, *args, **kwargs):
        raise TypeError(
            f"{cls.__module__}.{cls.__qualname__} has no public constructor. "
            f"Please use torch.export.dynamic_dim() to create one"
        )

    def _create(
        cls, w_tensor, t_id, dim, constraint_range, shared=None, debug_name=None
    ):
        return super().__call__(
            w_tensor, t_id, dim, constraint_range, shared, debug_name
        )


def _create_constraint(
    w_tensor, t_id, dim, constraint_range, shared=None, debug_name=None
):
    return _Constraint._create(
        w_tensor, t_id, dim, constraint_range, shared, debug_name
    )


@dataclasses.dataclass
class _Constraint(_ConstraintTarget, metaclass=_ConstraintFactory):
    """
    .. warning::
        Do not construct :class:`_Constraint` directly, use :func:`dynamic_dim` instead.

    This represents constraints on input tensor dimensions, e.g., requiring
    them to be fully polymorphic or within some range.
    """

    constraint_range: "StrictMinMaxConstraint"
    # Set when this constraint is specified equal to another dynamic dimension
    # (see __eq__ below).
    shared: Optional[_ConstraintTarget] = None
    debug_name: Optional[str] = None

    def _clone_with_range(self, lower=0, upper=None):
        from torch.fx.experimental.symbolic_shapes import StrictMinMaxConstraint
        from torch.utils._sympy.value_ranges import ValueRanges

        if upper is None:
            upper = sys.maxsize - 1

        constraint_range = StrictMinMaxConstraint(
            vr=self.constraint_range.vr & ValueRanges(lower=lower, upper=upper),
            warn_only=False,
        )
        return _create_constraint(
            self.w_tensor,
            self.t_id,
            self.dim,
            constraint_range,
            self.shared,
            self.debug_name,
        )

    def __ge__(self, lower):
        return self._clone_with_range(lower=lower)

    def __gt__(self, lower):
        return self._clone_with_range(lower=lower + 1)

    def __le__(self, upper):
        return self._clone_with_range(upper=upper)

    def __lt__(self, upper):
        return self._clone_with_range(upper=upper - 1)

    def __bool__(self):
        # Compound expressions like `a <= dynamic_dim(t, 0) <= b` implicitly call
        # bool() on the intermediate comparison, and __bool__ must return an actual
        # True/False, so they cannot be supported; raise instead of silently
        # mis-evaluating them.
        raise TypeError(
            "Cannot determine truth value of _Constraint. "
            "If you are trying to combine _Constraint's with logical connectives, "
            "you can specify them separately instead."
        )

    @property
    def serializable_spec(self):
        # A serialization-friendly summary of this constraint: the tensor id, the
        # dimension index, and the range bounds.
        return {
            "t_id": self.t_id,
            "dim": self.dim,
            "min": self.constraint_range.vr.lower,
            "max": self.constraint_range.vr.upper,
        }

    def __eq__(self, other):
        if not isinstance(other, _Constraint):
            raise TypeError(
                "A dynamic dim can be specified equal only to another dynamic dim. "
                f"Equality with {type(other)} is not supported."
            )

        from torch.fx.experimental.symbolic_shapes import StrictMinMaxConstraint

        constraint_range = StrictMinMaxConstraint(
            vr=self.constraint_range.vr & other.constraint_range.vr,
            warn_only=False,
        )
        if self.debug_name is None:
            debug_name = other.debug_name
        else:
            assert other.debug_name is None or self.debug_name == other.debug_name
            debug_name = self.debug_name
        return _create_constraint(
            self.w_tensor,
            self.t_id,
            self.dim,
            constraint_range,
            shared=_ConstraintTarget(other.w_tensor, other.t_id, other.dim),
            debug_name=debug_name,
        )


@dataclasses.dataclass
class _PhantomRoot:
    """
    This represents the root of a derived Dim where the root does not directly
    specify the shape of any input dimension, but the derived Dim does.

    e.g., the input shapes 2*dim and dim + 1 are related via a "phantom" dim.

    The fields `name`, `constraint_range`, and `val` carried by a phantom root
    help create a symbol for it. Any derived dims with this phantom root are
    backed by expressions over this symbol.
    """

    name: str
    constraint_range: "StrictMinMaxConstraint"
    val: int


@dataclasses.dataclass
class _DerivedConstraint(_ConstraintTarget):
    """
    This represents a derived Dim, whose root is either a regular constraint target
    (which directly specifies the shape of some input dimension) or a phantom root
    (which does so indirectly).
    """

    # Unlike _Constraint, derived constraints do not carry a `shared` target;
    # equality is expressed by reusing the same (derived or regular) Dim.
    root: Union[_ConstraintTarget, _PhantomRoot]
    fn: Callable
    constraint_range: "StrictMinMaxConstraint"
    debug_name: Optional[str] = None

    @property
    def shared(self):
        # Present so that code expecting a Constraint (see the union below) can read
        # `shared` uniformly; derived constraints never share.
        return None

    @property
    def serializable_spec(self):
        # same form as _Constraint.serializable_spec
        return {
            "t_id": self.t_id,
            "dim": self.dim,
            "min": self.constraint_range.vr.lower,
            "max": self.constraint_range.vr.upper,
        }


Constraint = Union[_Constraint, _DerivedConstraint]


def dynamic_dim(t: torch.Tensor, index: int, debug_name: Optional[str] = None):
    """
    .. warning::
        (This feature is DEPRECATED. See :func:`Dim` instead.)

    :func:`dynamic_dim` constructs a :class:`_Constraint` object that describes the dynamism of
    a dimension ``index`` of tensor ``t``. :class:`_Constraint` objects should be passed to the
    ``constraints`` argument of :func:`export`.

    Args:
        t (torch.Tensor): Example input tensor that has dynamic dimension size(s)
        index (int): Index of dynamic dimension

    Returns:
        A :class:`_Constraint` object that describes shape dynamism. It can be passed to :func:`export` so
        that :func:`export` does not assume a static size for the specified tensor, i.e. keeping it dynamic
        as a symbolic size rather than specializing according to the size of the example tracing input.

    Specifically :func:`dynamic_dim` can be used to express the following types of dynamism.

    - Size of a dimension is dynamic and unbounded::

        t0 = torch.rand(2, 3)
        t1 = torch.rand(3, 4)

        # First dimension of t0 can be dynamic size rather than always being static size 2
        constraints = [dynamic_dim(t0, 0)]
        ep = export(fn, (t0, t1), constraints=constraints)

    - Size of a dimension is dynamic with a lower bound::

        t0 = torch.rand(10, 3)
        t1 = torch.rand(3, 4)

        # First dimension of t0 can be dynamic size with a lower bound of 5 (inclusive)
        # Second dimension of t1 can be dynamic size with a lower bound of 2 (exclusive)
        constraints = [
            dynamic_dim(t0, 0) >= 5,
            dynamic_dim(t1, 1) > 2,
        ]
        ep = export(fn, (t0, t1), constraints=constraints)

    - Size of a dimension is dynamic with an upper bound::

        t0 = torch.rand(10, 3)
        t1 = torch.rand(3, 4)

        # First dimension of t0 can be dynamic size with an upper bound of 16 (inclusive)
        # Second dimension of t1 can be dynamic size with an upper bound of 8 (exclusive)
        constraints = [
            dynamic_dim(t0, 0) <= 16,
            dynamic_dim(t1, 1) < 8,
        ]
        ep = export(fn, (t0, t1), constraints=constraints)

    - Size of a dimension is dynamic and it is always equal to the size of another dynamic dimension::

        t0 = torch.rand(10, 3)
        t1 = torch.rand(3, 4)

        # Sizes of the second dimension of t0 and the first dimension of t1 are always equal
        constraints = [
            dynamic_dim(t0, 1) == dynamic_dim(t1, 0),
        ]
        ep = export(fn, (t0, t1), constraints=constraints)

    - Mix and match all types above as long as they do not express conflicting requirements

    """
    from torch._dynamo.exc import UserError, UserErrorType

    if not isinstance(t, torch.Tensor):
        raise UserError(
            UserErrorType.DYNAMIC_DIM,
            f"Expected tensor as input to dynamic_dim but got {type(t)}",
        )

    if t.dim() < 1:
        raise UserError(
            UserErrorType.DYNAMIC_DIM, "Cannot mark 0-dimension tensors to be dynamic"
        )

    if index >= t.dim():
        raise UserError(
            UserErrorType.DYNAMIC_DIM,
            f"Expected the dimension passed to dynamic_dim to be in the range [0:{t.dim()-1}]"
            f" but got {index}, which is out of bounds for the given tensor.",
        )

    from torch.fx.experimental.symbolic_shapes import StrictMinMaxConstraint
    from torch.utils._sympy.value_ranges import ValueRanges

    return _create_constraint(
        weakref.ref(t),
        id(t),
        index,
        StrictMinMaxConstraint(
            vr=ValueRanges(lower=0, upper=sys.maxsize - 1), warn_only=False
        ),
        debug_name=debug_name,
    )


def _process_equalities(
    constraint: Constraint,
    get_sources: Callable[[int, int], List["Source"]],
    shape_env: "ShapeEnv",
    source_pairs: List[Tuple["Source", "Source"]],
    derived_equalities: List[Tuple["Source", Union["Source", "Symbol"], Callable]],
    phantom_symbols: Dict[str, "Symbol"],
):
    """
    Updates `source_pairs`, `derived_equalities`, and `phantom_symbols` (which become
    fields of `EqualityConstraint`) based on a given input `constraint`.
    """

    source, *other_sources = get_sources(constraint.t_id, constraint.dim)
    # When t.size()[dim] maps to src0, src1, ..., srcN, we add constraints that
    # make src0 "equal" to src1, ..., srcN.
    source_pairs.extend((source, other_source) for other_source in other_sources)
    if not isinstance(constraint, _DerivedConstraint):
        if constraint.shared is not None:
            # Moreover, when t.size()[dim] is specified equal to another dimension
            # that maps to src1', ..., srcN', we add constraints that also make
            # src0 "equal" to src1', ..., srcN'.
            other_sources = get_sources(constraint.shared.t_id, constraint.shared.dim)
            source_pairs.extend(
                (source, other_source) for other_source in other_sources
            )
    else:
        # branch based on the root of the _DerivedConstraint
        if not isinstance(constraint.root, _PhantomRoot):
            # the root directly describes an input dimension
            root = get_sources(constraint.root.t_id, constraint.root.dim)[0]
        else:
            # the root is a phantom symbol
            if constraint.root.name in phantom_symbols:
                root = phantom_symbols[constraint.root.name]
            else:
                # create a phantom symbol in the shape env based on the phantom root
                root = shape_env.create_symbol(
                    val=constraint.root.val,
                    source=torch._dynamo.source.ConstantSource(constraint.root.name),
                    dynamic_dim=torch.fx.experimental.symbolic_shapes.DimDynamic.DYNAMIC,
                    constraint_dim=constraint.root.constraint_range,
                )
                phantom_symbols[constraint.root.name] = root

        fn = constraint.fn
        # A derived equality (source, root, fn) informally says source = fn(root),
        # where root is either another input source or a phantom symbol.
        derived_equalities.append((source, root, fn))


def _tree_map(
    func: Callable[..., Any],
    tree: Any,
    *dynamic_shapes: Any,
) -> Any:
    """
    Customized tree_map for mapping pytrees to dynamic_shapes.

    For built-in types (e.g., standard collections) this behaves exactly like tree_map.

    OTOH for a user-defined class C registered with pytree, we cannot assume that a C
    containing tensors can be mapped to a C containing dynamic shapes (i.e., C may not
    be a polymorphic container). In that case we use the flattened form of C instead.
    Thus a C(**tensors) that flattens to (**tensors) will map to (**dynamic_shapes).

    Args:
        func: function to apply to each (int, float, str, bool, None, torch.Tensor)
        tree: input pytree
        dynamic_shapes: zero or more (typically one) dynamic_shapes to match

    Returns:
        output pytree mapping func to each (int, float, str, bool, None, torch.Tensor)
    """

    def is_leaf(t):
        # Anything that is not a built-in container type is treated as a leaf here:
        # primitives (int, float, str, bool, None, torch.Tensor) as well as
        # user-defined classes registered with pytree, which get special handling in f.
        return _get_node_type(t) not in BUILTIN_TYPES

    def f(t, *dynamic_shapes):
        typ = _get_node_type(t)
        # typ is not in BUILTIN_TYPES
        if typ in SUPPORTED_NODES:
            # thus typ is a user-defined class registered with pytree:
            # flatten it and recurse over its children
            return tree_map(
                f,
                SUPPORTED_NODES[typ].flatten_fn(t)[0],
                *dynamic_shapes,
                is_leaf=is_leaf,
            )
        else:
            return func(t, *dynamic_shapes)

    return tree_map(f, tree, *dynamic_shapes, is_leaf=is_leaf)
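

# Illustrative sketch (documentation only, hypothetical helper): for plain built-in
# containers, _tree_map pairs each tensor leaf with the matching dynamic_shapes entry
# and applies the given function to the pair.
def _example_tree_map():
    tree = {"x": torch.ones(2, 3), "others": [torch.ones(4), torch.ones(5)]}
    shapes = {"x": (None, None), "others": [{0: None}, None]}
    # Keep the shape entry for every tensor leaf; the result mirrors `shapes`.
    return _tree_map(lambda t, s: s, tree, shapes)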


def _combine_args(f, args, kwargs, _is_torch_jit_trace=False):
    # Combine args and kwargs into a single mapping keyed by parameter name,
    # following the signature of f, as they would appear in the body of f.
    if isinstance(f, ExportedProgram):
        f = f.module()
    if not _is_torch_jit_trace:
        signature = (
            inspect.signature(f.forward)
            if isinstance(f, torch.nn.Module)
            else inspect.signature(f)
        )
        kwargs = kwargs if kwargs is not None else {}
        return signature.bind(*args, **kwargs).arguments
    return args
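

# Illustrative sketch (documentation only, hypothetical helper): _combine_args binds
# positional and keyword example inputs to the callable's parameter names.
def _example_combine_args():
    def fn(x, y, *, scale=1):
        return (x + y) * scale

    # Returns a mapping like {'x': 1, 'y': 2, 'scale': 3}, keyed by fn's parameters.
    return _combine_args(fn, (1, 2), {"scale": 3})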


class ShapesCollection:
    """
    Builder for dynamic_shapes.
    Used to assign dynamic shape specifications to tensors that appear in inputs.

    Example::
        args = ({"x": tensor_x, "others": [tensor_y, tensor_z]},)

        dim = torch.export.Dim(...)
        dynamic_shapes = torch.export.ShapesCollection()
        dynamic_shapes[tensor_x] = (dim, dim + 1, 8)
        dynamic_shapes[tensor_y] = {0: dim * 2}
        # This is equivalent to the following (now auto-generated):
        # dynamic_shapes = {"x": (dim, dim + 1, 8), "others": [{0: dim * 2}, None]}

        torch.export.export(..., args, dynamic_shapes=dynamic_shapes)
    """

    def __init__(self):
        self._shapes = {}

    def __setitem__(self, t, shape):
        assert isinstance(
            t, torch.Tensor
        ), f"Cannot assign shape to non-tensor type {type(t)}"

        t_id = id(t)
        if t_id in self._shapes:
            _shape = self._shapes[t_id]
            assert (
                shape == _shape
            ), f"Shapes assigned to tensor do not match: expected {_shape}, got {shape}"
        else:
            self._shapes[id(t)] = shape

    def __getitem__(self, t):
        t_id = id(t)
        if t_id in self._shapes:
            return self._shapes[t_id]
        else:
            return None

    def __len__(self):
        return len(self._shapes)

    def dynamic_shapes(self, m, args, kwargs=None):
        """
        Generate dynamic_shapes.
        """

        t_ids = set()

        def find_shape(t):
            t_id = id(t)
            if t_id in self._shapes:
                t_ids.add(t_id)
                return self._shapes[t_id]
            else:
                return None

        combined_args = _combine_args(m, args, kwargs)
        dynamic_shapes = _tree_map(find_shape, combined_args)
        if any(t_id not in t_ids for t_id in self._shapes):
            raise ValueError(
                "Some tensors that were assigned shapes were not found in args. "
                "Maybe such tensors were copied when passing them as args? "
                "Maybe such tensors are contained in classes that were not registered with pytree?"
            )
        return dynamic_shapes
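

# Illustrative sketch (documentation only, hypothetical helper): assigning a shape
# spec to one input tensor of a plain function and generating the equivalent
# dynamic_shapes pytree.
def _example_shapes_collection():
    def fn(x, y):
        return x + y

    x, y = torch.ones(4, 4), torch.ones(4, 4)
    batch = Dim("batch", max=64)
    sc = ShapesCollection()
    sc[x] = {0: batch}
    # Produces a mapping like {"x": {0: batch}, "y": None}, keyed by fn's parameters.
    return sc.dynamic_shapes(fn, (x, y))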


def _process_dynamic_shapes(
    f: Callable,
    args: Tuple[Any, ...],
    kwargs: Optional[Dict[str, Any]] = None,
    dynamic_shapes: Optional[Union[Dict[str, Any], Tuple[Any], List[Any]]] = None,
    _is_torch_jit_trace=False,
) -> Optional[List[Constraint]]:
    from torch._dynamo.exc import UserError, UserErrorType

    if dynamic_shapes is None or len(dynamic_shapes) == 0:
        return None

    # map of Dim names to the list of constraints created for them
    symbols: Dict[str, List[Constraint]] = defaultdict(list)
    # track roots that do not directly represent input shape dimensions
    phantom_roots: Dict[str, _PhantomRoot] = {}
    derived_constraints_with_phantom_root: List[_DerivedConstraint] = []

    def to_constraint(dim, tensor, i):
        import sympy

        from torch.fx.experimental.symbolic_shapes import StrictMinMaxConstraint
        from torch.utils._sympy.solve import try_solve
        from torch.utils._sympy.value_ranges import ValueRanges

        def root_value():
            # given tensor.shape[i] == dim.fn(root), solve for the value of root
            symbol = sympy.Symbol(dim.root.__name__, integer=True)
            expr = dim.fn(symbol)
            solution = try_solve(sympy.Eq(expr, tensor.shape[i]), symbol)
            if solution is not None:
                return int(solution[1])
            else:
                raise UserError(
                    UserErrorType.CONSTRAINT_VIOLATION,
                    f"Expected shape[{i}] = {tensor.shape[i]} of input Tensor to be "
                    f"of the form {expr}, where {symbol} is an integer",
                )

        if isinstance(dim, _DerivedDim):
            # generate a _DerivedConstraint whose root is either a _ConstraintTarget
            # (when the root directly describes an input shape dimension) or a
            # _PhantomRoot (when it does not)
            dim_root = dim.root
            if dim_root.__name__ in symbols:
                # root represents an input shape dimension seen earlier
                root_constraint = symbols[dim_root.__name__][0]
                root = _ConstraintTarget(
                    root_constraint.w_tensor,
                    root_constraint.t_id,
                    root_constraint.dim,
                )
            elif dim_root.__name__ not in phantom_roots:
                # create a phantom root
                root = _PhantomRoot(
                    name=dim_root.__name__,
                    constraint_range=StrictMinMaxConstraint(
                        vr=ValueRanges(lower=dim_root.min, upper=dim_root.max),
                        warn_only=False,
                    ),
                    val=root_value(),
                )
                phantom_roots[dim_root.__name__] = root
            else:
                root = phantom_roots[dim_root.__name__]
            constraint = _DerivedConstraint(
                weakref.ref(tensor),
                id(tensor),
                i,
                root,
                dim.fn,
                StrictMinMaxConstraint(
                    vr=ValueRanges(lower=dim.min, upper=dim.max),
                    warn_only=False,
                ),
                debug_name=dim.__name__,
            )
            if isinstance(root, _PhantomRoot):
                # a later input may still provide a real source for this root,
                # in which case the phantom root is replaced below
                derived_constraints_with_phantom_root.append(constraint)
        elif isinstance(dim, _StaticDim):
            constraint = _create_constraint(
                weakref.ref(tensor),
                id(tensor),
                i,
                StrictMinMaxConstraint(
                    vr=ValueRanges(lower=dim.value, upper=dim.value), warn_only=False
                ),
                debug_name=dim.__name__,
            )
        else:
            constraint = dynamic_dim(tensor, i, debug_name=dim.__name__)
            if dim.min != 0:
                constraint = constraint >= dim.min
            if dim.max != sys.maxsize - 1:
                constraint = constraint <= dim.max
        return constraint

    bounds: Dict[str, Tuple[int, int]] = {}

    def check_same_bounds(dim):
        if dim.__name__ in symbols:
            min_, max_ = bounds[dim.__name__]
            if dim.min != min_ or dim.max != max_:
                this_ = _Dim.readable(dim.__name__, min_, max_)
                that_ = _Dim.readable(dim.__name__, dim.min, dim.max)
                raise UserError(
                    UserErrorType.INVALID_INPUT,
                    f"Found different definitions {this_} and {that_} "
                    f"for the same symbolic dimension {dim}!",
                )
        else:
            bounds[dim.__name__] = (dim.min, dim.max)

    def update_symbols(tensor, shape):
        def _create_static_dim(tensor, i, value):
            return _StaticDim(str(value), (int,), {"value": value})

        if isinstance(shape, dict):
            for i, dim in shape.items():
                if isinstance(dim, (int, _Dim)):
                    if isinstance(dim, int):
                        dim = _create_static_dim(tensor, i, dim)
                    check_same_bounds(dim)
                    constraint = to_constraint(dim, tensor, i)
                    symbols[dim.__name__].append(constraint)
                else:
                    if dim is not None:
                        raise UserError(
                            UserErrorType.INVALID_INPUT,
                            f"Unexpected item #{i} ({dim}) in dynamic_shape {shape} of Tensor, "
                            "try None instead",
                        )
        elif isinstance(shape, (tuple, list)):
            for i, dim in enumerate(shape):
                if isinstance(dim, (int, _Dim)):
                    if isinstance(dim, int):
                        dim = _create_static_dim(tensor, i, dim)
                    check_same_bounds(dim)
                    constraint = to_constraint(dim, tensor, i)
                    symbols[dim.__name__].append(constraint)
                else:
                    if dim is not None:
                        raise UserError(
                            UserErrorType.INVALID_INPUT,
                            f"Unexpected item #{i} ({dim}) in dynamic_shape {shape} of Tensor, "
                            "try None instead",
                        )
        else:
            if shape is not None:
                raise UserError(
                    UserErrorType.INVALID_INPUT,
                    f"Unexpected dynamic_shape {shape} of Tensor, try None instead",
                )

    def assoc_shapes(combined_args, dynamic_shapes):
        def assoc_shape(t, dynamic_shape):
            if isinstance(t, torch.Tensor):
                update_symbols(t, dynamic_shape)
            else:
                if dynamic_shape is not None:
                    raise UserError(
                        UserErrorType.INVALID_INPUT,
                        f"Cannot associate shape {dynamic_shape} to non-tensor type {type(t)}, "
                        f"expected None",
                    )

        _tree_map(assoc_shape, combined_args, dynamic_shapes)

    combined_args = _combine_args(
        f, args, kwargs, _is_torch_jit_trace=_is_torch_jit_trace
    )
    if not isinstance(dynamic_shapes, dict):
        assert isinstance(dynamic_shapes, (tuple, list))
        combined_args = type(dynamic_shapes)(combined_args.values())
    assoc_shapes(combined_args, dynamic_shapes)

    constraints = []
    for derived_constraint_with_phantom_root in derived_constraints_with_phantom_root:
        phantom_root_name = derived_constraint_with_phantom_root.root.name
        if phantom_root_name in symbols:
            # An actual input shape dimension uses this name, so the phantom root is
            # not needed after all: re-root the derived constraint on that dimension.
            # This keeps the invariant that phantom roots are really "phantom," i.e.,
            # they cannot be represented by any input source.
            derived_constraint_with_phantom_root.root = symbols[phantom_root_name][0]

    for dynamic_dims in symbols.values():
        if all(
            isinstance(dynamic_dim, _DerivedConstraint) for dynamic_dim in dynamic_dims
        ):
            constraints.extend(dynamic_dims)
        else:
            primary, *others = dynamic_dims
            if others:
                for other in others:
                    constraints.append(primary == other)
            else:
                constraints.append(primary)

    return constraints
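

# Illustrative sketch (documentation only, hypothetical helper): for a single tensor
# argument with one dynamic dimension, _process_dynamic_shapes produces one range
# constraint on that dimension and leaves the other dimension static.
def _example_process_dynamic_shapes():
    def fn(x):
        return x * 2

    x = torch.ones(4, 8)
    dim = Dim("dim", max=32)
    # Returns a list with a single _Constraint covering x.shape[0] with max 32.
    return _process_dynamic_shapes(fn, (x,), dynamic_shapes={"x": {0: dim}})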


def _get_dim_name_mapping(
    dynamic_shapes: Union[Dict[str, Any], Tuple[Any], List[Any], None]
):
    name_to_dim = {}
    for dim in tree_flatten(
        dynamic_shapes,
        is_leaf=lambda x: isinstance(x, _Dim),
    )[0]:
        if dim is None or isinstance(dim, int):
            continue
        name_to_dim[dim.__name__] = dim
        if isinstance(dim, _DerivedDim):
            name_to_dim[dim.root.__name__] = dim.root
    return name_to_dim


def refine_dynamic_shapes_from_suggested_fixes(
    msg: str,
    dynamic_shapes: Union[Dict[str, Any], Tuple[Any], List[Any]],
) -> Union[Dict[str, Any], Tuple[Any], List[Any]]:
    """
    For working with export's dynamic shapes suggested fixes, and/or automatic dynamic shapes.
    Refines the given dynamic shapes spec, given a ConstraintViolation error message and the original dynamic shapes.

    In most cases behavior is straightforward - i.e. for suggested fixes that specialize or refine a Dim's range,
    or fixes that suggest a derived relation, the new dynamic shapes spec will be updated as such.

    e.g.
    Suggested fixes:

        dim = Dim('dim', min=3, max=6) -> this just refines the dim's range
        dim = 4 -> this specializes to a constant
        dy = dx + 1 -> dy was specified as an independent dim, but is actually tied to dx with this relation

    However, suggested fixes associated with derived dims can be more complicated.
    For example, if a suggested fix is provided for a root dim, the new derived dim value is evaluated based on the root.

    e.g.
    dx = Dim('dx')
    dy = dx + 2
    dynamic_shapes = {"x": (dx,), "y": (dy,)}

    Suggested fixes:

        dx = 4  # specialization will lead to dy also specializing to 6
        dx = Dim('dx', max=6)  # dy now has max = 8

    Derived dims suggested fixes can also be used to express divisibility constraints.
    This involves creating new root dims that aren't tied to a particular input shape.
    In this case the root dims won't appear directly in the new spec, but as a root of
    one of the dims.

    e.g.
    Suggested fixes:

        _dx = Dim('_dx', max=1024)  # this won't appear in the return result, but dx will
        dx = 4*_dx  # dx is now divisible by 4, with a max value of 4096
    """

    import re

    import sympy

    from torch._dynamo.exc import UserError, UserErrorType
    from torch.fx.experimental.symbolic_shapes import _is_supported_equivalence

    try:
        shape_fixes_msg = msg.split("Suggested fixes:")[1].strip()
    except Exception as exc:
        raise UserError(
            UserErrorType.INVALID_INPUT,
            "Suggested fixes not found in error message given to refine_dynamic_shapes_from_suggested_fixes()",
        ) from exc

    # parse the suggested fixes into a name -> fix mapping
    shape_fixes = {}
    for fix in shape_fixes_msg.split("\n"):
        fix = fix.strip()
        if match := re.match(r"(.*) = Dim\('(.*)'.*\)", fix):
            name = match.group(1)
            _min, _max = None, None
            if match_min := re.match(r".* = Dim\('.*', min\=([0-9]+).*\)", fix):
                _min = int(match_min.group(1))
            if match_max := re.match(r".* = Dim\('.*'.*max\=([0-9]+)\)", fix):
                _max = int(match_max.group(1))
            shape_fixes[name] = Dim(name, min=_min, max=_max)
        else:
            name, expr = fix.split(" = ")
            expr = sympy.sympify(expr)
            if isinstance(expr, sympy.Number):
                shape_fixes[name] = int(expr)  # static, integer
            else:
                shape_fixes[name] = expr  # relation or derived dim

    name_to_dim = _get_dim_name_mapping(dynamic_shapes)

    # track roots referenced by derived-dim fixes (possibly new roots not in the spec)
    roots: Set[str] = set()
    for k, c in shape_fixes.items():
        assert isinstance(c, (int, _Dim, _DerivedDim, sympy.Expr))
        if isinstance(c, sympy.Expr):
            # check that the expression is a supported derived-dim relation
            assert _is_supported_equivalence(c)
            shape_fixes[k] = c
            roots.add(str(next(iter(c.free_symbols))))
        if isinstance(c, _DerivedDim):
            roots.add(c.root.__name__)

    # every fixed name must be an existing dim or a newly introduced root
    for k, c in shape_fixes.items():
        assert k in name_to_dim or k in roots

    # cache derived dims so that equal expressions map to the same object
    derived_dim_cache: Dict[str, _DerivedDim] = {}

    def apply_fixes(dim, dummy):
        if dim is None or isinstance(dim, int):  # not dynamic
            return dim
        elif dim.__name__ in shape_fixes:  # directly fix
            fix = shape_fixes[dim.__name__]
            if isinstance(fix, sympy.Expr):  # now derived or related
                if str(fix) in derived_dim_cache:
                    return derived_dim_cache[str(fix)]
                else:
                    symbol = next(iter(fix.free_symbols))
                    # locate the root dim for the expression's symbol
                    if symbol.name in shape_fixes:
                        root = shape_fixes[symbol.name]
                    else:
                        assert symbol.name in name_to_dim
                        root = name_to_dim[symbol.name]
                    # decompose the linear expression into coefficient and offset
                    modulus, remainder = sympy.polys.polytools.div(fix, symbol)
                    dim = root
                    if modulus != 1:
                        dim = int(modulus) * dim
                    if remainder != 0:
                        dim = dim + int(remainder)
                    derived_dim_cache[str(fix)] = dim
                    return dim
            else:
                return fix
        elif isinstance(dim, _DerivedDim) and dim.root.__name__ in shape_fixes:
            if dim.__name__ in derived_dim_cache:
                return derived_dim_cache[dim.__name__]
            else:
                # evaluate the new derived dim based on the fixed root
                _dim = dim.fn(shape_fixes[dim.root.__name__])
                derived_dim_cache[dim.__name__] = _dim
                return _dim
        return dim  # unchanged

    return _tree_map(apply_fixes, dynamic_shapes, dynamic_shapes)
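

# Illustrative sketch (documentation only, hypothetical helper): applying a
# suggested-fixes message to an existing spec tightens the root's range and
# re-evaluates the derived dim based on it.
def _example_refine_from_fixes():
    dx = Dim("dx", max=16)
    spec = {"x": (dx,), "y": (dx + 2,)}
    msg = "Constraint violation ...\nSuggested fixes:\n  dx = Dim('dx', max=6)"
    # dx's max is tightened to 6; the derived dim dx + 2 follows with max = 8.
    return refine_dynamic_shapes_from_suggested_fixes(msg, spec)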