Sam Chaudry

Upload folder using huggingface_hub

7885a28 verified about 1 month ago

17.5 kB

	import numpy as np
	from scipy.linalg import lu_factor, lu_solve
	from scipy.sparse import issparse, csc_matrix, eye
	from scipy.sparse.linalg import splu
	from scipy.optimize._numdiff import group_columns
	from .common import (validate_max_step, validate_tol, select_initial_step,
	norm, EPS, num_jac, validate_first_step,
	warn_extraneous)
	from .base import OdeSolver, DenseOutput


	MAX_ORDER = 5
	NEWTON_MAXITER = 4
	MIN_FACTOR = 0.2
	MAX_FACTOR = 10


	def compute_R(order, factor):
	"""Compute the matrix for changing the differences array."""
	I = np.arange(1, order + 1)[:, None]
	J = np.arange(1, order + 1)
	M = np.zeros((order + 1, order + 1))
	M[1:, 1:] = (I - 1 - factor * J) / I
	M[0] = 1
	return np.cumprod(M, axis=0)


	def change_D(D, order, factor):
	"""Change differences array in-place when step size is changed."""
	R = compute_R(order, factor)
	U = compute_R(order, 1)
	RU = R.dot(U)
	D[:order + 1] = np.dot(RU.T, D[:order + 1])


	def solve_bdf_system(fun, t_new, y_predict, c, psi, LU, solve_lu, scale, tol):
	"""Solve the algebraic system resulting from BDF method."""
	d = 0
	y = y_predict.copy()
	dy_norm_old = None
	converged = False
	for k in range(NEWTON_MAXITER):
	f = fun(t_new, y)
	if not np.all(np.isfinite(f)):
	break

	dy = solve_lu(LU, c * f - psi - d)
	dy_norm = norm(dy / scale)

	if dy_norm_old is None:
	rate = None
	else:
	rate = dy_norm / dy_norm_old

	if (rate is not None and (rate >= 1 or
	rate ** (NEWTON_MAXITER - k) / (1 - rate) * dy_norm > tol)):
	break

	y += dy
	d += dy

	if (dy_norm == 0 or
	rate is not None and rate / (1 - rate) * dy_norm < tol):
	converged = True
	break

	dy_norm_old = dy_norm

	return converged, k + 1, y, d


	class BDF(OdeSolver):
	"""Implicit method based on backward-differentiation formulas.

	This is a variable order method with the order varying automatically from
	1 to 5. The general framework of the BDF algorithm is described in [1]_.
	This class implements a quasi-constant step size as explained in [2]_.
	The error estimation strategy for the constant-step BDF is derived in [3]_.
	An accuracy enhancement using modified formulas (NDF) [2]_ is also implemented.

	Can be applied in the complex domain.

	Parameters
	----------
	fun : callable
	Right-hand side of the system: the time derivative of the state ``y``
	at time ``t``. The calling signature is ``fun(t, y)``, where ``t`` is a
	scalar and ``y`` is an ndarray with ``len(y) = len(y0)``. ``fun`` must
	return an array of the same shape as ``y``. See `vectorized` for more
	information.
	t0 : float
	Initial time.
	y0 : array_like, shape (n,)
	Initial state.
	t_bound : float
	Boundary time - the integration won't continue beyond it. It also
	determines the direction of the integration.
	first_step : float or None, optional
	Initial step size. Default is ``None`` which means that the algorithm
	should choose.
	max_step : float, optional
	Maximum allowed step size. Default is np.inf, i.e., the step size is not
	bounded and determined solely by the solver.
	rtol, atol : float and array_like, optional
	Relative and absolute tolerances. The solver keeps the local error
	estimates less than ``atol + rtol * abs(y)``. Here `rtol` controls a
	relative accuracy (number of correct digits), while `atol` controls
	absolute accuracy (number of correct decimal places). To achieve the
	desired `rtol`, set `atol` to be smaller than the smallest value that
	can be expected from ``rtol * abs(y)`` so that `rtol` dominates the
	allowable error. If `atol` is larger than ``rtol * abs(y)`` the
	number of correct digits is not guaranteed. Conversely, to achieve the
	desired `atol` set `rtol` such that ``rtol * abs(y)`` is always smaller
	than `atol`. If components of y have different scales, it might be
	beneficial to set different `atol` values for different components by
	passing array_like with shape (n,) for `atol`. Default values are
	1e-3 for `rtol` and 1e-6 for `atol`.
	jac : {None, array_like, sparse_matrix, callable}, optional
	Jacobian matrix of the right-hand side of the system with respect to y,
	required by this method. The Jacobian matrix has shape (n, n) and its
	element (i, j) is equal to ``d f_i / d y_j``.
	There are three ways to define the Jacobian:

	* If array_like or sparse_matrix, the Jacobian is assumed to
	be constant.
	* If callable, the Jacobian is assumed to depend on both
	t and y; it will be called as ``jac(t, y)`` as necessary.
	For the 'Radau' and 'BDF' methods, the return value might be a
	sparse matrix.
	* If None (default), the Jacobian will be approximated by
	finite differences.

	It is generally recommended to provide the Jacobian rather than
	relying on a finite-difference approximation.
	jac_sparsity : {None, array_like, sparse matrix}, optional
	Defines a sparsity structure of the Jacobian matrix for a
	finite-difference approximation. Its shape must be (n, n). This argument
	is ignored if `jac` is not `None`. If the Jacobian has only few non-zero
	elements in each row, providing the sparsity structure will greatly
	speed up the computations [4]_. A zero entry means that a corresponding
	element in the Jacobian is always zero. If None (default), the Jacobian
	is assumed to be dense.
	vectorized : bool, optional
	Whether `fun` can be called in a vectorized fashion. Default is False.

	If ``vectorized`` is False, `fun` will always be called with ``y`` of
	shape ``(n,)``, where ``n = len(y0)``.

	If ``vectorized`` is True, `fun` may be called with ``y`` of shape
	``(n, k)``, where ``k`` is an integer. In this case, `fun` must behave
	such that ``fun(t, y)[:, i] == fun(t, y[:, i])`` (i.e. each column of
	the returned array is the time derivative of the state corresponding
	with a column of ``y``).

	Setting ``vectorized=True`` allows for faster finite difference
	approximation of the Jacobian by this method, but may result in slower
	execution overall in some circumstances (e.g. small ``len(y0)``).

	Attributes
	----------
	n : int
	Number of equations.
	status : string
	Current status of the solver: 'running', 'finished' or 'failed'.
	t_bound : float
	Boundary time.
	direction : float
	Integration direction: +1 or -1.
	t : float
	Current time.
	y : ndarray
	Current state.
	t_old : float
	Previous time. None if no steps were made yet.
	step_size : float
	Size of the last successful step. None if no steps were made yet.
	nfev : int
	Number of evaluations of the right-hand side.
	njev : int
	Number of evaluations of the Jacobian.
	nlu : int
	Number of LU decompositions.

	References
	----------
	.. [1] G. D. Byrne, A. C. Hindmarsh, "A Polyalgorithm for the Numerical
	Solution of Ordinary Differential Equations", ACM Transactions on
	Mathematical Software, Vol. 1, No. 1, pp. 71-96, March 1975.
	.. [2] L. F. Shampine, M. W. Reichelt, "THE MATLAB ODE SUITE", SIAM J. SCI.
	COMPUTE., Vol. 18, No. 1, pp. 1-22, January 1997.
	.. [3] E. Hairer, G. Wanner, "Solving Ordinary Differential Equations I:
	Nonstiff Problems", Sec. III.2.
	.. [4] A. Curtis, M. J. D. Powell, and J. Reid, "On the estimation of
	sparse Jacobian matrices", Journal of the Institute of Mathematics
	and its Applications, 13, pp. 117-120, 1974.
	"""
	def __init__(self, fun, t0, y0, t_bound, max_step=np.inf,
	rtol=1e-3, atol=1e-6, jac=None, jac_sparsity=None,
	vectorized=False, first_step=None, **extraneous):
	warn_extraneous(extraneous)
	super().__init__(fun, t0, y0, t_bound, vectorized,
	support_complex=True)
	self.max_step = validate_max_step(max_step)
	self.rtol, self.atol = validate_tol(rtol, atol, self.n)
	f = self.fun(self.t, self.y)
	if first_step is None:
	self.h_abs = select_initial_step(self.fun, self.t, self.y,
	t_bound, max_step, f,
	self.direction, 1,
	self.rtol, self.atol)
	else:
	self.h_abs = validate_first_step(first_step, t0, t_bound)
	self.h_abs_old = None
	self.error_norm_old = None

	self.newton_tol = max(10 * EPS / rtol, min(0.03, rtol ** 0.5))

	self.jac_factor = None
	self.jac, self.J = self._validate_jac(jac, jac_sparsity)
	if issparse(self.J):
	def lu(A):
	self.nlu += 1
	return splu(A)

	def solve_lu(LU, b):
	return LU.solve(b)

	I = eye(self.n, format='csc', dtype=self.y.dtype)
	else:
	def lu(A):
	self.nlu += 1
	return lu_factor(A, overwrite_a=True)

	def solve_lu(LU, b):
	return lu_solve(LU, b, overwrite_b=True)

	I = np.identity(self.n, dtype=self.y.dtype)

	self.lu = lu
	self.solve_lu = solve_lu
	self.I = I

	kappa = np.array([0, -0.1850, -1/9, -0.0823, -0.0415, 0])
	self.gamma = np.hstack((0, np.cumsum(1 / np.arange(1, MAX_ORDER + 1))))
	self.alpha = (1 - kappa) * self.gamma
	self.error_const = kappa * self.gamma + 1 / np.arange(1, MAX_ORDER + 2)

	D = np.empty((MAX_ORDER + 3, self.n), dtype=self.y.dtype)
	D[0] = self.y
	D[1] = f * self.h_abs * self.direction
	self.D = D

	self.order = 1
	self.n_equal_steps = 0
	self.LU = None

	def _validate_jac(self, jac, sparsity):
	t0 = self.t
	y0 = self.y

	if jac is None:
	if sparsity is not None:
	if issparse(sparsity):
	sparsity = csc_matrix(sparsity)
	groups = group_columns(sparsity)
	sparsity = (sparsity, groups)

	def jac_wrapped(t, y):
	self.njev += 1
	f = self.fun_single(t, y)
	J, self.jac_factor = num_jac(self.fun_vectorized, t, y, f,
	self.atol, self.jac_factor,
	sparsity)
	return J
	J = jac_wrapped(t0, y0)
	elif callable(jac):
	J = jac(t0, y0)
	self.njev += 1
	if issparse(J):
	J = csc_matrix(J, dtype=y0.dtype)

	def jac_wrapped(t, y):
	self.njev += 1
	return csc_matrix(jac(t, y), dtype=y0.dtype)
	else:
	J = np.asarray(J, dtype=y0.dtype)

	def jac_wrapped(t, y):
	self.njev += 1
	return np.asarray(jac(t, y), dtype=y0.dtype)

	if J.shape != (self.n, self.n):
	raise ValueError(f"`jac` is expected to have shape {(self.n, self.n)},"
	f" but actually has {J.shape}.")
	else:
	if issparse(jac):
	J = csc_matrix(jac, dtype=y0.dtype)
	else:
	J = np.asarray(jac, dtype=y0.dtype)

	if J.shape != (self.n, self.n):
	raise ValueError(f"`jac` is expected to have shape {(self.n, self.n)},"
	f" but actually has {J.shape}.")
	jac_wrapped = None

	return jac_wrapped, J

	def _step_impl(self):
	t = self.t
	D = self.D

	max_step = self.max_step
	min_step = 10 * np.abs(np.nextafter(t, self.direction * np.inf) - t)
	if self.h_abs > max_step:
	h_abs = max_step
	change_D(D, self.order, max_step / self.h_abs)
	self.n_equal_steps = 0
	elif self.h_abs < min_step:
	h_abs = min_step
	change_D(D, self.order, min_step / self.h_abs)
	self.n_equal_steps = 0
	else:
	h_abs = self.h_abs

	atol = self.atol
	rtol = self.rtol
	order = self.order

	alpha = self.alpha
	gamma = self.gamma
	error_const = self.error_const

	J = self.J
	LU = self.LU
	current_jac = self.jac is None

	step_accepted = False
	while not step_accepted:
	if h_abs < min_step:
	return False, self.TOO_SMALL_STEP

	h = h_abs * self.direction
	t_new = t + h

	if self.direction * (t_new - self.t_bound) > 0:
	t_new = self.t_bound
	change_D(D, order, np.abs(t_new - t) / h_abs)
	self.n_equal_steps = 0
	LU = None

	h = t_new - t
	h_abs = np.abs(h)

	y_predict = np.sum(D[:order + 1], axis=0)

	scale = atol + rtol * np.abs(y_predict)
	psi = np.dot(D[1: order + 1].T, gamma[1: order + 1]) / alpha[order]

	converged = False
	c = h / alpha[order]
	while not converged:
	if LU is None:
	LU = self.lu(self.I - c * J)

	converged, n_iter, y_new, d = solve_bdf_system(
	self.fun, t_new, y_predict, c, psi, LU, self.solve_lu,
	scale, self.newton_tol)

	if not converged:
	if current_jac:
	break
	J = self.jac(t_new, y_predict)
	LU = None
	current_jac = True

	if not converged:
	factor = 0.5
	h_abs *= factor
	change_D(D, order, factor)
	self.n_equal_steps = 0
	LU = None
	continue

	safety = 0.9 * (2 * NEWTON_MAXITER + 1) / (2 * NEWTON_MAXITER
	+ n_iter)

	scale = atol + rtol * np.abs(y_new)
	error = error_const[order] * d
	error_norm = norm(error / scale)

	if error_norm > 1:
	factor = max(MIN_FACTOR,
	safety * error_norm ** (-1 / (order + 1)))
	h_abs *= factor
	change_D(D, order, factor)
	self.n_equal_steps = 0
	# As we didn't have problems with convergence, we don't
	# reset LU here.
	else:
	step_accepted = True

	self.n_equal_steps += 1

	self.t = t_new
	self.y = y_new

	self.h_abs = h_abs
	self.J = J
	self.LU = LU

	# Update differences. The principal relation here is
	# D^{j + 1} y_n = D^{j} y_n - D^{j} y_{n - 1}. Keep in mind that D
	# contained difference for previous interpolating polynomial and
	# d = D^{k + 1} y_n. Thus this elegant code follows.
	D[order + 2] = d - D[order + 1]
	D[order + 1] = d
	for i in reversed(range(order + 1)):
	D[i] += D[i + 1]

	if self.n_equal_steps < order + 1:
	return True, None

	if order > 1:
	error_m = error_const[order - 1] * D[order]
	error_m_norm = norm(error_m / scale)
	else:
	error_m_norm = np.inf

	if order < MAX_ORDER:
	error_p = error_const[order + 1] * D[order + 2]
	error_p_norm = norm(error_p / scale)
	else:
	error_p_norm = np.inf

	error_norms = np.array([error_m_norm, error_norm, error_p_norm])
	with np.errstate(divide='ignore'):
	factors = error_norms ** (-1 / np.arange(order, order + 3))

	delta_order = np.argmax(factors) - 1
	order += delta_order
	self.order = order

	factor = min(MAX_FACTOR, safety * np.max(factors))
	self.h_abs *= factor
	change_D(D, order, factor)
	self.n_equal_steps = 0
	self.LU = None

	return True, None

	def _dense_output_impl(self):
	return BdfDenseOutput(self.t_old, self.t, self.h_abs * self.direction,
	self.order, self.D[:self.order + 1].copy())


	class BdfDenseOutput(DenseOutput):
	def __init__(self, t_old, t, h, order, D):
	super().__init__(t_old, t)
	self.order = order
	self.t_shift = self.t - h * np.arange(self.order)
	self.denom = h * (1 + np.arange(self.order))
	self.D = D

	def _call_impl(self, t):
	if t.ndim == 0:
	x = (t - self.t_shift) / self.denom
	p = np.cumprod(x)
	else:
	x = (t - self.t_shift[:, None]) / self.denom[:, None]
	p = np.cumprod(x, axis=0)

	y = np.dot(self.D[1:].T, p)
	if y.ndim == 1:
	y += self.D[0]
	else:
	y += self.D[0, :, None]

	return y