GameServerZ

Running

App Files Files Community

GameServerZ / MLPY /Lib /site-packages /mpmath /libmp /gammazeta.py

Kano001

Upload 1329 files

b200bda verified 10 months ago

raw

history blame

71.5 kB

	"""
	-----------------------------------------------------------------------
	This module implements gamma- and zeta-related functions:

	* Bernoulli numbers
	* Factorials
	* The gamma function
	* Polygamma functions
	* Harmonic numbers
	* The Riemann zeta function
	* Constants related to these functions

	-----------------------------------------------------------------------
	"""

	import math
	import sys

	from .backend import xrange
	from .backend import MPZ, MPZ_ZERO, MPZ_ONE, MPZ_THREE, gmpy

	from .libintmath import list_primes, ifac, ifac2, moebius

	from .libmpf import (\
	round_floor, round_ceiling, round_down, round_up,
	round_nearest, round_fast,
	lshift, sqrt_fixed, isqrt_fast,
	fzero, fone, fnone, fhalf, ftwo, finf, fninf, fnan,
	from_int, to_int, to_fixed, from_man_exp, from_rational,
	mpf_pos, mpf_neg, mpf_abs, mpf_add, mpf_sub,
	mpf_mul, mpf_mul_int, mpf_div, mpf_sqrt, mpf_pow_int,
	mpf_rdiv_int,
	mpf_perturb, mpf_le, mpf_lt, mpf_gt, mpf_shift,
	negative_rnd, reciprocal_rnd,
	bitcount, to_float, mpf_floor, mpf_sign, ComplexResult
	)

	from .libelefun import (\
	constant_memo,
	def_mpf_constant,
	mpf_pi, pi_fixed, ln2_fixed, log_int_fixed, mpf_ln2,
	mpf_exp, mpf_log, mpf_pow, mpf_cosh,
	mpf_cos_sin, mpf_cosh_sinh, mpf_cos_sin_pi, mpf_cos_pi, mpf_sin_pi,
	ln_sqrt2pi_fixed, mpf_ln_sqrt2pi, sqrtpi_fixed, mpf_sqrtpi,
	cos_sin_fixed, exp_fixed
	)

	from .libmpc import (\
	mpc_zero, mpc_one, mpc_half, mpc_two,
	mpc_abs, mpc_shift, mpc_pos, mpc_neg,
	mpc_add, mpc_sub, mpc_mul, mpc_div,
	mpc_add_mpf, mpc_mul_mpf, mpc_div_mpf, mpc_mpf_div,
	mpc_mul_int, mpc_pow_int,
	mpc_log, mpc_exp, mpc_pow,
	mpc_cos_pi, mpc_sin_pi,
	mpc_reciprocal, mpc_square,
	mpc_sub_mpf
	)



	# Catalan's constant is computed using Lupas's rapidly convergent series
	# (listed on http://mathworld.wolfram.com/CatalansConstant.html)
	# oo
	# ___ n-1 8n 2 3 2
	# 1 \ (-1) 2 (40n - 24n + 3) [(2n)!] (n!)
	# K = --- ) -----------------------------------------
	# 64 /___ 3 2
	# n (2n-1) [(4n)!]
	# n = 1

	@constant_memo
	def catalan_fixed(prec):
	prec = prec + 20
	a = one = MPZ_ONE << prec
	s, t, n = 0, 1, 1
	while t:
	a = 32 n*3 (2*n-1)
	a //= (3-16n+16n2)2
	t = a * (-1)*(n-1) (40n2-24n+3) // (n*3 (2*n-1))
	s += t
	n += 1
	return s >> (20 + 6)

	# Khinchin's constant is relatively difficult to compute. Here
	# we use the rational zeta series

	# oo 2*n-1
	# ___ ___
	# \ ` zeta(2*n)-1 \ ` (-1)^(k+1)
	# log(K)*log(2) = ) ------------ ) ----------
	# /___. n /___. k
	# n = 1 k = 1

	# which adds half a digit per term. The essential trick for achieving
	# reasonable efficiency is to recycle both the values of the zeta
	# function (essentially Bernoulli numbers) and the partial terms of
	# the inner sum.

	# An alternative might be to use K = 2*exp[1/log(2) X] where

	# / 1 1 [ pix(1-x^2) ]
	# X = \| ------ log [ ------------ ].
	# / 0 x(1+x) [ sin(pi*x) ]

	# and integrate numerically. In practice, this seems to be slightly
	# slower than the zeta series at high precision.

	@constant_memo
	def khinchin_fixed(prec):
	wp = int(prec + prec**0.5 + 15)
	s = MPZ_ZERO
	fac = from_int(4)
	t = ONE = MPZ_ONE << wp
	pi = mpf_pi(wp)
	pipow = twopi2 = mpf_shift(mpf_mul(pi, pi, wp), 2)
	n = 1
	while 1:
	zeta2n = mpf_abs(mpf_bernoulli(2*n, wp))
	zeta2n = mpf_mul(zeta2n, pipow, wp)
	zeta2n = mpf_div(zeta2n, fac, wp)
	zeta2n = to_fixed(zeta2n, wp)
	term = (((zeta2n - ONE) * t) // n) >> wp
	if term < 100:
	break
	#if not n % 10:
	# print n, math.log(int(abs(term)))
	s += term
	t += ONE//(2n+1) - ONE//(2n)
	n += 1
	fac = mpf_mul_int(fac, (2n)(2*n-1), wp)
	pipow = mpf_mul(pipow, twopi2, wp)
	s = (s << wp) // ln2_fixed(wp)
	K = mpf_exp(from_man_exp(s, -wp), wp)
	K = to_fixed(K, prec)
	return K


	# Glaisher's constant is defined as A = exp(1/2 - zeta'(-1)).
	# One way to compute it would be to perform direct numerical
	# differentiation, but computing arbitrary Riemann zeta function
	# values at high precision is expensive. We instead use the formula

	# A = exp((6 (-zeta'(2))/pi^2 + log 2 pi + gamma)/12)

	# and compute zeta'(2) from the series representation

	# oo
	# ___
	# \ log k
	# -zeta'(2) = ) -----
	# /___ 2
	# k
	# k = 2

	# This series converges exceptionally slowly, but can be accelerated
	# using Euler-Maclaurin formula. The important insight is that the
	# E-M integral can be done in closed form and that the high order
	# are given by

	# n / \
	# d \| log x \| a + b log x
	# --- \| ----- \| = -----------
	# n \| 2 \| 2 + n
	# dx \ x / x

	# where a and b are integers given by a simple recurrence. Note
	# that just one logarithm is needed. However, lots of integer
	# logarithms are required for the initial summation.

	# This algorithm could possibly be turned into a faster algorithm
	# for general evaluation of zeta(s) or zeta'(s); this should be
	# looked into.

	@constant_memo
	def glaisher_fixed(prec):
	wp = prec + 30
	# Number of direct terms to sum before applying the Euler-Maclaurin
	# formula to the tail. TODO: choose more intelligently
	N = int(0.33*prec + 5)
	ONE = MPZ_ONE << wp
	# Euler-Maclaurin, step 1: sum log(k)/k**2 for k from 2 to N-1
	s = MPZ_ZERO
	for k in range(2, N):
	#print k, N
	s += log_int_fixed(k, wp) // k**2
	logN = log_int_fixed(N, wp)
	#logN = to_fixed(mpf_log(from_int(N), wp+20), wp)
	# E-M step 2: integral of log(x)/x**2 from N to inf
	s += (ONE + logN) // N
	# E-M step 3: endpoint correction term f(N)/2
	s += logN // (N*2 2)
	# E-M step 4: the series of derivatives
	pN = N**3
	a = 1
	b = -2
	j = 3
	fac = from_int(2)
	k = 1
	while 1:
	# D(2k-1) B(2k) / fac(2k) [D(n) = nth derivative]
	D = ((a << wp) + b*logN) // pN
	D = from_man_exp(D, -wp)
	B = mpf_bernoulli(2*k, wp)
	term = mpf_mul(B, D, wp)
	term = mpf_div(term, fac, wp)
	term = to_fixed(term, wp)
	if abs(term) < 100:
	break
	#if not k % 10:
	# print k, math.log(int(abs(term)), 10)
	s -= term
	# Advance derivative twice
	a, b, pN, j = b-aj, -jb, pN*N, j+1
	a, b, pN, j = b-aj, -jb, pN*N, j+1
	k += 1
	fac = mpf_mul_int(fac, (2k)(2*k-1), wp)
	# A = exp((6s/pi2 + log(2pi) + euler)/12)
	pi = pi_fixed(wp)
	s *= 6
	s = (s << wp) // (pi**2 >> wp)
	s += euler_fixed(wp)
	s += to_fixed(mpf_log(from_man_exp(2*pi, -wp), wp), wp)
	s //= 12
	A = mpf_exp(from_man_exp(s, -wp), wp)
	return to_fixed(A, prec)

	# Apery's constant can be computed using the very rapidly convergent
	# series
	# oo
	# ___ 2 10
	# \ n 205 n + 250 n + 77 (n!)
	# zeta(3) = ) (-1) ------------------- ----------
	# /___ 64 5
	# n = 0 ((2n+1)!)

	@constant_memo
	def apery_fixed(prec):
	prec += 20
	d = MPZ_ONE << prec
	term = MPZ(77) << prec
	n = 1
	s = MPZ_ZERO
	while term:
	s += term
	d = (n*10)
	d //= (((2n+1)5) (2n)*5)
	term = (-1)*n (205(n2) + 250n + 77) * d
	n += 1
	return s >> (20 + 6)

	"""
	Euler's constant (gamma) is computed using the Brent-McMillan formula,
	gamma ~= I(n)/J(n) - log(n), where

	I(n) = sum_{k=0,1,2,...} (nk / k!)2 * H(k)
	J(n) = sum_{k=0,1,2,...} (nk / k!)2
	H(k) = 1 + 1/2 + 1/3 + ... + 1/k

	The error is bounded by O(exp(-4n)). Choosing n to be a power
	of two, 2**p, the logarithm becomes particularly easy to calculate.[1]

	We use the formulation of Algorithm 3.9 in [2] to make the summation
	more efficient.

	Reference:
	[1] Xavier Gourdon & Pascal Sebah, The Euler constant: gamma
	http://numbers.computation.free.fr/Constants/Gamma/gamma.pdf

	[2] [BorweinBailey]_
	"""

	@constant_memo
	def euler_fixed(prec):
	extra = 30
	prec += extra
	# choose p such that exp(-4(2p)) < 2*-n
	p = int(math.log((prec/4) * math.log(2), 2)) + 1
	n = 2**p
	A = U = -p*ln2_fixed(prec)
	B = V = MPZ_ONE << prec
	k = 1
	while 1:
	B = Bn2//k*2
	A = (An*2//k + B)//k
	U += A
	V += B
	if max(abs(A), abs(B)) < 100:
	break
	k += 1
	return (U<<(prec-extra))//V

	# Use zeta accelerated formulas for the Mertens and twin
	# prime constants; see
	# http://mathworld.wolfram.com/MertensConstant.html
	# http://mathworld.wolfram.com/TwinPrimesConstant.html

	@constant_memo
	def mertens_fixed(prec):
	wp = prec + 20
	m = 2
	s = mpf_euler(wp)
	while 1:
	t = mpf_zeta_int(m, wp)
	if t == fone:
	break
	t = mpf_log(t, wp)
	t = mpf_mul_int(t, moebius(m), wp)
	t = mpf_div(t, from_int(m), wp)
	s = mpf_add(s, t)
	m += 1
	return to_fixed(s, prec)

	@constant_memo
	def twinprime_fixed(prec):
	def I(n):
	return sum(moebius(d)<<(n//d) for d in xrange(1,n+1) if not n%d)//n
	wp = 2*prec + 30
	res = fone
	primes = [from_rational(1,p,wp) for p in [2,3,5,7]]
	ppowers = [mpf_mul(p,p,wp) for p in primes]
	n = 2
	while 1:
	a = mpf_zeta_int(n, wp)
	for i in range(4):
	a = mpf_mul(a, mpf_sub(fone, ppowers[i]), wp)
	ppowers[i] = mpf_mul(ppowers[i], primes[i], wp)
	a = mpf_pow_int(a, -I(n), wp)
	if mpf_pos(a, prec+10, 'n') == fone:
	break
	#from libmpf import to_str
	#print n, to_str(mpf_sub(fone, a), 6)
	res = mpf_mul(res, a, wp)
	n += 1
	res = mpf_mul(res, from_int(31535), wp)
	res = mpf_div(res, from_int(41636), wp)
	return to_fixed(res, prec)


	mpf_euler = def_mpf_constant(euler_fixed)
	mpf_apery = def_mpf_constant(apery_fixed)
	mpf_khinchin = def_mpf_constant(khinchin_fixed)
	mpf_glaisher = def_mpf_constant(glaisher_fixed)
	mpf_catalan = def_mpf_constant(catalan_fixed)
	mpf_mertens = def_mpf_constant(mertens_fixed)
	mpf_twinprime = def_mpf_constant(twinprime_fixed)


	#-----------------------------------------------------------------------#
	# #
	# Bernoulli numbers #
	# #
	#-----------------------------------------------------------------------#

	MAX_BERNOULLI_CACHE = 3000


	r"""
	Small Bernoulli numbers and factorials are used in numerous summations,
	so it is critical for speed that sequential computation is fast and that
	values are cached up to a fairly high threshold.

	On the other hand, we also want to support fast computation of isolated
	large numbers. Currently, no such acceleration is provided for integer
	factorials (though it is for large floating-point factorials, which are
	computed via gamma if the precision is low enough).

	For sequential computation of Bernoulli numbers, we use Ramanujan's formula

	/ n + 3 \
	B = (A(n) - S(n)) / \| \|
	n \ n /

	where A(n) = (n+3)/3 when n = 0 or 2 (mod 6), A(n) = -(n+3)/6
	when n = 4 (mod 6), and

	[n/6]
	___
	\ / n + 3 \
	S(n) = ) \| \| * B
	/___ \ n - 6k / n-6k
	k = 1

	For isolated large Bernoulli numbers, we use the Riemann zeta function
	to calculate a numerical value for B_n. The von Staudt-Clausen theorem
	can then be used to optionally find the exact value of the
	numerator and denominator.
	"""

	bernoulli_cache = {}
	f3 = from_int(3)
	f6 = from_int(6)

	def bernoulli_size(n):
	"""Accurately estimate the size of B_n (even n > 2 only)"""
	lgn = math.log(n,2)
	return int(2.326 + 0.5lgn + n(lgn - 4.094))

	BERNOULLI_PREC_CUTOFF = bernoulli_size(MAX_BERNOULLI_CACHE)

	def mpf_bernoulli(n, prec, rnd=None):
	"""Computation of Bernoulli numbers (numerically)"""
	if n < 2:
	if n < 0:
	raise ValueError("Bernoulli numbers only defined for n >= 0")
	if n == 0:
	return fone
	if n == 1:
	return mpf_neg(fhalf)
	# For odd n > 1, the Bernoulli numbers are zero
	if n & 1:
	return fzero
	# If precision is extremely high, we can save time by computing
	# the Bernoulli number at a lower precision that is sufficient to
	# obtain the exact fraction, round to the exact fraction, and
	# convert the fraction back to an mpf value at the original precision
	if prec > BERNOULLI_PREC_CUTOFF and prec > bernoulli_size(n)*1.1 + 1000:
	p, q = bernfrac(n)
	return from_rational(p, q, prec, rnd or round_floor)
	if n > MAX_BERNOULLI_CACHE:
	return mpf_bernoulli_huge(n, prec, rnd)
	wp = prec + 30
	# Reuse nearby precisions
	wp += 32 - (prec & 31)
	cached = bernoulli_cache.get(wp)
	if cached:
	numbers, state = cached
	if n in numbers:
	if not rnd:
	return numbers[n]
	return mpf_pos(numbers[n], prec, rnd)
	m, bin, bin1 = state
	if n - m > 10:
	return mpf_bernoulli_huge(n, prec, rnd)
	else:
	if n > 10:
	return mpf_bernoulli_huge(n, prec, rnd)
	numbers = {0:fone}
	m, bin, bin1 = state = [2, MPZ(10), MPZ_ONE]
	bernoulli_cache[wp] = (numbers, state)
	while m <= n:
	#print m
	case = m % 6
	# Accurately estimate size of B_m so we can use
	# fixed point math without using too much precision
	szbm = bernoulli_size(m)
	s = 0
	sexp = max(0, szbm) - wp
	if m < 6:
	a = MPZ_ZERO
	else:
	a = bin1
	for j in xrange(1, m//6+1):
	usign, uman, uexp, ubc = u = numbers[m-6*j]
	if usign:
	uman = -uman
	s += lshift(a*uman, uexp-sexp)
	# Update inner binomial coefficient
	j6 = 6*j
	a = ((m-5-j6)(m-4-j6)(m-3-j6)(m-2-j6)(m-1-j6)(m-j6))
	a //= ((4+j6)(5+j6)(6+j6)(7+j6)(8+j6)*(9+j6))
	if case == 0: b = mpf_rdiv_int(m+3, f3, wp)
	if case == 2: b = mpf_rdiv_int(m+3, f3, wp)
	if case == 4: b = mpf_rdiv_int(-m-3, f6, wp)
	s = from_man_exp(s, sexp, wp)
	b = mpf_div(mpf_sub(b, s, wp), from_int(bin), wp)
	numbers[m] = b
	m += 2
	# Update outer binomial coefficient
	bin = bin * ((m+2)(m+3)) // (m(m-1))
	if m > 6:
	bin1 = bin1 * ((2+m)(3+m)) // ((m-7)(m-6))
	state[:] = [m, bin, bin1]
	return numbers[n]

	def mpf_bernoulli_huge(n, prec, rnd=None):
	wp = prec + 10
	piprec = wp + int(math.log(n,2))
	v = mpf_gamma_int(n+1, wp)
	v = mpf_mul(v, mpf_zeta_int(n, wp), wp)
	v = mpf_mul(v, mpf_pow_int(mpf_pi(piprec), -n, wp))
	v = mpf_shift(v, 1-n)
	if not n & 3:
	v = mpf_neg(v)
	return mpf_pos(v, prec, rnd or round_fast)

	def bernfrac(n):
	r"""
	Returns a tuple of integers `(p, q)` such that `p/q = B_n` exactly,
	where `B_n` denotes the `n`-th Bernoulli number. The fraction is
	always reduced to lowest terms. Note that for `n > 1` and `n` odd,
	`B_n = 0`, and `(0, 1)` is returned.

	Examples

	The first few Bernoulli numbers are exactly::

	>>> from mpmath import *
	>>> for n in range(15):
	... p, q = bernfrac(n)
	... print("%s %s/%s" % (n, p, q))
	...
	0 1/1
	1 -1/2
	2 1/6
	3 0/1
	4 -1/30
	5 0/1
	6 1/42
	7 0/1
	8 -1/30
	9 0/1
	10 5/66
	11 0/1
	12 -691/2730
	13 0/1
	14 7/6

	This function works for arbitrarily large `n`::

	>>> p, q = bernfrac(10**4)
	>>> print(q)
	2338224387510
	>>> print(len(str(p)))
	27692
	>>> mp.dps = 15
	>>> print(mpf(p) / q)
	-9.04942396360948e+27677
	>>> print(bernoulli(10**4))
	-9.04942396360948e+27677

	.. note ::

	:func:`~mpmath.bernoulli` computes a floating-point approximation
	directly, without computing the exact fraction first.
	This is much faster for large `n`.

	Algorithm

	:func:`~mpmath.bernfrac` works by computing the value of `B_n` numerically
	and then using the von Staudt-Clausen theorem [1] to reconstruct
	the exact fraction. For large `n`, this is significantly faster than
	computing `B_1, B_2, \ldots, B_2` recursively with exact arithmetic.
	The implementation has been tested for `n = 10^m` up to `m = 6`.

	In practice, :func:`~mpmath.bernfrac` appears to be about three times
	slower than the specialized program calcbn.exe [2]

	References

	1. MathWorld, von Staudt-Clausen Theorem:
	http://mathworld.wolfram.com/vonStaudt-ClausenTheorem.html

	2. The Bernoulli Number Page:
	http://www.bernoulli.org/

	"""
	n = int(n)
	if n < 3:
	return [(1, 1), (-1, 2), (1, 6)][n]
	if n & 1:
	return (0, 1)
	q = 1
	for k in list_primes(n+1):
	if not (n % (k-1)):
	q *= k
	prec = bernoulli_size(n) + int(math.log(q,2)) + 20
	b = mpf_bernoulli(n, prec)
	p = mpf_mul(b, from_int(q))
	pint = to_int(p, round_nearest)
	return (pint, q)


	#-----------------------------------------------------------------------#
	# #
	# Polygamma functions #
	# #
	#-----------------------------------------------------------------------#

	r"""
	For all polygamma (psi) functions, we use the Euler-Maclaurin summation
	formula. It looks slightly different in the m = 0 and m > 0 cases.

	For m = 0, we have
	oo
	___ B
	(0) 1 \ 2 k -2 k
	psi (z) ~ log z + --- - ) ------ z
	2 z /___ (2 k)!
	k = 1

	Experiment shows that the minimum term of the asymptotic series
	reaches 2^(-p) when Re(z) > 0.11*p. So we simply use the recurrence
	for psi (equivalent, in fact, to summing to the first few terms
	directly before applying E-M) to obtain z large enough.

	Since, very crudely, log z ~= 1 for Re(z) > 1, we can use
	fixed-point arithmetic (if z is extremely large, log(z) itself
	is a sufficient approximation, so we can stop there already).

	For Re(z) << 0, we could use recurrence, but this is of course
	inefficient for large negative z, so there we use the
	reflection formula instead.

	For m > 0, we have

	N - 1
	___
	~~~(m) [ \ 1 ] 1 1
	psi (z) ~ [ ) -------- ] + ---------- + -------- +
	[ /___ m+1 ] m+1 m
	k = 1 (z+k) ] 2 (z+N) m (z+N)

	oo
	___ B
	\ 2 k (m+1) (m+2) ... (m+2k-1)
	+ ) ------ ------------------------
	/___ (2 k)! m + 2 k
	k = 1 (z+N)

	where ~~~ denotes the function rescaled by 1/((-1)^(m+1) m!).

	Here again N is chosen to make z+N large enough for the minimum
	term in the last series to become smaller than eps.

	TODO: the current estimation of N for m > 0 is very suboptimal.

	TODO: implement the reflection formula for m > 0, Re(z) << 0.
	It is generally a combination of multiple cotangents. Need to
	figure out a reasonably simple way to generate these formulas
	on the fly.

	TODO: maybe use exact algorithms to compute psi for integral
	and certain rational arguments, as this can be much more
	efficient. (On the other hand, the availability of these
	special values provides a convenient way to test the general
	algorithm.)
	"""

	# Harmonic numbers are just shifted digamma functions
	# We should calculate these exactly when x is an integer
	# and when doing so is faster.

	def mpf_harmonic(x, prec, rnd):
	if x in (fzero, fnan, finf):
	return x
	a = mpf_psi0(mpf_add(fone, x, prec+5), prec)
	return mpf_add(a, mpf_euler(prec+5, rnd), prec, rnd)

	def mpc_harmonic(z, prec, rnd):
	if z[1] == fzero:
	return (mpf_harmonic(z[0], prec, rnd), fzero)
	a = mpc_psi0(mpc_add_mpf(z, fone, prec+5), prec)
	return mpc_add_mpf(a, mpf_euler(prec+5, rnd), prec, rnd)

	def mpf_psi0(x, prec, rnd=round_fast):
	"""
	Computation of the digamma function (psi function of order 0)
	of a real argument.
	"""
	sign, man, exp, bc = x
	wp = prec + 10
	if not man:
	if x == finf: return x
	if x == fninf or x == fnan: return fnan
	if x == fzero or (exp >= 0 and sign):
	raise ValueError("polygamma pole")
	# Near 0 -- fixed-point arithmetic becomes bad
	if exp+bc < -5:
	v = mpf_psi0(mpf_add(x, fone, prec, rnd), prec, rnd)
	return mpf_sub(v, mpf_div(fone, x, wp, rnd), prec, rnd)
	# Reflection formula
	if sign and exp+bc > 3:
	c, s = mpf_cos_sin_pi(x, wp)
	q = mpf_mul(mpf_div(c, s, wp), mpf_pi(wp), wp)
	p = mpf_psi0(mpf_sub(fone, x, wp), wp)
	return mpf_sub(p, q, prec, rnd)
	# The logarithmic term is accurate enough
	if (not sign) and bc + exp > wp:
	return mpf_log(mpf_sub(x, fone, wp), prec, rnd)
	# Initial recurrence to obtain a large enough x
	m = to_int(x)
	n = int(0.11*wp) + 2
	s = MPZ_ZERO
	x = to_fixed(x, wp)
	one = MPZ_ONE << wp
	if m < n:
	for k in xrange(m, n):
	s -= (one << wp) // x
	x += one
	x -= one
	# Logarithmic term
	s += to_fixed(mpf_log(from_man_exp(x, -wp, wp), wp), wp)
	# Endpoint term in Euler-Maclaurin expansion
	s += (one << wp) // (2*x)
	# Euler-Maclaurin remainder sum
	x2 = (x*x) >> wp
	t = one
	prev = 0
	k = 1
	while 1:
	t = (t*x2) >> wp
	bsign, bman, bexp, bbc = mpf_bernoulli(2*k, wp)
	offset = (bexp + 2*wp)
	if offset >= 0: term = (bman << offset) // (t(2k))
	else: term = (bman >> (-offset)) // (t(2k))
	if k & 1: s -= term
	else: s += term
	if k > 2 and term >= prev:
	break
	prev = term
	k += 1
	return from_man_exp(s, -wp, wp, rnd)

	def mpc_psi0(z, prec, rnd=round_fast):
	"""
	Computation of the digamma function (psi function of order 0)
	of a complex argument.
	"""
	re, im = z
	# Fall back to the real case
	if im == fzero:
	return (mpf_psi0(re, prec, rnd), fzero)
	wp = prec + 20
	sign, man, exp, bc = re
	# Reflection formula
	if sign and exp+bc > 3:
	c = mpc_cos_pi(z, wp)
	s = mpc_sin_pi(z, wp)
	q = mpc_mul_mpf(mpc_div(c, s, wp), mpf_pi(wp), wp)
	p = mpc_psi0(mpc_sub(mpc_one, z, wp), wp)
	return mpc_sub(p, q, prec, rnd)
	# Just the logarithmic term
	if (not sign) and bc + exp > wp:
	return mpc_log(mpc_sub(z, mpc_one, wp), prec, rnd)
	# Initial recurrence to obtain a large enough z
	w = to_int(re)
	n = int(0.11*wp) + 2
	s = mpc_zero
	if w < n:
	for k in xrange(w, n):
	s = mpc_sub(s, mpc_reciprocal(z, wp), wp)
	z = mpc_add_mpf(z, fone, wp)
	z = mpc_sub(z, mpc_one, wp)
	# Logarithmic and endpoint term
	s = mpc_add(s, mpc_log(z, wp), wp)
	s = mpc_add(s, mpc_div(mpc_half, z, wp), wp)
	# Euler-Maclaurin remainder sum
	z2 = mpc_square(z, wp)
	t = mpc_one
	prev = mpc_zero
	szprev = fzero
	k = 1
	eps = mpf_shift(fone, -wp+2)
	while 1:
	t = mpc_mul(t, z2, wp)
	bern = mpf_bernoulli(2*k, wp)
	term = mpc_mpf_div(bern, mpc_mul_int(t, 2*k, wp), wp)
	s = mpc_sub(s, term, wp)
	szterm = mpc_abs(term, 10)
	if k > 2 and (mpf_le(szterm, eps) or mpf_le(szprev, szterm)):
	break
	prev = term
	szprev = szterm
	k += 1
	return s

	# Currently unoptimized
	def mpf_psi(m, x, prec, rnd=round_fast):
	"""
	Computation of the polygamma function of arbitrary integer order
	m >= 0, for a real argument x.
	"""
	if m == 0:
	return mpf_psi0(x, prec, rnd=round_fast)
	return mpc_psi(m, (x, fzero), prec, rnd)[0]

	def mpc_psi(m, z, prec, rnd=round_fast):
	"""
	Computation of the polygamma function of arbitrary integer order
	m >= 0, for a complex argument z.
	"""
	if m == 0:
	return mpc_psi0(z, prec, rnd)
	re, im = z
	wp = prec + 20
	sign, man, exp, bc = re
	if not im[1]:
	if im in (finf, fninf, fnan):
	return (fnan, fnan)
	if not man:
	if re == finf and im == fzero:
	return (fzero, fzero)
	if re == fnan:
	return (fnan, fnan)
	# Recurrence
	w = to_int(re)
	n = int(0.4wp + 4m)
	s = mpc_zero
	if w < n:
	for k in xrange(w, n):
	t = mpc_pow_int(z, -m-1, wp)
	s = mpc_add(s, t, wp)
	z = mpc_add_mpf(z, fone, wp)
	zm = mpc_pow_int(z, -m, wp)
	z2 = mpc_pow_int(z, -2, wp)
	# 1/m*(z+N)^m
	integral_term = mpc_div_mpf(zm, from_int(m), wp)
	s = mpc_add(s, integral_term, wp)
	# 1/2*(z+N)^(-(m+1))
	s = mpc_add(s, mpc_mul_mpf(mpc_div(zm, z, wp), fhalf, wp), wp)
	a = m + 1
	b = 2
	k = 1
	# Important: we want to sum up to the relative error,
	# not the absolute error, because psi^(m)(z) might be tiny
	magn = mpc_abs(s, 10)
	magn = magn[2]+magn[3]
	eps = mpf_shift(fone, magn-wp+2)
	while 1:
	zm = mpc_mul(zm, z2, wp)
	bern = mpf_bernoulli(2*k, wp)
	scal = mpf_mul_int(bern, a, wp)
	scal = mpf_div(scal, from_int(b), wp)
	term = mpc_mul_mpf(zm, scal, wp)
	s = mpc_add(s, term, wp)
	szterm = mpc_abs(term, 10)
	if k > 2 and mpf_le(szterm, eps):
	break
	#print k, to_str(szterm, 10), to_str(eps, 10)
	a = (m+2k)(m+2k+1)
	b = (2k+1)(2k+2)
	k += 1
	# Scale and sign factor
	v = mpc_mul_mpf(s, mpf_gamma(from_int(m+1), wp), prec, rnd)
	if not (m & 1):
	v = mpf_neg(v[0]), mpf_neg(v[1])
	return v


	#-----------------------------------------------------------------------#
	# #
	# Riemann zeta function #
	# #
	#-----------------------------------------------------------------------#

	r"""
	We use zeta(s) = eta(s) / (1 - 2**(1-s)) and Borwein's approximation

	n-1
	___ k
	-1 \ (-1) (d_k - d_n)
	eta(s) ~= ---- ) ------------------
	d_n /___ s
	k = 0 (k + 1)
	where
	k
	___ i
	\ (n + i - 1)! 4
	d_k = n ) ---------------.
	/___ (n - i)! (2i)!
	i = 0

	If s = a + b*I, the absolute error for eta(s) is bounded by

	3 (1 + 2\|b\|)
	------------ * exp(\|b\| pi/2)
	n
	(3+sqrt(8))

	Disregarding the linear term, we have approximately,

	log(err) ~= log(exp(1.58\|b\|)) - log(5.8*n)
	log(err) ~= 1.58\|b\| - log(5.8)n
	log(err) ~= 1.58\|b\| - 1.76n
	log2(err) ~= 2.28\|b\| - 2.54n

	So for p bits, we should choose n > (p + 2.28*\|b\|) / 2.54.

	References:
	-----------

	Peter Borwein, "An Efficient Algorithm for the Riemann Zeta Function"
	http://www.cecm.sfu.ca/personal/pborwein/PAPERS/P117.ps

	http://en.wikipedia.org/wiki/Dirichlet_eta_function
	"""

	borwein_cache = {}

	def borwein_coefficients(n):
	if n in borwein_cache:
	return borwein_cache[n]
	ds = [MPZ_ZERO] * (n+1)
	d = MPZ_ONE
	s = ds[0] = MPZ_ONE
	for i in range(1, n+1):
	d = d * 4 * (n+i-1) * (n-i+1)
	d //= ((2i) ((2*i)-1))
	s += d
	ds[i] = s
	borwein_cache[n] = ds
	return ds

	ZETA_INT_CACHE_MAX_PREC = 1000
	zeta_int_cache = {}

	def mpf_zeta_int(s, prec, rnd=round_fast):
	"""
	Optimized computation of zeta(s) for an integer s.
	"""
	wp = prec + 20
	s = int(s)
	if s in zeta_int_cache and zeta_int_cache[s][0] >= wp:
	return mpf_pos(zeta_int_cache[s][1], prec, rnd)
	if s < 2:
	if s == 1:
	raise ValueError("zeta(1) pole")
	if not s:
	return mpf_neg(fhalf)
	return mpf_div(mpf_bernoulli(-s+1, wp), from_int(s-1), prec, rnd)
	# 2^-s term vanishes?
	if s >= wp:
	return mpf_perturb(fone, 0, prec, rnd)
	# 5^-s term vanishes?
	elif s >= wp*0.431:
	t = one = 1 << wp
	t += 1 << (wp - s)
	t += one // (MPZ_THREE ** s)
	t += 1 << max(0, wp - s*2)
	return from_man_exp(t, -wp, prec, rnd)
	else:
	# Fast enough to sum directly?
	# Even better, we use the Euler product (idea stolen from pari)
	m = (float(wp)/(s-1) + 1)
	if m < 30:
	needed_terms = int(2.0**m + 1)
	if needed_terms < int(wp/2.54 + 5) / 10:
	t = fone
	for k in list_primes(needed_terms):
	#print k, needed_terms
	powprec = int(wp - s*math.log(k,2))
	if powprec < 2:
	break
	a = mpf_sub(fone, mpf_pow_int(from_int(k), -s, powprec), wp)
	t = mpf_mul(t, a, wp)
	return mpf_div(fone, t, wp)
	# Use Borwein's algorithm
	n = int(wp/2.54 + 5)
	d = borwein_coefficients(n)
	t = MPZ_ZERO
	s = MPZ(s)
	for k in xrange(n):
	t += (((-1)*k (d[k] - d[n])) << wp) // (k+1)**s
	t = (t << wp) // (-d[n])
	t = (t << wp) // ((1 << wp) - (1 << (wp+1-s)))
	if (s in zeta_int_cache and zeta_int_cache[s][0] < wp) or (s not in zeta_int_cache):
	zeta_int_cache[s] = (wp, from_man_exp(t, -wp-wp))
	return from_man_exp(t, -wp-wp, prec, rnd)

	def mpf_zeta(s, prec, rnd=round_fast, alt=0):
	sign, man, exp, bc = s
	if not man:
	if s == fzero:
	if alt:
	return fhalf
	else:
	return mpf_neg(fhalf)
	if s == finf:
	return fone
	return fnan
	wp = prec + 20
	# First term vanishes?
	if (not sign) and (exp + bc > (math.log(wp,2) + 2)):
	return mpf_perturb(fone, alt, prec, rnd)
	# Optimize for integer arguments
	elif exp >= 0:
	if alt:
	if s == fone:
	return mpf_ln2(prec, rnd)
	z = mpf_zeta_int(to_int(s), wp, negative_rnd[rnd])
	q = mpf_sub(fone, mpf_pow(ftwo, mpf_sub(fone, s, wp), wp), wp)
	return mpf_mul(z, q, prec, rnd)
	else:
	return mpf_zeta_int(to_int(s), prec, rnd)
	# Negative: use the reflection formula
	# Borwein only proves the accuracy bound for x >= 1/2. However, based on
	# tests, the accuracy without reflection is quite good even some distance
	# to the left of 1/2. XXX: verify this.
	if sign:
	# XXX: could use the separate refl. formula for Dirichlet eta
	if alt:
	q = mpf_sub(fone, mpf_pow(ftwo, mpf_sub(fone, s, wp), wp), wp)
	return mpf_mul(mpf_zeta(s, wp), q, prec, rnd)
	# XXX: -1 should be done exactly
	y = mpf_sub(fone, s, 10*wp)
	a = mpf_gamma(y, wp)
	b = mpf_zeta(y, wp)
	c = mpf_sin_pi(mpf_shift(s, -1), wp)
	wp2 = wp + max(0,exp+bc)
	pi = mpf_pi(wp+wp2)
	d = mpf_div(mpf_pow(mpf_shift(pi, 1), s, wp2), pi, wp2)
	return mpf_mul(a,mpf_mul(b,mpf_mul(c,d,wp),wp),prec,rnd)

	# Near pole
	r = mpf_sub(fone, s, wp)
	asign, aman, aexp, abc = mpf_abs(r)
	pole_dist = -2*(aexp+abc)
	if pole_dist > wp:
	if alt:
	return mpf_ln2(prec, rnd)
	else:
	q = mpf_neg(mpf_div(fone, r, wp))
	return mpf_add(q, mpf_euler(wp), prec, rnd)
	else:
	wp += max(0, pole_dist)

	t = MPZ_ZERO
	#wp += 16 - (prec & 15)
	# Use Borwein's algorithm
	n = int(wp/2.54 + 5)
	d = borwein_coefficients(n)
	t = MPZ_ZERO
	sf = to_fixed(s, wp)
	ln2 = ln2_fixed(wp)
	for k in xrange(n):
	u = (-sf*log_int_fixed(k+1, wp, ln2)) >> wp
	#esign, eman, eexp, ebc = mpf_exp(u, wp)
	#offset = eexp + wp
	#if offset >= 0:
	# w = ((d[k] - d[n]) * eman) << offset
	#else:
	# w = ((d[k] - d[n]) * eman) >> (-offset)
	eman = exp_fixed(u, wp, ln2)
	w = (d[k] - d[n]) * eman
	if k & 1:
	t -= w
	else:
	t += w
	t = t // (-d[n])
	t = from_man_exp(t, -wp, wp)
	if alt:
	return mpf_pos(t, prec, rnd)
	else:
	q = mpf_sub(fone, mpf_pow(ftwo, mpf_sub(fone, s, wp), wp), wp)
	return mpf_div(t, q, prec, rnd)

	def mpc_zeta(s, prec, rnd=round_fast, alt=0, force=False):
	re, im = s
	if im == fzero:
	return mpf_zeta(re, prec, rnd, alt), fzero

	# slow for large s
	if (not force) and mpf_gt(mpc_abs(s, 10), from_int(prec)):
	raise NotImplementedError

	wp = prec + 20

	# Near pole
	r = mpc_sub(mpc_one, s, wp)
	asign, aman, aexp, abc = mpc_abs(r, 10)
	pole_dist = -2*(aexp+abc)
	if pole_dist > wp:
	if alt:
	q = mpf_ln2(wp)
	y = mpf_mul(q, mpf_euler(wp), wp)
	g = mpf_shift(mpf_mul(q, q, wp), -1)
	g = mpf_sub(y, g)
	z = mpc_mul_mpf(r, mpf_neg(g), wp)
	z = mpc_add_mpf(z, q, wp)
	return mpc_pos(z, prec, rnd)
	else:
	q = mpc_neg(mpc_div(mpc_one, r, wp))
	q = mpc_add_mpf(q, mpf_euler(wp), wp)
	return mpc_pos(q, prec, rnd)
	else:
	wp += max(0, pole_dist)

	# Reflection formula. To be rigorous, we should reflect to the left of
	# re = 1/2 (see comments for mpf_zeta), but this leads to unnecessary
	# slowdown for interesting values of s
	if mpf_lt(re, fzero):
	# XXX: could use the separate refl. formula for Dirichlet eta
	if alt:
	q = mpc_sub(mpc_one, mpc_pow(mpc_two, mpc_sub(mpc_one, s, wp),
	wp), wp)
	return mpc_mul(mpc_zeta(s, wp), q, prec, rnd)
	# XXX: -1 should be done exactly
	y = mpc_sub(mpc_one, s, 10*wp)
	a = mpc_gamma(y, wp)
	b = mpc_zeta(y, wp)
	c = mpc_sin_pi(mpc_shift(s, -1), wp)
	rsign, rman, rexp, rbc = re
	isign, iman, iexp, ibc = im
	mag = max(rexp+rbc, iexp+ibc)
	wp2 = wp + max(0, mag)
	pi = mpf_pi(wp+wp2)
	pi2 = (mpf_shift(pi, 1), fzero)
	d = mpc_div_mpf(mpc_pow(pi2, s, wp2), pi, wp2)
	return mpc_mul(a,mpc_mul(b,mpc_mul(c,d,wp),wp),prec,rnd)
	n = int(wp/2.54 + 5)
	n += int(0.9*abs(to_int(im)))
	d = borwein_coefficients(n)
	ref = to_fixed(re, wp)
	imf = to_fixed(im, wp)
	tre = MPZ_ZERO
	tim = MPZ_ZERO
	one = MPZ_ONE << wp
	one_2wp = MPZ_ONE << (2*wp)
	critical_line = re == fhalf
	ln2 = ln2_fixed(wp)
	pi2 = pi_fixed(wp-1)
	wp2 = wp+wp
	for k in xrange(n):
	log = log_int_fixed(k+1, wp, ln2)
	# A square root is much cheaper than an exp
	if critical_line:
	w = one_2wp // isqrt_fast((k+1) << wp2)
	else:
	w = exp_fixed((-ref*log) >> wp, wp)
	if k & 1:
	w *= (d[n] - d[k])
	else:
	w *= (d[k] - d[n])
	wre, wim = cos_sin_fixed((-imf*log)>>wp, wp, pi2)
	tre += (w * wre) >> wp
	tim += (w * wim) >> wp
	tre //= (-d[n])
	tim //= (-d[n])
	tre = from_man_exp(tre, -wp, wp)
	tim = from_man_exp(tim, -wp, wp)
	if alt:
	return mpc_pos((tre, tim), prec, rnd)
	else:
	q = mpc_sub(mpc_one, mpc_pow(mpc_two, r, wp), wp)
	return mpc_div((tre, tim), q, prec, rnd)

	def mpf_altzeta(s, prec, rnd=round_fast):
	return mpf_zeta(s, prec, rnd, 1)

	def mpc_altzeta(s, prec, rnd=round_fast):
	return mpc_zeta(s, prec, rnd, 1)

	# Not optimized currently
	mpf_zetasum = None


	def pow_fixed(x, n, wp):
	if n == 1:
	return x
	y = MPZ_ONE << wp
	while n:
	if n & 1:
	y = (y*x) >> wp
	n -= 1
	x = (x*x) >> wp
	n //= 2
	return y

	# TODO: optimize / cleanup interface / unify with list_primes
	sieve_cache = []
	primes_cache = []
	mult_cache = []

	def primesieve(n):
	global sieve_cache, primes_cache, mult_cache
	if n < len(sieve_cache):
	sieve = sieve_cache#[:n+1]
	primes = primes_cache[:primes_cache.index(max(sieve))+1]
	mult = mult_cache#[:n+1]
	return sieve, primes, mult
	sieve = [0] * (n+1)
	mult = [0] * (n+1)
	primes = list_primes(n)
	for p in primes:
	#sieve[p::p] = p
	for k in xrange(p,n+1,p):
	sieve[k] = p
	for i, p in enumerate(sieve):
	if i >= 2:
	m = 1
	n = i // p
	while not n % p:
	n //= p
	m += 1
	mult[i] = m
	sieve_cache = sieve
	primes_cache = primes
	mult_cache = mult
	return sieve, primes, mult

	def zetasum_sieved(critical_line, sre, sim, a, n, wp):
	if a < 1:
	raise ValueError("a cannot be less than 1")
	sieve, primes, mult = primesieve(a+n)
	basic_powers = {}
	one = MPZ_ONE << wp
	one_2wp = MPZ_ONE << (2*wp)
	wp2 = wp+wp
	ln2 = ln2_fixed(wp)
	pi2 = pi_fixed(wp-1)
	for p in primes:
	if p*2 > a+n:
	break
	log = log_int_fixed(p, wp, ln2)
	cos, sin = cos_sin_fixed((-sim*log)>>wp, wp, pi2)
	if critical_line:
	u = one_2wp // isqrt_fast(p<<wp2)
	else:
	u = exp_fixed((-sre*log)>>wp, wp)
	pre = (u*cos) >> wp
	pim = (u*sin) >> wp
	basic_powers[p] = [(pre, pim)]
	tre, tim = pre, pim
	for m in range(1,int(math.log(a+n,p)+0.01)+1):
	tre, tim = ((pretre-pimtim)>>wp), ((pimtre+pretim)>>wp)
	basic_powers[p].append((tre,tim))
	xre = MPZ_ZERO
	xim = MPZ_ZERO
	if a == 1:
	xre += one
	aa = max(a,2)
	for k in xrange(aa, a+n+1):
	p = sieve[k]
	if p in basic_powers:
	m = mult[k]
	tre, tim = basic_powers[p][m-1]
	while 1:
	k //= p**m
	if k == 1:
	break
	p = sieve[k]
	m = mult[k]
	pre, pim = basic_powers[p][m-1]
	tre, tim = ((pretre-pimtim)>>wp), ((pimtre+pretim)>>wp)
	else:
	log = log_int_fixed(k, wp, ln2)
	cos, sin = cos_sin_fixed((-sim*log)>>wp, wp, pi2)
	if critical_line:
	u = one_2wp // isqrt_fast(k<<wp2)
	else:
	u = exp_fixed((-sre*log)>>wp, wp)
	tre = (u*cos) >> wp
	tim = (u*sin) >> wp
	xre += tre
	xim += tim
	return xre, xim

	# Set to something large to disable
	ZETASUM_SIEVE_CUTOFF = 10

	def mpc_zetasum(s, a, n, derivatives, reflect, prec):
	"""
	Fast version of mp._zetasum, assuming s = complex, a = integer.
	"""

	wp = prec + 10
	derivatives = list(derivatives)
	have_derivatives = derivatives != [0]
	have_one_derivative = len(derivatives) == 1

	# parse s
	sre, sim = s
	critical_line = (sre == fhalf)
	sre = to_fixed(sre, wp)
	sim = to_fixed(sim, wp)

	if a > 0 and n > ZETASUM_SIEVE_CUTOFF and not have_derivatives \
	and not reflect and (n < 4e7 or sys.maxsize > 2**32):
	re, im = zetasum_sieved(critical_line, sre, sim, a, n, wp)
	xs = [(from_man_exp(re, -wp, prec, 'n'), from_man_exp(im, -wp, prec, 'n'))]
	return xs, []

	maxd = max(derivatives)
	if not have_one_derivative:
	derivatives = range(maxd+1)

	# x_d = 0, y_d = 0
	xre = [MPZ_ZERO for d in derivatives]
	xim = [MPZ_ZERO for d in derivatives]
	if reflect:
	yre = [MPZ_ZERO for d in derivatives]
	yim = [MPZ_ZERO for d in derivatives]
	else:
	yre = yim = []

	one = MPZ_ONE << wp
	one_2wp = MPZ_ONE << (2*wp)

	ln2 = ln2_fixed(wp)
	pi2 = pi_fixed(wp-1)
	wp2 = wp+wp

	for w in xrange(a, a+n+1):
	log = log_int_fixed(w, wp, ln2)
	cos, sin = cos_sin_fixed((-sim*log)>>wp, wp, pi2)
	if critical_line:
	u = one_2wp // isqrt_fast(w<<wp2)
	else:
	u = exp_fixed((-sre*log)>>wp, wp)
	xterm_re = (u * cos) >> wp
	xterm_im = (u * sin) >> wp
	if reflect:
	reciprocal = (one_2wp // (u*w))
	yterm_re = (reciprocal * cos) >> wp
	yterm_im = (reciprocal * sin) >> wp

	if have_derivatives:
	if have_one_derivative:
	log = pow_fixed(log, maxd, wp)
	xre[0] += (xterm_re * log) >> wp
	xim[0] += (xterm_im * log) >> wp
	if reflect:
	yre[0] += (yterm_re * log) >> wp
	yim[0] += (yterm_im * log) >> wp
	else:
	t = MPZ_ONE << wp
	for d in derivatives:
	xre[d] += (xterm_re * t) >> wp
	xim[d] += (xterm_im * t) >> wp
	if reflect:
	yre[d] += (yterm_re * t) >> wp
	yim[d] += (yterm_im * t) >> wp
	t = (t * log) >> wp
	else:
	xre[0] += xterm_re
	xim[0] += xterm_im
	if reflect:
	yre[0] += yterm_re
	yim[0] += yterm_im
	if have_derivatives:
	if have_one_derivative:
	if maxd % 2:
	xre[0] = -xre[0]
	xim[0] = -xim[0]
	if reflect:
	yre[0] = -yre[0]
	yim[0] = -yim[0]
	else:
	xre = [(-1)*d xre[d] for d in derivatives]
	xim = [(-1)*d xim[d] for d in derivatives]
	if reflect:
	yre = [(-1)*d yre[d] for d in derivatives]
	yim = [(-1)*d yim[d] for d in derivatives]
	xs = [(from_man_exp(xa, -wp, prec, 'n'), from_man_exp(xb, -wp, prec, 'n'))
	for (xa, xb) in zip(xre, xim)]
	ys = [(from_man_exp(ya, -wp, prec, 'n'), from_man_exp(yb, -wp, prec, 'n'))
	for (ya, yb) in zip(yre, yim)]
	return xs, ys


	#-----------------------------------------------------------------------#
	# #
	# The gamma function (NEW IMPLEMENTATION) #
	# #
	#-----------------------------------------------------------------------#

	# Higher means faster, but more precomputation time
	MAX_GAMMA_TAYLOR_PREC = 5000
	# Need to derive higher bounds for Taylor series to go higher
	assert MAX_GAMMA_TAYLOR_PREC < 15000

	# Use Stirling's series if abs(x) > beta*prec
	# Important: must be large enough for convergence!
	GAMMA_STIRLING_BETA = 0.2

	SMALL_FACTORIAL_CACHE_SIZE = 150

	gamma_taylor_cache = {}
	gamma_stirling_cache = {}

	small_factorial_cache = [from_int(ifac(n)) for \
	n in range(SMALL_FACTORIAL_CACHE_SIZE+1)]

	def zeta_array(N, prec):
	"""
	zeta(n) = A * pi**n / n! + B

	where A is a rational number (A = Bernoulli number
	for n even) and B is an infinite sum over powers of exp(2*pi).
	(B = 0 for n even).

	TODO: this is currently only used for gamma, but could
	be very useful elsewhere.
	"""
	extra = 30
	wp = prec+extra
	zeta_values = [MPZ_ZERO] * (N+2)
	pi = pi_fixed(wp)
	# STEP 1:
	one = MPZ_ONE << wp
	zeta_values[0] = -one//2
	f_2pi = mpf_shift(mpf_pi(wp),1)
	exp_2pi_k = exp_2pi = mpf_exp(f_2pi, wp)
	# Compute exponential series
	# Store values of 1/(exp(2pik)-1),
	# exp(2pik)/(exp(2pik)-1)*2, 1/(exp(2pik)-1)*2
	# pikexp(2pik)/(exp(2pik)-1)**2
	exps3 = []
	k = 1
	while 1:
	tp = wp - 9*k
	if tp < 1:
	break
	# 1/(exp(2pik-1)
	q1 = mpf_div(fone, mpf_sub(exp_2pi_k, fone, tp), tp)
	# pikexp(2pik)/(exp(2pik)-1)**2
	q2 = mpf_mul(exp_2pi_k, mpf_mul(q1,q1,tp), tp)
	q1 = to_fixed(q1, wp)
	q2 = to_fixed(q2, wp)
	q2 = (k * q2 * pi) >> wp
	exps3.append((q1, q2))
	# Multiply for next round
	exp_2pi_k = mpf_mul(exp_2pi_k, exp_2pi, wp)
	k += 1
	# Exponential sum
	for n in xrange(3, N+1, 2):
	s = MPZ_ZERO
	k = 1
	for e1, e2 in exps3:
	if n%4 == 3:
	t = e1 // k**n
	else:
	U = (n-1)//4
	t = (e1 + e2//U) // k**n
	if not t:
	break
	s += t
	k += 1
	zeta_values[n] = -2*s
	# Even zeta values
	B = [mpf_abs(mpf_bernoulli(k,wp)) for k in xrange(N+2)]
	pi_pow = fpi = mpf_pow_int(mpf_shift(mpf_pi(wp), 1), 2, wp)
	pi_pow = mpf_div(pi_pow, from_int(4), wp)
	for n in xrange(2,N+2,2):
	z = mpf_mul(B[n], pi_pow, wp)
	zeta_values[n] = to_fixed(z, wp)
	pi_pow = mpf_mul(pi_pow, fpi, wp)
	pi_pow = mpf_div(pi_pow, from_int((n+1)*(n+2)), wp)
	# Zeta sum
	reciprocal_pi = (one << wp) // pi
	for n in xrange(3, N+1, 4):
	U = (n-3)//4
	s = zeta_values[4U+4](4*U+7)//4
	for k in xrange(1, U+1):
	s -= (zeta_values[4k] zeta_values[4U+4-4k]) >> wp
	zeta_values[n] += (2sreciprocal_pi) >> wp
	for n in xrange(5, N+1, 4):
	U = (n-1)//4
	s = zeta_values[4U+2](2*U+1)
	for k in xrange(1, 2*U+1):
	s += ((-1)*k2k zeta_values[2k] zeta_values[4U+2-2k])>>wp
	zeta_values[n] += ((sreciprocal_pi)>>wp)//(2U)
	return [x>>extra for x in zeta_values]

	def gamma_taylor_coefficients(inprec):
	"""
	Gives the Taylor coefficients of 1/gamma(1+x) as
	a list of fixed-point numbers. Enough coefficients are returned
	to ensure that the series converges to the given precision
	when x is in [0.5, 1.5].
	"""
	# Reuse nearby cache values (small case)
	if inprec < 400:
	prec = inprec + (10-(inprec%10))
	elif inprec < 1000:
	prec = inprec + (30-(inprec%30))
	else:
	prec = inprec
	if prec in gamma_taylor_cache:
	return gamma_taylor_cache[prec], prec

	# Experimentally determined bounds
	if prec < 1000:
	N = int(prec**0.76 + 2)
	else:
	# Valid to at least 15000 bits
	N = int(prec**0.787 + 2)

	# Reuse higher precision values
	for cprec in gamma_taylor_cache:
	if cprec > prec:
	coeffs = [x>>(cprec-prec) for x in gamma_taylor_cache[cprec][-N:]]
	if inprec < 1000:
	gamma_taylor_cache[prec] = coeffs
	return coeffs, prec

	# Cache at a higher precision (large case)
	if prec > 1000:
	prec = int(prec * 1.2)

	wp = prec + 20
	A = [0] * N
	A[0] = MPZ_ZERO
	A[1] = MPZ_ONE << wp
	A[2] = euler_fixed(wp)
	# SLOW, reference implementation
	#zeta_values = [0,0]+[to_fixed(mpf_zeta_int(k,wp),wp) for k in xrange(2,N)]
	zeta_values = zeta_array(N, wp)
	for k in xrange(3, N):
	a = (-A[2]*A[k-1])>>wp
	for j in xrange(2,k):
	a += ((-1)*j zeta_values[j] * A[k-j]) >> wp
	a //= (1-k)
	A[k] = a
	A = [a>>20 for a in A]
	A = A[::-1]
	A = A[:-1]
	gamma_taylor_cache[prec] = A
	#return A, prec
	return gamma_taylor_coefficients(inprec)

	def gamma_fixed_taylor(xmpf, x, wp, prec, rnd, type):
	# Determine nearest multiple of N/2
	#n = int(x >> (wp-1))
	#steps = (n-1)>>1
	nearest_int = ((x >> (wp-1)) + MPZ_ONE) >> 1
	one = MPZ_ONE << wp
	coeffs, cwp = gamma_taylor_coefficients(wp)
	if nearest_int > 0:
	r = one
	for i in xrange(nearest_int-1):
	x -= one
	r = (r*x) >> wp
	x -= one
	p = MPZ_ZERO
	for c in coeffs:
	p = c + ((x*p)>>wp)
	p >>= (cwp-wp)
	if type == 0:
	return from_man_exp((r<<wp)//p, -wp, prec, rnd)
	if type == 2:
	return mpf_shift(from_rational(p, (r<<wp), prec, rnd), wp)
	if type == 3:
	return mpf_log(mpf_abs(from_man_exp((r<<wp)//p, -wp)), prec, rnd)
	else:
	r = one
	for i in xrange(-nearest_int):
	r = (r*x) >> wp
	x += one
	p = MPZ_ZERO
	for c in coeffs:
	p = c + ((x*p)>>wp)
	p >>= (cwp-wp)
	if wp - bitcount(abs(x)) > 10:
	# pass very close to 0, so do floating-point multiply
	g = mpf_add(xmpf, from_int(-nearest_int)) # exact
	r = from_man_exp(p*r,-wp-wp)
	r = mpf_mul(r, g, wp)
	if type == 0:
	return mpf_div(fone, r, prec, rnd)
	if type == 2:
	return mpf_pos(r, prec, rnd)
	if type == 3:
	return mpf_log(mpf_abs(mpf_div(fone, r, wp)), prec, rnd)
	else:
	r = from_man_exp(xpr,-3*wp)
	if type == 0: return mpf_div(fone, r, prec, rnd)
	if type == 2: return mpf_pos(r, prec, rnd)
	if type == 3: return mpf_neg(mpf_log(mpf_abs(r), prec, rnd))

	def stirling_coefficient(n):
	if n in gamma_stirling_cache:
	return gamma_stirling_cache[n]
	p, q = bernfrac(n)
	q = MPZ(n(n-1))
	gamma_stirling_cache[n] = p, q, bitcount(abs(p)), bitcount(q)
	return gamma_stirling_cache[n]

	def real_stirling_series(x, prec):
	"""
	Sums the rational part of Stirling's expansion,

	log(sqrt(2pi)) - z + 1/(12z) - 1/(360*z^3) + ...

	"""
	t = (MPZ_ONE<<(prec+prec)) // x # t = 1/x
	u = (tt)>>prec # u = 1/x*2
	s = ln_sqrt2pi_fixed(prec) - x
	# Add initial terms of Stirling's series
	s += t//12; t = (t*u)>>prec
	s -= t//360; t = (t*u)>>prec
	s += t//1260; t = (t*u)>>prec
	s -= t//1680; t = (t*u)>>prec
	if not t: return s
	s += t//1188; t = (t*u)>>prec
	s -= 691t//360360; t = (tu)>>prec
	s += t//156; t = (t*u)>>prec
	if not t: return s
	s -= 3617t//122400; t = (tu)>>prec
	s += 43867t//244188; t = (tu)>>prec
	s -= 174611t//125400; t = (tu)>>prec
	if not t: return s
	k = 22
	# From here on, the coefficients are growing, so we
	# have to keep t at a roughly constant size
	usize = bitcount(abs(u))
	tsize = bitcount(abs(t))
	texp = 0
	while 1:
	p, q, pb, qb = stirling_coefficient(k)
	term_mag = tsize + pb + texp
	shift = -texp
	m = pb - term_mag
	if m > 0 and shift < m:
	p >>= m
	shift -= m
	m = tsize - term_mag
	if m > 0 and shift < m:
	w = t >> m
	shift -= m
	else:
	w = t
	term = (t*p//q) >> shift
	if not term:
	break
	s += term
	t = (t*u) >> usize
	texp -= (prec - usize)
	k += 2
	return s

	def complex_stirling_series(x, y, prec):
	# t = 1/z
	_m = (xx + yy) >> prec
	tre = (x << prec) // _m
	tim = (-y << prec) // _m
	# u = 1/z**2
	ure = (tretre - timtim) >> prec
	uim = tim*tre >> (prec-1)
	# s = log(sqrt(2*pi)) - z
	sre = ln_sqrt2pi_fixed(prec) - x
	sim = -y

	# Add initial terms of Stirling's series
	sre += tre//12; sim += tim//12;
	tre, tim = ((treure-timuim)>>prec), ((treuim+timure)>>prec)
	sre -= tre//360; sim -= tim//360;
	tre, tim = ((treure-timuim)>>prec), ((treuim+timure)>>prec)
	sre += tre//1260; sim += tim//1260;
	tre, tim = ((treure-timuim)>>prec), ((treuim+timure)>>prec)
	sre -= tre//1680; sim -= tim//1680;
	tre, tim = ((treure-timuim)>>prec), ((treuim+timure)>>prec)
	if abs(tre) + abs(tim) < 5: return sre, sim
	sre += tre//1188; sim += tim//1188;
	tre, tim = ((treure-timuim)>>prec), ((treuim+timure)>>prec)
	sre -= 691tre//360360; sim -= 691tim//360360;
	tre, tim = ((treure-timuim)>>prec), ((treuim+timure)>>prec)
	sre += tre//156; sim += tim//156;
	tre, tim = ((treure-timuim)>>prec), ((treuim+timure)>>prec)
	if abs(tre) + abs(tim) < 5: return sre, sim
	sre -= 3617tre//122400; sim -= 3617tim//122400;
	tre, tim = ((treure-timuim)>>prec), ((treuim+timure)>>prec)
	sre += 43867tre//244188; sim += 43867tim//244188;
	tre, tim = ((treure-timuim)>>prec), ((treuim+timure)>>prec)
	sre -= 174611tre//125400; sim -= 174611tim//125400;
	tre, tim = ((treure-timuim)>>prec), ((treuim+timure)>>prec)
	if abs(tre) + abs(tim) < 5: return sre, sim

	k = 22
	# From here on, the coefficients are growing, so we
	# have to keep t at a roughly constant size
	usize = bitcount(max(abs(ure), abs(uim)))
	tsize = bitcount(max(abs(tre), abs(tim)))
	texp = 0
	while 1:
	p, q, pb, qb = stirling_coefficient(k)
	term_mag = tsize + pb + texp
	shift = -texp
	m = pb - term_mag
	if m > 0 and shift < m:
	p >>= m
	shift -= m
	m = tsize - term_mag
	if m > 0 and shift < m:
	wre = tre >> m
	wim = tim >> m
	shift -= m
	else:
	wre = tre
	wim = tim
	termre = (tre*p//q) >> shift
	termim = (tim*p//q) >> shift
	if abs(termre) + abs(termim) < 5:
	break
	sre += termre
	sim += termim
	tre, tim = ((treure - timuim)>>usize), \
	((treuim + timure)>>usize)
	texp -= (prec - usize)
	k += 2
	return sre, sim


	def mpf_gamma(x, prec, rnd='d', type=0):
	"""
	This function implements multipurpose evaluation of the gamma
	function, G(x), as well as the following versions of the same:

	type = 0 -- G(x) [standard gamma function]
	type = 1 -- G(x+1) = x*G(x+1) = x! [factorial]
	type = 2 -- 1/G(x) [reciprocal gamma function]
	type = 3 -- log(\|G(x)\|) [log-gamma function, real part]
	"""

	# Specal values
	sign, man, exp, bc = x
	if not man:
	if x == fzero:
	if type == 1: return fone
	if type == 2: return fzero
	raise ValueError("gamma function pole")
	if x == finf:
	if type == 2: return fzero
	return finf
	return fnan

	# First of all, for log gamma, numbers can be well beyond the fixed-point
	# range, so we must take care of huge numbers before e.g. trying
	# to convert x to the nearest integer
	if type == 3:
	wp = prec+20
	if exp+bc > wp and not sign:
	return mpf_sub(mpf_mul(x, mpf_log(x, wp), wp), x, prec, rnd)

	# We strongly want to special-case small integers
	is_integer = exp >= 0
	if is_integer:
	# Poles
	if sign:
	if type == 2:
	return fzero
	raise ValueError("gamma function pole")
	# n = x
	n = man << exp
	if n < SMALL_FACTORIAL_CACHE_SIZE:
	if type == 0:
	return mpf_pos(small_factorial_cache[n-1], prec, rnd)
	if type == 1:
	return mpf_pos(small_factorial_cache[n], prec, rnd)
	if type == 2:
	return mpf_div(fone, small_factorial_cache[n-1], prec, rnd)
	if type == 3:
	return mpf_log(small_factorial_cache[n-1], prec, rnd)
	else:
	# floor(abs(x))
	n = int(man >> (-exp))

	# Estimate size and precision
	# Estimate log(gamma(\|x\|),2) as x*log(x,2)
	mag = exp + bc
	gamma_size = n*mag

	if type == 3:
	wp = prec + 20
	else:
	wp = prec + bitcount(gamma_size) + 20

	# Very close to 0, pole
	if mag < -wp:
	if type == 0:
	return mpf_sub(mpf_div(fone,x, wp),mpf_shift(fone,-wp),prec,rnd)
	if type == 1: return mpf_sub(fone, x, prec, rnd)
	if type == 2: return mpf_add(x, mpf_shift(fone,mag-wp), prec, rnd)
	if type == 3: return mpf_neg(mpf_log(mpf_abs(x), prec, rnd))

	# From now on, we assume having a gamma function
	if type == 1:
	return mpf_gamma(mpf_add(x, fone), prec, rnd, 0)

	# Special case integers (those not small enough to be caught above,
	# but still small enough for an exact factorial to be faster
	# than an approximate algorithm), and half-integers
	if exp >= -1:
	if is_integer:
	if gamma_size < 10*wp:
	if type == 0:
	return from_int(ifac(n-1), prec, rnd)
	if type == 2:
	return from_rational(MPZ_ONE, ifac(n-1), prec, rnd)
	if type == 3:
	return mpf_log(from_int(ifac(n-1)), prec, rnd)
	# half-integer
	if n < 100 or gamma_size < 10*wp:
	if sign:
	w = sqrtpi_fixed(wp)
	if n % 2: f = ifac2(2*n+1)
	else: f = -ifac2(2*n+1)
	if type == 0:
	return mpf_shift(from_rational(w, f, prec, rnd), -wp+n+1)
	if type == 2:
	return mpf_shift(from_rational(f, w, prec, rnd), wp-n-1)
	if type == 3:
	return mpf_log(mpf_shift(from_rational(w, abs(f),
	prec, rnd), -wp+n+1), prec, rnd)
	elif n == 0:
	if type == 0: return mpf_sqrtpi(prec, rnd)
	if type == 2: return mpf_div(fone, mpf_sqrtpi(wp), prec, rnd)
	if type == 3: return mpf_log(mpf_sqrtpi(wp), prec, rnd)
	else:
	w = sqrtpi_fixed(wp)
	w = from_man_exp(w * ifac2(2*n-1), -wp-n)
	if type == 0: return mpf_pos(w, prec, rnd)
	if type == 2: return mpf_div(fone, w, prec, rnd)
	if type == 3: return mpf_log(mpf_abs(w), prec, rnd)

	# Convert to fixed point
	offset = exp + wp
	if offset >= 0: absxman = man << offset
	else: absxman = man >> (-offset)

	# For log gamma, provide accurate evaluation for x = 1+eps and 2+eps
	if type == 3 and not sign:
	one = MPZ_ONE << wp
	one_dist = abs(absxman-one)
	two_dist = abs(absxman-2*one)
	cancellation = (wp - bitcount(min(one_dist, two_dist)))
	if cancellation > 10:
	xsub1 = mpf_sub(fone, x)
	xsub2 = mpf_sub(ftwo, x)
	xsub1mag = xsub1[2]+xsub1[3]
	xsub2mag = xsub2[2]+xsub2[3]
	if xsub1mag < -wp:
	return mpf_mul(mpf_euler(wp), mpf_sub(fone, x), prec, rnd)
	if xsub2mag < -wp:
	return mpf_mul(mpf_sub(fone, mpf_euler(wp)),
	mpf_sub(x, ftwo), prec, rnd)
	# Proceed but increase precision
	wp += max(-xsub1mag, -xsub2mag)
	offset = exp + wp
	if offset >= 0: absxman = man << offset
	else: absxman = man >> (-offset)

	# Use Taylor series if appropriate
	n_for_stirling = int(GAMMA_STIRLING_BETA*wp)
	if n < max(100, n_for_stirling) and wp < MAX_GAMMA_TAYLOR_PREC:
	if sign:
	absxman = -absxman
	return gamma_fixed_taylor(x, absxman, wp, prec, rnd, type)

	# Use Stirling's series
	# First ensure that \|x\| is large enough for rapid convergence
	xorig = x

	# Argument reduction
	r = 0
	if n < n_for_stirling:
	r = one = MPZ_ONE << wp
	d = n_for_stirling - n
	for k in xrange(d):
	r = (r * absxman) >> wp
	absxman += one
	x = xabs = from_man_exp(absxman, -wp)
	if sign:
	x = mpf_neg(x)
	else:
	xabs = mpf_abs(x)

	# Asymptotic series
	y = real_stirling_series(absxman, wp)
	u = to_fixed(mpf_log(xabs, wp), wp)
	u = ((absxman - (MPZ_ONE<<(wp-1))) * u) >> wp
	y += u
	w = from_man_exp(y, -wp)

	# Compute final value
	if sign:
	# Reflection formula
	A = mpf_mul(mpf_sin_pi(xorig, wp), xorig, wp)
	B = mpf_neg(mpf_pi(wp))
	if type == 0 or type == 2:
	A = mpf_mul(A, mpf_exp(w, wp))
	if r:
	B = mpf_mul(B, from_man_exp(r, -wp), wp)
	if type == 0:
	return mpf_div(B, A, prec, rnd)
	if type == 2:
	return mpf_div(A, B, prec, rnd)
	if type == 3:
	if r:
	B = mpf_mul(B, from_man_exp(r, -wp), wp)
	A = mpf_add(mpf_log(mpf_abs(A), wp), w, wp)
	return mpf_sub(mpf_log(mpf_abs(B), wp), A, prec, rnd)
	else:
	if type == 0:
	if r:
	return mpf_div(mpf_exp(w, wp),
	from_man_exp(r, -wp), prec, rnd)
	return mpf_exp(w, prec, rnd)
	if type == 2:
	if r:
	return mpf_div(from_man_exp(r, -wp),
	mpf_exp(w, wp), prec, rnd)
	return mpf_exp(mpf_neg(w), prec, rnd)
	if type == 3:
	if r:
	return mpf_sub(w, mpf_log(from_man_exp(r,-wp), wp), prec, rnd)
	return mpf_pos(w, prec, rnd)


	def mpc_gamma(z, prec, rnd='d', type=0):
	a, b = z
	asign, aman, aexp, abc = a
	bsign, bman, bexp, bbc = b

	if b == fzero:
	# Imaginary part on negative half-axis for log-gamma function
	if type == 3 and asign:
	re = mpf_gamma(a, prec, rnd, 3)
	n = (-aman) >> (-aexp)
	im = mpf_mul_int(mpf_pi(prec+10), n, prec, rnd)
	return re, im
	return mpf_gamma(a, prec, rnd, type), fzero

	# Some kind of complex inf/nan
	if (not aman and aexp) or (not bman and bexp):
	return (fnan, fnan)

	# Initial working precision
	wp = prec + 20

	amag = aexp+abc
	bmag = bexp+bbc
	if aman:
	mag = max(amag, bmag)
	else:
	mag = bmag

	# Close to 0
	if mag < -8:
	if mag < -wp:
	# 1/gamma(z) = z + euler*z^2 + O(z^3)
	v = mpc_add(z, mpc_mul_mpf(mpc_mul(z,z,wp),mpf_euler(wp),wp), wp)
	if type == 0: return mpc_reciprocal(v, prec, rnd)
	if type == 1: return mpc_div(z, v, prec, rnd)
	if type == 2: return mpc_pos(v, prec, rnd)
	if type == 3: return mpc_log(mpc_reciprocal(v, prec), prec, rnd)
	elif type != 1:
	wp += (-mag)

	# Handle huge log-gamma values; must do this before converting to
	# a fixed-point value. TODO: determine a precise cutoff of validity
	# depending on amag and bmag
	if type == 3 and mag > wp and ((not asign) or (bmag >= amag)):
	return mpc_sub(mpc_mul(z, mpc_log(z, wp), wp), z, prec, rnd)

	# From now on, we assume having a gamma function
	if type == 1:
	return mpc_gamma((mpf_add(a, fone), b), prec, rnd, 0)

	an = abs(to_int(a))
	bn = abs(to_int(b))
	absn = max(an, bn)
	gamma_size = absn*mag
	if type == 3:
	pass
	else:
	wp += bitcount(gamma_size)

	# Reflect to the right half-plane. Note that Stirling's expansion
	# is valid in the left half-plane too, as long as we're not too close
	# to the real axis, but in order to use this argument reduction
	# in the negative direction must be implemented.
	#need_reflection = asign and ((bmag < 0) or (amag-bmag > 4))
	need_reflection = asign
	zorig = z
	if need_reflection:
	z = mpc_neg(z)
	asign, aman, aexp, abc = a = z[0]
	bsign, bman, bexp, bbc = b = z[1]

	# Imaginary part very small compared to real one?
	yfinal = 0
	balance_prec = 0
	if bmag < -10:
	# Check z ~= 1 and z ~= 2 for loggamma
	if type == 3:
	zsub1 = mpc_sub_mpf(z, fone)
	if zsub1[0] == fzero:
	cancel1 = -bmag
	else:
	cancel1 = -max(zsub1[0][2]+zsub1[0][3], bmag)
	if cancel1 > wp:
	pi = mpf_pi(wp)
	x = mpc_mul_mpf(zsub1, pi, wp)
	x = mpc_mul(x, x, wp)
	x = mpc_div_mpf(x, from_int(12), wp)
	y = mpc_mul_mpf(zsub1, mpf_neg(mpf_euler(wp)), wp)
	yfinal = mpc_add(x, y, wp)
	if not need_reflection:
	return mpc_pos(yfinal, prec, rnd)
	elif cancel1 > 0:
	wp += cancel1
	zsub2 = mpc_sub_mpf(z, ftwo)
	if zsub2[0] == fzero:
	cancel2 = -bmag
	else:
	cancel2 = -max(zsub2[0][2]+zsub2[0][3], bmag)
	if cancel2 > wp:
	pi = mpf_pi(wp)
	t = mpf_sub(mpf_mul(pi, pi), from_int(6))
	x = mpc_mul_mpf(mpc_mul(zsub2, zsub2, wp), t, wp)
	x = mpc_div_mpf(x, from_int(12), wp)
	y = mpc_mul_mpf(zsub2, mpf_sub(fone, mpf_euler(wp)), wp)
	yfinal = mpc_add(x, y, wp)
	if not need_reflection:
	return mpc_pos(yfinal, prec, rnd)
	elif cancel2 > 0:
	wp += cancel2
	if bmag < -wp:
	# Compute directly from the real gamma function.
	pp = 2*(wp+10)
	aabs = mpf_abs(a)
	eps = mpf_shift(fone, amag-wp)
	x1 = mpf_gamma(aabs, pp, type=type)
	x2 = mpf_gamma(mpf_add(aabs, eps), pp, type=type)
	xprime = mpf_div(mpf_sub(x2, x1, pp), eps, pp)
	y = mpf_mul(b, xprime, prec, rnd)
	yfinal = (x1, y)
	# Note: we still need to use the reflection formula for
	# near-poles, and the correct branch of the log-gamma function
	if not need_reflection:
	return mpc_pos(yfinal, prec, rnd)
	else:
	balance_prec += (-bmag)

	wp += balance_prec
	n_for_stirling = int(GAMMA_STIRLING_BETA*wp)
	need_reduction = absn < n_for_stirling

	afix = to_fixed(a, wp)
	bfix = to_fixed(b, wp)

	r = 0
	if not yfinal:
	zprered = z
	# Argument reduction
	if absn < n_for_stirling:
	absn = complex(an, bn)
	d = int((1 + n_for_stirling2 - bn2)**0.5 - an)
	rre = one = MPZ_ONE << wp
	rim = MPZ_ZERO
	for k in xrange(d):
	rre, rim = ((afixrre-bfixrim)>>wp), ((afixrim + bfixrre)>>wp)
	afix += one
	r = from_man_exp(rre, -wp), from_man_exp(rim, -wp)
	a = from_man_exp(afix, -wp)
	z = a, b

	yre, yim = complex_stirling_series(afix, bfix, wp)
	# (z-1/2)*log(z) + S
	lre, lim = mpc_log(z, wp)
	lre = to_fixed(lre, wp)
	lim = to_fixed(lim, wp)
	yre = ((lreafix - limbfix)>>wp) - (lre>>1) + yre
	yim = ((lrebfix + limafix)>>wp) - (lim>>1) + yim
	y = from_man_exp(yre, -wp), from_man_exp(yim, -wp)

	if r and type == 3:
	# If re(z) > 0 and abs(z) <= 4, the branches of loggamma(z)
	# and log(gamma(z)) coincide. Otherwise, use the zeroth order
	# Stirling expansion to compute the correct imaginary part.
	y = mpc_sub(y, mpc_log(r, wp), wp)
	zfa = to_float(zprered[0])
	zfb = to_float(zprered[1])
	zfabs = math.hypot(zfa,zfb)
	#if not (zfa > 0.0 and zfabs <= 4):
	yfb = to_float(y[1])
	u = math.atan2(zfb, zfa)
	if zfabs <= 0.5:
	gi = 0.577216*zfb - u
	else:
	gi = -zfb - 0.5u + zfau + zfb*math.log(zfabs)
	n = int(math.floor((gi-yfb)/(2*math.pi)+0.5))
	y = (y[0], mpf_add(y[1], mpf_mul_int(mpf_pi(wp), 2*n, wp), wp))

	if need_reflection:
	if type == 0 or type == 2:
	A = mpc_mul(mpc_sin_pi(zorig, wp), zorig, wp)
	B = (mpf_neg(mpf_pi(wp)), fzero)
	if yfinal:
	if type == 2:
	A = mpc_div(A, yfinal, wp)
	else:
	A = mpc_mul(A, yfinal, wp)
	else:
	A = mpc_mul(A, mpc_exp(y, wp), wp)
	if r:
	B = mpc_mul(B, r, wp)
	if type == 0: return mpc_div(B, A, prec, rnd)
	if type == 2: return mpc_div(A, B, prec, rnd)

	# Reflection formula for the log-gamma function with correct branch
	# http://functions.wolfram.com/GammaBetaErf/LogGamma/16/01/01/0006/
	# LogGamma[z] == -LogGamma[-z] - Log[-z] +
	# Sign[Im[z]] Floor[Re[z]] Pi I + Log[Pi] -
	# Log[Sin[Pi (z - Floor[Re[z]])]] -
	# Pi I (1 - Abs[Sign[Im[z]]]) Abs[Floor[Re[z]]]
	if type == 3:
	if yfinal:
	s1 = mpc_neg(yfinal)
	else:
	s1 = mpc_neg(y)
	# s -= log(-z)
	s1 = mpc_sub(s1, mpc_log(mpc_neg(zorig), wp), wp)
	# floor(re(z))
	rezfloor = mpf_floor(zorig[0])
	imzsign = mpf_sign(zorig[1])
	pi = mpf_pi(wp)
	t = mpf_mul(pi, rezfloor)
	t = mpf_mul_int(t, imzsign, wp)
	s1 = (s1[0], mpf_add(s1[1], t, wp))
	s1 = mpc_add_mpf(s1, mpf_log(pi, wp), wp)
	t = mpc_sin_pi(mpc_sub_mpf(zorig, rezfloor), wp)
	t = mpc_log(t, wp)
	s1 = mpc_sub(s1, t, wp)
	# Note: may actually be unused, because we fall back
	# to the mpf_ function for real arguments
	if not imzsign:
	t = mpf_mul(pi, mpf_floor(rezfloor), wp)
	s1 = (s1[0], mpf_sub(s1[1], t, wp))
	return mpc_pos(s1, prec, rnd)
	else:
	if type == 0:
	if r:
	return mpc_div(mpc_exp(y, wp), r, prec, rnd)
	return mpc_exp(y, prec, rnd)
	if type == 2:
	if r:
	return mpc_div(r, mpc_exp(y, wp), prec, rnd)
	return mpc_exp(mpc_neg(y), prec, rnd)
	if type == 3:
	return mpc_pos(y, prec, rnd)

	def mpf_factorial(x, prec, rnd='d'):
	return mpf_gamma(x, prec, rnd, 1)

	def mpc_factorial(x, prec, rnd='d'):
	return mpc_gamma(x, prec, rnd, 1)

	def mpf_rgamma(x, prec, rnd='d'):
	return mpf_gamma(x, prec, rnd, 2)

	def mpc_rgamma(x, prec, rnd='d'):
	return mpc_gamma(x, prec, rnd, 2)

	def mpf_loggamma(x, prec, rnd='d'):
	sign, man, exp, bc = x
	if sign:
	raise ComplexResult
	return mpf_gamma(x, prec, rnd, 3)

	def mpc_loggamma(z, prec, rnd='d'):
	a, b = z
	asign, aman, aexp, abc = a
	bsign, bman, bexp, bbc = b
	if b == fzero and asign:
	re = mpf_gamma(a, prec, rnd, 3)
	n = (-aman) >> (-aexp)
	im = mpf_mul_int(mpf_pi(prec+10), n, prec, rnd)
	return re, im
	return mpc_gamma(z, prec, rnd, 3)

	def mpf_gamma_int(n, prec, rnd=round_fast):
	if n < SMALL_FACTORIAL_CACHE_SIZE:
	return mpf_pos(small_factorial_cache[n-1], prec, rnd)
	return mpf_gamma(from_int(n), prec, rnd)