You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
845 lines
29 KiB
845 lines
29 KiB
5 months ago
|
"""
|
||
|
Implements the PSLQ algorithm for integer relation detection,
|
||
|
and derivative algorithms for constant recognition.
|
||
|
"""
|
||
|
|
||
|
from .libmp.backend import xrange
|
||
|
from .libmp import int_types, sqrt_fixed
|
||
|
|
||
|
# round to nearest integer (can be done more elegantly...)
|
||
|
def round_fixed(x, prec):
|
||
|
return ((x + (1<<(prec-1))) >> prec) << prec
|
||
|
|
||
|
class IdentificationMethods(object):
|
||
|
pass
|
||
|
|
||
|
|
||
|
def pslq(ctx, x, tol=None, maxcoeff=1000, maxsteps=100, verbose=False):
|
||
|
r"""
|
||
|
Given a vector of real numbers `x = [x_0, x_1, ..., x_n]`, ``pslq(x)``
|
||
|
uses the PSLQ algorithm to find a list of integers
|
||
|
`[c_0, c_1, ..., c_n]` such that
|
||
|
|
||
|
.. math ::
|
||
|
|
||
|
|c_1 x_1 + c_2 x_2 + ... + c_n x_n| < \mathrm{tol}
|
||
|
|
||
|
and such that `\max |c_k| < \mathrm{maxcoeff}`. If no such vector
|
||
|
exists, :func:`~mpmath.pslq` returns ``None``. The tolerance defaults to
|
||
|
3/4 of the working precision.
|
||
|
|
||
|
**Examples**
|
||
|
|
||
|
Find rational approximations for `\pi`::
|
||
|
|
||
|
>>> from mpmath import *
|
||
|
>>> mp.dps = 15; mp.pretty = True
|
||
|
>>> pslq([-1, pi], tol=0.01)
|
||
|
[22, 7]
|
||
|
>>> pslq([-1, pi], tol=0.001)
|
||
|
[355, 113]
|
||
|
>>> mpf(22)/7; mpf(355)/113; +pi
|
||
|
3.14285714285714
|
||
|
3.14159292035398
|
||
|
3.14159265358979
|
||
|
|
||
|
Pi is not a rational number with denominator less than 1000::
|
||
|
|
||
|
>>> pslq([-1, pi])
|
||
|
>>>
|
||
|
|
||
|
To within the standard precision, it can however be approximated
|
||
|
by at least one rational number with denominator less than `10^{12}`::
|
||
|
|
||
|
>>> p, q = pslq([-1, pi], maxcoeff=10**12)
|
||
|
>>> print(p); print(q)
|
||
|
238410049439
|
||
|
75888275702
|
||
|
>>> mpf(p)/q
|
||
|
3.14159265358979
|
||
|
|
||
|
The PSLQ algorithm can be applied to long vectors. For example,
|
||
|
we can investigate the rational (in)dependence of integer square
|
||
|
roots::
|
||
|
|
||
|
>>> mp.dps = 30
|
||
|
>>> pslq([sqrt(n) for n in range(2, 5+1)])
|
||
|
>>>
|
||
|
>>> pslq([sqrt(n) for n in range(2, 6+1)])
|
||
|
>>>
|
||
|
>>> pslq([sqrt(n) for n in range(2, 8+1)])
|
||
|
[2, 0, 0, 0, 0, 0, -1]
|
||
|
|
||
|
**Machin formulas**
|
||
|
|
||
|
A famous formula for `\pi` is Machin's,
|
||
|
|
||
|
.. math ::
|
||
|
|
||
|
\frac{\pi}{4} = 4 \operatorname{acot} 5 - \operatorname{acot} 239
|
||
|
|
||
|
There are actually infinitely many formulas of this type. Two
|
||
|
others are
|
||
|
|
||
|
.. math ::
|
||
|
|
||
|
\frac{\pi}{4} = \operatorname{acot} 1
|
||
|
|
||
|
\frac{\pi}{4} = 12 \operatorname{acot} 49 + 32 \operatorname{acot} 57
|
||
|
+ 5 \operatorname{acot} 239 + 12 \operatorname{acot} 110443
|
||
|
|
||
|
We can easily verify the formulas using the PSLQ algorithm::
|
||
|
|
||
|
>>> mp.dps = 30
|
||
|
>>> pslq([pi/4, acot(1)])
|
||
|
[1, -1]
|
||
|
>>> pslq([pi/4, acot(5), acot(239)])
|
||
|
[1, -4, 1]
|
||
|
>>> pslq([pi/4, acot(49), acot(57), acot(239), acot(110443)])
|
||
|
[1, -12, -32, 5, -12]
|
||
|
|
||
|
We could try to generate a custom Machin-like formula by running
|
||
|
the PSLQ algorithm with a few inverse cotangent values, for example
|
||
|
acot(2), acot(3) ... acot(10). Unfortunately, there is a linear
|
||
|
dependence among these values, resulting in only that dependence
|
||
|
being detected, with a zero coefficient for `\pi`::
|
||
|
|
||
|
>>> pslq([pi] + [acot(n) for n in range(2,11)])
|
||
|
[0, 1, -1, 0, 0, 0, -1, 0, 0, 0]
|
||
|
|
||
|
We get better luck by removing linearly dependent terms::
|
||
|
|
||
|
>>> pslq([pi] + [acot(n) for n in range(2,11) if n not in (3, 5)])
|
||
|
[1, -8, 0, 0, 4, 0, 0, 0]
|
||
|
|
||
|
In other words, we found the following formula::
|
||
|
|
||
|
>>> 8*acot(2) - 4*acot(7)
|
||
|
3.14159265358979323846264338328
|
||
|
>>> +pi
|
||
|
3.14159265358979323846264338328
|
||
|
|
||
|
**Algorithm**
|
||
|
|
||
|
This is a fairly direct translation to Python of the pseudocode given by
|
||
|
David Bailey, "The PSLQ Integer Relation Algorithm":
|
||
|
http://www.cecm.sfu.ca/organics/papers/bailey/paper/html/node3.html
|
||
|
|
||
|
The present implementation uses fixed-point instead of floating-point
|
||
|
arithmetic, since this is significantly (about 7x) faster.
|
||
|
"""
|
||
|
|
||
|
n = len(x)
|
||
|
if n < 2:
|
||
|
raise ValueError("n cannot be less than 2")
|
||
|
|
||
|
# At too low precision, the algorithm becomes meaningless
|
||
|
prec = ctx.prec
|
||
|
if prec < 53:
|
||
|
raise ValueError("prec cannot be less than 53")
|
||
|
|
||
|
if verbose and prec // max(2,n) < 5:
|
||
|
print("Warning: precision for PSLQ may be too low")
|
||
|
|
||
|
target = int(prec * 0.75)
|
||
|
|
||
|
if tol is None:
|
||
|
tol = ctx.mpf(2)**(-target)
|
||
|
else:
|
||
|
tol = ctx.convert(tol)
|
||
|
|
||
|
extra = 60
|
||
|
prec += extra
|
||
|
|
||
|
if verbose:
|
||
|
print("PSLQ using prec %i and tol %s" % (prec, ctx.nstr(tol)))
|
||
|
|
||
|
tol = ctx.to_fixed(tol, prec)
|
||
|
assert tol
|
||
|
|
||
|
# Convert to fixed-point numbers. The dummy None is added so we can
|
||
|
# use 1-based indexing. (This just allows us to be consistent with
|
||
|
# Bailey's indexing. The algorithm is 100 lines long, so debugging
|
||
|
# a single wrong index can be painful.)
|
||
|
x = [None] + [ctx.to_fixed(ctx.mpf(xk), prec) for xk in x]
|
||
|
|
||
|
# Sanity check on magnitudes
|
||
|
minx = min(abs(xx) for xx in x[1:])
|
||
|
if not minx:
|
||
|
raise ValueError("PSLQ requires a vector of nonzero numbers")
|
||
|
if minx < tol//100:
|
||
|
if verbose:
|
||
|
print("STOPPING: (one number is too small)")
|
||
|
return None
|
||
|
|
||
|
g = sqrt_fixed((4<<prec)//3, prec)
|
||
|
A = {}
|
||
|
B = {}
|
||
|
H = {}
|
||
|
# Initialization
|
||
|
# step 1
|
||
|
for i in xrange(1, n+1):
|
||
|
for j in xrange(1, n+1):
|
||
|
A[i,j] = B[i,j] = (i==j) << prec
|
||
|
H[i,j] = 0
|
||
|
# step 2
|
||
|
s = [None] + [0] * n
|
||
|
for k in xrange(1, n+1):
|
||
|
t = 0
|
||
|
for j in xrange(k, n+1):
|
||
|
t += (x[j]**2 >> prec)
|
||
|
s[k] = sqrt_fixed(t, prec)
|
||
|
t = s[1]
|
||
|
y = x[:]
|
||
|
for k in xrange(1, n+1):
|
||
|
y[k] = (x[k] << prec) // t
|
||
|
s[k] = (s[k] << prec) // t
|
||
|
# step 3
|
||
|
for i in xrange(1, n+1):
|
||
|
for j in xrange(i+1, n):
|
||
|
H[i,j] = 0
|
||
|
if i <= n-1:
|
||
|
if s[i]:
|
||
|
H[i,i] = (s[i+1] << prec) // s[i]
|
||
|
else:
|
||
|
H[i,i] = 0
|
||
|
for j in range(1, i):
|
||
|
sjj1 = s[j]*s[j+1]
|
||
|
if sjj1:
|
||
|
H[i,j] = ((-y[i]*y[j])<<prec)//sjj1
|
||
|
else:
|
||
|
H[i,j] = 0
|
||
|
# step 4
|
||
|
for i in xrange(2, n+1):
|
||
|
for j in xrange(i-1, 0, -1):
|
||
|
#t = floor(H[i,j]/H[j,j] + 0.5)
|
||
|
if H[j,j]:
|
||
|
t = round_fixed((H[i,j] << prec)//H[j,j], prec)
|
||
|
else:
|
||
|
#t = 0
|
||
|
continue
|
||
|
y[j] = y[j] + (t*y[i] >> prec)
|
||
|
for k in xrange(1, j+1):
|
||
|
H[i,k] = H[i,k] - (t*H[j,k] >> prec)
|
||
|
for k in xrange(1, n+1):
|
||
|
A[i,k] = A[i,k] - (t*A[j,k] >> prec)
|
||
|
B[k,j] = B[k,j] + (t*B[k,i] >> prec)
|
||
|
# Main algorithm
|
||
|
for REP in range(maxsteps):
|
||
|
# Step 1
|
||
|
m = -1
|
||
|
szmax = -1
|
||
|
for i in range(1, n):
|
||
|
h = H[i,i]
|
||
|
sz = (g**i * abs(h)) >> (prec*(i-1))
|
||
|
if sz > szmax:
|
||
|
m = i
|
||
|
szmax = sz
|
||
|
# Step 2
|
||
|
y[m], y[m+1] = y[m+1], y[m]
|
||
|
for i in xrange(1,n+1): H[m,i], H[m+1,i] = H[m+1,i], H[m,i]
|
||
|
for i in xrange(1,n+1): A[m,i], A[m+1,i] = A[m+1,i], A[m,i]
|
||
|
for i in xrange(1,n+1): B[i,m], B[i,m+1] = B[i,m+1], B[i,m]
|
||
|
# Step 3
|
||
|
if m <= n - 2:
|
||
|
t0 = sqrt_fixed((H[m,m]**2 + H[m,m+1]**2)>>prec, prec)
|
||
|
# A zero element probably indicates that the precision has
|
||
|
# been exhausted. XXX: this could be spurious, due to
|
||
|
# using fixed-point arithmetic
|
||
|
if not t0:
|
||
|
break
|
||
|
t1 = (H[m,m] << prec) // t0
|
||
|
t2 = (H[m,m+1] << prec) // t0
|
||
|
for i in xrange(m, n+1):
|
||
|
t3 = H[i,m]
|
||
|
t4 = H[i,m+1]
|
||
|
H[i,m] = (t1*t3+t2*t4) >> prec
|
||
|
H[i,m+1] = (-t2*t3+t1*t4) >> prec
|
||
|
# Step 4
|
||
|
for i in xrange(m+1, n+1):
|
||
|
for j in xrange(min(i-1, m+1), 0, -1):
|
||
|
try:
|
||
|
t = round_fixed((H[i,j] << prec)//H[j,j], prec)
|
||
|
# Precision probably exhausted
|
||
|
except ZeroDivisionError:
|
||
|
break
|
||
|
y[j] = y[j] + ((t*y[i]) >> prec)
|
||
|
for k in xrange(1, j+1):
|
||
|
H[i,k] = H[i,k] - (t*H[j,k] >> prec)
|
||
|
for k in xrange(1, n+1):
|
||
|
A[i,k] = A[i,k] - (t*A[j,k] >> prec)
|
||
|
B[k,j] = B[k,j] + (t*B[k,i] >> prec)
|
||
|
# Until a relation is found, the error typically decreases
|
||
|
# slowly (e.g. a factor 1-10) with each step TODO: we could
|
||
|
# compare err from two successive iterations. If there is a
|
||
|
# large drop (several orders of magnitude), that indicates a
|
||
|
# "high quality" relation was detected. Reporting this to
|
||
|
# the user somehow might be useful.
|
||
|
best_err = maxcoeff<<prec
|
||
|
for i in xrange(1, n+1):
|
||
|
err = abs(y[i])
|
||
|
# Maybe we are done?
|
||
|
if err < tol:
|
||
|
# We are done if the coefficients are acceptable
|
||
|
vec = [int(round_fixed(B[j,i], prec) >> prec) for j in \
|
||
|
range(1,n+1)]
|
||
|
if max(abs(v) for v in vec) < maxcoeff:
|
||
|
if verbose:
|
||
|
print("FOUND relation at iter %i/%i, error: %s" % \
|
||
|
(REP, maxsteps, ctx.nstr(err / ctx.mpf(2)**prec, 1)))
|
||
|
return vec
|
||
|
best_err = min(err, best_err)
|
||
|
# Calculate a lower bound for the norm. We could do this
|
||
|
# more exactly (using the Euclidean norm) but there is probably
|
||
|
# no practical benefit.
|
||
|
recnorm = max(abs(h) for h in H.values())
|
||
|
if recnorm:
|
||
|
norm = ((1 << (2*prec)) // recnorm) >> prec
|
||
|
norm //= 100
|
||
|
else:
|
||
|
norm = ctx.inf
|
||
|
if verbose:
|
||
|
print("%i/%i: Error: %8s Norm: %s" % \
|
||
|
(REP, maxsteps, ctx.nstr(best_err / ctx.mpf(2)**prec, 1), norm))
|
||
|
if norm >= maxcoeff:
|
||
|
break
|
||
|
if verbose:
|
||
|
print("CANCELLING after step %i/%i." % (REP, maxsteps))
|
||
|
print("Could not find an integer relation. Norm bound: %s" % norm)
|
||
|
return None
|
||
|
|
||
|
def findpoly(ctx, x, n=1, **kwargs):
|
||
|
r"""
|
||
|
``findpoly(x, n)`` returns the coefficients of an integer
|
||
|
polynomial `P` of degree at most `n` such that `P(x) \approx 0`.
|
||
|
If no polynomial having `x` as a root can be found,
|
||
|
:func:`~mpmath.findpoly` returns ``None``.
|
||
|
|
||
|
:func:`~mpmath.findpoly` works by successively calling :func:`~mpmath.pslq` with
|
||
|
the vectors `[1, x]`, `[1, x, x^2]`, `[1, x, x^2, x^3]`, ...,
|
||
|
`[1, x, x^2, .., x^n]` as input. Keyword arguments given to
|
||
|
:func:`~mpmath.findpoly` are forwarded verbatim to :func:`~mpmath.pslq`. In
|
||
|
particular, you can specify a tolerance for `P(x)` with ``tol``
|
||
|
and a maximum permitted coefficient size with ``maxcoeff``.
|
||
|
|
||
|
For large values of `n`, it is recommended to run :func:`~mpmath.findpoly`
|
||
|
at high precision; preferably 50 digits or more.
|
||
|
|
||
|
**Examples**
|
||
|
|
||
|
By default (degree `n = 1`), :func:`~mpmath.findpoly` simply finds a linear
|
||
|
polynomial with a rational root::
|
||
|
|
||
|
>>> from mpmath import *
|
||
|
>>> mp.dps = 15; mp.pretty = True
|
||
|
>>> findpoly(0.7)
|
||
|
[-10, 7]
|
||
|
|
||
|
The generated coefficient list is valid input to ``polyval`` and
|
||
|
``polyroots``::
|
||
|
|
||
|
>>> nprint(polyval(findpoly(phi, 2), phi), 1)
|
||
|
-2.0e-16
|
||
|
>>> for r in polyroots(findpoly(phi, 2)):
|
||
|
... print(r)
|
||
|
...
|
||
|
-0.618033988749895
|
||
|
1.61803398874989
|
||
|
|
||
|
Numbers of the form `m + n \sqrt p` for integers `(m, n, p)` are
|
||
|
solutions to quadratic equations. As we find here, `1+\sqrt 2`
|
||
|
is a root of the polynomial `x^2 - 2x - 1`::
|
||
|
|
||
|
>>> findpoly(1+sqrt(2), 2)
|
||
|
[1, -2, -1]
|
||
|
>>> findroot(lambda x: x**2 - 2*x - 1, 1)
|
||
|
2.4142135623731
|
||
|
|
||
|
Despite only containing square roots, the following number results
|
||
|
in a polynomial of degree 4::
|
||
|
|
||
|
>>> findpoly(sqrt(2)+sqrt(3), 4)
|
||
|
[1, 0, -10, 0, 1]
|
||
|
|
||
|
In fact, `x^4 - 10x^2 + 1` is the *minimal polynomial* of
|
||
|
`r = \sqrt 2 + \sqrt 3`, meaning that a rational polynomial of
|
||
|
lower degree having `r` as a root does not exist. Given sufficient
|
||
|
precision, :func:`~mpmath.findpoly` will usually find the correct
|
||
|
minimal polynomial of a given algebraic number.
|
||
|
|
||
|
**Non-algebraic numbers**
|
||
|
|
||
|
If :func:`~mpmath.findpoly` fails to find a polynomial with given
|
||
|
coefficient size and tolerance constraints, that means no such
|
||
|
polynomial exists.
|
||
|
|
||
|
We can verify that `\pi` is not an algebraic number of degree 3 with
|
||
|
coefficients less than 1000::
|
||
|
|
||
|
>>> mp.dps = 15
|
||
|
>>> findpoly(pi, 3)
|
||
|
>>>
|
||
|
|
||
|
It is always possible to find an algebraic approximation of a number
|
||
|
using one (or several) of the following methods:
|
||
|
|
||
|
1. Increasing the permitted degree
|
||
|
2. Allowing larger coefficients
|
||
|
3. Reducing the tolerance
|
||
|
|
||
|
One example of each method is shown below::
|
||
|
|
||
|
>>> mp.dps = 15
|
||
|
>>> findpoly(pi, 4)
|
||
|
[95, -545, 863, -183, -298]
|
||
|
>>> findpoly(pi, 3, maxcoeff=10000)
|
||
|
[836, -1734, -2658, -457]
|
||
|
>>> findpoly(pi, 3, tol=1e-7)
|
||
|
[-4, 22, -29, -2]
|
||
|
|
||
|
It is unknown whether Euler's constant is transcendental (or even
|
||
|
irrational). We can use :func:`~mpmath.findpoly` to check that if is
|
||
|
an algebraic number, its minimal polynomial must have degree
|
||
|
at least 7 and a coefficient of magnitude at least 1000000::
|
||
|
|
||
|
>>> mp.dps = 200
|
||
|
>>> findpoly(euler, 6, maxcoeff=10**6, tol=1e-100, maxsteps=1000)
|
||
|
>>>
|
||
|
|
||
|
Note that the high precision and strict tolerance is necessary
|
||
|
for such high-degree runs, since otherwise unwanted low-accuracy
|
||
|
approximations will be detected. It may also be necessary to set
|
||
|
maxsteps high to prevent a premature exit (before the coefficient
|
||
|
bound has been reached). Running with ``verbose=True`` to get an
|
||
|
idea what is happening can be useful.
|
||
|
"""
|
||
|
x = ctx.mpf(x)
|
||
|
if n < 1:
|
||
|
raise ValueError("n cannot be less than 1")
|
||
|
if x == 0:
|
||
|
return [1, 0]
|
||
|
xs = [ctx.mpf(1)]
|
||
|
for i in range(1,n+1):
|
||
|
xs.append(x**i)
|
||
|
a = ctx.pslq(xs, **kwargs)
|
||
|
if a is not None:
|
||
|
return a[::-1]
|
||
|
|
||
|
def fracgcd(p, q):
|
||
|
x, y = p, q
|
||
|
while y:
|
||
|
x, y = y, x % y
|
||
|
if x != 1:
|
||
|
p //= x
|
||
|
q //= x
|
||
|
if q == 1:
|
||
|
return p
|
||
|
return p, q
|
||
|
|
||
|
def pslqstring(r, constants):
|
||
|
q = r[0]
|
||
|
r = r[1:]
|
||
|
s = []
|
||
|
for i in range(len(r)):
|
||
|
p = r[i]
|
||
|
if p:
|
||
|
z = fracgcd(-p,q)
|
||
|
cs = constants[i][1]
|
||
|
if cs == '1':
|
||
|
cs = ''
|
||
|
else:
|
||
|
cs = '*' + cs
|
||
|
if isinstance(z, int_types):
|
||
|
if z > 0: term = str(z) + cs
|
||
|
else: term = ("(%s)" % z) + cs
|
||
|
else:
|
||
|
term = ("(%s/%s)" % z) + cs
|
||
|
s.append(term)
|
||
|
s = ' + '.join(s)
|
||
|
if '+' in s or '*' in s:
|
||
|
s = '(' + s + ')'
|
||
|
return s or '0'
|
||
|
|
||
|
def prodstring(r, constants):
|
||
|
q = r[0]
|
||
|
r = r[1:]
|
||
|
num = []
|
||
|
den = []
|
||
|
for i in range(len(r)):
|
||
|
p = r[i]
|
||
|
if p:
|
||
|
z = fracgcd(-p,q)
|
||
|
cs = constants[i][1]
|
||
|
if isinstance(z, int_types):
|
||
|
if abs(z) == 1: t = cs
|
||
|
else: t = '%s**%s' % (cs, abs(z))
|
||
|
([num,den][z<0]).append(t)
|
||
|
else:
|
||
|
t = '%s**(%s/%s)' % (cs, abs(z[0]), z[1])
|
||
|
([num,den][z[0]<0]).append(t)
|
||
|
num = '*'.join(num)
|
||
|
den = '*'.join(den)
|
||
|
if num and den: return "(%s)/(%s)" % (num, den)
|
||
|
if num: return num
|
||
|
if den: return "1/(%s)" % den
|
||
|
|
||
|
def quadraticstring(ctx,t,a,b,c):
|
||
|
if c < 0:
|
||
|
a,b,c = -a,-b,-c
|
||
|
u1 = (-b+ctx.sqrt(b**2-4*a*c))/(2*c)
|
||
|
u2 = (-b-ctx.sqrt(b**2-4*a*c))/(2*c)
|
||
|
if abs(u1-t) < abs(u2-t):
|
||
|
if b: s = '((%s+sqrt(%s))/%s)' % (-b,b**2-4*a*c,2*c)
|
||
|
else: s = '(sqrt(%s)/%s)' % (-4*a*c,2*c)
|
||
|
else:
|
||
|
if b: s = '((%s-sqrt(%s))/%s)' % (-b,b**2-4*a*c,2*c)
|
||
|
else: s = '(-sqrt(%s)/%s)' % (-4*a*c,2*c)
|
||
|
return s
|
||
|
|
||
|
# Transformation y = f(x,c), with inverse function x = f(y,c)
|
||
|
# The third entry indicates whether the transformation is
|
||
|
# redundant when c = 1
|
||
|
transforms = [
|
||
|
(lambda ctx,x,c: x*c, '$y/$c', 0),
|
||
|
(lambda ctx,x,c: x/c, '$c*$y', 1),
|
||
|
(lambda ctx,x,c: c/x, '$c/$y', 0),
|
||
|
(lambda ctx,x,c: (x*c)**2, 'sqrt($y)/$c', 0),
|
||
|
(lambda ctx,x,c: (x/c)**2, '$c*sqrt($y)', 1),
|
||
|
(lambda ctx,x,c: (c/x)**2, '$c/sqrt($y)', 0),
|
||
|
(lambda ctx,x,c: c*x**2, 'sqrt($y)/sqrt($c)', 1),
|
||
|
(lambda ctx,x,c: x**2/c, 'sqrt($c)*sqrt($y)', 1),
|
||
|
(lambda ctx,x,c: c/x**2, 'sqrt($c)/sqrt($y)', 1),
|
||
|
(lambda ctx,x,c: ctx.sqrt(x*c), '$y**2/$c', 0),
|
||
|
(lambda ctx,x,c: ctx.sqrt(x/c), '$c*$y**2', 1),
|
||
|
(lambda ctx,x,c: ctx.sqrt(c/x), '$c/$y**2', 0),
|
||
|
(lambda ctx,x,c: c*ctx.sqrt(x), '$y**2/$c**2', 1),
|
||
|
(lambda ctx,x,c: ctx.sqrt(x)/c, '$c**2*$y**2', 1),
|
||
|
(lambda ctx,x,c: c/ctx.sqrt(x), '$c**2/$y**2', 1),
|
||
|
(lambda ctx,x,c: ctx.exp(x*c), 'log($y)/$c', 0),
|
||
|
(lambda ctx,x,c: ctx.exp(x/c), '$c*log($y)', 1),
|
||
|
(lambda ctx,x,c: ctx.exp(c/x), '$c/log($y)', 0),
|
||
|
(lambda ctx,x,c: c*ctx.exp(x), 'log($y/$c)', 1),
|
||
|
(lambda ctx,x,c: ctx.exp(x)/c, 'log($c*$y)', 1),
|
||
|
(lambda ctx,x,c: c/ctx.exp(x), 'log($c/$y)', 0),
|
||
|
(lambda ctx,x,c: ctx.ln(x*c), 'exp($y)/$c', 0),
|
||
|
(lambda ctx,x,c: ctx.ln(x/c), '$c*exp($y)', 1),
|
||
|
(lambda ctx,x,c: ctx.ln(c/x), '$c/exp($y)', 0),
|
||
|
(lambda ctx,x,c: c*ctx.ln(x), 'exp($y/$c)', 1),
|
||
|
(lambda ctx,x,c: ctx.ln(x)/c, 'exp($c*$y)', 1),
|
||
|
(lambda ctx,x,c: c/ctx.ln(x), 'exp($c/$y)', 0),
|
||
|
]
|
||
|
|
||
|
def identify(ctx, x, constants=[], tol=None, maxcoeff=1000, full=False,
|
||
|
verbose=False):
|
||
|
r"""
|
||
|
Given a real number `x`, ``identify(x)`` attempts to find an exact
|
||
|
formula for `x`. This formula is returned as a string. If no match
|
||
|
is found, ``None`` is returned. With ``full=True``, a list of
|
||
|
matching formulas is returned.
|
||
|
|
||
|
As a simple example, :func:`~mpmath.identify` will find an algebraic
|
||
|
formula for the golden ratio::
|
||
|
|
||
|
>>> from mpmath import *
|
||
|
>>> mp.dps = 15; mp.pretty = True
|
||
|
>>> identify(phi)
|
||
|
'((1+sqrt(5))/2)'
|
||
|
|
||
|
:func:`~mpmath.identify` can identify simple algebraic numbers and simple
|
||
|
combinations of given base constants, as well as certain basic
|
||
|
transformations thereof. More specifically, :func:`~mpmath.identify`
|
||
|
looks for the following:
|
||
|
|
||
|
1. Fractions
|
||
|
2. Quadratic algebraic numbers
|
||
|
3. Rational linear combinations of the base constants
|
||
|
4. Any of the above after first transforming `x` into `f(x)` where
|
||
|
`f(x)` is `1/x`, `\sqrt x`, `x^2`, `\log x` or `\exp x`, either
|
||
|
directly or with `x` or `f(x)` multiplied or divided by one of
|
||
|
the base constants
|
||
|
5. Products of fractional powers of the base constants and
|
||
|
small integers
|
||
|
|
||
|
Base constants can be given as a list of strings representing mpmath
|
||
|
expressions (:func:`~mpmath.identify` will ``eval`` the strings to numerical
|
||
|
values and use the original strings for the output), or as a dict of
|
||
|
formula:value pairs.
|
||
|
|
||
|
In order not to produce spurious results, :func:`~mpmath.identify` should
|
||
|
be used with high precision; preferably 50 digits or more.
|
||
|
|
||
|
**Examples**
|
||
|
|
||
|
Simple identifications can be performed safely at standard
|
||
|
precision. Here the default recognition of rational, algebraic,
|
||
|
and exp/log of algebraic numbers is demonstrated::
|
||
|
|
||
|
>>> mp.dps = 15
|
||
|
>>> identify(0.22222222222222222)
|
||
|
'(2/9)'
|
||
|
>>> identify(1.9662210973805663)
|
||
|
'sqrt(((24+sqrt(48))/8))'
|
||
|
>>> identify(4.1132503787829275)
|
||
|
'exp((sqrt(8)/2))'
|
||
|
>>> identify(0.881373587019543)
|
||
|
'log(((2+sqrt(8))/2))'
|
||
|
|
||
|
By default, :func:`~mpmath.identify` does not recognize `\pi`. At standard
|
||
|
precision it finds a not too useful approximation. At slightly
|
||
|
increased precision, this approximation is no longer accurate
|
||
|
enough and :func:`~mpmath.identify` more correctly returns ``None``::
|
||
|
|
||
|
>>> identify(pi)
|
||
|
'(2**(176/117)*3**(20/117)*5**(35/39))/(7**(92/117))'
|
||
|
>>> mp.dps = 30
|
||
|
>>> identify(pi)
|
||
|
>>>
|
||
|
|
||
|
Numbers such as `\pi`, and simple combinations of user-defined
|
||
|
constants, can be identified if they are provided explicitly::
|
||
|
|
||
|
>>> identify(3*pi-2*e, ['pi', 'e'])
|
||
|
'(3*pi + (-2)*e)'
|
||
|
|
||
|
Here is an example using a dict of constants. Note that the
|
||
|
constants need not be "atomic"; :func:`~mpmath.identify` can just
|
||
|
as well express the given number in terms of expressions
|
||
|
given by formulas::
|
||
|
|
||
|
>>> identify(pi+e, {'a':pi+2, 'b':2*e})
|
||
|
'((-2) + 1*a + (1/2)*b)'
|
||
|
|
||
|
Next, we attempt some identifications with a set of base constants.
|
||
|
It is necessary to increase the precision a bit.
|
||
|
|
||
|
>>> mp.dps = 50
|
||
|
>>> base = ['sqrt(2)','pi','log(2)']
|
||
|
>>> identify(0.25, base)
|
||
|
'(1/4)'
|
||
|
>>> identify(3*pi + 2*sqrt(2) + 5*log(2)/7, base)
|
||
|
'(2*sqrt(2) + 3*pi + (5/7)*log(2))'
|
||
|
>>> identify(exp(pi+2), base)
|
||
|
'exp((2 + 1*pi))'
|
||
|
>>> identify(1/(3+sqrt(2)), base)
|
||
|
'((3/7) + (-1/7)*sqrt(2))'
|
||
|
>>> identify(sqrt(2)/(3*pi+4), base)
|
||
|
'sqrt(2)/(4 + 3*pi)'
|
||
|
>>> identify(5**(mpf(1)/3)*pi*log(2)**2, base)
|
||
|
'5**(1/3)*pi*log(2)**2'
|
||
|
|
||
|
An example of an erroneous solution being found when too low
|
||
|
precision is used::
|
||
|
|
||
|
>>> mp.dps = 15
|
||
|
>>> identify(1/(3*pi-4*e+sqrt(8)), ['pi', 'e', 'sqrt(2)'])
|
||
|
'((11/25) + (-158/75)*pi + (76/75)*e + (44/15)*sqrt(2))'
|
||
|
>>> mp.dps = 50
|
||
|
>>> identify(1/(3*pi-4*e+sqrt(8)), ['pi', 'e', 'sqrt(2)'])
|
||
|
'1/(3*pi + (-4)*e + 2*sqrt(2))'
|
||
|
|
||
|
**Finding approximate solutions**
|
||
|
|
||
|
The tolerance ``tol`` defaults to 3/4 of the working precision.
|
||
|
Lowering the tolerance is useful for finding approximate matches.
|
||
|
We can for example try to generate approximations for pi::
|
||
|
|
||
|
>>> mp.dps = 15
|
||
|
>>> identify(pi, tol=1e-2)
|
||
|
'(22/7)'
|
||
|
>>> identify(pi, tol=1e-3)
|
||
|
'(355/113)'
|
||
|
>>> identify(pi, tol=1e-10)
|
||
|
'(5**(339/269))/(2**(64/269)*3**(13/269)*7**(92/269))'
|
||
|
|
||
|
With ``full=True``, and by supplying a few base constants,
|
||
|
``identify`` can generate almost endless lists of approximations
|
||
|
for any number (the output below has been truncated to show only
|
||
|
the first few)::
|
||
|
|
||
|
>>> for p in identify(pi, ['e', 'catalan'], tol=1e-5, full=True):
|
||
|
... print(p)
|
||
|
... # doctest: +ELLIPSIS
|
||
|
e/log((6 + (-4/3)*e))
|
||
|
(3**3*5*e*catalan**2)/(2*7**2)
|
||
|
sqrt(((-13) + 1*e + 22*catalan))
|
||
|
log(((-6) + 24*e + 4*catalan)/e)
|
||
|
exp(catalan*((-1/5) + (8/15)*e))
|
||
|
catalan*(6 + (-6)*e + 15*catalan)
|
||
|
sqrt((5 + 26*e + (-3)*catalan))/e
|
||
|
e*sqrt(((-27) + 2*e + 25*catalan))
|
||
|
log(((-1) + (-11)*e + 59*catalan))
|
||
|
((3/20) + (21/20)*e + (3/20)*catalan)
|
||
|
...
|
||
|
|
||
|
The numerical values are roughly as close to `\pi` as permitted by the
|
||
|
specified tolerance:
|
||
|
|
||
|
>>> e/log(6-4*e/3)
|
||
|
3.14157719846001
|
||
|
>>> 135*e*catalan**2/98
|
||
|
3.14166950419369
|
||
|
>>> sqrt(e-13+22*catalan)
|
||
|
3.14158000062992
|
||
|
>>> log(24*e-6+4*catalan)-1
|
||
|
3.14158791577159
|
||
|
|
||
|
**Symbolic processing**
|
||
|
|
||
|
The output formula can be evaluated as a Python expression.
|
||
|
Note however that if fractions (like '2/3') are present in
|
||
|
the formula, Python's :func:`~mpmath.eval()` may erroneously perform
|
||
|
integer division. Note also that the output is not necessarily
|
||
|
in the algebraically simplest form::
|
||
|
|
||
|
>>> identify(sqrt(2))
|
||
|
'(sqrt(8)/2)'
|
||
|
|
||
|
As a solution to both problems, consider using SymPy's
|
||
|
:func:`~mpmath.sympify` to convert the formula into a symbolic expression.
|
||
|
SymPy can be used to pretty-print or further simplify the formula
|
||
|
symbolically::
|
||
|
|
||
|
>>> from sympy import sympify # doctest: +SKIP
|
||
|
>>> sympify(identify(sqrt(2))) # doctest: +SKIP
|
||
|
2**(1/2)
|
||
|
|
||
|
Sometimes :func:`~mpmath.identify` can simplify an expression further than
|
||
|
a symbolic algorithm::
|
||
|
|
||
|
>>> from sympy import simplify # doctest: +SKIP
|
||
|
>>> x = sympify('-1/(-3/2+(1/2)*5**(1/2))*(3/2-1/2*5**(1/2))**(1/2)') # doctest: +SKIP
|
||
|
>>> x # doctest: +SKIP
|
||
|
(3/2 - 5**(1/2)/2)**(-1/2)
|
||
|
>>> x = simplify(x) # doctest: +SKIP
|
||
|
>>> x # doctest: +SKIP
|
||
|
2/(6 - 2*5**(1/2))**(1/2)
|
||
|
>>> mp.dps = 30 # doctest: +SKIP
|
||
|
>>> x = sympify(identify(x.evalf(30))) # doctest: +SKIP
|
||
|
>>> x # doctest: +SKIP
|
||
|
1/2 + 5**(1/2)/2
|
||
|
|
||
|
(In fact, this functionality is available directly in SymPy as the
|
||
|
function :func:`~mpmath.nsimplify`, which is essentially a wrapper for
|
||
|
:func:`~mpmath.identify`.)
|
||
|
|
||
|
**Miscellaneous issues and limitations**
|
||
|
|
||
|
The input `x` must be a real number. All base constants must be
|
||
|
positive real numbers and must not be rationals or rational linear
|
||
|
combinations of each other.
|
||
|
|
||
|
The worst-case computation time grows quickly with the number of
|
||
|
base constants. Already with 3 or 4 base constants,
|
||
|
:func:`~mpmath.identify` may require several seconds to finish. To search
|
||
|
for relations among a large number of constants, you should
|
||
|
consider using :func:`~mpmath.pslq` directly.
|
||
|
|
||
|
The extended transformations are applied to x, not the constants
|
||
|
separately. As a result, ``identify`` will for example be able to
|
||
|
recognize ``exp(2*pi+3)`` with ``pi`` given as a base constant, but
|
||
|
not ``2*exp(pi)+3``. It will be able to recognize the latter if
|
||
|
``exp(pi)`` is given explicitly as a base constant.
|
||
|
|
||
|
"""
|
||
|
|
||
|
solutions = []
|
||
|
|
||
|
def addsolution(s):
|
||
|
if verbose: print("Found: ", s)
|
||
|
solutions.append(s)
|
||
|
|
||
|
x = ctx.mpf(x)
|
||
|
|
||
|
# Further along, x will be assumed positive
|
||
|
if x == 0:
|
||
|
if full: return ['0']
|
||
|
else: return '0'
|
||
|
if x < 0:
|
||
|
sol = ctx.identify(-x, constants, tol, maxcoeff, full, verbose)
|
||
|
if sol is None:
|
||
|
return sol
|
||
|
if full:
|
||
|
return ["-(%s)"%s for s in sol]
|
||
|
else:
|
||
|
return "-(%s)" % sol
|
||
|
|
||
|
if tol:
|
||
|
tol = ctx.mpf(tol)
|
||
|
else:
|
||
|
tol = ctx.eps**0.7
|
||
|
M = maxcoeff
|
||
|
|
||
|
if constants:
|
||
|
if isinstance(constants, dict):
|
||
|
constants = [(ctx.mpf(v), name) for (name, v) in sorted(constants.items())]
|
||
|
else:
|
||
|
namespace = dict((name, getattr(ctx,name)) for name in dir(ctx))
|
||
|
constants = [(eval(p, namespace), p) for p in constants]
|
||
|
else:
|
||
|
constants = []
|
||
|
|
||
|
# We always want to find at least rational terms
|
||
|
if 1 not in [value for (name, value) in constants]:
|
||
|
constants = [(ctx.mpf(1), '1')] + constants
|
||
|
|
||
|
# PSLQ with simple algebraic and functional transformations
|
||
|
for ft, ftn, red in transforms:
|
||
|
for c, cn in constants:
|
||
|
if red and cn == '1':
|
||
|
continue
|
||
|
t = ft(ctx,x,c)
|
||
|
# Prevent exponential transforms from wreaking havoc
|
||
|
if abs(t) > M**2 or abs(t) < tol:
|
||
|
continue
|
||
|
# Linear combination of base constants
|
||
|
r = ctx.pslq([t] + [a[0] for a in constants], tol, M)
|
||
|
s = None
|
||
|
if r is not None and max(abs(uw) for uw in r) <= M and r[0]:
|
||
|
s = pslqstring(r, constants)
|
||
|
# Quadratic algebraic numbers
|
||
|
else:
|
||
|
q = ctx.pslq([ctx.one, t, t**2], tol, M)
|
||
|
if q is not None and len(q) == 3 and q[2]:
|
||
|
aa, bb, cc = q
|
||
|
if max(abs(aa),abs(bb),abs(cc)) <= M:
|
||
|
s = quadraticstring(ctx,t,aa,bb,cc)
|
||
|
if s:
|
||
|
if cn == '1' and ('/$c' in ftn):
|
||
|
s = ftn.replace('$y', s).replace('/$c', '')
|
||
|
else:
|
||
|
s = ftn.replace('$y', s).replace('$c', cn)
|
||
|
addsolution(s)
|
||
|
if not full: return solutions[0]
|
||
|
|
||
|
if verbose:
|
||
|
print(".")
|
||
|
|
||
|
# Check for a direct multiplicative formula
|
||
|
if x != 1:
|
||
|
# Allow fractional powers of fractions
|
||
|
ilogs = [2,3,5,7]
|
||
|
# Watch out for existing fractional powers of fractions
|
||
|
logs = []
|
||
|
for a, s in constants:
|
||
|
if not sum(bool(ctx.findpoly(ctx.ln(a)/ctx.ln(i),1)) for i in ilogs):
|
||
|
logs.append((ctx.ln(a), s))
|
||
|
logs = [(ctx.ln(i),str(i)) for i in ilogs] + logs
|
||
|
r = ctx.pslq([ctx.ln(x)] + [a[0] for a in logs], tol, M)
|
||
|
if r is not None and max(abs(uw) for uw in r) <= M and r[0]:
|
||
|
addsolution(prodstring(r, logs))
|
||
|
if not full: return solutions[0]
|
||
|
|
||
|
if full:
|
||
|
return sorted(solutions, key=len)
|
||
|
else:
|
||
|
return None
|
||
|
|
||
|
IdentificationMethods.pslq = pslq
|
||
|
IdentificationMethods.findpoly = findpoly
|
||
|
IdentificationMethods.identify = identify
|
||
|
|
||
|
|
||
|
if __name__ == '__main__':
|
||
|
import doctest
|
||
|
doctest.testmod()
|