forked from OSchip/llvm-project
1336 lines
48 KiB
Julia
1336 lines
48 KiB
Julia
|
#!/usr/bin/env julia
|
|||
|
# -*- julia -*-
|
|||
|
|
|||
|
# remez.jl - implementation of the Remez algorithm for polynomial approximation
|
|||
|
#
|
|||
|
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|||
|
# See https://llvm.org/LICENSE.txt for license information.
|
|||
|
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|||
|
|
|||
|
import Base.\
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Helper functions to cope with different Julia versions.
|
|||
|
if VERSION >= v"0.7.0"
|
|||
|
array1d(T, d) = Array{T, 1}(undef, d)
|
|||
|
array2d(T, d1, d2) = Array{T, 2}(undef, d1, d2)
|
|||
|
else
|
|||
|
array1d(T, d) = Array(T, d)
|
|||
|
array2d(T, d1, d2) = Array(T, d1, d2)
|
|||
|
end
|
|||
|
if VERSION < v"0.5.0"
|
|||
|
String = ASCIIString
|
|||
|
end
|
|||
|
if VERSION >= v"0.6.0"
|
|||
|
# Use Base.invokelatest to run functions made using eval(), to
|
|||
|
# avoid "world age" error
|
|||
|
run(f, x...) = Base.invokelatest(f, x...)
|
|||
|
else
|
|||
|
# Prior to 0.6.0, invokelatest doesn't exist (but fortunately the
|
|||
|
# world age problem also doesn't seem to exist)
|
|||
|
run(f, x...) = f(x...)
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Global variables configured by command-line options.
|
|||
|
floatsuffix = "" # adjusted by --floatsuffix
|
|||
|
xvarname = "x" # adjusted by --variable
|
|||
|
epsbits = 256 # adjusted by --bits
|
|||
|
debug_facilities = Set() # adjusted by --debug
|
|||
|
full_output = false # adjusted by --full
|
|||
|
array_format = false # adjusted by --array
|
|||
|
preliminary_commands = array1d(String, 0) # adjusted by --pre
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Diagnostic and utility functions.
|
|||
|
|
|||
|
# Enable debugging printouts from a particular subpart of this
|
|||
|
# program.
|
|||
|
#
|
|||
|
# Arguments:
|
|||
|
# facility Name of the facility to debug. For a list of facility names,
|
|||
|
# look through the code for calls to debug().
|
|||
|
#
|
|||
|
# Return value is a BigFloat.
|
|||
|
function enable_debug(facility)
|
|||
|
push!(debug_facilities, facility)
|
|||
|
end
|
|||
|
|
|||
|
# Print a diagnostic.
|
|||
|
#
|
|||
|
# Arguments:
|
|||
|
# facility Name of the facility for which this is a debug message.
|
|||
|
# printargs Arguments to println() if debugging of that facility is
|
|||
|
# enabled.
|
|||
|
macro debug(facility, printargs...)
|
|||
|
printit = quote
|
|||
|
print("[", $facility, "] ")
|
|||
|
end
|
|||
|
for arg in printargs
|
|||
|
printit = quote
|
|||
|
$printit
|
|||
|
print($(esc(arg)))
|
|||
|
end
|
|||
|
end
|
|||
|
return quote
|
|||
|
if $facility in debug_facilities
|
|||
|
$printit
|
|||
|
println()
|
|||
|
end
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
# Evaluate a polynomial.
|
|||
|
|
|||
|
# Arguments:
|
|||
|
# coeffs Array of BigFloats giving the coefficients of the polynomial.
|
|||
|
# Starts with the constant term, i.e. coeffs[i] is the
|
|||
|
# coefficient of x^(i-1) (because Julia arrays are 1-based).
|
|||
|
# x Point at which to evaluate the polynomial.
|
|||
|
#
|
|||
|
# Return value is a BigFloat.
|
|||
|
function poly_eval(coeffs::Array{BigFloat}, x::BigFloat)
|
|||
|
n = length(coeffs)
|
|||
|
if n == 0
|
|||
|
return BigFloat(0)
|
|||
|
elseif n == 1
|
|||
|
return coeffs[1]
|
|||
|
else
|
|||
|
return coeffs[1] + x * poly_eval(coeffs[2:n], x)
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
# Evaluate a rational function.
|
|||
|
|
|||
|
# Arguments:
|
|||
|
# ncoeffs Array of BigFloats giving the coefficients of the numerator.
|
|||
|
# Starts with the constant term, and 1-based, as above.
|
|||
|
# dcoeffs Array of BigFloats giving the coefficients of the denominator.
|
|||
|
# Starts with the constant term, and 1-based, as above.
|
|||
|
# x Point at which to evaluate the function.
|
|||
|
#
|
|||
|
# Return value is a BigFloat.
|
|||
|
function ratfn_eval(ncoeffs::Array{BigFloat}, dcoeffs::Array{BigFloat},
|
|||
|
x::BigFloat)
|
|||
|
return poly_eval(ncoeffs, x) / poly_eval(dcoeffs, x)
|
|||
|
end
|
|||
|
|
|||
|
# Format a BigFloat into an appropriate output format.
|
|||
|
# Arguments:
|
|||
|
# x BigFloat to format.
|
|||
|
#
|
|||
|
# Return value is a string.
|
|||
|
function float_to_str(x)
|
|||
|
return string(x) * floatsuffix
|
|||
|
end
|
|||
|
|
|||
|
# Format a polynomial into an arithmetic expression, for pasting into
|
|||
|
# other tools such as gnuplot.
|
|||
|
|
|||
|
# Arguments:
|
|||
|
# coeffs Array of BigFloats giving the coefficients of the polynomial.
|
|||
|
# Starts with the constant term, and 1-based, as above.
|
|||
|
#
|
|||
|
# Return value is a string.
|
|||
|
function poly_to_string(coeffs::Array{BigFloat})
|
|||
|
n = length(coeffs)
|
|||
|
if n == 0
|
|||
|
return "0"
|
|||
|
elseif n == 1
|
|||
|
return float_to_str(coeffs[1])
|
|||
|
else
|
|||
|
return string(float_to_str(coeffs[1]), "+", xvarname, "*(",
|
|||
|
poly_to_string(coeffs[2:n]), ")")
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
# Format a rational function into a string.
|
|||
|
|
|||
|
# Arguments:
|
|||
|
# ncoeffs Array of BigFloats giving the coefficients of the numerator.
|
|||
|
# Starts with the constant term, and 1-based, as above.
|
|||
|
# dcoeffs Array of BigFloats giving the coefficients of the denominator.
|
|||
|
# Starts with the constant term, and 1-based, as above.
|
|||
|
#
|
|||
|
# Return value is a string.
|
|||
|
function ratfn_to_string(ncoeffs::Array{BigFloat}, dcoeffs::Array{BigFloat})
|
|||
|
if length(dcoeffs) == 1 && dcoeffs[1] == 1
|
|||
|
# Special case: if the denominator is just 1, leave it out.
|
|||
|
return poly_to_string(ncoeffs)
|
|||
|
else
|
|||
|
return string("(", poly_to_string(ncoeffs), ")/(",
|
|||
|
poly_to_string(dcoeffs), ")")
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
# Format a list of x,y pairs into a string.
|
|||
|
|
|||
|
# Arguments:
|
|||
|
# xys Array of (x,y) pairs of BigFloats.
|
|||
|
#
|
|||
|
# Return value is a string.
|
|||
|
function format_xylist(xys::Array{Tuple{BigFloat,BigFloat}})
|
|||
|
return ("[\n" *
|
|||
|
join([" "*string(x)*" -> "*string(y) for (x,y) in xys], "\n") *
|
|||
|
"\n]")
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Matrix-equation solver for matrices of BigFloat.
|
|||
|
#
|
|||
|
# I had hoped that Julia's type-genericity would allow me to solve the
|
|||
|
# matrix equation Mx=V by just writing 'M \ V'. Unfortunately, that
|
|||
|
# works by translating the inputs into double precision and handing
|
|||
|
# off to an optimised library, which misses the point when I have a
|
|||
|
# matrix and vector of BigFloat and want my result in _better_ than
|
|||
|
# double precision. So I have to implement my own specialisation of
|
|||
|
# the \ operator for that case.
|
|||
|
#
|
|||
|
# Fortunately, the point of using BigFloats is that we have precision
|
|||
|
# to burn, so I can do completely naïve Gaussian elimination without
|
|||
|
# worrying about instability.
|
|||
|
|
|||
|
# Arguments:
|
|||
|
# matrix_in 2-dimensional array of BigFloats, representing a matrix M
|
|||
|
# in row-first order, i.e. matrix_in[r,c] represents the
|
|||
|
# entry in row r col c.
|
|||
|
# vector_in 1-dimensional array of BigFloats, representing a vector V.
|
|||
|
#
|
|||
|
# Return value: a 1-dimensional array X of BigFloats, satisfying M X = V.
|
|||
|
#
|
|||
|
# Expects the input to be an invertible square matrix and a vector of
|
|||
|
# the corresponding size, on pain of failing an assertion.
|
|||
|
function \(matrix_in :: Array{BigFloat,2},
|
|||
|
vector_in :: Array{BigFloat,1})
|
|||
|
# Copy the inputs, because we'll be mutating them as we go.
|
|||
|
M = copy(matrix_in)
|
|||
|
V = copy(vector_in)
|
|||
|
|
|||
|
# Input consistency criteria: matrix is square, and vector has
|
|||
|
# length to match.
|
|||
|
n = length(V)
|
|||
|
@assert(n > 0)
|
|||
|
@assert(size(M) == (n,n))
|
|||
|
|
|||
|
@debug("gausselim", "starting, n=", n)
|
|||
|
|
|||
|
for i = 1:1:n
|
|||
|
# Straightforward Gaussian elimination: find the largest
|
|||
|
# non-zero entry in column i (and in a row we haven't sorted
|
|||
|
# out already), swap it into row i, scale that row to
|
|||
|
# normalise it to 1, then zero out the rest of the column by
|
|||
|
# subtracting a multiple of that row from each other row.
|
|||
|
|
|||
|
@debug("gausselim", "matrix=", repr(M))
|
|||
|
@debug("gausselim", "vector=", repr(V))
|
|||
|
|
|||
|
# Find the best pivot.
|
|||
|
bestrow = 0
|
|||
|
bestval = 0
|
|||
|
for j = i:1:n
|
|||
|
if abs(M[j,i]) > bestval
|
|||
|
bestrow = j
|
|||
|
bestval = M[j,i]
|
|||
|
end
|
|||
|
end
|
|||
|
@assert(bestrow > 0) # make sure we did actually find one
|
|||
|
|
|||
|
@debug("gausselim", "bestrow=", bestrow)
|
|||
|
|
|||
|
# Swap it into row i.
|
|||
|
if bestrow != i
|
|||
|
for k = 1:1:n
|
|||
|
M[bestrow,k],M[i,k] = M[i,k],M[bestrow,k]
|
|||
|
end
|
|||
|
V[bestrow],V[i] = V[i],V[bestrow]
|
|||
|
end
|
|||
|
|
|||
|
# Scale that row so that M[i,i] becomes 1.
|
|||
|
divisor = M[i,i]
|
|||
|
for k = 1:1:n
|
|||
|
M[i,k] = M[i,k] / divisor
|
|||
|
end
|
|||
|
V[i] = V[i] / divisor
|
|||
|
@assert(M[i,i] == 1)
|
|||
|
|
|||
|
# Zero out all other entries in column i, by subtracting
|
|||
|
# multiples of this row.
|
|||
|
for j = 1:1:n
|
|||
|
if j != i
|
|||
|
factor = M[j,i]
|
|||
|
for k = 1:1:n
|
|||
|
M[j,k] = M[j,k] - M[i,k] * factor
|
|||
|
end
|
|||
|
V[j] = V[j] - V[i] * factor
|
|||
|
@assert(M[j,i] == 0)
|
|||
|
end
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
@debug("gausselim", "matrix=", repr(M))
|
|||
|
@debug("gausselim", "vector=", repr(V))
|
|||
|
@debug("gausselim", "done!")
|
|||
|
|
|||
|
# Now we're done: M is the identity matrix, so the equation Mx=V
|
|||
|
# becomes just x=V, i.e. V is already exactly the vector we want
|
|||
|
# to return.
|
|||
|
return V
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Least-squares fitting of a rational function to a set of (x,y)
|
|||
|
# points.
|
|||
|
#
|
|||
|
# We use this to get an initial starting point for the Remez
|
|||
|
# iteration. Therefore, it doesn't really need to be particularly
|
|||
|
# accurate; it only needs to be good enough to wiggle back and forth
|
|||
|
# across the target function the right number of times (so as to give
|
|||
|
# enough error extrema to start optimising from) and not have any
|
|||
|
# poles in the target interval.
|
|||
|
#
|
|||
|
# Least-squares fitting of a _polynomial_ is actually a sensible thing
|
|||
|
# to do, and minimises the rms error. Doing the following trick with a
|
|||
|
# rational function P/Q is less sensible, because it cannot be made to
|
|||
|
# minimise the error function (P/Q-f)^2 that you actually wanted;
|
|||
|
# instead it minimises (P-fQ)^2. But that should be good enough to
|
|||
|
# have the properties described above.
|
|||
|
#
|
|||
|
# Some theory: suppose you're trying to choose a set of parameters a_i
|
|||
|
# so as to minimise the sum of squares of some error function E_i.
|
|||
|
# Basic calculus says, if you do this in one variable, just
|
|||
|
# differentiate and solve for zero. In this case, that works fine even
|
|||
|
# with multiple variables, because you _partially_ differentiate with
|
|||
|
# respect to each a_i, giving a system of equations, and that system
|
|||
|
# turns out to be linear so we just solve it as a matrix.
|
|||
|
#
|
|||
|
# In this case, our parameters are the coefficients of P and Q; to
|
|||
|
# avoid underdetermining the system we'll fix Q's constant term at 1,
|
|||
|
# so that our error function (as described above) is
|
|||
|
#
|
|||
|
# E = \sum (p_0 + p_1 x + ... + p_n x^n - y - y q_1 x - ... - y q_d x^d)^2
|
|||
|
#
|
|||
|
# where the sum is over all (x,y) coordinate pairs. Setting dE/dp_j=0
|
|||
|
# (for each j) gives an equation of the form
|
|||
|
#
|
|||
|
# 0 = \sum 2(p_0 + p_1 x + ... + p_n x^n - y - y q_1 x - ... - y q_d x^d) x^j
|
|||
|
#
|
|||
|
# and setting dE/dq_j=0 gives one of the form
|
|||
|
#
|
|||
|
# 0 = \sum 2(p_0 + p_1 x + ... + p_n x^n - y - y q_1 x - ... - y q_d x^d) y x^j
|
|||
|
#
|
|||
|
# And both of those row types, treated as multivariate linear
|
|||
|
# equations in the p,q values, have each coefficient being a value of
|
|||
|
# the form \sum x^i, \sum y x^i or \sum y^2 x^i, for various i. (Times
|
|||
|
# a factor of 2, but we can throw that away.) So we can go through the
|
|||
|
# list of input coordinates summing all of those things, and then we
|
|||
|
# have enough information to construct our matrix and solve it
|
|||
|
# straight off for the rational function coefficients.
|
|||
|
|
|||
|
# Arguments:
|
|||
|
# f The function to be approximated. Maps BigFloat -> BigFloat.
|
|||
|
# xvals Array of BigFloats, giving the list of x-coordinates at which
|
|||
|
# to evaluate f.
|
|||
|
# n Degree of the numerator polynomial of the desired rational
|
|||
|
# function.
|
|||
|
# d Degree of the denominator polynomial of the desired rational
|
|||
|
# function.
|
|||
|
# w Error-weighting function. Takes two BigFloat arguments x,y
|
|||
|
# and returns a scaling factor for the error at that location.
|
|||
|
# A larger value indicates that the error should be given
|
|||
|
# greater weight in the square sum we try to minimise.
|
|||
|
# If unspecified, defaults to giving everything the same weight.
|
|||
|
#
|
|||
|
# Return values: a pair of arrays of BigFloats (N,D) giving the
|
|||
|
# coefficients of the returned rational function. N has size n+1; D
|
|||
|
# has size d+1. Both start with the constant term, i.e. N[i] is the
|
|||
|
# coefficient of x^(i-1) (because Julia arrays are 1-based). D[1] will
|
|||
|
# be 1.
|
|||
|
function ratfn_leastsquares(f::Function, xvals::Array{BigFloat}, n, d,
|
|||
|
w = (x,y)->BigFloat(1))
|
|||
|
# Accumulate sums of x^i y^j, for j={0,1,2} and a range of x.
|
|||
|
# Again because Julia arrays are 1-based, we'll have sums[i,j]
|
|||
|
# being the sum of x^(i-1) y^(j-1).
|
|||
|
maxpow = max(n,d) * 2 + 1
|
|||
|
sums = zeros(BigFloat, maxpow, 3)
|
|||
|
for x = xvals
|
|||
|
y = f(x)
|
|||
|
weight = w(x,y)
|
|||
|
for i = 1:1:maxpow
|
|||
|
for j = 1:1:3
|
|||
|
sums[i,j] += x^(i-1) * y^(j-1) * weight
|
|||
|
end
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
@debug("leastsquares", "sums=", repr(sums))
|
|||
|
|
|||
|
# Build the matrix. We're solving n+d+1 equations in n+d+1
|
|||
|
# unknowns. (We actually have to return n+d+2 coefficients, but
|
|||
|
# one of them is hardwired to 1.)
|
|||
|
matrix = array2d(BigFloat, n+d+1, n+d+1)
|
|||
|
vector = array1d(BigFloat, n+d+1)
|
|||
|
for i = 0:1:n
|
|||
|
# Equation obtained by differentiating with respect to p_i,
|
|||
|
# i.e. the numerator coefficient of x^i.
|
|||
|
row = 1+i
|
|||
|
for j = 0:1:n
|
|||
|
matrix[row, 1+j] = sums[1+i+j, 1]
|
|||
|
end
|
|||
|
for j = 1:1:d
|
|||
|
matrix[row, 1+n+j] = -sums[1+i+j, 2]
|
|||
|
end
|
|||
|
vector[row] = sums[1+i, 2]
|
|||
|
end
|
|||
|
for i = 1:1:d
|
|||
|
# Equation obtained by differentiating with respect to q_i,
|
|||
|
# i.e. the denominator coefficient of x^i.
|
|||
|
row = 1+n+i
|
|||
|
for j = 0:1:n
|
|||
|
matrix[row, 1+j] = sums[1+i+j, 2]
|
|||
|
end
|
|||
|
for j = 1:1:d
|
|||
|
matrix[row, 1+n+j] = -sums[1+i+j, 3]
|
|||
|
end
|
|||
|
vector[row] = sums[1+i, 3]
|
|||
|
end
|
|||
|
|
|||
|
@debug("leastsquares", "matrix=", repr(matrix))
|
|||
|
@debug("leastsquares", "vector=", repr(vector))
|
|||
|
|
|||
|
# Solve the matrix equation.
|
|||
|
all_coeffs = matrix \ vector
|
|||
|
|
|||
|
@debug("leastsquares", "all_coeffs=", repr(all_coeffs))
|
|||
|
|
|||
|
# And marshal the results into two separate polynomial vectors to
|
|||
|
# return.
|
|||
|
ncoeffs = all_coeffs[1:n+1]
|
|||
|
dcoeffs = vcat([1], all_coeffs[n+2:n+d+1])
|
|||
|
return (ncoeffs, dcoeffs)
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Golden-section search to find a maximum of a function.
|
|||
|
|
|||
|
# Arguments:
|
|||
|
# f Function to be maximised/minimised. Maps BigFloat -> BigFloat.
|
|||
|
# a,b,c BigFloats bracketing a maximum of the function.
|
|||
|
#
|
|||
|
# Expects:
|
|||
|
# a,b,c are in order (either a<=b<=c or c<=b<=a)
|
|||
|
# a != c (but b can equal one or the other if it wants to)
|
|||
|
# f(a) <= f(b) >= f(c)
|
|||
|
#
|
|||
|
# Return value is an (x,y) pair of BigFloats giving the extremal input
|
|||
|
# and output. (That is, y=f(x).)
|
|||
|
function goldensection(f::Function, a::BigFloat, b::BigFloat, c::BigFloat)
|
|||
|
# Decide on a 'good enough' threshold.
|
|||
|
threshold = abs(c-a) * 2^(-epsbits/2)
|
|||
|
|
|||
|
# We'll need the golden ratio phi, of course. Or rather, in this
|
|||
|
# case, we need 1/phi = 0.618...
|
|||
|
one_over_phi = 2 / (1 + sqrt(BigFloat(5)))
|
|||
|
|
|||
|
# Flip round the interval endpoints so that the interval [a,b] is
|
|||
|
# at least as large as [b,c]. (Then we can always pick our new
|
|||
|
# point in [a,b] without having to handle lots of special cases.)
|
|||
|
if abs(b-a) < abs(c-a)
|
|||
|
a, c = c, a
|
|||
|
end
|
|||
|
|
|||
|
# Evaluate the function at the initial points.
|
|||
|
fa = f(a)
|
|||
|
fb = f(b)
|
|||
|
fc = f(c)
|
|||
|
|
|||
|
@debug("goldensection", "starting")
|
|||
|
|
|||
|
while abs(c-a) > threshold
|
|||
|
@debug("goldensection", "a: ", a, " -> ", fa)
|
|||
|
@debug("goldensection", "b: ", b, " -> ", fb)
|
|||
|
@debug("goldensection", "c: ", c, " -> ", fc)
|
|||
|
|
|||
|
# Check invariants.
|
|||
|
@assert(a <= b <= c || c <= b <= a)
|
|||
|
@assert(fa <= fb >= fc)
|
|||
|
|
|||
|
# Subdivide the larger of the intervals [a,b] and [b,c]. We've
|
|||
|
# arranged that this is always [a,b], for simplicity.
|
|||
|
d = a + (b-a) * one_over_phi
|
|||
|
|
|||
|
# Now we have an interval looking like this (possibly
|
|||
|
# reversed):
|
|||
|
#
|
|||
|
# a d b c
|
|||
|
#
|
|||
|
# and we know f(b) is bigger than either f(a) or f(c). We have
|
|||
|
# two cases: either f(d) > f(b), or vice versa. In either
|
|||
|
# case, we can narrow to an interval of 1/phi the size, and
|
|||
|
# still satisfy all our invariants (three ordered points,
|
|||
|
# [a,b] at least the width of [b,c], f(a)<=f(b)>=f(c)).
|
|||
|
fd = f(d)
|
|||
|
@debug("goldensection", "d: ", d, " -> ", fd)
|
|||
|
if fd > fb
|
|||
|
a, b, c = a, d, b
|
|||
|
fa, fb, fc = fa, fd, fb
|
|||
|
@debug("goldensection", "adb case")
|
|||
|
else
|
|||
|
a, b, c = c, b, d
|
|||
|
fa, fb, fc = fc, fb, fd
|
|||
|
@debug("goldensection", "cbd case")
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
@debug("goldensection", "done: ", b, " -> ", fb)
|
|||
|
return (b, fb)
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Find the extrema of a function within a given interval.
|
|||
|
|
|||
|
# Arguments:
|
|||
|
# f The function to be approximated. Maps BigFloat -> BigFloat.
|
|||
|
# grid A set of points at which to evaluate f. Must be high enough
|
|||
|
# resolution to make extrema obvious.
|
|||
|
#
|
|||
|
# Returns an array of (x,y) pairs of BigFloats, with each x,y giving
|
|||
|
# the extremum location and its value (i.e. y=f(x)).
|
|||
|
function find_extrema(f::Function, grid::Array{BigFloat})
|
|||
|
len = length(grid)
|
|||
|
extrema = array1d(Tuple{BigFloat, BigFloat}, 0)
|
|||
|
for i = 1:1:len
|
|||
|
# We have to provide goldensection() with three points
|
|||
|
# bracketing the extremum. If the extremum is at one end of
|
|||
|
# the interval, then the only way we can do that is to set two
|
|||
|
# of the points equal (which goldensection() will cope with).
|
|||
|
prev = max(1, i-1)
|
|||
|
next = min(i+1, len)
|
|||
|
|
|||
|
# Find our three pairs of (x,y) coordinates.
|
|||
|
xp, xi, xn = grid[prev], grid[i], grid[next]
|
|||
|
yp, yi, yn = f(xp), f(xi), f(xn)
|
|||
|
|
|||
|
# See if they look like an extremum, and if so, ask
|
|||
|
# goldensection() to give a more exact location for it.
|
|||
|
if yp <= yi >= yn
|
|||
|
push!(extrema, goldensection(f, xp, xi, xn))
|
|||
|
elseif yp >= yi <= yn
|
|||
|
x, y = goldensection(x->-f(x), xp, xi, xn)
|
|||
|
push!(extrema, (x, -y))
|
|||
|
end
|
|||
|
end
|
|||
|
return extrema
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Winnow a list of a function's extrema to give a subsequence of a
|
|||
|
# specified length, with the extrema in the subsequence alternating
|
|||
|
# signs, and with the smallest absolute value of an extremum in the
|
|||
|
# subsequence as large as possible.
|
|||
|
#
|
|||
|
# We do this using a dynamic-programming approach. We work along the
|
|||
|
# provided array of extrema, and at all times, we track the best set
|
|||
|
# of extrema we have so far seen for each possible (length, sign of
|
|||
|
# last extremum) pair. Each new extremum is evaluated to see whether
|
|||
|
# it can be added to any previously seen best subsequence to make a
|
|||
|
# new subsequence that beats the previous record holder in its slot.
|
|||
|
|
|||
|
# Arguments:
|
|||
|
# extrema An array of (x,y) pairs of BigFloats giving the input extrema.
|
|||
|
# n Number of extrema required as output.
|
|||
|
#
|
|||
|
# Returns a new array of (x,y) pairs which is a subsequence of the
|
|||
|
# original sequence. (So, in particular, if the input was sorted by x
|
|||
|
# then so will the output be.)
|
|||
|
function winnow_extrema(extrema::Array{Tuple{BigFloat,BigFloat}}, n)
|
|||
|
# best[i,j] gives the best sequence so far of length i and with
|
|||
|
# sign j (where signs are coded as 1=positive, 2=negative), in the
|
|||
|
# form of a tuple (cost, actual array of x,y pairs).
|
|||
|
best = fill((BigFloat(0), array1d(Tuple{BigFloat,BigFloat}, 0)), n, 2)
|
|||
|
|
|||
|
for (x,y) = extrema
|
|||
|
if y > 0
|
|||
|
sign = 1
|
|||
|
elseif y < 0
|
|||
|
sign = 2
|
|||
|
else
|
|||
|
# A zero-valued extremum cannot possibly contribute to any
|
|||
|
# optimal sequence, so we simply ignore it!
|
|||
|
continue
|
|||
|
end
|
|||
|
|
|||
|
for i = 1:1:n
|
|||
|
# See if we can create a new entry for best[i,sign] by
|
|||
|
# appending our current (x,y) to some previous thing.
|
|||
|
if i == 1
|
|||
|
# Special case: we don't store a best zero-length
|
|||
|
# sequence :-)
|
|||
|
candidate = (abs(y), [(x,y)])
|
|||
|
else
|
|||
|
othersign = 3-sign # map 1->2 and 2->1
|
|||
|
oldscore, oldlist = best[i-1, othersign]
|
|||
|
newscore = min(abs(y), oldscore)
|
|||
|
newlist = vcat(oldlist, [(x,y)])
|
|||
|
candidate = (newscore, newlist)
|
|||
|
end
|
|||
|
# If our new candidate improves on the previous value of
|
|||
|
# best[i,sign], then replace it.
|
|||
|
if candidate[1] > best[i,sign][1]
|
|||
|
best[i,sign] = candidate
|
|||
|
end
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
# Our ultimate return value has to be either best[n,1] or
|
|||
|
# best[n,2], but it could be either. See which one has the higher
|
|||
|
# score.
|
|||
|
if best[n,1][1] > best[n,2][1]
|
|||
|
ret = best[n,1][2]
|
|||
|
else
|
|||
|
ret = best[n,2][2]
|
|||
|
end
|
|||
|
# Make sure we did actually _find_ a good answer.
|
|||
|
@assert(length(ret) == n)
|
|||
|
return ret
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Construct a rational-function approximation with equal and
|
|||
|
# alternating weighted deviation at a specific set of x-coordinates.
|
|||
|
|
|||
|
# Arguments:
|
|||
|
# f The function to be approximated. Maps BigFloat -> BigFloat.
|
|||
|
# coords An array of BigFloats giving the x-coordinates. There should
|
|||
|
# be n+d+2 of them.
|
|||
|
# n, d The degrees of the numerator and denominator of the desired
|
|||
|
# approximation.
|
|||
|
# prev_err A plausible value for the alternating weighted deviation.
|
|||
|
# (Required to kickstart a binary search in the nonlinear case;
|
|||
|
# see comments below.)
|
|||
|
# w Error-weighting function. Takes two BigFloat arguments x,y
|
|||
|
# and returns a scaling factor for the error at that location.
|
|||
|
# The returned approximation R should have the minimum possible
|
|||
|
# maximum value of abs((f(x)-R(x)) * w(x,f(x))). Optional
|
|||
|
# parameter, defaulting to the always-return-1 function.
|
|||
|
#
|
|||
|
# Return values: a pair of arrays of BigFloats (N,D) giving the
|
|||
|
# coefficients of the returned rational function. N has size n+1; D
|
|||
|
# has size d+1. Both start with the constant term, i.e. N[i] is the
|
|||
|
# coefficient of x^(i-1) (because Julia arrays are 1-based). D[1] will
|
|||
|
# be 1.
|
|||
|
function ratfn_equal_deviation(f::Function, coords::Array{BigFloat},
|
|||
|
n, d, prev_err::BigFloat,
|
|||
|
w = (x,y)->BigFloat(1))
|
|||
|
@debug("equaldev", "n=", n, " d=", d, " coords=", repr(coords))
|
|||
|
@assert(length(coords) == n+d+2)
|
|||
|
|
|||
|
if d == 0
|
|||
|
# Special case: we're after a polynomial. In this case, we
|
|||
|
# have the particularly easy job of just constructing and
|
|||
|
# solving a system of n+2 linear equations, to find the n+1
|
|||
|
# coefficients of the polynomial and also the amount of
|
|||
|
# deviation at the specified coordinates. Each equation is of
|
|||
|
# the form
|
|||
|
#
|
|||
|
# p_0 x^0 + p_1 x^1 + ... + p_n x^n ± e/w(x) = f(x)
|
|||
|
#
|
|||
|
# in which the p_i and e are the variables, and the powers of
|
|||
|
# x and calls to w and f are the coefficients.
|
|||
|
|
|||
|
matrix = array2d(BigFloat, n+2, n+2)
|
|||
|
vector = array1d(BigFloat, n+2)
|
|||
|
currsign = +1
|
|||
|
for i = 1:1:n+2
|
|||
|
x = coords[i]
|
|||
|
for j = 0:1:n
|
|||
|
matrix[i,1+j] = x^j
|
|||
|
end
|
|||
|
y = f(x)
|
|||
|
vector[i] = y
|
|||
|
matrix[i, n+2] = currsign / w(x,y)
|
|||
|
currsign = -currsign
|
|||
|
end
|
|||
|
|
|||
|
@debug("equaldev", "matrix=", repr(matrix))
|
|||
|
@debug("equaldev", "vector=", repr(vector))
|
|||
|
|
|||
|
outvector = matrix \ vector
|
|||
|
|
|||
|
@debug("equaldev", "outvector=", repr(outvector))
|
|||
|
|
|||
|
ncoeffs = outvector[1:n+1]
|
|||
|
dcoeffs = [BigFloat(1)]
|
|||
|
return ncoeffs, dcoeffs
|
|||
|
else
|
|||
|
# For a nontrivial rational function, the system of equations
|
|||
|
# we need to solve becomes nonlinear, because each equation
|
|||
|
# now takes the form
|
|||
|
#
|
|||
|
# p_0 x^0 + p_1 x^1 + ... + p_n x^n
|
|||
|
# --------------------------------- ± e/w(x) = f(x)
|
|||
|
# x^0 + q_1 x^1 + ... + q_d x^d
|
|||
|
#
|
|||
|
# and multiplying up by the denominator gives you a lot of
|
|||
|
# terms containing e × q_i. So we can't do this the really
|
|||
|
# easy way using a matrix equation as above.
|
|||
|
#
|
|||
|
# Fortunately, this is a fairly easy kind of nonlinear system.
|
|||
|
# The equations all become linear if you switch to treating e
|
|||
|
# as a constant, so a reasonably sensible approach is to pick
|
|||
|
# a candidate value of e, solve all but one of the equations
|
|||
|
# for the remaining unknowns, and then see what the error
|
|||
|
# turns out to be in the final equation. The Chebyshev
|
|||
|
# alternation theorem guarantees that that error in the last
|
|||
|
# equation will be anti-monotonic in the input e, so we can
|
|||
|
# just binary-search until we get the two as close to equal as
|
|||
|
# we need them.
|
|||
|
|
|||
|
function try_e(e)
|
|||
|
# Try a given value of e, derive the coefficients of the
|
|||
|
# resulting rational function by setting up equations
|
|||
|
# based on the first n+d+1 of the n+d+2 coordinates, and
|
|||
|
# see what the error turns out to be at the final
|
|||
|
# coordinate.
|
|||
|
matrix = array2d(BigFloat, n+d+1, n+d+1)
|
|||
|
vector = array1d(BigFloat, n+d+1)
|
|||
|
currsign = +1
|
|||
|
for i = 1:1:n+d+1
|
|||
|
x = coords[i]
|
|||
|
y = f(x)
|
|||
|
y_adj = y - currsign * e / w(x,y)
|
|||
|
for j = 0:1:n
|
|||
|
matrix[i,1+j] = x^j
|
|||
|
end
|
|||
|
for j = 1:1:d
|
|||
|
matrix[i,1+n+j] = -x^j * y_adj
|
|||
|
end
|
|||
|
vector[i] = y_adj
|
|||
|
currsign = -currsign
|
|||
|
end
|
|||
|
|
|||
|
@debug("equaldev", "trying e=", e)
|
|||
|
@debug("equaldev", "matrix=", repr(matrix))
|
|||
|
@debug("equaldev", "vector=", repr(vector))
|
|||
|
|
|||
|
outvector = matrix \ vector
|
|||
|
|
|||
|
@debug("equaldev", "outvector=", repr(outvector))
|
|||
|
|
|||
|
ncoeffs = outvector[1:n+1]
|
|||
|
dcoeffs = vcat([BigFloat(1)], outvector[n+2:n+d+1])
|
|||
|
|
|||
|
x = coords[n+d+2]
|
|||
|
y = f(x)
|
|||
|
last_e = (ratfn_eval(ncoeffs, dcoeffs, x) - y) * w(x,y) * -currsign
|
|||
|
|
|||
|
@debug("equaldev", "last e=", last_e)
|
|||
|
|
|||
|
return ncoeffs, dcoeffs, last_e
|
|||
|
end
|
|||
|
|
|||
|
threshold = 2^(-epsbits/2) # convergence threshold
|
|||
|
|
|||
|
# Start by trying our previous iteration's error value. This
|
|||
|
# value (e0) will be one end of our binary-search interval,
|
|||
|
# and whatever it caused the last point's error to be, that
|
|||
|
# (e1) will be the other end.
|
|||
|
e0 = prev_err
|
|||
|
@debug("equaldev", "e0 = ", e0)
|
|||
|
nc, dc, e1 = try_e(e0)
|
|||
|
@debug("equaldev", "e1 = ", e1)
|
|||
|
if abs(e1-e0) <= threshold
|
|||
|
# If we're _really_ lucky, we hit the error right on the
|
|||
|
# nose just by doing that!
|
|||
|
return nc, dc
|
|||
|
end
|
|||
|
s = sign(e1-e0)
|
|||
|
@debug("equaldev", "s = ", s)
|
|||
|
|
|||
|
# Verify by assertion that trying our other interval endpoint
|
|||
|
# e1 gives a value that's wrong in the other direction.
|
|||
|
# (Otherwise our binary search won't get a sensible answer at
|
|||
|
# all.)
|
|||
|
nc, dc, e2 = try_e(e1)
|
|||
|
@debug("equaldev", "e2 = ", e2)
|
|||
|
@assert(sign(e2-e1) == -s)
|
|||
|
|
|||
|
# Now binary-search until our two endpoints narrow enough.
|
|||
|
local emid
|
|||
|
while abs(e1-e0) > threshold
|
|||
|
emid = (e1+e0)/2
|
|||
|
nc, dc, enew = try_e(emid)
|
|||
|
if sign(enew-emid) == s
|
|||
|
e0 = emid
|
|||
|
else
|
|||
|
e1 = emid
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
@debug("equaldev", "final e=", emid)
|
|||
|
return nc, dc
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Top-level function to find a minimax rational-function approximation.
|
|||
|
|
|||
|
# Arguments:
|
|||
|
# f The function to be approximated. Maps BigFloat -> BigFloat.
|
|||
|
# interval A pair of BigFloats giving the endpoints of the interval
|
|||
|
# (in either order) on which to approximate f.
|
|||
|
# n, d The degrees of the numerator and denominator of the desired
|
|||
|
# approximation.
|
|||
|
# w Error-weighting function. Takes two BigFloat arguments x,y
|
|||
|
# and returns a scaling factor for the error at that location.
|
|||
|
# The returned approximation R should have the minimum possible
|
|||
|
# maximum value of abs((f(x)-R(x)) * w(x,f(x))). Optional
|
|||
|
# parameter, defaulting to the always-return-1 function.
|
|||
|
#
|
|||
|
# Return values: a tuple (N,D,E,X), where
|
|||
|
|
|||
|
# N,D A pair of arrays of BigFloats giving the coefficients
|
|||
|
# of the returned rational function. N has size n+1; D
|
|||
|
# has size d+1. Both start with the constant term, i.e.
|
|||
|
# N[i] is the coefficient of x^(i-1) (because Julia
|
|||
|
# arrays are 1-based). D[1] will be 1.
|
|||
|
# E The maximum weighted error (BigFloat).
|
|||
|
# X An array of pairs of BigFloats giving the locations of n+2
|
|||
|
# points and the weighted error at each of those points. The
|
|||
|
# weighted error values will have alternating signs, which
|
|||
|
# means that the Chebyshev alternation theorem guarantees
|
|||
|
# that any other function of the same degree must exceed
|
|||
|
# the error of this one at at least one of those points.
|
|||
|
function ratfn_minimax(f::Function, interval::Tuple{BigFloat,BigFloat}, n, d,
|
|||
|
w = (x,y)->BigFloat(1))
|
|||
|
# We start off by finding a least-squares approximation. This
|
|||
|
# doesn't need to be perfect, but if we can get it reasonably good
|
|||
|
# then it'll save iterations in the refining stage.
|
|||
|
#
|
|||
|
# Least-squares approximations tend to look nicer in a minimax
|
|||
|
# sense if you evaluate the function at a big pile of Chebyshev
|
|||
|
# nodes rather than uniformly spaced points. These values will
|
|||
|
# also make a good grid to use for the initial search for error
|
|||
|
# extrema, so we'll keep them around for that reason too.
|
|||
|
|
|||
|
# Construct the grid.
|
|||
|
lo, hi = minimum(interval), maximum(interval)
|
|||
|
local grid
|
|||
|
let
|
|||
|
mid = (hi+lo)/2
|
|||
|
halfwid = (hi-lo)/2
|
|||
|
nnodes = 16 * (n+d+1)
|
|||
|
pi = 2*asin(BigFloat(1))
|
|||
|
grid = [ mid - halfwid * cos(pi*i/nnodes) for i=0:1:nnodes ]
|
|||
|
end
|
|||
|
|
|||
|
# Find the initial least-squares approximation.
|
|||
|
(nc, dc) = ratfn_leastsquares(f, grid, n, d, w)
|
|||
|
@debug("minimax", "initial leastsquares approx = ",
|
|||
|
ratfn_to_string(nc, dc))
|
|||
|
|
|||
|
# Threshold of convergence. We stop when the relative difference
|
|||
|
# between the min and max (winnowed) error extrema is less than
|
|||
|
# this.
|
|||
|
#
|
|||
|
# This is set to the cube root of machine epsilon on a more or
|
|||
|
# less empirical basis, because the rational-function case will
|
|||
|
# not converge reliably if you set it to only the square root.
|
|||
|
# (Repeatable by using the --test mode.) On the assumption that
|
|||
|
# input and output error in each iteration can be expected to be
|
|||
|
# related by a simple power law (because it'll just be down to how
|
|||
|
# many leading terms of a Taylor series are zero), the cube root
|
|||
|
# was the next thing to try.
|
|||
|
threshold = 2^(-epsbits/3)
|
|||
|
|
|||
|
# Main loop.
|
|||
|
while true
|
|||
|
# Find all the error extrema we can.
|
|||
|
function compute_error(x)
|
|||
|
real_y = f(x)
|
|||
|
approx_y = ratfn_eval(nc, dc, x)
|
|||
|
return (approx_y - real_y) * w(x, real_y)
|
|||
|
end
|
|||
|
extrema = find_extrema(compute_error, grid)
|
|||
|
@debug("minimax", "all extrema = ", format_xylist(extrema))
|
|||
|
|
|||
|
# Winnow the extrema down to the right number, and ensure they
|
|||
|
# have alternating sign.
|
|||
|
extrema = winnow_extrema(extrema, n+d+2)
|
|||
|
@debug("minimax", "winnowed extrema = ", format_xylist(extrema))
|
|||
|
|
|||
|
# See if we've finished.
|
|||
|
min_err = minimum([abs(y) for (x,y) = extrema])
|
|||
|
max_err = maximum([abs(y) for (x,y) = extrema])
|
|||
|
variation = (max_err - min_err) / max_err
|
|||
|
@debug("minimax", "extremum variation = ", variation)
|
|||
|
if variation < threshold
|
|||
|
@debug("minimax", "done!")
|
|||
|
return nc, dc, max_err, extrema
|
|||
|
end
|
|||
|
|
|||
|
# If not, refine our function by equalising the error at the
|
|||
|
# extrema points, and go round again.
|
|||
|
(nc, dc) = ratfn_equal_deviation(f, map(x->x[1], extrema),
|
|||
|
n, d, max_err, w)
|
|||
|
@debug("minimax", "refined approx = ", ratfn_to_string(nc, dc))
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Check if a polynomial is well-conditioned for accurate evaluation in
|
|||
|
# a given interval by Horner's rule.
|
|||
|
#
|
|||
|
# This is true if at every step where Horner's rule computes
|
|||
|
# (coefficient + x*value_so_far), the constant coefficient you're
|
|||
|
# adding on is of larger magnitude than the x*value_so_far operand.
|
|||
|
# And this has to be true for every x in the interval.
|
|||
|
#
|
|||
|
# Arguments:
|
|||
|
# coeffs The coefficients of the polynomial under test. Starts with
|
|||
|
# the constant term, i.e. coeffs[i] is the coefficient of
|
|||
|
# x^(i-1) (because Julia arrays are 1-based).
|
|||
|
# lo, hi The bounds of the interval.
|
|||
|
#
|
|||
|
# Return value: the largest ratio (x*value_so_far / coefficient), at
|
|||
|
# any step of evaluation, for any x in the interval. If this is less
|
|||
|
# than 1, the polynomial is at least somewhat well-conditioned;
|
|||
|
# ideally you want it to be more like 1/8 or 1/16 or so, so that the
|
|||
|
# relative rounding error accumulated at each step are reduced by
|
|||
|
# several factors of 2 when the next coefficient is added on.
|
|||
|
|
|||
|
function wellcond(coeffs, lo, hi)
|
|||
|
x = max(abs(lo), abs(hi))
|
|||
|
worst = 0
|
|||
|
so_far = 0
|
|||
|
for i = length(coeffs):-1:1
|
|||
|
coeff = abs(coeffs[i])
|
|||
|
so_far *= x
|
|||
|
if coeff != 0
|
|||
|
thisval = so_far / coeff
|
|||
|
worst = max(worst, thisval)
|
|||
|
so_far += coeff
|
|||
|
end
|
|||
|
end
|
|||
|
return worst
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Small set of unit tests.
|
|||
|
|
|||
|
function test()
|
|||
|
passes = 0
|
|||
|
fails = 0
|
|||
|
|
|||
|
function approx_eq(x, y, limit=1e-6)
|
|||
|
return abs(x - y) < limit
|
|||
|
end
|
|||
|
|
|||
|
function test(condition)
|
|||
|
if condition
|
|||
|
passes += 1
|
|||
|
else
|
|||
|
println("fail")
|
|||
|
fails += 1
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
# Test Gaussian elimination.
|
|||
|
println("Gaussian test 1:")
|
|||
|
m = BigFloat[1 1 2; 3 5 8; 13 34 21]
|
|||
|
v = BigFloat[1, -1, 2]
|
|||
|
ret = m \ v
|
|||
|
println(" ",repr(ret))
|
|||
|
test(approx_eq(ret[1], 109/26))
|
|||
|
test(approx_eq(ret[2], -105/130))
|
|||
|
test(approx_eq(ret[3], -31/26))
|
|||
|
|
|||
|
# Test leastsquares rational functions.
|
|||
|
println("Leastsquares test 1:")
|
|||
|
n = 10000
|
|||
|
a = array1d(BigFloat, n+1)
|
|||
|
for i = 0:1:n
|
|||
|
a[1+i] = i/BigFloat(n)
|
|||
|
end
|
|||
|
(nc, dc) = ratfn_leastsquares(x->exp(x), a, 2, 2)
|
|||
|
println(" ",ratfn_to_string(nc, dc))
|
|||
|
for x = a
|
|||
|
test(approx_eq(exp(x), ratfn_eval(nc, dc, x), 1e-4))
|
|||
|
end
|
|||
|
|
|||
|
# Test golden section search.
|
|||
|
println("Golden section test 1:")
|
|||
|
x, y = goldensection(x->sin(x),
|
|||
|
BigFloat(0), BigFloat(1)/10, BigFloat(4))
|
|||
|
println(" ", x, " -> ", y)
|
|||
|
test(approx_eq(x, asin(BigFloat(1))))
|
|||
|
test(approx_eq(y, 1))
|
|||
|
|
|||
|
# Test extrema-winnowing algorithm.
|
|||
|
println("Winnow test 1:")
|
|||
|
extrema = [(x, sin(20*x)*sin(197*x))
|
|||
|
for x in BigFloat(0):BigFloat(1)/1000:BigFloat(1)]
|
|||
|
winnowed = winnow_extrema(extrema, 12)
|
|||
|
println(" ret = ", format_xylist(winnowed))
|
|||
|
prevx, prevy = -1, 0
|
|||
|
for (x,y) = winnowed
|
|||
|
test(x > prevx)
|
|||
|
test(y != 0)
|
|||
|
test(prevy * y <= 0) # tolerates initial prevx having no sign
|
|||
|
test(abs(y) > 0.9)
|
|||
|
prevx, prevy = x, y
|
|||
|
end
|
|||
|
|
|||
|
# Test actual minimax approximation.
|
|||
|
println("Minimax test 1 (polynomial):")
|
|||
|
(nc, dc, e, x) = ratfn_minimax(x->exp(x), (BigFloat(0), BigFloat(1)), 4, 0)
|
|||
|
println(" ",e)
|
|||
|
println(" ",ratfn_to_string(nc, dc))
|
|||
|
test(0 < e < 1e-3)
|
|||
|
for x = 0:BigFloat(1)/1000:1
|
|||
|
test(abs(ratfn_eval(nc, dc, x) - exp(x)) <= e * 1.0000001)
|
|||
|
end
|
|||
|
|
|||
|
println("Minimax test 2 (rational):")
|
|||
|
(nc, dc, e, x) = ratfn_minimax(x->exp(x), (BigFloat(0), BigFloat(1)), 2, 2)
|
|||
|
println(" ",e)
|
|||
|
println(" ",ratfn_to_string(nc, dc))
|
|||
|
test(0 < e < 1e-3)
|
|||
|
for x = 0:BigFloat(1)/1000:1
|
|||
|
test(abs(ratfn_eval(nc, dc, x) - exp(x)) <= e * 1.0000001)
|
|||
|
end
|
|||
|
|
|||
|
println("Minimax test 3 (polynomial, weighted):")
|
|||
|
(nc, dc, e, x) = ratfn_minimax(x->exp(x), (BigFloat(0), BigFloat(1)), 4, 0,
|
|||
|
(x,y)->1/y)
|
|||
|
println(" ",e)
|
|||
|
println(" ",ratfn_to_string(nc, dc))
|
|||
|
test(0 < e < 1e-3)
|
|||
|
for x = 0:BigFloat(1)/1000:1
|
|||
|
test(abs(ratfn_eval(nc, dc, x) - exp(x))/exp(x) <= e * 1.0000001)
|
|||
|
end
|
|||
|
|
|||
|
println("Minimax test 4 (rational, weighted):")
|
|||
|
(nc, dc, e, x) = ratfn_minimax(x->exp(x), (BigFloat(0), BigFloat(1)), 2, 2,
|
|||
|
(x,y)->1/y)
|
|||
|
println(" ",e)
|
|||
|
println(" ",ratfn_to_string(nc, dc))
|
|||
|
test(0 < e < 1e-3)
|
|||
|
for x = 0:BigFloat(1)/1000:1
|
|||
|
test(abs(ratfn_eval(nc, dc, x) - exp(x))/exp(x) <= e * 1.0000001)
|
|||
|
end
|
|||
|
|
|||
|
println("Minimax test 5 (rational, weighted, odd degree):")
|
|||
|
(nc, dc, e, x) = ratfn_minimax(x->exp(x), (BigFloat(0), BigFloat(1)), 2, 1,
|
|||
|
(x,y)->1/y)
|
|||
|
println(" ",e)
|
|||
|
println(" ",ratfn_to_string(nc, dc))
|
|||
|
test(0 < e < 1e-3)
|
|||
|
for x = 0:BigFloat(1)/1000:1
|
|||
|
test(abs(ratfn_eval(nc, dc, x) - exp(x))/exp(x) <= e * 1.0000001)
|
|||
|
end
|
|||
|
|
|||
|
total = passes + fails
|
|||
|
println(passes, " passes ", fails, " fails ", total, " total")
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Online help.
|
|||
|
function help()
|
|||
|
print("""
|
|||
|
Usage:
|
|||
|
|
|||
|
remez.jl [options] <lo> <hi> <n> <d> <expr> [<weight>]
|
|||
|
|
|||
|
Arguments:
|
|||
|
|
|||
|
<lo>, <hi>
|
|||
|
|
|||
|
Bounds of the interval on which to approximate the target
|
|||
|
function. These are parsed and evaluated as Julia expressions,
|
|||
|
so you can write things like '1/BigFloat(6)' to get an
|
|||
|
accurate representation of 1/6, or '4*atan(BigFloat(1))' to
|
|||
|
get pi. (Unfortunately, the obvious 'BigFloat(pi)' doesn't
|
|||
|
work in Julia.)
|
|||
|
|
|||
|
<n>, <d>
|
|||
|
|
|||
|
The desired degree of polynomial(s) you want for your
|
|||
|
approximation. These should be non-negative integers. If you
|
|||
|
want a rational function as output, set <n> to the degree of
|
|||
|
the numerator, and <d> the denominator. If you just want an
|
|||
|
ordinary polynomial, set <d> to 0, and <n> to the degree of
|
|||
|
the polynomial you want.
|
|||
|
|
|||
|
<expr>
|
|||
|
|
|||
|
A Julia expression giving the function to be approximated on
|
|||
|
the interval. The input value is predefined as 'x' when this
|
|||
|
expression is evaluated, so you should write something along
|
|||
|
the lines of 'sin(x)' or 'sqrt(1+tan(x)^2)' etc.
|
|||
|
|
|||
|
<weight>
|
|||
|
|
|||
|
If provided, a Julia expression giving the weighting factor
|
|||
|
for the approximation error. The output polynomial will
|
|||
|
minimise the largest absolute value of (P-f) * w at any point
|
|||
|
in the interval, where P is the value of the polynomial, f is
|
|||
|
the value of the target function given by <expr>, and w is the
|
|||
|
weight given by this function.
|
|||
|
|
|||
|
When this expression is evaluated, the input value to P and f
|
|||
|
is predefined as 'x', and also the true output value f(x) is
|
|||
|
predefined as 'y'. So you can minimise the relative error by
|
|||
|
simply writing '1/y'.
|
|||
|
|
|||
|
If the <weight> argument is not provided, the default
|
|||
|
weighting function always returns 1, so that the polynomial
|
|||
|
will minimise the maximum absolute error |P-f|.
|
|||
|
|
|||
|
Computation options:
|
|||
|
|
|||
|
--pre=<predef_expr>
|
|||
|
|
|||
|
Evaluate the Julia expression <predef_expr> before starting
|
|||
|
the computation. This permits you to pre-define variables or
|
|||
|
functions which the Julia expressions in your main arguments
|
|||
|
can refer to. All of <lo>, <hi>, <expr> and <weight> can make
|
|||
|
use of things defined by <predef_expr>.
|
|||
|
|
|||
|
One internal remez.jl function that you might sometimes find
|
|||
|
useful in this expression is 'goldensection', which finds the
|
|||
|
location and value of a maximum of a function. For example,
|
|||
|
one implementation strategy for the gamma function involves
|
|||
|
translating it to put its unique local minimum at the origin,
|
|||
|
in which case you can write something like this
|
|||
|
|
|||
|
--pre='(m,my) = goldensection(x -> -gamma(x),
|
|||
|
BigFloat(1), BigFloat(1.5), BigFloat(2))'
|
|||
|
|
|||
|
to predefine 'm' as the location of gamma's minimum, and 'my'
|
|||
|
as the (negated) value that gamma actually takes at that
|
|||
|
point, i.e. -gamma(m).
|
|||
|
|
|||
|
(Since 'goldensection' always finds a maximum, we had to
|
|||
|
negate gamma in the input function to make it find a minimum
|
|||
|
instead. Consult the comments in the source for more details
|
|||
|
on the use of this function.)
|
|||
|
|
|||
|
If you use this option more than once, all the expressions you
|
|||
|
provide will be run in sequence.
|
|||
|
|
|||
|
--bits=<bits>
|
|||
|
|
|||
|
Specify the accuracy to which you want the output polynomial,
|
|||
|
in bits. Default 256, which should be more than enough.
|
|||
|
|
|||
|
--bigfloatbits=<bits>
|
|||
|
|
|||
|
Turn up the precision used by Julia for its BigFloat
|
|||
|
evaluation. Default is Julia's default (also 256). You might
|
|||
|
want to try setting this higher than the --bits value if the
|
|||
|
algorithm is failing to converge for some reason.
|
|||
|
|
|||
|
Output options:
|
|||
|
|
|||
|
--full
|
|||
|
|
|||
|
Instead of just printing the approximation function itself,
|
|||
|
also print auxiliary information:
|
|||
|
- the locations of the error extrema, and the actual
|
|||
|
(weighted) error at each of those locations
|
|||
|
- the overall maximum error of the function
|
|||
|
- a 'well-conditioning quotient', giving the worst-case ratio
|
|||
|
between any polynomial coefficient and the largest possible
|
|||
|
value of the higher-order terms it will be added to.
|
|||
|
|
|||
|
The well-conditioning quotient should be less than 1, ideally
|
|||
|
by several factors of two, for accurate evaluation in the
|
|||
|
target precision. If you request a rational function, a
|
|||
|
separate well-conditioning quotient will be printed for the
|
|||
|
numerator and denominator.
|
|||
|
|
|||
|
Use this option when deciding how wide an interval to
|
|||
|
approximate your function on, and what degree of polynomial
|
|||
|
you need.
|
|||
|
|
|||
|
--variable=<identifier>
|
|||
|
|
|||
|
When writing the output polynomial or rational function in its
|
|||
|
usual form as an arithmetic expression, use <identifier> as
|
|||
|
the name of the input variable. Default is 'x'.
|
|||
|
|
|||
|
--suffix=<suffix>
|
|||
|
|
|||
|
When writing the output polynomial or rational function in its
|
|||
|
usual form as an arithmetic expression, write <suffix> after
|
|||
|
every floating-point literal. For example, '--suffix=F' will
|
|||
|
generate a C expression in which the coefficients are literals
|
|||
|
of type 'float' rather than 'double'.
|
|||
|
|
|||
|
--array
|
|||
|
|
|||
|
Instead of writing the output polynomial as an arithmetic
|
|||
|
expression in Horner's rule form, write out just its
|
|||
|
coefficients, one per line, each with a trailing comma.
|
|||
|
Suitable for pasting into a C array declaration.
|
|||
|
|
|||
|
This option is not currently supported if the output is a
|
|||
|
rational function, because you'd need two separate arrays for
|
|||
|
the numerator and denominator coefficients and there's no
|
|||
|
obviously right way to provide both of those together.
|
|||
|
|
|||
|
Debug and test options:
|
|||
|
|
|||
|
--debug=<facility>
|
|||
|
|
|||
|
Enable debugging output from various parts of the Remez
|
|||
|
calculation. <facility> should be the name of one of the
|
|||
|
classes of diagnostic output implemented in the program.
|
|||
|
Useful values include 'gausselim', 'leastsquares',
|
|||
|
'goldensection', 'equaldev', 'minimax'. This is probably
|
|||
|
mostly useful to people debugging problems with the script, so
|
|||
|
consult the source code for more information about what the
|
|||
|
diagnostic output for each of those facilities will be.
|
|||
|
|
|||
|
If you want diagnostics from more than one facility, specify
|
|||
|
this option multiple times with different arguments.
|
|||
|
|
|||
|
--test
|
|||
|
|
|||
|
Run remez.jl's internal test suite. No arguments needed.
|
|||
|
|
|||
|
Miscellaneous options:
|
|||
|
|
|||
|
--help
|
|||
|
|
|||
|
Display this text and exit. No arguments needed.
|
|||
|
|
|||
|
""")
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Main program.
|
|||
|
|
|||
|
function main()
|
|||
|
nargs = length(argwords)
|
|||
|
if nargs != 5 && nargs != 6
|
|||
|
error("usage: remez.jl <lo> <hi> <n> <d> <expr> [<weight>]\n" *
|
|||
|
" run 'remez.jl --help' for more help")
|
|||
|
end
|
|||
|
|
|||
|
for preliminary_command in preliminary_commands
|
|||
|
eval(Meta.parse(preliminary_command))
|
|||
|
end
|
|||
|
|
|||
|
lo = BigFloat(eval(Meta.parse(argwords[1])))
|
|||
|
hi = BigFloat(eval(Meta.parse(argwords[2])))
|
|||
|
n = parse(Int,argwords[3])
|
|||
|
d = parse(Int,argwords[4])
|
|||
|
f = eval(Meta.parse("x -> " * argwords[5]))
|
|||
|
|
|||
|
# Wrap the user-provided function with a function of our own. This
|
|||
|
# arranges to detect silly FP values (inf,nan) early and diagnose
|
|||
|
# them sensibly, and also lets us log all evaluations of the
|
|||
|
# function in case you suspect it's doing the wrong thing at some
|
|||
|
# special-case point.
|
|||
|
function func(x)
|
|||
|
y = run(f,x)
|
|||
|
@debug("f", x, " -> ", y)
|
|||
|
if !isfinite(y)
|
|||
|
error("f(" * string(x) * ") returned non-finite value " * string(y))
|
|||
|
end
|
|||
|
return y
|
|||
|
end
|
|||
|
|
|||
|
if nargs == 6
|
|||
|
# Wrap the user-provided weight function similarly.
|
|||
|
w = eval(Meta.parse("(x,y) -> " * argwords[6]))
|
|||
|
function wrapped_weight(x,y)
|
|||
|
ww = run(w,x,y)
|
|||
|
if !isfinite(ww)
|
|||
|
error("w(" * string(x) * "," * string(y) *
|
|||
|
") returned non-finite value " * string(ww))
|
|||
|
end
|
|||
|
return ww
|
|||
|
end
|
|||
|
weight = wrapped_weight
|
|||
|
else
|
|||
|
weight = (x,y)->BigFloat(1)
|
|||
|
end
|
|||
|
|
|||
|
(nc, dc, e, extrema) = ratfn_minimax(func, (lo, hi), n, d, weight)
|
|||
|
if array_format
|
|||
|
if d == 0
|
|||
|
functext = join([string(x)*",\n" for x=nc],"")
|
|||
|
else
|
|||
|
# It's unclear how you should best format an array of
|
|||
|
# coefficients for a rational function, so I'll leave
|
|||
|
# implementing this option until I have a use case.
|
|||
|
error("--array unsupported for rational functions")
|
|||
|
end
|
|||
|
else
|
|||
|
functext = ratfn_to_string(nc, dc) * "\n"
|
|||
|
end
|
|||
|
if full_output
|
|||
|
# Print everything you might want to know about the function
|
|||
|
println("extrema = ", format_xylist(extrema))
|
|||
|
println("maxerror = ", string(e))
|
|||
|
if length(dc) > 1
|
|||
|
println("wellconditioning_numerator = ",
|
|||
|
string(wellcond(nc, lo, hi)))
|
|||
|
println("wellconditioning_denominator = ",
|
|||
|
string(wellcond(dc, lo, hi)))
|
|||
|
else
|
|||
|
println("wellconditioning = ", string(wellcond(nc, lo, hi)))
|
|||
|
end
|
|||
|
print("function = ", functext)
|
|||
|
else
|
|||
|
# Just print the text people will want to paste into their code
|
|||
|
print(functext)
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
# ----------------------------------------------------------------------
|
|||
|
# Top-level code: parse the argument list and decide what to do.
|
|||
|
|
|||
|
what_to_do = main
|
|||
|
|
|||
|
doing_opts = true
|
|||
|
argwords = array1d(String, 0)
|
|||
|
for arg = ARGS
|
|||
|
global doing_opts, what_to_do, argwords
|
|||
|
global full_output, array_format, xvarname, floatsuffix, epsbits
|
|||
|
if doing_opts && startswith(arg, "-")
|
|||
|
if arg == "--"
|
|||
|
doing_opts = false
|
|||
|
elseif arg == "--help"
|
|||
|
what_to_do = help
|
|||
|
elseif arg == "--test"
|
|||
|
what_to_do = test
|
|||
|
elseif arg == "--full"
|
|||
|
full_output = true
|
|||
|
elseif arg == "--array"
|
|||
|
array_format = true
|
|||
|
elseif startswith(arg, "--debug=")
|
|||
|
enable_debug(arg[length("--debug=")+1:end])
|
|||
|
elseif startswith(arg, "--variable=")
|
|||
|
xvarname = arg[length("--variable=")+1:end]
|
|||
|
elseif startswith(arg, "--suffix=")
|
|||
|
floatsuffix = arg[length("--suffix=")+1:end]
|
|||
|
elseif startswith(arg, "--bits=")
|
|||
|
epsbits = parse(Int,arg[length("--bits=")+1:end])
|
|||
|
elseif startswith(arg, "--bigfloatbits=")
|
|||
|
set_bigfloat_precision(
|
|||
|
parse(Int,arg[length("--bigfloatbits=")+1:end]))
|
|||
|
elseif startswith(arg, "--pre=")
|
|||
|
push!(preliminary_commands, arg[length("--pre=")+1:end])
|
|||
|
else
|
|||
|
error("unrecognised option: ", arg)
|
|||
|
end
|
|||
|
else
|
|||
|
push!(argwords, arg)
|
|||
|
end
|
|||
|
end
|
|||
|
|
|||
|
what_to_do()
|