move learners to separate files

Bas Nijholt authored on 30/10/2017 16:48:13
Showing 10 changed files
1 1
deleted file mode 100644
... ...
@@ -1,775 +0,0 @@
1
-# -*- coding: utf-8 -*-
2
-import abc
3
-import collections
4
-from contextlib import contextmanager
5
-from copy import deepcopy as copy
6
-import functools
7
-import heapq
8
-import itertools
9
-from math import sqrt, hypot
10
-from operator import itemgetter
11
-
12
-import holoviews as hv
13
-import numpy as np
14
-from scipy import interpolate, optimize, special
15
-import sortedcontainers
16
-
17
-
18
-class BaseLearner(metaclass=abc.ABCMeta):
19
-    """Base class for algorithms for learning a function 'f: X → Y'.
20
-
21
-    Attributes
22
-    ----------
23
-    function : callable: X → Y
24
-        The function to learn.
25
-    data : dict: X → Y
26
-        'function' evaluated at certain points.
27
-        The values can be 'None', which indicates that the point
28
-        will be evaluated, but that we do not have the result yet.
29
-
30
-    Subclasses may define a 'plot' method that takes no parameters
31
-    and returns a holoviews plot.
32
-    """
33
-
34
-    def add_data(self, xvalues, yvalues):
35
-        """Add data to the learner.
36
-
37
-        Parameters
38
-        ----------
39
-        xvalues : value from the function domain, or iterable of such
40
-            Values from the domain of the learned function.
41
-        yvalues : value from the function image, or iterable of such
42
-            Values from the range of the learned function, or None.
43
-            If 'None', then it indicates that the value has not yet
44
-            been computed.
45
-        """
46
-        if all(isinstance(i, collections.abc.Iterable) for i in [xvalues, yvalues]):
47
-            for x, y in zip(xvalues, yvalues):
48
-                self.add_point(x, y)
49
-        else:
50
-            self.add_point(xvalues, yvalues)
51
-
52
-    @abc.abstractmethod
53
-    def add_point(self, x, y):
54
-        """Add a single datapoint to the learner."""
55
-        pass
56
-
57
-    @abc.abstractmethod
58
-    def remove_unfinished(self):
59
-        """Remove uncomputed data from the learner."""
60
-        pass
61
-
62
-    @abc.abstractmethod
63
-    def loss(self, real=True):
64
-        """Return the loss for the current state of the learner.
65
-
66
-        Parameters
67
-        ----------
68
-        real : bool, default: True
69
-            If False, return the "expected" loss, i.e. the
70
-            loss including the as-yet unevaluated points
71
-            (possibly by interpolation).
72
-        """
73
-
74
-    @abc.abstractmethod
75
-    def choose_points(self, n, add_data=True):
76
-        """Choose the next 'n' points to evaluate.
77
-
78
-        Parameters
79
-        ----------
80
-        n : int
81
-            The number of points to choose.
82
-        add_data : bool, default: True
83
-            If True, add the chosen points to this
84
-            learner's 'data' with 'None' for the 'y'
85
-            values. Set this to False if you do not
86
-            want to modify the state of the learner.
87
-        """
88
-        pass
89
-
90
-    def __getstate__(self):
91
-        return copy(self.__dict__)
92
-
93
-    def __setstate__(self, state):
94
-        self.__dict__ = state
95
-
96
-
97
-class AverageLearner(BaseLearner):
98
-    """A naive implementation of adaptive computing of averages.
99
-
100
-    The learned function must depend on an integer input variable that
101
-    represents the source of randomness.
102
-
103
-    Parameters
104
-    ----------
105
-    atol : float
106
-        Desired absolute tolerance
107
-    rtol : float
108
-        Desired relative tolerance
109
-    """
110
-
111
-    def __init__(self, function, atol=None, rtol=None):
112
-        if atol is None and rtol is None:
113
-            raise ValueError('At least one of `atol` and `rtol` should be set.')
114
-        if atol is None:
115
-            atol = np.inf
116
-        if rtol is None:
117
-            rtol = np.inf
118
-
119
-        self.data = {}
120
-        self.function = function
121
-        self.atol = atol
122
-        self.rtol = rtol
123
-        self.n = 0
124
-        self.n_requested = 0
125
-        self.sum_f = 0
126
-        self.sum_f_sq = 0
127
-
128
-    def choose_points(self, n, add_data=True):
129
-        points = list(range(self.n_requested, self.n_requested + n))
130
-        loss_improvements = [self.loss()] * n
131
-        if add_data:
132
-            self.add_data(points, itertools.repeat(None))
133
-        return points, loss_improvements
134
-
135
-    def add_point(self, n, value):
136
-        self.data[n] = value
137
-        if value is None:
138
-            self.n_requested += 1
139
-            return
140
-        else:
141
-            self.n += 1
142
-            self.sum_f += value
143
-            self.sum_f_sq += value**2
144
-
145
-    @property
146
-    def mean(self):
147
-        return self.sum_f / self.n
148
-
149
-    @property
150
-    def std(self):
151
-        n = self.n
152
-        if n < 2:
153
-            return np.inf
154
-        return sqrt((self.sum_f_sq - n * self.mean**2) / (n - 1))
155
-
156
-    def loss(self, real=True):
157
-        n = self.n
158
-        if n < 2:
159
-            return np.inf
160
-        standard_error = self.std / sqrt(n if real else self.n_requested)
161
-        return max(standard_error / self.atol,
162
-                   standard_error / abs(self.mean) / self.rtol)
163
-
164
-    def remove_unfinished(self):
165
-        """Remove uncomputed data from the learner."""
166
-        pass
167
-
168
-    def plot(self):
169
-        vals = [v for v in self.data.values() if v is not None]
170
-        if not vals:
171
-            return hv.Histogram([[], []])
172
-        num_bins = int(max(5, sqrt(self.n)))
173
-        vals = hv.Points(vals)
174
-        return hv.operation.histogram(vals, num_bins=num_bins, dimension=1)
175
-
176
-
177
-class Learner1D(BaseLearner):
178
-    """Learns and predicts a function 'f:ℝ → ℝ'.
179
-
180
-    Parameters
181
-    ----------
182
-    function : callable
183
-        The function to learn. Must take a single real parameter and
184
-        return a real number.
185
-    bounds : pair of reals
186
-        The bounds of the interval on which to learn 'function'.
187
-    """
188
-
189
-    def __init__(self, function, bounds):
190
-        self.function = function
191
-
192
-        # A dict {(x_left, x_right): loss} storing the loss per interval.
193
-        self.losses = {}
194
-        self.losses_combined = {}
195
-
196
-        self.data = sortedcontainers.SortedDict()
197
-        self.data_interp = {}
198
-
199
-        # A dict {x_n: [x_{n-1}, x_{n+1}]} for quick checking of local
200
-        # properties.
201
-        self.neighbors = sortedcontainers.SortedDict()
202
-        self.neighbors_combined = sortedcontainers.SortedDict()
203
-
204
-        # Bounding box [[minx, maxx], [miny, maxy]].
205
-        self._bbox = [list(bounds), [np.inf, -np.inf]]
206
-
207
-        # Data scale (maxx - minx), (maxy - miny)
208
-        self._scale = [bounds[1] - bounds[0], 0]
209
-        self._oldscale = copy(self._scale)
210
-
211
-        self.bounds = list(bounds)
212
-
213
-    @property
214
-    def data_combined(self):
215
-        return {**self.data, **self.data_interp}
216
-
217
-    def interval_loss(self, x_left, x_right, data):
218
-        """Calculate loss in the interval x_left, x_right.
219
-
220
-        Currently returns the rescaled length of the interval. If one of the
221
-        y-values is missing, returns 0 (so the intervals with missing data are
222
-        never touched). This behavior should be improved later.
223
-        """
224
-        y_right, y_left = data[x_right], data[x_left]
225
-        if self._scale[1] == 0:
226
-            return sqrt(((x_right - x_left) / self._scale[0])**2)
227
-        else:
228
-            return sqrt(((x_right - x_left) / self._scale[0])**2 +
229
-                        ((y_right - y_left) / self._scale[1])**2)
230
-
231
-    def loss(self, real=True):
232
-        losses = self.losses if real else self.losses_combined
233
-        if len(losses) == 0:
234
-            return float('inf')
235
-        else:
236
-            return max(losses.values())
237
-
238
-    def update_losses(self, x, data, neighbors, losses):
239
-        x_lower, x_upper = neighbors[x]
240
-        if x_lower is not None:
241
-            losses[x_lower, x] = self.interval_loss(x_lower, x, data)
242
-        if x_upper is not None:
243
-            losses[x, x_upper] = self.interval_loss(x, x_upper, data)
244
-        try:
245
-            del losses[x_lower, x_upper]
246
-        except KeyError:
247
-            pass
248
-
249
-    def find_neighbors(self, x, neighbors):
250
-        pos = neighbors.bisect_left(x)
251
-        x_lower = neighbors.iloc[pos-1] if pos != 0 else None
252
-        x_upper = neighbors.iloc[pos] if pos != len(neighbors) else None
253
-        return x_lower, x_upper
254
-
255
-    def update_neighbors(self, x, neighbors):
256
-        if x not in neighbors:  # The point is new
257
-            x_lower, x_upper = self.find_neighbors(x, neighbors)
258
-            neighbors[x] = [x_lower, x_upper]
259
-            neighbors.get(x_lower, [None, None])[1] = x
260
-            neighbors.get(x_upper, [None, None])[0] = x
261
-
262
-    def update_scale(self, x, y):
263
-        self._bbox[0][0] = min(self._bbox[0][0], x)
264
-        self._bbox[0][1] = max(self._bbox[0][1], x)
265
-        if y is not None:
266
-            self._bbox[1][0] = min(self._bbox[1][0], y)
267
-            self._bbox[1][1] = max(self._bbox[1][1], y)
268
-
269
-        self._scale = [self._bbox[0][1] - self._bbox[0][0],
270
-                       self._bbox[1][1] - self._bbox[1][0]]
271
-
272
-    def add_point(self, x, y):
273
-        real = y is not None
274
-
275
-        if real:
276
-            # Add point to the real data dict and pop from the unfinished
277
-            # data_interp dict.
278
-            self.data[x] = y
279
-            try:
280
-                del self.data_interp[x]
281
-            except KeyError:
282
-                pass
283
-        else:
284
-            # The keys of data_interp are the unknown points
285
-            self.data_interp[x] = None
286
-
287
-        # Update the neighbors
288
-        self.update_neighbors(x, self.neighbors_combined)
289
-        if real:
290
-            self.update_neighbors(x, self.neighbors)
291
-
292
-        # Update the scale
293
-        self.update_scale(x, y)
294
-
295
-        # Interpolate
296
-        if not real:
297
-            self.data_interp = self.interpolate()
298
-
299
-        # Update the losses
300
-        self.update_losses(x, self.data_combined, self.neighbors_combined,
301
-                           self.losses_combined)
302
-        if real:
303
-            self.update_losses(x, self.data, self.neighbors, self.losses)
304
-
305
-        # If the scale has doubled, recompute all losses.
306
-        if any(s > 2 * s_old for s, s_old in zip(self._scale, self._oldscale)):
307
-            self.losses = {xs: self.interval_loss(*xs, self.data)
308
-                           for xs in self.losses}
309
-            self.losses_combined = {x: self.interval_loss(*x,
310
-                                                          self.data_combined)
311
-                                    for x in self.losses_combined}
312
-            self._oldscale = self._scale
313
-
314
-    def choose_points(self, n, add_data=True):
315
-        """Return n points that are expected to maximally reduce the loss."""
316
-        # Find out how to divide the n points over the intervals
317
-        # by finding positive integers n_i that minimize max(L_i / n_i) subject
318
-        # to a constraint that sum(n_i) = n + N, with N the total number of
319
-        # intervals.
320
-
321
-        # Return equally spaced points within each interval to which points
322
-        # will be added.
323
-        if n == 0:
324
-            return [], []
325
-
326
-        # If the bounds have not been chosen yet, we choose them first.
327
-        points = []
328
-        for bound in self.bounds:
329
-            if bound not in self.data and bound not in self.data_interp:
330
-                points.append(bound)
331
-
332
-        # Ensure we return exactly 'n' points.
333
-        if points:
334
-            loss_improvements = [float('inf')] * n
335
-            if n <= 2:
336
-                points = points[:n]
337
-            else:
338
-                points = np.linspace(*self.bounds, n)
339
-        else:
340
-            def xs(x, n):
341
-                if n == 1:
342
-                    return []
343
-                else:
344
-                    step = (x[1] - x[0]) / n
345
-                    return [x[0] + step * i for i in range(1, n)]
346
-
347
-            # Calculate how many points belong to each interval.
348
-            quals = [(-loss, x_range, 1) for (x_range, loss) in
349
-                     self.losses_combined.items()]
350
-
351
-            heapq.heapify(quals)
352
-
353
-            for point_number in range(n):
354
-                quality, x, n = quals[0]
355
-                heapq.heapreplace(quals, (quality * n / (n + 1), x, n + 1))
356
-
357
-            points = list(itertools.chain.from_iterable(xs(x, n)
358
-                          for quality, x, n in quals))
359
-
360
-            loss_improvements = list(itertools.chain.from_iterable(
361
-                                     itertools.repeat(-quality, n)
362
-                                     for quality, x, n in quals))
363
-
364
-        if add_data:
365
-            self.add_data(points, itertools.repeat(None))
366
-
367
-        return points, loss_improvements
368
-
369
-    def interpolate(self, extra_points=None):
370
-        xs = list(self.data.keys())
371
-        ys = list(self.data.values())
372
-        xs_unfinished = list(self.data_interp.keys())
373
-
374
-        if extra_points is not None:
375
-            xs_unfinished += extra_points
376
-
377
-        if len(ys) == 0:
378
-            interp_ys = (0,) * len(xs_unfinished)
379
-        else:
380
-            interp_ys = np.interp(xs_unfinished, xs, ys)
381
-
382
-        data_interp = {x: y for x, y in zip(xs_unfinished, interp_ys)}
383
-
384
-        return data_interp
385
-
386
-    def plot(self):
387
-        if self.data:
388
-            return hv.Scatter(self.data)
389
-        else:
390
-            return hv.Scatter([])
391
-
392
-    def remove_unfinished(self):
393
-        self.data_interp = {}
394
-        self.losses_combined = copy(self.losses)
395
-        self.neighbors_combined = copy(self.neighbors)
396
-
397
-
398
-def dispatch(child_functions, arg):
399
-    index, x = arg
400
-    return child_functions[index](x)
401
-
402
-
403
-class BalancingLearner(BaseLearner):
404
-    """Choose the optimal points from a set of learners.
405
-
406
-    Parameters
407
-    ----------
408
-    learners : sequence of BaseLearner
409
-        The learners from which to choose. These must all have the same type.
410
-
411
-    Notes
412
-    -----
413
-    This learner compares the 'loss' calculated from the "child" learners.
414
-    This requires that the 'loss' from different learners *can be meaningfully
415
-    compared*. For the moment we enforce this restriction by requiring that
416
-    all learners are the same type but (depending on the internals of the
417
-    learner) it may be that the loss cannot be compared *even between learners
418
-    of the same type*. In this case the BalancingLearner will behave in an
419
-    undefined way.
420
-    """
421
-
422
-    def __init__(self, learners):
423
-        self.learners = learners
424
-
425
-        # Naively we would make 'function' a method, but this causes problems
426
-        # when using executors from 'concurrent.futures' because we have to
427
-        # pickle the whole learner.
428
-        self.function = functools.partial(dispatch, [l.function for l
429
-                                                     in self.learners])
430
-
431
-        if len(set(learner.__class__ for learner in self.learners)) > 1:
432
-            raise TypeError('A BalancingLearner can handle only one type '
433
-                            'of learners.')
434
-
435
-    def _choose_and_add_points(self, n):
436
-        points = []
437
-        for _ in range(n):
438
-            loss_improvements = []
439
-            pairs = []
440
-            for index, learner in enumerate(self.learners):
441
-                point, loss_improvement = learner.choose_points(n=1,
442
-                                                                add_data=False)
443
-                loss_improvements.append(loss_improvement[0])
444
-                pairs.append((index, point[0]))
445
-            x, _ = max(zip(pairs, loss_improvements), key=itemgetter(1))
446
-            points.append(x)
447
-            self.add_point(x, None)
448
-        return points, None
449
-
450
-    def choose_points(self, n, add_data=True):
451
-        """Choose points for learners."""
452
-        if not add_data:
453
-            with restore(*self.learners):
454
-                return self._choose_and_add_points(n)
455
-        else:
456
-            return self._choose_and_add_points(n)
457
-
458
-    def add_point(self, x, y):
459
-        index, x = x
460
-        self.learners[index].add_point(x, y)
461
-
462
-    def loss(self, real=True):
463
-        return max(learner.loss(real) for learner in self.learners)
464
-
465
-    def plot(self, index):
466
-        return self.learners[index].plot()
467
-
468
-    def remove_unfinished(self):
469
-        """Remove uncomputed data from the learners."""
470
-        for learner in self.learners:
471
-            learner.remove_unfinished()
472
-
473
-
474
-# Learner2D and helper functions.
475
-
476
-def _losses_per_triangle(ip):
477
-    tri = ip.tri
478
-    vs = ip.values.ravel()
479
-
480
-    gradients = interpolate.interpnd.estimate_gradients_2d_global(
481
-        tri, vs, tol=1e-6)
482
-    p = tri.points[tri.vertices]
483
-    g = gradients[tri.vertices]
484
-    v = vs[tri.vertices]
485
-    n_points_per_triangle = p.shape[1]
486
-
487
-    dev = 0
488
-    for j in range(n_points_per_triangle):
489
-        vest = v[:, j, None] + ((p[:, :, :] - p[:, j, None, :]) *
490
-                                g[:, j, None, :]).sum(axis=-1)
491
-        dev += abs(vest - v).max(axis=1)
492
-
493
-    q = p[:, :-1, :] - p[:, -1, None, :]
494
-    areas = abs(q[:, 0, 0] * q[:, 1, 1] - q[:, 0, 1] * q[:, 1, 0])
495
-    areas /= special.gamma(n_points_per_triangle)
496
-    areas = np.sqrt(areas)
497
-
498
-    vs_scale = vs[tri.vertices].ptp()
499
-    if vs_scale != 0:
500
-        dev /= vs_scale
501
-
502
-    return dev * areas
503
-
504
-class Learner2D(BaseLearner):
505
-    """Learns and predicts a function 'f: ℝ^2 → ℝ'.
506
-
507
-    Parameters
508
-    ----------
509
-    function : callable
510
-        The function to learn. Must take a tuple of two real
511
-        parameters and return a real number.
512
-    bounds : list of 2-tuples
513
-        A list ``[(a1, b1), (a2, b2)]`` containing bounds,
514
-        one per dimension.
515
-
516
-    Attributes
517
-    ----------
518
-    points_combined
519
-        Sample points so far including the unknown interpolated ones.
520
-    values_combined
521
-        Sampled values so far including the unknown interpolated ones.
522
-    points
523
-        Sample points so far with real results.
524
-    values
525
-        Sampled values so far with real results.
526
-
527
-    Notes
528
-    -----
529
-    Adapted from an initial implementation by Pauli Virtanen.
530
-
531
-    The sample points are chosen by estimating the point where the
532
-    linear and cubic interpolants based on the existing points have
533
-    maximal disagreement. This point is then taken as the next point
534
-    to be sampled.
535
-
536
-    In practice, this sampling protocol results in sparser sampling of
537
-    smooth regions, and denser sampling of regions where the function
538
-    changes rapidly, which is useful if the function is expensive to
539
-    compute.
540
-
541
-    This sampling procedure is not extremely fast, so to benefit from
542
-    it, your function needs to be slow enough to compute.
543
-    """
544
-
545
-    def __init__(self, function, bounds):
546
-        self.ndim = len(bounds)
547
-        if self.ndim != 2:
548
-            raise ValueError("Only 2-D sampling supported.")
549
-        self.bounds = tuple((float(a), float(b)) for a, b in bounds)
550
-        self._points = np.zeros([100, self.ndim])
551
-        self._values = np.zeros([100], dtype=float)
552
-        self._stack = []
553
-        self._interp = {}
554
-
555
-        xy_mean = np.mean(self.bounds, axis=1)
556
-        xy_scale = np.ptp(self.bounds, axis=1)
557
-
558
-        def scale(points):
559
-            return (points - xy_mean) / xy_scale
560
-
561
-        def unscale(points):
562
-            return points * xy_scale + xy_mean
563
-
564
-        self.scale = scale
565
-        self.unscale = unscale
566
-
567
-        # Keeps track of the index up to which _points and _values are filled
568
-        self.n = 0
569
-
570
-        self._bounds_points = list(itertools.product(*bounds))
571
-
572
-        # Add the loss improvement to the bounds in the stack
573
-        self._stack = [(*p, np.inf) for p in self._bounds_points]
574
-
575
-        self.function = function
576
-
577
-    @property
578
-    def points_combined(self):
579
-        return self._points[:self.n]
580
-
581
-    @property
582
-    def values_combined(self):
583
-        return self._values[:self.n]
584
-
585
-    @property
586
-    def points(self):
587
-        return np.delete(self.points_combined,
588
-                         list(self._interp.values()), axis=0)
589
-
590
-    @property
591
-    def values(self):
592
-        return np.delete(self.values_combined,
593
-                         list(self._interp.values()), axis=0)
594
-
595
-    def ip(self):
596
-        points = self.scale(self.points)
597
-        return interpolate.LinearNDInterpolator(points, self.values)
598
-
599
-    @property
600
-    def n_real(self):
601
-        return self.n - len(self._interp)
602
-
603
-    def ip_combined(self):
604
-        points = self.scale(self.points_combined)
605
-        values = self.values_combined
606
-
607
-        # Interpolate the unfinished points
608
-        if self._interp:
609
-            n_interp = list(self._interp.values())
610
-            bounds_are_done = not any(p in self._interp
611
-                                      for p in self._bounds_points)
612
-            if bounds_are_done:
613
-                values[n_interp] = self.ip()(points[n_interp])
614
-            else:
615
-                # It is important not to return exact zeros because
616
-                # otherwise the algo will try to add the same point
617
-                # to the stack each time.
618
-                values[n_interp] = np.random.rand(len(n_interp)) * 1e-15
619
-
620
-        return interpolate.LinearNDInterpolator(points, values)
621
-
622
-    def add_point(self, point, value):
623
-        nmax = self.values_combined.shape[0]
624
-        if self.n >= nmax:
625
-            self._values = np.resize(self._values, [2*nmax + 10])
626
-            self._points = np.resize(self._points, [2*nmax + 10, self.ndim])
627
-
628
-        point = tuple(point)
629
-
630
-        # When the point is not evaluated yet, add an entry to self._interp
631
-        # that saves the point and index.
632
-        if value is None:
633
-            self._interp[point] = self.n
634
-            old_point = False
635
-        else:
636
-            old_point = point in self._interp
637
-
638
-        # If the point is new, add a new entry to _points and _values;
639
-        # otherwise get the index of the value that is being replaced.
640
-        if old_point:
641
-            n = self._interp.pop(point)
642
-        else:
643
-            n = self.n
644
-            self.n += 1
645
-
646
-        self._points[n] = point
647
-        self._values[n] = value
648
-
649
-        # Remove the point from the stack if it is present.
650
-        for i, (*_point, _) in enumerate(self._stack):
651
-            if point == tuple(_point):
652
-                self._stack.pop(i)
653
-                break
654
-
655
-    def _fill_stack(self, stack_till=None):
656
-        if stack_till is None:
657
-            stack_till = 1
658
-
659
-        if self.values_combined.shape[0] < self.ndim + 1:
660
-            raise ValueError("too few points...")
661
-
662
-        # Interpolate
663
-        ip = self.ip_combined()
664
-        tri = ip.tri
665
-
666
-        losses = _losses_per_triangle(ip)
667
-
668
-        def point_exists(p):
669
-            eps = np.finfo(float).eps * self.points_combined.ptp() * 100
670
-            if abs(p - self.points_combined).sum(axis=1).min() < eps:
671
-                return True
672
-            if self._stack:
673
-                _stack_points, _ = self._split_stack()
674
-                if abs(p - np.asarray(_stack_points)).sum(axis=1).min() < eps:
675
-                    return True
676
-            return False
677
-
678
-        for j, _ in enumerate(losses):
679
-            # Estimate point of maximum curvature inside the simplex
680
-            jsimplex = np.argmax(losses)
681
-            p = tri.points[tri.vertices[jsimplex]]
682
-            point_new = self.unscale(p.mean(axis=-2))
683
-
684
-            # XXX: not sure whether this is necessary; it was there
685
-            # originally.
686
-            point_new = np.clip(point_new, *zip(*self.bounds))
687
-
688
-            # Check if it is really new
689
-            if point_exists(point_new):
690
-                losses[jsimplex] = 0
691
-                continue
692
-
693
-            # Add to stack
694
-            self._stack.append((*point_new, losses[jsimplex]))
695
-
696
-            if len(self._stack) >= stack_till:
697
-                break
698
-            else:
699
-                losses[jsimplex] = 0
700
-
701
-    def _split_stack(self, n=None):
702
-        points = []
703
-        loss_improvements = []
704
-        for *point, loss_improvement in self._stack[:n]:
705
-            points.append(point)
706
-            loss_improvements.append(loss_improvement)
707
-        return points, loss_improvements
708
-
709
-    def _choose_and_add_points(self, n):
710
-        if n <= len(self._stack):
711
-            points, loss_improvements = self._split_stack(n)
712
-            self.add_data(points, itertools.repeat(None))
713
-        else:
714
-            points = []
715
-            loss_improvements = []
716
-            n_left = n
717
-            while n_left > 0:
718
-                # The while loop is needed because `stack_till` could be larger
719
-                # than the number of triangles between the points. Therefore
720
-                # it could fill up to a length smaller than `stack_till`.
721
-                if self.n >= 2**self.ndim:
722
-                    # Only fill the stack if no more bounds left in _stack
723
-                    self._fill_stack(stack_till=n_left)
724
-                new_points, new_loss_improvements = self._split_stack(n_left)
725
-                points += new_points
726
-                loss_improvements += new_loss_improvements
727
-                self.add_data(new_points, itertools.repeat(None))
728
-                n_left -= len(new_points)
729
-
730
-        return points, loss_improvements
731
-
732
-    def choose_points(self, n, add_data=True):
733
-        if not add_data:
734
-            with restore(self):
735
-                return self._choose_and_add_points(n)
736
-        else:
737
-            return self._choose_and_add_points(n)
738
-
739
-    def loss(self, real=True):
740
-        n = self.n_real if real else self.n
741
-        bounds_are_not_done = any(p in self._interp
742
-                                  for p in self._bounds_points)
743
-        if n <= 4 or bounds_are_not_done:
744
-            return np.inf
745
-        ip = self.ip() if real else self.ip_combined()
746
-        losses = _losses_per_triangle(ip)
747
-        return losses.max()
748
-
749
-    def remove_unfinished(self):
750
-        self._points = self.points.copy()
751
-        self._values = self.values.copy()
752
-        self.n -= len(self._interp)
753
-        self._interp = {}
754
-
755
-    def plot(self, n_x=201, n_y=201):
756
-        x, y = self.bounds
757
-        lbrt = x[0], y[0], x[1], y[1]
758
-        if self.n_real >= 4:
759
-            x = np.linspace(-0.5, 0.5, n_x)
760
-            y = np.linspace(-0.5, 0.5, n_y)
761
-            ip = self.ip()
762
-            z = ip(x[:, None], y[None, :])
763
-            return hv.Image(np.rot90(z), bounds=lbrt)
764
-        else:
765
-            return hv.Image(np.zeros((2, 2)), bounds=lbrt)
766
-
767
-
768
-@contextmanager
769
-def restore(*learners):
770
-    states = [learner.__getstate__() for learner in learners]
771
-    try:
772
-        yield
773
-    finally:
774
-        for state, learner in zip(states, learners):
775
-            learner.__setstate__(state)
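
The monolithic module deleted above is split over the files that follow. A sketch of the resulting layout, inferred from the relative imports and the renames in this commit (the exact paths of the new files are elided in this view):

    adaptive/learner/
        __init__.py            re-exports all learners
        base_learner.py        BaseLearner ABC
        average_learner.py     AverageLearner
        balancing_learner.py   BalancingLearner
        learner1D.py           Learner1D
        learner2D.py           Learner2D
        integrator_coeffs.py   renamed from coeffs.py
        integrator_learner.py  renamed from cquad.py (Learner is now IntegratorLearner)
        utils.py               the 'restore' context manager
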
776 0
new file mode 100644
... ...
@@ -0,0 +1,7 @@
1
+# -*- coding: utf-8 -*-
2
+from .average_learner import AverageLearner
3
+from .base_learner import BaseLearner
4
+from .balancing_learner import BalancingLearner
5
+from .learner1D import Learner1D
6
+from .learner2D import Learner2D
7
+from .integrator_learner import IntegratorLearner
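
With these re-exports every learner stays importable from one place; a minimal sketch, assuming the package root is importable as adaptive.learner (as the rename targets in this commit suggest):

    from adaptive.learner import Learner1D, Learner2D

    # Old import sites keep working through the package-level re-exports.
    learner = Learner1D(lambda x: x**2, bounds=(-1, 1))
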
0 8
new file mode 100644
... ...
@@ -0,0 +1,87 @@
1
+# -*- coding: utf-8 -*-
2
+import itertools
3
+from math import sqrt
4
+
5
+import holoviews as hv
6
+import numpy as np
7
+
8
+from .base_learner import BaseLearner
9
+
10
+class AverageLearner(BaseLearner):
11
+    """A naive implementation of adaptive computing of averages.
12
+
13
+    The learned function must depend on an integer input variable that
14
+    represents the source of randomness.
15
+
16
+    Parameters
17
+    ----------
18
+    atol : float
19
+        Desired absolute tolerance
20
+    rtol : float
21
+        Desired relative tolerance
22
+    """
23
+
24
+    def __init__(self, function, atol=None, rtol=None):
25
+        if atol is None and rtol is None:
26
+            raise ValueError('At least one of `atol` and `rtol` should be set.')
27
+        if atol is None:
28
+            atol = np.inf
29
+        if rtol is None:
30
+            rtol = np.inf
31
+
32
+        self.data = {}
33
+        self.function = function
34
+        self.atol = atol
35
+        self.rtol = rtol
36
+        self.n = 0
37
+        self.n_requested = 0
38
+        self.sum_f = 0
39
+        self.sum_f_sq = 0
40
+
41
+    def choose_points(self, n, add_data=True):
42
+        points = list(range(self.n_requested, self.n_requested + n))
43
+        loss_improvements = [self.loss()] * n
44
+        if add_data:
45
+            self.add_data(points, itertools.repeat(None))
46
+        return points, loss_improvements
47
+
48
+    def add_point(self, n, value):
49
+        self.data[n] = value
50
+        if value is None:
51
+            self.n_requested += 1
52
+            return
53
+        else:
54
+            self.n += 1
55
+            self.sum_f += value
56
+            self.sum_f_sq += value**2
57
+
58
+    @property
59
+    def mean(self):
60
+        return self.sum_f / self.n
61
+
62
+    @property
63
+    def std(self):
64
+        n = self.n
65
+        if n < 2:
66
+            return np.inf
67
+        return sqrt((self.sum_f_sq - n * self.mean**2) / (n - 1))
68
+
69
+    def loss(self, real=True):
70
+        n = self.n
71
+        if n < 2:
72
+            return np.inf
73
+        standard_error = self.std / sqrt(n if real else self.n_requested)
74
+        return max(standard_error / self.atol,
75
+                   standard_error / abs(self.mean) / self.rtol)
76
+
77
+    def remove_unfinished(self):
78
+        """Remove uncomputed data from the learner."""
79
+        pass
80
+
81
+    def plot(self):
82
+        vals = [v for v in self.data.values() if v is not None]
83
+        if not vals:
84
+            return hv.Histogram([[], []])
85
+        num_bins = int(max(5, sqrt(self.n)))
86
+        vals = hv.Points(vals)
87
+        return hv.operation.histogram(vals, num_bins=num_bins, dimension=1)
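
For reference, a minimal sequential usage sketch of AverageLearner; the noisy function g below is hypothetical:

    import random

    def g(seed):
        # Hypothetical noisy function; the integer argument seeds the randomness.
        random.seed(seed)
        return random.gauss(1.0, 0.1)

    learner = AverageLearner(g, rtol=0.01)
    while learner.loss() > 1:
        # loss() falls below 1 once the standard error meets the tolerance.
        points, _ = learner.choose_points(10)
        learner.add_data(points, [g(p) for p in points])
    print(learner.mean, learner.std)
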
0 88
new file mode 100644
... ...
@@ -0,0 +1,82 @@
1
+# -*- coding: utf-8 -*-
2
+import functools
3
+from operator import itemgetter
4
+
5
+from .base_learner import BaseLearner
6
+from .utils import restore
7
+
8
+
9
+def dispatch(child_functions, arg):
10
+    index, x = arg
11
+    return child_functions[index](x)
12
+
13
+
14
+class BalancingLearner(BaseLearner):
15
+    """Choose the optimal points from a set of learners.
16
+
17
+    Parameters
18
+    ----------
19
+    learners : sequence of BaseLearner
20
+        The learners from which to choose. These must all have the same type.
21
+
22
+    Notes
23
+    -----
24
+    This learner compares the 'loss' calculated from the "child" learners.
25
+    This requires that the 'loss' from different learners *can be meaningfully
26
+    compared*. For the moment we enforce this restriction by requiring that
27
+    all learners are the same type but (depending on the internals of the
28
+    learner) it may be that the loss cannot be compared *even between learners
29
+    of the same type*. In this case the BalancingLearner will behave in an
30
+    undefined way.
31
+    """
32
+
33
+    def __init__(self, learners):
34
+        self.learners = learners
35
+
36
+        # Naively we would make 'function' a method, but this causes problems
37
+        # when using executors from 'concurrent.futures' because we have to
38
+        # pickle the whole learner.
39
+        self.function = functools.partial(dispatch, [l.function for l
40
+                                                     in self.learners])
41
+
42
+        if len(set(learner.__class__ for learner in self.learners)) > 1:
43
+            raise TypeError('A BalancingLearner can handle only one type '
44
+                            'of learners.')
45
+
46
+    def _choose_and_add_points(self, n):
47
+        points = []
48
+        for _ in range(n):
49
+            loss_improvements = []
50
+            pairs = []
51
+            for index, learner in enumerate(self.learners):
52
+                point, loss_improvement = learner.choose_points(n=1,
53
+                                                                add_data=False)
54
+                loss_improvements.append(loss_improvement[0])
55
+                pairs.append((index, point[0]))
56
+            x, _ = max(zip(pairs, loss_improvements), key=itemgetter(1))
57
+            points.append(x)
58
+            self.add_point(x, None)
59
+        return points, None
60
+
61
+    def choose_points(self, n, add_data=True):
62
+        """Choose points for learners."""
63
+        if not add_data:
64
+            with restore(*self.learners):
65
+                return self._choose_and_add_points(n)
66
+        else:
67
+            return self._choose_and_add_points(n)
68
+
69
+    def add_point(self, x, y):
70
+        index, x = x
71
+        self.learners[index].add_point(x, y)
72
+
73
+    def loss(self, real=True):
74
+        return max(learner.loss(real) for learner in self.learners)
75
+
76
+    def plot(self, index):
77
+        return self.learners[index].plot()
78
+
79
+    def remove_unfinished(self):
80
+        """Remove uncomputed data from the learners."""
81
+        for learner in self.learners:
82
+            learner.remove_unfinished()
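
A sketch of how the (index, x) point format flows through a BalancingLearner; the two toy functions are hypothetical:

    from adaptive.learner import BalancingLearner, Learner1D

    learners = [Learner1D(f, bounds=(-1, 1))
                for f in (lambda x: x, lambda x: x**2)]
    balancer = BalancingLearner(learners)

    points, _ = balancer.choose_points(4)  # each point is an (index, x) pair
    for point in points:
        # 'function' dispatches on the index to the child learner's function.
        balancer.add_point(point, balancer.function(point))
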
0 83
new file mode 100644
... ...
@@ -0,0 +1,83 @@
1
+# -*- coding: utf-8 -*-
2
+import abc
3
+import collections
4
+from copy import deepcopy
5
+
6
+
7
+class BaseLearner(metaclass=abc.ABCMeta):
8
+    """Base class for algorithms for learning a function 'f: X → Y'.
9
+
10
+    Attributes
11
+    ----------
12
+    function : callable: X → Y
13
+        The function to learn.
14
+    data : dict: X → Y
15
+        'function' evaluated at certain points.
16
+        The values can be 'None', which indicates that the point
17
+        will be evaluated, but that we do not have the result yet.
18
+
19
+    Subclasses may define a 'plot' method that takes no parameters
20
+    and returns a holoviews plot.
21
+    """
22
+
23
+    def add_data(self, xvalues, yvalues):
24
+        """Add data to the learner.
25
+
26
+        Parameters
27
+        ----------
28
+        xvalues : value from the function domain, or iterable of such
29
+            Values from the domain of the learned function.
30
+        yvalues : value from the function image, or iterable of such
31
+            Values from the range of the learned function, or None.
32
+            If 'None', then it indicates that the value has not yet
33
+            been computed.
34
+        """
35
+        if all(isinstance(i, collections.abc.Iterable) for i in [xvalues, yvalues]):
36
+            for x, y in zip(xvalues, yvalues):
37
+                self.add_point(x, y)
38
+        else:
39
+            self.add_point(xvalues, yvalues)
40
+
41
+    @abc.abstractmethod
42
+    def add_point(self, x, y):
43
+        """Add a single datapoint to the learner."""
44
+        pass
45
+
46
+    @abc.abstractmethod
47
+    def remove_unfinished(self):
48
+        """Remove uncomputed data from the learner."""
49
+        pass
50
+
51
+    @abc.abstractmethod
52
+    def loss(self, real=True):
53
+        """Return the loss for the current state of the learner.
54
+
55
+        Parameters
56
+        ----------
57
+        real : bool, default: True
58
+            If False, return the "expected" loss, i.e. the
59
+            loss including the as-yet unevaluated points
60
+            (possibly by interpolation).
61
+        """
62
+
63
+    @abc.abstractmethod
64
+    def choose_points(self, n, add_data=True):
65
+        """Choose the next 'n' points to evaluate.
66
+
67
+        Parameters
68
+        ----------
69
+        n : int
70
+            The number of points to choose.
71
+        add_data : bool, default: True
72
+            If True, add the chosen points to this
73
+            learner's 'data' with 'None' for the 'y'
74
+            values. Set this to False if you do not
75
+            want to modify the state of the learner.
76
+        """
77
+        pass
78
+
79
+    def __getstate__(self):
80
+        return deepcopy(self.__dict__)
81
+
82
+    def __setstate__(self, state):
83
+        self.__dict__ = state
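
The contract above amounts to four abstract methods plus the add_data convenience; a minimal, purely illustrative subclass (hypothetical, not part of this commit):

    class SequenceLearner(BaseLearner):
        """Toy learner that samples the integers 0, 1, 2, ... in order."""

        def __init__(self, function):
            self.function = function
            self.data = {}

        def add_point(self, x, y):
            self.data[x] = y

        def remove_unfinished(self):
            self.data = {x: y for x, y in self.data.items() if y is not None}

        def loss(self, real=True):
            return float('inf') if not self.data else 0

        def choose_points(self, n, add_data=True):
            start = max(self.data, default=-1) + 1
            points = list(range(start, start + n))
            if add_data:
                self.add_data(points, [None] * n)
            return points, [float('inf')] * n
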
0 84
similarity index 96%
1 85
rename from coeffs.py
2 86
rename to adaptive/learner/integrator_coeffs.py
... ...
@@ -1,4 +1,5 @@
1
-from fractions import Fraction as Frac
1
+# -*- coding: utf-8 -*-
2
+from fractions import Fraction
2 3
 from collections import defaultdict
3 4
 import numpy as np
4 5
 import scipy.linalg
... ...
@@ -11,12 +12,12 @@ def legendre(n):
11 12
 
12 13
     The return value is a list of list of fraction.Fraction instances.
13 14
     """
14
-    result = [[Frac(1)], [Frac(0), Frac(1)]]
15
+    result = [[Fraction(1)], [Fraction(0), Fraction(1)]]
15 16
     if n <= 2:
16 17
         return result[:n]
17 18
     for i in range(2, n):
18 19
         # Use Bonnet's recursion formula.
19
-        new = (i + 1) * [Frac(0)]
20
+        new = (i + 1) * [Fraction(0)]
20 21
         new[1:] = (r * (2*i - 1) for r in result[-1])
21 22
         new[:-2] = (n - r * (i - 1) for n, r in zip(new[:-2], result[-2]))
22 23
         new[:] = (n / i for n in new)
... ...
@@ -115,7 +116,7 @@ def calc_bdef(ns):
115 116
     result = []
116 117
     for n in ns:
117 118
         poly = []
118
-        a = list(map(Frac, newton(n)))
119
+        a = list(map(Fraction, newton(n)))
119 120
         for b in legs[:n + 1]:
120 121
             igral = scalar_product(a, b)
121 122
 
122 123
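
For reference, Bonnet's recursion formula used by legendre() above is

    (n + 1) P_{n+1}(x) = (2n + 1) x P_n(x) - n P_{n-1}(x),

which the code applies with exact Fraction coefficients so that the resulting quadrature coefficients stay free of rounding error.
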
similarity index 98%
123 124
rename from cquad.py
124 125
rename to adaptive/learner/integrator_learner.py
... ...
@@ -1,3 +1,4 @@
1
+# -*- coding: utf-8 -*-
1 2
 # Copyright 2010 Pedro Gonnet
2 3
 # Copyright 2017 Christoph Groth
3 4
 # Copyright 2017 `adaptive` authors
... ...
@@ -11,8 +12,10 @@ import numpy as np
11 12
 from scipy.linalg import norm
12 13
 from sortedcontainers import SortedDict, SortedSet
13 14
 
14
-from adaptive.learner import BaseLearner
15
-from coeffs import b_def, T_left, T_right, ns, xi, V_inv, Vcond, alpha, gamma
15
+from .base_learner import BaseLearner
16
+from .integrator_coeffs import (b_def, T_left, T_right, ns,
17
+                                xi, V_inv, Vcond, alpha, gamma)
18
+
16 19
 
17 20
 eps = np.spacing(1)
18 21
 
... ...
@@ -273,7 +276,7 @@ class Interval:
273 276
         return all(same_slots)
274 277
 
275 278
 
276
-class Learner(BaseLearner):
279
+class IntegratorLearner(BaseLearner):
277 280
     def __init__(self, function, bounds, tol):
278 281
         self.function = function
279 282
         self.bounds = bounds
280 283
new file mode 100644
... ...
@@ -0,0 +1,231 @@
1
+# -*- coding: utf-8 -*-
2
+from copy import deepcopy
3
+import heapq
4
+import itertools
5
+from math import sqrt
6
+
7
+import holoviews as hv
8
+import numpy as np
9
+import sortedcontainers
10
+
11
+from .base_learner import BaseLearner
12
+
13
+class Learner1D(BaseLearner):
14
+    """Learns and predicts a function 'f:ℝ → ℝ'.
15
+
16
+    Parameters
17
+    ----------
18
+    function : callable
19
+        The function to learn. Must take a single real parameter and
20
+        return a real number.
21
+    bounds : pair of reals
22
+        The bounds of the interval on which to learn 'function'.
23
+    """
24
+
25
+    def __init__(self, function, bounds):
26
+        self.function = function
27
+
28
+        # A dict {(x_left, x_right): loss} storing the loss per interval.
29
+        self.losses = {}
30
+        self.losses_combined = {}
31
+
32
+        self.data = sortedcontainers.SortedDict()
33
+        self.data_interp = {}
34
+
35
+        # A dict {x_n: [x_{n-1}, x_{n+1}]} for quick checking of local
36
+        # properties.
37
+        self.neighbors = sortedcontainers.SortedDict()
38
+        self.neighbors_combined = sortedcontainers.SortedDict()
39
+
40
+        # Bounding box [[minx, maxx], [miny, maxy]].
41
+        self._bbox = [list(bounds), [np.inf, -np.inf]]
42
+
43
+        # Data scale (maxx - minx), (maxy - miny)
44
+        self._scale = [bounds[1] - bounds[0], 0]
45
+        self._oldscale = deepcopy(self._scale)
46
+
47
+        self.bounds = list(bounds)
48
+
49
+    @property
50
+    def data_combined(self):
51
+        return {**self.data, **self.data_interp}
52
+
53
+    def interval_loss(self, x_left, x_right, data):
54
+        """Calculate loss in the interval x_left, x_right.
55
+
56
+        Currently returns the rescaled length of the interval. If one of the
57
+        y-values is missing, returns 0 (so the intervals with missing data are
58
+        never touched). This behavior should be improved later.
59
+        """
60
+        y_right, y_left = data[x_right], data[x_left]
61
+        if self._scale[1] == 0:
62
+            return sqrt(((x_right - x_left) / self._scale[0])**2)
63
+        else:
64
+            return sqrt(((x_right - x_left) / self._scale[0])**2 +
65
+                        ((y_right - y_left) / self._scale[1])**2)
66
+
67
+    def loss(self, real=True):
68
+        losses = self.losses if real else self.losses_combined
69
+        if len(losses) == 0:
70
+            return float('inf')
71
+        else:
72
+            return max(losses.values())
73
+
74
+    def update_losses(self, x, data, neighbors, losses):
75
+        x_lower, x_upper = neighbors[x]
76
+        if x_lower is not None:
77
+            losses[x_lower, x] = self.interval_loss(x_lower, x, data)
78
+        if x_upper is not None:
79
+            losses[x, x_upper] = self.interval_loss(x, x_upper, data)
80
+        try:
81
+            del losses[x_lower, x_upper]
82
+        except KeyError:
83
+            pass
84
+
85
+    def find_neighbors(self, x, neighbors):
86
+        pos = neighbors.bisect_left(x)
87
+        x_lower = neighbors.iloc[pos-1] if pos != 0 else None
88
+        x_upper = neighbors.iloc[pos] if pos != len(neighbors) else None
89
+        return x_lower, x_upper
90
+
91
+    def update_neighbors(self, x, neighbors):
92
+        if x not in neighbors:  # The point is new
93
+            x_lower, x_upper = self.find_neighbors(x, neighbors)
94
+            neighbors[x] = [x_lower, x_upper]
95
+            neighbors.get(x_lower, [None, None])[1] = x
96
+            neighbors.get(x_upper, [None, None])[0] = x
97
+
98
+    def update_scale(self, x, y):
99
+        self._bbox[0][0] = min(self._bbox[0][0], x)
100
+        self._bbox[0][1] = max(self._bbox[0][1], x)
101
+        if y is not None:
102
+            self._bbox[1][0] = min(self._bbox[1][0], y)
103
+            self._bbox[1][1] = max(self._bbox[1][1], y)
104
+
105
+        self._scale = [self._bbox[0][1] - self._bbox[0][0],
106
+                       self._bbox[1][1] - self._bbox[1][0]]
107
+
108
+    def add_point(self, x, y):
109
+        real = y is not None
110
+
111
+        if real:
112
+            # Add point to the real data dict and pop from the unfinished
113
+            # data_interp dict.
114
+            self.data[x] = y
115
+            try:
116
+                del self.data_interp[x]
117
+            except KeyError:
118
+                pass
119
+        else:
120
+            # The keys of data_interp are the unknown points
121
+            self.data_interp[x] = None
122
+
123
+        # Update the neighbors
124
+        self.update_neighbors(x, self.neighbors_combined)
125
+        if real:
126
+            self.update_neighbors(x, self.neighbors)
127
+
128
+        # Update the scale
129
+        self.update_scale(x, y)
130
+
131
+        # Interpolate
132
+        if not real:
133
+            self.data_interp = self.interpolate()
134
+
135
+        # Update the losses
136
+        self.update_losses(x, self.data_combined, self.neighbors_combined,
137
+                           self.losses_combined)
138
+        if real:
139
+            self.update_losses(x, self.data, self.neighbors, self.losses)
140
+
141
+        # If the scale has doubled, recompute all losses.
142
+        if any(s > 2 * s_old for s, s_old in zip(self._scale, self._oldscale)):
143
+            self.losses = {xs: self.interval_loss(*xs, self.data)
144
+                           for xs in self.losses}
145
+            self.losses_combined = {x: self.interval_loss(*x,
146
+                                                          self.data_combined)
147
+                                    for x in self.losses_combined}
148
+            self._oldscale = self._scale
149
+
150
+    def choose_points(self, n, add_data=True):
151
+        """Return n points that are expected to maximally reduce the loss."""
152
+        # Find out how to divide the n points over the intervals
153
+        # by finding positive integers n_i that minimize max(L_i / n_i) subject
154
+        # to a constraint that sum(n_i) = n + N, with N the total number of
155
+        # intervals.
156
+
157
+        # Return equally spaced points within each interval to which points
158
+        # will be added.
159
+        if n == 0:
160
+            return [], []
161
+
162
+        # If the bounds have not been chosen yet, we choose them first.
163
+        points = []
164
+        for bound in self.bounds:
165
+            if bound not in self.data and bound not in self.data_interp:
166
+                points.append(bound)
167
+
168
+        # Ensure we return exactly 'n' points.
169
+        if points:
170
+            loss_improvements = [float('inf')] * n
171
+            if n <= 2:
172
+                points = points[:n]
173
+            else:
174
+                points = np.linspace(*self.bounds, n)
175
+        else:
176
+            def xs(x, n):
177
+                if n == 1:
178
+                    return []
179
+                else:
180
+                    step = (x[1] - x[0]) / n
181
+                    return [x[0] + step * i for i in range(1, n)]
182
+
183
+            # Calculate how many points belong to each interval.
184
+            quals = [(-loss, x_range, 1) for (x_range, loss) in
185
+                     self.losses_combined.items()]
186
+
187
+            heapq.heapify(quals)
188
+
189
+            for point_number in range(n):
190
+                quality, x, n = quals[0]
191
+                heapq.heapreplace(quals, (quality * n / (n + 1), x, n + 1))
192
+
193
+            points = list(itertools.chain.from_iterable(xs(x, n)
194
+                          for quality, x, n in quals))
195
+
196
+            loss_improvements = list(itertools.chain.from_iterable(
197
+                                     itertools.repeat(-quality, n)
198
+                                     for quality, x, n in quals))
199
+
200
+        if add_data:
201
+            self.add_data(points, itertools.repeat(None))
202
+
203
+        return points, loss_improvements
204
+
205
+    def interpolate(self, extra_points=None):
206
+        xs = list(self.data.keys())
207
+        ys = list(self.data.values())
208
+        xs_unfinished = list(self.data_interp.keys())
209
+
210
+        if extra_points is not None:
211
+            xs_unfinished += extra_points
212
+
213
+        if len(ys) == 0:
214
+            interp_ys = (0,) * len(xs_unfinished)
215
+        else:
216
+            interp_ys = np.interp(xs_unfinished, xs, ys)
217
+
218
+        data_interp = {x: y for x, y in zip(xs_unfinished, interp_ys)}
219
+
220
+        return data_interp
221
+
222
+    def plot(self):
223
+        if self.data:
224
+            return hv.Scatter(self.data)
225
+        else:
226
+            return hv.Scatter([])
227
+
228
+    def remove_unfinished(self):
229
+        self.data_interp = {}
230
+        self.losses_combined = deepcopy(self.losses)
231
+        self.neighbors_combined = deepcopy(self.neighbors)
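
A minimal sequential driver for Learner1D, with no executor involved; the sharply peaked target function is hypothetical:

    from math import exp

    from adaptive.learner import Learner1D

    def f(x):
        # Hypothetical target: a narrow peak that rewards adaptive sampling.
        return exp(-x**2 / 0.01)

    learner = Learner1D(f, bounds=(-1, 1))
    while learner.loss() > 0.01:
        points, _ = learner.choose_points(1)
        learner.add_data(points, map(f, points))
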
0 232
new file mode 100644
... ...
@@ -0,0 +1,303 @@
1
+# -*- coding: utf-8 -*-
2
+import itertools
3
+
4
+import holoviews as hv
5
+import numpy as np
6
+from scipy import interpolate, special
7
+
8
+from .base_learner import BaseLearner
9
+from .utils import restore
10
+
11
+
12
+# Learner2D and helper functions.
13
+
14
+def _losses_per_triangle(ip):
15
+    tri = ip.tri
16
+    vs = ip.values.ravel()
17
+
18
+    gradients = interpolate.interpnd.estimate_gradients_2d_global(
19
+        tri, vs, tol=1e-6)
20
+    p = tri.points[tri.vertices]
21
+    g = gradients[tri.vertices]
22
+    v = vs[tri.vertices]
23
+    n_points_per_triangle = p.shape[1]
24
+
25
+    dev = 0
26
+    for j in range(n_points_per_triangle):
27
+        vest = v[:, j, None] + ((p[:, :, :] - p[:, j, None, :]) *
28
+                                g[:, j, None, :]).sum(axis=-1)
29
+        dev += abs(vest - v).max(axis=1)
30
+
31
+    q = p[:, :-1, :] - p[:, -1, None, :]
32
+    areas = abs(q[:, 0, 0] * q[:, 1, 1] - q[:, 0, 1] * q[:, 1, 0])
33
+    areas /= special.gamma(n_points_per_triangle)
34
+    areas = np.sqrt(areas)
35
+
36
+    vs_scale = vs[tri.vertices].ptp()
37
+    if vs_scale != 0:
38
+        dev /= vs_scale
39
+
40
+    return dev * areas
41
+
42
+class Learner2D(BaseLearner):
43
+    """Learns and predicts a function 'f: ℝ^2 → ℝ'.
44
+
45
+    Parameters
46
+    ----------
47
+    function : callable
48
+        The function to learn. Must take a tuple of two real
49
+        parameters and return a real number.
50
+    bounds : list of 2-tuples
51
+        A list ``[(a1, b1), (a2, b2)]`` containing bounds,
52
+        one per dimension.
53
+
54
+    Attributes
55
+    ----------
56
+    points_combined
57
+        Sample points so far including the unknown interpolated ones.
58
+    values_combined
59
+        Sampled values so far including the unknown interpolated ones.
60
+    points
61
+        Sample points so far with real results.
62
+    values
63
+        Sampled values so far with real results.
64
+
65
+    Notes
66
+    -----
67
+    Adapted from an initial implementation by Pauli Virtanen.
68
+
69
+    The sample points are chosen by estimating the point where the
70
+    linear and cubic interpolants based on the existing points have
71
+    maximal disagreement. This point is then taken as the next point
72
+    to be sampled.
73
+
74
+    In practice, this sampling protocol results in sparser sampling of
75
+    smooth regions, and denser sampling of regions where the function
76
+    changes rapidly, which is useful if the function is expensive to
77
+    compute.
78
+
79
+    This sampling procedure is not extremely fast, so to benefit from
80
+    it, your function needs to be slow enough to compute.
81
+    """
82
+
83
+    def __init__(self, function, bounds):
84
+        self.ndim = len(bounds)
85
+        if self.ndim != 2:
86
+            raise ValueError("Only 2-D sampling supported.")
87
+        self.bounds = tuple((float(a), float(b)) for a, b in bounds)
88
+        self._points = np.zeros([100, self.ndim])
89
+        self._values = np.zeros([100], dtype=float)
90
+        self._stack = []
91
+        self._interp = {}
92
+
93
+        xy_mean = np.mean(self.bounds, axis=1)
94
+        xy_scale = np.ptp(self.bounds, axis=1)
95
+
96
+        def scale(points):
97
+            return (points - xy_mean) / xy_scale
98
+
99
+        def unscale(points):
100
+            return points * xy_scale + xy_mean
101
+
102
+        self.scale = scale
103
+        self.unscale = unscale
104
+
105
+        # Keeps track of the index up to which _points and _values are filled
106
+        self.n = 0
107
+
108
+        self._bounds_points = list(itertools.product(*bounds))
109
+
110
+        # Add the loss improvement to the bounds in the stack
111
+        self._stack = [(*p, np.inf) for p in self._bounds_points]
112
+
113
+        self.function = function
114
+
115
+    @property
116
+    def points_combined(self):
117
+        return self._points[:self.n]
118
+
119
+    @property
120
+    def values_combined(self):
121
+        return self._values[:self.n]
122
+
123
+    @property
124
+    def points(self):
125
+        return np.delete(self.points_combined,
126
+                         list(self._interp.values()), axis=0)
127
+
128
+    @property
129
+    def values(self):
130
+        return np.delete(self.values_combined,
131
+                         list(self._interp.values()), axis=0)
132
+
133
+    def ip(self):
134
+        points = self.scale(self.points)
135
+        return interpolate.LinearNDInterpolator(points, self.values)
136
+
137
+    @property
138
+    def n_real(self):
139
+        return self.n - len(self._interp)
140
+
141
+    def ip_combined(self):
142
+        points = self.scale(self.points_combined)
143
+        values = self.values_combined
144
+
145
+        # Interpolate the unfinished points
146
+        if self._interp:
147
+            n_interp = list(self._interp.values())
148
+            bounds_are_done = not any(p in self._interp
149
+                                      for p in self._bounds_points)
150
+            if bounds_are_done:
151
+                values[n_interp] = self.ip()(points[n_interp])
152
+            else:
153
+                # It is important not to return exact zeros because
154
+                # otherwise the algo will try to add the same point
155
+                # to the stack each time.
156
+                values[n_interp] = np.random.rand(len(n_interp)) * 1e-15
157
+
158
+        return interpolate.LinearNDInterpolator(points, values)
159
+
160
+    def add_point(self, point, value):
161
+        nmax = self.values_combined.shape[0]
162
+        if self.n >= nmax:
163
+            self._values = np.resize(self._values, [2*nmax + 10])
164
+            self._points = np.resize(self._points, [2*nmax + 10, self.ndim])
165
+
166
+        point = tuple(point)
167
+
168
+        # When the point is not evaluated yet, add an entry to self._interp
169
+        # that saves the point and index.
170
+        if value is None:
171
+            self._interp[point] = self.n
172
+            old_point = False
173
+        else:
174
+            old_point = point in self._interp
175
+
176
+        # If the point is new, add a new entry to _points and _values;
177
+        # otherwise get the index of the value that is being replaced.
178
+        if old_point:
179
+            n = self._interp.pop(point)
180
+        else:
181
+            n = self.n
182
+            self.n += 1
183
+
184
+        self._points[n] = point
185
+        self._values[n] = value
186
+
187
+        # Remove the point from the stack if it is present.
188
+        for i, (*_point, _) in enumerate(self._stack):
189
+            if point == tuple(_point):
190
+                self._stack.pop(i)
191
+                break
192
+
193
+    def _fill_stack(self, stack_till=None):
194
+        if stack_till is None:
195
+            stack_till = 1
196
+
197
+        if self.values_combined.shape[0] < self.ndim + 1:
198
+            raise ValueError("too few points...")
199
+
200
+        # Interpolate
201
+        ip = self.ip_combined()
202
+        tri = ip.tri
203
+
204
+        losses = _losses_per_triangle(ip)
205
+
206
+        def point_exists(p):
207
+            eps = np.finfo(float).eps * self.points_combined.ptp() * 100
208
+            if abs(p - self.points_combined).sum(axis=1).min() < eps:
209
+                return True
210
+            if self._stack:
211
+                _stack_points, _ = self._split_stack()
212
+                if abs(p - np.asarray(_stack_points)).sum(axis=1).min() < eps:
213
+                    return True
214
+            return False
215
+
216
+        for j, _ in enumerate(losses):
217
+            # Estimate point of maximum curvature inside the simplex
218
+            jsimplex = np.argmax(losses)
219
+            p = tri.points[tri.vertices[jsimplex]]
220
+            point_new = self.unscale(p.mean(axis=-2))
221
+
222
+            # XXX: not sure whether this is necessary; it was there
223
+            # originally.
224
+            point_new = np.clip(point_new, *zip(*self.bounds))
225
+
226
+            # Check if it is really new
227
+            if point_exists(point_new):
228
+                losses[jsimplex] = 0
229
+                continue
230
+
231
+            # Add to stack
232
+            self._stack.append((*point_new, losses[jsimplex]))
233
+
234
+            if len(self._stack) >= stack_till:
235
+                break
236
+            else:
237
+                losses[jsimplex] = 0
238
+
239
+    def _split_stack(self, n=None):
240
+        points = []
241
+        loss_improvements = []
242
+        for *point, loss_improvement in self._stack[:n]:
243
+            points.append(point)
244
+            loss_improvements.append(loss_improvement)
245
+        return points, loss_improvements
246
+
247
+    def _choose_and_add_points(self, n):
248
+        if n <= len(self._stack):
249
+            points, loss_improvements = self._split_stack(n)
250
+            self.add_data(points, itertools.repeat(None))
251
+        else:
252
+            points = []
253
+            loss_improvements = []
254
+            n_left = n
255
+            while n_left > 0:
256
+                # The while loop is needed because `stack_till` could be larger
257
+                # than the number of triangles between the points. Therefore
258
+                # it could fill up to a length smaller than `stack_till`.
259
+                if self.n >= 2**self.ndim:
260
+                    # Only fill the stack if no more bounds left in _stack
261
+                    self._fill_stack(stack_till=n_left)
262
+                new_points, new_loss_improvements = self._split_stack(n_left)
263
+                points += new_points
264
+                loss_improvements += new_loss_improvements
265
+                self.add_data(new_points, itertools.repeat(None))
266
+                n_left -= len(new_points)
267
+
268
+        return points, loss_improvements
269
+
270
+    def choose_points(self, n, add_data=True):
271
+        if not add_data:
272
+            with restore(self):
273
+                return self._choose_and_add_points(n)
274
+        else:
275
+            return self._choose_and_add_points(n)
276
+
277
+    def loss(self, real=True):
278
+        n = self.n_real if real else self.n
279
+        bounds_are_not_done = any(p in self._interp
280
+                                  for p in self._bounds_points)
281
+        if n <= 4 or bounds_are_not_done:
282
+            return np.inf
283
+        ip = self.ip() if real else self.ip_combined()
284
+        losses = _losses_per_triangle(ip)
285
+        return losses.max()
286
+
287
+    def remove_unfinished(self):
288
+        self._points = self.points.copy()
289
+        self._values = self.values.copy()
290
+        self.n -= len(self._interp)
291
+        self._interp = {}
292
+
293
+    def plot(self, n_x=201, n_y=201):
294
+        x, y = self.bounds
295
+        lbrt = x[0], y[0], x[1], y[1]
296
+        if self.n_real >= 4:
297
+            x = np.linspace(-0.5, 0.5, n_x)
298
+            y = np.linspace(-0.5, 0.5, n_y)
299
+            ip = self.ip()
300
+            z = ip(x[:, None], y[None, :])
301
+            return hv.Image(np.rot90(z), bounds=lbrt)
302
+        else:
303
+            return hv.Image(np.zeros((2, 2)), bounds=lbrt)
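
The analogous sequential sketch for Learner2D, with a hypothetical ring-shaped target:

    import numpy as np

    from adaptive.learner import Learner2D

    def ring(xy):
        # Hypothetical target with a sharp circular feature.
        x, y = xy
        return np.exp(-(x**2 + y**2 - 0.5)**2 / 0.01)

    learner = Learner2D(ring, bounds=[(-1, 1), (-1, 1)])
    while learner.loss() > 0.05:
        points, _ = learner.choose_points(1)
        learner.add_data(points, [ring(p) for p in points])
    learner.plot()
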
0 304
new file mode 100644
... ...
@@ -0,0 +1,11 @@
1
+# -*- coding: utf-8 -*-
2
+from contextlib import contextmanager
3
+
4
+@contextmanager
5
+def restore(*learners):
6
+    states = [learner.__getstate__() for learner in learners]
7
+    try:
8
+        yield
9
+    finally:
10
+        for state, learner in zip(states, learners):
11
+            learner.__setstate__(state)
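
restore makes look-ahead queries side-effect free; it is what backs choose_points(..., add_data=False) in the learners above. A short sketch, assuming the module lives at adaptive/learner/utils.py as the relative imports suggest:

    from adaptive.learner import Learner1D
    from adaptive.learner.utils import restore

    learner = Learner1D(lambda x: x, bounds=(-1, 1))
    with restore(learner):
        points, _ = learner.choose_points(2)  # mutates the learner...
    # ...but __setstate__ rolls the learner back when the block exits.
    assert all(x not in learner.data_combined for x in points)
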