adaptive/learner/new_learnerND.py

import abc
import itertools
from collections.abc import Iterable
import math

import numpy as np
import scipy.spatial
import scipy.interpolate

from adaptive.learner.base_learner import BaseLearner
from adaptive.learner.triangulation import simplex_volume_in_embedding
from adaptive.notebook_integration import ensure_holoviews
from adaptive.priority_queue import Queue
from adaptive.domain import Interval, ConvexHull


class LossFunction(metaclass=abc.ABCMeta):
    @abc.abstractproperty
    def n_neighbors(self):
        "The maximum degree of neighboring subdomains required."

    @abc.abstractmethod
    def __call__(self, domain, subdomain, codomain_bounds, data):
        """Return the loss for 'subdomain' given 'data'

        Neighboring subdomains can be obtained with
        'domain.neighbors(subdomain, self.n_neighbors)'.
        """


class DistanceLoss(LossFunction):
    @property
    def n_neighbors(self):
        return 0

    def __call__(self, domain, subdomain, codomain_bounds, data):
        assert isinstance(domain, Interval)
        a, b = subdomain
        ya, yb = data[a], data[b]
        return math.sqrt((b - a) ** 2 + (yb - ya) ** 2)


class EmbeddedVolumeLoss(LossFunction):
    @property
    def n_neighbors(self):
        return 0

    def __call__(self, domain, subdomain, codomain_bounds, data):
        assert isinstance(domain, ConvexHull)
        xs = [tuple(domain.triangulation.vertices[x]) for x in subdomain]
        ys = [data[x] for x in xs]
        if isinstance(ys[0], Iterable):
            pts = [(*x, *y) for x, y in zip(xs, ys)]
        else:
            pts = [(*x, y) for x, y in zip(xs, ys)]
        return simplex_volume_in_embedding(pts)


class TriangleLoss(LossFunction):
    @property
    def n_neighbors(self):
        return 1

    def __call__(self, domain, subdomain, codomain_bounds, data):
        assert isinstance(domain, ConvexHull)
        neighbors = domain.neighbors(subdomain, self.n_neighbors)
        if not neighbors:
            return 0
        neighbor_points = set.union(*(set(n) - set(subdomain) for n in neighbors))

        neighbor_points = [domain.triangulation.vertices[p] for p in neighbor_points]

        simplex = [domain.triangulation.vertices[p] for p in subdomain]

        z = data[simplex[0]]
        if isinstance(z, Iterable):
            s = [(*x, *data[x]) for x in simplex]
            n = [(*x, *data[x]) for x in neighbor_points]
        else:
            s = [(*x, data[x]) for x in simplex]
            n = [(*x, data[x]) for x in neighbor_points]

        return sum(simplex_volume_in_embedding([*s, neigh]) for neigh in n) / len(
            neighbors
        )


class CurvatureLoss(LossFunction):
    def __init__(self, exploration=0.05):
        self.exploration = exploration

    @property
    def n_neighbors(self):
        return 1

    def __call__(self, domain, subdomain, codomain_bounds, data):
        dim = domain.ndim

        loss_input_volume = domain.volume(subdomain)
        triangle_loss = TriangleLoss()

        loss_curvature = triangle_loss(domain, subdomain, codomain_bounds, data)
        return (
            loss_curvature + self.exploration * loss_input_volume ** ((2 + dim) / dim)
        ) ** (1 / (2 + dim))


class LearnerND(BaseLearner):
    """Learns a function 'f: ℝ^N → ℝ^m'.

    Parameters
    ---------
    f : callable
        The function to learn. Must take a tuple of N real parameters and return a real
        number or an arraylike of length M.
    bounds : list of 2-tuples or `scipy.spatial.ConvexHull`
        A list ``[(a_1, b_1), (a_2, b_2), ..., (a_N, b_N)]`` describing a bounding box
        in N dimensions, or a convex hull that defines the boundary of the domain.
    loss : callable, optional
        An instance of a subclass of `LossFunction` that describes the loss
        of a subdomain.
    """

    def __init__(self, f, bounds, loss=None):

        if len(bounds) == 1:
            (a, b), = (boundary_points,) = bounds
            self.domain = Interval(a, b)
            self.loss_function = loss or DistanceLoss()
            self.ndim = 1
        else:
            if isinstance(bounds, scipy.spatial.ConvexHull):
                boundary_points = bounds.points[bounds.vertices]
            else:
                boundary_points = sorted(tuple(p) for p in itertools.product(*bounds))
            self.domain = ConvexHull(boundary_points)
            self.loss_function = loss or EmbeddedVolumeLoss()
            self.ndim = len(boundary_points[0])

        self.boundary_points = boundary_points
        self.data = dict()  # Contains the evaluated data only
        self.pending_points = set()
        self.function = f

        # The loss function may depend on the "scale" (i.e. the difference between
        # the maximum and the minimum) of the function values, in addition to the
        # function values themselves. In order to take into account this "global"
        # information we recompute the losses for all subdomains when the scale
        # changes by more than this factor from the last time we recomputed all
        # the losses.
        self._recompute_losses_factor = 1.1

        # As an optimization we keep a map from subdomain to loss.
        # This is updated in 'self.priority' whenever the loss function is evaluated
        # for a new subdomain. 'self.tell_many' removes subdomains from here when
        # they are split, and also removes neighboring subdomains from here (to force
        # a loss function recomputation).
        self.losses = dict()

        # We must wait until the boundary points have been evaluated before we can
        # set these attributes.
        self._initialized = False
        # The dimension of the output space.
        self.vdim = None
        # The maximum and minimum values of 'f' seen thus far.
        self.codomain_bounds = None
        # The difference between the maximum and minimum of 'f' at the last
        # time all the losses were recomputed.
        self.codomain_scale_at_last_update = None

        # A priority queue of subdomains, which is used to determine where to add
        # points.
        self.queue = Queue()
        for subdomain in self.domain.subdomains():
            self.queue.insert(subdomain, priority=self.priority(subdomain))

    def _finalize_initialization(self):
        assert all(x in self.data for x in self.boundary_points)

        self._initialized = True

        vals = list(self.data.values())
        codomain_min = np.min(vals, axis=0)
        codomain_max = np.max(vals, axis=0)
        self.codomain_bounds = (codomain_min, codomain_max)
        self.codomain_scale_at_last_update = codomain_max - codomain_min

        try:
            self.vdim = len(np.squeeze(self.data[self.boundary_points[0]]))
        except TypeError:  # Trying to take the length of a number
            self.vdim = 1

        # Generate new subdomains using any evaluated points, skipping the boundary
        # points (these are already vertices in the domain) and discarding any points
        # that are outside the domain.
        xs = list(x for x in self.data.keys() if x not in self.boundary_points)
        if xs:
            xs = np.array(xs)
            xs = xs[self.domain.encloses(xs)]
            for x in xs:
                self.domain.split_at(x)

        # Recompute all the losses from scratch
        self.losses = dict()
        self.queue = Queue(
            (subdomain, self.priority(subdomain))
            for subdomain in self.domain.subdomains()
        )

    @property
    def npoints(self):
        return len(self.data)

    def priority(self, subdomain):
        # Compute the loss of 'subdomain'
        if self._initialized:
            if subdomain in self.losses:
                L_0 = self.losses[subdomain]
            else:
                L_0 = self.loss_function(
                    self.domain, subdomain, self.codomain_bounds, self.data
                )
                self.losses[subdomain] = L_0
        else:
            # Before we have all the boundary points we can't calculate losses because we
            # do not have enough data. We just assign the subdomain volume as the loss.
            L_0 = self.domain.volume(subdomain)

        # Scale the subdomain loss by the maximum relative volume of its own subdomains
        # (those formed of pending points within the subdomain). If there are no pending
        # points in the subdomain then the scaling is 1 and the priority is just the loss.
        subvolumes = self.domain.subvolumes(subdomain)
        return (max(subvolumes) / sum(subvolumes)) * L_0

    def ask(self, n, tell_pending=True):
        if self._initialized:
            points, point_priorities = self._ask(n, tell_pending)
        else:
            # Give priority to boundary points, but don't include points that
            # we have data for or have already asked for.
            points = [
                x
                for x in self.boundary_points
                if x not in self.data and x not in self.pending_points
            ]
            # Make sure we don't give more points than asked for
            points = points[:n]
            # Infinite priority so that the boundary points are prioritized
            point_priorities = [math.inf] * len(points)
            if tell_pending:
                for x in points:
                    self.pending_points.add(x)
            n_extra = n - len(points)
            if n_extra > 0:
                extra_points, extra_point_priorities = self._ask(n_extra, tell_pending)
                points += tuple(extra_points)
                point_priorities += tuple(extra_point_priorities)

        return points, point_priorities

    def _ask(self, n, tell_pending):
        new_points = []
        point_priorities = []
        # Insert a point into the subdomain at the front of the queue, and update the
        # priorities of that subdomain and any neighbors (if the point was added on
        # a subdomain boundary).
        for _ in range(n):
            subdomain, _ = self.queue.peek()
            (new_point,), affected_subdomains = self.domain.insert_points(subdomain, 1)
            self.pending_points.add(new_point)
            for subdomain in affected_subdomains:
                self.queue.update(subdomain, priority=self.priority(subdomain))
            new_points.append(new_point)
            # TODO: don't call 'priority' again here: we already called it above, we just
            #       need to identify 'subdomin' within 'affected_subdomains'. Maybe change
            #       the API of 'Domain.insert_points' to not return 'subdomain'...
            point_priorities.append(self.priority(subdomain))

        # Remove all the points we just added and update the priorities of any subdomains
        # we touched.
        if not tell_pending:
            affected_subdomains = set()
            for point in new_points:
                self.pending_points.remove(point)
                sd = self.domain.remove(point)
                affected_subdomains.update(sd)
            for subdomain in affected_subdomains:
                self.queue.update(subdomain, priority=self.priority(subdomain))

        return new_points, point_priorities

    def tell_pending(self, x):
        if x in self.data:
            raise ValueError("Data already present for point {}".format(x))

        self.pending_points.add(x)

        # We cannot 'insert' a boundary point into the domain because it already
        # exists as a vertex. This does not affect the queue ordering.
        if not self._initialized and x in self.boundary_points:
            return

        affected_subdomains = self.domain.insert(x)
        for subdomain in affected_subdomains:
            self.queue.update(subdomain, priority=self.priority(subdomain))

    def tell_many(self, xs, ys):
        # Filter out points that are already present
        if all(x in self.data for x in xs):
            return
        xs, ys = zip(*((x, y) for x, y in zip(xs, ys) if x not in self.data))

        self.data.update(zip(xs, ys))
        self.pending_points -= set(xs)

        if not self._initialized:
            if all(x in self.data for x in self.boundary_points):
                self._finalize_initialization()
            return

        # Filter out any points that are outside the domain. These still appear in
        # 'self.data', but they are not added to the domain, and so have no effect
        # on the learning.
        are_inside = self.domain.encloses(xs)
        if not np.any(are_inside):
            return
        xs, ys = zip(*((x, y) for x, y, inside in zip(xs, ys, are_inside) if inside))

        need_loss_update = self._update_codomain_bounds(ys)

        to_remove = set()
        to_add = set()
        for x in xs:
            old_subdomains, new_subdomains = map(set, self.domain.split_at(x))
            # Subdomains that were added in a prior iteration of this loop,
            # but which have now been removed to make way for others.
            temp_subdomains = to_add.intersection(old_subdomains)
            # We no longer want to add subdomains that have now been removed,
            # and we want to add the new subdomains.
            to_add -= temp_subdomains
            to_add.update(new_subdomains)
            # We do not want to remove subdomains that were produced on a
            # prior iteration of this loop, as these will not be in the queue.
            to_remove.update(old_subdomains - temp_subdomains)

        for subdomain in to_remove:
            self.queue.remove(subdomain)
            del self.losses[subdomain]

        if need_loss_update:
            self.queue = Queue(
                (subdomain, self.priority(subdomain))
                for subdomain in itertools.chain(self.queue.items(), to_add)
            )
        else:
            # Insert the newly created subdomains into the queue.
            for subdomain in to_add:
                self.queue.insert(subdomain, priority=self.priority(subdomain))

            # If the loss function depends on data in neighboring subdomains then
            # we must recompute the priorities of all neighboring subdomains of
            # the subdomains we just added.
            if self.loss_function.n_neighbors > 0:
                subdomains_to_update = set()
                for subdomain in to_add:
                    subdomains_to_update.update(
                        self.domain.neighbors(subdomain, self.loss_function.n_neighbors)
                    )
                subdomains_to_update -= to_add
                for subdomain in subdomains_to_update:
                    # We have more data, so we must force a loss recomputation by
                    # removing the subdomain from the loss cache.
                    del self.losses[subdomain]
                    self.queue.update(subdomain, priority=self.priority(subdomain))

    def _update_codomain_bounds(self, ys):
        # Update the codomain bounds: the minimum and the maximum values that the
        # learner has seen thus far.
        mn, mx = self.codomain_bounds
        if self.vdim == 1:
            mn = min(mn, *ys)
            mx = max(mx, *ys)
        else:
            mn = np.min(np.vstack([mn, ys]), axis=0)
            mx = np.max(np.vstack([mx, ys]), axis=0)
        self.codomain_bounds = (mn, mx)

        scale = mx - mn
        # How much has the scale of the outputs changed since the last time
        # we recomputed the losses?
        if np.any(self.codomain_scale_at_last_update == 0):
            scale_factor = math.inf
        else:
            scale_factor = scale / self.codomain_scale_at_last_update

        # We need to recompute all losses if the scale has increased by more
        # than a certain factor since the last time we recomputed all the losses
        if self.vdim == 1:
            need_loss_update = scale_factor > self._recompute_losses_factor
        else:
            need_loss_update = np.any(scale_factor > self._recompute_losses_factor)

        if need_loss_update:
            self.codomain_scale_at_last_update = scale
            return True
        else:
            return False

    def remove_unfinished(self):
        self.pending_points = set()
        cleared_subdomains = self.domain.clear_subdomains()
        # Subdomains that had points removed need their priority updating
        for subdomain in cleared_subdomains:
            self.queue.update(subdomain, priority=self.priority(subdomain))

    def loss(self, real=True):
        if real:
            if not self.losses:
                return math.inf
            # NOTE: O(N) in the number of subintervals, but with a low prefactor.
            #       We have to do this because the queue is sorted in *priority*
            #       order, and it's possible that a subinterval with a high loss
            #       may have a low priority (if it has many pending points).
            return max(self.losses.values())
        else:
            # The 'not real' loss (which takes pending points into account) is
            # just the priority in the subdomain queue.
            _, priority = self.queue.peek()
            return priority

    def plot(self, **kwargs):
        if isinstance(self.domain, Interval):
            return self._plot_1d(**kwargs)
        elif isinstance(self.domain, ConvexHull):
            return self._plot_nd(**kwargs)

    def _plot_nd(self, n=None, tri_alpha=0):
        # XXX: Copied from LearnerND. At the moment we reach deep into internal
        #      datastructures of self.domain. We should see what data we need and
        #      add APIs to 'Domain' to support this.
        hv = ensure_holoviews()
        if self.vdim > 1:
            raise NotImplementedError(
                "holoviews currently does not support", "3D surface plots in bokeh."
            )
        if self.ndim != 2:
            raise NotImplementedError(
                "Only 2D plots are implemented: You can "
                "plot a 2D slice with 'plot_slice'."
            )
        x, y = self.domain.bounding_box
        lbrt = x[0], y[0], x[1], y[1]

        if len(self.data) >= 4:
            if n is None:
                # Calculate how many grid points are needed.
                # factor from A=√3/4 * a² (equilateral triangle)
                scale_factor = 1  # np.product(np.diag(self._transform))
                min_volume = min(map(self.domain.volume, self.domain.subdomains()))
                a_sq = np.sqrt(scale_factor * min_volume)
                n = max(10, int(0.658 / a_sq))

            xs = ys = np.linspace(0, 1, n)
            xs = xs * (x[1] - x[0]) + x[0]
            ys = ys * (y[1] - y[0]) + y[0]
            keys = np.array(list(self.data.keys()))
            values = np.array(list(self.data.values()))
            interpolator = scipy.interpolate.LinearNDInterpolator(keys, values)
            z = interpolator(xs[:, None], ys[None, :]).squeeze()

            im = hv.Image(np.rot90(z), bounds=lbrt)

            if tri_alpha:
                points = np.array(
                    [
                        [self.domain.triangulation.vertices[i] for i in s]
                        for s in self.domain.subdomains()
                    ]
                )
                points = np.pad(
                    points[:, [0, 1, 2, 0], :],
                    pad_width=((0, 0), (0, 1), (0, 0)),
                    mode="constant",
                    constant_values=np.nan,
                ).reshape(-1, 2)
                tris = hv.EdgePaths([points])
            else:
                tris = hv.EdgePaths([])
        else:
            im = hv.Image([], bounds=lbrt)
            tris = hv.EdgePaths([])

        im_opts = dict(cmap="viridis")
        tri_opts = dict(line_width=0.5, alpha=tri_alpha)
        no_hover = dict(plot=dict(inspection_policy=None, tools=[]))

        return im.opts(style=im_opts) * tris.opts(style=tri_opts, **no_hover)

    def _plot_1d(self):
        assert isinstance(self.domain, Interval)
        hv = ensure_holoviews()

        xs, ys = zip(*sorted(self.data.items())) if self.data else ([], [])
        if self.vdim == 1:
            p = hv.Path([]) * hv.Scatter((xs, ys))
        else:
            p = hv.Path((xs, ys)) * hv.Scatter([])

        # Plot with 5% empty margins such that the boundary points are visible
        a, b = self.domain.bounds
        margin = 0.05 * (b - a)
        plot_bounds = (a - margin, b + margin)

        return p.redim(x=dict(range=plot_bounds))

    def _get_data(self):
        return self.data

    def _set_data(self, data):
        if data:
            self.tell_many(*zip(*data.items()))