Source code for spatula.optimize

# Copyright (c) 2021-2026 The Regents of the University of Michigan
# Part of spatula, released under the BSD 3-Clause License.

"""Classes to optimize over SO(3) for `spatula.PGOP`."""

from importlib.resources import as_file, files

import numpy as np
import scipy as sp
from scipy.spatial.transform import Rotation

from . import _spatula_nb

"""The Golden ratio, 1.61803398875..."""
GOLDEN_RATIO = (1 + np.sqrt(5)) / 2


"""The angle that divides 2π radians into the golden ratio.
This takes the longer of the two segments π(√5 - 1), where π[(√5 - 1) + (3-√5)] = 2π
"""
GOLDEN_ANGLE = np.pi * (np.sqrt(5) - 1)


def _spherical_fibonacci_lattice(n):
    """Generate a Fibonacci lattice of `n` points on the 2-sphere.

    n : `int`
        n (int): The number of points in the lattice.
    """
    t = np.arange(n)

    z = 1 - (t / (n - 1)) * 2
    radius = np.sqrt(1 - z**2)
    theta = (GOLDEN_ANGLE * t) % (2 * np.pi)

    x = np.cos(theta) * radius
    y = np.sin(theta) * radius

    return np.column_stack([x, y, z]).T


def _quaternion_fibonacci_lattice(n):
    """Generate a near-uniform grid of `n` quaternions.

    This is equivalent to a Fibonacci lattice on the 3-sphere. See
    `this paper <https://ieeexplore.ieee.org/document/9878746>`_ for a derivation.
    """
    psi = 1.533751168755204288118041413  # Solution to ψ**4 = ψ + 4
    s = np.arange(n) + 1 / 2
    t = s / n
    d = 2 * np.pi * s
    r0, r1 = (np.sqrt(t), np.sqrt(1 - t))
    α, β = (d / np.sqrt(2), d / psi)

    # Allocate as rows and then transpose, rather than stacking columns
    result = np.empty((4, n))
    result[...] = r0 * np.sin(α), r0 * np.cos(α), r1 * np.sin(β), r1 * np.cos(β)
    return result.T


# Only here for typing/documentation purposes.

[docs]
class Optimizer:
    """Base class for optimizers."""




[docs]
class RandomSearch(Optimizer):
    """Optimize by testing :math:`N` random rotations."""


[docs]
    def __init__(self, max_iter=150, seed=42):
        """Create a RandomSearch optimizer.

        Parameters
        ----------
        max_iter : `int`, optional
            The number of rotations to try. Defaults to 150.
        seed : `int`, optional
            The random number seed to use for generating random rotations.
            Defaults to 42.

        """
        self._cpp = _spatula_nb.RandomSearch(max_iter, seed)





[docs]
class StepGradientDescent(Optimizer):
    r"""Optimize by rounds of 3 1D gradient descents.

    The optimization uses a 3-vector, :math:`\nu` to represent rotations in
    :math:`SO(3)`. The conversion to the axis-angle representation for
    :math:`\nu` is

    .. math::

        \alpha = \frac{\nu}{||\nu||} \\
        \theta = ||\nu||.

    The representation is continuous in :math:`SO(3)`. `StepGradientDescent`
    performs potentially multiple rounds of 3 1-dimensional gradient descents,
    one for each dimension to find the local minimum. Each smaller optimization
    is terminated when the improvement in objective is less than the provided
    tolerance. The entire optimization ends when between rounds of optimization
    the decrease in objective is less than the provided tolerance.
    """


[docs]
    def __init__(
        self,
        initial_point=(1.0, 0.0, 0.0, 0.0),
        max_iter=150,
        initial_jump=0.001,
        learning_rate=0.05,
        tol=1e-6,
    ):
        """Create a `StepGradientDescent` object.

        Parameters
        ----------
        optimizer : Optimizer
            The initial optimizer. The best/final point of this optimizer will
            be sent to the `StepGradientDescent` as the initial point.
        initial_point : :math:`(4,)` numpy.ndarray of float, optional
            The initial point to start the optimization. Defaults to the
            identity quaternion.
        max_iter : `int`, optional
            The maximum number of iterations before stopping optimization.
            Defaults to 150.
        initial_jump : `float`, optional
            The size of the initial jump in each dimension to get an initial
            gradient. Defaults to 0.001.
        learning_rate : `float`, optional
            The degree to move along the gradient. Higher values lead to larger
            moves and can result in quicker convergence or failure to converge.
            Defaults to 0.05.
        tol : `float`, optional
            The value that when the reduction in the object is less than the
            current optimization stops. The entire optimization stops when the
            objective from the last round of 1 dimensional optimizations is
            below ``tol``. Defaults to 1e-6.

        """
        self._cpp = _spatula_nb.StepGradientDescent(
            tuple(initial_point),
            max_iter,
            initial_jump,
            learning_rate,
            tol,
        )




def _load_sphere_codes():
    """Load and return the stored numerical solutions to the Tammes problem.

    The file stores the solutions of the Tammes problem up to 249 points.

    Returns
    -------
    sphere_codes : list[numpy.ndarray]
        The list of sphere codes from 1 to 249 points.

    """
    res = files(__package__) / "sphere-codes.npz"
    with as_file(res) as fn, np.load(str(fn)) as data:
        return list(data.values())



[docs]
class Mesh(Optimizer):
    """Optimize by testing provided rotations."""

    _sphere_codes = _load_sphere_codes()


[docs]
    def __init__(self, points):
        """Create a Mesh optimizer.

        Parameters
        ----------
        points : :math:`(N, 4)` numpy.ndarray of float
            The rotaional quaternions to test.

        """
        self._cpp = _spatula_nb.Mesh(np.asarray(points, dtype=np.float32, order="C"))



[docs]
    @classmethod
    def from_grid(cls, n_axes=75, n_angles=10):
        r"""Create a Mesh optimizer that tests rotations on a uniform grid.

        The axes are chosen by the numerical solutions to the Tammes problem and
        angles by equadistant rotations according to the Haar measure.

        Parameters
        ----------
        n_axes : `int`, optional
            The number of axes to rotate about. Defaults to 75.
        n_angles : `int`, optional
            The number of angles to rotate per axes. Defaults to 10.

        Returns
        -------
        mesh : Mesh
            The optimizer which will test :math:`N_{axes} \cdot N_{angles}`
            points.

        """
        if n_axes < 1 or n_axes > 250:
            raise ValueError("Can only chose [1, 250] for n_axes.")
        axes = cls._sphere_codes[n_axes - 1].reshape((-1, 1, 3))
        points = np.empty((n_angles * n_axes + 1, 4), dtype=float)
        points[0] = np.array([1.0, 0.0, 0.0, 0.0])
        angles = cls._sample_angles(n_angles).reshape((1, -1, 1))
        # Flatten axes and angles for creating the rotation objects
        axes = axes.repeat(n_angles, axis=1).reshape(-1, 3)
        angles = angles.repeat(n_axes, axis=0).reshape(-1)
        # Generate quaternions from axis-angle
        quaternions = Rotation.from_rotvec(axes * angles[:, None]).as_quat()
        quaternions = quaternions.reshape((n_axes * n_angles, 4))
        points[1:] = np.hstack((quaternions[:, -1].reshape(-1, 1), quaternions[:, :-1]))
        return cls(points)



[docs]
    @classmethod
    def from_lattice(cls, n_rotations=150):
        r"""Create a Mesh optimizer that tests rotations on a Fibonacci lattice.

        The lattice provides a mostly-uniform covering of the 3-sphere. Refer to
        `this paper <https://ieeexplore.ieee.org/document/9878746>`_ for a derivation.
        Although the quaternions generated by this method are slightly less uniform than
        those from ``~.from_grid``, an arbitrary number of rotations can be
        generated by this approach.

        Parameters
        ----------
        n_rotations : `int`, optional
            The number of rotation in the lattice. Defaults to 75.

        Returns
        -------
        mesh : Mesh
            The optimizer which will test :math:`N_{rotations}` samples.

        """
        return cls(_quaternion_fibonacci_lattice(n_rotations))


    @staticmethod
    def _sample_angles(n_angles):
        """Find n equally spaced angle rotations w.r.t. the Haar measure."""

        def cdf(theta, root):
            ipi = 1 / np.pi
            sinx = np.sin(theta)
            return (
                ipi * (theta - sinx) - root,
                ipi * (1 - np.cos(theta)),
                ipi * sinx,
            )

        roots = np.linspace(0, 1, n_angles + 1)[1:]
        angles = []
        for r in roots:
            opt = sp.optimize.root_scalar(
                cdf,
                args=(r,),
                method="halley",
                bracket=[0, np.pi],
                x0=r * np.pi,
                fprime=True,
                fprime2=True,
            )
            angles.append(opt.root)
        return np.array(angles)




[docs]
class Union(Optimizer):
    """Combine an optimization scheme with a specific secondary optimizer.

    The union optimizer uses the best point from the first optimization to start
    the second optimizer.
    """


[docs]
    @classmethod
    def with_step_gradient_descent(
        cls,
        optimizer,
        max_iter=150,
        initial_jump=0.001,
        learning_rate=0.055,
        tol=1e-6,
    ):
        """Create a Union optimizer with a `StepGradientDescent` second step.

        Arguments are passed through to the constructor of
        `StepGradientDescent`.

        Parameters
        ----------
        optimizer : Optimizer
            The initial optimizer. The best/final point of this optimizer will
            be sent to the `StepGradientDescent` as the initial point.
        max_iter : `int`, optional
            The maximum number of iterations before stopping optimization.
            Defaults to 150.
        initial_jump : `float`, optional
            The size of the initial jump in each dimension to get an initial
            gradient. Defaults to 0.001.
        learning_rate : `float`, optional
            The degree to move along the gradient. Higher values lead to larger
            moves and can result in quicker convergence or failure to converge.
            Defaults to 0.05.
        tol : `float`, optional
            The value that when the reduction in the object is less than the
            current optimization stops. The entire optimization stops when the
            objective from the last round of 1 dimensional optimizations is
            below ``tol``. Defaults to 1e-6.

        """
        instance = cls()
        instance._cpp = _spatula_nb.Union.with_step_gradient_descent(
            optimizer._cpp, max_iter, initial_jump, learning_rate, tol
        )
        return instance





[docs]
class NoOptimization(Optimizer):
    """Evaluate at one fixed orientation with no optimization loop.

    Instead of searching over rotations, this optimizer evaluates the objective
    exactly once at the provided orientation. For PGOP and BOOSOP this is
    equivalent to rotating each neighborhood by the same fixed quaternion and
    then computing the order parameter.
    """


[docs]
    def __init__(self, orientation=(1.0, 0.0, 0.0, 0.0)):
        """Create a NoOptimization object.

        Parameters
        ----------
        orientation : tuple[float, float, float, float], optional
            The fixed orientation quaternion in ``[w, x, y, z]`` convention
            (note SciPy uses ``[x, y, z, w]``). The quaternion is normalized
            internally before use.

            This sets the single rotation used for evaluation. Example:
            ``NoOptimization(orientation=q)`` on an unrotated neighborhood gives
            the same result as ``NoOptimization()`` on a neighborhood rotated by
            ``q``.

            Defaults to the identity quaternion ``(1, 0, 0, 0)``, which means
            no additional rotation is applied.

        """
        orientation = np.asarray(orientation, dtype=np.float64)
        if orientation.shape != (4,):
            raise ValueError(
                "orientation must contain exactly 4 values in [w, x, y, z]."
            )
        norm = np.linalg.norm(orientation)
        if norm == 0:
            raise ValueError("orientation quaternion cannot be zero.")
        orientation /= norm
        self._orientation = tuple(orientation)
        self._cpp = _spatula_nb.NoOptimization(self._orientation)


    @property
    def orientation(self):
        """tuple[float, float, float, float]: Normalized fixed quaternion.

        Returned in ``[w, x, y, z]`` convention.
        """
        return self._orientation