# Source code for IMLCV.base.CV

from __future__ import annotations

import dataclasses
from abc import abstractmethod
from collections.abc import Callable
from functools import partial

import distrax
import jax.flatten_util
import jax.lax
import jax.numpy as jnp
import jax.scipy.optimize
import jax_dataclasses as jdc
import jaxopt.objective
import numpy as np
from flax import linen as nn
from jax import Array
from jax import jacfwd
from jax import jacrev
from jax import jit
from jax import vmap
from molmod.units import angstrom
from netket.jax import vmap_chunked
from ott.geometry.pointcloud import PointCloud
from ott.problems.linear import linear_problem
from ott.solvers.linear import sinkhorn

######################################
#        Data types                  #
######################################


@jdc.pytree_dataclass
[docs]class SystemParams:
[docs]    coordinates: Array
[docs]    cell: Array | None = None

[docs]    def __post_init__(self):
        if isinstance(self.coordinates, Array):
            self.__dict__["coordinates"] = jnp.array(self.coordinates)
        if isinstance(self.cell, Array):
            self.__dict__["cell"] = jnp.array(self.cell)

[docs]    def __getitem__(self, slices) -> SystemParams:
        return SystemParams(
            coordinates=self.coordinates[slices],
            cell=(self.cell[slices] if self.cell is not None else None),
        )

[docs]    def __iter__(self):
        if not self.batched:
            yield self
            return
        for i in range(self.coordinates.shape[0]):
            yield SystemParams(
                coordinates=self.coordinates[i, :, :],
                cell=self.cell[i, :, :] if self.cell is not None else None,
            )
        return

    @property
[docs]    def batched(self):
        return len(self.coordinates.shape) == 3

    @property
[docs]    def shape(self):
        return self.coordinates.shape

[docs]    def __add__(self, other):
        assert isinstance(other, SystemParams)
        if self.cell is None:
            assert other.cell is None

        s = self.batch()
        o = other.batch()

        assert s.shape[1:] == o.shape[1:]

        return SystemParams(
            coordinates=jnp.vstack([s.coordinates, o.coordinates]),
            cell=None if self.cell is None else jnp.vstack([s.cell, o.cell]),
        )

[docs]    def __str__(self):
        string = f"coordinates shape: \n{self.coordinates.shape}"
        if self.cell is not None:
            string += f"\n cell [Angstrom]:\n{self.cell/angstrom }"

        return string

[docs]    def batch(self) -> SystemParams:
        if self.batched:
            return self

        return SystemParams(
            coordinates=jnp.array([self.coordinates]),
            cell=self.cell if self.cell is None else jnp.array([self.cell]),
        )

[docs]    def unbatch(self) -> SystemParams:
        if not self.batched:
            return self
        assert self.shape[0] == 1
        return SystemParams(
            coordinates=self.coordinates[0, :],
            cell=self.cell if self.cell is None else self.cell[0, :],
        )

[docs]    def angles(self, deg=True) -> Array:
        @partial(vmap, in_axes=(None, 0))
        @partial(vmap, in_axes=(0, None))
        def ang(x1, x2):
            a = jnp.arccos(jnp.dot(x1, x2) / (jnp.dot(x1, x1) * jnp.dot(x2, x2)) ** 0.5)
            if deg:
                a *= 180 / jnp.pi
            return a

        return ang(self.cell, self.cell)

[docs]    def _get_neighbour_list(
        self,
        r_cut,
        r_skin: float = 0.0,
        z_array: tuple[int] | None = None,
        z_unique: tuple[int] | None = None,
        num_z_unique: tuple[int] | None = None,
        num_neighs: int | None = None,
        nxyz: tuple[int] | None = None,
    ) -> tuple[bool, NeighbourList | None]:
        """Build a neighbour list around every atom of the canonicalized system.

        For each atom taken as centre, the distances to all atoms (and, with a
        cell, to all their periodic images within ``nxyz`` repetitions) are
        computed and sorted; the ``num_neighs`` closest entries are stored.

        Args:
            r_cut: cutoff radius. ``None`` short-circuits to ``(False, None)``.
            r_skin: extra margin added to ``r_cut`` when sizing the list.
            z_array, z_unique, num_z_unique: passed through unchanged to the
                returned ``NeighbourList``.
            num_neighs: number of neighbours to keep per atom. When ``None`` it is
                computed as the largest neighbour count within ``r_cut + r_skin``.
            nxyz: number of periodic images per cell direction. When ``None`` it
                is derived from the cell and ``r_cut + r_skin``.

        Returns:
            ``(b, neighbour_list)``. ``b`` starts as ``True`` and is and-ed with
            the checks that a supplied ``nxyz`` / ``num_neighs`` is large enough.
        """
        if r_cut is None:
            return False, None

        sp, op_cell, op_coor = self.canoncialize()

        b = True

        def _get_num_per_images(cell, r_cut):
            # Number of periodic images needed along each cell vector to cover r_cut.
            if cell is None or r_cut is None:
                return None

            # orthogonal distance for number of blocks
            v1, v2, v3 = cell[0, :], cell[1, :], cell[2, :]

            # sorted from short to long
            # orthonormal frame (e1, e2, e3) built from v3 and v2
            e3 = v3 / jnp.linalg.norm(v3)
            e1 = jnp.cross(v2, e3)
            e1 /= jnp.linalg.norm(e1)
            e2 = jnp.cross(e3, e1)

            # proj[a, b] = dot(e_b, v_a): cell vectors expressed in the frame above
            proj = vmap(vmap(jnp.dot, in_axes=(0, None)), in_axes=(None, 0))(
                jnp.array([e1, e2, e3]),
                jnp.array([v1, v2, v3]),
            )

            bounds = jnp.ceil(jnp.sum(jnp.abs(jnp.linalg.inv(proj)) * r_cut, axis=1))

            return bounds

        # cannot be jitted
        if sp.cell is not None:
            if nxyz is None:
                # derive the image counts (converted to Python ints) from the cell
                if sp.batched:
                    nxyz = [
                        int(i)
                        for i in jnp.max(
                            vmap(
                                lambda sp: _get_num_per_images(sp.cell, r_cut + r_skin),
                            )(sp),
                            axis=0,
                        ).tolist()
                    ]
                else:
                    nxyz = [int(i) for i in _get_num_per_images(sp.cell, r_cut + r_skin).tolist()]
            else:
                # NOTE(review): this branch indexes sp.cell as a single 3x3 cell;
                # confirm it is only reached with an unbatched sp.
                b = (
                    b and (_get_num_per_images(sp.cell, r_cut) <= jnp.array(nxyz)).all()
                )  # only check r_cut, because we are retracing
            nx, ny, nz = nxyz
            # image offsets -n..n along each cell vector
            bx = jnp.arange(-nx, nx + 1)
            by = jnp.arange(-ny, ny + 1)
            bz = jnp.arange(-nz, nz + 1)
        else:
            bx, by, bz = None, None, None

        # per-neighbour payload with image indices (periodic case)
        @jax.jit
        def func(r_ij, index, i, j, k):
            return (
                jnp.linalg.norm(r_ij),
                jnp.array(index),
                jnp.array([i, j, k]),
            )

        # per-neighbour payload without image indices (no cell)
        @jax.jit
        def func2(r_ij, index, i, j, k):
            return (
                jnp.linalg.norm(r_ij),
                jnp.array(index),
                None,
            )

        def _apply_g_inner(
            sp: SystemParams,
            func,
            r_cut,
            ijk=(None, None, None),
            exclude_self=True,
        ):
            # Evaluate `func` on every atom of `sp` (shifted by image ijk) and
            # zero the entries that fall outside r_cut.
            i, j, k = ijk

            if ijk != (None, None, None):
                assert sp.cell is not None
                pos = sp.coordinates + i * sp.cell[0, :] + j * sp.cell[1, :] + k * sp.cell[2, :]
            else:
                pos = sp.coordinates

            norm2 = jnp.sum(pos**2, axis=1)
            # 0, 1, 2, ... atom indices, built with a cumulative sum
            index_j = jnp.ones_like(norm2, dtype=jnp.int32).cumsum() - 1

            bools = norm2 < r_cut**2

            if exclude_self:
                # drop positions that coincide with the origin (the centre itself)
                bools = jnp.logical_and(
                    bools,
                    jnp.logical_not(
                        vmap(jnp.allclose, in_axes=(0, None))(pos, jnp.zeros((3,))),
                    ),
                )

            true_val = vmap(func, in_axes=(0, 0, None, None, None))(
                pos,
                index_j,
                i,
                j,
                k,
            )
            false_val = jax.tree_map(
                jnp.zeros_like,
                true_val,
            )

            # select func's output where the mask holds, zeros elsewhere
            val = vmap(
                lambda b, x, y: jax.tree_map(
                    lambda t, f: jnp.where(b, t, f),
                    x,
                    y,
                ),
            )(
                bools,
                true_val,
                false_val,
            )

            return bools, val

        @partial(vmap, in_axes=(None, 0))
        def res(sp, center_coordinates):
            # Sorted distances / indices of all atoms relative to one centre.
            if center_coordinates is not None:
                sp_center = SystemParams(sp.coordinates - center_coordinates, sp.cell)
            else:
                sp_center = SystemParams(sp.coordinates, sp.cell)

            sp_center, center_op = sp_center.wrap_positions(min=True)

            if sp_center.cell is None:
                # r_cut=inf keeps every atom; the cutoff is applied after sorting
                _, (r, atoms, _) = _apply_g_inner(
                    sp=sp_center,
                    func=func2,
                    r_cut=jnp.inf,
                    exclude_self=False,
                )

                idx = jnp.argsort(r)

                return r[idx] < r_cut + r_skin, r[idx], atoms[idx], None, center_op

            # periodic case: evaluate for every image offset (i, j, k)
            _, (r, atoms, indices) = vmap(
                vmap(
                    vmap(
                        lambda i, j, k: _apply_g_inner(
                            sp=sp_center,
                            func=func,
                            r_cut=jnp.inf,
                            ijk=(i, j, k),
                            exclude_self=False,
                        ),
                        in_axes=(0, None, None),
                        out_axes=0,
                    ),
                    in_axes=(None, 0, None),
                    out_axes=1,
                ),
                in_axes=(None, None, 0),
                out_axes=2,
            )(bx, by, bz)

            # flatten the image and atom axes before sorting by distance
            r, atoms, indices = (
                jnp.reshape(r, (-1,)),
                jnp.reshape(atoms, (-1)),
                jnp.reshape(indices, (-1, 3)),
            )
            idx = jnp.argsort(r)

            return (
                r[idx] < r_cut + r_skin,
                r[idx],
                atoms[idx],
                indices[idx, :],
                center_op,
            )

        @jax.jit
        def _f(sp):
            # every atom of sp is used as a centre
            bools, r, a, ijk, co = res(sp, sp.coordinates)
            # largest number of neighbours within r_cut + r_skin over all centres
            num_neighs = jnp.max(jnp.sum(bools, axis=1))

            return num_neighs, bools, r, a, ijk, co

        @partial(jit, static_argnums=0)
        def take(num_neighs, r, a, ijk):
            # keep the num_neighs closest entries (arrays are sorted by distance)
            r, a = (
                r[:, 0:num_neighs],
                a[:, 0:num_neighs],
            )
            if ijk is not None:
                ijk = ijk[:, 0:num_neighs]
            return r, a, ijk

        if sp.batched:
            _f = vmap(_f)
            take = vmap(take, in_axes=(None, 0, 0, 0))

        # NOTE: the local name `nn` shadows the module-level `flax.linen as nn`
        # import for the remainder of this method.
        nn, _, r, a, ijk, co = _f(sp)

        if sp.batched:
            nn = jnp.max(nn)  # type: ignore

        if num_neighs is None:
            num_neighs = int(nn)
        else:
            # a caller-supplied size must be able to hold all neighbours found
            b = jnp.logical_and(b, nn <= num_neighs)

        r, a, ijk = take(num_neighs, r, a, ijk)

        # r_rec = jnp.linalg.norm(_pos(self, ijk, a, op_cell, op_coor,co), axis=-1)
        # assert jnp.mean(jnp.abs(r_rec - r)) < 1e-6

        return (
            b,
            NeighbourList(
                r_cut=r_cut,
                r_skin=r_skin,
                atom_indices=a,
                ijk_indices=ijk,
                z_array=z_array,
                z_unique=z_unique,
                num_z_unique=num_z_unique,
                sp_orig=self,
                nxyz=nxyz,
                op_cell=op_cell,
                op_coor=op_coor,
                op_center=co,
            ),
        )

[docs]    def get_neighbour_list(
        self,
        r_cut,
        z_array: list[int] | Array,
        r_skin=0.0,
    ) -> NeighbourList | None:
        def to_tuple(a):
            if a is None:
                return None
            return tuple([int(ai) for ai in a])

        zu = jnp.unique(jnp.array(z_array)) if z_array is not None else None
        nzu = vmap(lambda zu: jnp.sum(jnp.array(z_array) == zu))(zu) if zu is not None else None

        b, nl = self._get_neighbour_list(
            r_cut=r_cut,
            r_skin=r_skin,
            z_array=to_tuple(z_array),
            z_unique=to_tuple(zu),
            num_z_unique=to_tuple(nzu),
        )
        return nl

    @jax.jit
[docs]    def minkowski_reduce(self) -> tuple[SystemParams, Array]:
        """Minkowski-reduce the cell, based on code from ASE:
        https://wiki.fysik.dtu.dk/ase/_modules/ase/geometry/minkowski_reduction.html#minkowski_reduce

        Returns:
            ``(sp, op)`` where ``sp`` has the reduced cell and the unchanged
            coordinates, and ``op`` is the integer transformation applied to the
            cell. Without a cell, ``self`` and a 3x3 identity are returned. For a
            batched instance the reduction is mapped over the batch axis.
        """
        if self.cell is None:
            return self, jnp.eye(3)

        import itertools

        TOL = 1e-12

        @partial(jit, static_argnums=(0,))
        def cycle_checker(d):
            # Zero-initialised history buffer of visited (flattened) basis matrices.
            assert d in [2, 3]
            max_cycle_length = {2: 60, 3: 3960}[d]
            return jnp.zeros((max_cycle_length, 3 * d), dtype=int)

        @jax.jit
        def add_site(visited, H):
            # flatten array for simplicity
            H = H.ravel()

            # check if site exists
            found = (visited == H).all(axis=1).any()

            # shift all visited sites down and place current site at the top
            visited = jnp.roll(visited, 1, axis=0)
            visited = visited.at[0].set(H)
            return visited, found

        @jax.jit
        def reduction_gauss(B, hu, hv):
            """Calculate a Gauss-reduced lattice basis (2D reduction)."""
            visited = cycle_checker(2)
            u = hu @ B
            v = hv @ B

            def body(vals):
                u, v, hu, hv, visited, found, i = vals

                # subtract the rounded projection of v on u, then swap the roles
                x = jnp.array(jnp.round(jnp.dot(u, v) / jnp.dot(u, u)), dtype=jnp.int32)
                hu, hv = hv - x * hu, hu
                u = hu @ B
                v = hv @ B
                site = jnp.array([hu, hv])

                visited, found = add_site(visited=visited, H=site)

                return (u, v, hu, hv, visited, found, i + 1)

            def cond_fun(vals):
                u, v, hu, hv, visited, found, i = vals

                # always run at least once (i == 0); afterwards stop as soon as
                # |u| >= |v| or the current basis was already visited
                return jnp.logical_not(
                    jnp.logical_and(
                        jnp.logical_or(jnp.dot(u, u) >= jnp.dot(v, v), found),
                        i != 0,
                    ),
                )

            u, v, hu, hv, visited, found, i = jax.lax.while_loop(
                cond_fun=cond_fun,
                body_fun=body,
                init_val=(u, v, hu, hv, visited, False, 0),
            )

            return hv, hu

        @jax.jit
        def relevant_vectors_2D(u, v):
            # all integer combinations with coefficients in {-1, 0, 1}; keep the
            # 7 shortest together with their coefficients
            cs = jnp.array(list(itertools.product([-1, 0, 1], repeat=2)))
            vs = cs @ jnp.array([u, v])
            indices = jnp.argsort(jnp.linalg.norm(vs, axis=1))[:7]
            return vs[indices], cs[indices]

        @jax.jit
        def closest_vector(t0, u, v):
            # Integer coefficients `a` such that t0 + a[0]*u + a[1]*v is iteratively
            # shortened using the relevant vectors of the (u, v) lattice.
            t = t0
            a = jnp.zeros(2, dtype=int)
            rs, cs = relevant_vectors_2D(u, v)

            dprev = float("inf")
            ds = jnp.linalg.norm(rs + t, axis=1)
            index = jnp.argmin(ds)

            def body_fun(vals):
                ds, index, a, _, t, i = vals

                dprev = ds[index]

                r = rs[index]
                kopt = jnp.array(
                    jnp.round(-jnp.dot(t, r) / jnp.dot(r, r)),
                    dtype=jnp.int32,
                )
                a += kopt * cs[index]
                t = t0 + a[0] * u + a[1] * v

                ds = jnp.linalg.norm(rs + t, axis=1)
                index = jnp.argmin(ds)

                return ds, index, a, dprev, t, i + 1

            def cond_fun(vals):
                ds, index, a, dprev, t, i = vals

                # stop when the best candidate is entry 0 or no longer improves
                return jnp.logical_not(jnp.logical_or(index == 0, ds[index] >= dprev))

            ds, index, a, dprev, t, i = jax.lax.while_loop(
                cond_fun=cond_fun,
                body_fun=body_fun,
                init_val=(ds, index, a, dprev, t0, 0),
            )

            return a

        @jax.jit
        def reduction_full(B):
            """Calculate a Minkowski-reduced lattice basis (3D reduction)."""
            # init
            visited = cycle_checker(d=3)
            H = jnp.eye(3, dtype=int)
            norms = jnp.linalg.norm(B, axis=1)

            def body(vals):
                H, norms, visited, _, i = vals
                # for it in range(MAX_IT):
                # Sort vectors by norm
                H = H[jnp.argsort(norms)]

                # Gauss-reduce smallest two vectors
                hw = H[2]
                hu, hv = reduction_gauss(B, H[0], H[1])
                H = jnp.array([hu, hv, hw])
                R = H @ B

                # Orthogonalize vectors using Gram-Schmidt
                u, v, _ = R
                X = u / jnp.linalg.norm(u)
                Y = v - X * jnp.dot(v, X)
                Y /= jnp.linalg.norm(Y)

                # Find closest vector to last element of R
                pu, pv, pw = R @ jnp.array([X, Y]).T
                nb = closest_vector(pw, pu, pv)

                # Update basis
                H = H.at[2].set(jnp.array([nb[0], nb[1], 1]) @ H)
                R = H @ B

                norms = jnp.linalg.norm(R, axis=1)

                visited, found = add_site(visited, H)

                return H, norms, visited, found, i + 1

            def cond_fun(vals):
                _, norms, _, found, i = vals

                # always run at least once; afterwards stop when the third vector
                # is not shorter than the second or the basis was already visited
                return jnp.logical_not(
                    jnp.logical_and(
                        jnp.logical_or(
                            norms[2] >= norms[1],
                            found,
                        ),
                        i != 0,
                    ),
                )

            H, norms, visited, found, i = jax.lax.while_loop(
                cond_fun,
                body,
                (H, norms, visited, False, 0),
            )

            return H @ B, H

        @jax.jit
        def is_minkowski_reduced(cell):
            """Tests if a cell is Minkowski-reduced.

            Parameters:

            cell: array
                The lattice basis to test (in row-vector format).

            Returns:

            is_reduced: bool
                True if cell is Minkowski-reduced (within ``TOL``), False otherwise.
            """

            """These conditions are due to Minkowski, but a nice description in English
            can be found in the thesis of Carine Jaber: "Algorithmic approaches to
            Siegel's fundamental domain", https://www.theses.fr/2017UBFCK006.pdf
            This is also good background reading for Minkowski reduction.

            0D and 1D cells are trivially reduced. For 2D cells, the conditions which
            an already-reduced basis fulfil are:
            |b1| ≤ |b2|
            |b2| ≤ |b1 - b2|
            |b2| ≤ |b1 + b2|

            For 3D cells, the conditions which an already-reduced basis fulfil are:
            |b1| ≤ |b2| ≤ |b3|

            |b1 + b2|      ≥ |b2|
            |b1 + b3|      ≥ |b3|
            |b2 + b3|      ≥ |b3|
            |b1 - b2|      ≥ |b2|
            |b1 - b3|      ≥ |b3|
            |b2 - b3|      ≥ |b3|
            |b1 + b2 + b3| ≥ |b3|
            |b1 - b2 + b3| ≥ |b3|
            |b1 + b2 - b3| ≥ |b3|
            |b1 - b2 - b3| ≥ |b3|
            """

            # each row of A is an integer combination whose norm (lhs) is compared
            # with the norm of the cell vector selected by the matching rhs index
            A = jnp.array(
                [
                    [0, 1, 0],
                    [0, 0, 1],
                    [1, 1, 0],
                    [1, 0, 1],
                    [0, 1, 1],
                    [1, -1, 0],
                    [1, 0, -1],
                    [0, 1, -1],
                    [1, 1, 1],
                    [1, -1, 1],
                    [1, 1, -1],
                    [1, -1, -1],
                ],
            )
            lhs = jnp.linalg.norm(A @ cell, axis=1)
            norms = jnp.linalg.norm(cell, axis=1)
            rhs = norms[jnp.array([0, 1, 1, 2, 2, 1, 2, 2, 2, 2, 2, 2])]

            return (lhs >= rhs - TOL).all()

        @jax.jit
        def minkowski_reduce(cell):
            """Calculate a Minkowski-reduced lattice basis.  The reduced basis
            has the shortest possible vector lengths and has
            norm(a) <= norm(b) <= norm(c).

            Implements the method described in:

            Low-dimensional Lattice Basis Reduction Revisited
            Nguyen, Phong Q. and Stehlé, Damien,
            ACM Trans. Algorithms 5(4) 46:1--46:48, 2009
            :doi:`10.1145/1597036.1597050`

            Parameters:

            cell: array
                The lattice basis to reduce (in row-vector format).

            Returns:

            rcell: array
                The reduced lattice basis.
            op: array
                The unimodular matrix transformation (rcell = op @ cell).
            """

            # skip the reduction entirely when the cell already passes the test
            reduced, op = jax.lax.cond(
                is_minkowski_reduced(cell=cell),
                lambda: (cell, jnp.eye(3, dtype=int)),
                lambda: reduction_full(cell),
            )

            # flip each reduced vector by the sign of the sum of its component
            # signs; the same flip is applied to the transformation matrix
            sgn = jnp.diag(jnp.sign(jnp.sum(jnp.sign(reduced), axis=1)))

            return sgn @ reduced, sgn @ op

        if self.batched:
            cell, op = vmap(minkowski_reduce)(self.cell)
        else:
            cell, op = minkowski_reduce(self.cell)

        return SystemParams(coordinates=self.coordinates, cell=cell), op

    @partial(jit, static_argnames=["min"])
[docs]    def wrap_positions(self, min=False) -> tuple[SystemParams, Array]:
        """wrap pos to lie within unit cell"""

        def f(x, y):
            return SystemParams._wrap_pos(cell=x, coordinates=y, min=min)

        if self.batched:
            f = vmap(f)

        coor, op = f(self.cell, self.coordinates)
        return (
            SystemParams(coordinates=coor, cell=self.cell),
            op,
        )

    @staticmethod
    @partial(jit, static_argnames=["min"])
[docs]    def _wrap_pos(
        cell: Array | None,
        coordinates: Array,
        min=False,
    ) -> tuple[Array, Array]:
        if cell is None:
            return coordinates, jnp.zeros_like(coordinates, dtype=jnp.int64)

        trans = vmap(vmap(jnp.dot, in_axes=(0, None)), in_axes=(None, 0))(
            vmap(lambda x: x / jnp.linalg.norm(x))(cell),
            jnp.eye(3),
        )

        @partial(vmap)
        def proj(x):
            return jnp.linalg.inv(trans) @ x

        @partial(vmap)
        def deproj(x):
            return trans @ x

        scaled = proj(coordinates)

        norms = jnp.linalg.norm(cell, axis=1)

        def _f1():
            x0 = scaled / norms + 0.5
            a = jnp.mod(x0, 1)
            b = (a - 0.5) * norms
            return a - x0, b

        def _f2():
            x0 = scaled / norms
            a = jnp.mod(x0, 1)
            b = a * norms
            return a - x0, b

        op, reduced = jax.lax.cond(min, _f1, _f2)

        return deproj(reduced), op

    @partial(jit, static_argnames=["min"])
[docs]    def canoncialize(self, min=False) -> tuple[SystemParams, Array, Array]:
        if self.batched:
            return vmap(lambda sp: sp.canoncialize(min=min))(self)

        mr, op_cell = self.minkowski_reduce()
        mr, op_coor = mr.wrap_positions(min)

        return mr, op_cell, op_coor

[docs]    def min_distance(self, index_1, index_2):
        assert self.batched is False

        sp, _, _ = self.canoncialize()  # necessary if cell is skewed
        coor1 = sp.coordinates[index_1, :]
        coor2 = sp.coordinates[index_2, :]

        @partial(vmap, in_axes=(None, None, 0))
        @partial(vmap, in_axes=(None, 0, None))
        @partial(vmap, in_axes=(0, None, None))
        def dist(n0, n1, n2):
            return jnp.linalg.norm(
                coor2 - coor1 + n0 * sp.cell[0, :] + n1 * sp.cell[1, :] + n2 * sp.cell[2, :],
            )

        ind = jnp.array([-1, 0, 1])
        return jnp.min(dist(ind, ind, ind))


@jdc.pytree_dataclass
[docs]class NeighbourList:
[docs]    r_cut: jdc.Static[jnp.floating]
[docs]    atom_indices: Array

[docs]    op_cell: Array | None
[docs]    op_coor: Array | None
[docs]    op_center: Array | None

[docs]    r_skin: jdc.Static[jnp.floating]
[docs]    sp_orig: SystemParams | None = None
[docs]    ijk_indices: Array | None = None
[docs]    nxyz: jdc.Static[tuple[int] | None] = None
[docs]    z_array: jdc.Static[tuple[int] | None] = None
[docs]    z_unique: jdc.Static[tuple[int] | None] = None
[docs]    num_z_unique: jdc.Static[tuple[int] | None] = None

    @jax.jit
    def _pos(self, sp_orig):
        """Reconstruct neighbour positions relative to every central atom.

        ``sp_orig`` is first brought to the stored canonical form (``op_cell`` and
        ``op_coor``). For each central atom the coordinates are then shifted by
        that atom's position and by ``op_center @ cell``, and the stored atom and
        image indices select the neighbours.

        Args:
            sp_orig: system parameters to evaluate the neighbour list on. If it is
                batched, the neighbour list must be batched as well.

        Returns:
            Array of neighbour positions relative to each central atom, with a
            leading batch axis when ``sp_orig`` is batched.
        """

        @partial(vmap, in_axes=(0, 0, None, None))
        def _transform(ijk, a, spi, cell):
            # position of neighbour atom `a`, shifted to periodic image `ijk`
            out = spi[a]
            if ijk is not None:
                (i, j, k) = ijk
                out = out + i * cell[0, :] + j * cell[1, :] + k * cell[2, :]
            return out

        @partial(vmap, in_axes=(0, 0, 0, None, 0))
        def _recover(center_coordinates, ijk_indices, atom_indices, sp, co):
            # coordinates relative to one central atom, with the centring shift
            sp_center = sp.coordinates - center_coordinates
            if sp.cell is not None:
                sp_center += co @ sp.cell

            return _transform(
                ijk_indices,
                atom_indices,
                sp_center,
                sp.cell,
            )

        def _sp(sp: SystemParams, op_cell, op_coor):
            # apply the stored cell transformation and coordinate shift
            if sp.cell is not None:
                cell = op_cell @ sp.cell
                coor = sp.coordinates + op_coor @ cell
            else:
                cell = None
                coor = sp.coordinates
            return SystemParams(coor, cell)

        if sp_orig.batched:
            assert self.batched
            # _recover takes five arguments, all carrying the batch axis; the
            # in_axes tuple needs one entry per argument or vmap raises.
            _recover = vmap(_recover, in_axes=(0, 0, 0, 0, 0))
            _sp = vmap(_sp)

        sp = _sp(sp_orig, self.op_cell, self.op_coor)

        return _recover(
            sp.coordinates,
            self.ijk_indices,
            self.atom_indices,
            sp,
            self.op_center,
        )

[docs]    def apply_fun_neighbour(
        self,
        sp: SystemParams,
        func,
        r_cut=None,
        fill_value=0,
        reduce="full",  # or 'z' or 'none'
        split_z=False,  #
        exclude_self=False,
    ):
        if sp.batched:
            return vmap(
                lambda nl, sp: NeighbourList.apply_fun_neighbour(
                    self=nl,
                    sp=sp,
                    func=func,
                    r_cut=r_cut,
                    fill_value=fill_value,
                    reduce=reduce,
                    split_z=split_z,
                    exclude_self=exclude_self,
                ),
            )(self, sp)

        if r_cut is None:
            r_cut is self.r_cut

        pos = self._pos(sp)
        ind = self.atom_indices
        r = jnp.linalg.norm(pos, axis=-1)

        bools = r**2 < self.r_cut**2

        if exclude_self:
            bools = jnp.logical_and(bools, r**2 != 0.0)

        bools = jnp.logical_and(bools, ind != -1)

        if func is None:
            return bools, None

        true_val = vmap(vmap(func))(pos, ind)
        false_val = jax.tree_map(
            lambda a: jnp.zeros_like(a) + fill_value,
            true_val,
        )

        def _get(bools):
            def _red(bools):
                val = vmap(
                    lambda b, x, y: jax.tree_map(
                        lambda t, f: vmap(jnp.where)(b, t, f),
                        x,
                        y,
                    ),
                )(bools, true_val, false_val)

                if reduce == "full":
                    return jax.tree_map(lambda x: jnp.sum(x, axis=(1)), (bools, val))
                elif reduce == "z":
                    return jax.tree_map(lambda x: jnp.sum(x, axis=(0, 1)), (bools, val))
                elif reduce == "none":
                    return bools, val
                else:
                    raise ValueError(
                        f"unknown value {reduce} for reduce argument of neighbourghfunction, try 'none','z' or 'full'",
                    )

            if not reduce == "z":
                return _red(bools=bools)

            @partial(vmap, in_axes=(0, None))
            def _f(u, a):
                b = vmap(
                    lambda t, f: jnp.where(a == u, t, f),
                    in_axes=(1, 1),
                    out_axes=1,
                )(bools, jnp.full_like(bools, False))

                return _red(bools=b)

            return _f(jnp.array(self.z_unique), jnp.array(self.z_array))

        if not split_z:
            return _get(bools)

        assert self.z_array is not None, "provide z_array to neighbourlist"

        @partial(vmap, in_axes=(0, None), out_axes=1)
        def sel(u1, at):
            @vmap
            def _b(at):
                bools_z1 = vmap(lambda x: x == u1)(at)
                return bools_z1

            return _get(jnp.logical_and(_b(at), bools))

        return sel(jnp.array(self.z_unique), jnp.array(self.z_array)[ind])

        # return _apply_fun_neighbour(sp, self)

[docs]    def apply_fun_neighbour_pair(
        self,
        sp: SystemParams,
        func_double,
        func_single=None,
        r_cut=None,
        fill_value=0,
        reduce="full",  # or 'z' or 'none'
        split_z=False,  #
        exclude_self=True,
        unique=True,
    ):
        """Evaluate ``func_double`` on every pair of neighbours of every atom.

        ``func_single`` is first evaluated per neighbour through
        ``apply_fun_neighbour`` (unreduced); its output is passed to
        ``func_double`` as the per-neighbour ``data`` argument.

        Args:
            sp: system parameters; a batched ``sp`` is handled by mapping this
                method over ``(self, sp)``.
            func_double: callable
                ``func_double(r_ij, atom_index_j, data_j, r_ik, atom_index_k, data_k)``.
            func_single: callable ``func_single(r_ij, atom_index_j)`` or ``None``.
            r_cut, fill_value, exclude_self: forwarded to ``apply_fun_neighbour``;
                ``fill_value`` also fills pair entries outside the mask.
            reduce: ``"full"`` sums over both neighbour axes, ``"z"`` additionally
                sums over central atoms per unique atomic number, ``"none"``
                returns unreduced values.
            split_z: when true, results are split by the atomic numbers of both
                neighbours (requires ``z_array``).
            unique: when true, pairs of a neighbour with itself are masked out.

        Example callables::

            func_single=lambda r_ij, atom_index_j: (1,),
            func_double=lambda r_ij, atom_index_j, data_j, r_ik, atom_index_k, data_k: (
                r_ij,
                atom_index_j,
                r_ik,
                atom_index_k,
            ),

        Returns:
            ``(bools, values)`` reduced according to ``reduce``.
        """
        if sp.batched:
            return vmap(
                lambda nl, sp: NeighbourList.apply_fun_neighbour_pair(
                    self=nl,
                    sp=sp,
                    func_single=func_single,
                    func_double=func_double,
                    r_cut=r_cut,
                    fill_value=fill_value,
                    reduce=reduce,
                    split_z=split_z,
                    exclude_self=exclude_self,
                    unique=unique,
                ),
            )(self, sp)

        pos = self._pos(sp)
        ind = self.atom_indices

        # per-neighbour mask and data, kept unreduced so pairs can be formed
        bools, data_single = self.apply_fun_neighbour(
            sp=sp,
            func=func_single,
            r_cut=r_cut,
            reduce="none",
            fill_value=fill_value,
            exclude_self=exclude_self,
        )

        # for every central atom, evaluate func_double on all neighbour pairs
        out_ijk = vmap(
            lambda x, y, z: vmap(
                vmap(func_double, in_axes=(0, 0, 0, None, None, None)),
                in_axes=(None, None, None, 0, 0, 0),
            )(x, y, z, x, y, z),
        )(pos, ind, data_single)

        # a pair is valid only when both of its neighbours are valid
        bools = vmap(
            lambda b: vmap(
                vmap(jnp.logical_and, in_axes=(0, None)),
                in_axes=(None, 0),
            )(b, b),
        )(bools)

        if unique:
            # mask the diagonal, i.e. pairs of a neighbour with itself
            bools = vmap(lambda b: b.at[jnp.diag_indices_from(b)].set(False))(bools)

        # NOTE(review): no explicit -1 index check is done here; the mask coming
        # from apply_fun_neighbour already excludes entries with index -1.

        out_ijk_f = jax.tree_map(
            lambda o: jnp.full_like(o, fill_value),
            out_ijk,
        )

        def get(bools):
            def _red(bools):
                # keep func_double's output where the mask holds, fill elsewhere
                val = jax.tree_map(
                    lambda t, f: vmap(vmap(vmap(jnp.where)))(bools, t, f),
                    out_ijk,
                    out_ijk_f,
                )

                if reduce == "full":
                    return jax.tree_map(lambda x: jnp.sum(x, axis=(1, 2)), (bools, val))
                elif reduce == "z":
                    return jax.tree_map(
                        lambda x: jnp.sum(x, axis=(0, 1, 2)),
                        (bools, val),
                    )
                elif reduce == "none":
                    return bools, val
                else:
                    raise ValueError(
                        f"unknown value {reduce} for reduce argument of neighbourghfunction, try 'none','z' or 'full'",
                    )

            if not reduce == "z":
                return _red(bools=bools)

            @partial(vmap, in_axes=(0, None))
            def _f(u, a):
                # restrict the mask to central atoms with atomic number u
                b = vmap(
                    vmap(
                        lambda t, f: jnp.where(a == u, t, f),
                        in_axes=(1, 1),
                        out_axes=1,
                    ),
                    in_axes=(2, 2),
                    out_axes=2,
                )(bools, jnp.full_like(bools, False))

                return _red(bools=b)

            return _f(jnp.array(self.z_unique), jnp.array(self.z_array))

        if not split_z:
            return get(bools)

        assert self.z_array is not None, "provide z_array to neighbourlist"

        @partial(vmap, in_axes=(None, 0, None), out_axes=2)
        @partial(vmap, in_axes=(0, None, None), out_axes=1)
        def sel(u1, u2, at):
            # mask of pairs whose neighbours have atomic numbers u1 and u2
            @partial(vmap, in_axes=(0))
            def _b(at):
                bools_z1_z2 = vmap(
                    vmap(
                        lambda x, y: jnp.logical_and(x == u1, y == u2),
                        in_axes=(0, None),
                    ),
                    in_axes=(None, 0),
                )(at, at)
                return bools_z1_z2

            return get(jnp.logical_and(_b(at), bools))

        return sel(
            jnp.array(self.z_unique),
            jnp.array(self.z_unique),
            jnp.array(self.z_array)[self.atom_indices],
        )

    @property
    def batched(self):
        """True when ``atom_indices`` has exactly three axes."""
        return self.atom_indices.ndim == 3

    @property
    def shape(self):
        """Shape tuple of the ``atom_indices`` array."""
        indices = self.atom_indices
        return indices.shape

    @property
    def num_neigh(self):
        """Length of the last axis of ``shape`` (the ``atom_indices`` shape)."""
        dims = self.shape
        return dims[-1]

[docs]    def __getitem__(self, slices):
        return NeighbourList(
            r_cut=self.r_cut,
            atom_indices=self.atom_indices[slices, :] if self.atom_indices is not None else None,
            ijk_indices=self.ijk_indices[slices, :] if self.ijk_indices is not None else None,
            op_cell=self.op_cell[slices, :, :] if self.op_cell is not None else None,
            op_coor=self.op_coor[slices, :, :] if self.op_coor is not None else None,
            op_center=self.op_center[slices, :] if self.op_center is not None else None,
            z_array=self.z_array,
            z_unique=self.z_unique,
            num_z_unique=self.num_z_unique,
            r_skin=self.r_skin,
            sp_orig=self.sp_orig[slices],
            nxyz=self.nxyz,
        )

    @jax.jit
    def update(self, sp: SystemParams) -> tuple[bool, NeighbourList]:
        """Rebuild the neighbour list when atoms moved further than ``r_skin``.

        The largest norm (over the last axis) of the difference between
        ``self._pos(self.sp_orig)`` and ``self._pos(sp)`` is compared with
        ``self.r_skin``. If it is larger, ``sp._get_neighbour_list`` is called
        with the settings stored on this list; otherwise ``(True, self)`` is
        returned. Both outcomes go through ``jax.lax.cond``.
        """

        def _rebuild(new_sp: SystemParams):
            return new_sp._get_neighbour_list(
                r_cut=self.r_cut,
                r_skin=self.r_skin,
                z_array=self.z_array,
                z_unique=self.z_unique,
                num_z_unique=self.num_z_unique,
                num_neighs=self.num_neigh,
                nxyz=self.nxyz,
            )

        def _keep(_):
            return True, self

        displacement = jnp.linalg.norm(self._pos(self.sp_orig) - self._pos(sp), axis=-1)
        moved_too_far = jnp.max(displacement) > self.r_skin

        return jax.lax.cond(moved_too_far, _rebuild, _keep, sp)

[docs]    def nl_split_z(self, p):
        if self.batched:
            return vmap(NeighbourList.nl_split_z)(self, p)

        bool_masks = [jnp.array(self.z_array) == zu for zu in self.z_unique]

        arg_split = [jnp.argsort(~bm, kind="stable")[0:nzu] for bm, nzu in zip(bool_masks, self.num_z_unique)]
        p = [jax.tree_map(lambda pi: pi[a], tree=p) for a in arg_split]

        return jnp.array(bool_masks), arg_split, p

    @staticmethod
    def match_kernel(
        p1: Array,
        p2: Array,
        nl1: NeighbourList,
        nl2: NeighbourList,
        matching="REMatch",
        alpha=1e-2,
        mode="divergence",
        jit=True,
    ):
        """Compare two descriptor sets through per-species matching matrices.

        Each descriptor array is normalised row by row (rows are the entries of
        the leading axis), the species masks are obtained from ``nl_split_z``
        and three matching matrices ``P11``, ``P12`` and ``P22`` are built. The
        result is ``0.5 * <p1, P11 p1> + 0.5 * <p2, P22 p2> - <p1, P12 p2>``.

        Args:
            p1: descriptors belonging to ``nl1``; presumably one row per atom
                (TODO confirm against callers).
            p2: descriptors belonging to ``nl2``.
            nl1: neighbour list of the first system. If batched, the function
                is mapped over ``(p1, nl1)``.
            nl2: neighbour list of the second system. If batched (and ``nl1``
                is not), the function is mapped over ``(p2, nl2)``.
            matching: ``"average"`` uses the outer products of the species
                masks as matching matrices; ``"norm"`` is not implemented; any
                other value (including the default) solves a masked Sinkhorn
                problem per species.
            alpha: ``epsilon`` handed to the ``PointCloud`` geometry.
            mode: only ``"divergence"`` is supported.
            jit: not used by the computation; kept for interface compatibility.

        Returns:
            ``(res, (P11, P12, P22))`` with ``res`` the scalar divergence.

        Raises:
            NotImplementedError: if ``matching == "norm"``.
            ValueError: if ``mode`` is not ``"divergence"``.
        """

        if nl1.batched:
            return vmap(
                lambda p1, nl1: NeighbourList.match_kernel(
                    p1=p1,
                    nl1=nl1,
                    p2=p2,
                    nl2=nl2,
                    matching=matching,
                    alpha=alpha,
                    # forward every option so the per-sample call matches the outer one
                    mode=mode,
                    jit=jit,
                ),
            )(p1, nl1)

        if nl2.batched:
            return vmap(
                lambda p2, nl2: NeighbourList.match_kernel(
                    p1=p1,
                    nl1=nl1,
                    p2=p2,
                    nl2=nl2,
                    matching=matching,
                    alpha=alpha,
                    mode=mode,
                    jit=jit,
                ),
            )(p2, nl2)

        @vmap
        def _normalise(p):
            sq = jnp.einsum("...,...->", p, p)
            # avoid dividing by (almost) zero; exact zeros are mapped to zero below
            sq_safe = jnp.where(sq <= 1e-16, 1, sq)
            is_zero = sq == 0
            inv_norm = jnp.where(is_zero, 0.0, 1 / jnp.sqrt(sq_safe))
            return p * inv_norm, sq, ~is_zero

        p1, n1_sq, _ = _normalise(p1)
        p2, n2_sq, _ = _normalise(p2)

        # only the species masks are needed here
        b1, _, _ = nl1.nl_split_z((p1, n1_sq))
        b2, _, _ = nl2.nl_split_z((p2, n2_sq))

        b1 = jnp.array(b1)
        b2 = jnp.array(b2)

        if matching == "average":
            P12 = jnp.einsum("ni,nj->ij", b1, b2)
            P11 = jnp.einsum("ni,nj->ij", b1, b1)
            P22 = jnp.einsum("ni,nj->ij", b2, b2)

        elif matching == "norm":
            # NotImplementedError derives from RuntimeError, which is what the
            # former bare ``raise`` produced.
            raise NotImplementedError("matching='norm' is not implemented")

        else:

            @jax.jit
            def _sinkhorn_plan(q1, q2, m1, m2):
                geom = PointCloud(
                    # flatten everything but the leading axis of each input
                    x=jnp.reshape(q1, (q1.shape[0], -1)),
                    y=jnp.reshape(q2, (q2.shape[0], -1)),
                    # scale_cost=True leads to problems if x==y
                    epsilon=alpha,
                )
                geom = geom.mask(m1, m2)

                prob = linear_problem.LinearProblem(geom)
                out = sinkhorn.Sinkhorn()(prob)

                return out.matrix

            def _species_plan(q1, q2, m1, m2):
                # one plan per species mask, restricted to that species and summed
                plans = vmap(_sinkhorn_plan, in_axes=(None, None, 0, 0))(q1, q2, m1, m2)
                return jnp.einsum("nij,ni,nj->ij", plans, m1, m2)

            P12 = _species_plan(p1, p2, b1, b2)
            P11 = _species_plan(p1, p1, b1, b1)
            P22 = _species_plan(p2, p2, b2, b2)

        if mode == "divergence":
            res = (
                0.5 * jnp.einsum("ij,i...,j...->", P11, p1, p1)
                + 0.5 * jnp.einsum("ij,i...,j...->", P22, p2, p2)
                - jnp.einsum("ij,i...,j...->", P12, p1, p2)
            )
        else:
            raise ValueError(f"unknown value {mode} for mode argument")

        return res, (P11, P12, P22)

[docs]    def __add__(self, other):
        assert isinstance(other, NeighbourList)

        if self.batched and not other.batched:
            return vmap(lambda self: self + other)(self)

        if other.batched and not self.batched:
            return vmap(lambda other: self + other)(other)

        assert self.r_cut == other.r_cut
        assert self.r_skin == other.r_skin
        if self.z_array is None:  # pragma: no cover
            assert other.z_array is None
        else:
            assert jnp.all(self.z_array == other.z_array)

        if self.z_unique is None:
            assert other.z_unique is None
        else:
            assert jnp.all(self.z_unique == other.z_unique)

        if self.atom_indices is not None:
            assert other.atom_indices is not None

        if self.nxyz is None:
            assert other.nxyz is None
        else:
            assert self.nxyz == other.nxyz

        if self.sp_orig is None:
            assert other.sp_orig is None

        if self.ijk_indices is None:
            assert other.ijk_indices is None

        if self.op_cell is None:
            assert other.op_cell is None

        if self.op_coor is None:
            assert other.op_coor is None

        if self.op_center is None:
            assert other.op_center is None

        if self.num_z_unique is None:
            assert other.num_z_unique is None
        else:
            assert jnp.all(self.num_z_unique == other.num_z_unique)

        if self.atom_indices is not None:
            m = jnp.max(
                jnp.array([self.atom_indices.shape[-1], other.atom_indices.shape[-1]]),
            )

            def _p(a, n):
                return jnp.pad(
                    array=a,
                    pad_width=((0, 0), (0, n)),
                    constant_values=-1,
                )

            if self.batched:
                _p = vmap(_p, in_axes=(0, None))

            if self.atom_indices.shape[-1] != m:
                sa = _p(self.atom_indices, m - self.atom_indices.shape[-1])
            else:
                sa = self.atom_indices

            if other.atom_indices.shape[-1] != m:
                sb = _p(other.atom_indices, m - other.atom_indices.shape[-1])
            else:
                sb = other.atom_indices

        return NeighbourList(
            r_cut=self.r_cut,
            r_skin=self.r_skin,
            atom_indices=jnp.vstack([sa, sb]) if self.atom_indices is not None else None,
            z_array=self.z_array,
            z_unique=self.z_unique,
            nxyz=self.nxyz,
            sp_orig=self.sp_orig + other.sp_orig if self.sp_orig is not None else None,
            ijk_indices=jnp.vstack([self.ijk_indices, other.ijk_indices]) if self.ijk_indices is not None else None,
            op_cell=jnp.vstack([self.op_cell, other.op_cell]) if self.op_cell is not None else None,
            op_coor=jnp.vstack([self.op_coor, other.op_coor]) if self.op_coor is not None else None,
            op_center=jnp.vstack([self.op_center, other.op_center]) if self.op_center is not None else None,
            num_z_unique=self.num_z_unique,
        )

    @staticmethod
    def stack(*nls: NeighbourList) -> NeighbourList:
        """Add all given neighbour lists together, left to right, using ``+``."""
        combined = nls[0]
        for nl in nls[1:]:
            combined = combined + nl
        return combined


@jdc.pytree_dataclass
class CV:
    """Collective-variable values with bookkeeping for batching, stacking and combining.

    ``stack``/``unstack`` work along the batch (first) axis, ``combine``/``split``
    along the last axis. The sizes needed to undo either operation are kept in
    ``_stack_dims`` and ``_combine_dims``.
    """

    # the CV values
    cv: Array
    # flag set by ``CvMetric`` for values expressed in its unit-square coordinates
    mapped: jdc.Static[bool] = False
    # when True, a batched CV has three axes instead of two (see ``batched``)
    atomic: jdc.Static[bool] = False
    # (possibly nested) sizes of the pieces merged by ``combine``
    _combine_dims: jdc.Static[list | None] = None
    # batch sizes of the pieces merged by ``stack``
    _stack_dims: jdc.Static[list | None] = None

    @property
    def batched(self):
        """True if ``cv`` carries a batch axis (3 axes when atomic, else 2)."""
        if self.atomic:
            return len(self.cv.shape) == 3

        return len(self.cv.shape) == 2

    @property
    def batch_dim(self):
        """Size of the batch axis, or 1 when not batched."""
        if self.batched:
            return self.shape[0]
        return 1

    @property
    def dim(self):
        """Size of the last axis of ``cv`` (1 for a scalar)."""
        if self.cv.shape == ():
            return 1
        return self.cv.shape[-1]

    @property
    def size(self):
        """Total number of elements in ``cv``."""
        return self.cv.size

    @property
    def shape(self):
        """Shape of ``cv``."""
        return self.cv.shape

    @property
    def combine_dims(self):
        """``_combine_dims`` if set, otherwise ``dim``."""
        if self._combine_dims is None:
            return self.dim
        return self._combine_dims

    @property
    def stack_dims(self):
        """``_stack_dims`` if set, otherwise ``[batch_dim]``."""
        if self._stack_dims is None:
            return [self.batch_dim]
        return self._stack_dims

    def _like(self, cv: Array) -> CV:
        """Build the result of an arithmetic operation on this CV.

        ``atomic`` and the stack/combine bookkeeping are copied; ``mapped`` is
        left at its default (``False``), as the arithmetic operators always did.
        """
        return CV(
            cv=cv,
            atomic=self.atomic,
            _stack_dims=self._stack_dims,
            _combine_dims=self._combine_dims,
        )

    def __add__(self, other) -> CV:
        """Return a CV holding ``self.cv + other``; ``other`` must be an ``Array``."""
        assert isinstance(other, Array)
        return self._like(self.cv + other)

    def __radd__(self, other) -> CV:
        """Reflected addition: ``other + self.cv``."""
        # ``other + self`` would dispatch straight back to this method.
        assert isinstance(other, Array)
        return self._like(other + self.cv)

    def __sub__(self, other) -> CV:
        """Return a CV holding ``self.cv - other``; ``other`` must be an ``Array``."""
        assert isinstance(other, Array)
        return self._like(self.cv - other)

    def __rsub__(self, other) -> CV:
        """Reflected subtraction: ``other - self.cv``."""
        assert isinstance(other, Array)
        return self._like(other - self.cv)

    def __mul__(self, other) -> CV:
        """Return a CV holding ``self.cv * other``; ``other`` must be an ``Array``."""
        assert isinstance(other, Array)
        return self._like(self.cv * other)

    def __rmul__(self, other) -> CV:
        """Reflected multiplication: ``other * self.cv``."""
        assert isinstance(other, Array)
        return self._like(other * self.cv)

    def __matmul__(self, other) -> CV:
        """Return a CV holding ``self.cv @ other``; ``other`` must be an ``Array``."""
        assert isinstance(other, Array)
        return self._like(self.cv @ other)

    def __rmatmul__(self, other) -> CV:
        """Reflected matrix product: ``other @ self.cv``."""
        assert isinstance(other, Array)
        return self._like(other @ self.cv)

    def __truediv__(self, other) -> CV:
        """Return a CV holding ``self.cv / other``; ``other`` must be an ``Array``."""
        assert isinstance(other, Array)
        return self._like(self.cv / other)

    def __rtruediv__(self, other) -> CV:
        """Reflected division: ``other / self.cv``."""
        assert isinstance(other, Array)
        return self._like(other / self.cv)

    # Python 3 only looks up ``__truediv__``/``__rtruediv__`` for ``/``; the
    # Python 2 names are kept as aliases for callers that use them directly.
    __div__ = __truediv__
    __rdiv__ = __rtruediv__

    def batch(self) -> CV:
        """Return ``self`` if batched, otherwise a copy with a leading axis of size 1."""
        if self.batched:
            return self
        return CV(
            cv=jnp.array([self.cv]),
            mapped=self.mapped,
            atomic=self.atomic,
            _stack_dims=self._stack_dims,
            _combine_dims=self._combine_dims,
        )

    def __iter__(self):
        """Yield the batch entries one by one (or ``self`` when not batched)."""
        if not self.batched:
            yield self
            return

        for i in range(self.cv.shape[0]):
            yield self[i]
        return

    def __getitem__(self, idx):
        """Index the batch axis of a batched CV; the metadata is copied unchanged."""
        assert self.batched
        return CV(
            cv=self.cv[idx, :],
            mapped=self.mapped,
            atomic=self.atomic,
            _stack_dims=self._stack_dims,
            _combine_dims=self._combine_dims,
        )

    def unbatch(self) -> CV:
        """Drop a batch axis of size 1; a non-batched CV is returned as is."""
        if not self.batched:
            return self
        assert self.cv.shape[0] == 1
        return CV(
            cv=self.cv[0, :],
            mapped=self.mapped,
            atomic=self.atomic,
            _stack_dims=self._stack_dims,
            _combine_dims=self._combine_dims,
        )

    @staticmethod
    def stack(*cvs: CV) -> CV:
        """Stack CVs along the batch axis.

        All CVs must agree on ``atomic``, ``mapped`` and ``_combine_dims``. The
        batch sizes are recorded in ``_stack_dims`` so that ``unstack`` can
        recover the individual CVs.
        """

        assert len(cvs) != 0
        atomic = cvs[0].atomic

        in_dims = None
        mapped = None

        cv_arr = []
        stack_dims = []

        for cv in cvs:
            assert isinstance(cv, CV)
            assert atomic == cv.atomic

            if mapped is None:
                in_dims = cv._combine_dims
                mapped = cv.mapped
            else:
                assert cv._combine_dims == in_dims
                assert cv.mapped == mapped

            cv_arr.append(cv.batch().cv)
            stack_dims += cv.stack_dims

        assert mapped is not None

        return CV(
            cv=jnp.vstack(cv_arr),
            # the flag is checked for consistency above, so it must be passed on
            mapped=mapped,
            _combine_dims=in_dims,
            _stack_dims=stack_dims,
            atomic=atomic,
        )

    def unstack(self) -> list[CV]:
        """Inverse of ``stack``: cut the batch axis into pieces of ``stack_dims`` sizes."""
        i = 0

        out: list[CV] = []
        for j in self.stack_dims:
            out.append(
                CV(
                    cv=self.cv[i : i + j, :],
                    mapped=self.mapped,
                    _combine_dims=self._combine_dims,
                    atomic=self.atomic,
                ),
            )
            i += j
        return out

    def split(self, flatten=False) -> list[CV]:
        """Inverse of ``combine``: cut the last axis into the recorded pieces.

        Args:
            flatten: if True, nested ``_combine_dims`` are flattened and one CV
                is returned per innermost size; otherwise one CV per top-level
                entry, each keeping its own nested sizes.

        Returns:
            list of CVs; a CV without ``_combine_dims`` yields a single-element list.
        """

        if self._combine_dims is None:
            return [CV(cv=self.cv, mapped=self.mapped, atomic=self.atomic)]

        def broaden_tree(subtree):
            # flatten a nested list of ints into a flat list of ints
            if isinstance(subtree, int):
                return [subtree]
            num = []
            for leaf in subtree:
                num += broaden_tree(leaf)

            return num

        if not flatten:
            sz = [sum(broaden_tree(a)) for a in self._combine_dims]
            out_dim = self._combine_dims
        else:
            sz = broaden_tree(self._combine_dims)
            out_dim = sz

        end = jnp.cumsum(jnp.array(sz))
        start = jnp.hstack([0, end[:-1]])

        return [
            CV(
                cv=jax.lax.dynamic_slice_in_dim(
                    self.cv,
                    start_index=s,
                    slice_size=width,
                    axis=-1,
                ),
                # keep the flag: ``combine`` asserts that all pieces agree on it
                mapped=self.mapped,
                _combine_dims=out_dim[i] if isinstance(out_dim[i], list) else None,
                _stack_dims=self._stack_dims,
                atomic=self.atomic,
            )
            for i, (s, width) in enumerate(zip(start, sz))
        ]

    @staticmethod
    def combine(*cvs: CV, flatten=False) -> CV:
        """Merge CVs along the last axis.

        All CVs must agree on ``mapped``, ``batched`` (and batch size),
        ``atomic`` and ``stack_dims``. The sizes of the pieces are recorded in
        ``_combine_dims`` so that ``split`` can undo the operation. A single CV
        is returned unchanged.

        Args:
            flatten: if True, CVs that are themselves the result of ``combine``
                are split again and their pieces are merged individually.
        """

        # check before touching ``cvs[0]`` so that empty input fails the assert
        assert len(cvs) != 0
        if len(cvs) == 1:
            return cvs[0]

        first = cvs[0]
        mapped = first.mapped
        batched = first.batched
        atomic = first.atomic
        bdim = first.batch_dim
        stack_dims = first.stack_dims

        def _inner(cv: CV, batched, mapped, atomic, bdim, stack_dims) -> tuple[list[Array], list[int]]:
            assert mapped == cv.mapped
            assert batched == cv.batched
            if batched:
                assert bdim == cv.batch_dim
            assert atomic == cv.atomic
            assert stack_dims == cv.stack_dims

            def simple(cv: CV):
                return [cv.cv], [cv.combine_dims]

            if cv._combine_dims is None or not flatten:
                return simple(cv)

            cvi: list[Array] = []
            dimi: list[int] = []

            for piece in cv.split():
                if piece._combine_dims is None:
                    a, b = simple(piece)
                else:
                    # the recursive call needs the full set of reference values
                    a, b = _inner(piece, batched, mapped, atomic, bdim, stack_dims)

                cvi += a
                dimi += b

            return cvi, dimi

        out_cv: list[Array] = []
        out_dim: list[int] = []

        for cv in cvs:
            a, b = _inner(cv, batched, mapped, atomic, bdim, stack_dims)
            out_cv += a
            out_dim += b

        return CV(cv=jnp.hstack(out_cv), mapped=mapped, _combine_dims=out_dim, _stack_dims=stack_dims, atomic=atomic)


class CvMetric:
    """Keeps track of the topology of a CV.

    Stores, per CV dimension, whether it is periodic and its bounding box, and
    maps CV values to and from the unit square spanned by the bounding box.
    """

    def __init__(
        self,
        periodicities,
        bounding_box=None,
    ) -> None:
        """
        Args:
            periodicities: one boolean per CV dimension (list or 1-D array).
            bounding_box: ``(lower, upper)`` per dimension, as a list or array.
                A 1-D input is reshaped to ``(1, 2)``. Defaults to ``[0, 1]``
                for every dimension.
        """
        if bounding_box is None:
            bounding_box = jnp.zeros((len(periodicities), 2))
            bounding_box = bounding_box.at[:, 1].set(1.0)

        if isinstance(bounding_box, list):
            bounding_box = jnp.array(bounding_box)

        if bounding_box.ndim == 1:
            bounding_box = jnp.reshape(bounding_box, (1, 2))

        if isinstance(periodicities, list):
            periodicities = jnp.array(periodicities)
        assert periodicities.ndim == 1

        self.bounding_box = bounding_box
        self.periodicities = periodicities

    @partial(jit, static_argnums=(0))
    def norm(self, x1: CV, x2: CV, k=1.0):
        """Norm of ``difference(x1, x2)`` scaled by ``k``."""
        diff = self.difference(x1=x1, x2=x2) * k
        return jnp.linalg.norm(diff)

    @partial(jit, static_argnums=(0, 2))
    def periodic_wrap(self, x: CV, min=False) -> CV:
        """Wrap the periodic dimensions of ``x``.

        The result is returned in the same representation as the input: mapped
        if ``x.mapped`` is set, unmapped otherwise.
        """
        # an already mapped CV must not be mapped a second time
        unit = x.cv if x.mapped else self.map(x.cv)
        wrapped = self.__periodic_wrap(unit, min=min)

        if x.mapped:
            return CV(cv=wrapped, mapped=True)
        return CV(cv=self.unmap(wrapped))

    @partial(jit, static_argnums=(0))
    def difference(self, x1: CV, x2: CV) -> Array:
        """Return ``x2 - x1``, wrapped by ``min_cv``; both CVs must be unmapped."""
        assert not x1.mapped
        assert not x2.mapped

        return self.min_cv(
            x2.cv - x1.cv,
        )

    def min_cv(self, cv: Array):
        """Wrap a difference vector so that periodic entries lie within half a period."""
        mapped = self.map(cv, displace=False)
        wrapped = self.__periodic_wrap(mapped, min=True)

        return self.unmap(
            wrapped,
            displace=False,
        )

    @partial(jit, static_argnums=(0, 2))
    def __periodic_wrap(self, xs: Array, min=False):
        """Wrap unit-square coordinates along the periodic dimensions.

        With ``min=False`` periodic entries are brought into ``[0, 1)``; with
        ``min=True`` values above 0.5 are additionally shifted down by one,
        which is what is needed for differences. Non-periodic entries are
        returned unchanged.
        """

        coor = jnp.mod(xs, 1)  # between 0 and 1
        if min:
            coor = jnp.where(coor > 0.5, coor - 1, coor)  # between [-0.5,0.5]

        return jnp.where(self.periodicities, coor, xs)

    @partial(jit, static_argnums=(0, 2))
    def map(self, x: Array, displace=True) -> Array:
        """Transform CV values to unit-square coordinates.

        Args:
            x: values in the original CV space.
            displace: subtract the lower bound first; use False for differences.
        """

        if displace:
            x = x - self.bounding_box[:, 0]

        return x / (self.bounding_box[:, 1] - self.bounding_box[:, 0])

    @partial(jit, static_argnums=(0, 2))
    def unmap(self, x: Array, displace=True) -> Array:
        """Transform unit-square coordinates back to CV values (inverse of ``map``).

        Args:
            x: values in unit-square coordinates.
            displace: add the lower bound after scaling; use False for differences.
        """

        y = x * (self.bounding_box[:, 1] - self.bounding_box[:, 0])

        if displace:
            # the shift belongs on the scaled result, not on the input
            y = y + self.bounding_box[:, 0]

        return y

    def __add__(self, other):
        """Concatenate the dimensions of two metrics; ``None`` leaves ``self`` unchanged."""
        assert isinstance(self, CvMetric)
        if other is None:
            return self

        assert isinstance(other, CvMetric)

        periodicities = jnp.hstack((self.periodicities, other.periodicities))
        bounding_box = jnp.vstack((self.bounding_box, other.bounding_box))

        return CvMetric(
            periodicities=periodicities,
            bounding_box=bounding_box,
        )

    def grid(self, n, endpoints=None, margin=None):
        """Form a regular grid along every dimension of the bounding box.

        Args:
            n: number of points in each dimension.
            endpoints: whether the upper bound is included. ``None`` (default)
                includes it for non-periodic dimensions only; a single bool is
                applied to all dimensions; otherwise one value per dimension.
            margin: if given, the box is widened on both sides by this fraction
                of its width before the grid is built.

        Returns:
            list with one 1-D array of ``n`` grid points per dimension.
        """

        if endpoints is None:
            endpoints = np.array(~self.periodicities)
        elif isinstance(endpoints, bool):
            endpoints = np.full(self.periodicities.shape, endpoints)

        b = self.bounding_box

        if margin is not None:
            diff = (b[:, 1] - b[:, 0]) * margin
            b = b.at[:, 0].set(b[:, 0] - diff)
            b = b.at[:, 1].set(b[:, 1] + diff)

        assert not (jnp.abs(b[:, 1] - b[:, 0]) < 1e-12).any(), "give proper boundaries"
        grid = [jnp.linspace(row[0], row[1], n, endpoint=endpoints[i]) for i, row in enumerate(b)]

        return grid

    @property
    def ndim(self):
        """Number of CV dimensions described by this metric."""
        return len(self.periodicities)


######################################
#       CV transformations           #
######################################


@dataclasses.dataclass(kw_only=True)
[docs]class CvFunInput:
[docs]    input: int
[docs]    conditioners: list[int] | None = None

[docs]    def split(self, x: CV):
        cvs = x.split()
        if self.conditioners is not None:
            cond = [cvs[i] for i in self.conditioners]
        else:
            cond = []

        return cvs[self.input], cond

[docs]    def combine(self, x: CV, res: CV):
        cvs = [*x.split()]
        cvs[self.input] = res
        return CV.combine(*cvs)


@dataclasses.dataclass(kw_only=True)
[docs]class CvFunBase:
[docs]    _: dataclasses.KW_ONLY
[docs]    cv_input: CvFunInput | None = None

[docs]    def calc(self, x: CV, nl: NeighbourList | None, reverse=False, log_det=False) -> tuple[CV, Array | None]:
        if self.cv_input is not None:
            y, cond = self.cv_input.split(x)
        else:
            y, cond = x, None

        if log_det:
            out, log_det = self._log_Jf(y, nl, reverse=reverse, conditioners=cond)
        else:
            out, log_det = self._calc(y, nl, reverse=reverse, conditioners=cond), None

        if self.cv_input:
            out = self.cv_input.combine(x, out)

        return out, log_det

    @abstractmethod
[docs]    def _calc(
        self,
        x: CV,
        nl: NeighbourList | None,
        reverse=False,
        conditioners: list[CV] | None = None,
    ) -> CV:
        pass

[docs]    def _log_Jf(
        self,
        x: CV,
        nl: NeighbourList | None,
        reverse=False,
        conditioners: list[CV] | None = None,
    ) -> tuple[CV, Array | None]:
        """naive automated implementation, overrride this"""

        def f(x):
            return self._calc(x, nl, reverse, conditioners)

        a = f(x)
        b = jacfwd(f)(x)
        log_det = jnp.log(jnp.abs(jnp.linalg.det(b.cv.cv)))

        return a, log_det


@dataclasses.dataclass(kw_only=True)
class CvFun(CvFunBase):
    """Transformation step defined by plain ``forward``/``backward`` callables.

    Each callable receives ``(x, nl, c)`` where ``c`` is the combination of all
    conditioners, or ``None`` when there are none.
    """

    forward: Callable[[CV, NeighbourList | None, CV | None], CV] | None = None
    backward: Callable[[CV, NeighbourList | None, CV | None], CV] | None = None

    def _calc(self, x: CV, nl: NeighbourList | None, reverse=False, conditioners: list[CV] | None = None) -> CV:
        """Call ``backward`` (if ``reverse``) or ``forward`` on ``x``.

        Raises:
            AssertionError: if the requested callable was not provided.
        """
        # ``CvFunInput.split`` hands over an empty list when no conditioners are
        # configured; ``CV.combine`` cannot be called without arguments, so an
        # empty list is treated like ``None``.
        c = CV.combine(*conditioners) if conditioners else None

        if reverse:
            assert self.backward is not None
            return self.backward(x, nl, c)

        assert self.forward is not None
        return self.forward(x, nl, c)


class CvFunNn(nn.Module, CvFunBase):
    """Base class for CV transformation steps implemented as flax linen modules."""

    @abstractmethod
    def setup(self):
        """Module setup; to be provided by subclasses."""
        pass

    def _calc(
        self,
        x: CV,
        nl: NeighbourList | None,
        reverse=False,
        conditioners: list[CV] | None = None,
    ) -> CV:
        """Dispatch to ``backward`` when ``reverse`` is true, else to ``forward``."""
        direction = self.backward if reverse else self.forward
        return direction(x, nl, conditioners)

    @abstractmethod
    def forward(self, x: CV, nl: NeighbourList | None, conditioners: list[CV] | None = None) -> CV:
        """Forward transformation; to be provided by subclasses."""
        pass

    @abstractmethod
    def backward(self, x: CV, nl: NeighbourList | None, conditioners: list[CV] | None = None) -> CV:
        """Backward transformation; to be provided by subclasses."""
        pass


class CvFunDistrax(nn.Module, CvFunBase):
    """
    Bijective CV function backed by a distrax bijector. The ``setup`` method of a
    subclass has to assign ``self.bijector``, for example:

    class RealNVP(CvFunDistrax):
        _: dataclasses.KW_ONLY
        latent_dim: int

        def setup(self):
            self.s = Dense(features=self.latent_dim)
            self.t = Dense(features=self.latent_dim)

            # Alternating binary mask.
            self.bijector = distrax.as_bijector(
                tfp.bijectors.RealNVP(
                    fraction_masked=0.5,
                    shift_and_log_scale_fn=self.shift_and_scale,
                )
            )

        def shift_and_scale(self, x0, input_depth, **condition_kwargs):
            return self.s(x0), self.t(x0)
    """

    bijector: distrax.Bijector = dataclasses.field(init=False)

    @abstractmethod
    def setup(self):
        """Assign ``self.bijector``."""

    @staticmethod
    def _bijector_input(x: CV, conditioners: list[CV] | None) -> Array:
        """Array fed to the bijector: the conditioners (if given) combined with ``x``."""
        if conditioners is None:
            return x.cv
        return CV.combine(*conditioners, x).cv

    def _calc(
        self,
        x: CV,
        nl: NeighbourList | None,
        reverse=False,
        log_det=False,
        conditioners: list[CV] | None = None,
    ) -> CV:
        """Apply the bijector (its inverse when ``reverse``) to ``x``.

        ``log_det`` is accepted but not used here; neighbour lists are not supported.
        """
        z = self._bijector_input(x, conditioners)

        assert nl is None, "not implemented"
        assert self.bijector is not None

        apply = self.bijector.inverse if reverse else self.bijector.forward
        return CV(apply(z), atomic=x.atomic)

    def _log_Jf(
        self,
        x: CV,
        nl: NeighbourList | None,
        reverse=False,
        conditioners: list[CV] | None = None,
    ) -> tuple[CV, Array | None]:
        """Apply the bijector and return the result together with its log-determinant.

        Uses ``inverse_and_log_det`` when ``reverse`` is true and
        ``forward_and_log_det`` otherwise; neighbour lists are not supported.
        """
        assert nl is None, "not implemented"
        assert self.bijector is not None

        z = self._bijector_input(x, conditioners)

        if reverse:
            apply = self.bijector.inverse_and_log_det
        else:
            apply = self.bijector.forward_and_log_det

        z, jac = apply(z)
        return CV(cv=z, atomic=x.atomic), jac


@dataclasses.dataclass(kw_only=True)
class CombinedCvFun(CvFunBase):
    """Applies one chain of transformations to each piece of a combined CV."""

    # one list of transformation steps per piece of ``x.split()``
    classes: list[list[CvFunBase]]

    def calc(self, x: CV, nl: NeighbourList | None, reverse=False, log_det=False) -> tuple[CV, Array | None]:
        """Transform every piece of ``x`` with its own chain and re-combine them.

        Args:
            x: CV created with ``CV.combine``.
            nl: neighbour list handed to every step.
            reverse: apply each chain in reversed order, with ``reverse=True``.
            log_det: also accumulate the log-determinants of all steps.

        Returns:
            ``(combined CV, summed log-determinant)``; the second entry is
            ``None`` when ``log_det`` is false.
        """
        assert x._combine_dims is not None, "combine dims not set. Use CV.combine(*cvs)"

        out_x = []
        # Keep the accumulator separate from the ``log_det`` flag: a zero-valued
        # array is falsy and would otherwise switch the flag off.
        total_log_det = jnp.array(0.0) if log_det else None

        for cl, xi in zip(self.classes, x.split()):
            ordered = reversed(cl) if reverse else cl

            for tr in ordered:
                xi, log_det_i = tr.calc(x=xi, nl=nl, reverse=reverse, log_det=log_det)
                if log_det:
                    assert log_det_i is not None
                    total_log_det = total_log_det + log_det_i

            out_x.append(xi)

        return CV.combine(*out_x), total_log_det

    def _log_Jf(
        self,
        x: CV,
        nl: NeighbourList | None,
        reverse=False,
        conditioners: list[CV] | None = None,
    ) -> tuple[CV, Array | None]:
        """Not available for combined functions; always raises ``NotImplementedError``."""

        raise NotImplementedError("untested")


@dataclasses.dataclass(kw_only=True)
[docs]class CvTrans:
    """f can either be a single CV tranformation or a list of transformations"""

[docs]    trans: list[CvFunBase]

    @staticmethod
[docs]    def from_array_function(f: Callable[[Array, NeighbourList | None, None], Array]):
        def f2(x: CV, nl: NeighbourList | None, conditioners: list[CV] | None = None):
            assert conditioners is None, "implement this"

            if x.batched:
                out = vmap(f)(x.cv, nl, None)
            else:
                out = f(x.cv, nl, None)

            return CV(cv=out, atomic=x.atomic)

        return CvTrans.from_cv_function(f=f2)

    @staticmethod
[docs]    def from_cv_function(f: Callable[[CV, NeighbourList | None, CV | None], CV]) -> CvTrans:
        return CvTrans.from_cv_fun(proto=CvFun(forward=f))

    @staticmethod
[docs]    def from_cv_fun(proto: CvFunBase):
        return CvTrans(trans=[proto])

[docs]    def compute_cv_trans(
        self,
        x: CV,
        nl: NeighbourList | None = None,
        reverse=False,
        log_Jf=False,
    ) -> tuple[CV, Array | None]:
        """
        result is always batched
        arg: CV
        """
        if x.batched:
            return vmap(lambda x, nl: self.compute_cv_trans(x, nl, reverse, log_Jf))(x, nl)

        ordered = reversed(self.trans) if reverse else self.trans

        if log_Jf:
            log_det = jnp.array(0.0)
        else:
            log_det = None

        for tr in ordered:
            x, log_det_i = tr.calc(x=x, nl=nl, reverse=reverse, log_det=log_Jf)
            if log_Jf:
                assert log_det_i is not None
                log_det += log_det_i
        return x, log_det

[docs]    def __mul__(self, other):
        assert isinstance(other, CvTrans), "can only multiply by CvTrans object"
        return CvTrans(trans=[*self.trans, *other.trans])

[docs]    def __add__(self, other: CvTrans) -> CvTrans:
        assert isinstance(other, CvTrans), "can only add CvTrans object"

        @CvTrans.from_cv_function
        def double(x: CV, nl: NeighbourList | None, _):
            return CV.combine(x, x)

        return double * CvTrans(trans=[CombinedCvFun(classes=[self.trans, other.trans])])

    @staticmethod
[docs]    def stack(*cv_trans: CvTrans):
        n = len(cv_trans)

        @CvTrans.from_cv_function
        def duplicate(x: CV, nl: NeighbourList | None, _):
            return CV.combine(*[x] * n)

        return duplicate * CvTrans(trans=[CombinedCvFun(classes=[cvt.trans for cvt in cv_trans])])


class CvTransNN(nn.Module, CvTrans):
    """Flax module variant of :class:`CvTrans`; the steps live in ``trans``."""

    trans: list[CvFunBase]

    def setup(self) -> None:
        """Nothing is set up here."""
        pass

    @nn.compact
    def compute_cv_trans(
        self,
        x: CV,
        nl: NeighbourList | None,
        reverse=False,
        log_Jf=False,
    ) -> tuple[CV, Array | None]:
        """Forward to the parent class implementation of ``compute_cv_trans``."""
        return super().compute_cv_trans(x, nl, reverse, log_Jf)

    @nn.nowrap
    def __mul__(self, other):
        """Compose two chains: the steps of ``self`` followed by those of ``other``.

        The steps are concatenated, matching ``CvTrans.__mul__``. Pairing them
        up with ``zip`` and adding them element-wise would drop steps whenever
        the two chains differ in length.
        """
        assert isinstance(other, CvTrans | CvTransNN)
        return CvTransNN(trans=[*self.trans, *other.trans])


class NormalizingFlow(nn.Module):
    """Normalizing flow built on a chain of CV transformations.

    ``flow`` may be a plain ``CvTrans`` or a ``CvTransNN``. ``setup`` stores the
    module that is actually evaluated as ``nn_flow``: a plain ``CvTrans`` is
    wrapped into a ``CvTransNN`` there, a ``CvTransNN`` is used as it is.
    """

    flow: CvTrans | CvTransNN

    def setup(self) -> None:
        """Create ``nn_flow`` from ``flow``."""
        # CvTransNN subclasses CvTrans, so the more specific type has to be
        # checked first; testing for CvTrans first would match both kinds and
        # leave the pass-through branch unreachable.
        if isinstance(self.flow, CvTransNN):
            self.nn_flow = self.flow
        else:
            self.nn_flow = CvTransNN(trans=self.flow.trans)

    def calc(self, x: CV, nl: NeighbourList | None, reverse: bool, test_log_det=False):
        """Transform ``x`` and return the result together with the log-determinant.

        Args:
            x: input CV.
            nl: neighbour list handed on to the flow.
            reverse: evaluate the flow in reverse.
            test_log_det: additionally compute ``log|det J|`` from the Jacobian
                obtained with ``jacrev`` and assert that it agrees with the
                value reported by the flow to within ``1e-5``.

        Returns:
            ``(a, b)``: the transformed CV and the log-determinant reported by
            ``nn_flow.compute_cv_trans(..., log_Jf=True)``.
        """
        a, b = self.nn_flow.compute_cv_trans(x, nl, reverse=reverse, log_Jf=True)

        if test_log_det:

            def transformed(xi):
                return self.nn_flow.compute_cv_trans(
                    xi,
                    nl,
                    reverse=reverse,
                    log_Jf=False,
                )[0]

            # jacrev of a CV-valued function of a CV yields a CV holding a CV,
            # hence the double `.cv` to reach the Jacobian array.
            jac = jacrev(transformed)(x).cv.cv
            b2 = jnp.log(jnp.abs(jnp.linalg.det(jac)))
            assert jnp.abs(b - b2) < 1e-5

        return a, b


class CvFlow:
    """Map ``SystemParams`` to a ``CV``, optionally followed by a ``CvTrans``.

    ``f0`` is the function from system parameters (and neighbour list) to a CV;
    ``f1`` is the transformation applied to its output, or ``None``.
    """

    def __init__(
        self,
        func: Callable[[SystemParams, NeighbourList | None], CV],
        trans: CvTrans | None = None,
    ) -> None:
        self.f0 = func
        self.f1 = trans

    @staticmethod
    def from_function(f: Callable[[SystemParams, NeighbourList | None], Array], atomic=False) -> CvFlow:
        """Build a flow from a function that returns a raw array.

        The array returned by ``f(sp, nl)`` is wrapped as
        ``CV(cv=..., atomic=atomic)``.
        """

        def f2(
            sp: SystemParams,
            nl: NeighbourList | None = None,
        ):
            return CV(cv=f(sp, nl), atomic=atomic)

        return CvFlow(func=f2)

    def compute_cv_flow(
        self,
        x: SystemParams,
        nl: NeighbourList | None = None,
        jit=True,
        chunk_size: int | None = None,
    ) -> CV:
        """Evaluate the flow for ``x``.

        Args:
            x: system parameters; batched input is mapped over axis 0 of ``x``
                and ``nl`` with ``vmap_chunked``.
            nl: neighbour list passed to ``f0`` and to the transformation.
            jit: wrap the single-sample evaluation in ``jax.jit``.
            chunk_size: chunk size handed to ``vmap_chunked``.

        Returns:
            The output of ``f0``, passed through ``f1`` when one is set.
        """
        if x.batched:
            return vmap_chunked(
                self.compute_cv_flow,
                in_axes=(0, 0, None, None),
                chunk_size=chunk_size,
            )(x, nl, jit, chunk_size)

        def _compute_cv_flow(x, nl):
            out = self.f0(x, nl)
            if self.f1 is not None:
                out, _ = self.f1.compute_cv_trans(out, nl)

            return out

        if jit:
            _compute_cv_flow = jax.jit(_compute_cv_flow)

        return _compute_cv_flow(x, nl)

    def __add__(self, other):
        """Return a flow whose output combines the CVs of ``self`` and ``other``."""
        assert isinstance(other, CvFlow)

        def f_add(x: SystemParams, nl: NeighbourList):
            cv1: CV = self.compute_cv_flow(x, nl)
            cv2: CV = other.compute_cv_flow(x, nl)

            return CV.combine(cv1, cv2)

        return CvFlow(func=f_add)

    def __mul__(self, other):
        """Return a flow that applies ``other`` after the existing transformation.

        ``self`` is left untouched: the result is a shallow copy with the
        extended transformation, so one flow can safely be combined with
        several different transformations.
        """
        import copy

        assert isinstance(other, CvTrans), "can only multiply by CvTrans object"

        combined = copy.copy(self)
        combined.f1 = other if self.f1 is None else self.f1 * other

        return combined

    def find_sp(
        self,
        x0: SystemParams,
        target: CV,
        target_nl: NeighbourList,
        nl0: NeighbourList | None = None,
        maxiter=10000,
        tol=1e-4,
        norm=lambda cv1, cv2, nl1, nl2: jnp.linalg.norm(cv1 - cv2),
        solver=jaxopt.GradientDescent,
    ) -> SystemParams:
        """Iteratively adjust ``x0`` so that its CV approaches ``target``.

        Args:
            x0: starting system parameters.
            target: CV to approach.
            target_nl: neighbour list belonging to ``target``; passed to ``norm``.
            nl0: neighbour list for ``x0``. The loss calls ``nl.update``, so a
                neighbour list has to be supplied despite the ``None`` default.
            maxiter: number of solver update steps performed by this method
                (the solver object itself is constructed with ``maxiter=10``).
            tol: tolerance handed to the solver constructor.
            norm: callable ``norm(cv, target_cv, nl, target_nl)`` giving the
                scalar that is minimised.
            solver: solver class, constructed with
                ``fun``, ``tol``, ``has_aux`` and ``maxiter``.

        Returns:
            The system parameters after the last update step.
        """

        def loss(sp: SystemParams, nl: NeighbourList, norm):
            b, nl = jit(nl.update)(sp)
            cvi = self.compute_cv_flow(sp, nl)
            dist = norm(cvi.cv, target.cv, nl, target_nl)

            return dist, (b, nl, dist)  # aux output

        _l = jit(partial(loss, norm=norm))

        slvr = solver(
            fun=_l,
            tol=tol,
            has_aux=True,
            maxiter=10,
        )
        state = slvr.init_state(x0, nl=nl0)
        r = jit(slvr.update)

        for _ in range(maxiter):
            x0, state = r(x0, state, nl=nl0)
            b, nl0, dist = state.aux

            print(
                f"step:{state.iter_num} norm {dist:.14f} err {state.error:.4f} update nl={not b}",
            )

            # `b` is the first value returned by `nl.update`; when it is falsy
            # the neighbour list is rebuilt from the current parameters.
            if not b:
                nl0 = x0.get_neighbour_list(
                    r_cut=nl0.r_cut,
                    r_skin=nl0.r_skin,
                    z_array=nl0.z_array,
                )

        # Return the optimised parameters, as the signature promises, rather
        # than the loss value evaluated at them.
        return x0


######################################
#       Collective variable          #
######################################


class CollectiveVariable:
    """Couple a ``CvFlow`` with a ``CvMetric`` and evaluate the CV and its Jacobian."""

    def __init__(self, f: CvFlow, metric: CvMetric, jac=jacrev) -> None:
        """Store the flow, the metric and the Jacobian transform.

        Args:
            f: flow evaluated by :meth:`compute_cv`.
            metric: metric of the CV; its ``ndim`` is exposed as :attr:`n`.
            jac: function transform used to obtain the Jacobian, ``jacrev``
                unless stated otherwise.
        """
        self.f = f
        self.metric = metric
        self.jac = jac

    @partial(jit, static_argnums=(0,))
    def _jit_f(self, sp, nl):
        """Jitted evaluation of the flow."""
        return self.f.compute_cv_flow(sp, nl)

    @partial(jit, static_argnums=(0,))
    def _jit_df(self, sp, nl):
        """Jitted evaluation of the flow's Jacobian."""
        jac_fn = self.jac(self.f.compute_cv_flow)
        return jac_fn(sp, nl)

    def compute_cv(
        self,
        sp: SystemParams,
        nl: NeighbourList | None = None,
        jacobian=False,
        jit=True,
        chunk_size: int | None = None,
    ) -> tuple[CV, CV]:
        """Evaluate the CV, and on request its Jacobian, for ``sp``.

        Args:
            sp: system parameters; batched input is mapped over axis 0 with
                ``vmap_chunked``.
            nl: neighbour list. For batched ``sp`` it is either ``None`` or
                batched as well, in which case it is mapped along with ``sp``.
            jacobian: also compute the Jacobian with ``self.jac``.
            jit: use the jitted helpers instead of calling the flow with
                ``jit=False``.
            chunk_size: chunk size handed to ``vmap_chunked``.

        Returns:
            ``(cv, dcv)`` where ``dcv`` is ``None`` unless ``jacobian`` is set.
        """
        if sp.batched:
            if nl is None:
                nl_axis = None
            else:
                assert nl.batched
                nl_axis = 0

            batched_fn = vmap_chunked(
                self.compute_cv,
                in_axes=(0, nl_axis, None, None, None),
                chunk_size=chunk_size,
            )
            return batched_fn(sp, nl, jacobian, jit, chunk_size)

        if not jit:
            cv = self.f.compute_cv_flow(sp, nl, jit=False)
            dcv = self.jac(self.f.compute_cv_flow)(sp, nl, jit=False) if jacobian else None
            return (cv, dcv)

        cv = self._jit_f(sp, nl)
        dcv = self._jit_df(sp, nl) if jacobian else None
        return (cv, dcv)

    @property
    def n(self):
        """Value of ``metric.ndim``."""
        return self.metric.ndim