deepmodeling · KuangYu · Apr 7, 2024 · Jan 22, 2024 · Jan 22, 2024 · Jan 22, 2024
diff --git a/dmff/difftraj.py b/dmff/difftraj.py
@@ -0,0 +1,243 @@
+import jax
+import jax.numpy as jnp
+from jax import jit, value_and_grad, vmap, grad, vjp, tree_util, custom_jvp
+from functools import partial
+from .common.nblist import NeighborListFreud
+
+
+class Loss_Generator:
+    """Build loss functions over a simulated trajectory, differentiated by a backward (adjoint) pass."""
+
+    def __init__(self, f_nout, box, pos0, mass, dt, nsteps, nout, cov_map, rc, efunc):
+        """ Constructor
+
+        Parameters
+        ----------
+        f_nout: function
+            Function of state user defined.
+        box: jnp.ndarray
+            Box of system, 3*3.
+        pos0: jnp.ndarray
+            Initial position used to allocate nblist.
+        mass: jnp.ndarray
+            Mass of each atom.
+        dt: float
+            Time step in simulation.
+        nsteps: int
+            Total steps in simulation.
+        nout: int
+            Get state in every nout steps.
+        cov_map: jnp.ndarray
+            Cov_map matrix.
+        rc: float
+            Cutoff distance in nblist.
+        efunc: function
+            Potential energy function, called as efunc(pos, box, pairs, params).
+        """
+
+        self.f_nout = f_nout
+        self.box = box
+        # repeat each mass 3 times -> shape (len(mass), 3); used as the divisor of the force in vv_step
+        mass = jnp.tile(mass.reshape([len(mass), 1]), (1, 3))
+        self.dt = dt
+        self.nsteps = nsteps
+        self.nout = nout
+        nbl = NeighborListFreud(box, rc, cov_map)
+        nbl.allocate(pos0)
+
+        def return_pairs(pos):
+            # stop_gradient: the neighbor-list update is not differentiated
+            pos = jax.lax.stop_gradient(pos)
+            nbl.update(pos)
+            return nbl.pairs
+
+        # bonds[i]: index i followed by every index j with cov_map[i][j] > 0
+        bonds = [jnp.concatenate([jnp.array([i]), jnp.where(row > 0)[0]]) for i, row in enumerate(cov_map)]
+
+        @jit
+        def regularize_pos(pos):
+            # cpos[i]: mean position of the atoms in bonds[i]; atom i is moved by the
+            # shift that wraps cpos[i] back into the box (fractional coordinates in [0, 1))
+            cpos = jnp.stack([jnp.sum(pos[bond], axis=0)/len(bond) for bond in bonds])
+            box_inv = jnp.linalg.inv(box)
+            spos = cpos.dot(box_inv)
+            spos -= jnp.floor(spos)
+            shift = spos.dot(box) - cpos
+            return pos + shift
+
+        self.states_axis = {'pos': 0, 'vel': 0}
+        # use leap-frog Verlet integration method (v_0.5, x1) -> (v_1.5, x2)
+        @jit
+        def vv_step(state, params, pairs):
+            x0 = state['pos']
+            v0 = state['vel']
+            f0 = -grad(efunc, argnums=(0))(x0, box, pairs, params)
+            a0 = f0 / mass
+            v1 = v0 + a0 * dt
+            x1 = x0 + v1 * dt
+            x1 = regularize_pos(x1)
+            return {'pos': x1, 'vel': v1}
+
+        self.return_pairs = return_pairs
+        self.regularize_pos = regularize_pos
+        self.vv_step = vv_step
+
+    def ode_fwd(self, state, params):
+        """
+        Run forward to get 'trajectory'
+
+        Parameters
+        ----------
+        state: dict
+            Initial state, {'pos': jnp.ndarray, 'vel': jnp.ndarray}
+        params: dict
+            Forcefield parameters
+
+        Returns
+        ----------
+        state: dict
+            Final state, {'pos': jnp.ndarray, 'vel': jnp.ndarray}
+        traj: dict
+            Save each 'state' in 'trajectory', {'time': jnp.ndarray, 'state': jnp.ndarray}
+        """
+
+        def fwd(state):
+            # advance nout steps; pairs are rebuilt for every leading-axis entry of 'pos'
+            for _ in range(self.nout):
+                pairs = jnp.stack([self.return_pairs(x) for x in state['pos']])
+                state = vmap(self.vv_step, in_axes=(self.states_axis, None, 0), out_axes=(0))(state, params, pairs)
+            return state
+        # nsteps // nout blocks are run; any remainder nsteps % nout is not integrated
+        nblocks = self.nsteps // self.nout
+        traj = {}
+        traj['time'] = jnp.zeros(nblocks + 1)
+        traj0 = self.f_nout(state)
+        traj['state'] = jnp.repeat(traj0[jnp.newaxis, ...], nblocks + 1, axis=0)
+        for i in range(nblocks):
+            state = fwd(state)
+            traj['time'] = traj['time'].at[i+1].set(self.nout*self.dt*(i+1))
+            traj['state'] = traj['state'].at[i+1].set(self.f_nout(state))
+        return state, traj
+
+    def _ode_bwd(self, state, params, gradient_traj):
+        """
+        Run backward to get final adjoint_state and gradient
+
+        Parameters
+        ----------
+        state: dict
+            Final state, {'pos': jnp.ndarray, 'vel': jnp.ndarray}
+        params: dict
+            Forcefield parameters
+        gradient_traj: jnp.ndarray
+            Derivatives of Loss with respect to 'state' in traj
+
+        Returns
+        ----------
+        adjoint_state: dict
+            Final adjoint state, {'pos': jnp.ndarray, 'vel': jnp.ndarray}
+        gradient: dict
+            Gradient of Loss with respect to params
+        """
+        def batch_vjp(state, params, pairs, adjoint_state):
+            _, vv_vjp = vjp(partial(self.vv_step, pairs=pairs), state, params)
+            (grad_state, grad_params) = vv_vjp(adjoint_state)
+            return grad_state, grad_params
+
+        def bwd(state, adjoint_state, gradient):
+            # per step: step back once, rebuild that step's forward input, pull the adjoint through vv_step, flip back
+            for _ in range(self.nout):
+                pairs = jnp.stack([self.return_pairs(x) for x in state['pos']])
+                state = vmap(self.vv_step, in_axes=(self.states_axis, None, 0), out_axes=(0))(state, params, pairs)
+                state['vel'] = - state['vel']
+                state['pos'] = state['pos'] + state['vel']* self.dt
+                state['pos'] = vmap(self.regularize_pos)(state['pos'])
+                pairs = jnp.stack([self.return_pairs(x) for x in state['pos']])
+                (grad_state, grad_params) = vmap(batch_vjp, in_axes=(self.states_axis, None, 0, self.states_axis))(state, params, pairs, adjoint_state)
+                gradient = tree_util.tree_map(lambda p, u: p + jnp.sum(u, axis=0), gradient, grad_params)
+                adjoint_state = grad_state
+                state['pos'] = state['pos'] - state['vel']*self.dt
+                state['pos'] = vmap(self.regularize_pos)(state['pos'])
+                state['vel'] = - state['vel']
+            return state, adjoint_state, gradient
+        # work on a shallow copy so the caller's state dict is not modified in place
+        state = dict(state)
+        _, f_vjp = vjp(self.f_nout, state)
+        adjoint_state = f_vjp(gradient_traj[-1])[0]
+        gradient = tree_util.tree_map(jnp.zeros_like, params)
+        # (v_1.5, x2) -> (-v_1.5, x1)
+        state['pos'] = state['pos'] - state['vel']*self.dt
+        state['pos'] = vmap(self.regularize_pos)(state['pos'])
+        state['vel'] = - state['vel']
+        for i in range(self.nsteps//self.nout):
+            state, adjoint_state, gradient = bwd(state, adjoint_state, gradient)
+            _, f_vjp = vjp(self.f_nout, state)
+            adjoint_state = {key: adjoint_state[key] + f_vjp(gradient_traj[-(i+2)])[0][key] for key in state}
+        return adjoint_state, gradient
+
+    def generate_Loss(self, L, has_aux=False, metadata=None):
+        """
+        Generate Loss function
+
+        Parameters
+        ----------
+        L:  function
+            The 'Loss' function user defined, input: traj['state'], output: loss
+        has_aux: bool
+            If the L function returns auxiliary data
+        metadata: list, optional
+            Record the traj and auxiliary data, {'traj':traj, 'aux_data':aux_data}.
+            One record is appended per evaluation; a new list is used when None.
+
+        Returns:
+        ----------
+        Loss: function
+            Loss function
+        """
+        # a `metadata=[]` default would be shared by every Loss generated without one
+        if metadata is None:
+            metadata = []
+
+        @custom_jvp
+        def Loss(initial_state, params):
+            """
+            This function returns the loss.
+
+            Parameters
+            ----------
+            initial_state: dict
+                Initial state, {'pos': jnp.ndarray, 'vel': jnp.ndarray}
+            params: dict
+                The parameter dictionary.
+
+            Returns:
+            ----------
+            loss: float
+                Loss
+            """
+            final_state, traj = self.ode_fwd(initial_state, params)
+            if has_aux:
+                loss, aux_data = L(traj['state'])
+                metadata.append({'traj':traj, 'aux_data':aux_data})
+            else:
+                loss = L(traj['state'])
+                metadata.append({'traj':traj})
+            return loss
+
+        @Loss.defjvp
+        def _f_jvp(primals, tangents):
+            x, y = primals
+            x_dot, y_dot = tangents
+            final_state, traj = self.ode_fwd(x, y)
+            if has_aux:
+                (primal_out, aux_data), gradient_traj = value_and_grad(L, has_aux=True)(traj['state'])
+                metadata.append({'traj':traj, 'aux_data':aux_data})
+            else:
+                primal_out, gradient_traj = value_and_grad(L)(traj['state'])
+                metadata.append({'traj':traj})
+            adjoint_state, gradient = self._ode_bwd(final_state, y, gradient_traj)
+            tangent_out = sum(tree_util.tree_leaves(tree_util.tree_map(lambda p, u: jnp.sum(p * u), adjoint_state, x_dot))) + sum(tree_util.tree_leaves(tree_util.tree_map(lambda p, u: jnp.sum(p * u), gradient, y_dot)))
+            return primal_out, tangent_out
+
+        return Loss
+
diff --git a/docs/user_guide/4.8DiffTraj.md b/docs/user_guide/4.8DiffTraj.md
@@ -0,0 +1,68 @@
+# DiffTraj
+## 1. Theory
+DiffTraj supports computing the gradient of a loss function defined on a trajectory. First an NVE (leap-frog Verlet) simulation is run, and then the gradient is computed from the resulting trajectory.
+### 1.1 NVE simulation
+The NVE simulation follows the leap-frog Verlet integration method, just like in OpenMM. The positions and velocities stored in the context are offset from each other by half a time step. In each step, they are updated as follows:
+
+```math
+\begin{aligned}
+\mathbf{v}_i(t+\Delta t / 2) & =\mathbf{v}_i(t-\Delta t / 2)+\mathbf{f}_i(t) \Delta t / m_i \\
+\mathbf{r}_i(t+\Delta t) & =\mathbf{r}_i(t)+\mathbf{v}_i(t+\Delta t / 2) \Delta t
+\end{aligned}
+```
+where $\mathbf{v}_i$ is the velocity of particle i, $\mathbf{r}_i$ is its position, $\mathbf{f}_i$ is the force acting on it, obtained by automatic differentiation of the energy, $m_i$ is its mass, and $\Delta t$ is the time step.
+### 1.2 Gradient calculation
+Naively applying automatic differentiation (`jax.grad`) to the whole trajectory may cause out-of-memory (OOM) problems. In DiffTraj, we instead use the adjoint method: a reverse calculation that exploits the time reversibility of the NVE integrator to accumulate the gradient. The loss function is
+
+```math
+L\left( \mathbf{z}\left( t_1 \right) \right) =L\left( \mathbf{z}\left( t_0 \right) +\int_{t_0}^{t_1}{f\left( \mathbf{z}\left( t \right) ,\ t,\ \theta \right) dt} \right) =L\left( \text{ODESolve}\left( \mathbf{z}\left( t_0 \right) ,\ f,\ t_0,\ t_1,\ \theta \right) \right) 
+```
+
+where $L$ is the loss function, $\mathbf{z}\left( t_1 \right)$ is the state (velocity and position) at time $t_1$, $f$ is the integrator, and $\theta$ is the parameter. The gradient calculation starts at the final state. The adjoint state is defined as $\mathbf{a}\left( t \right) =\frac{\partial L}{\partial \mathbf{z}\left( t \right)}$, and the gradient is calculated using the chain rule:
+
+```math
+\frac{\partial L}{\partial \mathbf{z}\left( t_0 \right)}=\frac{\partial L}{\partial \mathbf{z}\left( t_1 \right)}\frac{\partial \mathbf{z}\left( t_1 \right)}{\partial \mathbf{z}\left( t_0 \right)}
+```
+
+```math
+\frac{\partial L}{\partial \theta}=\mathbf{a}\left( t_1 \right) ^T\frac{\partial f\left( \mathbf{z}\left( t_0 \right) ,\ \theta \right)}{\partial \theta}
+```
+
+When the Loss function is a function of trajectory, the calculation follows:
+
+[![grad.png](https://i.postimg.cc/pdm6fWX1/grad.png)](https://postimg.cc/nst2Ztmv)
+
+### References
+1. [Neural Ordinary Differential Equations](https://doi.org/10.48550/arXiv.1806.07366)
+
+## 2. Function module
+
+Class `Loss_Generator`:
+- Set the condition of simulation.
+- Contains the leap-frog Verlet integration method.
+
+Function `ode_fwd`:
+- Run the NVE simulation.
+- Get the trajectory.
+
+Function `generate_Loss`:
+- Generate the Loss function.
+
+## 3. How to use it
+Here we show how to use `Loss_Generator` and obtain the gradient.
+- Initialization: Create an instance of the `Loss_Generator`.
+
+```python
+Generator = Loss_Generator(f_nout, box, init_state['pos'][0], mass, dt, nsteps, nout, cov_map, rc, efunc)
+```
+You can use the Generator to run only an NVE simulation, or to run both the NVE simulation and the gradient calculation.
+
+- Only do an NVE simulation
+```python
+final_state, traj = Generator.ode_fwd(init_state, params)
+```
+- Define Loss function and get gradient
+```python
+Loss = Generator.generate_Loss(L, has_aux=True, metadata=metadata)
+v, g = value_and_grad(Loss, argnums=(1))(init_state, params)
+```
diff --git a/docs/user_guide/4.modules.md b/docs/user_guide/4.modules.md
@@ -9,3 +9,4 @@ In this part, you will see 7 modules of DMFF, some of which are newly released i
 + [Optimization](./4.5Optimization.md)
 + [Mbar Estimator](./4.6MBAR.md)
 + [OpenMM Plugin](./4.7OpenMMplugin.md)
++ [DiffTraj](./4.8DiffTraj.md)