# Source code for snrv.snrv

if __name__ == "__main__":
    # Runs only when this file is executed directly as a script (never on import);
    # the only action taken is printing the string '0'.
    print('0')

import numpy as np

import torch
import torch.optim as optim
import torch.nn as nn
from torch.utils.data import Dataset, DataLoader
from torch.utils.data.dataset import random_split

from tqdm import tqdm

# Public names exported by a star-import of this module.
# NOTE(review): 'load_snrv' is not defined in the part of the file reviewed here --
# presumably it is defined further down; confirm.
__all__ = ['DatasetSnrv', 'Snrv', 'load_snrv']


class DatasetSnrv(Dataset):
    """
    Dataset of time-lagged frame pairs, with one path weight per pair, for the Snrv class

    Parameters
    ----------
    data : float tensor (single traj) or list of float tensors (multi traj); dim 0 = steps, dim 1 = features
        time-continuous trajectories

    lag : int
        lag in steps to apply to data trajectory; must be >= 1

    ln_pathweight : torch.tensor (single traj) or list of torch.tensor (multi traj), one entry per step, or None
        log Girsanov path weights between frames in the trajectory;
        Girsanov theorem measure of the probability of the observed sample path under a target potential
        relative to that which was actually observed under the simulation potential;
        pass None when target potential == simulation potential (no reweighting rqd)

    Attributes
    ----------
    self.lag : int
        lag in steps

    self.x_t0 : float tensor, n x dim, n = observations, dim = dimensionality of trajectory featurization
        non-time-lagged trajectory (frames t); multiple trajectories are concatenated along dim 0

    self.x_tt : float tensor, n x dim, n = observations, dim = dimensionality of trajectory featurization
        time-lagged trajectory (frames t + lag), aligned row by row with self.x_t0

    self.pathweight : float tensor, n = observations
        pathweight of each (x_t0, x_tt) pair: exp of the sum of ln_pathweight[t + 1 : t + lag];
        all ones if ln_pathweight is None

    Raises
    ------
    ValueError
        if lag < 1

    TypeError
        if data is neither a torch.Tensor nor a list

    AssertionError
        if the trajectories / log path weights have inconsistent types or lengths
    """

    def __init__(self, data, lag, ln_pathweight):

        # lag == 0 would give data[:-0] == empty but data[0:] == full, i.e. mismatched pairs
        if lag < 1:
            raise ValueError("lag must be >= 1 step; got %s" % (lag,))

        self.lag = lag

        if isinstance(data, list):

            for traj in data:
                assert isinstance(traj, torch.Tensor)

            if ln_pathweight is None:
                ln_pathweight = [None] * len(data)
            else:
                assert isinstance(ln_pathweight, list)
                assert len(data) == len(ln_pathweight)

            # pairs are formed per trajectory so that no pair straddles a trajectory boundary
            pairs = [self._lagged_pairs(traj, ln_w, lag) for traj, ln_w in zip(data, ln_pathweight)]

            x_t0 = torch.cat([p[0] for p in pairs], dim=0)
            x_tt = torch.cat([p[1] for p in pairs], dim=0)
            pathweight = torch.cat([p[2] for p in pairs], dim=0)

        elif isinstance(data, torch.Tensor):

            x_t0, x_tt, pathweight = self._lagged_pairs(data, ln_pathweight, lag)

        else:
            raise TypeError(
                "Data type %s is not supported; must be a float tensor (single traj) or list of float tensors (multi "
                "traj)" % type(data))

        self.x_t0 = x_t0
        self.x_tt = x_tt
        self.pathweight = pathweight

    @staticmethod
    def _lagged_pairs(traj, ln_pathweight, lag):
        """
        Build the lagged pairs and their path weights for a single trajectory

        Parameters
        ----------
        traj : torch.tensor, steps x dim
            single trajectory

        ln_pathweight : torch.tensor with one entry per step, or None
            log path weights for this trajectory

        lag : int
            lag in steps (>= 1)

        Return
        ------
        x_t0 : torch.tensor
            traj[:-lag]

        x_tt : torch.tensor
            traj[lag:]

        pathweight : torch.tensor, one entry per pair
            exp(sum(ln_pathweight[t + 1 : t + lag])) for each pair t; ones if ln_pathweight is None
        """
        if ln_pathweight is not None:
            assert isinstance(ln_pathweight, torch.Tensor)
            assert traj.size()[0] == ln_pathweight.size()[0]

        x_t0 = traj[:-lag]
        x_tt = traj[lag:]

        n_pairs = x_tt.size()[0]
        pathweight = torch.ones(n_pairs)

        # NOTE(review): the window t+1 .. t+lag-1 holds lag-1 entries, so lag == 1 always yields unit
        # weights (empty sum); confirm this matches the convention of the supplied log weights.
        if ln_pathweight is not None and lag > 1 and n_pairs > 0:
            # sliding windows of length lag-1 starting at index t+1, one per pair (a view, no copy)
            windows = ln_pathweight[1:].unfold(0, lag - 1, 1)[:n_pairs]
            # sum over everything but the pair index, mirroring torch.sum over the whole slice
            ln_w = windows.sum(dim=tuple(range(1, windows.dim())))
            # copy_ keeps the dtype / device of the torch.ones(...) buffer
            pathweight.copy_(torch.exp(ln_w))

        return x_t0, x_tt, pathweight

    def __getitem__(self, index):
        """Return the (x_t0, x_tt, pathweight) triple stored at `index`."""
        return self.x_t0[index], self.x_tt[index], self.pathweight[index]

    def __len__(self):
        """Return the number of lagged pairs held by the dataset."""
        assert len(self.x_t0) == len(self.x_tt) == len(self.pathweight)
        return len(self.x_t0)


[docs]class Snrv(nn.Module):
    """
    ANN encoder for state-free reversible VAMPnet

    Parameters
    ----------
    input_size : int
        number of neurons in input layer

    output_size : int
        number of neurons in output layer corresponding to number of basis functions to compute for VAC / VAMP

    hidden_depth : int, default = 2
        number of hidden layers

    hidden_size : int, default = 100
        number of neurons in each hidden layer

    activation : torch.nn.Module instance, default = nn.ReLU()
        activation module applied after each hidden layer

    batch_norm : bool, default = False
        use batch normalization after each layer

    dropout_rate : float, default = 0.
        dropout rate to use in each layer

    lr : float, default = 0.1
        learning rate for Adam optimizer

    weight_decay : float, default = 0.
        weight decay for Adam optimizer

    val_frac : float, default = 0.2
        fraction of data to place in validation partition; balance is used for training

    n_epochs : int, default = 100
        number of training epochs for ANN

    batch_size : int, default = 100
        no. of instances per mini batch

    VAMPdegree: int, default = 2
        exponent to use in VAMP-r score loss function

    is_reversible : bool, default = True
        indicator flag as to whether to enforce detailed balance by symmetrizing trajectory by augmenting with time
        reversed twin and solve VAC OR not assume microscopic reversibility and solve VAMP

    Attributes
    ----------
    self.device : str
        specification as to whether to use 'cpu' or 'cuda' for model training

    self.is_fitted : bool
        indicator flag as to whether or not model has been fitted

    self._train_loader : DataLoader object
        training data loader

    self._val_loader : DataLoader object
        validation data loader

    self.lag : int
        lag in steps to apply to data trajectory

    self.optimizer : torch.optim.Adam object
        optimizer for backpropagation

    self._train_step : function
        training step function produced by self._make_train_step

    self.evals : torch.tensor, n_comp, n_comp = no. of basis functions in ANN == output_size
        eigenvalues of VAC generalized eigenvalue problem finding linear combination of learned basis functions to
        produce approximations of transfer operator eigenvectors in non-ascending order OR singular values of VAMP
        singular value problem finding linear combination of learned basis functions to produce approximations of
        transfer operator left and right singular vectors in non-ascending order

    self.expansion_coefficients : n_comp, n_comp = no. of basis functions in ANN == output_size
        expansion coefficients for linear combination of learned basis functions into transfer operator eigenvectors
        (reversible) or left singular vectors (non-reversible)

    self.expansion_coefficients_right : n_comp, n_comp = no. of basis functions in ANN == output_size
        expansion coefficients for linear combination of learned basis functions into transfer operator right
        singular vectors (non-reversible)

    self.training_losses : list, n_epoch
        loss over training data in each epoch

    self.validation_losses : list, n_epoch
        loss over validation data in each epoch
    """

[docs]    def __init__(self, input_size, output_size, hidden_depth=2, hidden_size=100, activation=nn.ReLU(), batch_norm=False,
                 dropout_rate=0., lr=0.1, weight_decay=0., val_frac=0.2, n_epochs=100, batch_size=100, VAMPdegree=2,
                 is_reversible=True):

        super().__init__()

        assert 0. < val_frac < 1.
        assert isinstance(VAMPdegree, int) and VAMPdegree > 0

        self.input_size = input_size
        self.output_size = output_size
        self.hidden_depth = hidden_depth
        self.hidden_size = hidden_size
        self.activation = activation
        self.batch_norm = batch_norm
        self.dropout_rate = dropout_rate
        self.lr = lr
        self.weight_decay = weight_decay
        self.val_frac = val_frac
        self.n_epochs = n_epochs
        self.batch_size = batch_size
        self.VAMPdegree = VAMPdegree
        self.is_reversible = is_reversible

        # building SNRV encoder as simple feedforward ANN
        self.layers = nn.ModuleList()
        self.layers.append(nn.Linear(self.input_size, self.hidden_size))
        if self.dropout_rate > 0.:
            self.layers.append(nn.Dropout(self.dropout_rate))
        if self.batch_norm == True:
            self.layers.append(nn.BatchNorm1d(self.hidden_size))
        self.layers.append(self.activation)
        for k in range(hidden_depth - 1):
            self.layers.append(nn.Linear(self.hidden_size, self.hidden_size))
            if self.dropout_rate > 0.:
                self.layers.append(nn.Dropout(self.dropout_rate))
            if self.batch_norm == True:
                self.layers.append(nn.BatchNorm1d(self.hidden_size))
            self.layers.append(self.activation)
        self.layers.append(nn.Linear(self.hidden_size, self.output_size))

        # cached variables
        self.device = 'cuda' if torch.cuda.is_available() else 'cpu'
        self.is_fitted = False
        self._train_loader = None
        self._val_loader = None
        self.lag = None
        self.optimizer = None
        self._train_step = None
        self.training_losses = None
        self.validation_losses = None
        self.evals = None
        self.expansion_coefficients = None
        self.expansion_coefficients_right = None

    def forward(self, x_t0, x_tt):
        """
        Forward pass through network

        Parameters
        ----------
        x_t0 : torch.tensor, n x dim, n = observations, dim = dimensionality of trajectory featurization
            trajectory

        x_tt : torch.tensor, n x dim, n = observations, dim = dimensionality of trajectory featurization
            time-lagged trajectory of same length as trajectory

        Return
        ------
        z_t0 : torch.tensor, n x n_comp, n = observations, n_comp = number of basis functions produced by network
            trajectory projected into basis functions learned by SNRV encoder

        z_tt : torch.tensor, n x n_comp, n = observations, n_comp = number of basis functions produced by network
            time-lagged trajectory of same length as trajectory projected into basis functions learned by SNRV encoder
        """
        assert x_tt.size()[0] == x_t0.size()[0]

        # passing inputs through ANN to project into self.output_size basis vectors
        for layer in self.layers:
            x_t0 = layer(x_t0)

        for layer in self.layers:
            x_tt = layer(x_tt)

        return x_t0, x_tt  # really z_t0, z_tt resulting from passing x_t0, x_tt through network

    @staticmethod
    def _stable_symmetric_inverse(A, ret_sqrt=False):
        """
        Utility function to return stable inverse A^(-1) or sqrt of inverse A^(-0.5) of a symmetric matrix A
        Ref.: https://github.com/markovmodel/deeptime

        Proceeds by diagonalizing matrix, setting eigenvalues smaller than threshold to zero, performing operations
        on diagonlized matrix, reprojecting back to original basis

        Parameters
        ----------
        A : torch.tensor
            symmetric matrix

        ret_sqrt : bool, default = False
            indicator flag as to whether to return square root of inverse

        Return
        ------
        B : torch.tensor
            stable inverse approximation to A^(-1) or A^(-0.5) depending on ret_sqrt flag
        """
        assert torch.allclose(A, A.t())

        w, V = torch.linalg.eigh(A)

        w_threshold = torch.zeros_like(w)
        for ii in range(w.size()[0]):
            if w[ii] > torch.finfo(torch.float32).eps:
                w_threshold[ii] = w[ii]

        if ret_sqrt:
            B = torch.matmul(V, torch.matmul(torch.diag(w_threshold ** (-0.5)), V.t()))
        else:
            B = torch.matmul(V, torch.matmul(torch.diag(w_threshold ** (-1)), V.t()))

        return B

    @staticmethod
    def _gen_eig_chol(C, Q):
        """
        Solution of symmetric generalized eigenvalue problem using Cholesky decomposition to convert to regular eigenvalue problem
        Ref: Sidky, Chen, Ferguson J. Chem. Phys. 150, 214114 (2019); doi: 10.1063/1.5092521

        C*v_i = w_i*Q*v_i (generalized eigenvalue problem)

        Q = L*LT
        Ctilde = Linv*C*LTinv
        vtilde_i = LT*v_i

        Ctilde*vtilde_i = w_i*v_i (regular eigenvalue problem)
        v_i = LTinv*vtilde_i

        Parameters
        ----------
        C : torch.tensor
            symmetric matrix

        Q : torch.tensor
            symmetric matrix

        Return
        ------
        w : torch.tensor
            eigenvalues in non-ascending order

        v : torch.tensor
            eigenvectors in non-ascending order
        """

        # Cholesky
        L = torch.linalg.cholesky(Q)
        Linv = torch.linalg.inv(L)
        LTinv = torch.linalg.inv(L.t())

        # Ctilde
        Ctilde = torch.matmul(Linv, torch.matmul(C, LTinv))

        # regular eigenvalue problem
        w, vtilde = torch.linalg.eigh(Ctilde)

        # correcting to generalized eigenvalue eigenvectors
        v = torch.matmul(LTinv, vtilde)

        # reordering to non-ascending
        w = torch.flip(w, [0])
        v = torch.flip(v, [1])

        return w, v

    @staticmethod
    def _accumulate_correlation_matrices(z_t0, z_tt, pathweight, C00, C01, C10, C11):
        """
        Accumulating instantaneous and time-lagged correlations in z_t0 and z_tt into pre-existing C00, C01, C10, C11

        Parameters
        ----------
        z_t0 : torch.tensor, n x n_comp, n = observations, n_comp = number of basis functions produced by network
            trajectory projected into basis functions learned by SNRV encoder

        z_tt : torch.tensor, n x n_comp, n = observations, n_comp = number of basis functions produced by network
            time-lagged trajectory of same length as trajectory projected into basis functions learned by SNRV encoder

        pathweight : float tensor, n = observations
            pathweights from Girsanov theorem between time lagged observations;
            identically unity (no reweighting rqd) for target potential == simulation potential

        C00 : torch.tensor, n_comp x n_comp
            correlation of z_t0 with z_t0

        C01 : torch.tensor, n_comp x n_comp
            correlation of z_t0 with z_tt

        C10 : torch.tensor, n_comp x n_comp
            correlation of z_tt with z_t0

        C11 : torch.tensor, n_comp x n_comp
            correlation of z_tt with z_tt

        Return
        ------
        C00 : torch.tensor, n_comp x n_comp
            correlation of z_t0 with z_t0

        C01 : torch.tensor, n_comp x n_comp
            correlation of z_t0 with z_tt

        C10 : torch.tensor, n_comp x n_comp
            correlation of z_tt with z_t0

        C11 : torch.tensor, n_comp x n_comp
            correlation of z_tt with z_tt
        """

        assert z_t0.size()[0] == z_tt.size()[0] == pathweight.size()[0]
        assert z_t0.size()[1] == z_tt.size()[1]

        W = torch.tile(torch.reshape(pathweight, (-1, 1)), (1, z_tt.size()[1]))
        z_tt_r = torch.multiply(W, z_tt)
        C00 += torch.matmul(z_t0.t(), z_t0)
        C01 += torch.matmul(z_t0.t(), z_tt_r)
        C10 += torch.matmul(z_tt_r.t(), z_t0)
        C11 += torch.matmul(z_tt.t(), z_tt)

        return C00, C01, C10, C11

    def _loss_fn(self, z_t0, z_tt, pathweight):
        """
        VAC / VAMP VAMP-r loss function

        Parameters
        ----------
        z_t0 : torch.tensor, n x n_comp, n = observations, n_comp = number of basis functions produced by network
            trajectory projected into basis functions learned by SNRV encoder

        z_tt : torch.tensor, n x n_comp, n = observations, n_comp = number of basis functions produced by network
            time-lagged trajectory of same length as trajectory projected into basis functions learned by SNRV encoder

        pathweight : float tensor, n = observations
            pathweights from Girsanov theorem between time lagged observations;
            identically unity (no reweighting rqd) for target potential == simulation potential

        Return
        ------
        loss : float
            negative squared sum of eigenvalues from solving VAC generalized eigenvalue problem OR VAMP singular value problem
        """

        assert z_t0.size()[0] == z_tt.size()[0] == pathweight.size()[0]
        assert z_t0.size()[1] == z_tt.size()[1]

        # VAC / VAMP on instantaneous z_t0 and time-lagged z_tt trajectories projected into ANN basis functions
        # Ref.: Noe arXiv:1812.07669v1
        dim = z_t0.size()[1]

        # - accumulating correlation matrices
        C00 = torch.zeros(dim, dim).to(self.device)
        C01 = torch.zeros(dim, dim).to(self.device)
        C10 = torch.zeros(dim, dim).to(self.device)
        C11 = torch.zeros(dim, dim).to(self.device)
        C00, C01, C10, C11 = self._accumulate_correlation_matrices(z_t0, z_tt, pathweight, C00, C01, C10, C11)

        if self.is_reversible:

            # VAC
            # Ref.: Noe arXiv:1812.07669v1

            # - assuming detailed balance (i.e., data augmentation with time reversed trajectories)
            Q = 0.5 * (C00 + C11)
            C = 0.5 * (C01 + C10)

            # - applying regularization (nugget regularization of unpopulated bins with pseudocounts)
            # Q += torch.eye(Q.size()[0], dtype=torch.float, requires_grad=False)*torch.finfo(torch.float32).eps

            # solving generalized eigenvalue problem Cv = wQv using Cholesky trick to enable backpropagation
            evals, _ = self._gen_eig_chol(C, Q)

            # loss
            loss = -(evals ** self.VAMPdegree).sum()

        else:

            # VAMP
            # Ref.: Noe arXiv:1812.07669v1, Algorithm 4

            # - assembling balanced propagator (Eqn. 34)
            C00invhalf = self._stable_symmetric_inverse(C00, ret_sqrt=True)
            C11invhalf = self._stable_symmetric_inverse(C11, ret_sqrt=True)

            P = torch.matmul(C00invhalf, torch.matmul(C01, C11invhalf))

            # - SVD
            Up, S, VpT = torch.linalg.svd(P)

            # - projecting singular values back to original (non-balanced) propagator
            #U = torch.matmul(C00invhalf, Up)
            #V = torch.matmul(C11invhalf, VpT.t())

            # loss
            loss = -(S ** self.VAMPdegree).sum()

        return loss

    def _create_dataset(self, data, ln_pathweight):
        """
        Build the lagged dataset and split it at random into training and validation loaders

        Parameters
        ----------
        data : torch.tensor, n x dim, n = observations, dim = dimensionality of trajectory featurization
            trajectory

        ln_pathweight : torch.tensor, n, n = observations
            log Girsanov path weights between frames in the trajectory, or None for no reweighting;
            passed through unchanged to DatasetSnrv together with self.lag
            Ref.: Kieninger and Keller J. Chem. Phys 154 094102 (2021)  https://doi.org/10.1063/5.0038408

        Return
        ------
        None; the loaders are stored on the instance

        self._train_loader : torch DataLoader
            shuffled training data loader over int((1 - val_frac) * n) samples

        self._val_loader : torch DataLoader
            shuffled validation data loader over the remaining samples
        """
        lagged = DatasetSnrv(data, self.lag, ln_pathweight)

        n_total = len(lagged)
        n_train = int((1.0 - self.val_frac) * n_total)
        partitions = random_split(lagged, [n_train, n_total - n_train])

        # both loaders use the same mini batch size and reshuffle on every pass
        loader_kwargs = dict(batch_size=self.batch_size, shuffle=True)
        self._train_loader = DataLoader(dataset=partitions[0], **loader_kwargs)
        self._val_loader = DataLoader(dataset=partitions[1], **loader_kwargs)

        return None

    def _make_train_step(self):
        """
        defining model training step

        Parameters
        ----------

        Return
        ------
        _train_step : function
            definition of a single training step of the model
        """

        def _train_step(x_t0, x_tt, pathweight):
            """
            model training step

            Parameters
            ----------
            x_t0: torch.tensor, n x dim, n = observations, dim = dimensionality of trajectory featurization
                trajectory

            x_tt: torch.tensor, n x dim, n = observations, dim = dimensionality of trajectory featurization
                time-lagged trajectory of same length as trajectory

            pathweight : float tensor, n = observations
                pathweights from Girsanov theorem between time lagged observations;
                identically unity (no reweighting rqd) for target potential == simulation potential

            Return
            ------
            loss.item() : float
                network loss over x_t0 and x_tt mini batch extracted as a float
            """
            self.train()
            z_t0, z_tt = self(x_t0, x_tt)
            loss = self._loss_fn(z_t0, z_tt, pathweight)
            loss.backward()
            self.optimizer.step()
            self.optimizer.zero_grad()
            return loss.item()

        return _train_step

[docs]    def fit(self, data, lag, ln_pathweight=None):
        """
        fit SNRV model to data

        Parameters
        ----------
        data : torch.tensor, n x dim, n = observations, dim = dimensionality of trajectory featurization
            trajectory

        lag : int
            lag in steps to apply to data trajectory

        ln_pathweight : torch.tensor, n, n = observations, default = None
            accumulated sum of the log Girsanov path weights between frames in the trajectory;
            Girsanov theorem measure of the probability of the observed sample path under a target potential
            relative to that which was actually observed under the simulation potential;
            identically unity (no reweighting rqd) for target potential == simulation potential and code as None;
            Ref.: Kieninger and Keller J. Chem. Phys 154 094102 (2021)  https://doi.org/10.1063/5.0038408

        Return
        ------
        self.lag : int
            lag in steps

        self.training_losses: list, n_epoch
            loss over training data in each epoch

        self.validation_losses: list, n_epoch
            loss over validation data in each epoch

        self.evals : torch.tensor, n_comp, n_comp = no. of basis functions in ANN == output_size
            eigenvalues of VAC generalized eigenvalue problem finding linear combination of learned basis functions to
            produce approximations of transfer operator eigenvectors in non-ascending order OR singular values of VAMP
            singular value problem finding linear combination of learned basis functions to produce approximations of
            transfer operator left and right singular vectors in non-ascending order

        self.expansion_coefficients : n_comp, n_comp = no. of basis functions in ANN == output_size
            expansion coefficients for linear combination of learned basis functions into transfer operator eigenvectors
            (reversible) or left singular vectors (non-reversible)

        self.expansion_coefficients_right : n_comp, n_comp = no. of basis functions in ANN == output_size
            expansion coefficients for linear combination of learned basis functions into transfer operator right
            singular vectors (non-reversible)

        self.is_fitted: bool
            indicator flag as to whether or nor model has been fitted
        """

        assert isinstance(lag, int) and lag >= 1

        self.lag = lag
        self._create_dataset(data, ln_pathweight)
        self.optimizer = optim.Adam(self.parameters(), lr=self.lr, weight_decay=self.weight_decay)
        self._train_step = self._make_train_step()

        training_losses = []
        validation_losses = []

        for epoch in range(self.n_epochs):

            with tqdm(self._train_loader, unit="batch") as tepoch:
                train_losses = []
                for x_t0_batch, x_tt_batch, pathweight_batch in tepoch:
                    tepoch.set_description("Epoch %d" % epoch)
                    self.train()
                    x_t0_batch = x_t0_batch.to(self.device)
                    x_tt_batch = x_tt_batch.to(self.device)
                    pathweight_batch = pathweight_batch.to(self.device)
                    loss = self._train_step(x_t0_batch, x_tt_batch, pathweight_batch)
                    train_losses.append(loss)
                training_loss = float(np.mean(train_losses))
                training_losses.append(training_loss)

                with torch.no_grad():
                    val_losses = []
                    for x_t0_batch, x_tt_batch, pathweight_batch in self._val_loader:
                        x_t0_batch = x_t0_batch.to(self.device)
                        x_tt_batch = x_tt_batch.to(self.device)
                        pathweight_batch = pathweight_batch.to(self.device)
                        self.eval()
                        z_t0_batch, z_tt_batch = self(x_t0_batch, x_tt_batch)
                        val_loss = self._loss_fn(z_t0_batch, z_tt_batch, pathweight_batch)
                        val_loss = val_loss.item()
                        val_losses.append(val_loss)
                    validation_loss = float(np.mean(val_losses))
                    validation_losses.append(validation_loss)

                print("[Epoch %d]\t training loss = %.3f\t validation loss = %.3f" % (
                    epoch, training_loss, validation_loss))

        self.training_losses = training_losses
        self.validation_losses = validation_losses

        self._compute_expansion_coefficients()

        self.is_fitted = True

        return None

    def _compute_expansion_coefficients(self):
        """
        calculate expansion coefficients by applying trained SNRV encoder ANN to all training data

        Parameters
        ----------

        Return
        ------
        self.evals : torch.tensor, n_comp, n_comp = no. of basis functions in ANN == output_size
            eigenvalues of VAC generalized eigenvalue problem finding linear combination of learned basis functions to
            produce approximations of transfer operator eigenvectors in non-ascending order OR singular values of VAMP
            singular value problem finding linear combination of learned basis functions to produce approximations of
            transfer operator left and right singular vectors in non-ascending order

        self.expansion_coefficients : n_comp, n_comp = no. of basis functions in ANN == output_size
            expansion coefficients for linear combination of learned basis functions into transfer operator eigenvectors
            (reversible) or left singular vectors (non-reversible)

        self.expansion_coefficients_right : n_comp, n_comp = no. of basis functions in ANN == output_size
            expansion coefficients for linear combination of learned basis functions into transfer operator right
            singular vectors (non-reversible)
        """

        C00 = torch.zeros(self.output_size, self.output_size).to(self.device)
        C01 = torch.zeros(self.output_size, self.output_size).to(self.device)
        C10 = torch.zeros(self.output_size, self.output_size).to(self.device)
        C11 = torch.zeros(self.output_size, self.output_size).to(self.device)

        for x_t0_batch, x_tt_batch, pathweight_batch in self._train_loader:
            x_t0_batch = x_t0_batch.to(self.device)
            x_tt_batch = x_tt_batch.to(self.device)
            pathweight_batch = pathweight_batch.to(self.device)
            self.eval()
            z_t0_batch, z_tt_batch = self(x_t0_batch, x_tt_batch)
            C00, C01, C10, C11 = self._accumulate_correlation_matrices(z_t0_batch, z_tt_batch, pathweight_batch, C00, C01, C10, C11)

        if self.is_reversible:

            # VAC
            # Ref.: Noe arXiv:1812.07669v1

            # assuming detailed balance (i.e., data augmentation with time reversed trajectories)
            Q = 0.5 * (C00 + C11)
            C = 0.5 * (C01 + C10)

            # applying regularization (nugget regularization of unpopulated bins with pseudocounts)
            # Q += torch.eye(Q.size()[0], dtype=torch.float, requires_grad=False)*torch.finfo(torch.float32).eps

            # solving generalized eigenvalue problem Cv = wQv using Cholesky trick to enable backpropagation
            # - column evecs are the expansion coefficients to assemble transfer operator eigenvector / singluar vector
            # approximations from learned SNRV basis functions
            evals, expansion_coefficients = self._gen_eig_chol(C, Q)

            self.evals = evals
            self.expansion_coefficients = expansion_coefficients

        else:

            # VAMP
            # Ref.: Noe arXiv:1812.07669v1, Algorithm 4

            # - assembling balanced propagator (Eqn. 34)
            C00invhalf = self._stable_symmetric_inverse(C00, ret_sqrt=True)
            C11invhalf = self._stable_symmetric_inverse(C11, ret_sqrt=True)

            P = torch.matmul(C00invhalf, torch.matmul(C01, C11invhalf))

            # - SVD
            Up, S, VpT = torch.linalg.svd(P)

            # - projecting singular values back to original (non-balanced) propagator
            U = torch.matmul(C00invhalf, Up)
            V = torch.matmul(C11invhalf, VpT.t())

            self.evals = S
            self.expansion_coefficients = U
            self.expansion_coefficients_right = V

        return None

[docs]    def transform(self, data):
        """
        project data into learned eigenvector basis

        Parameters
        ----------
        data : torch.tensor, n x dim, n = observations, dim = dimensionality of trajectory featurization
            trajectory

        Return
        ------
        psi : torch.tensor, n x n_comp, n_comp = no. of basis functions in ANN == output_size
            projection of data into learned eigenvector approximations of transfer operator
        """

        if self.is_fitted:
            data = data.to(self.device)
            z, _ = self(data, data)
            psi = torch.matmul(z, self.expansion_coefficients)
        else:
            raise RuntimeError('Model needs to be fit first.')

        return psi

[docs]    def fit_transform(self, data, lag, ln_pathweight=None):
        """
        fit SNRV over data then project data into learned eigenvector (VAC) / singular vectors (VAMP) of transfer operator

        Parameters
        ----------
        data : torch.tensor, n x dim, n = observations, dim = dimensionality of trajectory featurization
            trajectory

        lag : int
            lag in steps to apply to data trajectory

        ln_pathweight : torch.tensor, n, n = observations, default = None
            accumulated sum of the log Girsanov path weights between frames in the trajectory;
            Girsanov theorem measure of the probability of the observed sample path under a target potential
            relative to that which was actually observed under the simulation potential;
            identically unity (no reweighting rqd) for target potential == simulation potential and code as None;
            Ref.: Kieninger and Keller J. Chem. Phys 154 094102 (2021)  https://doi.org/10.1063/5.0038408

        Return
        ------
        self.lag : int
            lag in steps

        self.training_losses: list, n_epoch
            loss over training data in each epoch

        self.validation_losses: list, n_epoch
            loss over validation data in each epoch

        self.evals : torch.tensor, n_comp, n_comp = no. of basis functions in ANN == output_size
            eigenvalues of VAC generalized eigenvalue problem finding linear combination of learned basis functions to
            produce approximations of transfer operator eigenvectors in non-ascending order OR singular values of VAMP
            singular value problem finding linear combination of learned basis functions to produce approximations of
            transfer operator left and right singular vectors in non-ascending order

        self.expansion_coefficients : n_comp, n_comp = no. of basis functions in ANN == output_size
            expansion coefficients for linear combination of learned basis functions into transfer operator eigenvectors
            (reversible) or left singular vectors (non-reversible)

        self.expansion_coefficients_right : n_comp, n_comp = no. of basis functions in ANN == output_size
            expansion coefficients for linear combination of learned basis functions into transfer operator right
            singular vectors (non-reversible)

        self.is_fitted: bool
            indicator flag as to whether or nor model has been fitted

        psi : torch.tensor, n x n_comp, n_comp = no. of basis functions in ANN == output_size
            projection of data into learned eigenvector approximations of transfer operator
        """

        assert isinstance(lag, int) and lag >= 1

        self.lag = lag
        self.fit(data, self.lag, ln_pathweight=ln_pathweight)
        psi = self.transform(data)

        return psi

[docs]    def get_transform_Jacobian(self, data):
        """
        compute Jacobian of self.transform computational graph output (psi) wrt input (data)

        - data is n x dim_in tensor -- n instances of dim_in = self.input_size vectors at which to compute Jacobian
        - psi = self.transform(data) is n x dim_out -- n dim_out = n_comp = no. basis functions in ANN
          = self.output_size projections of data vectors
        - Jacobian[n,i,j] = d(psi_i)/d(data_j) @ data[n,:]

        Parameters
        ----------
        data : torch.tensor, n x dim_in, n = observations, dim_in = dimensionality of trajectory
            featurization = self.input_size

        Return
        ------
        Jacobian : torch.tensor, n x dim_out x dim_in, n = observations, dim_in = dimensionality of input,
            dim_out = dimensionality of output
        """

        if not self.is_fitted:

            raise RuntimeError('Model needs to be fit first.')

        else:

            # passing data through self.transform computational graph with gradients
            data.requires_grad = True
            psi = self.transform(data)

            # preparing Jacobian
            n = data.size()[0]
            dim_out = self.output_size
            dim_in = data.size()[1]

            Jacobian = torch.zeros(n, dim_out, dim_in)

            # sequential computation of Jacobian[:,ii,:] (i.e., row ii of each Jacobian corresponding to each n)
            for ii in range(dim_out):

                # - selecting the computational graph output for which to compute gradient wrt all inputs
                #   (i.e., row of 2D dim_out x dim_in Jacobian for each ii = 0...n)
                grad_mask = torch.zeros(dim_out).to(self.device)
                grad_mask[ii] = 1
                grad_mask_matrix = torch.tile(grad_mask, (n, 1)).to(self.device)

                # - zeroing gradients
                if hasattr(data.grad, 'data'):
                    _ = data.grad.data.zero_()

                # - backward pass
                psi.backward(grad_mask_matrix, retain_graph=True)

                # - computing gradients and storing in Jacobian
                Jacobian[:, ii, :] = torch.clone(data.grad.data)

        return Jacobian

[docs]    def save_model(self, modelFilePath):
        """
        saving model parameters required for building and running (i.e., self.transform)

        Parameters
        ----------
        modelFilePath : str
            path to .pt file

        Return
        ------
        """
        torch.save({'input_size': self.input_size,
                    'output_size': self.output_size,
                    'hidden_depth': self.hidden_depth,
                    'hidden_size': self.hidden_size,
                    'activation': self.activation,
                    'batch_norm': self.batch_norm,
                    'dropout_rate': self.dropout_rate,
                    'lr': self.lr,
                    'weight_decay': self.weight_decay,
                    'val_frac': self.val_frac,
                    'n_epochs': self.n_epochs,
                    'batch_size': self.batch_size,
                    'VAMPdegree': self.VAMPdegree,
                    'is_reversible' : self.is_reversible,
                    'evals': self.evals,
                    'expansion_coefficients': self.expansion_coefficients,
                    'network_weights': self.state_dict()
                    },
                   modelFilePath)

        return None

[docs]    def load_weights(self, network_weights):
        """
        loading SNRV network weights from file

        Parameters
        ----------
        network_weights : ordered dictionary
            dictionary of network_weights
            (N.B. model must possess same architecture as that used to save these weights!)

        Return
        ------
        """
        self.load_state_dict(network_weights)
        self.is_fitted = True
        self.eval()

        return None


def load_snrv(modelFilePath):
    """
    loading SNRV model from file

    The checkpoint is read with all tensors mapped onto the device the model will run on ('cuda' if available,
    else 'cpu'), so a checkpoint written on a GPU machine can be restored on a CPU-only machine and the restored
    evals / expansion coefficients end up on the same device as the network.

    Parameters
    ----------
    modelFilePath : str
        path to .pt file containing saved model parameters

    Return
    ------
    model : Snrv object
        SNRV model initialized from saved parameter set

    Raises
    ------
    KeyError
        if the checkpoint dictionary lacks one of the required entries
    """
    # resolving the target device first so that it can be used as map_location
    device = 'cuda' if torch.cuda.is_available() else 'cpu'

    # NOTE: torch.load unpickles the file contents -- only load checkpoints from trusted sources
    # NOTE(review): recent torch releases default to weights_only=True, which may reject non-tensor entries
    #               such as 'activation' -- confirm against the supported torch versions
    d = torch.load(modelFilePath, map_location=device)

    # constructor keyword arguments are stored in the checkpoint under their own names
    hyperparameter_keys = ('hidden_depth', 'hidden_size', 'activation', 'batch_norm', 'dropout_rate', 'lr',
                           'weight_decay', 'val_frac', 'n_epochs', 'batch_size', 'VAMPdegree', 'is_reversible')
    hyperparameters = {key: d[key] for key in hyperparameter_keys}

    model = Snrv(d['input_size'], d['output_size'], **hyperparameters)

    # restoring spectral quantities
    model.evals = d['evals']
    model.expansion_coefficients = d['expansion_coefficients']
    # optional entry: only restored when the checkpoint carries it, so older checkpoints still load
    if 'expansion_coefficients_right' in d:
        model.expansion_coefficients_right = d['expansion_coefficients_right']

    # restoring network parameters (also flags the model as fitted and switches it to eval mode)
    model.load_weights(d['network_weights'])

    model.to(device)

    return model