Source code for mlcolvar.cvs.committor.committor

import torch
import lightning
from mlcolvar.cvs import BaseCV
from mlcolvar.core import FeedForward, Normalization
from mlcolvar.core.loss import CommittorLoss
from mlcolvar.core.nn.utils import Custom_Sigmoid

__all__ = ["Committor"]



[docs]
class Committor(BaseCV, lightning.LightningModule):
    """Base class for data-driven learning of committor function.
    The committor function q is expressed as the output of a neural network optimized with a self-consistent
    approach based on the Kolmogorov's variational principle for the committor and on the imposition of its boundary conditions (see Refs. [1,2]).
    It is also possible to use an approximated variational approach without explicit dependence on the atomic coordinates (see Ref. [3]).
 

    **Data**: for training it requires a DictDataset with the keys 'data', 'labels' and 'weights'

    **Loss**: Minimize Kolmogorov's variational functional of q and impose boundary condition on the metastable states (CommittorLoss) from Refs. [1,2].
              It is also possible to use an approximated variational approach without explicit dependence on the atomic coordinates
    
    References
    ----------
    .. [1] P. Kang, E. Trizio, and M. Parrinello, "Computing the committor using the committor to study the transition state ensemble", Nat. Comput. Sci., 2024, DOI: 10.1038/s43588-024-00645-0
    .. [2] E. Trizio, P. Kang, and M. Parrinello, "Everything everywhere all at once: a probability-based enhanced sampling approach to rare events", Nat. Comput. Sci., 2025, DOI: 10.1038/s43588-025-00799-5
    .. [3] E. Trizio, G. Rossi, and M. Parrinello, "Ceci n'est pas un committor: Efficient sampling via approximated committor functions", J Chem. Phys., 2026, DOI: 10.1063/5.0331622

    See also
    --------
    mlcolvar.cvs.committor.utils.compute_committor_weights
        Utils to compute the appropriate weights for the training set
    mlcolvar.cvs.committor.utils.initialize_committor_masses
        Utils to initialize the masses tensor for the training
    mlcolvar.core.loss.CommittorLoss
        Kolmogorov's variational optimization of committor and imposition of boundary conditions
    mlcolvar.core.loss.utils.SmartDerivatives
        Class to optimize the gradients calculation imporving speed and memory efficiency.
    """

    BLOCKS = ["norm_in", "nn", "sigmoid"]


[docs]
    def __init__(
        self, 
        layers: list,
        alpha: float,
        atomic_masses: torch.Tensor = None,
        gamma: float = 10000,
        delta_f: float = 0,
        cell: float = None,
        separate_boundary_dataset: bool = True,
        descriptors_derivatives: torch.nn.Module = None,
        log_var: bool = False,
        use_gradients_wrt_positions: bool = True,
        z_regularization: float = 0.0,
        z_threshold: float = None,
        n_dim: int = None,
        norm_in: bool = False,
        options: dict = None,
        **kwargs,
    ):
        """Define a NN-based committor model

        Parameters
        ----------
        layers : list
            Number of neurons per layer
        alpha : float
            Hyperparamer that scales the boundary conditions contribution to loss, i.e. alpha*(loss_bound_A + loss_bound_B)
        atomic_masses : torch.Tensor
            List of masses of all the atoms we are using, for each atom we need to repeat three times for x,y,z, by default None.
            The mlcolvar.cvs.committor.utils.initialize_committor_masses can be used to simplify this.
            If the position-less loss is used, this must be set to None.
        gamma : float, optional
            Hyperparamer that scales the whole loss to avoid too small numbers, i.e. gamma*(loss_var + loss_bound), by default 10000
        delta_f : float, optional
            Delta free energy between A (label 0) and B (label 1), units is kBT, by default 0. 
            State B is supposed to be higher in energy.
        cell : float, optional
            CUBIC cell size length, used to scale the positions from reduce coordinates to real coordinates, by default None
        separate_boundary_dataset : bool, optional
            Switch to exculde boundary condition labeled data from the variational loss, by default True
        descriptors_derivatives : torch.nn.Module, optional
            `SmartDerivatives` object to save memory and time when using descriptors.
            See also mlcolvar.core.loss.committor_loss.SmartDerivatives
        log_var : bool, optional
            Switch to minimize the log of the variational functional, by default False.
        use_gradients_wrt_positions : bool, optional
            Whether to use gradients with respect to positions as prescribed in the original Kolmogorov variational functional, by default True.
            Set to false to use the approximated variational principle defined in Ref. [3] without explicit dependence on the atomic coordinates derivatives.
        z_regularization : float, optional
            Scales a regularization on the learned z space preventing it from exceeding the threshold given with 'z_threshold'.
            The magnitude of the regularization is scaled by the given number, by default 0.0
        z_threshold : float, optional
            Sets a maximum threshold for the z value during the training, by default None. 
            The magnitude of the regularization term is scaled via the `z_regularization` key.
        n_dim : int
            Number of dimensions, by default None. 
            If None, it defaults to 3 for the position-based loss and to 1 for the position-less loss.
        norm_in : bool
            Whether to normalize the input of the NN model, by default False.
        options : dict[str, Any], optional
            Options for the building blocks of the model, by default {}.
            Available blocks: ['nn'] .
        """
        super().__init__(in_features=layers[0], out_features=layers[-1], **kwargs) 
        
        if use_gradients_wrt_positions and atomic_masses is None:
            raise ValueError("atomic_masses must be provided when using Kolmogorov variational functional (use_gradients_wrt_positions is True)")
        elif not use_gradients_wrt_positions:
            if atomic_masses is not None:
                raise ValueError("atomic_masses must be None when using approximated variational principle (use_gradients_wrt_positions is False)")
            if descriptors_derivatives is not None:
                raise ValueError("descriptors_derivatives must be None when using approximated variational principle (use_gradients_wrt_positions is False)")
            
        # =======  LOSS  =======
        self.loss_fn = CommittorLoss(alpha=alpha,
                                     atomic_masses=atomic_masses,
                                     gamma=gamma,
                                     delta_f=delta_f,
                                     cell=cell,
                                     separate_boundary_dataset=separate_boundary_dataset,
                                     descriptors_derivatives=descriptors_derivatives,
                                     log_var=log_var,
                                     use_gradients_wrt_positions=use_gradients_wrt_positions,
                                     z_regularization=z_regularization,
                                     z_threshold=z_threshold,
                                     n_dim=n_dim
        )

        # ======= OPTIONS =======
        # parse and sanitize
        options = self.parse_options(options)

        # ======= BLOCKS =======
        # Initialize norm_in
        o = "norm_in"
        if norm_in and (options[o] is not False) and (options[o] is not None):
            self.norm_in = Normalization(self.in_features, **options[o])

        # initialize NN turning
        o = "nn"
        # set default activation to tanh
        if "activation" not in options[o]: 
            options[o]["activation"] = "tanh"
        self.nn = FeedForward(layers, **options[o])

        # separately add sigmoid activation on last layer, this way it can be deactived
        o = "sigmoid"
        if (options[o] is not False) and (options[o] is not None):
            self.sigmoid = Custom_Sigmoid(**options[o])


    def forward_nn(self, x):
        if self.preprocessing is not None:
            x = self.preprocessing(x)
        if self.norm_in is not None:
            x = self.norm_in(x)
        z = self.nn(x)
        return z


[docs]
    def training_step(self, train_batch, batch_idx):
        torch.set_grad_enabled(True)

        """Compute and return the training loss and record metrics."""
        # =================get data===================
        x = train_batch["data"]
        # check data are have shape (n_data, -1)
        x = x.reshape((x.shape[0], -1))
        x.requires_grad = True

        labels = train_batch["labels"]
        weights = train_batch["weights"]
        try:
            ref_idx = train_batch["ref_idx"]
        except KeyError:
            ref_idx = None

        # =================forward====================
        z = self.forward_nn(x)
        
        if self.sigmoid is not None:
            q = self.sigmoid(z)
        else:
            q = z        
        
        # ===================loss=====================
        if self.training:
            loss, loss_var, loss_bound_A, loss_bound_B = self.loss_fn(
                x, z, q, labels, weights, ref_idx 
            )
        else:
            loss, loss_var, loss_bound_A, loss_bound_B = self.loss_fn(
                x, z, q, labels, weights, ref_idx 
            )

        # ====================log=====================+
        name = "train" if self.training else "valid"
        self.log(f"{name}_loss", loss, on_epoch=True)
        self.log(f"{name}_loss_var", loss_var, on_epoch=True)
        self.log(f"{name}_loss_bound_A", loss_bound_A, on_epoch=True)
        self.log(f"{name}_loss_bound_B", loss_bound_B, on_epoch=True)
        return loss




def test_committor():
    from mlcolvar.data import DictDataset, DictModule
    from mlcolvar.cvs.committor.utils import initialize_committor_masses, KolmogorovBias
    import platform

    a_tol = 1e-3
    # The hard-coded reference values below are only bit-reproducible on the platform
    # where they were generated (Linux). Elsewhere, floating-point/BLAS differences make
    # the exact comparison unreliable, so off-Linux we only assert portable invariants.
    run_strict = platform.system() == "Linux"

    def check_committor(out, ref):
        out = out.detach()
        assert out.shape == ref.shape
        assert torch.all(torch.isfinite(out))
        assert out.min() >= 0.0 and out.max() <= 1.0
        if run_strict:
            assert torch.allclose(out, ref, atol=a_tol)

    def check_bias(bias, ref):
        bias = bias.detach()
        assert bias.shape == ref.shape
        assert torch.all(torch.isfinite(bias))
        if run_strict:
            assert torch.allclose(bias, ref, atol=a_tol)

    torch.manual_seed(42)
    # create two fake atoms and use their fake positions
    atomic_masses = initialize_committor_masses(atom_types=[0,1], masses=[15.999, 1.008])
    # create dataset
    samples = 20
    X = torch.randn((4*samples, 6))
    
    # create labels
    y = torch.zeros(X.shape[0])
    y[samples:] += 1
    y[int(2*samples):] += 1
    y[int(3*samples):] += 1
    
    # create weights
    w = torch.ones(X.shape[0])

    dataset = DictDataset({"data": X, "labels": y, "weights": w})
    datamodule = DictModule(dataset, lengths=[1])
    
    # train model
    trainer = lightning.Trainer(max_epochs=1, logger=None, enable_checkpointing=False, limit_val_batches=0, num_sanity_val_steps=0)
    
    # dataset separation
    ref_out = torch.Tensor([[0.6622],[0.6293],[0.5999],[0.5826],[0.6632],[0.5593],[0.5666],[0.6292],[0.5644],[0.5496],
                            [0.6479],[0.6079],[0.6472],[0.6002],[0.6529],[0.5767],[0.6111],[0.6117],[0.6470],[0.6242],
                            [0.6264],[0.6613],[0.6674],[0.6307],[0.6723],[0.5907],[0.5877],[0.6278],[0.6460],[0.6643],
                            [0.5951],[0.5923],[0.5973],[0.6676],[0.6658],[0.6544],[0.6504],[0.6687],[0.6555],[0.5625],
                            [0.6226],[0.6441],[0.6282],[0.5216],[0.6065],[0.6091],[0.5569],[0.6576],[0.5826],[0.6230],
                            [0.6549],[0.6457],[0.5342],[0.6241],[0.6092],[0.5921],[0.6445],[0.6234],[0.5788],[0.5034],
                            [0.6621],[0.6104],[0.6558],[0.6376],[0.6357],[0.5299],[0.6386],[0.6122],[0.6173],[0.6107],
                            [0.5907],[0.6058],[0.6549],[0.6571],[0.6355],[0.5669],[0.6368],[0.6450],[0.6024],[0.6780]])
    ref_bias = torch.Tensor([-6.1754, -6.8354, -7.7970, -7.9340, -5.7851, -7.5762, -7.9460, -6.9859,
                             -7.9346, -7.8172, -7.2156, -7.7203, -6.7477, -7.8528, -6.6614, -7.6932,
                             -7.7617, -7.5786, -6.7062, -7.5386, -7.5333, -4.9228, -6.4712, -7.4311,
                             -6.0271, -7.9461, -7.9332, -7.2807, -7.1991, -5.8248, -7.9603, -7.7892,
                             -7.7611, -4.7404, -5.3761, -5.8665, -6.4764, -4.6565, -5.8538, -7.8057,
                             -7.4344, -7.3929, -7.3325, -7.5757, -7.8021, -7.7619, -7.9274, -6.2869,
                             -7.9318, -7.7833, -6.4206, -5.6966, -7.9976, -7.1985, -7.7411, -7.8606,
                             -6.7020, -7.6421, -7.9529, -7.0869, -5.1529, -7.8873, -5.8033, -7.0834,
                             -7.0064, -7.2989, -6.5627, -7.6897, -7.3463, -7.7043, -7.9186, -7.7664,
                             -6.6557, -6.3900, -7.2810, -7.7624, -6.6961, -7.2745, -7.8269, -5.6305])
    model = Committor(layers=[6, 4, 2, 1], atomic_masses=atomic_masses, alpha=1e-1)
    trainer.fit(model, datamodule)
    out = model(X)
    out.sum().backward()
    check_committor(out, ref_out)
    bias_model = KolmogorovBias(input_model=model, beta=1, epsilon=1e-6, lambd=1)
    bias = bias_model(X)
    check_bias(bias, ref_bias)


    # naive whole dataset
    ref_out = torch.Tensor([[0.1042],[0.1850],[0.1561],[0.1569],[0.1589],[0.1569],[0.1160],[0.1973],[0.1311],[0.1735],
                            [0.1779],[0.1191],[0.1545],[0.1499],[0.1142],[0.1639],[0.1164],[0.1506],[0.1657],[0.1224],
                            [0.1370],[0.1357],[0.1383],[0.1727],[0.1344],[0.1307],[0.1904],[0.1314],[0.1243],[0.1702],
                            [0.1730],[0.0946],[0.1046],[0.1758],[0.1449],[0.1599],[0.1858],[0.1788],[0.1663],[0.1271],
                            [0.1744],[0.0951],[0.1339],[0.1726],[0.1104],[0.1972],[0.0754],[0.1549],[0.1461],[0.0818],
                            [0.1239],[0.1787],[0.1137],[0.1168],[0.1311],[0.1317],[0.1229],[0.1380],[0.1496],[0.1000],
                            [0.1805],[0.1178],[0.1714],[0.1742],[0.1477],[0.1189],[0.1830],[0.1078],[0.1209],[0.1026],
                            [0.1246],[0.0979],[0.1717],[0.1264],[0.1243],[0.1344],[0.1695],[0.1127],[0.1788],[0.0962]])
    trainer = lightning.Trainer(max_epochs=1, logger=None, enable_checkpointing=False, limit_val_batches=0, num_sanity_val_steps=0)
    model = Committor(layers=[6, 4, 2, 1], atomic_masses=atomic_masses, alpha=1e-1, separate_boundary_dataset=False)
    trainer.fit(model, datamodule)
    out = model(X)
    out.sum().backward()
    check_committor(out, ref_out)

    # test log loss
    ref_out = torch.Tensor([[0.9117],[0.7253],[0.7833],[0.7956],[0.7775],[0.8984],[0.9036],[0.7169],[0.8289],[0.8312],
                            [0.7610],[0.8825],[0.8054],[0.8474],[0.8474],[0.8628],[0.8355],[0.7986],[0.8701],[0.8562],
                            [0.8028],[0.8016],[0.8166],[0.7903],[0.7776],[0.8184],[0.7826],[0.8686],[0.8690],[0.8382],
                            [0.8328],[0.8493],[0.8855],[0.7325],[0.8250],[0.7755],[0.7372],[0.7362],[0.7284],[0.8276],
                            [0.8145],[0.8857],[0.8578],[0.8065],[0.8272],[0.7883],[0.8474],[0.7800],[0.8621],[0.8377],
                            [0.8067],[0.7760],[0.8898],[0.8582],[0.8529],[0.8275],[0.8441],[0.7749],[0.8684],[0.8889],
                            [0.8348],[0.8418],[0.7769],[0.7816],[0.8040],[0.9240],[0.7593],[0.8493],[0.7864],[0.9133],
                            [0.9077],[0.8956],[0.7555],[0.8968],[0.9050],[0.8908],[0.8005],[0.8778],[0.9044],[0.7629]])
    trainer = lightning.Trainer(max_epochs=1, logger=None, enable_checkpointing=False, limit_val_batches=0, num_sanity_val_steps=0)
    model = Committor(layers=[6, 4, 2, 1], atomic_masses=atomic_masses, alpha=1e-1, log_var=True)
    trainer.fit(model, datamodule)
    out = model(X)
    out.sum().backward()
    check_committor(out, ref_out)

    # test z regularization
    ref_out = torch.Tensor([[0.2299],[0.2478],[0.2812],[0.2426],[0.2030],[0.2233],[0.2309],[0.2242],[0.2567],[0.2616],
                            [0.2181],[0.1941],[0.2479],[0.2745],[0.2502],[0.2671],[0.2802],[0.2385],[0.1984],[0.2410],
                            [0.2558],[0.2110],[0.2350],[0.2336],[0.2472],[0.2400],[0.2507],[0.2686],[0.2290],[0.1947],
                            [0.2798],[0.2818],[0.2224],[0.2125],[0.2161],[0.2645],[0.2201],[0.2193],[0.2405],[0.2917],
                            [0.2322],[0.2502],[0.2135],[0.2793],[0.2976],[0.2272],[0.2752],[0.2183],[0.2463],[0.2820],
                            [0.2597],[0.2147],[0.2822],[0.2759],[0.2340],[0.2778],[0.2489],[0.2422],[0.2278],[0.2498],
                            [0.1890],[0.2424],[0.2307],[0.2370],[0.2628],[0.2556],[0.2359],[0.2791],[0.2622],[0.2382],
                            [0.2744],[0.2395],[0.2316],[0.2339],[0.2130],[0.2487],[0.2345],[0.2574],[0.2035],[0.2916]])
    trainer = lightning.Trainer(max_epochs=1, logger=None, enable_checkpointing=False, limit_val_batches=0, num_sanity_val_steps=0)
    model = Committor(layers=[6, 4, 2, 1], atomic_masses=atomic_masses, alpha=1e-1, z_regularization=100, z_threshold=0.000001)
    trainer.fit(model, datamodule)
    out = model(X)
    out.sum().backward()
    check_committor(out, ref_out)

    # test position-less loss
    ref_out = torch.Tensor([[0.3011],[0.3833],[0.4288],[0.3129],[0.2730],[0.2704],[0.2797],[0.3380],[0.3471],[0.3543],
                            [0.3086],[0.2408],[0.3612],[0.4553],[0.3475],[0.3847],[0.4621],[0.2910],[0.2776],[0.3386],
                            [0.3495],[0.3102],[0.3414],[0.3452],[0.3786],[0.3114],[0.4048],[0.3856],[0.3366],[0.2743],
                            [0.4377],[0.4595],[0.2732],[0.2986],[0.3258],[0.4365],[0.3098],[0.2919],[0.3688],[0.4664],
                            [0.3377],[0.3550],[0.2808],[0.4121],[0.4675],[0.3492],[0.3674],[0.2958],[0.2993],[0.4182],
                            [0.3816],[0.2860],[0.3527],[0.3749],[0.2975],[0.4376],[0.3331],[0.3241],[0.2746],[0.2975],
                            [0.2485],[0.3314],[0.3198],[0.3667],[0.3681],[0.3358],[0.2999],[0.4109],[0.3302],[0.3188],
                            [0.3858],[0.3065],[0.3372],[0.3317],[0.2931],[0.3442],[0.2822],[0.3965],[0.2688],[0.4545]])
    trainer = lightning.Trainer(max_epochs=1, logger=None, enable_checkpointing=False, limit_val_batches=0, num_sanity_val_steps=0)
    model = Committor(layers=[6, 4, 2, 1], atomic_masses=None, alpha=1e-1, use_gradients_wrt_positions=False)
    trainer.fit(model, datamodule)
    out = model(X)
    print(out)
    out.sum().backward()
    check_committor(out, ref_out)

    # test z_regularization errors
    trainer = lightning.Trainer(max_epochs=1, logger=None, enable_checkpointing=False, limit_val_batches=0, num_sanity_val_steps=0)
    for z_regularization, z_threshold in zip([10,   0,      -1,     10], 
                                             [None, 10,      1,     -1]):
        try:
            model = Committor(layers=[6, 4, 2, 1], atomic_masses=atomic_masses, alpha=1e-1, z_regularization=z_regularization, z_threshold=z_threshold, n_dim=2)
            trainer.fit(model, datamodule)
        except ValueError as e:
            print("[TEST LOG] Checked this error: ", e)

    # test dimension error
    try:
        trainer = lightning.Trainer(max_epochs=1, logger=None, enable_checkpointing=False, limit_val_batches=0, num_sanity_val_steps=0)
        model = Committor(layers=[6, 4, 2, 1], atomic_masses=atomic_masses, alpha=1e-1, z_regularization=10, z_threshold=1, n_dim=2)
        trainer.fit(model, datamodule)
    except RuntimeError as e:
        print("[TEST LOG] Checked this error: ", e)




def test_committor_with_derivatives():
    from mlcolvar.cvs.committor.utils import initialize_committor_masses
    from mlcolvar.data import DictModule, DictDataset
    from mlcolvar.core.loss.utils.smart_derivatives import SmartDerivatives, compute_descriptors_derivatives
    from mlcolvar.core.transform import PairwiseDistances
    
    torch.manual_seed(42)
    n_atoms = 10
    kT = 2.49432
    
    # input positions for alanine example 
    ref_pos = torch.Tensor([[ 1.2980, 0.5370, 1.3370, 1.3270, 0.5710, 1.1960, 1.4110, 0.5070, 1.1310, 1.2520, 0.6710, 1.1440,
                              1.2490, 0.6890, 0.9990, 1.1270, 0.6130, 0.9550, 1.2340, 0.8420, 0.9810, 1.1860, 0.9140, 1.0700,
                              1.2790, 0.8870, 0.8630, 1.2550, 1.0230, 0.8240 ],
                            [ 2.7530, 0.7150, 0.5170, 2.8460, 0.6150, 0.5780, 2.9520, 0.6560, 0.6220, 2.8150, 0.4870, 0.5730,
                              2.9100, 0.3830, 0.6150, 2.9310, 0.3890, 0.7690, 2.8520, 0.2450, 0.5830, 2.7300, 0.2380, 0.5550,
                              2.9420, 0.1390, 0.5840, 2.9030, -0.0030, 0.5690 ],
                            [ 0.4830, 2.5610, 2.9980, 0.5620, 2.5410, 2.8660, 0.5080, 2.4950, 2.7660, 0.6960, 2.5590, 2.8790,
                              0.8060, 2.5410, 2.7750, 0.7890, 2.6570, 2.6680, 0.9450, 2.5390, 2.8400, 0.9620, 2.5380, 2.9610,
                              1.0510, 2.5430, 2.7590, 1.1860, 2.5410, 2.7990 ],
                            [ 1.0680, 0.1770, 0.1670, 0.9560, 0.2290, 0.0920, 0.9320, 0.1730, -0.0070, 0.8770, 0.3280, 0.1460,
                              0.7710, 0.4040, 0.0760, 0.7230, 0.5180, 0.1660, 0.8270, 0.4640, -0.0530, 0.9010, 0.5650, -0.0450,
                              0.7790, 0.4160, -0.1670, 0.8260, 0.4500, -0.2950 ],
                            [ 2.4600, 0.5670, 2.4940, 2.6050, 0.5640, 2.5060, 2.6660, 0.4630, 2.5020, 2.6640, 0.6830, 2.5220,
                              2.8040, 0.7250, 2.5200, 2.8880, 0.6370, 2.6190, 2.8690, 0.7270, 2.3820, 2.9600, 0.8080, 2.3570,
                              2.8260, 0.6310, 2.3010, 2.8630, 0.6170, 2.1580 ]]
                          )

    # weights for inputs                     
    ref_weights = torch.Tensor([1.4809, 0.0736, 0.3693, 0.1849, 0.0885])
    
    # initialize dataset with positions
    dataset = DictDataset({"data": ref_pos, "weights": ref_weights, "labels": torch.arange((len(ref_pos)))})

    # initialize descriptors calculations: all pairwise distances
    ComputeDistances = PairwiseDistances(n_atoms=10, 
                                         PBC=False, 
                                         cell=[1, 1, 1], 
                                         scaled_coords=False)

    # create friction tensor
    masses = initialize_committor_masses(atom_types=[0,0,1,2,0,0,0,1,2,0], 
                                         masses=[ 12.011, 12.011, 15.999, 14.0067, 12.011, 12.011, 12.011, 15.999, 14.0067, 12.011])


    # --------------------------------- TRAIN MODELS ---------------------------------
    # Train the models: positions as input, desc as input with smartderivatives and passing derivatives
    for separate_boundary_dataset in [False, True]:
    
        # 1 ------------ Positions as input ------------
        # initialize datamodule
        torch.manual_seed(42)
        datamodule = DictModule(dataset, lengths=[1.0])
    
        # seed for reproducibility
        model = Committor(layers=[45, 20, 1],
                        atomic_masses=masses,
                        alpha=1, 
                        separate_boundary_dataset=separate_boundary_dataset)

        # here we use the preprocessing
        model.preprocessing = ComputeDistances

        trainer = lightning.Trainer(
            accelerator='cpu',
            callbacks=None,
            max_epochs=6,
            enable_progress_bar=False,
            enable_checkpointing=False,
            logger=False,
            limit_val_batches=0,
            num_sanity_val_steps=0,
        )

        # fit
        trainer.fit(model, datamodule)

        # save outputs as a reference
        X = dataset["data"]
        
        # this is to check other strategies
        ref_output = model(X)
        if separate_boundary_dataset:
            ref_output_check = torch.Tensor([[0.4759],
                                            [0.4765],
                                            [0.4828],
                                            [0.4786],
                                            [0.4725]])
        else:
            ref_output_check = torch.Tensor([[0.4756],
                                            [0.4762],
                                            [0.4825],
                                            [0.4783],
                                            [0.4723]])
            
        assert( (torch.allclose(ref_output, ref_output_check, atol=1e-3)))

        if not separate_boundary_dataset:
            # 2 ------------ Descriptors as input + explicit pass derivatives ------------
            # get descriptor and their derivatives
            pos, desc, d_desc_d_pos = compute_descriptors_derivatives(dataset=dataset,
                                                                    descriptor_function=ComputeDistances,
                                                                    n_atoms=n_atoms,
                                                                    separate_boundary_dataset=separate_boundary_dataset)

            dataset_desc = DictDataset({"data": desc, "weights": ref_weights, "labels": torch.arange((len(ref_pos)))}, create_ref_idx=True)

            # seed for reproducibility
            torch.manual_seed(42)
            datamodule = DictModule(dataset_desc, lengths=[1.0])
            
            model = Committor(layers=[45, 20, 1],
                            atomic_masses=masses,
                            alpha=1, 
                            separate_boundary_dataset=separate_boundary_dataset,
                            descriptors_derivatives=d_desc_d_pos)
            
            trainer = lightning.Trainer(
                accelerator='cpu',
                callbacks=None,
                max_epochs=6,
                enable_progress_bar=False,
                enable_checkpointing=False,
                logger=False,
                limit_val_batches=0,
                num_sanity_val_steps=0,
            )

            # fit
            trainer.fit(model, datamodule)

            # save outputs as a reference
            X = dataset_desc["data"]
            
            # this is to check other strategies
            ref_output = model(X)
            assert( (torch.allclose(ref_output, ref_output_check, atol=1e-3)))

            # test errors
            try:
                # separate boundary with explicit derivatives
                model = Committor(layers=[45, 20, 1],
                            atomic_masses=masses,
                            alpha=1, 
                            separate_boundary_dataset=True,
                            descriptors_derivatives=d_desc_d_pos)
                trainer = lightning.Trainer(
                    accelerator='cpu',
                    callbacks=None,
                    max_epochs=6,
                    enable_progress_bar=False,
                    enable_checkpointing=False,
                    logger=False,
                    limit_val_batches=0,
                    num_sanity_val_steps=0,
                )
                trainer.fit(model, datamodule)
            except ValueError as e:
                print("[TEST LOG] Checked this error: ", e)


        # 3 ------------ Descriptors as input + SmartDerivatives ------------
        # initialize smart derivatives, we do it explicitly to test different functionalities
        smart_derivatives = SmartDerivatives()
        smart_dataset = smart_derivatives.setup(dataset=dataset,
                                                descriptor_function=ComputeDistances,
                                                n_atoms=n_atoms,
                                                separate_boundary_dataset=separate_boundary_dataset)
        
        # seed for reproducibility
        torch.manual_seed(42)
        datamodule = DictModule(smart_dataset, lengths=[1.0])

        model = Committor(layers=[45, 20, 1],
                        atomic_masses=masses,
                        alpha=1, 
                        separate_boundary_dataset=separate_boundary_dataset,
                        descriptors_derivatives=smart_derivatives)
        
        trainer = lightning.Trainer(
            accelerator='cpu',
            callbacks=None,
            max_epochs=6,
            enable_progress_bar=False,
            enable_checkpointing=False,
            logger=False,
            limit_val_batches=0,
            num_sanity_val_steps=0,
        )

        # fit
        trainer.fit(model, datamodule)

        # save outputs as a reference
        X = smart_dataset["data"]
        
        # this is to check other strategies
        ref_output = model(X)
        assert( (torch.allclose(ref_output, ref_output_check, atol=1e-3)))

        # test errors
        try:
            # no ref_idx!
            wrong_dataset = DictDataset(data=smart_dataset['data'], labels=smart_dataset['labels'], weights=smart_dataset['weights'])
            wrong_datamodule = DictModule(wrong_dataset, lengths=[1.0])
            trainer = lightning.Trainer(
                accelerator='cpu',
                callbacks=None,
                max_epochs=6,
                enable_progress_bar=False,
                enable_checkpointing=False,
                logger=False,
                limit_val_batches=0,
                num_sanity_val_steps=0,
            )
            trainer.fit(model, wrong_datamodule)
        except ValueError as e:
            print("[TEST LOG] Checked this error: ", e)