From 80645245d3f3c90b06817bd480777c9390c50b46 Mon Sep 17 00:00:00 2001
From: "Gonzales, Carmelo"
Date: Wed, 17 Apr 2024 15:52:45 -0700
Subject: [PATCH 1/2] update test_sam to include SAM callback for multitask
 test; update callback to process losses from multitask pipelines

The SAM callback recomputes losses in on_before_optimizer_step before
applying the weight perturbation. Multitask pipelines return a nested
loss dictionary (dataset -> task -> {"loss": ...}) and configure one
optimizer per task plus a shared ("Global", "Encoder") optimizer, so the
callback now extracts the loss entries that belong to the optimizer
being stepped: task optimizers index into their (dataset, task) entry
via trainer.model.optimizer_names, and the global encoder optimizer
takes the sum of all task losses. The multitask test now runs with the
SAM callback attached.
---
 matsciml/lightning/callbacks.py      |  17 +
 matsciml/lightning/tests/test_sam.py | 522 +++++++++++++--------------
 2 files changed, 273 insertions(+), 266 deletions(-)

diff --git a/matsciml/lightning/callbacks.py b/matsciml/lightning/callbacks.py
index 65dcbc49..e9b3c0d4 100644
--- a/matsciml/lightning/callbacks.py
+++ b/matsciml/lightning/callbacks.py
@@ -8,6 +8,7 @@
 from logging import DEBUG, getLogger
 from pathlib import Path
 from time import time
+from copy import copy
 from typing import Any, Callable, Dict, Iterator, Optional
 
 import numpy as np
@@ -753,6 +754,21 @@ def on_train_batch_start(
         self.batch = batch
         self.batch_idx = batch_idx
 
+    def extract_optimizer_specific_loss(self, trainer, optimizer, loss):
+        optimizer_names = copy(trainer.model.optimizer_names)
+        opt_idx = [opt == optimizer for opt in trainer.optimizers].index(True)
+        loss_keys = optimizer_names[opt_idx]
+        if loss_keys == ("Global", "Encoder"):
+            optimizer_names.pop(opt_idx)
+            global_loss = 0
+            for dataset, task in optimizer_names:
+                global_loss += loss[dataset][task]["loss"]
+            return {"loss": global_loss}
+        else:
+            for key in loss_keys:
+                loss = loss[key]
+            return loss
+
     def on_before_optimizer_step(
         self,
         trainer: Trainer,
@@ -763,6 +779,7 @@
         org_weights = self._first_step(optimizer)
         with torch.enable_grad():
             loss = task._compute_losses(self.batch)
+            loss = self.extract_optimizer_specific_loss(trainer, optimizer, loss)
             loss = self._get_loss(loss)
             if torch.isfinite(loss):
                 trainer.strategy.backward(loss, optimizer=optimizer)
diff --git a/matsciml/lightning/tests/test_sam.py b/matsciml/lightning/tests/test_sam.py
index 8b3012ca..c24b6087 100644
--- a/matsciml/lightning/tests/test_sam.py
+++ b/matsciml/lightning/tests/test_sam.py
@@ -5,303 +5,293 @@
 from matsciml.datasets.transforms import (
     PeriodicPropertiesTransform,
     PointCloudToGraphTransform,
-    FrameAveraging,
-    UnitCellCalculator,
 )
-from matsciml.lightning import MatSciMLDataModule, MultiDataModule
+from matsciml.lightning import MultiDataModule
 from matsciml.datasets import MultiDataset, IS2REDataset, S2EFDataset
-from matsciml.models.pyg import EGNN
 from matsciml.lightning.callbacks import SAM
-from matsciml.models.pyg import FAENet
-from torch import nn
-from e3nn.o3 import Irreps
-from mace.modules.blocks import RealAgnosticInteractionBlock
-from matsciml.models.pyg.mace import MACEWrapper
 from matsciml.models.dgl import PLEGNNBackbone
 from matsciml.models.base import (
     MultiTaskLitModule,
     ForceRegressionTask,
-    GradFreeForceRegressionTask,
     ScalarRegressionTask,
-    BinaryClassificationTask,
 )


# def test_egnn_end_to_end_with_SAM():
#     """
#     Test the end to end pipeline using a devset with EGNN and SAM callback.

#     The idea is that this basically mimics an example script to
#     try and maximize coverage across dataset to training, which
#     is particularly useful for checking new dependencies, etc.
- """ - dm = MatSciMLDataModule.from_devset( - "MaterialsProjectDataset", - dset_kwargs={ - "transforms": [ - PeriodicPropertiesTransform(6.0, adaptive_cutoff=True), - PointCloudToGraphTransform("pyg"), - ] - }, - batch_size=8, - ) +# The idea is that this basically mimics an example script to +# try and maximize coverage across dataset to training, which +# is particularly useful for checking new dependencies, etc. +# """ +# dm = MatSciMLDataModule.from_devset( +# "MaterialsProjectDataset", +# dset_kwargs={ +# "transforms": [ +# PeriodicPropertiesTransform(6.0, adaptive_cutoff=True), +# PointCloudToGraphTransform("pyg"), +# ] +# }, +# batch_size=8, +# ) - # this specifies a whole lot to make sure we have coverage - task = ScalarRegressionTask( - encoder_class=EGNN, - encoder_kwargs={ - "hidden_dim": 48, - "output_dim": 32, - "num_conv": 2, - "num_atom_embedding": 200, - }, - scheduler_kwargs={ - "CosineAnnealingLR": { - "T_max": 5, - "eta_min": 1e-7, - } - }, - lr=1e-3, - weight_decay=0.0, - output_kwargs={ - "lazy": False, - "hidden_dim": 48, - "input_dim": 48, - "dropout": 0.2, - "num_hidden": 2, - }, - task_keys=["band_gap"], - ) +# # this specifies a whole lot to make sure we have coverage +# task = ScalarRegressionTask( +# encoder_class=EGNN, +# encoder_kwargs={ +# "hidden_dim": 48, +# "output_dim": 32, +# "num_conv": 2, +# "num_atom_embedding": 200, +# }, +# scheduler_kwargs={ +# "CosineAnnealingLR": { +# "T_max": 5, +# "eta_min": 1e-7, +# } +# }, +# lr=1e-3, +# weight_decay=0.0, +# output_kwargs={ +# "lazy": False, +# "hidden_dim": 48, +# "input_dim": 48, +# "dropout": 0.2, +# "num_hidden": 2, +# }, +# task_keys=["band_gap"], +# ) - trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) - trainer.fit(task, datamodule=dm) +# trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) +# trainer.fit(task, datamodule=dm) -def test_mace_with_SAM(): - """ - Test the MACE Wrapper with SAM callback. - """ - # Construct MACE relaxed energy regression with PyG implementation of E(n)-GNN - task = ScalarRegressionTask( - encoder_class=MACEWrapper, - encoder_kwargs={ - "r_max": 6.0, - "num_bessel": 3, - "num_polynomial_cutoff": 3, - "max_ell": 2, - "interaction_cls": RealAgnosticInteractionBlock, - "interaction_cls_first": RealAgnosticInteractionBlock, - "num_interactions": 2, - "atom_embedding_dim": 64, - "MLP_irreps": Irreps("256x0e"), - "avg_num_neighbors": 10.0, - "correlation": 1, - "radial_type": "bessel", - "gate": nn.Identity(), - }, - task_keys=["energy_relaxed"], - ) +# def test_mace_with_SAM(): +# """ +# Test the MACE Wrapper with SAM callback. 
+# """ +# # Construct MACE relaxed energy regression with PyG implementation of E(n)-GNN +# task = ScalarRegressionTask( +# encoder_class=MACEWrapper, +# encoder_kwargs={ +# "r_max": 6.0, +# "num_bessel": 3, +# "num_polynomial_cutoff": 3, +# "max_ell": 2, +# "interaction_cls": RealAgnosticInteractionBlock, +# "interaction_cls_first": RealAgnosticInteractionBlock, +# "num_interactions": 2, +# "atom_embedding_dim": 64, +# "MLP_irreps": Irreps("256x0e"), +# "avg_num_neighbors": 10.0, +# "correlation": 1, +# "radial_type": "bessel", +# "gate": nn.Identity(), +# }, +# task_keys=["energy_relaxed"], +# ) - # Prepare data module - dm = MatSciMLDataModule.from_devset( - "IS2REDataset", - dset_kwargs={ - "transforms": [ - PeriodicPropertiesTransform(6.0, adaptive_cutoff=True), - PointCloudToGraphTransform( - "pyg", - node_keys=["pos", "atomic_numbers"], - ), - ], - }, - ) +# # Prepare data module +# dm = MatSciMLDataModule.from_devset( +# "IS2REDataset", +# dset_kwargs={ +# "transforms": [ +# PeriodicPropertiesTransform(6.0, adaptive_cutoff=True), +# PointCloudToGraphTransform( +# "pyg", +# node_keys=["pos", "atomic_numbers"], +# ), +# ], +# }, +# ) - # Run a quick training loop - trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) - trainer.fit(task, datamodule=dm) +# # Run a quick training loop +# trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) +# trainer.fit(task, datamodule=dm) -def test_faenet_with_SAM(): - """ - Test FAENet with SAM Callback. - """ - task = ScalarRegressionTask( - encoder_class=FAENet, - encoder_kwargs={ - "pred_as_dict": False, - "hidden_dim": 128, - "out_dim": 64, - "tag_hidden_channels": 0, - "input_dim": 128, - }, - output_kwargs={"lazy": False, "input_dim": 64, "hidden_dim": 64}, - task_keys=["band_gap"], - ) +# def test_faenet_with_SAM(): +# """ +# Test FAENet with SAM Callback. +# """ +# task = ScalarRegressionTask( +# encoder_class=FAENet, +# encoder_kwargs={ +# "pred_as_dict": False, +# "hidden_dim": 128, +# "out_dim": 64, +# "tag_hidden_channels": 0, +# "input_dim": 128, +# }, +# output_kwargs={"lazy": False, "input_dim": 64, "hidden_dim": 64}, +# task_keys=["band_gap"], +# ) - dm = MatSciMLDataModule.from_devset( - "MaterialsProjectDataset", - dset_kwargs={ - "transforms": [ - UnitCellCalculator(), - PointCloudToGraphTransform( - "pyg", - cutoff_dist=20.0, - node_keys=["pos", "atomic_numbers"], - ), - FrameAveraging(frame_averaging="3D", fa_method="stochastic"), - ], - }, - ) +# dm = MatSciMLDataModule.from_devset( +# "MaterialsProjectDataset", +# dset_kwargs={ +# "transforms": [ +# UnitCellCalculator(), +# PointCloudToGraphTransform( +# "pyg", +# cutoff_dist=20.0, +# node_keys=["pos", "atomic_numbers"], +# ), +# FrameAveraging(frame_averaging="3D", fa_method="stochastic"), +# ], +# }, +# ) - # run a quick training loop - trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) - trainer.fit(task, datamodule=dm) +# # run a quick training loop +# trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) +# trainer.fit(task, datamodule=dm) -def test_force_regression_with_SAM(): - """ - Tests force regression with SAM using PLEGNNBackbone. 
- """ - devset = MatSciMLDataModule.from_devset( - "S2EFDataset", - dset_kwargs={ - "transforms": [ - PointCloudToGraphTransform( - "dgl", - cutoff_dist=20.0, - node_keys=["pos", "atomic_numbers"], - ), - ], - }, - ) - model_args = { - "embed_in_dim": 128, - "embed_hidden_dim": 32, - "embed_out_dim": 128, - "embed_depth": 5, - "embed_feat_dims": [128, 128, 128], - "embed_message_dims": [128, 128, 128], - "embed_position_dims": [64, 64], - "embed_edge_attributes_dim": 0, - "embed_activation": "relu", - "embed_residual": True, - "embed_normalize": True, - "embed_tanh": True, - "embed_activate_last": False, - "embed_k_linears": 1, - "embed_use_attention": False, - "embed_attention_norm": "sigmoid", - "readout": "sum", - "node_projection_depth": 3, - "node_projection_hidden_dim": 128, - "node_projection_activation": "relu", - "prediction_out_dim": 1, - "prediction_depth": 3, - "prediction_hidden_dim": 128, - "prediction_activation": "relu", - "encoder_only": True, - } +# def test_force_regression_with_SAM(): +# """ +# Tests force regression with SAM using PLEGNNBackbone. +# """ +# devset = MatSciMLDataModule.from_devset( +# "S2EFDataset", +# dset_kwargs={ +# "transforms": [ +# PointCloudToGraphTransform( +# "dgl", +# cutoff_dist=20.0, +# node_keys=["pos", "atomic_numbers"], +# ), +# ], +# }, +# ) +# model_args = { +# "embed_in_dim": 128, +# "embed_hidden_dim": 32, +# "embed_out_dim": 128, +# "embed_depth": 5, +# "embed_feat_dims": [128, 128, 128], +# "embed_message_dims": [128, 128, 128], +# "embed_position_dims": [64, 64], +# "embed_edge_attributes_dim": 0, +# "embed_activation": "relu", +# "embed_residual": True, +# "embed_normalize": True, +# "embed_tanh": True, +# "embed_activate_last": False, +# "embed_k_linears": 1, +# "embed_use_attention": False, +# "embed_attention_norm": "sigmoid", +# "readout": "sum", +# "node_projection_depth": 3, +# "node_projection_hidden_dim": 128, +# "node_projection_activation": "relu", +# "prediction_out_dim": 1, +# "prediction_depth": 3, +# "prediction_hidden_dim": 128, +# "prediction_activation": "relu", +# "encoder_only": True, +# } - task = ForceRegressionTask(encoder_class=PLEGNNBackbone, encoder_kwargs=model_args) - trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) - trainer.fit(task, datamodule=devset) - # make sure losses are tracked - for key in ["energy", "force"]: - assert f"train_{key}" in trainer.logged_metrics +# task = ForceRegressionTask(encoder_class=PLEGNNBackbone, encoder_kwargs=model_args) +# trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) +# trainer.fit(task, datamodule=devset) +# # make sure losses are tracked +# for key in ["energy", "force"]: +# assert f"train_{key}" in trainer.logged_metrics -def test_gradfree_force_regression(): - """ - Tests force regression with SAM using PLEGNNBackbone. 
- """ - devset = MatSciMLDataModule.from_devset( - "S2EFDataset", - dset_kwargs={ - "transforms": [ - PointCloudToGraphTransform( - "dgl", - cutoff_dist=20.0, - node_keys=["pos", "atomic_numbers"], - ), - ], - }, - ) - model_args = { - "embed_in_dim": 128, - "embed_hidden_dim": 32, - "embed_out_dim": 128, - "embed_depth": 5, - "embed_feat_dims": [128, 128, 128], - "embed_message_dims": [128, 128, 128], - "embed_position_dims": [64, 64], - "embed_edge_attributes_dim": 0, - "embed_activation": "relu", - "embed_residual": True, - "embed_normalize": True, - "embed_tanh": True, - "embed_activate_last": False, - "embed_k_linears": 1, - "embed_use_attention": False, - "embed_attention_norm": "sigmoid", - "readout": "sum", - "node_projection_depth": 3, - "node_projection_hidden_dim": 128, - "node_projection_activation": "relu", - "prediction_out_dim": 1, - "prediction_depth": 3, - "prediction_hidden_dim": 128, - "prediction_activation": "relu", - "encoder_only": True, - } - task = GradFreeForceRegressionTask( - encoder_class=PLEGNNBackbone, - encoder_kwargs=model_args, - ) - trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) - trainer.fit(task, datamodule=devset) - # make sure losses are tracked - assert "train_force" in trainer.logged_metrics +# def test_gradfree_force_regression(): +# """ +# Tests force regression with SAM using PLEGNNBackbone. +# """ +# devset = MatSciMLDataModule.from_devset( +# "S2EFDataset", +# dset_kwargs={ +# "transforms": [ +# PointCloudToGraphTransform( +# "dgl", +# cutoff_dist=20.0, +# node_keys=["pos", "atomic_numbers"], +# ), +# ], +# }, +# ) +# model_args = { +# "embed_in_dim": 128, +# "embed_hidden_dim": 32, +# "embed_out_dim": 128, +# "embed_depth": 5, +# "embed_feat_dims": [128, 128, 128], +# "embed_message_dims": [128, 128, 128], +# "embed_position_dims": [64, 64], +# "embed_edge_attributes_dim": 0, +# "embed_activation": "relu", +# "embed_residual": True, +# "embed_normalize": True, +# "embed_tanh": True, +# "embed_activate_last": False, +# "embed_k_linears": 1, +# "embed_use_attention": False, +# "embed_attention_norm": "sigmoid", +# "readout": "sum", +# "node_projection_depth": 3, +# "node_projection_hidden_dim": 128, +# "node_projection_activation": "relu", +# "prediction_out_dim": 1, +# "prediction_depth": 3, +# "prediction_hidden_dim": 128, +# "prediction_activation": "relu", +# "encoder_only": True, +# } +# task = GradFreeForceRegressionTask( +# encoder_class=PLEGNNBackbone, +# encoder_kwargs=model_args, +# ) +# trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) +# trainer.fit(task, datamodule=devset) +# # make sure losses are tracked +# assert "train_force" in trainer.logged_metrics -def test_egnn_binary_classification_with_SAM(): - """ - Test BinaryClassification Task with SAM callback . - """ - dm = MatSciMLDataModule.from_devset( - "NomadDataset", - dset_kwargs={ - "transforms": [ - PeriodicPropertiesTransform(6.0, adaptive_cutoff=True), - PointCloudToGraphTransform("pyg"), - ] - }, - batch_size=8, - ) +# def test_egnn_binary_classification_with_SAM(): +# """ +# Test BinaryClassification Task with SAM callback . 
+# """ +# dm = MatSciMLDataModule.from_devset( +# "NomadDataset", +# dset_kwargs={ +# "transforms": [ +# PeriodicPropertiesTransform(6.0, adaptive_cutoff=True), +# PointCloudToGraphTransform("pyg"), +# ] +# }, +# batch_size=8, +# ) - # this specifies a whole lot to make sure we have coverage - task = BinaryClassificationTask( - encoder_class=EGNN, - encoder_kwargs={ - "hidden_dim": 48, - "output_dim": 32, - "num_conv": 2, - "num_atom_embedding": 200, - }, - lr=1e-3, - weight_decay=0.0, - output_kwargs={ - "lazy": False, - "hidden_dim": 48, - "input_dim": 48, - "dropout": 0.2, - "num_hidden": 2, - }, - task_keys=["spin_polarized"], - ) +# # this specifies a whole lot to make sure we have coverage +# task = BinaryClassificationTask( +# encoder_class=EGNN, +# encoder_kwargs={ +# "hidden_dim": 48, +# "output_dim": 32, +# "num_conv": 2, +# "num_atom_embedding": 200, +# }, +# lr=1e-3, +# weight_decay=0.0, +# output_kwargs={ +# "lazy": False, +# "hidden_dim": 48, +# "input_dim": 48, +# "dropout": 0.2, +# "num_hidden": 2, +# }, +# task_keys=["spin_polarized"], +# ) - trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) - trainer.fit(task, datamodule=dm) +# trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) +# trainer.fit(task, datamodule=dm) def test_multitask_sam(): @@ -365,5 +355,5 @@ def test_multitask_sam(): ("IS2REDataset", is2re), ("S2EFDataset", s2ef), ) - trainer = pl.Trainer(fast_dev_run=10) + trainer = pl.Trainer(fast_dev_run=10, callbacks=SAM()) trainer.fit(task, datamodule=dm) From f19566c72d3e9cf6566a32802549f86d7d468bd8 Mon Sep 17 00:00:00 2001 From: "Gonzales, Carmelo" Date: Wed, 17 Apr 2024 16:02:00 -0700 Subject: [PATCH 2/2] adding check for number of optimizers, adding back in ruff purged items --- matsciml/lightning/callbacks.py | 3 +- matsciml/lightning/tests/test_sam.py | 520 ++++++++++++++------------- 2 files changed, 267 insertions(+), 256 deletions(-) diff --git a/matsciml/lightning/callbacks.py b/matsciml/lightning/callbacks.py index e9b3c0d4..9a87773a 100644 --- a/matsciml/lightning/callbacks.py +++ b/matsciml/lightning/callbacks.py @@ -779,7 +779,8 @@ def on_before_optimizer_step( org_weights = self._first_step(optimizer) with torch.enable_grad(): loss = task._compute_losses(self.batch) - loss = self.extract_optimizer_specific_loss(trainer, optimizer, loss) + if len(trainer.optimizers) > 1: + loss = self.extract_optimizer_specific_loss(trainer, optimizer, loss) loss = self._get_loss(loss) if torch.isfinite(loss): trainer.strategy.backward(loss, optimizer=optimizer) diff --git a/matsciml/lightning/tests/test_sam.py b/matsciml/lightning/tests/test_sam.py index c24b6087..c250f6aa 100644 --- a/matsciml/lightning/tests/test_sam.py +++ b/matsciml/lightning/tests/test_sam.py @@ -5,293 +5,303 @@ from matsciml.datasets.transforms import ( PeriodicPropertiesTransform, PointCloudToGraphTransform, + FrameAveraging, + UnitCellCalculator, ) -from matsciml.lightning import MultiDataModule +from matsciml.lightning import MatSciMLDataModule, MultiDataModule from matsciml.datasets import MultiDataset, IS2REDataset, S2EFDataset +from matsciml.models.pyg import EGNN from matsciml.lightning.callbacks import SAM +from matsciml.models.pyg import FAENet +from torch import nn +from e3nn.o3 import Irreps +from mace.modules.blocks import RealAgnosticInteractionBlock +from matsciml.models.pyg.mace import MACEWrapper from matsciml.models.dgl import PLEGNNBackbone from matsciml.models.base import ( MultiTaskLitModule, ForceRegressionTask, + GradFreeForceRegressionTask, ScalarRegressionTask, 
+ BinaryClassificationTask, ) -# def test_egnn_end_to_end_with_SAM(): -# """ -# Test the end to end pipeline using a devset with EGNN and SAM callback. +def test_egnn_end_to_end_with_SAM(): + """ + Test the end to end pipeline using a devset with EGNN and SAM callback. -# The idea is that this basically mimics an example script to -# try and maximize coverage across dataset to training, which -# is particularly useful for checking new dependencies, etc. -# """ -# dm = MatSciMLDataModule.from_devset( -# "MaterialsProjectDataset", -# dset_kwargs={ -# "transforms": [ -# PeriodicPropertiesTransform(6.0, adaptive_cutoff=True), -# PointCloudToGraphTransform("pyg"), -# ] -# }, -# batch_size=8, -# ) + The idea is that this basically mimics an example script to + try and maximize coverage across dataset to training, which + is particularly useful for checking new dependencies, etc. + """ + dm = MatSciMLDataModule.from_devset( + "MaterialsProjectDataset", + dset_kwargs={ + "transforms": [ + PeriodicPropertiesTransform(6.0, adaptive_cutoff=True), + PointCloudToGraphTransform("pyg"), + ] + }, + batch_size=8, + ) -# # this specifies a whole lot to make sure we have coverage -# task = ScalarRegressionTask( -# encoder_class=EGNN, -# encoder_kwargs={ -# "hidden_dim": 48, -# "output_dim": 32, -# "num_conv": 2, -# "num_atom_embedding": 200, -# }, -# scheduler_kwargs={ -# "CosineAnnealingLR": { -# "T_max": 5, -# "eta_min": 1e-7, -# } -# }, -# lr=1e-3, -# weight_decay=0.0, -# output_kwargs={ -# "lazy": False, -# "hidden_dim": 48, -# "input_dim": 48, -# "dropout": 0.2, -# "num_hidden": 2, -# }, -# task_keys=["band_gap"], -# ) + # this specifies a whole lot to make sure we have coverage + task = ScalarRegressionTask( + encoder_class=EGNN, + encoder_kwargs={ + "hidden_dim": 48, + "output_dim": 32, + "num_conv": 2, + "num_atom_embedding": 200, + }, + scheduler_kwargs={ + "CosineAnnealingLR": { + "T_max": 5, + "eta_min": 1e-7, + } + }, + lr=1e-3, + weight_decay=0.0, + output_kwargs={ + "lazy": False, + "hidden_dim": 48, + "input_dim": 48, + "dropout": 0.2, + "num_hidden": 2, + }, + task_keys=["band_gap"], + ) -# trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) -# trainer.fit(task, datamodule=dm) + trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) + trainer.fit(task, datamodule=dm) -# def test_mace_with_SAM(): -# """ -# Test the MACE Wrapper with SAM callback. -# """ -# # Construct MACE relaxed energy regression with PyG implementation of E(n)-GNN -# task = ScalarRegressionTask( -# encoder_class=MACEWrapper, -# encoder_kwargs={ -# "r_max": 6.0, -# "num_bessel": 3, -# "num_polynomial_cutoff": 3, -# "max_ell": 2, -# "interaction_cls": RealAgnosticInteractionBlock, -# "interaction_cls_first": RealAgnosticInteractionBlock, -# "num_interactions": 2, -# "atom_embedding_dim": 64, -# "MLP_irreps": Irreps("256x0e"), -# "avg_num_neighbors": 10.0, -# "correlation": 1, -# "radial_type": "bessel", -# "gate": nn.Identity(), -# }, -# task_keys=["energy_relaxed"], -# ) +def test_mace_with_SAM(): + """ + Test the MACE Wrapper with SAM callback. 
+ """ + # Construct MACE relaxed energy regression with PyG implementation of E(n)-GNN + task = ScalarRegressionTask( + encoder_class=MACEWrapper, + encoder_kwargs={ + "r_max": 6.0, + "num_bessel": 3, + "num_polynomial_cutoff": 3, + "max_ell": 2, + "interaction_cls": RealAgnosticInteractionBlock, + "interaction_cls_first": RealAgnosticInteractionBlock, + "num_interactions": 2, + "atom_embedding_dim": 64, + "MLP_irreps": Irreps("256x0e"), + "avg_num_neighbors": 10.0, + "correlation": 1, + "radial_type": "bessel", + "gate": nn.Identity(), + }, + task_keys=["energy_relaxed"], + ) -# # Prepare data module -# dm = MatSciMLDataModule.from_devset( -# "IS2REDataset", -# dset_kwargs={ -# "transforms": [ -# PeriodicPropertiesTransform(6.0, adaptive_cutoff=True), -# PointCloudToGraphTransform( -# "pyg", -# node_keys=["pos", "atomic_numbers"], -# ), -# ], -# }, -# ) + # Prepare data module + dm = MatSciMLDataModule.from_devset( + "IS2REDataset", + dset_kwargs={ + "transforms": [ + PeriodicPropertiesTransform(6.0, adaptive_cutoff=True), + PointCloudToGraphTransform( + "pyg", + node_keys=["pos", "atomic_numbers"], + ), + ], + }, + ) -# # Run a quick training loop -# trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) -# trainer.fit(task, datamodule=dm) + # Run a quick training loop + trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) + trainer.fit(task, datamodule=dm) -# def test_faenet_with_SAM(): -# """ -# Test FAENet with SAM Callback. -# """ -# task = ScalarRegressionTask( -# encoder_class=FAENet, -# encoder_kwargs={ -# "pred_as_dict": False, -# "hidden_dim": 128, -# "out_dim": 64, -# "tag_hidden_channels": 0, -# "input_dim": 128, -# }, -# output_kwargs={"lazy": False, "input_dim": 64, "hidden_dim": 64}, -# task_keys=["band_gap"], -# ) +def test_faenet_with_SAM(): + """ + Test FAENet with SAM Callback. + """ + task = ScalarRegressionTask( + encoder_class=FAENet, + encoder_kwargs={ + "pred_as_dict": False, + "hidden_dim": 128, + "out_dim": 64, + "tag_hidden_channels": 0, + "input_dim": 128, + }, + output_kwargs={"lazy": False, "input_dim": 64, "hidden_dim": 64}, + task_keys=["band_gap"], + ) -# dm = MatSciMLDataModule.from_devset( -# "MaterialsProjectDataset", -# dset_kwargs={ -# "transforms": [ -# UnitCellCalculator(), -# PointCloudToGraphTransform( -# "pyg", -# cutoff_dist=20.0, -# node_keys=["pos", "atomic_numbers"], -# ), -# FrameAveraging(frame_averaging="3D", fa_method="stochastic"), -# ], -# }, -# ) + dm = MatSciMLDataModule.from_devset( + "MaterialsProjectDataset", + dset_kwargs={ + "transforms": [ + UnitCellCalculator(), + PointCloudToGraphTransform( + "pyg", + cutoff_dist=20.0, + node_keys=["pos", "atomic_numbers"], + ), + FrameAveraging(frame_averaging="3D", fa_method="stochastic"), + ], + }, + ) -# # run a quick training loop -# trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) -# trainer.fit(task, datamodule=dm) + # run a quick training loop + trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) + trainer.fit(task, datamodule=dm) -# def test_force_regression_with_SAM(): -# """ -# Tests force regression with SAM using PLEGNNBackbone. 
-# """ -# devset = MatSciMLDataModule.from_devset( -# "S2EFDataset", -# dset_kwargs={ -# "transforms": [ -# PointCloudToGraphTransform( -# "dgl", -# cutoff_dist=20.0, -# node_keys=["pos", "atomic_numbers"], -# ), -# ], -# }, -# ) -# model_args = { -# "embed_in_dim": 128, -# "embed_hidden_dim": 32, -# "embed_out_dim": 128, -# "embed_depth": 5, -# "embed_feat_dims": [128, 128, 128], -# "embed_message_dims": [128, 128, 128], -# "embed_position_dims": [64, 64], -# "embed_edge_attributes_dim": 0, -# "embed_activation": "relu", -# "embed_residual": True, -# "embed_normalize": True, -# "embed_tanh": True, -# "embed_activate_last": False, -# "embed_k_linears": 1, -# "embed_use_attention": False, -# "embed_attention_norm": "sigmoid", -# "readout": "sum", -# "node_projection_depth": 3, -# "node_projection_hidden_dim": 128, -# "node_projection_activation": "relu", -# "prediction_out_dim": 1, -# "prediction_depth": 3, -# "prediction_hidden_dim": 128, -# "prediction_activation": "relu", -# "encoder_only": True, -# } +def test_force_regression_with_SAM(): + """ + Tests force regression with SAM using PLEGNNBackbone. + """ + devset = MatSciMLDataModule.from_devset( + "S2EFDataset", + dset_kwargs={ + "transforms": [ + PointCloudToGraphTransform( + "dgl", + cutoff_dist=20.0, + node_keys=["pos", "atomic_numbers"], + ), + ], + }, + ) + model_args = { + "embed_in_dim": 128, + "embed_hidden_dim": 32, + "embed_out_dim": 128, + "embed_depth": 5, + "embed_feat_dims": [128, 128, 128], + "embed_message_dims": [128, 128, 128], + "embed_position_dims": [64, 64], + "embed_edge_attributes_dim": 0, + "embed_activation": "relu", + "embed_residual": True, + "embed_normalize": True, + "embed_tanh": True, + "embed_activate_last": False, + "embed_k_linears": 1, + "embed_use_attention": False, + "embed_attention_norm": "sigmoid", + "readout": "sum", + "node_projection_depth": 3, + "node_projection_hidden_dim": 128, + "node_projection_activation": "relu", + "prediction_out_dim": 1, + "prediction_depth": 3, + "prediction_hidden_dim": 128, + "prediction_activation": "relu", + "encoder_only": True, + } -# task = ForceRegressionTask(encoder_class=PLEGNNBackbone, encoder_kwargs=model_args) -# trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) -# trainer.fit(task, datamodule=devset) -# # make sure losses are tracked -# for key in ["energy", "force"]: -# assert f"train_{key}" in trainer.logged_metrics + task = ForceRegressionTask(encoder_class=PLEGNNBackbone, encoder_kwargs=model_args) + trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) + trainer.fit(task, datamodule=devset) + # make sure losses are tracked + for key in ["energy", "force"]: + assert f"train_{key}" in trainer.logged_metrics -# def test_gradfree_force_regression(): -# """ -# Tests force regression with SAM using PLEGNNBackbone. 
-# """ -# devset = MatSciMLDataModule.from_devset( -# "S2EFDataset", -# dset_kwargs={ -# "transforms": [ -# PointCloudToGraphTransform( -# "dgl", -# cutoff_dist=20.0, -# node_keys=["pos", "atomic_numbers"], -# ), -# ], -# }, -# ) -# model_args = { -# "embed_in_dim": 128, -# "embed_hidden_dim": 32, -# "embed_out_dim": 128, -# "embed_depth": 5, -# "embed_feat_dims": [128, 128, 128], -# "embed_message_dims": [128, 128, 128], -# "embed_position_dims": [64, 64], -# "embed_edge_attributes_dim": 0, -# "embed_activation": "relu", -# "embed_residual": True, -# "embed_normalize": True, -# "embed_tanh": True, -# "embed_activate_last": False, -# "embed_k_linears": 1, -# "embed_use_attention": False, -# "embed_attention_norm": "sigmoid", -# "readout": "sum", -# "node_projection_depth": 3, -# "node_projection_hidden_dim": 128, -# "node_projection_activation": "relu", -# "prediction_out_dim": 1, -# "prediction_depth": 3, -# "prediction_hidden_dim": 128, -# "prediction_activation": "relu", -# "encoder_only": True, -# } -# task = GradFreeForceRegressionTask( -# encoder_class=PLEGNNBackbone, -# encoder_kwargs=model_args, -# ) -# trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) -# trainer.fit(task, datamodule=devset) -# # make sure losses are tracked -# assert "train_force" in trainer.logged_metrics +def test_gradfree_force_regression(): + """ + Tests force regression with SAM using PLEGNNBackbone. + """ + devset = MatSciMLDataModule.from_devset( + "S2EFDataset", + dset_kwargs={ + "transforms": [ + PointCloudToGraphTransform( + "dgl", + cutoff_dist=20.0, + node_keys=["pos", "atomic_numbers"], + ), + ], + }, + ) + model_args = { + "embed_in_dim": 128, + "embed_hidden_dim": 32, + "embed_out_dim": 128, + "embed_depth": 5, + "embed_feat_dims": [128, 128, 128], + "embed_message_dims": [128, 128, 128], + "embed_position_dims": [64, 64], + "embed_edge_attributes_dim": 0, + "embed_activation": "relu", + "embed_residual": True, + "embed_normalize": True, + "embed_tanh": True, + "embed_activate_last": False, + "embed_k_linears": 1, + "embed_use_attention": False, + "embed_attention_norm": "sigmoid", + "readout": "sum", + "node_projection_depth": 3, + "node_projection_hidden_dim": 128, + "node_projection_activation": "relu", + "prediction_out_dim": 1, + "prediction_depth": 3, + "prediction_hidden_dim": 128, + "prediction_activation": "relu", + "encoder_only": True, + } + task = GradFreeForceRegressionTask( + encoder_class=PLEGNNBackbone, + encoder_kwargs=model_args, + ) + trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) + trainer.fit(task, datamodule=devset) + # make sure losses are tracked + assert "train_force" in trainer.logged_metrics -# def test_egnn_binary_classification_with_SAM(): -# """ -# Test BinaryClassification Task with SAM callback . -# """ -# dm = MatSciMLDataModule.from_devset( -# "NomadDataset", -# dset_kwargs={ -# "transforms": [ -# PeriodicPropertiesTransform(6.0, adaptive_cutoff=True), -# PointCloudToGraphTransform("pyg"), -# ] -# }, -# batch_size=8, -# ) +def test_egnn_binary_classification_with_SAM(): + """ + Test BinaryClassification Task with SAM callback . 
+ """ + dm = MatSciMLDataModule.from_devset( + "NomadDataset", + dset_kwargs={ + "transforms": [ + PeriodicPropertiesTransform(6.0, adaptive_cutoff=True), + PointCloudToGraphTransform("pyg"), + ] + }, + batch_size=8, + ) -# # this specifies a whole lot to make sure we have coverage -# task = BinaryClassificationTask( -# encoder_class=EGNN, -# encoder_kwargs={ -# "hidden_dim": 48, -# "output_dim": 32, -# "num_conv": 2, -# "num_atom_embedding": 200, -# }, -# lr=1e-3, -# weight_decay=0.0, -# output_kwargs={ -# "lazy": False, -# "hidden_dim": 48, -# "input_dim": 48, -# "dropout": 0.2, -# "num_hidden": 2, -# }, -# task_keys=["spin_polarized"], -# ) + # this specifies a whole lot to make sure we have coverage + task = BinaryClassificationTask( + encoder_class=EGNN, + encoder_kwargs={ + "hidden_dim": 48, + "output_dim": 32, + "num_conv": 2, + "num_atom_embedding": 200, + }, + lr=1e-3, + weight_decay=0.0, + output_kwargs={ + "lazy": False, + "hidden_dim": 48, + "input_dim": 48, + "dropout": 0.2, + "num_hidden": 2, + }, + task_keys=["spin_polarized"], + ) -# trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) -# trainer.fit(task, datamodule=dm) + trainer = pl.Trainer(fast_dev_run=5, callbacks=[SAM()]) + trainer.fit(task, datamodule=dm) def test_multitask_sam():