Fixes to parity inference task #296

Merged: 6 commits, Sep 27, 2024
1 change: 1 addition & 0 deletions docs/source/index.rst
@@ -17,6 +17,7 @@ The Open MatSciML Toolkit
training
callbacks
experiment-interface
inference
best-practices
how-to
developers
6 changes: 6 additions & 0 deletions docs/source/inference.rst
@@ -40,6 +40,12 @@
these keys, ``predictions`` and ``targets``. Note that ``pred_split`` does not need to be
a completely different hold out: you can pass your training LMDB path if you wish to double-check the
performance of your model after training, or you can use it with unseen samples.

Note that by default, ``predict`` triggers PyTorch's inference mode, a specialized mode in which
autograd is disabled entirely. ``ForceRegressionTask`` uses automatic differentiation to evaluate
forces, so for inference tasks that require gradients you **must** pass ``inference_mode=False``
to ``pl.Trainer``.


.. note::

For developers, this is handled by the ``matsciml.models.inference.ParityData`` class. This is
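The distinction matters because ``torch.no_grad`` can be locally overridden while inference mode cannot. A minimal sketch with a toy quadratic energy function (a stand-in, not the actual ``ForceRegressionTask``):

```python
import torch

pos = torch.randn(4, 3)

# With Trainer(inference_mode=False), Lightning's predict loop runs under
# torch.no_grad(), which a task can locally override to differentiate the
# energy with respect to atomic positions.
with torch.no_grad():
    with torch.enable_grad():
        p = pos.clone().requires_grad_(True)
        energy = (p ** 2).sum()  # toy energy, stand-in for a model forward pass
        forces = -torch.autograd.grad(energy, p)[0]

# Under the default torch.inference_mode(), outputs are "inference tensors"
# that can never re-enter autograd, so force evaluation would fail.
with torch.inference_mode():
    energy = (pos ** 2).sum()

print(forces.shape)          # torch.Size([4, 3])
print(energy.is_inference()) # True
```

The nested ``enable_grad`` pattern is why ``no_grad`` suffices for force prediction while inference mode does not.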
5 changes: 4 additions & 1 deletion matsciml/lightning/data_utils.py
@@ -259,6 +259,9 @@ def setup(self, stage: str | None = None) -> None:
f"Prediction split provided, but not found: {pred_split_path}"
)
dset = self._make_dataset(pred_split_path, self.dataset)
# assumes that if we're providing a predict set, we're not going
# to be doing training in the same run
self.dataset = dset
splits["pred"] = dset
# the last case assumes only the dataset is passed, we will treat it as train
if len(splits) == 0:
@@ -288,7 +291,7 @@ def predict_dataloader(self):
target,
batch_size=self.hparams.batch_size,
num_workers=self.hparams.num_workers,
-            collate_fn=self.dataset.collate_fn,
+            collate_fn=target.collate_fn,
persistent_workers=self.persistent_workers,
)

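The one-line change matters when the prediction split is backed by a different dataset class than ``self.dataset``: batches must be collated by the dataset actually being served. A hypothetical plain-Python stand-in (not the real matsciml datasets) showing why the two ``collate_fn``s are not interchangeable:

```python
# Hypothetical datasets with incompatible batching rules.
class GraphDataset:
    @staticmethod
    def collate_fn(samples):
        return {"graph_batch": samples}

class PointCloudDataset:
    @staticmethod
    def collate_fn(samples):
        return {"point_cloud_batch": samples}

self_dataset = GraphDataset()   # what the datamodule was configured with
target = PointCloudDataset()    # the split behind predict_dataloader

# Pre-fix, self_dataset.collate_fn would have batched point-cloud samples
# with graph rules; the fix collates with the prediction split itself.
batch = target.collate_fn(["sample_a", "sample_b"])
print(batch)  # {'point_cloud_batch': ['sample_a', 'sample_b']}
```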
20 changes: 16 additions & 4 deletions matsciml/models/inference.py
@@ -60,7 +60,7 @@ def targets(self, values: torch.Tensor) -> None:

@property
def predictions(self) -> torch.Tensor:
-        return torch.vstack(self._targets)
+        return torch.vstack(self._predictions)

@predictions.setter
def predictions(self, values: torch.Tensor) -> None:
@@ -112,8 +112,7 @@ def predict_step(

@classmethod
def from_pretrained_checkpoint(
-        cls,
-        task_ckpt_path: str | Path,
+        cls, task_ckpt_path: str | Path, ckpt_class_name: str | None = None
) -> BaseInferenceTask:
"""
Instantiate a ``BaseInferenceTask`` from an existing Lightning checkpoint
@@ -124,9 +123,15 @@ def from_pretrained_checkpoint(

Parameters
----------
-        task_ckpt_path : Union[str, Path]
+        task_ckpt_path : str | Path
Path to an existing task checkpoint file. Typically, this
would be a PyTorch Lightning checkpoint.
        ckpt_class_name : str, optional
            If specified, the task is loaded via its own
            ``load_from_checkpoint`` method. This is a good alternative
            when this method cannot resolve parameter naming, or when
            your inference task depends on methods specific to that task.

Examples
--------
@@ -143,6 +148,13 @@
assert (
task_ckpt_path.exists()
), "Encoder checkpoint filepath specified but does not exist."
# if a task name for the checkpoint is given, use that task's
# loading method directly
if ckpt_class_name:
task_cls = registry.get_task_class(ckpt_class_name)
if not task_cls:
                raise KeyError(f"Requested {ckpt_class_name}, which is not a registered task.")
return cls(task_cls.load_from_checkpoint(str(task_ckpt_path)))
ckpt = torch.load(task_ckpt_path)
select_kwargs = {}
for key in ["encoder_class", "encoder_kwargs"]:
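The new ``ckpt_class_name`` fast path can be sketched with a toy registry. All names here are hypothetical stand-ins (matsciml's real registry API may differ), but the control flow mirrors the lines added above, including raising on an unregistered name:

```python
# Toy registry mirroring the ckpt_class_name fallback added in this PR.
TASK_REGISTRY = {}

class ForceRegressionTask:
    @classmethod
    def load_from_checkpoint(cls, path):
        # stand-in for Lightning's load_from_checkpoint
        task = cls()
        task.ckpt_path = path
        return task

TASK_REGISTRY["ForceRegressionTask"] = ForceRegressionTask

def from_pretrained_checkpoint(task_ckpt_path, ckpt_class_name=None):
    if ckpt_class_name:
        task_cls = TASK_REGISTRY.get(ckpt_class_name)
        if not task_cls:
            # Report the requested *name*: the class lookup failed,
            # so task_cls itself is None here.
            raise KeyError(
                f"Requested {ckpt_class_name}, which is not a registered task."
            )
        return task_cls.load_from_checkpoint(str(task_ckpt_path))
    # ...otherwise fall back to inspecting the checkpoint manually, as above.

task = from_pretrained_checkpoint("epoch=9.ckpt", ckpt_class_name="ForceRegressionTask")
print(type(task).__name__)  # ForceRegressionTask
```

Routing through the task's own ``load_from_checkpoint`` sidesteps any mismatch between checkpoint hyperparameter names and the generic reconstruction path.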