determined-ai · shiyuann · Jun 30, 2020 · Jun 30, 2020
diff --git a/common/determined_common/experimental/checkpoint/_torch.py b/common/determined_common/experimental/checkpoint/_torch.py
@@ -17,9 +17,6 @@ def load_model(ckpt_dir: pathlib.Path, metadata: Dict[str, Any], **kwargs: Any)
     trial = cast(PyTorchTrial, trial)
     model = trial.build_model()
     checkpoint = torch.load(ckpt_dir.joinpath("state_dict.pth"), map_location="cpu")  # type: ignore
-
-    # TODO(DET-3456): The checkpoint schema is changed for mutliple models so this function should
-    #       be updated accordingly.
-    model.load_state_dict(checkpoint["models_state_dict"][0])
+    model.load_state_dict(checkpoint["model_state_dict"])
 
     return model
diff --git a/harness/determined/_experiment_config.py b/harness/determined/_experiment_config.py
@@ -23,7 +23,6 @@ def native_enabled(self) -> bool:
     def native_parallel_enabled(self) -> bool:
         return bool(self["resources"]["native_parallel"])
 
-    # TODO(DET-3262): remove this backward compatibility.
     def mixed_precision_enabled(self) -> bool:
         return bool(self["optimizations"]["mixed_precision"] != "O0")
 

diff --git a/harness/determined/pytorch/_callback.py b/harness/determined/pytorch/_callback.py
@@ -47,7 +47,6 @@ def on_before_optimizer_step(self, parameters: Iterator) -> None:
         after gradient updates have been communicated. Typically used to perform gradient
         clipping.
         """
-        # TODO(DET-3267): deprecate this when releasing pytorch flexible primitives.
         pass
 
     def on_validation_step_start(self) -> None:
@@ -88,7 +87,6 @@ def load_state_dict(self, state_dict: Dict[str, Any]) -> None:
         pass
 
 
-# TODO(DET-3267): deprecate this when releasing pytorch flexible primitives.
 class ClipGradsL2Norm(PyTorchCallback):
     """
     Callback that performs gradient clipping using
@@ -102,7 +100,6 @@ def on_before_optimizer_step(self, parameters: Iterator) -> None:
         torch.nn.utils.clip_grad_norm_(parameters, self._clip_value)  # type: ignore
 
 
-# TODO(DET-3267): deprecate this when releasing pytorch flexible primitives.
 class ClipGradsL2Value(PyTorchCallback):
     """
     Callback that performs gradient clipping using

diff --git a/harness/determined/pytorch/_lr_scheduler.py b/harness/determined/pytorch/_lr_scheduler.py
@@ -10,10 +10,9 @@ class LRScheduler:
     """Wrapper for a PyTorch LRScheduler.
 
     This wrapper fulfills two main functions:
-
-    1. Save and restore the learning rate when a trial is paused, preempted, etc.
-    2. Step the learning rate scheduler at the configured frequency
-       (e.g., every batch or every epoch).
+        1. Save and restore the learning rate when a trial is paused, preempted, etc.
+        2. Step the learning rate scheduler at the configured frequency
+           (e.g., every batch or every epoch).
     """
 
     class StepMode(enum.Enum):