Commit 381e526

Merge branch 'master' into feat/enable_auto_tying__for_tpus
2 parents: 82bf7d3 + b054d21

47 files changed: +246 additions, -303 deletions

CHANGELOG.md

Lines changed: 9 additions & 3 deletions

@@ -163,6 +163,9 @@ The format is based on [Keep a Changelog](http://keepachangelog.com/en/1.0.0/).
 - Added `pl_legacy_patch` load utility for loading old checkpoints that have pickled legacy Lightning attributes ([#9166](https://github.com/PyTorchLightning/pytorch-lightning/pull/9166))
 
 
+- Added support for `torch.use_deterministic_algorithms` ([#9121](https://github.com/PyTorchLightning/pytorch-lightning/pull/9121))
+
+
 - Enabled auto parameters tying for TPUs ([#9525](https://github.com/PyTorchLightning/pytorch-lightning/pull/9525))
 
 
@@ -228,9 +231,6 @@ The format is based on [Keep a Changelog](http://keepachangelog.com/en/1.0.0/).
 - Executing the `optimizer_closure` is now required when overriding the `optimizer_step` hook ([#9360](https://github.com/PyTorchLightning/pytorch-lightning/pull/9360))
 
 
-- Removed `TrainerProperties` mixin and moved property definitions directly into `Trainer` ([#9495](https://github.com/PyTorchLightning/pytorch-lightning/pull/9495))
-
-
 - Changed logging of `LightningModule` and `LightningDataModule` hyperparameters to raise an exception only if there are colliding keys with different values ([#9496](https://github.com/PyTorchLightning/pytorch-lightning/pull/9496))
 
 
@@ -349,6 +349,9 @@ The format is based on [Keep a Changelog](http://keepachangelog.com/en/1.0.0/).
 - Removed `TrainingTypePlugin.on_save` and `Accelerator.on_save` ([#9023](https://github.com/PyTorchLightning/pytorch-lightning/pull/9023))
 
 
+- Removed `{Accelerator,TrainingTypePlugin,PrecisionPlugin}.post_optimizer_step` ([#9746](https://github.com/PyTorchLightning/pytorch-lightning/pull/9746))
+
+
 - Removed deprecated `connect_precision_plugin` and `connect_training_type_plugin` from `Accelerator` ([#9019](https://github.com/PyTorchLightning/pytorch-lightning/pull/9019))
 
 
@@ -397,6 +400,9 @@ The format is based on [Keep a Changelog](http://keepachangelog.com/en/1.0.0/).
 - Removed `call_configure_sharded_model_hook` property from `Accelerator` and `TrainingTypePlugin` ([#9612](https://github.com/PyTorchLightning/pytorch-lightning/pull/9612))
 
 
+- Removed `TrainerProperties` mixin and moved property definitions directly into `Trainer` ([#9495](https://github.com/PyTorchLightning/pytorch-lightning/pull/9495))
+
+
 ### Fixed
 
 
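
For context on the `torch.use_deterministic_algorithms` entry above, here is a minimal sketch of what that PyTorch switch does, using plain PyTorch APIs only (the seed value is an arbitrary example, not taken from this commit):

    import torch

    # Ask PyTorch to prefer deterministic kernels and to raise an error when an
    # operation has no deterministic implementation.
    torch.use_deterministic_algorithms(True)

    # A fixed seed is still needed for run-to-run reproducibility.
    torch.manual_seed(42)

    x = torch.randn(4, 4)
    y = x @ x  # matmul has a deterministic path, so this succeeds
    print(torch.are_deterministic_algorithms_enabled())  # True
    # Note: on CUDA, some ops additionally require the CUBLAS_WORKSPACE_CONFIG
    # environment variable to be set before they can run deterministically.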

benchmarks/test_basic_parity.py

Lines changed: 1 addition & 1 deletion

@@ -151,6 +151,7 @@ def vanilla_loop(cls_model, idx, device_type: str = "cuda", num_epochs=10):
 
 def lightning_loop(cls_model, idx, device_type: str = "cuda", num_epochs=10):
     seed_everything(idx)
+    torch.backends.cudnn.deterministic = True
 
     model = cls_model()
     # init model parts
@@ -161,7 +162,6 @@ def lightning_loop(cls_model, idx, device_type: str = "cuda", num_epochs=10):
         weights_summary=None,
         gpus=1 if device_type == "cuda" else 0,
         checkpoint_callback=False,
-        deterministic=True,
         logger=False,
         replace_sampler_ddp=False,
     )
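
The hunks above trade the Trainer-level `deterministic=True` flag for a direct assignment to the cuDNN backend flag inside `lightning_loop`. A minimal sketch of the two ways to request deterministic behaviour (the Trainer arguments shown are illustrative, not the benchmark's full configuration):

    import torch
    from pytorch_lightning import Trainer, seed_everything

    seed_everything(1)

    # Option A: let Lightning configure determinism through the Trainer flag.
    trainer = Trainer(deterministic=True, max_epochs=1, logger=False, checkpoint_callback=False)

    # Option B: set the cuDNN flag yourself, as the benchmark now does.
    torch.backends.cudnn.deterministic = True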

docs/source/advanced/mixed_precision.rst

Lines changed: 3 additions & 3 deletions

@@ -30,7 +30,7 @@ Since computation happens in FP16, there is a chance of numerical instability. T
 When using TPUs, setting ``precision=16`` will enable bfloat16 which is the only supported precision type on TPUs.
 
 .. testcode::
-    :skipif: not _APEX_AVAILABLE and not _NATIVE_AMP_AVAILABLE or not torch.cuda.is_available()
+    :skipif: not torch.cuda.is_available()
 
     Trainer(gpus=1, precision=16)
 
@@ -71,13 +71,13 @@ NVIDIA APEX Mixed Precision
 `NVIDIA APEX <https://github.com/NVIDIA/apex>`__ offers some additional flexibility in setting mixed precision. This can be useful for when wanting to try out different precision configurations, such as keeping most of your weights in FP16 as well as running computation in FP16.
 
 .. testcode::
-    :skipif: not _APEX_AVAILABLE and not _NATIVE_AMP_AVAILABLE or not torch.cuda.is_available()
+    :skipif: not _APEX_AVAILABLE or not torch.cuda.is_available()
 
     Trainer(gpus=1, amp_backend="apex")
 
 Set the `NVIDIA optimization level <https://nvidia.github.io/apex/amp.html#opt-levels>`__ via the trainer.
 
 .. testcode::
-    :skipif: not _APEX_AVAILABLE and not _NATIVE_AMP_AVAILABLE or not torch.cuda.is_available()
+    :skipif: not _APEX_AVAILABLE or not torch.cuda.is_available()
 
     Trainer(gpus=1, amp_backend="apex", amp_level="O2")
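
The `:skipif:` edits above drop the `_NATIVE_AMP_AVAILABLE` check and keep only the conditions that can still fail: a CUDA device for native AMP, plus the optional APEX install for the `apex` backend. A small sketch of equivalent runtime guards (`_APEX_AVAILABLE` is imported the same way this commit's `conf.py` does; the rest is standard PyTorch/Lightning):

    import torch
    from pytorch_lightning import Trainer
    from pytorch_lightning.utilities import _APEX_AVAILABLE

    if torch.cuda.is_available():
        # Native AMP ships with PyTorch itself, so only a GPU is required.
        trainer = Trainer(gpus=1, precision=16)

    if _APEX_AVAILABLE and torch.cuda.is_available():
        # APEX is a separate optional install, so it keeps its own guard.
        trainer = Trainer(gpus=1, amp_backend="apex", amp_level="O2")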

docs/source/common/trainer.rst

Lines changed: 2 additions & 2 deletions

@@ -1172,7 +1172,7 @@ Lightning supports either double precision (64), full precision (32), or half pr
 Half precision, or mixed precision, is the combined use of 32 and 16 bit floating points to reduce memory footprint during model training. This can result in improved performance, achieving +3X speedups on modern GPUs.
 
 .. testcode::
-    :skipif: not _APEX_AVAILABLE and not _NATIVE_AMP_AVAILABLE or not torch.cuda.is_available()
+    :skipif: not torch.cuda.is_available()
 
     # default used by the Trainer
     trainer = Trainer(precision=32, gpus=1)
@@ -1221,7 +1221,7 @@ Half precision, or mixed precision, is the combined use of 32 and 16 bit floatin
 2. Set the `precision` trainer flag to 16. You can customize the `Apex optimization level <https://nvidia.github.io/apex/amp.html#opt-levels>`_ by setting the `amp_level` flag.
 
 .. testcode::
-    :skipif: not _APEX_AVAILABLE and not _NATIVE_AMP_AVAILABLE or not torch.cuda.is_available()
+    :skipif: not _APEX_AVAILABLE or not torch.cuda.is_available()
 
     # turn on 16-bit
     trainer = Trainer(amp_backend="apex", amp_level="O2", precision=16)
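
For readers unfamiliar with what `amp_level="O2"` selects, here is a rough sketch of the raw APEX call that Lightning's `apex` backend wraps, assuming APEX and a CUDA device are available (the model and optimizer are placeholders, not code from this repository):

    import torch
    from apex import amp

    model = torch.nn.Linear(16, 4).cuda()
    optimizer = torch.optim.SGD(model.parameters(), lr=0.1)

    # "O2" keeps most weights in FP16 and patches ops to cast automatically;
    # see https://nvidia.github.io/apex/amp.html#opt-levels for the full matrix.
    model, optimizer = amp.initialize(model, optimizer, opt_level="O2")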

docs/source/conf.py

Lines changed: 0 additions & 1 deletion

@@ -369,7 +369,6 @@ def package_list_from_file(file):
 import pytorch_lightning as pl
 from pytorch_lightning import LightningDataModule, LightningModule, Trainer
 from pytorch_lightning.utilities import (
-    _NATIVE_AMP_AVAILABLE,
     _APEX_AVAILABLE,
     _XLA_AVAILABLE,
     _TPU_AVAILABLE,

docs/source/guides/speed.rst

Lines changed: 1 addition & 1 deletion

@@ -214,7 +214,7 @@ Lightning offers mixed precision training for GPUs and CPUs, as well as bfloat16
 
 
 .. testcode::
-    :skipif: not _APEX_AVAILABLE and not _NATIVE_AMP_AVAILABLE or not torch.cuda.is_available()
+    :skipif: torch.cuda.device_count() < 4
 
     # 16-bit precision
     trainer = Trainer(precision=16, gpus=4)

pytorch_lightning/accelerators/accelerator.py

Lines changed: 2 additions & 6 deletions

@@ -16,6 +16,7 @@
 
 import torch
 from torch import Tensor
+from torch.cuda.amp import GradScaler
 from torch.nn import Module
 from torch.optim import Optimizer
 from torch.utils.data import DataLoader
@@ -24,14 +25,11 @@
 from pytorch_lightning.plugins.precision import ApexMixedPrecisionPlugin, NativeMixedPrecisionPlugin, PrecisionPlugin
 from pytorch_lightning.plugins.training_type import DataParallelPlugin, TrainingTypePlugin
 from pytorch_lightning.trainer.states import TrainerFn
-from pytorch_lightning.utilities import _NATIVE_AMP_AVAILABLE, rank_zero_deprecation
+from pytorch_lightning.utilities import rank_zero_deprecation
 from pytorch_lightning.utilities.apply_func import apply_to_collection, move_data_to_device
 from pytorch_lightning.utilities.enums import AMPType, GradClipAlgorithmType, LightningEnum
 from pytorch_lightning.utilities.types import _PATH, STEP_OUTPUT
 
-if _NATIVE_AMP_AVAILABLE:
-    from torch.cuda.amp import GradScaler
-
 
 class Accelerator:
     """The Accelerator Base Class. An Accelerator is meant to deal with one type of Hardware.
@@ -258,8 +256,6 @@ def optimizer_step(self, optimizer: Optimizer, opt_idx: int, lambda_closure: Cal
         )
         if make_optimizer_step:
             self.run_optimizer_step(optimizer, opt_idx, lambda_closure, **kwargs)
-        self.precision_plugin.post_optimizer_step(optimizer, opt_idx)
-        self.training_type_plugin.post_optimizer_step(optimizer, opt_idx, **kwargs)
 
     def run_optimizer_step(
         self, optimizer: Optimizer, optimizer_idx: int, lambda_closure: Callable, **kwargs: Any
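
The import hunks above make `GradScaler` an unconditional top-level import, presumably because every PyTorch version the project still supports ships `torch.cuda.amp`, which leaves the `_NATIVE_AMP_AVAILABLE` guard with nothing to protect. For orientation, a minimal sketch of the standard `GradScaler` + `autocast` step that native AMP is built around (generic PyTorch usage on a CUDA device, not the Accelerator's actual code path):

    import torch
    from torch.cuda.amp import GradScaler, autocast

    model = torch.nn.Linear(32, 2).cuda()
    optimizer = torch.optim.SGD(model.parameters(), lr=0.01)
    scaler = GradScaler()

    data = torch.randn(8, 32, device="cuda")
    target = torch.randint(0, 2, (8,), device="cuda")

    optimizer.zero_grad()
    with autocast():
        loss = torch.nn.functional.cross_entropy(model(data), target)
    scaler.scale(loss).backward()  # scale the loss to avoid FP16 gradient underflow
    scaler.step(optimizer)         # unscales gradients, then runs optimizer.step()
    scaler.update()                # adjusts the scale factor for the next iteration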

pytorch_lightning/callbacks/progress/rich_progress.py

Lines changed: 1 addition & 1 deletion

@@ -209,7 +209,7 @@ def __init__(
     ) -> None:
         if not _RICH_AVAILABLE:
             raise ImportError(
-                "`RichProgressBar` requires `rich` to be installed. Install it by running `pip install rich`."
+                "`RichProgressBar` requires `rich` to be installed. Install it by running `pip install -U rich`."
             )
         super().__init__()
         self._refresh_rate_per_second: int = refresh_rate_per_second

pytorch_lightning/callbacks/rich_model_summary.py

Lines changed: 1 addition & 1 deletion

@@ -61,7 +61,7 @@ class RichModelSummary(ModelSummary):
     def __init__(self, max_depth: int = 1) -> None:
         if not _RICH_AVAILABLE:
             raise ImportError(
-                "`RichModelSummary` requires `rich` to be installed. Install it by running `pip install rich`."
+                "`RichModelSummary` requires `rich` to be installed. Install it by running `pip install -U rich`."
             )
         super().__init__(max_depth)
 

pytorch_lightning/loops/optimization/optimizer_loop.py

Lines changed: 6 additions & 11 deletions

@@ -371,7 +371,11 @@ def _run_optimization_end(self, opt_idx: int) -> None:
             model.untoggle_optimizer(opt_idx)
 
     def _optimizer_step(
-        self, optimizer: torch.optim.Optimizer, opt_idx: int, batch_idx: int, train_step_and_backward_closure: Callable
+        self,
+        optimizer: Optimizer,
+        opt_idx: int,
+        batch_idx: int,
+        train_step_and_backward_closure: Callable[[], Optional[Tensor]],
     ) -> None:
         """Performs the optimizer step and some sanity checking.
 
@@ -385,15 +389,6 @@ def _optimizer_step(
         lightning_module = self.trainer.lightning_module
 
         is_lbfgs = isinstance(optimizer, torch.optim.LBFGS)
-        using_native_amp = self.trainer.amp_backend is not None and self.trainer.amp_backend == AMPType.NATIVE
-
-        # native amp + lbfgs is a no go right now
-        if using_native_amp and is_lbfgs:
-            raise MisconfigurationException(
-                "native PyTorch amp and lbfgs are not compatible."
-                " To request, please file a Github issue in PyTorch and tag @mcarilli"
-            )
-
         # wraps into LightningOptimizer only for running step
         optimizer = LightningOptimizer._to_lightning_optimizer(optimizer, self.trainer, opt_idx)
 
@@ -407,7 +402,7 @@ def _optimizer_step(
             opt_idx,
             train_step_and_backward_closure,
             on_tpu=(self.trainer._device_type == DeviceType.TPU and _TPU_AVAILABLE),
-            using_native_amp=using_native_amp,
+            using_native_amp=(self.trainer.amp_backend is not None and self.trainer.amp_backend == AMPType.NATIVE),
             using_lbfgs=is_lbfgs,
         )
 
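
The hunks above reflow the `_optimizer_step` signature, inline the `using_native_amp` computation, and drop the old native-AMP + LBFGS guard; the flags that reach a user-overridden `optimizer_step` hook are unchanged. A hedged sketch of such an override, following the hook signature this Lightning release documents (only the hook is shown, and the warmup schedule is an invented illustration, not code from this commit):

    from pytorch_lightning import LightningModule


    class MyModel(LightningModule):
        def optimizer_step(
            self,
            epoch,
            batch_idx,
            optimizer,
            optimizer_idx,
            optimizer_closure,
            on_tpu=False,
            using_native_amp=False,
            using_lbfgs=False,
        ):
            # Illustrative warmup: linearly scale the LR over the first 500 steps.
            if self.trainer.global_step < 500:
                lr_scale = min(1.0, float(self.trainer.global_step + 1) / 500.0)
                for pg in optimizer.param_groups:
                    pg["lr"] = lr_scale * 0.001

            # Per the changelog entry in this commit, executing the closure is
            # required: passing it to `optimizer.step` runs training_step + backward.
            optimizer.step(closure=optimizer_closure)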
