-
Notifications
You must be signed in to change notification settings - Fork 3.4k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
refactor accelerator teardown -> training type plugin teardown (#7579)
- Loading branch information
1 parent
a8d9b5f
commit 2242423
Showing
15 changed files
with
237 additions
and
32 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,48 @@ | ||
# Copyright The PyTorch Lightning team. | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
import torch | ||
|
||
from pytorch_lightning import Trainer | ||
from pytorch_lightning.plugins import DDPPlugin | ||
from tests.helpers.boring_model import BoringModel | ||
from tests.helpers.runif import RunIf | ||
|
||
|
||
class BoringModelGPU(BoringModel): | ||
|
||
def on_train_start(self) -> None: | ||
# make sure that the model is on GPU when training | ||
assert self.device == torch.device(f"cuda:{self.trainer.training_type_plugin.local_rank}") | ||
self.start_cuda_memory = torch.cuda.memory_allocated() | ||
|
||
|
||
@RunIf(skip_windows=True, min_gpus=2, special=True) | ||
def test_ddp_with_2_gpus(): | ||
"""Tests if device is set correctely when training and after teardown for DDPPlugin.""" | ||
trainer = Trainer(gpus=2, accelerator="ddp", fast_dev_run=True) | ||
# assert training type plugin attributes for device setting | ||
assert isinstance(trainer.training_type_plugin, DDPPlugin) | ||
assert trainer.training_type_plugin.on_gpu | ||
assert not trainer.training_type_plugin.on_tpu | ||
local_rank = trainer.training_type_plugin.local_rank | ||
assert trainer.training_type_plugin.root_device == torch.device(f"cuda:{local_rank}") | ||
|
||
model = BoringModelGPU() | ||
|
||
trainer.fit(model) | ||
|
||
# assert after training, model is moved to CPU and memory is deallocated | ||
assert model.device == torch.device("cpu") | ||
cuda_memory = torch.cuda.memory_allocated() | ||
assert cuda_memory < model.start_cuda_memory |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,42 @@ | ||
# Copyright The PyTorch Lightning team. | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
import torch | ||
|
||
from pytorch_lightning import Trainer | ||
from pytorch_lightning.plugins import DDPSpawnPlugin | ||
from tests.helpers.boring_model import BoringModel | ||
from tests.helpers.runif import RunIf | ||
|
||
|
||
class BoringModelDDPCPU(BoringModel): | ||
|
||
def on_train_start(self) -> None: | ||
# make sure that the model is on CPU when training | ||
assert self.device == torch.device("cpu") | ||
|
||
|
||
@RunIf(skip_windows=True) | ||
def test_ddp_cpu(): | ||
"""Tests if device is set correctely when training for DDPSpawnPlugin.""" | ||
trainer = Trainer(num_processes=2, fast_dev_run=True) | ||
# assert training type plugin attributes for device setting | ||
|
||
assert isinstance(trainer.training_type_plugin, DDPSpawnPlugin) | ||
assert not trainer.training_type_plugin.on_gpu | ||
assert not trainer.training_type_plugin.on_tpu | ||
assert trainer.training_type_plugin.root_device == torch.device("cpu") | ||
|
||
model = BoringModelDDPCPU() | ||
|
||
trainer.fit(model) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.