lightning/tests/plugins/test_ddp_plugin.py

import os
from unittest import mock

import pytest
from pytorch_lightning import Trainer, accelerators
from pytorch_lightning.callbacks import Callback
from pytorch_lightning.plugins.ddp_plugin import DDPPlugin
from tests.base.boring_model import BoringModel


@mock.patch.dict(
    os.environ,
    {
        "CUDA_VISIBLE_DEVICES": "0,1",
        "SLURM_NTASKS": "2",
        "SLURM_JOB_NAME": "SOME_NAME",
        "SLURM_NODEID": "0",
        "LOCAL_RANK": "0",
        "SLURM_LOCALID": "0",
    },
)
@mock.patch("torch.cuda.device_count", return_value=2)
@pytest.mark.parametrize(
    ["ddp_backend", "gpus", "num_processes"],
    [("ddp_cpu", None, None), ("ddp", 2, 0), ("ddp2", 2, 0), ("ddp_spawn", 2, 0)],
)
def test_ddp_choice_default_ddp_cpu(tmpdir, ddp_backend, gpus, num_processes):
    class CB(Callback):
        def on_fit_start(self, trainer, pl_module):
            assert isinstance(trainer.accelerator_backend.ddp_plugin, DDPPlugin)
            raise SystemExit()

    model = BoringModel()
    trainer = Trainer(
        fast_dev_run=True,
        gpus=gpus,
        num_processes=num_processes,
        distributed_backend=ddp_backend,
        callbacks=[CB()],
    )

    with pytest.raises(SystemExit):
        trainer.fit(model)


@mock.patch.dict(
    os.environ,
    {
        "CUDA_VISIBLE_DEVICES": "0,1",
        "SLURM_NTASKS": "2",
        "SLURM_JOB_NAME": "SOME_NAME",
        "SLURM_NODEID": "0",
        "LOCAL_RANK": "0",
        "SLURM_LOCALID": "0",
    },
)
@mock.patch("torch.cuda.device_count", return_value=2)
@pytest.mark.parametrize(
    ["ddp_backend", "gpus", "num_processes"],
    [("ddp_cpu", None, None), ("ddp", 2, 0), ("ddp2", 2, 0), ("ddp_spawn", 2, 0)],
)
def test_ddp_choice_custom_ddp_cpu(tmpdir, ddp_backend, gpus, num_processes):
    class MyDDP(DDPPlugin):
        pass

    class CB(Callback):
        def on_fit_start(self, trainer, pl_module):
            assert isinstance(trainer.accelerator_backend.ddp_plugin, MyDDP)
            raise SystemExit()

    model = BoringModel()
    trainer = Trainer(
        fast_dev_run=True,
        gpus=gpus,
        num_processes=num_processes,
        distributed_backend=ddp_backend,
        plugins=[MyDDP()],
        callbacks=[CB()],
    )

    with pytest.raises(SystemExit):
        trainer.fit(model)


@mock.patch.dict(
    os.environ,
    {
        "CUDA_VISIBLE_DEVICES": "0,1",
        "SLURM_NTASKS": "2",
        "SLURM_JOB_NAME": "SOME_NAME",
        "SLURM_NODEID": "0",
        "LOCAL_RANK": "0",
        "SLURM_LOCALID": "0",
    },
)
@mock.patch("torch.cuda.device_count", return_value=2)
@pytest.mark.parametrize(
    ["ddp_backend", "gpus", "num_processes"],
    [("ddp_cpu", None, None), ("ddp", 2, 0), ("ddp2", 2, 0), ("ddp_spawn", 2, 0)],
)
def test_ddp_choice_custom_ddp_cpu_custom_args(
    tmpdir, ddp_backend, gpus, num_processes
):
    class MyDDP(DDPPlugin):
        pass

    class CB(Callback):
        def on_fit_start(self, trainer, pl_module):
            assert isinstance(trainer.accelerator_backend.ddp_plugin, MyDDP)
            raise SystemExit()

    model = BoringModel()
    trainer = Trainer(
        fast_dev_run=True,
        gpus=gpus,
        num_processes=num_processes,
        distributed_backend=ddp_backend,
        plugins=[MyDDP(broadcast_buffers=False, find_unused_parameters=True)],
        callbacks=[CB()],
    )

    with pytest.raises(SystemExit):
        trainer.fit(model)
enable ddp as a plugin (#4285) * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin Co-authored-by: chaton <thomas@grid.ai> 2020-10-22 09:15:51 +00:00			`import os`
			`from unittest import mock`

Enable DDP Plugin to pass through args to LightningDistributedDataParallel (#4382) * Update ddp_plugin.py * Update ddp_plugin.py * Update ddp_plugin.py * Update test_ddp_plugin.py * Update pytorch_lightning/plugins/ddp_plugin.py * Update pytorch_lightning/plugins/ddp_plugin.py * Fixed imports, make ddp_kwargs protected Co-authored-by: SeanNaren <sean.narenthiran@gmail.com> 2020-10-27 12:27:59 +00:00			`import pytest`
			`from pytorch_lightning import Trainer, accelerators`
			`from pytorch_lightning.callbacks import Callback`
			`from pytorch_lightning.plugins.ddp_plugin import DDPPlugin`
			`from tests.base.boring_model import BoringModel`
enable ddp as a plugin (#4285) * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin Co-authored-by: chaton <thomas@grid.ai> 2020-10-22 09:15:51 +00:00

Enable DDP Plugin to pass through args to LightningDistributedDataParallel (#4382) * Update ddp_plugin.py * Update ddp_plugin.py * Update ddp_plugin.py * Update test_ddp_plugin.py * Update pytorch_lightning/plugins/ddp_plugin.py * Update pytorch_lightning/plugins/ddp_plugin.py * Fixed imports, make ddp_kwargs protected Co-authored-by: SeanNaren <sean.narenthiran@gmail.com> 2020-10-27 12:27:59 +00:00			`@mock.patch.dict(`
			`os.environ,`
			`{`
			`"CUDA_VISIBLE_DEVICES": "0,1",`
			`"SLURM_NTASKS": "2",`
			`"SLURM_JOB_NAME": "SOME_NAME",`
			`"SLURM_NODEID": "0",`
			`"LOCAL_RANK": "0",`
			`"SLURM_LOCALID": "0",`
			`},`
			`)`
			`@mock.patch("torch.cuda.device_count", return_value=2)`
			`@pytest.mark.parametrize(`
			`["ddp_backend", "gpus", "num_processes"],`
			`[("ddp_cpu", None, None), ("ddp", 2, 0), ("ddp2", 2, 0), ("ddp_spawn", 2, 0)],`
			`)`
			`def test_ddp_choice_default_ddp_cpu(tmpdir, ddp_backend, gpus, num_processes):`
enable ddp as a plugin (#4285) * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin Co-authored-by: chaton <thomas@grid.ai> 2020-10-22 09:15:51 +00:00			`class CB(Callback):`
			`def on_fit_start(self, trainer, pl_module):`
			`assert isinstance(trainer.accelerator_backend.ddp_plugin, DDPPlugin)`
			`raise SystemExit()`

			`model = BoringModel()`
			`trainer = Trainer(`
			`fast_dev_run=True,`
			`gpus=gpus,`
			`num_processes=num_processes,`
			`distributed_backend=ddp_backend,`
Enable DDP Plugin to pass through args to LightningDistributedDataParallel (#4382) * Update ddp_plugin.py * Update ddp_plugin.py * Update ddp_plugin.py * Update test_ddp_plugin.py * Update pytorch_lightning/plugins/ddp_plugin.py * Update pytorch_lightning/plugins/ddp_plugin.py * Fixed imports, make ddp_kwargs protected Co-authored-by: SeanNaren <sean.narenthiran@gmail.com> 2020-10-27 12:27:59 +00:00			`callbacks=[CB()],`
enable ddp as a plugin (#4285) * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin Co-authored-by: chaton <thomas@grid.ai> 2020-10-22 09:15:51 +00:00			`)`

			`with pytest.raises(SystemExit):`
			`trainer.fit(model)`


Enable DDP Plugin to pass through args to LightningDistributedDataParallel (#4382) * Update ddp_plugin.py * Update ddp_plugin.py * Update ddp_plugin.py * Update test_ddp_plugin.py * Update pytorch_lightning/plugins/ddp_plugin.py * Update pytorch_lightning/plugins/ddp_plugin.py * Fixed imports, make ddp_kwargs protected Co-authored-by: SeanNaren <sean.narenthiran@gmail.com> 2020-10-27 12:27:59 +00:00			`@mock.patch.dict(`
			`os.environ,`
			`{`
			`"CUDA_VISIBLE_DEVICES": "0,1",`
			`"SLURM_NTASKS": "2",`
			`"SLURM_JOB_NAME": "SOME_NAME",`
			`"SLURM_NODEID": "0",`
			`"LOCAL_RANK": "0",`
			`"SLURM_LOCALID": "0",`
			`},`
			`)`
			`@mock.patch("torch.cuda.device_count", return_value=2)`
			`@pytest.mark.parametrize(`
			`["ddp_backend", "gpus", "num_processes"],`
			`[("ddp_cpu", None, None), ("ddp", 2, 0), ("ddp2", 2, 0), ("ddp_spawn", 2, 0)],`
			`)`
enable ddp as a plugin (#4285) * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin Co-authored-by: chaton <thomas@grid.ai> 2020-10-22 09:15:51 +00:00			`def test_ddp_choice_custom_ddp_cpu(tmpdir, ddp_backend, gpus, num_processes):`
			`class MyDDP(DDPPlugin):`
			`pass`

			`class CB(Callback):`
			`def on_fit_start(self, trainer, pl_module):`
			`assert isinstance(trainer.accelerator_backend.ddp_plugin, MyDDP)`
			`raise SystemExit()`

			`model = BoringModel()`
			`trainer = Trainer(`
			`fast_dev_run=True,`
			`gpus=gpus,`
			`num_processes=num_processes,`
			`distributed_backend=ddp_backend,`
			`plugins=[MyDDP()],`
Enable DDP Plugin to pass through args to LightningDistributedDataParallel (#4382) * Update ddp_plugin.py * Update ddp_plugin.py * Update ddp_plugin.py * Update test_ddp_plugin.py * Update pytorch_lightning/plugins/ddp_plugin.py * Update pytorch_lightning/plugins/ddp_plugin.py * Fixed imports, make ddp_kwargs protected Co-authored-by: SeanNaren <sean.narenthiran@gmail.com> 2020-10-27 12:27:59 +00:00			`callbacks=[CB()],`
			`)`

			`with pytest.raises(SystemExit):`
			`trainer.fit(model)`


			`@mock.patch.dict(`
			`os.environ,`
			`{`
			`"CUDA_VISIBLE_DEVICES": "0,1",`
			`"SLURM_NTASKS": "2",`
			`"SLURM_JOB_NAME": "SOME_NAME",`
			`"SLURM_NODEID": "0",`
			`"LOCAL_RANK": "0",`
			`"SLURM_LOCALID": "0",`
			`},`
			`)`
			`@mock.patch("torch.cuda.device_count", return_value=2)`
			`@pytest.mark.parametrize(`
			`["ddp_backend", "gpus", "num_processes"],`
			`[("ddp_cpu", None, None), ("ddp", 2, 0), ("ddp2", 2, 0), ("ddp_spawn", 2, 0)],`
			`)`
			`def test_ddp_choice_custom_ddp_cpu_custom_args(`
			`tmpdir, ddp_backend, gpus, num_processes`
			`):`
			`class MyDDP(DDPPlugin):`
			`pass`

			`class CB(Callback):`
			`def on_fit_start(self, trainer, pl_module):`
			`assert isinstance(trainer.accelerator_backend.ddp_plugin, MyDDP)`
			`raise SystemExit()`

			`model = BoringModel()`
			`trainer = Trainer(`
			`fast_dev_run=True,`
			`gpus=gpus,`
			`num_processes=num_processes,`
			`distributed_backend=ddp_backend,`
			`plugins=[MyDDP(broadcast_buffers=False, find_unused_parameters=True)],`
			`callbacks=[CB()],`
enable ddp as a plugin (#4285) * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin * enable custom ddp plugin Co-authored-by: chaton <thomas@grid.ai> 2020-10-22 09:15:51 +00:00			`)`

			`with pytest.raises(SystemExit):`
			`trainer.fit(model)`