2021-10-29 21:46:39 +00:00
|
|
|
# Copyright The Lightning AI team.
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
2023-01-09 14:01:11 +00:00
|
|
|
from unittest import mock
|
ruff: replace isort with ruff +TPU (#17684)
* ruff: replace isort with ruff
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* fixing & imports
* lines in warning test
* docs
* fix enum import
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* fixing
* import
* fix lines
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* type ClusterEnvironment
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
---------
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
2023-09-26 15:54:55 +00:00
|
|
|
from unittest.mock import Mock, call
|
2021-10-29 21:46:39 +00:00
|
|
|
|
|
|
|
import pytest
|
|
|
|
import torch
|
2023-02-01 20:34:38 +00:00
|
|
|
from lightning.fabric.fabric import Fabric
|
2023-04-24 11:50:59 +00:00
|
|
|
from lightning.fabric.plugins import Precision
|
2023-02-01 20:34:38 +00:00
|
|
|
from lightning.fabric.utilities.device_dtype_mixin import _DeviceDtypeModuleMixin
|
2023-10-03 17:49:39 +00:00
|
|
|
from lightning.fabric.utilities.imports import _TORCH_GREATER_EQUAL_2_1
|
2023-05-11 17:02:30 +00:00
|
|
|
from lightning.fabric.wrappers import (
|
|
|
|
_FabricDataLoader,
|
|
|
|
_FabricModule,
|
|
|
|
_FabricOptimizer,
|
2024-01-24 02:17:41 +00:00
|
|
|
_unwrap_compiled,
|
2023-05-11 17:02:30 +00:00
|
|
|
_unwrap_objects,
|
|
|
|
is_wrapped,
|
|
|
|
)
|
ruff: replace isort with ruff +TPU (#17684)
* ruff: replace isort with ruff
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* fixing & imports
* lines in warning test
* docs
* fix enum import
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* fixing
* import
* fix lines
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* type ClusterEnvironment
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
---------
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
2023-09-26 15:54:55 +00:00
|
|
|
from torch.utils.data import BatchSampler, DistributedSampler
|
|
|
|
from torch.utils.data.dataloader import DataLoader
|
|
|
|
|
2023-03-03 16:55:48 +00:00
|
|
|
from tests_fabric.helpers.runif import RunIf
|
2021-10-29 21:46:39 +00:00
|
|
|
|
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
def test_fabric_module_wraps():
|
2021-10-29 21:46:39 +00:00
|
|
|
"""Test that the wrapped module is accessible via the property."""
|
|
|
|
module = Mock()
|
2023-01-04 15:57:18 +00:00
|
|
|
assert _FabricModule(module, Mock()).module is module
|
2021-10-29 21:46:39 +00:00
|
|
|
|
2022-05-11 18:28:08 +00:00
|
|
|
wrapped_module = Mock()
|
|
|
|
original_module = Mock()
|
2023-01-04 15:57:18 +00:00
|
|
|
assert _FabricModule(wrapped_module, Mock(), original_module=original_module).module is original_module
|
2022-05-11 18:28:08 +00:00
|
|
|
|
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
def test_fabric_module_attribute_lookup():
|
2022-09-14 23:29:23 +00:00
|
|
|
"""Test that attribute lookup passes through to the original module when possible."""
|
2022-05-11 18:28:08 +00:00
|
|
|
|
|
|
|
class OriginalModule(torch.nn.Module):
|
|
|
|
def __init__(self):
|
|
|
|
super().__init__()
|
|
|
|
self.layer = torch.nn.Linear(2, 3)
|
|
|
|
self.attribute = 1
|
|
|
|
|
|
|
|
def method(self):
|
|
|
|
return 2
|
|
|
|
|
|
|
|
original_module = OriginalModule()
|
|
|
|
|
|
|
|
class ModuleWrapper(torch.nn.Module):
|
|
|
|
def __init__(self):
|
|
|
|
super().__init__()
|
|
|
|
self.wrapped = original_module
|
|
|
|
|
|
|
|
wrapped_module = ModuleWrapper()
|
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_module = _FabricModule(wrapped_module, Mock(), original_module=original_module)
|
|
|
|
assert fabric_module.attribute == 1
|
|
|
|
assert fabric_module.layer is original_module.layer
|
|
|
|
assert fabric_module.forward.__self__.__class__ == _FabricModule
|
2022-05-11 18:28:08 +00:00
|
|
|
|
|
|
|
with pytest.raises(AttributeError):
|
2023-01-10 15:02:05 +00:00
|
|
|
_ = fabric_module.not_exists
|
2022-05-11 18:28:08 +00:00
|
|
|
|
2021-10-29 21:46:39 +00:00
|
|
|
|
2023-04-21 19:29:32 +00:00
|
|
|
def test_fabric_module_method_lookup():
|
|
|
|
"""Test that access to methods warns about improper use when a wrapper from a strategy is involved."""
|
|
|
|
|
|
|
|
class OriginalModule(torch.nn.Module):
|
2023-10-23 02:26:28 +00:00
|
|
|
def __init__(self):
|
|
|
|
super().__init__()
|
|
|
|
self.submodule = torch.nn.Linear(2, 3)
|
|
|
|
|
|
|
|
def forward(self, x):
|
|
|
|
return x
|
|
|
|
|
|
|
|
def method_without_module_invocation(self):
|
2023-04-21 19:29:32 +00:00
|
|
|
return 100
|
|
|
|
|
2023-10-23 02:26:28 +00:00
|
|
|
def method_with_submodule_invocation(self):
|
|
|
|
self.submodule(torch.rand(2, 2))
|
2023-06-26 15:35:27 +00:00
|
|
|
return 101
|
|
|
|
|
2023-10-23 02:26:28 +00:00
|
|
|
def method_with_self_invocation(self):
|
|
|
|
self(None)
|
|
|
|
return 102
|
|
|
|
|
2023-04-21 19:29:32 +00:00
|
|
|
class ModuleWrapper(torch.nn.Module):
|
|
|
|
def __init__(self, module):
|
|
|
|
super().__init__()
|
|
|
|
self.wrapped = module
|
|
|
|
|
|
|
|
# Regular case: forward_module == original_module -> no warnings
|
|
|
|
original_module = OriginalModule()
|
|
|
|
fabric_module = _FabricModule(forward_module=original_module, precision=Mock(), original_module=original_module)
|
2023-10-23 02:26:28 +00:00
|
|
|
assert fabric_module.method_without_module_invocation() == 100
|
2023-04-21 19:29:32 +00:00
|
|
|
|
2023-06-26 15:35:27 +00:00
|
|
|
# Special case: original module wrapped by forward module: -> warn if method accepts args
|
2023-04-21 19:29:32 +00:00
|
|
|
original_module = OriginalModule()
|
|
|
|
wrapped_module = ModuleWrapper(original_module)
|
|
|
|
fabric_module = _FabricModule(forward_module=wrapped_module, precision=Mock(), original_module=original_module)
|
2023-10-23 02:26:28 +00:00
|
|
|
assert fabric_module.method_without_module_invocation() == 100
|
|
|
|
with pytest.raises(
|
|
|
|
RuntimeError, match=r"You are calling the method `OriginalModule.method_with_submodule_invocation\(\)` from"
|
|
|
|
):
|
|
|
|
assert fabric_module.method_with_submodule_invocation() == 101
|
|
|
|
with pytest.raises(
|
|
|
|
RuntimeError, match=r"You are calling the method `OriginalModule.method_with_self_invocation\(\)` from"
|
|
|
|
):
|
|
|
|
assert fabric_module.method_with_self_invocation() == 102
|
2023-04-21 19:29:32 +00:00
|
|
|
|
|
|
|
|
2023-06-12 19:33:51 +00:00
|
|
|
def test_fabric_module_setattr():
|
|
|
|
"""Test that setattr sets attributes on the original module."""
|
|
|
|
|
|
|
|
class OriginalModule(torch.nn.Module):
|
|
|
|
def __init__(self):
|
|
|
|
super().__init__()
|
|
|
|
self.layer = torch.nn.Linear(2, 3)
|
|
|
|
self.attribute = 1
|
|
|
|
self._x = None
|
|
|
|
|
|
|
|
@property
|
|
|
|
def x(self):
|
|
|
|
return self._x
|
|
|
|
|
|
|
|
@x.setter
|
|
|
|
def x(self, value):
|
|
|
|
self._x = value
|
|
|
|
|
|
|
|
original_module = OriginalModule()
|
|
|
|
|
|
|
|
class ModuleWrapper(torch.nn.Module):
|
|
|
|
def __init__(self):
|
|
|
|
super().__init__()
|
|
|
|
self.wrapped = original_module
|
|
|
|
|
|
|
|
wrapped_module = ModuleWrapper()
|
|
|
|
fabric_module = _FabricModule(wrapped_module, Mock(), original_module=original_module)
|
|
|
|
|
|
|
|
# Check new attribute is set on original_module
|
|
|
|
fabric_module.new_attribute = 100
|
|
|
|
assert original_module.new_attribute == 100
|
|
|
|
|
|
|
|
# Modify existing attribute on original_module
|
|
|
|
fabric_module.attribute = 101
|
|
|
|
assert original_module.attribute == 101
|
|
|
|
|
|
|
|
# Check setattr of original_module
|
|
|
|
fabric_module.x = 102
|
|
|
|
assert original_module.x == 102
|
|
|
|
|
|
|
|
# Check set submodule
|
|
|
|
assert not hasattr(original_module, "linear")
|
|
|
|
linear = torch.nn.Linear(2, 2)
|
|
|
|
fabric_module.linear = linear
|
|
|
|
assert hasattr(original_module, "linear")
|
|
|
|
assert isinstance(original_module.linear, torch.nn.Module)
|
|
|
|
assert linear in fabric_module.modules()
|
|
|
|
assert linear in original_module.modules()
|
|
|
|
|
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
def test_fabric_module_state_dict_access():
|
2022-09-14 23:29:23 +00:00
|
|
|
"""Test that state_dict access passes through to the original module."""
|
|
|
|
|
|
|
|
class OriginalModule(torch.nn.Module):
|
|
|
|
def __init__(self):
|
|
|
|
super().__init__()
|
|
|
|
self.layer = torch.nn.Linear(2, 3)
|
|
|
|
|
|
|
|
original_module = OriginalModule()
|
|
|
|
|
|
|
|
class ModuleWrapper(torch.nn.Module):
|
|
|
|
def __init__(self):
|
|
|
|
super().__init__()
|
|
|
|
self.wrapped = original_module
|
|
|
|
|
|
|
|
wrapped_module = ModuleWrapper()
|
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_module = _FabricModule(wrapped_module, Mock(), original_module=original_module)
|
|
|
|
state_dict = fabric_module.state_dict()
|
2022-09-14 23:29:23 +00:00
|
|
|
assert set(state_dict.keys()) == {"layer.weight", "layer.bias"}
|
|
|
|
|
|
|
|
weight, bias = torch.rand(3, 2), torch.rand(3)
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_module.load_state_dict({"layer.weight": weight, "layer.bias": bias})
|
|
|
|
assert torch.equal(fabric_module.layer.weight, weight)
|
|
|
|
assert torch.equal(fabric_module.layer.bias, bias)
|
2022-09-14 23:29:23 +00:00
|
|
|
|
2023-10-03 17:49:39 +00:00
|
|
|
if _TORCH_GREATER_EQUAL_2_1:
|
|
|
|
# Can use additional `assign` argument in PyTorch >= 2.1
|
|
|
|
with torch.device("meta"):
|
|
|
|
original_module = OriginalModule()
|
|
|
|
fabric_module = _FabricModule(wrapped_module, Mock(), original_module=original_module)
|
|
|
|
assert fabric_module.layer.weight.is_meta
|
|
|
|
fabric_module.load_state_dict({"layer.weight": weight, "layer.bias": bias}, assign=True)
|
|
|
|
assert not fabric_module.layer.weight.is_meta
|
|
|
|
|
2022-09-14 23:29:23 +00:00
|
|
|
|
2021-10-29 21:46:39 +00:00
|
|
|
@pytest.mark.parametrize(
|
2023-05-04 15:50:39 +00:00
|
|
|
("precision", "input_type", "expected_type", "accelerator", "device_str"),
|
2021-10-29 21:46:39 +00:00
|
|
|
[
|
2023-03-02 23:41:37 +00:00
|
|
|
pytest.param(32, torch.float16, torch.float16, "gpu", "cuda:0", marks=RunIf(min_cuda_gpus=1)),
|
2022-06-24 12:15:48 +00:00
|
|
|
pytest.param(32, torch.float32, torch.float32, "gpu", "cuda:0", marks=RunIf(min_cuda_gpus=1)),
|
2023-03-02 23:41:37 +00:00
|
|
|
pytest.param(32, torch.float64, torch.float64, "gpu", "cuda:0", marks=RunIf(min_cuda_gpus=1)),
|
2022-06-24 12:15:48 +00:00
|
|
|
pytest.param(32, torch.int, torch.int, "gpu", "cuda:0", marks=RunIf(min_cuda_gpus=1)),
|
|
|
|
pytest.param(16, torch.float32, torch.float16, "gpu", "cuda:0", marks=RunIf(min_cuda_gpus=1)),
|
|
|
|
pytest.param(16, torch.float64, torch.float16, "gpu", "cuda:0", marks=RunIf(min_cuda_gpus=1)),
|
|
|
|
pytest.param(16, torch.long, torch.long, "gpu", "cuda:0", marks=RunIf(min_cuda_gpus=1)),
|
|
|
|
pytest.param(
|
|
|
|
"bf16",
|
|
|
|
torch.float32,
|
|
|
|
torch.bfloat16,
|
|
|
|
"gpu",
|
|
|
|
"cuda:0",
|
2022-11-10 13:59:13 +00:00
|
|
|
marks=RunIf(min_cuda_gpus=1, bf16_cuda=True),
|
2022-06-24 12:15:48 +00:00
|
|
|
),
|
|
|
|
pytest.param(
|
|
|
|
"bf16",
|
|
|
|
torch.float64,
|
|
|
|
torch.bfloat16,
|
|
|
|
"gpu",
|
|
|
|
"cuda:0",
|
2022-11-10 13:59:13 +00:00
|
|
|
marks=RunIf(min_cuda_gpus=1, bf16_cuda=True),
|
2022-06-24 12:15:48 +00:00
|
|
|
),
|
|
|
|
pytest.param(
|
|
|
|
"bf16",
|
|
|
|
torch.bool,
|
|
|
|
torch.bool,
|
|
|
|
"gpu",
|
|
|
|
"cuda:0",
|
2022-11-10 13:59:13 +00:00
|
|
|
marks=RunIf(min_cuda_gpus=1, bf16_cuda=True),
|
2022-06-24 12:15:48 +00:00
|
|
|
),
|
|
|
|
pytest.param(32, torch.float32, torch.float32, "mps", "mps:0", marks=RunIf(mps=True)),
|
2021-10-29 21:46:39 +00:00
|
|
|
],
|
|
|
|
)
|
2023-01-10 15:02:05 +00:00
|
|
|
def test_fabric_module_forward_conversion(precision, input_type, expected_type, accelerator, device_str):
|
2023-01-04 15:57:18 +00:00
|
|
|
"""Test that the FabricModule performs autocasting on the input tensors and during forward()."""
|
2023-03-07 15:57:31 +00:00
|
|
|
fabric = Fabric(precision=precision, accelerator=accelerator, devices=1)
|
2022-06-24 12:15:48 +00:00
|
|
|
device = torch.device(device_str)
|
2021-10-29 21:46:39 +00:00
|
|
|
|
|
|
|
def check_autocast(forward_input):
|
|
|
|
assert precision != 16 or torch.is_autocast_enabled()
|
|
|
|
return forward_input
|
|
|
|
|
2021-11-09 14:21:00 +00:00
|
|
|
module = Mock(wraps=torch.nn.Identity(), side_effect=check_autocast)
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_module = _FabricModule(module, fabric._precision).to(device)
|
|
|
|
out = fabric_module(torch.tensor([1, 2, 3], dtype=input_type, device=device))
|
2021-10-29 21:46:39 +00:00
|
|
|
assert module.call_args[0][0].dtype == expected_type
|
2021-11-09 14:21:00 +00:00
|
|
|
assert out.dtype == input_type or out.dtype == torch.get_default_dtype()
|
2021-10-29 21:46:39 +00:00
|
|
|
|
|
|
|
|
2021-11-16 17:26:46 +00:00
|
|
|
@pytest.mark.parametrize(
|
2022-06-24 12:15:48 +00:00
|
|
|
"device_str",
|
|
|
|
[
|
|
|
|
"cpu",
|
|
|
|
pytest.param("cuda:0", marks=RunIf(min_cuda_gpus=1)),
|
|
|
|
pytest.param("mps", marks=RunIf(mps=True)),
|
|
|
|
],
|
2021-11-16 17:26:46 +00:00
|
|
|
)
|
|
|
|
@pytest.mark.parametrize("dtype", [torch.float32, torch.float16])
|
2023-01-10 15:02:05 +00:00
|
|
|
def test_fabric_module_device_dtype_propagation(device_str, dtype):
|
2023-01-04 15:57:18 +00:00
|
|
|
"""Test that the FabricModule propagates device and dtype properties to its submodules (e.g. torchmetrics)."""
|
2022-06-24 12:15:48 +00:00
|
|
|
device = torch.device(device_str)
|
|
|
|
|
2022-09-06 12:17:15 +00:00
|
|
|
class DeviceModule(_DeviceDtypeModuleMixin):
|
2021-11-16 17:26:46 +00:00
|
|
|
pass
|
|
|
|
|
|
|
|
device_module = DeviceModule()
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_module = _FabricModule(device_module, Mock())
|
|
|
|
fabric_module.to(device)
|
2021-11-16 17:26:46 +00:00
|
|
|
assert device_module.device == device
|
2023-01-10 15:02:05 +00:00
|
|
|
assert fabric_module.device == device
|
2021-11-16 17:26:46 +00:00
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_module.to(dtype)
|
2021-11-16 17:26:46 +00:00
|
|
|
assert device_module.dtype == dtype
|
2023-01-10 15:02:05 +00:00
|
|
|
assert fabric_module.dtype == dtype
|
2021-11-16 17:26:46 +00:00
|
|
|
|
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
def test_fabric_dataloader_iterator():
|
2023-08-09 14:44:20 +00:00
|
|
|
"""Test that the iteration over a FabricDataLoader wraps the iterator of the underlying dataloader (no automatic
|
|
|
|
device placement)."""
|
2021-11-02 10:40:35 +00:00
|
|
|
dataloader = DataLoader(range(5), batch_size=2)
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_dataloader = _FabricDataLoader(dataloader)
|
|
|
|
assert len(fabric_dataloader) == len(dataloader) == 3
|
2021-11-02 10:40:35 +00:00
|
|
|
|
|
|
|
iterator = iter(dataloader)
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_iterator = iter(fabric_dataloader)
|
2021-11-02 10:40:35 +00:00
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
assert torch.equal(next(iterator), next(fabric_iterator))
|
|
|
|
assert torch.equal(next(iterator), next(fabric_iterator))
|
|
|
|
assert torch.equal(next(iterator), next(fabric_iterator))
|
2021-11-02 10:40:35 +00:00
|
|
|
|
|
|
|
with pytest.raises(StopIteration):
|
|
|
|
next(iterator)
|
|
|
|
|
|
|
|
with pytest.raises(StopIteration):
|
2023-01-10 15:02:05 +00:00
|
|
|
next(fabric_iterator)
|
2021-11-02 10:40:35 +00:00
|
|
|
|
|
|
|
|
2021-10-29 21:46:39 +00:00
|
|
|
@pytest.mark.parametrize(
|
2023-05-04 15:50:39 +00:00
|
|
|
("src_device_str", "dest_device_str"),
|
2021-10-29 21:46:39 +00:00
|
|
|
[
|
2022-06-24 12:15:48 +00:00
|
|
|
("cpu", "cpu"),
|
|
|
|
pytest.param("cpu", "cuda:0", marks=RunIf(min_cuda_gpus=1)),
|
|
|
|
pytest.param("cuda:0", "cpu", marks=RunIf(min_cuda_gpus=1)),
|
2023-10-04 18:30:44 +00:00
|
|
|
pytest.param("cpu", "mps", marks=RunIf(mps=True)),
|
2022-06-24 12:15:48 +00:00
|
|
|
pytest.param("mps", "cpu", marks=RunIf(mps=True)),
|
2021-10-29 21:46:39 +00:00
|
|
|
],
|
|
|
|
)
|
2023-01-10 15:02:05 +00:00
|
|
|
def test_fabric_dataloader_device_placement(src_device_str, dest_device_str):
|
2023-01-04 15:57:18 +00:00
|
|
|
"""Test that the FabricDataLoader moves data to the device in its iterator."""
|
2022-06-24 12:15:48 +00:00
|
|
|
src_device = torch.device(src_device_str)
|
|
|
|
dest_device = torch.device(dest_device_str)
|
|
|
|
|
2021-10-29 21:46:39 +00:00
|
|
|
sample0 = torch.tensor(0, device=src_device)
|
|
|
|
sample1 = torch.tensor(1, device=src_device)
|
|
|
|
sample2 = {"data": torch.tensor(2, device=src_device)}
|
|
|
|
sample3 = {"data": torch.tensor(3, device=src_device)}
|
2021-11-01 18:33:13 +00:00
|
|
|
dataloader = DataLoader([sample0, sample1, sample2, sample3], batch_size=2)
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_dataloader = _FabricDataLoader(dataloader=dataloader, device=dest_device)
|
|
|
|
iterator = iter(fabric_dataloader)
|
2021-10-29 21:46:39 +00:00
|
|
|
|
|
|
|
batch0 = next(iterator)
|
2022-09-16 19:21:36 +00:00
|
|
|
assert torch.equal(batch0, torch.tensor([0, 1], device=dest_device))
|
2021-10-29 21:46:39 +00:00
|
|
|
|
|
|
|
batch1 = next(iterator)
|
2022-09-16 19:21:36 +00:00
|
|
|
assert torch.equal(batch1["data"], torch.tensor([2, 3], device=dest_device))
|
2021-10-29 21:46:39 +00:00
|
|
|
|
|
|
|
|
2023-05-05 06:25:15 +00:00
|
|
|
@pytest.mark.parametrize("use_batch_sampler", [False, True])
|
2023-02-23 00:11:29 +00:00
|
|
|
def test_fabric_dataloader_distributed_sampler_set_epoch(use_batch_sampler):
|
2023-01-10 15:02:05 +00:00
|
|
|
"""Test that the FabricDataLoader calls `set_epoch()` on the wrapped sampler if applicable."""
|
2023-02-23 00:11:29 +00:00
|
|
|
dataset = range(3)
|
|
|
|
sampler = DistributedSampler(dataset, num_replicas=2, rank=0)
|
2022-12-19 21:57:15 +00:00
|
|
|
sampler.set_epoch = Mock()
|
2023-02-23 00:11:29 +00:00
|
|
|
|
|
|
|
if not use_batch_sampler:
|
|
|
|
dataloader = DataLoader(dataset, sampler=sampler)
|
|
|
|
else:
|
|
|
|
batch_sampler = BatchSampler(sampler, batch_size=1, drop_last=False)
|
|
|
|
dataloader = DataLoader(dataset, batch_sampler=batch_sampler)
|
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_dataloader = _FabricDataLoader(dataloader)
|
|
|
|
iterator_epoch_0 = iter(fabric_dataloader)
|
2023-02-23 00:11:29 +00:00
|
|
|
sampler.set_epoch.assert_not_called()
|
|
|
|
|
2022-12-19 21:57:15 +00:00
|
|
|
next(iterator_epoch_0)
|
|
|
|
# .set_epoch() gets called before the first sample gets fetched from the wrapped dataloader
|
2023-02-23 00:11:29 +00:00
|
|
|
assert sampler.set_epoch.mock_calls == [call(0)]
|
|
|
|
|
2022-12-19 21:57:15 +00:00
|
|
|
next(iterator_epoch_0)
|
2023-02-23 00:11:29 +00:00
|
|
|
assert sampler.set_epoch.mock_calls == [call(0)]
|
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
iterator_epoch_1 = iter(fabric_dataloader)
|
2023-02-23 00:11:29 +00:00
|
|
|
assert sampler.set_epoch.mock_calls == [call(0)]
|
|
|
|
|
2022-12-19 21:57:15 +00:00
|
|
|
next(iterator_epoch_1)
|
|
|
|
# with every new iterator call, the epoch increases
|
2023-02-23 00:11:29 +00:00
|
|
|
assert sampler.set_epoch.mock_calls == [call(0), call(1)]
|
2022-12-19 21:57:15 +00:00
|
|
|
|
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
def test_fabric_optimizer_wraps():
|
2023-01-04 15:57:18 +00:00
|
|
|
"""Test that the FabricOptimizer fully wraps the optimizer."""
|
2021-10-29 21:46:39 +00:00
|
|
|
optimizer_cls = torch.optim.SGD
|
|
|
|
optimizer = Mock(spec=optimizer_cls)
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_optimizer = _FabricOptimizer(optimizer, Mock())
|
|
|
|
assert fabric_optimizer.optimizer is optimizer
|
|
|
|
assert isinstance(fabric_optimizer, optimizer_cls)
|
2023-09-12 07:30:44 +00:00
|
|
|
assert isinstance(fabric_optimizer, _FabricOptimizer)
|
|
|
|
assert type(fabric_optimizer).__name__ == "FabricSGD"
|
2021-10-29 21:46:39 +00:00
|
|
|
|
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
def test_fabric_optimizer_state_dict():
|
2023-01-04 15:57:18 +00:00
|
|
|
"""Test that the FabricOptimizer calls into the strategy to collect the state."""
|
2023-09-06 15:51:42 +00:00
|
|
|
optimizer = Mock(spec=torch.optim.Adam)
|
2021-11-30 14:16:59 +00:00
|
|
|
strategy = Mock()
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_optimizer = _FabricOptimizer(optimizer=optimizer, strategy=strategy)
|
|
|
|
fabric_optimizer.state_dict()
|
2022-09-16 17:25:27 +00:00
|
|
|
strategy.get_optimizer_state.assert_called_with(optimizer)
|
2021-11-27 04:54:45 +00:00
|
|
|
|
|
|
|
|
2023-09-06 15:51:42 +00:00
|
|
|
def test_fabric_optimizer_load_state_dict():
|
2023-10-03 20:07:21 +00:00
|
|
|
"""Test that the FabricOptimizer can load the state dict on the wrapped optimizer and update its internal
|
|
|
|
`__dict__`."""
|
2023-09-06 15:51:42 +00:00
|
|
|
model = torch.nn.Linear(1, 1)
|
|
|
|
optimizer = torch.optim.Adam(model.parameters())
|
|
|
|
assert not optimizer.state # a fresh optimizer has no state
|
|
|
|
model(torch.rand(1)).backward()
|
|
|
|
optimizer.step()
|
|
|
|
assert optimizer.state
|
|
|
|
state_dict = optimizer.state_dict()
|
|
|
|
|
|
|
|
optimizer = torch.optim.Adam(model.parameters()) # fresh optimizer
|
|
|
|
fabric_optimizer = _FabricOptimizer(optimizer=optimizer, strategy=Mock())
|
|
|
|
assert not fabric_optimizer.state # a fresh optimizer has no state
|
|
|
|
fabric_optimizer.load_state_dict(state_dict)
|
|
|
|
assert fabric_optimizer.state
|
|
|
|
assert fabric_optimizer.optimizer.state_dict()["state"] == state_dict["state"]
|
|
|
|
|
|
|
|
|
2023-01-10 15:02:05 +00:00
|
|
|
def test_fabric_optimizer_steps():
|
2023-01-04 15:57:18 +00:00
|
|
|
"""Test that the FabricOptimizer forwards the step() and zero_grad() calls to the wrapped optimizer."""
|
2023-09-06 15:51:42 +00:00
|
|
|
optimizer = Mock(spec=torch.optim.Adam)
|
2022-09-21 17:28:45 +00:00
|
|
|
strategy = Mock(spec=["optimizer_step"])
|
2022-02-09 09:37:13 +00:00
|
|
|
strategy.optimizer_step.return_value = 123
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_optimizer = _FabricOptimizer(optimizer=optimizer, strategy=strategy)
|
|
|
|
step_output = fabric_optimizer.step()
|
2022-02-09 09:37:13 +00:00
|
|
|
assert step_output == 123
|
2022-09-21 17:28:45 +00:00
|
|
|
strategy.optimizer_step.assert_called_once_with(optimizer)
|
2022-09-16 17:25:27 +00:00
|
|
|
|
2022-09-21 17:28:45 +00:00
|
|
|
strategy.reset_mock()
|
2022-09-16 17:25:27 +00:00
|
|
|
|
|
|
|
# with closure as input
|
|
|
|
closure = Mock()
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_optimizer.step(closure=closure)
|
2022-09-21 17:28:45 +00:00
|
|
|
strategy.optimizer_step.assert_called_once_with(optimizer, closure=closure)
|
|
|
|
|
|
|
|
# with model as optimizer
|
|
|
|
strategy = Mock(spec=["optimizer_step", "model"])
|
2023-01-10 15:02:05 +00:00
|
|
|
fabric_optimizer = _FabricOptimizer(optimizer=optimizer, strategy=strategy)
|
|
|
|
fabric_optimizer.step()
|
2022-09-21 17:28:45 +00:00
|
|
|
strategy.optimizer_step.assert_called_once_with(strategy.model)
|
2023-01-09 14:01:11 +00:00
|
|
|
|
|
|
|
|
|
|
|
def test_fabric_optimizer_zero_grad_kwargs():
|
|
|
|
"""Test that Fabric can adapt the `.zero_grad()` arguments to the underlying optimizer."""
|
|
|
|
# Test PyTorch's standard `.zero_grad()` signature
|
|
|
|
with mock.patch("torch.optim.SGD.zero_grad") as zero_grad_mock:
|
|
|
|
optimizer = torch.optim.SGD(torch.nn.Linear(1, 1).parameters(), 0.1)
|
|
|
|
fabric_optimizer = _FabricOptimizer(optimizer=optimizer, strategy=Mock())
|
|
|
|
fabric_optimizer.zero_grad()
|
|
|
|
zero_grad_mock.assert_called_with()
|
|
|
|
fabric_optimizer.zero_grad(set_to_none=False)
|
|
|
|
zero_grad_mock.assert_called_with(set_to_none=False)
|
|
|
|
fabric_optimizer.zero_grad(set_to_none=True)
|
|
|
|
zero_grad_mock.assert_called_with(set_to_none=True)
|
|
|
|
|
|
|
|
# Test weird `.zero_grad()` signatures from other libraries
|
|
|
|
custom_zero_grad = Mock()
|
|
|
|
|
|
|
|
class CustomSGD(torch.optim.SGD):
|
|
|
|
def zero_grad(self, set_grads_to_None=False):
|
|
|
|
custom_zero_grad(set_grads_to_None=set_grads_to_None)
|
|
|
|
|
|
|
|
optimizer = CustomSGD(torch.nn.Linear(1, 1).parameters(), 0.1)
|
|
|
|
fabric_optimizer = _FabricOptimizer(optimizer=optimizer, strategy=Mock())
|
|
|
|
fabric_optimizer.zero_grad()
|
|
|
|
custom_zero_grad.assert_called_with(set_grads_to_None=False)
|
2023-03-14 13:03:38 +00:00
|
|
|
|
|
|
|
|
2023-05-03 07:00:11 +00:00
|
|
|
@pytest.mark.parametrize("compile", [False, pytest.param(True, marks=RunIf(dynamo=True))])
|
|
|
|
def test_is_wrapped(compile):
|
2023-03-14 13:03:38 +00:00
|
|
|
"""Test that the `is_wrapped` utility recognizes when an object was wrapped by Fabric."""
|
|
|
|
assert not is_wrapped(None)
|
|
|
|
|
|
|
|
# _FabricModule
|
|
|
|
module = torch.nn.Linear(2, 2)
|
|
|
|
assert not is_wrapped(module)
|
|
|
|
wrapped = _FabricModule(module, Mock())
|
|
|
|
assert is_wrapped(wrapped)
|
|
|
|
|
2023-05-03 07:00:11 +00:00
|
|
|
# _FabricModule inside an OptimizedModule
|
|
|
|
if compile:
|
|
|
|
from torch._dynamo import OptimizedModule
|
|
|
|
|
|
|
|
module = torch.nn.Linear(2, 2)
|
|
|
|
wrapped = torch.compile(_FabricModule(module, Mock()))
|
|
|
|
assert isinstance(wrapped, OptimizedModule)
|
|
|
|
assert is_wrapped(wrapped)
|
|
|
|
|
2023-03-14 13:03:38 +00:00
|
|
|
# _FabricOptimizer
|
|
|
|
optimizer = torch.optim.Adam(module.parameters())
|
|
|
|
assert not is_wrapped(optimizer)
|
|
|
|
wrapped = _FabricOptimizer(optimizer, Mock())
|
|
|
|
assert is_wrapped(wrapped)
|
|
|
|
|
|
|
|
# _FabricDataLoader
|
|
|
|
dataloader = DataLoader([1, 2, 3])
|
|
|
|
assert not is_wrapped(dataloader)
|
|
|
|
wrapped = _FabricDataLoader(dataloader)
|
|
|
|
assert is_wrapped(wrapped)
|
2023-04-21 19:29:32 +00:00
|
|
|
|
|
|
|
|
2023-05-03 07:00:11 +00:00
|
|
|
@pytest.mark.parametrize("compile", [False, pytest.param(True, marks=RunIf(dynamo=True))])
|
|
|
|
def test_unwrap_objects(compile):
|
|
|
|
# empty container
|
|
|
|
assert _unwrap_objects({}) == {}
|
|
|
|
|
|
|
|
# container with pure objects and wrapped objects
|
|
|
|
module = torch.nn.Linear(1, 1)
|
|
|
|
wrapped_module = _FabricModule(module, Mock())
|
|
|
|
if compile:
|
|
|
|
wrapped_module = torch.compile(wrapped_module)
|
|
|
|
optimizer = torch.optim.Adam(module.parameters())
|
|
|
|
wrapped_optimizer = _FabricOptimizer(optimizer, Mock())
|
|
|
|
dataloader = DataLoader([1, 2, 3])
|
|
|
|
wrapped_dataloader = _FabricDataLoader(dataloader)
|
|
|
|
container = {
|
|
|
|
"int": 1,
|
|
|
|
"module": module,
|
|
|
|
"wrapped_module": wrapped_module,
|
|
|
|
"optimizer": optimizer,
|
|
|
|
"wrapped_optimizer": wrapped_optimizer,
|
|
|
|
"dataloader": dataloader,
|
|
|
|
"wrapped_dataloader": wrapped_dataloader,
|
|
|
|
"nested": [module, wrapped_module, optimizer, wrapped_optimizer, dataloader, wrapped_dataloader],
|
|
|
|
}
|
|
|
|
expected = {
|
|
|
|
"int": 1,
|
|
|
|
"module": module,
|
|
|
|
"wrapped_module": wrapped_module._forward_module,
|
|
|
|
"optimizer": optimizer,
|
|
|
|
"wrapped_optimizer": optimizer,
|
|
|
|
"dataloader": dataloader,
|
|
|
|
"wrapped_dataloader": dataloader,
|
|
|
|
"nested": [module, wrapped_module._forward_module, optimizer, optimizer, dataloader, dataloader],
|
|
|
|
}
|
|
|
|
assert _unwrap_objects(container) == expected
|
|
|
|
|
|
|
|
|
2023-04-21 19:29:32 +00:00
|
|
|
def test_step_method_redirection():
|
|
|
|
"""Test that the FabricModule redirects the special `LightningModule.*_step` methods through the forward-
|
|
|
|
module."""
|
|
|
|
|
|
|
|
class DDP(torch.nn.Module):
|
|
|
|
def __init__(self, module):
|
|
|
|
super().__init__()
|
|
|
|
self.module = module
|
|
|
|
|
|
|
|
def forward(self, *args, **kwargs):
|
|
|
|
return self.module(*args, **kwargs)
|
|
|
|
|
|
|
|
class LightningModule(torch.nn.Module):
|
|
|
|
def forward(self):
|
|
|
|
return "forward_return"
|
|
|
|
|
|
|
|
def training_step(self, arg, kwarg=None):
|
|
|
|
assert self() == "forward_return"
|
|
|
|
assert arg == "train_arg"
|
|
|
|
assert kwarg == "train_kwarg"
|
|
|
|
return "training_step_return"
|
|
|
|
|
|
|
|
def validation_step(self, arg, kwarg=None):
|
|
|
|
assert self() == "forward_return"
|
|
|
|
assert arg == "val_arg"
|
|
|
|
assert kwarg == "val_kwarg"
|
|
|
|
return "validation_step_return"
|
|
|
|
|
|
|
|
def normal_method(self):
|
|
|
|
pass
|
|
|
|
|
2023-04-24 11:50:59 +00:00
|
|
|
precision = Mock(wraps=Precision())
|
2023-04-21 19:29:32 +00:00
|
|
|
original_module = LightningModule()
|
|
|
|
forward_module = DDP(original_module)
|
2023-04-24 11:50:59 +00:00
|
|
|
fabric_module = _FabricModule(forward_module=forward_module, precision=precision, original_module=original_module)
|
2023-04-21 19:29:32 +00:00
|
|
|
|
|
|
|
# Regular methods on the original_module are visible and identical on the fabric_module ...
|
2023-10-23 02:26:28 +00:00
|
|
|
assert fabric_module.normal_method.__wrapped__ == original_module.normal_method
|
2023-04-21 19:29:32 +00:00
|
|
|
|
|
|
|
# ... but special methods like training_step get redirected to the forward_module
|
|
|
|
assert fabric_module.training_step.__name__ == "call_forward_module"
|
|
|
|
assert fabric_module.validation_step.__name__ == "call_forward_module"
|
|
|
|
assert fabric_module.test_step.__name__ == "call_forward_module"
|
|
|
|
assert fabric_module.predict_step.__name__ == "call_forward_module"
|
|
|
|
|
|
|
|
with pytest.raises(AttributeError, match="has no attribute 'predict_step'"):
|
|
|
|
# A special method that does not exist will raise its AttributeError when being called
|
|
|
|
fabric_module.predict_step()
|
|
|
|
|
|
|
|
# The forward method on the original module remains untouched
|
|
|
|
assert original_module.forward.__name__ == "forward"
|
|
|
|
|
|
|
|
# The special methods get redirected correctly to produce the expected output
|
|
|
|
assert fabric_module.training_step("train_arg", kwarg="train_kwarg") == "training_step_return"
|
|
|
|
assert fabric_module.training_step("train_arg", kwarg="train_kwarg") == "training_step_return" # call 2nd time
|
|
|
|
assert fabric_module.validation_step("val_arg", kwarg="val_kwarg") == "validation_step_return"
|
2023-04-24 11:50:59 +00:00
|
|
|
precision.forward_context.assert_called()
|
2023-04-21 19:29:32 +00:00
|
|
|
|
|
|
|
# The forward method remains untouched/unpatched after the special methods have been called
|
|
|
|
assert original_module.forward.__name__ == "forward"
|
|
|
|
|
|
|
|
# Special case: forward_module == original_module -> no special treatment applied
|
|
|
|
fabric_module = _FabricModule(forward_module=original_module, precision=Mock(), original_module=original_module)
|
|
|
|
assert fabric_module.training_step == original_module.training_step
|
|
|
|
assert fabric_module.validation_step == original_module.validation_step
|
2024-01-24 02:17:41 +00:00
|
|
|
|
|
|
|
|
|
|
|
@RunIf(dynamo=True)
|
|
|
|
def test_unwrap_compiled():
|
|
|
|
model = torch.nn.Linear(1, 1)
|
|
|
|
|
|
|
|
with mock.patch("lightning.fabric.wrappers", "_TORCH_GREATER_EQUAL_2_0", False):
|
|
|
|
unwrapped, compile_kwargs = _unwrap_compiled(model)
|
|
|
|
assert unwrapped is model
|
|
|
|
assert compile_kwargs is None
|
|
|
|
|
|
|
|
compiled = torch.compile(model, fullgraph=True, dynamic=True, disable=False)
|
|
|
|
assert compiled._compile_kwargs == {"fullgraph": True, "dynamic": True, "disable": False}
|
|
|
|
unwrapped, compile_kwargs = _unwrap_compiled(compiled)
|
|
|
|
assert unwrapped is compiled._orig_mod
|
|
|
|
assert compile_kwargs == {"fullgraph": True, "dynamic": True, "disable": False}
|
|
|
|
|
|
|
|
del compiled._compile_kwargs
|
|
|
|
with pytest.raises(RuntimeError, match="Failed to determine the arguments that were used to compile the module"):
|
|
|
|
_unwrap_compiled(compiled)
|