2021-03-01 12:17:09 +00:00
|
|
|
# Copyright The PyTorch Lightning team.
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
2021-03-02 18:57:13 +00:00
|
|
|
import os
|
2021-03-02 09:36:01 +00:00
|
|
|
import sys
|
2021-03-01 12:17:09 +00:00
|
|
|
from typing import Optional
|
|
|
|
|
|
|
|
import pytest
|
|
|
|
import torch
|
2021-04-22 18:25:51 +00:00
|
|
|
from packaging.version import Version
|
2021-03-01 12:17:09 +00:00
|
|
|
from pkg_resources import get_distribution
|
|
|
|
|
2021-03-02 16:21:20 +00:00
|
|
|
from pytorch_lightning.utilities import (
|
|
|
|
_APEX_AVAILABLE,
|
2022-02-04 17:02:09 +00:00
|
|
|
_BAGUA_AVAILABLE,
|
2021-03-02 19:45:13 +00:00
|
|
|
_DEEPSPEED_AVAILABLE,
|
|
|
|
_FAIRSCALE_AVAILABLE,
|
2021-05-24 07:11:45 +00:00
|
|
|
_FAIRSCALE_FULLY_SHARDED_AVAILABLE,
|
2022-05-05 16:06:26 +00:00
|
|
|
_HIVEMIND_AVAILABLE,
|
2021-03-02 16:21:20 +00:00
|
|
|
_HOROVOD_AVAILABLE,
|
2022-03-25 10:24:52 +00:00
|
|
|
_HPU_AVAILABLE,
|
2021-06-11 15:07:04 +00:00
|
|
|
_IPU_AVAILABLE,
|
2021-11-30 14:48:03 +00:00
|
|
|
_OMEGACONF_AVAILABLE,
|
2021-08-24 02:40:36 +00:00
|
|
|
_RICH_AVAILABLE,
|
2022-04-10 04:23:16 +00:00
|
|
|
_TORCH_GREATER_EQUAL_1_10,
|
2021-03-02 16:21:20 +00:00
|
|
|
_TORCH_QUANTIZE_AVAILABLE,
|
|
|
|
_TPU_AVAILABLE,
|
|
|
|
)
|
|
|
|
|
2022-02-28 10:45:32 +00:00
|
|
|
# Whether the installed Horovod build reports NCCL support; stays ``False`` when Horovod is unavailable.
_HOROVOD_NCCL_AVAILABLE = False
if _HOROVOD_AVAILABLE:
    import horovod

    try:
        # `nccl_built` returns an integer, so coerce it to a proper boolean flag
        _HOROVOD_NCCL_AVAILABLE = bool(horovod.torch.nccl_built())
    except AttributeError:
        # AttributeError can be raised if MPI is not available:
        # https://github.com/horovod/horovod/blob/v0.23.0/horovod/torch/__init__.py#L33-L34
        # Nothing was assigned in that case, so spell out the fallback explicitly.
        _HOROVOD_NCCL_AVAILABLE = False
|
2021-03-01 12:17:09 +00:00
|
|
|
|
|
|
|
|
2021-03-02 08:03:32 +00:00
|
|
|
class RunIf:
    """Conditional-skip marker for tests, fully compatible with ``pytest.mark``.

    Calling ``RunIf(...)`` does not create a ``RunIf`` instance: ``__new__`` returns a
    ``pytest.mark.skipif`` marker whose condition is true as soon as one of the requested
    requirements is not satisfied::

        @RunIf(min_torch="0.0")
        @pytest.mark.parametrize("arg1", [1, 2.0])
        def test_wrapper(arg1):
            assert arg1 > 0.0
    """

    def __new__(
        cls,
        *args,
        min_gpus: int = 0,
        min_torch: Optional[str] = None,
        max_torch: Optional[str] = None,
        min_python: Optional[str] = None,
        quantization: bool = False,
        amp_apex: bool = False,
        bf16_cuda: bool = False,
        tpu: bool = False,
        ipu: bool = False,
        hpu: bool = False,
        horovod: bool = False,
        horovod_nccl: bool = False,
        skip_windows: bool = False,
        standalone: bool = False,
        fairscale: bool = False,
        fairscale_fully_sharded: bool = False,
        deepspeed: bool = False,
        rich: bool = False,
        skip_hanging_spawn: bool = False,
        omegaconf: bool = False,
        slow: bool = False,
        bagua: bool = False,
        hivemind: bool = False,
        **kwargs,
    ):
        """Build the ``pytest.mark.skipif`` marker for the requested requirements.

        Args:
            *args: Any :class:`pytest.mark.skipif` arguments.
            min_gpus: Require this number of gpus.
            min_torch: Require that PyTorch is greater or equal than this version.
            max_torch: Require that PyTorch is less than this version.
            min_python: Require that Python is greater or equal than this version.
            quantization: Require that `torch.quantization` is available and that the ``fbgemm`` engine is supported.
            amp_apex: Require that NVIDIA/apex is installed.
            bf16_cuda: Require that CUDA device supports bf16.
            tpu: Require that TPU is available.
            ipu: Require that IPU is available and that ``PL_RUN_IPU_TESTS=1`` is set.
            hpu: Require that HPU is available.
            horovod: Require that Horovod is installed.
            horovod_nccl: Require that Horovod is installed with NCCL support.
            skip_windows: Skip for Windows platform.
            standalone: Mark the test as standalone, our CI will run it in a separate process.
                The test is skipped unless ``PL_RUN_STANDALONE_TESTS=1`` is set.
            fairscale: Require that facebookresearch/fairscale is installed.
            fairscale_fully_sharded: Require that `fairscale` fully sharded support is available.
            deepspeed: Require that microsoft/DeepSpeed is installed.
            rich: Require that willmcgugan/rich is installed.
            skip_hanging_spawn: Skip the test as it's impacted by hanging loggers on spawn.
            omegaconf: Require that omry/omegaconf is installed.
            slow: Mark the test as slow, our CI will run it in a separate job.
                The test is skipped unless ``PL_RUN_SLOW_TESTS=1`` is set.
            bagua: Require that BaguaSys/bagua is installed. Always skipped on Windows and macOS.
            hivemind: Require that Hivemind is installed. Always skipped on Windows and macOS.
            **kwargs: Any :class:`pytest.mark.skipif` keyword arguments.

        Returns:
            The ``pytest.mark.skipif`` marker. Its reason lists every requirement that is not met.
        """
        # Parallel lists: ``conditions[i]`` is True when the requirement described by ``reasons[i]`` is NOT met.
        conditions = []
        reasons = []

        if min_gpus:
            conditions.append(torch.cuda.device_count() < min_gpus)
            reasons.append(f"GPUs>={min_gpus}")

        if min_torch:
            torch_version = get_distribution("torch").version
            conditions.append(Version(torch_version) < Version(min_torch))
            reasons.append(f"torch>={min_torch}")

        if max_torch:
            torch_version = get_distribution("torch").version
            conditions.append(Version(torch_version) >= Version(max_torch))
            reasons.append(f"torch<{max_torch}")

        if min_python:
            py_version = f"{sys.version_info.major}.{sys.version_info.minor}.{sys.version_info.micro}"
            conditions.append(Version(py_version) < Version(min_python))
            reasons.append(f"python>={min_python}")

        if quantization:
            _miss_default = "fbgemm" not in torch.backends.quantized.supported_engines
            conditions.append(not _TORCH_QUANTIZE_AVAILABLE or _miss_default)
            reasons.append("PyTorch quantization")

        if amp_apex:
            conditions.append(not _APEX_AVAILABLE)
            reasons.append("NVIDIA Apex")

        if bf16_cuda:
            try:
                cond = not (torch.cuda.is_available() and _TORCH_GREATER_EQUAL_1_10 and torch.cuda.is_bf16_supported())
            except (AssertionError, RuntimeError) as e:
                # AssertionError: Torch not compiled with CUDA enabled
                # RuntimeError: Found no NVIDIA driver on your system.
                message = str(e)
                known_messages = ("Found no NVIDIA driver", "Torch not compiled with CUDA")
                # Only errors matching NONE of the known "no usable CUDA" messages are unrelated.
                # Combining the two `not in` checks with `or` would flag every error as unrelated,
                # because a single message never contains both substrings.
                if not any(known in message for known in known_messages):
                    raise
                cond = True

            conditions.append(cond)
            reasons.append("CUDA device bf16")

        if skip_windows:
            conditions.append(sys.platform == "win32")
            reasons.append("unimplemented on Windows")

        if tpu:
            conditions.append(not _TPU_AVAILABLE)
            reasons.append("TPU")

        if ipu:
            env_flag = os.getenv("PL_RUN_IPU_TESTS", "0")
            conditions.append(env_flag != "1" or not _IPU_AVAILABLE)
            reasons.append("IPU")
            # forwarded to the marker as a keyword argument
            # NOTE(review): presumably read during test collection like `standalone`/`slow` - confirm
            kwargs["ipu"] = True

        if hpu:
            conditions.append(not _HPU_AVAILABLE)
            reasons.append("HPU")

        if horovod:
            conditions.append(not _HOROVOD_AVAILABLE)
            reasons.append("Horovod")

        if horovod_nccl:
            conditions.append(not _HOROVOD_NCCL_AVAILABLE)
            reasons.append("Horovod with NCCL")

        if standalone:
            env_flag = os.getenv("PL_RUN_STANDALONE_TESTS", "0")
            conditions.append(env_flag != "1")
            reasons.append("Standalone execution")
            # used in tests/conftest.py::pytest_collection_modifyitems
            kwargs["standalone"] = True

        if fairscale:
            conditions.append(not _FAIRSCALE_AVAILABLE)
            reasons.append("Fairscale")

        if fairscale_fully_sharded:
            conditions.append(not _FAIRSCALE_FULLY_SHARDED_AVAILABLE)
            reasons.append("Fairscale Fully Sharded")

        if deepspeed:
            conditions.append(not _DEEPSPEED_AVAILABLE)
            reasons.append("Deepspeed")

        if rich:
            conditions.append(not _RICH_AVAILABLE)
            reasons.append("Rich")

        if skip_hanging_spawn:
            # strategy=ddp_spawn, accelerator=cpu, python>=3.8, torch<1.9 does not work
            py_version = f"{sys.version_info.major}.{sys.version_info.minor}.{sys.version_info.micro}"
            ge_3_8 = Version(py_version) >= Version("3.8")
            torch_version = get_distribution("torch").version
            old_torch = Version(torch_version) < Version("1.9")
            conditions.append(ge_3_8 and old_torch)
            reasons.append("Impacted by hanging DDP spawn")

        if omegaconf:
            conditions.append(not _OMEGACONF_AVAILABLE)
            reasons.append("omegaconf")

        if slow:
            env_flag = os.getenv("PL_RUN_SLOW_TESTS", "0")
            conditions.append(env_flag != "1")
            reasons.append("Slow test")
            # used in tests/conftest.py::pytest_collection_modifyitems
            kwargs["slow"] = True

        if bagua:
            conditions.append(not _BAGUA_AVAILABLE or sys.platform in ("win32", "darwin"))
            reasons.append("Bagua")

        if hivemind:
            conditions.append(not _HIVEMIND_AVAILABLE or sys.platform in ("win32", "darwin"))
            reasons.append("Hivemind")

        # keep only the reasons whose requirement is actually unmet
        reasons = [rs for cond, rs in zip(conditions, reasons) if cond]
        return pytest.mark.skipif(
            *args, condition=any(conditions), reason=f"Requires: [{' + '.join(reasons)}]", **kwargs
        )
|
2021-03-01 12:17:09 +00:00
|
|
|
|
|
|
|
|
2021-03-02 08:03:32 +00:00
|
|
|
@RunIf(min_torch="99")
def test_always_skip():
    """Check that an unmet ``RunIf`` requirement skips the test; the body is never meant to execute."""
    # Use `sys.exit` instead of the `site`-provided `exit` helper, which is intended for the
    # interactive interpreter and is not defined when the `site` module is not loaded.
    sys.exit(1)
|
|
|
|
|
|
|
|
|
2021-03-01 15:26:09 +00:00
|
|
|
@pytest.mark.parametrize("arg1", [0.5, 1.0, 2.0])
@RunIf(min_torch="0.0")
def test_wrapper(arg1: float):
    """Check that ``RunIf`` can be stacked with ``pytest.mark.parametrize`` on the same test."""
    # every parametrized value is strictly positive, so this holds whenever the test runs
    assert 0.0 < arg1
|