2022-06-22 08:57:50 +00:00
|
|
|
# Copyright The Lightning AI team.
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
import os
|
|
|
|
from unittest import mock
|
|
|
|
|
|
|
|
import pytest
|
2022-07-27 15:40:40 +00:00
|
|
|
import torch
|
2022-06-22 08:57:50 +00:00
|
|
|
|
2023-02-01 20:34:38 +00:00
|
|
|
import lightning.fabric
|
2023-07-14 23:16:42 +00:00
|
|
|
from lightning.fabric.accelerators.xla import _using_pjrt, _XLA_GREATER_EQUAL_2_1
|
2023-02-01 20:34:38 +00:00
|
|
|
from lightning.fabric.plugins.environments import XLAEnvironment
|
2023-03-03 16:55:48 +00:00
|
|
|
from tests_fabric.helpers.runif import RunIf
|
2022-06-22 08:57:50 +00:00
|
|
|
|
|
|
|
|
|
|
|
@RunIf(tpu=True)
# keep existing environment or else xla will default to pjrt
@mock.patch.dict(os.environ, os.environ.copy(), clear=True)
def test_default_attributes(monkeypatch):
    """Check what ``XLAEnvironment`` reports when no rank/world-size environment variables are set.

    The XLA runtime lookups are stubbed so that the environment sees a single process with rank 0. The address and
    port properties are expected to raise ``NotImplementedError``.

    """
    if not _using_pjrt():
        from torch_xla import _XLAC

        # avoid: "Cannot replicate if number of devices ... is different from ..."
        monkeypatch.setattr(_XLAC, "_xla_get_default_device", lambda: torch.device("xla:0"))
    else:
        # calling the real functions creates side effects in other tests, so they are replaced with stubs;
        # the module providing them depends on the installed torch_xla version
        if _XLA_GREATER_EQUAL_2_1:
            from torch_xla import runtime as xla_rt
        else:
            from torch_xla.experimental import pjrt as xla_rt

        monkeypatch.setattr(xla_rt, "world_size", lambda: 1)
        monkeypatch.setattr(xla_rt, "global_ordinal", lambda: 0)
        monkeypatch.setattr(xla_rt, "local_ordinal", lambda: 0)

    xla_env = XLAEnvironment()
    assert not xla_env.creates_processes_externally
    assert xla_env.world_size() == 1
    assert xla_env.global_rank() == 0
    assert xla_env.local_rank() == 0
    assert xla_env.node_rank() == 0

    # reading either property must raise
    for unsupported in ("main_address", "main_port"):
        with pytest.raises(NotImplementedError):
            getattr(xla_env, unsupported)
|
|
|
|
|
|
|
|
|
|
|
|
@RunIf(tpu=True)
@mock.patch.dict(os.environ, os.environ.copy(), clear=True)
def test_attributes_from_environment_variables(monkeypatch):
    """Check that ``XLAEnvironment`` reports the world size and ranks configured by the test setup.

    Without PJRT the values are provided through ``XRT_*`` environment variables; with PJRT the runtime lookup
    functions are stubbed instead. The test also asserts that ``set_global_rank`` and ``set_world_size`` leave the
    reported values unchanged.

    """
    if _using_pjrt():
        # PJRT doesn't pull these from envvars
        if _XLA_GREATER_EQUAL_2_1:
            from torch_xla import runtime as xla_rt
        else:
            from torch_xla.experimental import pjrt as xla_rt

        monkeypatch.setattr(xla_rt, "world_size", lambda: 1)
        monkeypatch.setattr(xla_rt, "global_ordinal", lambda: 0)
        monkeypatch.setattr(xla_rt, "local_ordinal", lambda: 2)
        if _XLA_GREATER_EQUAL_2_1:
            monkeypatch.setattr(xla_rt, "host_index", lambda: 3)
        else:
            # the older pjrt branch sets the host ordinal through the environment variable
            os.environ["XRT_HOST_ORDINAL"] = "3"
    else:
        xrt_settings = {
            "XRT_SHARD_WORLD_SIZE": "1",
            "XRT_SHARD_ORDINAL": "0",
            "XRT_SHARD_LOCAL_ORDINAL": "2",
            "XRT_HOST_ORDINAL": "3",
        }
        os.environ.update(xrt_settings)

    xla_env = XLAEnvironment()

    # reading either property must raise
    for unsupported in ("main_address", "main_port"):
        with pytest.raises(NotImplementedError):
            getattr(xla_env, unsupported)

    assert xla_env.world_size() == 1
    assert xla_env.global_rank() == 0
    assert xla_env.local_rank() == 2
    assert xla_env.node_rank() == 3

    # the setters must not change what the environment reports
    xla_env.set_global_rank(100)
    assert xla_env.global_rank() == 0
    xla_env.set_world_size(100)
    assert xla_env.world_size() == 1
|
|
|
|
|
|
|
|
|
|
|
|
def test_detect(monkeypatch):
    """Check that ``XLAEnvironment.detect()`` is falsy or truthy in line with ``XLAAccelerator.is_available``."""
    accelerator_cls = lightning.fabric.accelerators.xla.XLAAccelerator

    # accelerator reported as unavailable -> no XLA environment detected
    monkeypatch.setattr(accelerator_cls, "is_available", lambda: False)
    assert not XLAEnvironment.detect()

    # accelerator reported as available -> XLA environment detected
    monkeypatch.setattr(accelerator_cls, "is_available", lambda: True)
    assert XLAEnvironment.detect()
|