lightning/dockers/tpu-tests/tpu_test_cases.jsonnet

56 lines
1.7 KiB
Plaintext

local base = import 'templates/base.libsonnet';
local tpus = import 'templates/tpus.libsonnet';
local utils = import "templates/utils.libsonnet";
# Shell script run inside the test container. It lives in its own local so the
# job definition below stays compact. Tokens in curly braces ({PR_NUMBER},
# {SHA}) are not Jsonnet syntax; presumably the CI pipeline substitutes them
# textually before this file is evaluated -- TODO confirm.
#
# Steps, in order:
#   1. Source ~/.bashrc and activate the `lightning` conda environment.
#   2. Clone the repository, fetch the pull-request head and check out {SHA}.
#   3. Install the package in editable mode with PACKAGE_NAME=pytorch and
#      FREEZE_REQUIREMENTS=1 exported.
#   4. Build XRT_TPU_CONFIG from KUBE_GOOGLE_CLOUD_TPU_ENDPOINTS, skipping the
#      first 7 characters of that variable (presumably a URL scheme prefix --
#      verify against the cluster's value).
#   5. Run the listed TPU test files under coverage, remember pytest's exit
#      status, print the XML coverage report with tab characters removed, and
#      finish with a `test` command that succeeds only if pytest exited with 0.
local tpuTestScript = |||
  source ~/.bashrc
  conda activate lightning
  mkdir -p /home/runner/work/pytorch-lightning && cd /home/runner/work/pytorch-lightning
  git clone https://github.com/Lightning-AI/lightning.git
  cd lightning
  echo $PWD
  git ls-remote --refs origin
  git fetch origin "refs/pull/{PR_NUMBER}/head:pr/{PR_NUMBER}" && git checkout "pr/{PR_NUMBER}"
  git checkout {SHA}
  export PACKAGE_NAME=pytorch
  export FREEZE_REQUIREMENTS=1
  pip install -e .
  echo $KUBE_GOOGLE_CLOUD_TPU_ENDPOINTS
  export XRT_TPU_CONFIG="tpu_worker;0;${KUBE_GOOGLE_CLOUD_TPU_ENDPOINTS:7}"
  cd tests/tests_pytorch
  echo $PWD
  # TODO (@kaushikb11): Add device stats tests here
  coverage run --source pytorch_lightning -m pytest -v --capture=no \
  strategies/test_tpu_spawn.py \
  profilers/test_xla_profiler.py \
  accelerators/test_tpu.py \
  models/test_tpu.py \
  plugins/environments/test_xla_environment.py
  test_exit_code=$?
  echo "\n||| END PYTEST LOGS |||\n"
  coverage xml
  cat coverage.xml | tr -d '\t'
  test $test_exit_code -eq 0
|||;

# TPU test job definition, built by extending `base.BaseTest` with the fields
# below. The {PYTHON_VERSION} / {PYTORCH_VERSION} tokens in the string values
# are left as-is here; presumably they are filled in by the CI pipeline --
# TODO confirm.
local tputests = base.BaseTest {
  # --- Identification -------------------------------------------------------
  frameworkPrefix: 'pl',
  modelName: 'tpu-tests',
  mode: 'postsubmit',

  # --- Container image ------------------------------------------------------
  image: 'pytorchlightning/pytorch_lightning',
  imageTag: 'base-xla-py{PYTHON_VERSION}-torch{PYTORCH_VERSION}',

  # --- Hardware -------------------------------------------------------------
  accelerator: tpus.v3_8,
  # `+:` merges into the tpuSettings inherited from the base template rather
  # than replacing it.
  tpuSettings+: {
    softwareVersion: 'pytorch-{PYTORCH_VERSION}',
  },

  # --- Execution ------------------------------------------------------------
  configMaps: [],
  timeout: 1200,  # 20 minutes, in seconds.
  command: utils.scriptCommand(tpuTestScript),
};
# Value of this file: the `oneshotJob` field of the test definition above.
tputests.oneshotJob