lightning/tests/standalone_tests.sh

#!/bin/bash
# Copyright The PyTorch Lightning team.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Exit immediately when a command fails (bash `set -e` semantics).
set -e

# Tests marked as standalone only run when this variable is present in the environment.
PL_RUN_STANDALONE_TESTS=1
export PL_RUN_STANDALONE_TESTS

# Interpreter arguments shared by the pytest invocations further down. Stored as
# one string that is expanded unquoted at the call sites so it splits into words.
defaults='-m coverage run --source pytorch_lightning --append -m pytest --capture=no'

# Locate `@RunIf(standalone=True)` markers with a recursive, whole-word grep over
# the `tests` directory. Done by hand rather than through pytest because it is faster.
grep_output=$(
  grep -r -w \
    -e 'standalone=True' \
    --include '*.py' \
    --exclude 'tests/conftest.py' \
    'tests'
)

# Keep only the path column (everything before the first ':') and drop duplicates.
files=$(cut -d: -f1 <<< "$grep_output" | sort | uniq)

#######################################
# Fill the global array `parametrizations_arr` with one element per non-empty
# line read from stdin.
# Splitting on lines (instead of relying on unquoted word splitting) keeps test
# ids that contain spaces intact and prevents the `[...]` part of an id from
# being treated as a glob pattern. A `while read` loop is used rather than
# `mapfile` so that this also works with Bash 3.2.
# Globals:   parametrizations_arr (written)
# Arguments: none (input comes from stdin)
#######################################
read_parametrizations() {
  local line
  parametrizations_arr=()
  # `|| [[ -n "$line" ]]` also picks up a final line without a trailing newline
  while IFS= read -r line || [[ -n "$line" ]]; do
    if [[ -n "$line" ]]; then
      parametrizations_arr+=("$line")
    fi
  done
}

# get the list of parametrizations. we need to call them separately. the trailing summary lines are removed.
# note: if there's a syntax error, this will fail with some garbled output
# `$files` is intentionally unquoted so that every path becomes its own argument.
# NOTE(review): the darwin branch drops the last three lines while the other branch drops the last two - confirm this is intended.
if [[ "$OSTYPE" == "darwin"* ]]; then
  parametrizations=$(python -m pytest $files --collect-only --quiet "$@" | tail -r | sed -e '1,3d' | tail -r)
else
  parametrizations=$(python -m pytest $files --collect-only --quiet "$@" | head -n -2)
fi
read_parametrizations <<< "$parametrizations"

# tests to skip - space separated
blocklist='tests/profiler/test_profiler.py::test_pytorch_profiler_nested_emit_nvtx tests/utilities/test_warnings.py'
# accumulates "<status>\t<test id>\n" entries; the escapes are expanded when the report is printed
report=''

#######################################
# Check whether a test id is on the blocklist.
# The id is searched as a fixed string inside `blocklist`, so an id matches when
# it occurs anywhere in that string. Nothing is printed (`grep -q`).
# NOTE(review): because this is a substring search, an id that is only a prefix
# of a blocklisted entry also matches - confirm this is acceptable.
# Globals:   blocklist (read)
# Arguments: $1 - test id as reported by pytest
# Returns:   0 if the id is blocklisted, non-zero otherwise
#######################################
is_blocklisted() {
  grep -qF -- "$1" <<< "$blocklist"
}

for parametrization in "${parametrizations_arr[@]}"; do
  # check blocklist
  if is_blocklisted "${parametrization}"; then
    report+="Skipped\t$parametrization\n"
    continue
  fi

  # run the test
  echo "Running ${parametrization}"
  # `defaults` is deliberately unquoted so that it splits into separate arguments
  python ${defaults} "${parametrization}"

  report+="Ran\t$parametrization\n"
done

# Run the nested emit_nvtx profiler test under nvprof, but only when
# `nvcc --version` succeeds (i.e. nvcc can be executed on this machine).
if nvcc --version; then
    # `defaults` is deliberately unquoted so that it splits into separate arguments
    nvprof --profile-from-start off -o trace_name.prof -- python ${defaults} tests/profiler/test_profiler.py::test_pytorch_profiler_nested_emit_nvtx
fi

# needs to run outside of `pytest`
# A failure stops the script with the exit status of the python process. This is
# stated explicitly instead of inspecting `$?` afterwards, which can never
# observe a failure while `set -e` is active.
python tests/utilities/test_warnings.py || exit
report+="Ran\ttests/utilities/test_warnings.py\n"

# test deadlock is properly handled with TorchElastic.
# The run counts as passed when its output contains a line with "SUCCEEDED".
# `|| true` prevents `set -e` from aborting silently on grep's non-zero status
# when nothing matches, so that the check below can report the failure.
LOGS=$(PL_RUN_STANDALONE_TESTS=1 PL_RECONCILE_PROCESS=1 python -m torch.distributed.run --nproc_per_node=2 --max_restarts 0 -m coverage run --source pytorch_lightning -a tests/plugins/environments/torch_elastic_deadlock.py | grep "SUCCEEDED") || true
if [[ -z "$LOGS" ]]; then
    echo "tests/plugins/environments/torch_elastic_deadlock.py did not report SUCCEEDED" >&2
    exit 1
fi
report+="Ran\ttests/plugins/environments/torch_elastic_deadlock.py\n"

# test that a user can manually launch individual processes
export PYTHONPATH="${PYTHONPATH}:$(pwd)"
args="--trainer.gpus 2 --trainer.strategy ddp --trainer.max_epochs=1 --trainer.limit_train_batches=1 --trainer.limit_val_batches=1 --trainer.limit_test_batches=1"
# The process with LOCAL_RANK=1 is started in the background and the one with
# LOCAL_RANK=0 in the foreground. `args` is deliberately unquoted so that it
# splits into separate arguments.
MASTER_ADDR="localhost" MASTER_PORT=1234 LOCAL_RANK=1 python pl_examples/basic_examples/mnist_examples/image_classifier_5_lightning_datamodule.py ${args} &
rank1_pid=$!
MASTER_ADDR="localhost" MASTER_PORT=1234 LOCAL_RANK=0 python pl_examples/basic_examples/mnist_examples/image_classifier_5_lightning_datamodule.py ${args}
# Reap the background process: `wait` returns its exit status, so a failure of
# rank 1 fails the script instead of going unnoticed, and the process cannot
# outlive the script.
wait "$rank1_pid" || exit
report+="Ran\tmanual ddp launch test\n"

#######################################
# Print the test report between two rulers of 80 `=` characters.
# The report is passed to printf as a `%b` argument rather than as the format
# string, so its \t and \n escapes are still expanded while a `%` inside a
# test id is printed literally instead of being parsed as a format directive.
# Arguments: $1 - report text containing backslash escapes
# Outputs:   the framed report on stdout
#######################################
print_report() {
  printf '=%.s' {1..80}
  printf '\n%b' "$1"
  printf '=%.s' {1..80}
  printf '\n'
}

# echo test report
print_report "$report"
Automatically find and run special tests (#6669) 2021-03-26 17:04:59 +00:00			`#!/bin/bash`
Simplify optimization Logic (#4984) * Rely on ddp plugin for blocking sync behaviour, and skip if we're using manual optimization * debug * Revert "debug" This reverts commit ccca6b6b * Expose manual reduce for automatic optimization * Add input arguments * Enable parity test * clean imports * Expose hook after to ensure we reset * Fix naming * add * fix test * uniformize optimizer logic * resolve test * resovle flake8 * resolve amp bug * update tests * remove bug * remove optimizer_step in accelerators * typo * update lightning optimizer * set doesn't work with ddp_spawn * resolve flake8 * update threshold * ignore pyright * correct codeFactor * remove useless if * remove zer_grad function * simplify step * remove typo * resolve bug * Apply suggestions from code review * update on comments * resolve bugs * remove tests * Update pytorch_lightning/trainer/configuration_validator.py Co-authored-by: Rohit Gupta <rohitgr1998@gmail.com> * simplify testing * add more tests Co-authored-by: SeanNaren <sean@grid.ai> Co-authored-by: Jirka Borovec <Borda@users.noreply.github.com> Co-authored-by: Rohit Gupta <rohitgr1998@gmail.com> 2020-12-07 12:55:49 +00:00			`# Copyright The PyTorch Lightning team.`
			`#`
			`# Licensed under the Apache License, Version 2.0 (the "License");`
			`# you may not use this file except in compliance with the License.`
			`# You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`# Unless required by applicable law or agreed to in writing, software`
			`# distributed under the License is distributed on an "AS IS" BASIS,`
			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`# See the License for the specific language governing permissions and`
			`# limitations under the License.`
[bug-fix] Trainer.test points to latest best_model_path (#5161) * resolve bug * update code * add set -e * Update pytorch_lightning/callbacks/model_checkpoint.py Co-authored-by: Adrian Wälchli <aedu.waelchli@gmail.com> * update test * Update tests/checkpointing/test_trainer_checkpoint.py Co-authored-by: Sean Naren <sean.narenthiran@gmail.com> * Update tests/checkpointing/test_trainer_checkpoint.py Co-authored-by: Carlos Mocholí <carlossmocholi@gmail.com> * update on comments * resolve test * convert to set * update * add error triggering * update * update on comments * update * resolve import * update * update * Update pytorch_lightning/plugins/rpc_plugin.py Co-authored-by: Jirka Borovec <Borda@users.noreply.github.com> * update Co-authored-by: Adrian Wälchli <aedu.waelchli@gmail.com> Co-authored-by: Sean Naren <sean.narenthiran@gmail.com> Co-authored-by: Carlos Mocholí <carlossmocholi@gmail.com> Co-authored-by: Ubuntu <ubuntu@ip-172-31-62-109.ec2.internal> Co-authored-by: Jirka Borovec <Borda@users.noreply.github.com> (cherry picked from commit d5b367871fa3924090ec74bf903bd172bd3e2343) 2021-01-05 10:01:59 +00:00			`set -e`
Automatically find and run special tests (#6669) 2021-03-26 17:04:59 +00:00
			`# this environment variable allows special tests to run`
Rename special to standalone (#10779) 2021-11-26 17:13:14 +00:00			`export PL_RUN_STANDALONE_TESTS=1`
Automatically find and run special tests (#6669) 2021-03-26 17:04:59 +00:00			`# python arguments`
Support special test parametrizations (#10569) 2021-11-17 15:46:14 +00:00			`defaults='-m coverage run --source pytorch_lightning --append -m pytest --capture=no'`
Automatically find and run special tests (#6669) 2021-03-26 17:04:59 +00:00
Rename special to standalone (#10779) 2021-11-26 17:13:14 +00:00			# find tests marked as `@RunIf(standalone=True)`. done manually instead of with pytest because it is faster
			`grep_output=$(grep --recursive --word-regexp 'tests' --regexp 'standalone=True' --include '*.py' --exclude 'tests/conftest.py')`
Support special test parametrizations (#10569) 2021-11-17 15:46:14 +00:00
			`# file paths, remove duplicates`
			`files=$(echo "$grep_output" \| cut -f1 -d: \| sort \| uniq)`

			`# get the list of parametrizations. we need to call them separately. the last two lines are removed.`
			`# note: if there's a syntax error, this will fail with some garbled output`
			`if [[ "$OSTYPE" == "darwin"* ]]; then`
Fix standalone test collection (#13177) 2022-05-30 22:14:33 +00:00			`parametrizations=$(python -m pytest $files --collect-only --quiet "$@" \| tail -r \| sed -e '1,3d' \| tail -r)`
Support special test parametrizations (#10569) 2021-11-17 15:46:14 +00:00			`else`
Fix standalone test collection (#13177) 2022-05-30 22:14:33 +00:00			`parametrizations=$(python -m pytest $files --collect-only --quiet "$@" \| head -n -2)`
Support special test parametrizations (#10569) 2021-11-17 15:46:14 +00:00			`fi`
			`parametrizations_arr=($parametrizations)`
Automatically find and run special tests (#6669) 2021-03-26 17:04:59 +00:00
			`# tests to skip - space separated`
Fix standalone test collection (#13177) 2022-05-30 22:14:33 +00:00			`blocklist='tests/profiler/test_profiler.py::test_pytorch_profiler_nested_emit_nvtx tests/utilities/test_warnings.py'`
Automatically find and run special tests (#6669) 2021-03-26 17:04:59 +00:00			`report=''`

Support special test parametrizations (#10569) 2021-11-17 15:46:14 +00:00			`for i in "${!parametrizations_arr[@]}"; do`
			`parametrization=${parametrizations_arr[$i]}`
Automatically find and run special tests (#6669) 2021-03-26 17:04:59 +00:00
Support special test parametrizations (#10569) 2021-11-17 15:46:14 +00:00			`# check blocklist`
			`if echo $blocklist \| grep -F "${parametrization}"; then`
			`report+="Skipped\t$parametrization\n"`
			`continue`
			`fi`
Automatically find and run special tests (#6669) 2021-03-26 17:04:59 +00:00
Support special test parametrizations (#10569) 2021-11-17 15:46:14 +00:00			`# run the test`
			`echo "Running ${parametrization}"`
			`python ${defaults} "${parametrization}"`
DeepSpeed ZeRO Update (#6546) * Add context to call hook to handle all modules defined within the hook * Expose some additional parameters * Added docs, exposed parameters * Make sure we only configure if necessary * Setup activation checkpointing regardless, saves the user having to do it manually * Add some tests that fail currently * update * update * update * add tests * change docstring * resolve accumulate_grad_batches * resolve flake8 * Update DeepSpeed to use latest version, add some comments * add metrics * update * Small formatting fixes, clean up some code * Few cleanups * No need for default state * Fix tests, add some boilerplate that should move eventually * Add hook removal * Add a context manager to handle hook * Small naming cleanup * wip * move save_checkpoint responsability to accelerator * resolve flake8 * add BC * Change recommended scale to 16 * resolve flake8 * update test * update install * update * update test * update * update * update test * resolve flake8 * update * update * update on comments * Push * pull * Update pytorch_lightning/plugins/training_type/deepspeed.py Co-authored-by: Adrian Wälchli <aedu.waelchli@gmail.com> * Update pytorch_lightning/plugins/training_type/deepspeed.py Co-authored-by: Adrian Wälchli <aedu.waelchli@gmail.com> * update * Apply suggestions from code review * Swap to using world size defined by plugin * update * update todo * Remove deepspeed from extra, keep it in the base cuda docker install * Push * pull * update * update * update * update * Minor changes * duplicate * format * format2 Co-authored-by: SeanNaren <sean@grid.ai> Co-authored-by: Adrian Wälchli <aedu.waelchli@gmail.com> Co-authored-by: Sean Naren <sean.narenthiran@gmail.com> Co-authored-by: Carlos Mocholi <carlossmocholi@gmail.com> Co-authored-by: Jirka Borovec <Borda@users.noreply.github.com> Co-authored-by: Jirka Borovec <jirka.borovec@seznam.cz> 2021-03-30 17:39:02 +00:00
Support special test parametrizations (#10569) 2021-11-17 15:46:14 +00:00			`report+="Ran\t$parametrization\n"`
Automatically find and run special tests (#6669) 2021-03-26 17:04:59 +00:00			`done`

[IPU] Add special tests for IPUs 2/n (#7833) * Add special tests for IPUs, run nvprof only if cuda available * Add missing min_gpu 2021-06-04 17:53:09 +00:00			`if nvcc --version; then`
XLA Profiler integration (#8014) 2021-06-28 19:28:05 +00:00			`nvprof --profile-from-start off -o trace_name.prof -- python ${defaults} tests/profiler/test_profiler.py::test_pytorch_profiler_nested_emit_nvtx`
[IPU] Add special tests for IPUs 2/n (#7833) * Add special tests for IPUs, run nvprof only if cuda available * Add missing min_gpu 2021-06-04 17:53:09 +00:00			`fi`
Automatically find and run special tests (#6669) 2021-03-26 17:04:59 +00:00
Actually show deprecation warnings and their line level [2/2] (#8002) Co-authored-by: Adrian Wälchli <aedu.waelchli@gmail.com> 2021-06-21 16:51:53 +00:00			# needs to run outside of `pytest`
			`python tests/utilities/test_warnings.py`
			`if [ $? -eq 0 ]; then`
			`report+="Ran\ttests/utilities/test_warnings.py\n"`
			`fi`

Torch Elastic DDP DeadLock bug fix (#8655) Co-authored-by: Carlos Mocholí <carlossmocholi@gmail.com> 2021-08-02 19:48:43 +00:00			`# test deadlock is properly handled with TorchElastic.`
Drop PyTorch 1.8 support (#13155) * Drop PyTorch 1.8 support * Missed update * Skip profiler test until supported * Upgrade ipu dockerfile pytorch version * Update XLA version 2022-06-15 00:46:44 +00:00			`LOGS=$(PL_RUN_STANDALONE_TESTS=1 PL_RECONCILE_PROCESS=1 python -m torch.distributed.run --nproc_per_node=2 --max_restarts 0 -m coverage run --source pytorch_lightning -a tests/plugins/environments/torch_elastic_deadlock.py \| grep "SUCCEEDED")`
			`if [ -z "$LOGS" ]; then`
			`exit 1`
			`fi`
			`report+="Ran\ttests/plugins/environments/torch_elastic_deadlock.py\n"`
Torch Elastic DDP DeadLock bug fix (#8655) Co-authored-by: Carlos Mocholí <carlossmocholi@gmail.com> 2021-08-02 19:48:43 +00:00
support launching Lightning ddp with traditional command (#7480) Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com> Co-authored-by: Carlos Mocholí <carlossmocholi@gmail.com> Co-authored-by: Jirka Borovec <Borda@users.noreply.github.com> 2021-07-14 11:25:36 +00:00			`# test that a user can manually launch individual processes`
MANIFEST.in and setup.py clean-up (#7614) 2021-11-19 14:38:42 +00:00			`export PYTHONPATH="${PYTHONPATH}:$(pwd)"`
Lightning Lite Examples (#9987) Co-authored-by: Kaushik B <kaushikbokka@gmail.com> Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com> Co-authored-by: Justus Schock <12886177+justusschock@users.noreply.github.com> Co-authored-by: SeanNaren <sean@grid.ai> Co-authored-by: Kaushik B <45285388+kaushikb11@users.noreply.github.com> Co-authored-by: thomas chaton <thomas@grid.ai> Co-authored-by: Rohit Gupta <rohitgr1998@gmail.com> Co-authored-by: four4fish <88516121+four4fish@users.noreply.github.com> Co-authored-by: Nicki Skafte Detlefsen <skaftenicki@gmail.com> Co-authored-by: Carlos Mocholi <carlossmocholi@gmail.com> Co-authored-by: Pietro Lesci <61748653+pietrolesci@users.noreply.github.com> 2021-11-02 08:04:29 +00:00			`args="--trainer.gpus 2 --trainer.strategy ddp --trainer.max_epochs=1 --trainer.limit_train_batches=1 --trainer.limit_val_batches=1 --trainer.limit_test_batches=1"`
			`MASTER_ADDR="localhost" MASTER_PORT=1234 LOCAL_RANK=1 python pl_examples/basic_examples/mnist_examples/image_classifier_5_lightning_datamodule.py ${args} &`
			`MASTER_ADDR="localhost" MASTER_PORT=1234 LOCAL_RANK=0 python pl_examples/basic_examples/mnist_examples/image_classifier_5_lightning_datamodule.py ${args}`
support launching Lightning ddp with traditional command (#7480) Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com> Co-authored-by: Carlos Mocholí <carlossmocholi@gmail.com> Co-authored-by: Jirka Borovec <Borda@users.noreply.github.com> 2021-07-14 11:25:36 +00:00			`report+="Ran\tmanual ddp launch test\n"`

Automatically find and run special tests (#6669) 2021-03-26 17:04:59 +00:00			`# echo test report`
			`printf '=%.s' {1..80}`
			`printf "\n$report"`
			`printf '=%.s' {1..80}`
			`printf '\n'`