From 14b28190dd88cef0dcaa7e26bd9b139c55225f15 Mon Sep 17 00:00:00 2001
From: William Falcon
Date: Sun, 30 Aug 2020 09:31:36 -0400
Subject: [PATCH] simplify docs (#3267)

* updated docs

* updated docs

* updated docs

* updated docs

* updated docs

* updated docs
---
 docs/source/community_examples.rst |  21 +++
 docs/source/index.rst              |  43 +++--
 docs/source/new-project.rst        | 247 ++++++++++++++---------------
 3 files changed, 160 insertions(+), 151 deletions(-)
 create mode 100644 docs/source/community_examples.rst

diff --git a/docs/source/community_examples.rst b/docs/source/community_examples.rst
new file mode 100644
index 0000000000..05db763113
--- /dev/null
+++ b/docs/source/community_examples.rst
@@ -0,0 +1,21 @@
+Community Examples
+==================
+
+- `Contextual Emotion Detection (DoubleDistilBert) `_.
+- `Cotatron: Transcription-Guided Speech Encoder `_.
+- `FasterRCNN object detection + Hydra `_.
+- `Hyperparameter optimization with Optuna `_.
+- `Hyperparameter optimization with Ray Tune `_.
+- `Image Inpainting using Partial Convolutions `_.
+- `MNIST on TPU `_.
+- `NER (transformers, TPU) `_.
+- `NeuralTexture (CVPR) `_.
+- `Recurrent Attentive Neural Process `_.
+- `Siamese Nets for One-shot Image Recognition `_.
+- `Speech Transformers `_.
+- `Transformers transfer learning (Huggingface) `_.
+- `Transformers text classification `_.
+- `VAE Library of over 18+ VAE flavors `_.
+- `Transformers Question Answering (SQuAD) `_.
+- `Atlas: End-to-End 3D Scene Reconstruction from Posed Images `_.
+- `Self-Supervised Representation Learning (MoCo and BYOL) `_.
\ No newline at end of file
diff --git a/docs/source/index.rst b/docs/source/index.rst
index ecec56f988..10096eb813 100644
--- a/docs/source/index.rst
+++ b/docs/source/index.rst
@@ -15,18 +15,24 @@ PyTorch Lightning Documentation
    introduction_guide
    performance
 
+.. toctree::
+   :maxdepth: 2
+   :name: pl_docs
+   :caption: Lightning API
+
+   lightning-module
+   trainer
+
 .. toctree::
    :maxdepth: 2
    :name: docs
-   :caption: Python API
+   :caption: Optional extensions
 
    callbacks
-   lightning-module
    datamodules
    loggers
    metrics
    results
-   trainer
 
 .. toctree::
    :maxdepth: 1
@@ -37,27 +43,18 @@ PyTorch Lightning Documentation
 
 .. toctree::
    :maxdepth: 1
-   :name: Community Examples
-   :caption: Community Examples
+   :name: Examples
+   :caption: Examples
 
-   Contextual Emotion Detection (DoubleDistilBert)
-   Cotatron: Transcription-Guided Speech Encoder
-   FasterRCNN object detection + Hydra
-   Hyperparameter optimization with Optuna
-   Hyperparameter optimization with Ray Tune
-   Image Inpainting using Partial Convolutions
-   MNIST on TPU
-   NER (transformers, TPU)
-   NeuralTexture (CVPR)
-   Recurrent Attentive Neural Process
-   Siamese Nets for One-shot Image Recognition
-   Speech Transformers
-   Transformers transfer learning (Huggingface)
-   Transformers text classification
-   VAE Library of over 18+ VAE flavors
-   Transformers Question Answering (SQuAD)
-   Atlas: End-to-End 3D Scene Reconstruction from Posed Images
-   Self-Supervised Representation Learning (MoCo and BYOL)
+   community_examples
+   Autoencoder
+   BYOL
+   DQN
+   GAN
+   GPT-2
+   Image-GPT
+   SimCLR
+   VAE
 
 .. toctree::
    :maxdepth: 1
diff --git a/docs/source/new-project.rst b/docs/source/new-project.rst
index c0753ff2ee..365d9171d8 100644
--- a/docs/source/new-project.rst
+++ b/docs/source/new-project.rst
@@ -14,7 +14,7 @@
 .. _3-steps:
 
 ####################
-Lightning in 3 steps
+Lightning in 2 steps
 ####################
 
-**In this guide we'll show you how to organize your PyTorch code into Lightning in 3 simple steps.**
+**In this guide we'll show you how to organize your PyTorch code into Lightning in 2 simple steps.**
@@ -42,12 +42,12 @@
 Step 0: Install PyTorch Lightning
 *********************************
 
-You can install using `pip `_
+You can install using `pip `_
 
 .. code-block:: bash
 
     pip install pytorch-lightning
-    
+
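A quick way to confirm the install worked before moving on (a minimal editor's sketch, not part of the original patch):

.. code-block:: python

    # should print the installed version (e.g. 0.9.x) without raising ImportError
    import pytorch_lightning as pl
    print(pl.__version__)
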
 Or with `conda `_ (see how to install conda `here `_):
 
 .. code-block:: bash
@@ -92,11 +92,11 @@ Step 1: Define LightningModule
             x = F.relu(x)
             x = self.layer_2(x)
             return x
-    
+
         def configure_optimizers(self):
             optimizer = torch.optim.Adam(self.parameters(), lr=1e-3)
             return optimizer
-    
+
         def training_step(self, batch, batch_idx):
             x, y = batch
             y_hat = self(x)
@@ -116,7 +116,7 @@ The :class:`~pytorch_lightning.core.LightningModule` holds your research code:
 
 A :class:`~pytorch_lightning.core.LightningModule` is a :class:`torch.nn.Module` but with added functionality.
 It organizes your research code into :ref:`hooks`.
-    
+
 In the snippet above we override the basic hooks, but a full list of hooks to customize can be found under :ref:`hooks`.
 
 You can use your :class:`~pytorch_lightning.core.LightningModule` just like a PyTorch model.
@@ -129,14 +129,49 @@ You can use your :class:`~pytorch_lightning.core.LightningModule` just like a Py
 
     y_hat = model(x)
    model.anything_you_can_do_with_pytorch()
-    
+
 More details in :ref:`lightning-module` docs.
 
-Convert your PyTorch Module to Lightning
-========================================
+
+----------
+
+**************************
+Step 2: Fit with a Trainer
+**************************
+
+.. code-block::
+
+    # dataloaders
+    dataset = MNIST(os.getcwd(), download=True, transform=transforms.ToTensor())
+    train, val = random_split(dataset, [55000, 5000])
+    train_loader = DataLoader(train)
+    val_loader = DataLoader(val)
+
+    # init model
+    model = LitModel()
+
+    # most basic trainer, uses good defaults (auto-tensorboard, checkpoints, logs, and more)
+    trainer = pl.Trainer()
+    trainer.fit(model, train_loader, val_loader)
+
+.. note:: Lightning works with pure PyTorch DataLoaders.
+
+.. code-block:: python
+
+    train_dataloader = DataLoader(...)
+    val_dataloader = DataLoader(...)
+    trainer.fit(model, train_dataloader, val_dataloader)
+
+-----
+
+**************************************
+How to organize PyTorch into Lightning
+**************************************
+
+To enable your code to work with Lightning, here's how to organize your PyTorch code into Lightning.
 
 1. Move your computational code
--------------------------------
+===============================
 Move the model architecture and forward pass to your :class:`~pytorch_lightning.core.LightningModule`.
 
 .. code-block::
@@ -154,9 +189,9 @@ Move the model architecture and forward pass to your :class:`~pytorch_lightning.
 
     class LitModel(pl.LightningModule):
 
        def __init__(self):
            super().__init__()
            self.layer_1 = torch.nn.Linear(28 * 28, 128)
            self.layer_2 = torch.nn.Linear(128, 10)
 
        def forward(self, x):
            x = x.view(x.size(0), -1)
            x = self.layer_1(x)
            x = F.relu(x)
            x = self.layer_2(x)
            return x
-    
+
 2. Move the optimizer(s) and schedulers
---------------------------------------
+=======================================
 Move your optimizers to the :func:`pytorch_lightning.core.LightningModule.configure_optimizers` hook. Make sure to use the hook parameters (self in this case).
 
 .. code-block::
@@ -166,9 +201,9 @@ Move your optimizers to :func:`pytorch_lightning.core.LightningModule.configure_
 
     class LitModel(pl.LightningModule):
 
        def configure_optimizers(self):
            optimizer = torch.optim.Adam(self.parameters(), lr=1e-3)
            return optimizer
-    
+
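The hook above returns a single optimizer, but Lightning also accepts multiple optimizers and learning-rate schedulers, returned as a pair of lists, which is useful for models like GANs. A minimal sketch (the ``generator``/``discriminator`` attributes are illustrative assumptions, not something defined in this patch):

.. code-block:: python

    def configure_optimizers(self):
        # one optimizer per sub-network, plus a scheduler for the generator;
        # Lightning accepts an (optimizers, schedulers) pair of lists
        opt_g = torch.optim.Adam(self.generator.parameters(), lr=2e-4)
        opt_d = torch.optim.Adam(self.discriminator.parameters(), lr=2e-4)
        sched_g = torch.optim.lr_scheduler.StepLR(opt_g, step_size=10, gamma=0.5)
        return [opt_g, opt_d], [sched_g]
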
 3. Find the train loop "meat"
------------------------------
+=============================
 Lightning automates most of the training for you (the epoch and batch iterations); all you need to keep is the training step logic. This should go into the :func:`pytorch_lightning.core.LightningModule.training_step` hook (make sure to use the hook parameters, self in this case):
 
 .. code-block::
 
     class LitModel(pl.LightningModule):
 
        def training_step(self, batch, batch_idx):
            x, y = batch
            y_hat = self(x)
            loss = F.cross_entropy(y_hat, y)
            return loss
 
@@ -182,7 +217,7 @@ Lightning automates most of the training for you, the epoch and batch iterations,
 4. Find the val loop "meat"
---------------------------
+===========================
 To add an (optional) validation loop, add logic to the :func:`pytorch_lightning.core.LightningModule.validation_step` hook (make sure to use the hook parameters, self in this case).
 
 .. testcode::
 
     class LitModel(pl.LightningModule):
 
        def validation_step(self, batch, batch_idx):
            x, y = batch
            y_hat = self(x)
            val_loss = F.cross_entropy(y_hat, y)
            return val_loss
 
@@ -196,9 +231,9 @@ To add an (optional) validation loop add logic to :func:`pytorch_lightning.core.
 .. note:: model.eval() and torch.no_grad() are called automatically for validation
 
 5. Find the test loop "meat"
----------------------------
+============================
 To add an (optional) test loop, add logic to the :func:`pytorch_lightning.core.LightningModule.test_step` hook (make sure to use the hook parameters, self in this case).
 
 .. code-block::
@@ -222,11 +257,12 @@ The test loop will not be used until you call.
 
 .. note:: .test() loads the best checkpoint automatically
 
 6. Remove any .cuda() or .to(device) calls
-------------------------------------------
+==========================================
 Your :class:`~pytorch_lightning.core.LightningModule` can automatically run on any hardware!
 
 Optional features
 =================
+
 1. Wrap loss in a TrainResult/EvalResult
 ----------------------------------------
 Instead of returning the loss, you can also use :class:`~pytorch_lightning.core.step_result.TrainResult` and :class:`~pytorch_lightning.core.step_result.EvalResult`, plain Dict objects that give you options for logging on every step and/or at the end of the epoch.
@@ -305,45 +341,84 @@ And the lightning equivalent
 
     all_val_losses = validation_step_outputs.val_loss
    all_predictions = validation_step_outputs.predictions
 
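As a concrete illustration of the Result objects described above, a training/validation pair might look like this (an editor's sketch of the 0.9-era API, not a snippet from the patch):

.. code-block:: python

    def training_step(self, batch, batch_idx):
        x, y = batch
        loss = F.cross_entropy(self(x), y)
        # minimize=... tells Lightning which tensor to backprop on
        result = pl.TrainResult(minimize=loss)
        # log on every step and also aggregated per epoch
        result.log('train_loss', loss, on_step=True, on_epoch=True)
        return result

    def validation_step(self, batch, batch_idx):
        x, y = batch
        val_loss = F.cross_entropy(self(x), y)
        # checkpoint_on=... tells the checkpoint callback which value to monitor
        result = pl.EvalResult(checkpoint_on=val_loss)
        result.log('val_loss', val_loss)
        return result
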
----------
+Datamodules
+===========
+DataLoader and data processing code tends to end up scattered around.
+Make your data code more reusable by organizing
+it into a :class:`~pytorch_lightning.core.datamodule.LightningDataModule`.
 
-**********************************
-Step 2: Fit with Lightning Trainer
-**********************************
 
+.. code-block:: python
+
+    class MNISTDataModule(pl.LightningDataModule):
+
+        def __init__(self, batch_size=32):
+            super().__init__()
+            self.batch_size = batch_size
+
+        # When doing distributed training, Datamodules have two optional arguments for
+        # granular control over download/prepare/splitting data:
+
+        # OPTIONAL, called only on 1 GPU/machine
+        def prepare_data(self):
+            MNIST(os.getcwd(), train=True, download=True)
+            MNIST(os.getcwd(), train=False, download=True)
+
+        # OPTIONAL, called for every GPU/machine (assigning state is OK)
+        def setup(self, stage):
+            # transforms
+            transform = transforms.Compose([
+                transforms.ToTensor(),
+                transforms.Normalize((0.1307,), (0.3081,))
+            ])
+            # split dataset
+            if stage == 'fit':
+                mnist_train = MNIST(os.getcwd(), train=True, transform=transform)
+                self.mnist_train, self.mnist_val = random_split(mnist_train, [55000, 5000])
+            if stage == 'test':
+                self.mnist_test = MNIST(os.getcwd(), train=False, transform=transform)
+
+        # return the dataloader for each split
+        def train_dataloader(self):
+            mnist_train = DataLoader(self.mnist_train, batch_size=self.batch_size)
+            return mnist_train
+
+        def val_dataloader(self):
+            mnist_val = DataLoader(self.mnist_val, batch_size=self.batch_size)
+            return mnist_val
+
+        def test_dataloader(self):
+            mnist_test = DataLoader(self.mnist_test, batch_size=self.batch_size)
+            return mnist_test
+
+:class:`~pytorch_lightning.core.datamodule.LightningDataModule` is designed to enable sharing and reusing data splits
+and transforms across different projects. It encapsulates all the steps needed to process data: downloading,
+tokenizing, processing, etc.
+
+Now you can simply pass your :class:`~pytorch_lightning.core.datamodule.LightningDataModule` to
+the :class:`~pytorch_lightning.trainer.Trainer`:
 
 .. code-block::
 
-    # dataloaders
-    dataset = MNIST(os.getcwd(), download=True, transform=transforms.ToTensor())
-    train, val = random_split(dataset, [55000, 5000])
-    train_loader = DataLoader(train)
-    val_loader = DataLoader(val)
-
     # init model
     model = LitModel()
 
-    # most basic trainer, uses good defaults (auto-tensorboard, checkpoints, logs, and more)
+    # init data
+    dm = MNISTDataModule()
+
+    # train
     trainer = pl.Trainer()
-    trainer.fit(model, train_loader, val_loader)
+    trainer.fit(model, dm)
 
-Init :class:`~pytorch_lightning.core.LightningModule`, your PyTorch dataloaders, and then the PyTorch Lightning :class:`~pytorch_lightning.trainer.Trainer`.
-The :class:`~pytorch_lightning.trainer.Trainer` will automate:
+    # test
+    trainer.test(datamodule=dm)
 
-* The epoch iteration
-* The batch iteration
-* The calling of optimizer.step()
-* :ref:`weights-loading`
-* Logging to Tensorboard (see :ref:`loggers` options)
-* :ref:`multi-gpu-training` support
-* :ref:`tpu`
-* :ref:`16-bit` support
 
-All automated code is rigorously tested and benchmarked.
-
-Check out more flags in the :ref:`trainer` docs.
+DataModules are specifically useful for building models based on data. Read more on :ref:`data-modules`.
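Because a datamodule is a plain Python object, it can also be used outside the :class:`~pytorch_lightning.trainer.Trainer`, for example to eyeball a batch (a minimal sketch built on the ``MNISTDataModule`` defined above):

.. code-block:: python

    dm = MNISTDataModule(batch_size=64)
    dm.prepare_data()   # downloads MNIST once
    dm.setup('fit')     # builds the train/val splits
    x, y = next(iter(dm.train_dataloader()))
    print(x.shape)      # expect torch.Size([64, 1, 28, 28])
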
 
+----------
+
+********************
 Using CPUs/GPUs/TPUs
-====================
+********************
 It's trivial to use CPUs, GPUs or TPUs in Lightning. There's NO NEED to change your code; simply change the :class:`~pytorch_lightning.trainer.Trainer` options.
 
 .. code-block:: python
@@ -391,90 +466,6 @@ Without changing a SINGLE line of your code, you can now do the following with t
         val_check_interval=0.25
     )
 
-************************
-Step 3: Define Your Data
-************************
-Lightning works with pure PyTorch DataLoaders
-
-.. code-block:: python
-
-    train_dataloader = DataLoader(...)
-    val_dataloader = DataLoader(...)
-    trainer.fit(model, train_dataloader, val_dataloader)
-
-Optional: DataModule
-====================
-DataLoader and data processing code tends to end up scattered around.
-Make your data code more reusable by organizing
-it into a :class:`~pytorch_lightning.core.datamodule.LightningDataModule`
-
-.. code-block:: python
-
-    class MNISTDataModule(pl.LightningDataModule):
-
-        def __init__(self, batch_size=32):
-            super().__init__()
-            self.batch_size = batch_size
-
-        # When doing distributed training, Datamodules have two optional arguments for
-        # granular control over download/prepare/splitting data:
-
-        # OPTIONAL, called only on 1 GPU/machine
-        def prepare_data(self):
-            MNIST(os.getcwd(), train=True, download=True)
-            MNIST(os.getcwd(), train=False, download=True)
-
-        # OPTIONAL, called for every GPU/machine (assigning state is OK)
-        def setup(self, stage):
-            # transforms
-            transform=transforms.Compose([
-                transforms.ToTensor(),
-                transforms.Normalize((0.1307,), (0.3081,))
-            ])
-            # split dataset
-            if stage == 'fit':
-                mnist_train = MNIST(os.getcwd(), train=True, transform=transform)
-                self.mnist_train, self.mnist_val = random_split(mnist_train, [55000, 5000])
-            if stage == 'test':
-                self.mnist_test = MNIST(os.getcwd(), train=False, transform=transform)
-
-        # return the dataloader for each split
-        def train_dataloader(self):
-            mnist_train = DataLoader(self.mnist_train, batch_size=self.batch_size)
-            return mnist_train
-
-        def val_dataloader(self):
-            mnist_val = DataLoader(self.mnist_val, batch_size=self.batch_size)
-            return mnist_val
-
-        def test_dataloader(self):
-            mnist_test = DataLoader(self.mnist_test, batch_size=self.batch_size)
-            return mnist_test
-
-:class:`~pytorch_lightning.core.datamodule.LightningDataModule` is designed to enable sharing and reusing data splits
-and transforms across different projects. It encapsulates all the steps needed to process data: downloading,
-tokenizing, processing etc.
-
-Now you can simply pass your :class:`~pytorch_lightning.core.datamodule.LightningDataModule` to
-the :class:`~pytorch_lightning.trainer.Trainer`:
-
-.. code-block::
-
-    # init model
-    model = LitModel()
-
-    # init data
-    dm = MNISTDataModule()
-
-    # train
-    trainer = pl.Trainer()
-    trainer.fit(model, dm)
-
-    # test
-    trainer.test(datamodule=dm)
-
-DataModules are specifically useful for building models based on data. Read more on :ref:`data-modules`.
-
 **********
 Learn more
 **********