From d05c68af4bdad2ec012cfd547f93524878c3233f Mon Sep 17 00:00:00 2001
From: chaton
Date: Wed, 18 Nov 2020 20:03:55 +0000
Subject: [PATCH] [Example] Add Pytorch Geometric Example (#4568)

* add example for Pytorch Geometric
* remove hydra
* add docstring
* remove description
* rename folder
* update script to not break test
* remove .lock
* add Pytorch Geometric to doc
* add docstring at the begining
* add comments
* Update pl_examples/pytorch_ecosystem/pytorch_geometric/README.md

Co-authored-by: Jirka Borovec

* Update pl_examples/pytorch_ecosystem/pytorch_geometric/README.md

Co-authored-by: Jirka Borovec

* Update pl_examples/pytorch_ecosystem/pytorch_geometric/cora_dna.py

Co-authored-by: Jirka Borovec

* add toml

Co-authored-by: Jirka Borovec
Co-authored-by: Jirka Borovec
---
 MANIFEST.in                            |   4 +-
 docs/source/index.rst                  |   1 +
 docs/source/pytorch_ecoystem.rst       |   4 +
 .../pytorch_geometric/README.md        |  38 ++
 .../pytorch_geometric/__init__.py      |   0
 .../pytorch_geometric/cora_dna.py      | 375 ++++++++++++++++++
 .../pytorch_geometric/lightning.py     |  31 ++
 .../pytorch_geometric/pyproject.toml   |  25 ++
 8 files changed, 476 insertions(+), 2 deletions(-)
 create mode 100644 docs/source/pytorch_ecoystem.rst
 create mode 100644 pl_examples/pytorch_ecosystem/pytorch_geometric/README.md
 create mode 100644 pl_examples/pytorch_ecosystem/pytorch_geometric/__init__.py
 create mode 100644 pl_examples/pytorch_ecosystem/pytorch_geometric/cora_dna.py
 create mode 100644 pl_examples/pytorch_ecosystem/pytorch_geometric/lightning.py
 create mode 100644 pl_examples/pytorch_ecosystem/pytorch_geometric/pyproject.toml

diff --git a/MANIFEST.in b/MANIFEST.in
index 4cedbd0f44e9e0..4107f885e7b794 100644
--- a/MANIFEST.in
+++ b/MANIFEST.in
@@ -24,7 +24,6 @@ include *.md
 include LICENSE
 
 exclude *.sh
-exclude *.toml
 exclude *.svg
 recursive-include pytorch_lightning *.py
 
@@ -32,7 +31,7 @@ recursive-include pytorch_lightning *.py
 include pytorch_lightning/py.typed
 
 # include examples
-recursive-include pl_examples *.py *.md *.sh *.txt
+recursive-include pl_examples *.py *.md *.sh *.txt *.toml
 
 # exclude tests from package
 recursive-exclude tests *
@@ -49,6 +48,7 @@ recursive-include docs/source/_images/general/ pl_overview* tf_* tutorial_* PTL1
 recursive-include requirements *.txt
 recursive-exclude requirements *.sh
 include requirements.txt
+include pyproject.toml
 
 # Exclude build configs
 exclude *.yml
diff --git a/docs/source/index.rst b/docs/source/index.rst
index 650c7de6b2ab00..1049a6d16a75d0 100644
--- a/docs/source/index.rst
+++ b/docs/source/index.rst
@@ -76,6 +76,7 @@ PyTorch Lightning Documentation
    :name: Examples
    :caption: Examples
 
+   pytorch_ecoystem
    community_examples
    Autoencoder
    BYOL
diff --git a/docs/source/pytorch_ecoystem.rst b/docs/source/pytorch_ecoystem.rst
new file mode 100644
index 00000000000000..1be7bb53f8b81c
--- /dev/null
+++ b/docs/source/pytorch_ecoystem.rst
@@ -0,0 +1,4 @@
+PyTorch Ecosystem Examples
+==========================
+
+- `PyTorch Geometric: deep learning on graphs and other irregular structures <https://github.com/rusty1s/pytorch_geometric>`_.
diff --git a/pl_examples/pytorch_ecosystem/pytorch_geometric/README.md b/pl_examples/pytorch_ecosystem/pytorch_geometric/README.md
new file mode 100644
index 00000000000000..5c9a42d5a8942e
--- /dev/null
+++ b/pl_examples/pytorch_ecosystem/pytorch_geometric/README.md
@@ -0,0 +1,38 @@
+# [PyTorch Geometric](https://github.com/rusty1s/pytorch_geometric) examples with Lightning
+
+## Introduction
+
+PyTorch Geometric (PyG) is a geometric deep learning extension library for PyTorch.
+It relies on lower-level libraries such as:
+
+* PyTorch Cluster: a small extension library of highly optimized graph cluster algorithms for PyTorch
+* PyTorch Sparse: a small extension library of optimized sparse matrix operations with autograd support for PyTorch
+* PyTorch Scatter: a small extension library of highly optimized sparse update (scatter and segment) operations for PyTorch
+
+## Setup
+
+```
+pyenv install 3.7.8
+pyenv local 3.7.8
+python -m venv .venv
+source .venv/bin/activate
+poetry install
+```
+
+Run the example:
+
+```
+python cora_dna.py
+```
+
+## Current examples
+
+| `DATASET` | `MODEL` | `TASK` | DATASET DESCRIPTION | MODEL DESCRIPTION |
+| :---: | :---: | :---: | :---: | :---: |
+| Cora | DNA | Node Classification | The citation network datasets "Cora", "CiteSeer" and "PubMed" from the "Revisiting Semi-Supervised Learning with Graph Embeddings" paper | The dynamic neighborhood aggregation operator from the "Just Jump: Towards Dynamic Neighborhood Aggregation in Graph Neural Networks" paper |
+
+## DATASET SIZES
+
+```
+ 16M ./cora
+```
diff --git a/pl_examples/pytorch_ecosystem/pytorch_geometric/__init__.py b/pl_examples/pytorch_ecosystem/pytorch_geometric/__init__.py
new file mode 100644
index 00000000000000..e69de29bb2d1d6
diff --git a/pl_examples/pytorch_ecosystem/pytorch_geometric/cora_dna.py b/pl_examples/pytorch_ecosystem/pytorch_geometric/cora_dna.py
new file mode 100644
index 00000000000000..e4e040ff7072ef
--- /dev/null
+++ b/pl_examples/pytorch_ecosystem/pytorch_geometric/cora_dna.py
@@ -0,0 +1,375 @@
+"""Graph Convolution Example using PyTorch Geometric
+
+This example illustrates how one could train a graph convolution model with DNAConv
+on the Cora dataset using pytorch-lightning. It also demonstrates how this
+model can easily be TorchScripted, thanks to PyTorch Geometric.
+"""
+# python imports
+import os
+import os.path as osp
+import sys
+from functools import partial
+from collections import namedtuple
+from argparse import ArgumentParser
+from typing import List, Optional, NamedTuple
+
+# third-party libraries
+import numpy as np
+from torch import nn
+import torch
+from torch import Tensor
+from torch.optim import Adam
+import torch.nn.functional as F
+
+# Lightning imports
+from pytorch_lightning import (
+    Trainer,
+    LightningDataModule,
+    LightningModule
+)
+from pytorch_lightning.metrics import Accuracy
+
+try:
+    # PyTorch Geometric imports
+    from torch_geometric.nn import DNAConv, MessagePassing
+    from torch_geometric.data import DataLoader
+    from torch_geometric.datasets import Planetoid
+    import torch_geometric.transforms as T
+    from torch_geometric.data import NeighborSampler
+    from lightning import lightning_logo, nice_print
+except Exception:
+    HAS_PYTORCH_GEOMETRIC = False
+else:
+    HAS_PYTORCH_GEOMETRIC = True
+
+
+# type aliases used to make the model jittable
+OptTensor = Optional[Tensor]
+ListTensor = List[Tensor]
+
+
+class TensorBatch(NamedTuple):
+    x: Tensor
+    edge_index: ListTensor
+    edge_attr: OptTensor
+    batch: OptTensor
+
+###################################
+#      LightningDataModule       #
+###################################
+
+
+class CoraDataset(LightningDataModule):
+
+    r"""The citation network datasets "Cora", "CiteSeer" and "PubMed" from the
+    `"Revisiting Semi-Supervised Learning with Graph Embeddings"
+    `_ paper.
+    Nodes represent documents and edges represent citation links.
+    Training, validation and test splits are given by binary masks.
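+    Cora itself has 2,708 publication nodes with 1,433 bag-of-words features each,
+    labelled with one of 7 classes.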
+    cf. https://github.com/rusty1s/pytorch_geometric/blob/master/torch_geometric/datasets/planetoid.py
+    """
+
+    NAME = "cora"
+
+    def __init__(self,
+                 num_workers: int = 1,
+                 batch_size: int = 8,
+                 drop_last: bool = True,
+                 pin_memory: bool = True,
+                 num_layers: Optional[int] = None):
+        super().__init__()
+
+        assert num_layers is not None
+
+        self._num_workers = num_workers
+        self._batch_size = batch_size
+        self._drop_last = drop_last
+        self._pin_memory = pin_memory
+        self._num_layers = num_layers
+
+        self._transform = T.NormalizeFeatures()
+
+    @property
+    def num_features(self):
+        return 1433
+
+    @property
+    def num_classes(self):
+        return 7
+
+    @property
+    def hyper_parameters(self):
+        # used to inform the model about the dataset specifications
+        return {"num_features": self.num_features, "num_classes": self.num_classes}
+
+    def prepare_data(self):
+        path = osp.join(
+            osp.dirname(osp.realpath(__file__)), "..", "..", "data", self.NAME
+        )
+        self.dataset = Planetoid(path, self.NAME, transform=self._transform)
+        self.data = self.dataset[0]
+
+    def create_neighbor_sampler(self, stage=None):
+        # https://github.com/rusty1s/pytorch_geometric/tree/master/torch_geometric/data/sampler.py#L18
+        return NeighborSampler(
+            self.data.edge_index,
+            # the nodes that should be considered for sampling
+            node_idx=getattr(self.data, f"{stage}_mask"),
+            # -1 indicates all neighbors will be selected, once per convolution layer
+            sizes=[-1] * self._num_layers,
+            batch_size=self._batch_size,
+            num_workers=self._num_workers,
+            drop_last=self._drop_last,
+            pin_memory=self._pin_memory,
+        )
+
+    def train_dataloader(self):
+        return self.create_neighbor_sampler(stage="train")
+
+    def val_dataloader(self):
+        return self.create_neighbor_sampler(stage="val")
+
+    def test_dataloader(self):
+        return self.create_neighbor_sampler(stage="test")
+
+    def gather_data_and_convert_to_namedtuple(self, batch, batch_nb):
+        """
+        Select the features of the sampled nodes and pack them, together with the
+        sampled sub-graphs, into a ``TensorBatch`` NamedTuple.
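+
+        ``NeighborSampler`` yields ``(batch_size, n_id, adjs)``: ``n_id`` holds the
+        indices of the sampled nodes and each element of ``adjs`` carries the
+        ``edge_index`` of one sampled hop.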
+        """
+        return (
+            TensorBatch(
+                self.data.x[batch[1]],
+                [e.edge_index for e in batch[2]],
+                None,
+                None,
+            ),
+            self.data.y[batch[1]],
+        )
+
+    @staticmethod
+    def add_argparse_args(parser):
+        parser.add_argument("--num_workers", type=int, default=1)
+        parser.add_argument("--batch_size", type=int, default=2)
+        parser.add_argument("--drop_last", default=True)
+        parser.add_argument("--pin_memory", default=True)
+        return parser
+
+
+###############################
+#       LightningModule       #
+###############################
+
+
+class DNAConvNet(LightningModule):
+
+    r"""The dynamic neighborhood aggregation operator from the `"Just Jump:
+    Towards Dynamic Neighborhood Aggregation in Graph Neural Networks"
+    `_ paper.
+    cf. https://github.com/rusty1s/pytorch_geometric/blob/master/torch_geometric/nn/conv/dna_conv.py#L172
+    """
+
+    def __init__(self,
+                 num_layers: int = 2,
+                 hidden_channels: int = 128,
+                 heads: int = 8,
+                 groups: int = 16,
+                 dropout: float = 0.8,
+                 cached: bool = False,
+                 num_features: Optional[int] = None,
+                 num_classes: Optional[int] = None,
+                 ):
+        super().__init__()
+
+        assert num_features is not None
+        assert num_classes is not None
+
+        # Lightning utility to save all __init__ arguments into self.hparams
+        self.save_hyperparameters()
+        hparams = self.hparams
+
+        # Instantiate metrics
+        self.val_acc = Accuracy(hparams["num_classes"])
+        self.test_acc = Accuracy(hparams["num_classes"])
+
+        # Define the DNA graph convolution model
+        self.hidden_channels = hparams["hidden_channels"]
+        self.lin1 = nn.Linear(hparams["num_features"], hparams["hidden_channels"])
+
+        # Create a ModuleList to hold all convolutions
+        self.convs = nn.ModuleList()
+
+        # Iterate through the number of layers
+        for _ in range(hparams["num_layers"]):
+
+            # Create a DNA convolution - this graph convolution relies on a multi-head
+            # attention mechanism to route information, similar to Transformers.
+            # https://github.com/rusty1s/pytorch_geometric/blob/master/torch_geometric/nn/conv/dna_conv.py#L172
+            self.convs.append(
+                DNAConv(
+                    hparams["hidden_channels"],
+                    hparams["heads"],
+                    hparams["groups"],
+                    dropout=hparams["dropout"],
+                    # caching is kept off because the sampled sub-graph changes at every step
+                    cached=False,
+                )
+            )
+        # classification MLP
+        self.lin2 = nn.Linear(hparams["hidden_channels"], hparams["num_classes"], bias=False)
+
+    def forward(self, batch: TensorBatch):
+        # batch needs to be typed to make this model jittable.
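+        # TorchScript needs a concrete type for every attribute accessed below; the
+        # `TensorBatch` NamedTuple annotations (Tensor, List[Tensor], Optional[Tensor])
+        # provide them, which is what lets `to_torchscript(method='script')` at the
+        # end of this example compile the forward pass.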
+        x = batch.x
+        x = F.relu(self.lin1(x))
+        x = F.dropout(x, p=0.5, training=self.training)
+        x_all = x.view(-1, 1, self.hidden_channels)
+
+        # iterate over all convolutions
+        for idx, conv in enumerate(self.convs):
+            # perform the convolution on the previously concatenated embeddings,
+            # routed through this hop's edge_index
+            x = F.relu(conv(x_all, batch.edge_index[idx]))
+            x = x.view(-1, 1, self.hidden_channels)
+
+            # concatenate with the previously computed embeddings
+            x_all = torch.cat([x_all, x], dim=1)
+
+        # extract the latest layer embedding
+        x = x_all[:, -1]
+
+        x = F.dropout(x, p=0.5, training=self.training)
+
+        # return per-node log-probabilities
+        return F.log_softmax(self.lin2(x), -1)
+
+    def step(self, batch, batch_nb):
+        typed_batch, targets = self.gather_data_and_convert_to_namedtuple(batch, batch_nb)
+        logits = self(typed_batch)
+        return logits, targets
+
+    def training_step(self, batch, batch_nb):
+        logits, targets = self.step(batch, batch_nb)
+        train_loss = F.nll_loss(logits, targets)
+        self.log("train_loss", train_loss, on_step=True, on_epoch=True, prog_bar=True)
+        return train_loss
+
+    def validation_step(self, batch, batch_nb):
+        logits, targets = self.step(batch, batch_nb)
+        val_loss = F.nll_loss(logits, targets)
+        self.log("val_loss", val_loss, on_step=False, on_epoch=True, prog_bar=True)
+        self.log("val_acc", self.val_acc(logits, targets), on_step=False, on_epoch=True, prog_bar=True)
+
+    def test_step(self, batch, batch_nb):
+        logits, targets = self.step(batch, batch_nb)
+        test_loss = F.nll_loss(logits, targets)
+        self.log("test_loss", test_loss, on_step=False, on_epoch=True, prog_bar=True)
+        self.log("test_acc", self.test_acc(logits, targets), on_step=False, on_epoch=True, prog_bar=True)
+
+    # Used for the jittable demonstration.
+
+    def _convert_to_jittable(self, module):
+        for key, m in module._modules.items():
+            if isinstance(m, MessagePassing) and m.jittable is not None:
+                # PyTorch Geometric's MessagePassing implements a `.jittable` function
+                # which converts the current module into its jittable version.
+                module._modules[key] = m.jittable()
+            else:
+                self._convert_to_jittable(m)
+        return module
+
+    def jittable(self):
+        for key, m in self._modules.items():
+            self._modules[key] = self._convert_to_jittable(m)
+
+    def configure_optimizers(self):
+        return Adam(self.parameters(), lr=1e-3)
+
+    @staticmethod
+    def add_argparse_args(parser):
+        parser.add_argument("--num_layers", type=int, default=2)
+        parser.add_argument("--hidden_channels", type=int, default=128)
+        parser.add_argument("--heads", type=int, default=8)
+        parser.add_argument("--groups", type=int, default=16)
+        parser.add_argument("--dropout", type=float, default=0.8)
+        parser.add_argument("--cached", type=int, default=0)
+        parser.add_argument("--jit", default=True)
+        return parser
+
+#################################
+#     Instantiate Functions     #
+#################################
+
+
+def instantiate_datamodule(args):
+    datamodule = CoraDataset(
+        num_workers=args.num_workers,
+        batch_size=args.batch_size,
+        drop_last=args.drop_last,
+        pin_memory=args.pin_memory,
+        num_layers=args.num_layers,
+    )
+    return datamodule
+
+
+def instantiate_model(args, datamodule):
+    model = DNAConvNet(
+        num_layers=args.num_layers,
+        hidden_channels=args.hidden_channels,
+        heads=args.heads,
+        groups=args.groups,
+        dropout=args.dropout,
+        # provide dataset-specific arguments
+        **datamodule.hyper_parameters,
+    )
+    if args.jit:
+        model.jittable()
+
+    # Attach the datamodule's batch-conversion function to the model
+    model.gather_data_and_convert_to_namedtuple = datamodule.gather_data_and_convert_to_namedtuple
+    return model
+
+
+def get_single_batch(datamodule):
+    for batch in datamodule.test_dataloader():
+        return datamodule.gather_data_and_convert_to_namedtuple(batch, 0)
+
+#######################
+#      Trainer Run    #
+#######################
+
+
+def run(args):
+
+    nice_print("You are about to train a TorchScripted PyTorch Geometric Lightning model!")
+    nice_print(lightning_logo)
+
+    datamodule: LightningDataModule = instantiate_datamodule(args)
+    model: LightningModule = instantiate_model(args, datamodule)
+    trainer = Trainer.from_argparse_args(args)
+    trainer.fit(model, datamodule=datamodule)
+    trainer.test()
+
+    batch = get_single_batch(datamodule)
+    # with method='script' the model is compiled from its type annotations;
+    # example_inputs would only be used with method='trace'
+    model.to_torchscript(file_path="model_trace.pt",
+                         method='script',
+                         example_inputs=batch)
+
+    nice_print("Congratulations!")
+    nice_print("You trained your first TorchScripted PyTorch Geometric Lightning model!", last=True)
+
+
+if __name__ == "__main__":
+    if not HAS_PYTORCH_GEOMETRIC:
+        print("Skip training. PyTorch Geometric isn't installed. Please check README.md.")
+
+    else:
+        parser = ArgumentParser(description="PyTorch Geometric Example")
+        parser = Trainer.add_argparse_args(parser)
+        parser = CoraDataset.add_argparse_args(parser)
+        parser = DNAConvNet.add_argparse_args(parser)
+
+        # parse a fixed command line (a single epoch) so the example stays fast
+        # enough to double as a smoke test
+        cmd_line = '--max_epochs 1'.split(' ')
+
+        run(parser.parse_args(cmd_line))
diff --git a/pl_examples/pytorch_ecosystem/pytorch_geometric/lightning.py b/pl_examples/pytorch_ecosystem/pytorch_geometric/lightning.py
new file mode 100644
index 00000000000000..2c765d1449c57f
--- /dev/null
+++ b/pl_examples/pytorch_ecosystem/pytorch_geometric/lightning.py
@@ -0,0 +1,31 @@
+def nice_print(msg, last=False):
+    print()
+    print("\033[0;35m" + msg + "\033[0m")
+    if last:
+        print()
+
+
+lightning_logo = """
+ ####
+ ###########
+ ####################
+ ############################
+ #####################################
+##############################################
+######################### ###################
+#######################   ###################
+####################      ####################
+##################       #####################
+################        ######################
+#####################        #################
+######################     ###################
+#####################     #####################
+####################    #######################
+###################   #########################
+##############################################
+ #####################################
+ ############################
+ ####################
+ ##########
+ ####
+"""
diff --git a/pl_examples/pytorch_ecosystem/pytorch_geometric/pyproject.toml b/pl_examples/pytorch_ecosystem/pytorch_geometric/pyproject.toml
new file mode 100644
index 00000000000000..99f516323e9769
--- /dev/null
+++ b/pl_examples/pytorch_ecosystem/pytorch_geometric/pyproject.toml
@@ -0,0 +1,25 @@
+[tool.poetry]
+name = "lightning-geometric"
+version = "0.1.0"
+description = "TorchScripted PyTorch Geometric Examples with PyTorch Lightning"
+authors = ["Thomas Chaton "]
+
+[tool.poetry.dependencies]
+python = "3.7.8"
+torch = "^1.6.0"
+torch-cluster = "^1.5.7"
+torch-sparse = "^0.6.7"
+torch-scatter = "^2.0.5"
+torch-geometric = "^1.6.1"
+pytorch-lightning = "^1.0.5"
+openmesh = "^1.1.4"
+torch-spline-conv = "^1.2.0"
+tqdm = "^4.50.0"
+pytest = "^6.1.0"
+
+[tool.poetry.dev-dependencies]
+black = {version = "^20.8b1", allow-prereleases = true}
+
+[build-system]
+requires = ["poetry>=0.12"]
+build-backend = "poetry.masonry.api"
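
Beyond the patch itself, the `model_trace.pt` file that `cora_dna.py` writes can be reloaded without Lightning. A minimal sketch, assuming the example has already been run from this directory; the commented-out call reuses the `get_single_batch` helper from `cora_dna.py` purely for illustration:

```python
import torch

# Load the TorchScript module exported by cora_dna.py via `to_torchscript`.
scripted_model = torch.jit.load("model_trace.pt")
scripted_model.eval()

# `inputs` must be shaped like the TensorBatch NamedTuple the model was scripted with,
# e.g. the first element of the pair returned by get_single_batch(datamodule).
# with torch.no_grad():
#     log_probs = scripted_model(inputs)
```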