diff --git a/learn2learn/algorithms/lightning/lightning_episodic_module.py b/learn2learn/algorithms/lightning/lightning_episodic_module.py
index 2b4d4d01..1d33226b 100644
--- a/learn2learn/algorithms/lightning/lightning_episodic_module.py
+++ b/learn2learn/algorithms/lightning/lightning_episodic_module.py
@@ -5,6 +5,7 @@
 try:
     from pytorch_lightning import LightningModule
+    from pytorch_lightning.trainer.states import TrainerFn
 except ImportError:
     from learn2learn.utils import _ImportRaiser
diff --git a/learn2learn/algorithms/lightning/lightning_protonet.py b/learn2learn/algorithms/lightning/lightning_protonet.py
index 6041ab64..20bbb52c 100644
--- a/learn2learn/algorithms/lightning/lightning_protonet.py
+++ b/learn2learn/algorithms/lightning/lightning_protonet.py
@@ -4,7 +4,7 @@
 """
 import numpy as np
 import torch
-
+from typing import Any
 from torch import nn
 from learn2learn.utils import accuracy
 from learn2learn.nn import PrototypicalClassifier
@@ -139,3 +139,7 @@ def meta_learn(self, batch, batch_idx, ways, shots, queries):
         eval_loss = self.loss(logits, query_labels)
         eval_accuracy = accuracy(logits, query_labels)
         return eval_loss, eval_accuracy
+
+    def predict_step(self, batch: Any, batch_idx: int, dataloader_idx: int = 0):
+        embeddings = self.features(batch)
+        return self.classifier(embeddings)
diff --git a/learn2learn/utils/lightning.py b/learn2learn/utils/lightning.py
index 19be43e4..cd6a3b5c 100644
--- a/learn2learn/utils/lightning.py
+++ b/learn2learn/utils/lightning.py
@@ -3,17 +3,152 @@
 """
 Some utilities to interface with PyTorch Lightning.
 """
-
+from typing import Optional, Callable
+import learn2learn as l2l
 import pytorch_lightning as pl
+from torch.utils.data._utils.worker import get_worker_info
+from torch.utils.data._utils.collate import default_collate
+from torch.utils.data import IterableDataset, Dataset
 import sys
 import tqdm


-class EpisodicBatcher(pl.LightningDataModule):
+class Epochifier(Dataset):
+    def __init__(self, tasks, length):
+        self.tasks = tasks
+        self.length = length
+
+    def __getitem__(self, *args, **kwargs):
+        return self.tasks.sample()
+
+    def __len__(self):
+        return self.length
+

-    """
-    nc
-    """
+class TaskDataParallel(IterableDataset):
+
+    def __init__(
+        self,
+        tasks: l2l.data.TaskDataset,
+        epoch_length: int,
+        devices: int = 1,
+        collate_fn: Optional[Callable] = default_collate
+    ):
+        """
+        This class is used to sample `epoch_length` tasks to represent an epoch.
+
+        It should be used when training with DataParallel.
+
+        Args:
+            tasks: TaskDataset from which to sample tasks.
+            epoch_length: The expected epoch length. This must be divisible by `devices`.
+            devices: Number of devices being used.
+            collate_fn: The collate function applied to the list of sampled tasks.
+
+        """
+        self.tasks = tasks
+        self.epoch_length = epoch_length
+        self.devices = devices
+
+        if epoch_length % devices != 0:
+            raise Exception("The `epoch_length` should be divisible by the number of `devices`.")
+
+        self.collate_fn = collate_fn
+        self.counter = 0
+
+    def __iter__(self) -> 'TaskDataParallel':
+        self.counter = 0
+        return self
+
+    def __next__(self):
+        if self.counter >= len(self):
+            raise StopIteration
+        self.counter += self.devices
+        tasks = []
+        for _ in range(self.devices):
+            for item in self.tasks.sample():
+                tasks.append(item)
+        if self.collate_fn:
+            tasks = self.collate_fn(tasks)
+        return tasks
+
+    def __len__(self):
+        return self.epoch_length
+
+
+class TaskDistributedDataParallel(IterableDataset):
+
+    def __init__(
+        self,
+        taskset: l2l.data.TaskDataset,
+        global_rank: int,
+        world_size: int,
+        num_workers: int,
+        epoch_length: int,
+        seed: int,
+        requires_divisible: bool = True,
+    ):
+        """
+        This class is used to sample tasks in a distributed setting such as DDP with multiple workers.
+
+        Note: This won't work as expected if `num_workers = 0` and several dataloaders are being iterated on at the same time.
+
+        Args:
+            taskset: TaskDataset from which to sample tasks.
+            global_rank: Rank of the current process.
+            world_size: Total number of processes.
+            num_workers: Number of workers to be provided to the DataLoader.
+            epoch_length: The expected epoch length. This must be divisible by (num_workers * world_size).
+            seed: The seed used on each `__iter__` call; it should be the same for all processes.
+            requires_divisible: Whether to raise an error when `epoch_length` is not divisible by (num_workers * world_size).
+
+        """
+        self.taskset = taskset
+        self.global_rank = global_rank
+        self.world_size = world_size
+        self.num_workers = 1 if num_workers == 0 else num_workers
+        self.worker_world_size = self.world_size * self.num_workers
+        self.epoch_length = epoch_length
+        self.seed = seed
+        self.iteration = 0
+        self.requires_divisible = requires_divisible
+        self.counter = 0
+
+        if requires_divisible and epoch_length % self.worker_world_size != 0:
+            raise Exception("The `epoch_length` should be divisible by (num_workers * world_size).")
+
+    def __len__(self) -> int:
+        return self.epoch_length // self.world_size
+
+    @property
+    def worker_id(self) -> int:
+        worker_info = get_worker_info()
+        return worker_info.id if worker_info else 0
+
+    @property
+    def worker_rank(self) -> int:
+        is_global_zero = self.global_rank == 0
+        return self.global_rank + self.worker_id + int(not is_global_zero and self.num_workers > 1)
+
+    def __iter__(self):
+        self.iteration += 1
+        self.counter = 0
+        pl.seed_everything(self.seed + self.iteration)
+        return self
+
+    def __next__(self):
+        if self.counter >= len(self):
+            raise StopIteration
+        task_descriptions = []
+        for _ in range(self.worker_world_size):
+            task_descriptions.append(self.taskset.sample_task_description())
+
+        data = self.taskset.get_task(task_descriptions[self.worker_rank])
+        self.counter += 1
+        return data
+
+
+class EpisodicBatcher(pl.LightningDataModule):

     def __init__(
         self,
@@ -32,38 +167,24 @@ def __init__(
         self.test_tasks = test_tasks
         self.epoch_length = epoch_length

-    @staticmethod
-    def epochify(taskset, epoch_length):
-        class Epochifier(object):
-            def __init__(self, tasks, length):
-                self.tasks = tasks
-                self.length = length
-
-            def __getitem__(self, *args, **kwargs):
-                return self.tasks.sample()
-
-            def __len__(self):
-                return self.length
-
-        return Epochifier(taskset, epoch_length)
-
     def train_dataloader(self):
-        return EpisodicBatcher.epochify(
+        # TODO: Update the logic to use `TaskDataParallel` and `TaskDistributedDataParallel`
+        # alongside a DataLoader.
+        return Epochifier(
             self.train_tasks,
             self.epoch_length,
         )

     def val_dataloader(self):
-        return EpisodicBatcher.epochify(
+        return Epochifier(
             self.validation_tasks,
             self.epoch_length,
         )

     def test_dataloader(self):
-        length = self.epoch_length
-        return EpisodicBatcher.epochify(
+        return Epochifier(
             self.test_tasks,
-            length,
+            self.epoch_length,
         )
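Usage sketch (illustrative, not part of the patch): wrapping the new `TaskDistributedDataParallel` in a `DataLoader` for a DDP run. The task set, rank, world size, and hyper-parameter values below are assumptions.

# Minimal sketch, assuming `train_tasks` is an existing l2l.data.TaskDataset
# and that this code runs inside one DDP process whose rank is known.
from torch.utils.data import DataLoader
from learn2learn.utils.lightning import TaskDistributedDataParallel

dataset = TaskDistributedDataParallel(
    taskset=train_tasks,     # assumed: an l2l.data.TaskDataset built elsewhere
    global_rank=0,           # in practice, e.g. trainer.global_rank
    world_size=2,            # total number of DDP processes
    num_workers=4,
    epoch_length=1024,       # divisible by world_size * num_workers
    seed=42,                 # same value on every process keeps ranks in sync
)
# batch_size=None: each __next__ already yields one fully formed task,
# so the DataLoader should not re-batch it.
loader = DataLoader(dataset, batch_size=None, num_workers=4)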
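Similarly, a sketch of how the new `predict_step` could be exercised through Lightning's predict loop; the module and dataloader setup are assumptions, and it presumes the module's `classifier` attribute has already been fitted on a support set.

# Minimal sketch, assuming `model` is a learn2learn LightningPrototypicalNetworks
# instance whose `classifier` was already built from a support set, and
# `query_loader` yields raw query batches (inputs only).
import pytorch_lightning as pl

trainer = pl.Trainer(accelerator="cpu", devices=1)
# predict_step embeds each batch with model.features and scores it with
# model.classifier, returning one tensor of logits per batch.
predictions = trainer.predict(model, dataloaders=query_loader)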