From f2fc8a27e12939ff6e8ebca60b2c7842b895325e Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Mon, 13 Dec 2021 19:41:17 +0000
Subject: [PATCH 01/15] deepmilpanda completed

---
 .../datasets/panda_tiles_dataset.py           |   6 +-
 InnerEye/ML/Histopathology/models/deepmil.py  |   8 +-
 InnerEye/ML/Histopathology/utils/naming.py    |   3 +
 .../classification/DeepSMILEPanda.py          | 114 ++++++++++++++++++
 .../ML/histopathology/models/test_deepmil.py  |  24 ++--
 5 files changed, 142 insertions(+), 13 deletions(-)
 create mode 100644 InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py

diff --git a/InnerEye/ML/Histopathology/datasets/panda_tiles_dataset.py b/InnerEye/ML/Histopathology/datasets/panda_tiles_dataset.py
index 43520a8c9..30097896b 100644
--- a/InnerEye/ML/Histopathology/datasets/panda_tiles_dataset.py
+++ b/InnerEye/ML/Histopathology/datasets/panda_tiles_dataset.py
@@ -30,10 +30,10 @@ class PandaTilesDataset(TilesDataset):
     SPLIT_COLUMN = None  # PANDA does not have an official train/test split
     N_CLASSES = 6
 
-    _RELATIVE_ROOT_FOLDER = "PANDA_tiles_20210926-135446/panda_tiles_level1_224"
+    _RELATIVE_ROOT_FOLDER = Path("PANDA_tiles_20210926-135446/panda_tiles_level1_224")
 
     def __init__(self,
-                 root: Union[str, Path],
+                 root: Path,
                  dataset_csv: Optional[Union[str, Path]] = None,
                  dataset_df: Optional[pd.DataFrame] = None) -> None:
         super().__init__(root=Path(root) / self._RELATIVE_ROOT_FOLDER,
@@ -48,7 +48,7 @@ class PandaTilesDatasetReturnImageLabel(VisionDataset):
     class label.
     """
     def __init__(self,
-                 root: Union[str, Path],
+                 root: Path,
                  dataset_csv: Optional[Union[str, Path]] = None,
                  dataset_df: Optional[pd.DataFrame] = None,
                  transform: Optional[Callable] = None,
diff --git a/InnerEye/ML/Histopathology/models/deepmil.py b/InnerEye/ML/Histopathology/models/deepmil.py
index c9af8c08d..757364660 100644
--- a/InnerEye/ML/Histopathology/models/deepmil.py
+++ b/InnerEye/ML/Histopathology/models/deepmil.py
@@ -166,7 +166,7 @@ def _shared_step(self, batch: Dict, batch_idx: int, stage: str) -> Dict[ResultsK
         bag_labels_list = []
         bag_logits_list = []
         bag_attn_list = []
-        for bag_idx in range(len(batch[TilesDataset.LABEL_COLUMN])):
+        for bag_idx in range(len(batch[self.label_column])):
             images = batch[TilesDataset.IMAGE_COLUMN][bag_idx]
             labels = batch[self.label_column][bag_idx]
             bag_labels_list.append(self.get_bag_label(labels))
@@ -177,7 +177,7 @@ def _shared_step(self, batch: Dict, batch_idx: int, stage: str) -> Dict[ResultsK
         bag_labels = torch.stack(bag_labels_list).view(-1)
 
         if self.n_classes > 1:
-            loss = self.loss_fn(bag_logits, bag_labels)
+            loss = self.loss_fn(bag_logits, bag_labels.long())
         else:
             loss = self.loss_fn(bag_logits.squeeze(1), bag_labels.float())
 
@@ -201,6 +201,10 @@ def _shared_step(self, batch: Dict, batch_idx: int, stage: str) -> Dict[ResultsK
                         ResultsKey.PROB: probs, ResultsKey.PRED_LABEL: preds,
                         ResultsKey.TRUE_LABEL: bag_labels, ResultsKey.BAG_ATTN: bag_attn_list,
                         ResultsKey.IMAGE: batch[TilesDataset.IMAGE_COLUMN]})
+        if (TilesDataset.TILE_X_COLUMN in batch.keys()) and (TilesDataset.TILE_Y_COLUMN in batch.keys()):
+            results.update({ResultsKey.TILE_X: batch[TilesDataset.TILE_X_COLUMN],
+                            ResultsKey.TILE_Y: batch[TilesDataset.TILE_Y_COLUMN]}
+                           )
         return results
 
     def training_step(self, batch: Dict, batch_idx: int) -> Tensor:  # type: ignore
diff --git a/InnerEye/ML/Histopathology/utils/naming.py b/InnerEye/ML/Histopathology/utils/naming.py
index 32d46d54d..1af40015b 100644
--- a/InnerEye/ML/Histopathology/utils/naming.py
+++ b/InnerEye/ML/Histopathology/utils/naming.py
@@ -15,3 +15,6 @@ class ResultsKey(str, Enum):
     PRED_LABEL = 'pred_label'
     TRUE_LABEL = 'true_label'
     BAG_ATTN = 'bag_attn'
+    TILE_X = "x"
+    TILE_Y = "y"
+
diff --git a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
new file mode 100644
index 000000000..c68a2bc18
--- /dev/null
+++ b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
@@ -0,0 +1,114 @@
+#  ------------------------------------------------------------------------------------------
+#  Copyright (c) Microsoft Corporation. All rights reserved.
+#  Licensed under the MIT License (MIT). See LICENSE in the repo root for license information.
+#  ------------------------------------------------------------------------------------------
+
+from typing import Any, Dict
+from pathlib import Path
+import os
+from monai.transforms import Compose
+from pytorch_lightning.callbacks.model_checkpoint import ModelCheckpoint
+from InnerEyePrivate.Common import fixed_paths
+from InnerEye.ML.Histopathology.datamodules.panda_module import PandaTilesDataModule
+from InnerEye.Azure.azure_util import get_default_azure_config_json_path
+from InnerEye.ML.Histopathology.datasets.panda_tiles_dataset import PandaTilesDataset
+from health_ml.networks.layers.attention_layers import GatedAttentionLayer
+from InnerEye.ML.Histopathology.models.transforms import EncodeTilesBatchd, LoadTilesBatchd
+from InnerEye.ML.Histopathology.models.encoders import (HistoSSLEncoder, ImageNetEncoder,
+                                                        ImageNetSimCLREncoder, InnerEyeSSLEncoder)
+from InnerEye.ML.configs.histo_configs.classification.BaseMIL import BaseMIL
+from health_azure.utils import CheckpointDownloader
+class DeepSMILEPanda(BaseMIL):
+    def __init__(self, **kwargs: Any) -> None:
+        default_kwargs = dict(
+            # declared in BaseMIL:
+            pooling_type=GatedAttentionLayer.__name__,
+            # declared in DatasetParams:
+            local_dataset=Path("/tmp/datasets/PANDA_tiles"),
+            # azure_dataset_id="PANDA_tiles",
+            # To mount the dataset instead of downloading in AML, pass --use_dataset_mount in the CLI
+            # declared in TrainerParams:
+            num_epochs=200,
+            recovery_checkpoint_save_interval=10,
+            recovery_checkpoints_save_last_k=-1,
+            # declared in WorkflowParams:
+            number_of_cross_validation_splits=5,
+            cross_validation_split_index=0,
+            # declared in OptimizerParams:
+            l_rate=5e-4,
+            weight_decay=1e-4,
+            adam_betas=(0.9, 0.99),
+        )
+        default_kwargs.update(kwargs)
+        super().__init__(**default_kwargs)
+        super().__init__(**default_kwargs)
+        self.best_checkpoint_filename = "checkpoint_max_val_auroc"
+        self.best_checkpoint_filename_with_suffix = self.best_checkpoint_filename + ".ckpt"
+        self.checkpoint_folder_path = "outputs/checkpoints/"
+        best_checkpoint_callback = ModelCheckpoint(dirpath=self.checkpoint_folder_path,
+                                                   monitor='val/accuracy',
+                                                   filename=self.best_checkpoint_filename,
+                                                   auto_insert_metric_name=False,
+                                                   mode='max')
+        self.callbacks = best_checkpoint_callback
+
+    @property
+    def cache_dir(self) -> Path:
+        return Path(f"/tmp/innereye_cache/{self.__class__.__name__}-{self.encoder_type}/")
+
+    def setup(self) -> None:
+        if self.encoder_type == InnerEyeSSLEncoder.__name__:
+            self.downloader = CheckpointDownloader(
+                azure_config_json_path=get_default_azure_config_json_path(),
+                run_recovery_id="hsharma_panda_explore:hsharma_panda_explore_1638437076_357167ae",
+                checkpoint_filename="last.ckpt",
+                download_dir='outputs/'
+            )
+            os.chdir(fixed_paths.repository_root_directory())
+            self.downloader.download_checkpoint_if_necessary()
+        self.encoder = self.get_encoder()
+        self.encoder.cuda()
+        self.encoder.eval()
+
+    def get_data_module(self) -> PandaTilesDataModule:
+        image_key = PandaTilesDataset.IMAGE_COLUMN
+        transform = Compose([LoadTilesBatchd(image_key, progress=True),
+                             EncodeTilesBatchd(image_key, self.encoder)])
+        return PandaTilesDataModule(root_path=self.local_dataset,
+                                    max_bag_size=self.max_bag_size,
+                                    batch_size=self.batch_size,
+                                    transform=transform,
+                                    cache_mode=self.cache_mode,
+                                    save_precache=self.save_precache,
+                                    cache_dir=self.cache_dir,
+                                    number_of_cross_validation_splits=self.number_of_cross_validation_splits,
+                                    cross_validation_split_index=self.cross_validation_split_index)
+
+    def get_trainer_arguments(self) -> Dict[str, Any]:
+        # These arguments will be passed through to the Lightning trainer.
+        return {"callbacks": self.callbacks}
+
+    def get_path_to_best_checkpoint(self) -> Path:
+        """
+        Returns the full path to a checkpoint file that was found to be best during training, whatever criterion
+        was applied there.
+        """
+        # absolute path is required for registering the model.
+        return fixed_paths.repository_root_directory() / self.checkpoint_folder_path / self.best_checkpoint_filename_with_suffix
+
+class PandaImageNetMIL(DeepSMILEPanda):
+    def __init__(self, **kwargs: Any) -> None:
+        super().__init__(encoder_type=ImageNetEncoder.__name__, **kwargs)
+
+class PandaImageNetSimCLRMIL(DeepSMILEPanda):
+    def __init__(self, **kwargs: Any) -> None:
+        super().__init__(encoder_type=ImageNetSimCLREncoder.__name__, **kwargs)
+
+class PandaInnerEyeSSLMIL(DeepSMILEPanda):
+    def __init__(self, **kwargs: Any) -> None:
+        super().__init__(encoder_type=InnerEyeSSLEncoder.__name__, **kwargs)
+
+class PandaHistoSSLMIL(DeepSMILEPanda):
+    def __init__(self, **kwargs: Any) -> None:
+        super().__init__(encoder_type=HistoSSLEncoder.__name__, **kwargs)
+
diff --git a/Tests/ML/histopathology/models/test_deepmil.py b/Tests/ML/histopathology/models/test_deepmil.py
index 60df2f759..6b50bf3b2 100644
--- a/Tests/ML/histopathology/models/test_deepmil.py
+++ b/Tests/ML/histopathology/models/test_deepmil.py
@@ -4,7 +4,7 @@
 #  ------------------------------------------------------------------------------------------
 
 import os
-from typing import Callable, Dict, List
+from typing import Callable, Dict, List, Type
 
 import pytest
 from torch import Tensor, argmax, nn, rand, randint, randn, round, stack, allclose
@@ -12,9 +12,11 @@
 
 from health_ml.networks.layers.attention_layers import AttentionLayer, GatedAttentionLayer
 
-from InnerEye.ML.configs.histo_configs.classification.DeepSMILECrck import DeepSMILECrck
+from InnerEye.ML.lightning_container import LightningContainer
+from InnerEye.ML.configs.histo_configs.classification.DeepSMILECrck import TcgaCrckImageNetMIL
+from InnerEye.ML.configs.histo_configs.classification.DeepSMILEPanda import PandaImageNetMIL
 from InnerEye.ML.Histopathology.datamodules.base_module import TilesDataModule
-from InnerEye.ML.Histopathology.datasets.default_paths import TCGA_CRCK_DATASET_DIR
+from InnerEye.ML.Histopathology.datasets.default_paths import TCGA_CRCK_DATASET_DIR, PANDA_TILES_DATASET_DIR
 from InnerEye.ML.Histopathology.models.deepmil import DeepMILModule
 from InnerEye.ML.Histopathology.models.encoders import ImageNetEncoder, TileEncoder
 from InnerEye.ML.Histopathology.utils.naming import ResultsKey
@@ -103,15 +105,21 @@ def move_batch_to_expected_device(batch: Dict[str, List], use_gpu: bool) -> Dict
             for key, values in batch.items()}
 
 
+CONTAINER_DATASET_DIR = {
+    PandaImageNetMIL: PANDA_TILES_DATASET_DIR,
+    TcgaCrckImageNetMIL: TCGA_CRCK_DATASET_DIR,
+}
+
+
+@pytest.mark.parametrize("container_type", [PandaImageNetMIL,
+                                            TcgaCrckImageNetMIL])
 @pytest.mark.parametrize("use_gpu", [True, False])
-def test_container(use_gpu: bool) -> None:
-    container_type = DeepSMILECrck
-    dataset_dir = TCGA_CRCK_DATASET_DIR
+def test_container(container_type: Type[LightningContainer], use_gpu: bool) -> None:
+    dataset_dir = CONTAINER_DATASET_DIR[container_type]
     if not os.path.isdir(dataset_dir):
         pytest.skip(f"Dataset for container {container_type.__name__} "
                     f"is unavailable: {dataset_dir}")
-
-    container = DeepSMILECrck(encoder_type=ImageNetEncoder.__name__)
+    container = container_type()
     container.setup()
 
     data_module: TilesDataModule = container.get_data_module()

From d4091c6a0c0bffb2503354cdd5d8dbb9e88f9510 Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Mon, 13 Dec 2021 19:52:38 +0000
Subject: [PATCH 02/15] fix linting

---
 .../classification/DeepSMILEPanda.py          | 86 ++++++++++++-------
 1 file changed, 57 insertions(+), 29 deletions(-)

diff --git a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
index c68a2bc18..f12ac1467 100644
--- a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
+++ b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
@@ -13,11 +13,20 @@
 from InnerEye.Azure.azure_util import get_default_azure_config_json_path
 from InnerEye.ML.Histopathology.datasets.panda_tiles_dataset import PandaTilesDataset
 from health_ml.networks.layers.attention_layers import GatedAttentionLayer
-from InnerEye.ML.Histopathology.models.transforms import EncodeTilesBatchd, LoadTilesBatchd
-from InnerEye.ML.Histopathology.models.encoders import (HistoSSLEncoder, ImageNetEncoder,
-                                                        ImageNetSimCLREncoder, InnerEyeSSLEncoder)
+from InnerEye.ML.Histopathology.models.transforms import (
+    EncodeTilesBatchd,
+    LoadTilesBatchd,
+)
+from InnerEye.ML.Histopathology.models.encoders import (
+    HistoSSLEncoder,
+    ImageNetEncoder,
+    ImageNetSimCLREncoder,
+    InnerEyeSSLEncoder,
+)
 from InnerEye.ML.configs.histo_configs.classification.BaseMIL import BaseMIL
 from health_azure.utils import CheckpointDownloader
+
+
 class DeepSMILEPanda(BaseMIL):
     def __init__(self, **kwargs: Any) -> None:
         default_kwargs = dict(
@@ -43,72 +52,91 @@ def __init__(self, **kwargs: Any) -> None:
         default_kwargs.update(kwargs)
         super().__init__(**default_kwargs)
         super().__init__(**default_kwargs)
         self.best_checkpoint_filename = "checkpoint_max_val_auroc"
-        self.best_checkpoint_filename_with_suffix = self.best_checkpoint_filename + ".ckpt"
+        self.best_checkpoint_filename_with_suffix = (
+            self.best_checkpoint_filename + ".ckpt"
+        )
         self.checkpoint_folder_path = "outputs/checkpoints/"
-        best_checkpoint_callback = ModelCheckpoint(dirpath=self.checkpoint_folder_path,
-                                                   monitor='val/accuracy',
-                                                   filename=self.best_checkpoint_filename,
-                                                   auto_insert_metric_name=False,
-                                                   mode='max')
+        best_checkpoint_callback = ModelCheckpoint(
+            dirpath=self.checkpoint_folder_path,
+            monitor="val/accuracy",
+            filename=self.best_checkpoint_filename,
+            auto_insert_metric_name=False,
+            mode="max",
+        )
         self.callbacks = best_checkpoint_callback
-
+
     @property
     def cache_dir(self) -> Path:
-        return Path(f"/tmp/innereye_cache/{self.__class__.__name__}-{self.encoder_type}/")
-
+        return Path(
+            f"/tmp/innereye_cache/{self.__class__.__name__}-{self.encoder_type}/"
+        )
+
     def setup(self) -> None:
         if self.encoder_type == InnerEyeSSLEncoder.__name__:
             self.downloader = CheckpointDownloader(
                 azure_config_json_path=get_default_azure_config_json_path(),
                 run_recovery_id="hsharma_panda_explore:hsharma_panda_explore_1638437076_357167ae",
                 checkpoint_filename="last.ckpt",
-                download_dir='outputs/'
+                download_dir="outputs/",
             )
             os.chdir(fixed_paths.repository_root_directory())
             self.downloader.download_checkpoint_if_necessary()
         self.encoder = self.get_encoder()
         self.encoder.cuda()
         self.encoder.eval()
-
+
     def get_data_module(self) -> PandaTilesDataModule:
         image_key = PandaTilesDataset.IMAGE_COLUMN
-        transform = Compose([LoadTilesBatchd(image_key, progress=True),
-                             EncodeTilesBatchd(image_key, self.encoder)])
-        return PandaTilesDataModule(root_path=self.local_dataset,
-                                    max_bag_size=self.max_bag_size,
-                                    batch_size=self.batch_size,
-                                    transform=transform,
-                                    cache_mode=self.cache_mode,
-                                    save_precache=self.save_precache,
-                                    cache_dir=self.cache_dir,
-                                    number_of_cross_validation_splits=self.number_of_cross_validation_splits,
-                                    cross_validation_split_index=self.cross_validation_split_index)
-
+        transform = Compose(
+            [
+                LoadTilesBatchd(image_key, progress=True),
+                EncodeTilesBatchd(image_key, self.encoder),
+            ]
+        )
+        return PandaTilesDataModule(
+            root_path=self.local_dataset,
+            max_bag_size=self.max_bag_size,
+            batch_size=self.batch_size,
+            transform=transform,
+            cache_mode=self.cache_mode,
+            save_precache=self.save_precache,
+            cache_dir=self.cache_dir,
+            number_of_cross_validation_splits=self.number_of_cross_validation_splits,
+            cross_validation_split_index=self.cross_validation_split_index,
+        )
+
     def get_trainer_arguments(self) -> Dict[str, Any]:
         # These arguments will be passed through to the Lightning trainer.
         return {"callbacks": self.callbacks}
-
+
     def get_path_to_best_checkpoint(self) -> Path:
         """
         Returns the full path to a checkpoint file that was found to be best during training, whatever criterion
         was applied there.
         """
         # absolute path is required for registering the model.
-        return fixed_paths.repository_root_directory() / self.checkpoint_folder_path / self.best_checkpoint_filename_with_suffix
+        return (
+            fixed_paths.repository_root_directory()
+            / self.checkpoint_folder_path
+            / self.best_checkpoint_filename_with_suffix
+        )
+
 
 class PandaImageNetMIL(DeepSMILEPanda):
     def __init__(self, **kwargs: Any) -> None:
         super().__init__(encoder_type=ImageNetEncoder.__name__, **kwargs)
 
+
 class PandaImageNetSimCLRMIL(DeepSMILEPanda):
     def __init__(self, **kwargs: Any) -> None:
         super().__init__(encoder_type=ImageNetSimCLREncoder.__name__, **kwargs)
 
+
 class PandaInnerEyeSSLMIL(DeepSMILEPanda):
     def __init__(self, **kwargs: Any) -> None:
         super().__init__(encoder_type=InnerEyeSSLEncoder.__name__, **kwargs)
 
+
 class PandaHistoSSLMIL(DeepSMILEPanda):
     def __init__(self, **kwargs: Any) -> None:
         super().__init__(encoder_type=HistoSSLEncoder.__name__, **kwargs)
-

From b0e14916a8037281756f3112cac755da6a3a9865 Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Mon, 13 Dec 2021 19:56:53 +0000
Subject: [PATCH 03/15] changelog

---
 CHANGELOG.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index c4733a078..e60972024 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -35,6 +35,7 @@ jobs that run in AzureML.
 -([#614](https://github.com/microsoft/InnerEye-DeepLearning/pull/614)) Checkpoint downloading falls back to looking into AzureML if no checkpoints on disk
 -([#613](https://github.com/microsoft/InnerEye-DeepLearning/pull/613)) Add additional tests for histopathology datasets
 -([#616](https://github.com/microsoft/InnerEye-DeepLearning/pull/616)) Add more histopathology configs and tests
+-([#619](https://github.com/microsoft/InnerEye-DeepLearning/pull/616)) Add DeepMIL PANDA
 
 ### Changed
 - ([#588](https://github.com/microsoft/InnerEye-DeepLearning/pull/588)) Replace SciPy with PIL.PngImagePlugin.PngImageFile to load png files.

From 26f646322472d0da1a3e7a5b8d4c989ae70e17bc Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Mon, 13 Dec 2021 19:58:37 +0000
Subject: [PATCH 04/15] changelog

---
 CHANGELOG.md | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index e60972024..83a68d7c2 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -28,6 +28,7 @@ jobs that run in AzureML.
 - ([#554](https://github.com/microsoft/InnerEye-DeepLearning/pull/554)) Added a parameter `pretraining_dataset_id` to
   `NIH_COVID_BYOL` to specify the name of the SSL training dataset.
 - ([#560](https://github.com/microsoft/InnerEye-DeepLearning/pull/560)) Added pre-commit hooks.
+-([#619](https://github.com/microsoft/InnerEye-DeepLearning/pull/616)) Add DeepMIL PANDA
 - ([#559](https://github.com/microsoft/InnerEye-DeepLearning/pull/559)) Adding the accompanying code for the ["Active label cleaning: Improving dataset quality under resource constraints"](https://arxiv.org/abs/2109.00574) paper. The code can be found in the [InnerEye-DataQuality](InnerEye-DataQuality/README.md) subfolder. It provides tools for training noise robust models, running label cleaning simulation and loading our label cleaning benchmark datasets.
 - ([#589](https://github.com/microsoft/InnerEye-DeepLearning/pull/589)) Add `LightningContainer.update_azure_config()`
   hook to enable overriding `AzureConfig` parameters from a container (e.g. `experiment_name`, `cluster`, `num_nodes`).
@@ -35,8 +36,6 @@ jobs that run in AzureML.
 -([#614](https://github.com/microsoft/InnerEye-DeepLearning/pull/614)) Checkpoint downloading falls back to looking into AzureML if no checkpoints on disk
 -([#613](https://github.com/microsoft/InnerEye-DeepLearning/pull/613)) Add additional tests for histopathology datasets
 -([#616](https://github.com/microsoft/InnerEye-DeepLearning/pull/616)) Add more histopathology configs and tests
--([#619](https://github.com/microsoft/InnerEye-DeepLearning/pull/616)) Add DeepMIL PANDA
-
 ### Changed
 - ([#588](https://github.com/microsoft/InnerEye-DeepLearning/pull/588)) Replace SciPy with PIL.PngImagePlugin.PngImageFile to load png files.
 - ([#576](https://github.com/microsoft/InnerEye-DeepLearning/pull/576)) The console output is no longer written to stdout.txt because AzureML handles that better now

From 5f46d24f1e324a5ab7ef105b897194f6726a4e31 Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Mon, 13 Dec 2021 19:59:39 +0000
Subject: [PATCH 05/15] fix conflict changelog

---
 CHANGELOG.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 83a68d7c2..008da28f6 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -36,6 +36,7 @@ jobs that run in AzureML.
 -([#614](https://github.com/microsoft/InnerEye-DeepLearning/pull/614)) Checkpoint downloading falls back to looking into AzureML if no checkpoints on disk
 -([#613](https://github.com/microsoft/InnerEye-DeepLearning/pull/613)) Add additional tests for histopathology datasets
 -([#616](https://github.com/microsoft/InnerEye-DeepLearning/pull/616)) Add more histopathology configs and tests
+
 ### Changed
 - ([#588](https://github.com/microsoft/InnerEye-DeepLearning/pull/588)) Replace SciPy with PIL.PngImagePlugin.PngImageFile to load png files.
 - ([#576](https://github.com/microsoft/InnerEye-DeepLearning/pull/576)) The console output is no longer written to stdout.txt because AzureML handles that better now

From 721190f598aad61355ec0212915256088a044129 Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Mon, 13 Dec 2021 20:02:27 +0000
Subject: [PATCH 06/15] fix changelog

---
 CHANGELOG.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 008da28f6..0eca314d9 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -28,7 +28,7 @@ jobs that run in AzureML.
 - ([#554](https://github.com/microsoft/InnerEye-DeepLearning/pull/554)) Added a parameter `pretraining_dataset_id` to
   `NIH_COVID_BYOL` to specify the name of the SSL training dataset.
 - ([#560](https://github.com/microsoft/InnerEye-DeepLearning/pull/560)) Added pre-commit hooks.
--([#619](https://github.com/microsoft/InnerEye-DeepLearning/pull/616)) Add DeepMIL PANDA
+-([#619](https://github.com/microsoft/InnerEye-DeepLearning/pull/619)) Add DeepMIL PANDA
 - ([#559](https://github.com/microsoft/InnerEye-DeepLearning/pull/559)) Adding the accompanying code for the ["Active label cleaning: Improving dataset quality under resource constraints"](https://arxiv.org/abs/2109.00574) paper. The code can be found in the [InnerEye-DataQuality](InnerEye-DataQuality/README.md) subfolder. It provides tools for training noise robust models, running label cleaning simulation and loading our label cleaning benchmark datasets.
 - ([#589](https://github.com/microsoft/InnerEye-DeepLearning/pull/589)) Add `LightningContainer.update_azure_config()`
   hook to enable overriding `AzureConfig` parameters from a container (e.g. `experiment_name`, `cluster`, `num_nodes`).
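The run recovery IDs used throughout this series (for example the SSL checkpoint ID passed to CheckpointDownloader in PATCH 01) follow the `experiment_name:run_id` convention parsed by `split_recovery_id` in `InnerEye/Azure/azure_util.py`, which the next patch reformats. A minimal sketch of that convention, with the expected result inferred from the function body shown below rather than taken from an official example:

    from InnerEye.Azure.azure_util import split_recovery_id

    # The colon separates the AzureML experiment name from the run ID; a bare
    # run ID such as "myexp_1638437076_357167ae" is also accepted, in which
    # case the experiment name is recovered from the ID via a regex.
    experiment, run_id = split_recovery_id(
        "hsharma_panda_explore:hsharma_panda_explore_1638437076_357167ae")
    assert experiment == "hsharma_panda_explore"
    assert run_id == "hsharma_panda_explore_1638437076_357167ae"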
From b7f7bcef3bcc67b3275ebf6eefe3c9291e1f6fa8 Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Mon, 13 Dec 2021 20:40:31 +0000
Subject: [PATCH 07/15] fixing some wrong import

---
 InnerEye/Azure/azure_util.py                  | 136 ++++++++++++------
 .../classification/DeepSMILEPanda.py          |   2 +-
 2 files changed, 96 insertions(+), 42 deletions(-)

diff --git a/InnerEye/Azure/azure_util.py b/InnerEye/Azure/azure_util.py
index 7dc20d534..c361af861 100644
--- a/InnerEye/Azure/azure_util.py
+++ b/InnerEye/Azure/azure_util.py
@@ -52,14 +52,20 @@ def split_recovery_id(id: str) -> Tuple[str, str]:
     """
     components = id.strip().split(EXPERIMENT_RUN_SEPARATOR)
     if len(components) > 2:
-        raise ValueError("recovery_id must be in the format: 'experiment_name:run_id', but got: {}".format(id))
+        raise ValueError(
+            "recovery_id must be in the format: 'experiment_name:run_id', but got: {}".format(
+                id
+            )
+        )
     elif len(components) == 2:
         return components[0], components[1]
     else:
         recovery_id_regex = r"^(\w+)_\d+_[0-9a-f]+$|^(\w+)_\d+$"
         match = re.match(recovery_id_regex, id)
         if not match:
-            raise ValueError("The recovery ID was not in the expected format: {}".format(id))
+            raise ValueError(
+                "The recovery ID was not in the expected format: {}".format(id)
+            )
         return (match.group(1) or match.group(2)), id
@@ -77,9 +83,15 @@ def fetch_run(workspace: Workspace, run_recovery_id: str) -> Run:
     try:
         experiment_to_recover = Experiment(workspace, experiment)
     except Exception as ex:
-        raise Exception(f"Unable to retrieve run {run} in experiment {experiment}: {str(ex)}")
+        raise Exception(
+            f"Unable to retrieve run {run} in experiment {experiment}: {str(ex)}"
+        )
     run_to_recover = fetch_run_for_experiment(experiment_to_recover, run)
-    logging.info("Fetched run #{} {} from experiment {}.".format(run, run_to_recover.number, experiment))
+    logging.info(
+        "Fetched run #{} {} from experiment {}.".format(
+            run, run_to_recover.number, experiment
+        )
+    )
     return run_to_recover
@@ -94,9 +106,13 @@ def fetch_run_for_experiment(experiment_to_recover: Experiment, run_id: str) ->
     except Exception:
         available_runs = experiment_to_recover.get_runs()
         available_ids = ", ".join([run.id for run in available_runs])
-        raise (Exception(
-            "Run {} not found for experiment: {}. Available runs are: {}".format(
-                run_id, experiment_to_recover.name, available_ids)))
+        raise (
+            Exception(
+                "Run {} not found for experiment: {}. Available runs are: {}".format(
+                    run_id, experiment_to_recover.name, available_ids
+                )
+            )
+        )
@@ -116,8 +132,11 @@ def fetch_runs(experiment: Experiment, filters: List[str]) -> List[Run]:
     return exp_runs
 
 
-def fetch_child_runs(run: Run, status: Optional[str] = None,
-                     expected_number_cross_validation_splits: int = 0) -> List[Run]:
+def fetch_child_runs(
+    run: Run,
+    status: Optional[str] = None,
+    expected_number_cross_validation_splits: int = 0,
+) -> List[Run]:
     """
     Fetch child runs for the provided runs that have the provided AML status (or fetch all by default)
     and have a run_recovery_id tag value set (this is to ignore superfluous AML infrastructure platform runs).
@@ -138,18 +157,25 @@ def fetch_child_runs(run: Run, status: Optional[str] = None,
     if 0 < expected_number_cross_validation_splits != len(children_runs):
         logging.warning(
             f"The expected number of child runs was {expected_number_cross_validation_splits}."
-            f"Fetched only: {len(children_runs)} runs. Now trying to fetch them manually.")
-        run_ids_to_evaluate = [f"{create_run_recovery_id(run)}_{i}"
-                               for i in range(expected_number_cross_validation_splits)]
-        children_runs = [fetch_run(run.experiment.workspace, id) for id in run_ids_to_evaluate]
+            f"Fetched only: {len(children_runs)} runs. Now trying to fetch them manually."
+        )
+        run_ids_to_evaluate = [
+            f"{create_run_recovery_id(run)}_{i}"
+            for i in range(expected_number_cross_validation_splits)
+        ]
+        children_runs = [
+            fetch_run(run.experiment.workspace, id) for id in run_ids_to_evaluate
+        ]
     if status is not None:
-        children_runs = [child_run for child_run in children_runs if child_run.get_status() == status]
+        children_runs = [
+            child_run for child_run in children_runs if child_run.get_status() == status
+        ]
     return children_runs
 
 
 def is_ensemble_run(run: Run) -> bool:
     """Checks if the run was an ensemble of multiple models"""
-    return run.get_tags().get(IS_ENSEMBLE_KEY_NAME) == 'True'
+    return run.get_tags().get(IS_ENSEMBLE_KEY_NAME) == "True"
@@ -160,7 +186,7 @@ def to_azure_friendly_string(x: Optional[str]) -> Optional[str]:
     if x is None:
         return x
     else:
-        return re.sub('_+', '_', re.sub(r'\W+', '_', x))
+        return re.sub("_+", "_", re.sub(r"\W+", "_", x))
 
 
 def to_azure_friendly_container_path(path: Path) -> str:
@@ -178,7 +204,7 @@ def is_offline_run_context(run_context: Run) -> bool:
     :param run_context: Context of the run to check
     :return:
     """
-    return not hasattr(run_context, 'experiment')
+    return not hasattr(run_context, "experiment")
 
 
 def get_run_context_or_default(run: Optional[Run] = None) -> Run:
@@ -199,7 +225,12 @@ def get_cross_validation_split_index(run: Run) -> int:
     if is_offline_run_context(run):
         return DEFAULT_CROSS_VALIDATION_SPLIT_INDEX
     else:
-        return int(run.get_tags().get(CROSS_VALIDATION_SPLIT_INDEX_TAG_KEY, DEFAULT_CROSS_VALIDATION_SPLIT_INDEX))
+        return int(
+            run.get_tags().get(
+                CROSS_VALIDATION_SPLIT_INDEX_TAG_KEY,
+                DEFAULT_CROSS_VALIDATION_SPLIT_INDEX,
+            )
+        )
 
 
 def is_cross_validation_child_run(run: Run) -> bool:
@@ -220,7 +251,7 @@ def strip_prefix(string: str, prefix: str) -> str:
     :return: Input string with prefix removed.
     """
     if string.startswith(prefix):
-        return string[len(prefix):]
+        return string[len(prefix) :]
     return string
@@ -256,9 +287,7 @@ def is_parent_run(run: Run) -> bool:
     return PARENT_RUN_CONTEXT and run.id == PARENT_RUN_CONTEXT.id
 
 
-def download_run_output_file(blob_path: Path,
-                             destination: Path,
-                             run: Run) -> Path:
+def download_run_output_file(blob_path: Path, destination: Path, run: Run) -> Path:
     """
     Downloads a single file from the run's default output directory: DEFAULT_AML_UPLOAD_DIR ("outputs").
     For example, if blobs_path = "foo/bar.csv", then the run result file "outputs/foo/bar.csv" will be downloaded
@@ -270,17 +299,21 @@ def download_run_output_file(blob_path: Path,
     """
     blobs_prefix = str((fixed_paths.DEFAULT_AML_UPLOAD_DIR / blob_path).as_posix())
     destination = destination / blob_path.name
-    logging.info(f"Downloading single file from run {run.id}: {blobs_prefix} -> {str(destination)}")
+    logging.info(
+        f"Downloading single file from run {run.id}: {blobs_prefix} -> {str(destination)}"
+    )
     try:
         run.download_file(blobs_prefix, str(destination), _validate_checksum=True)
     except Exception as ex:
-        raise ValueError(f"Unable to download file '{blobs_prefix}' from run {run.id}") from ex
+        raise ValueError(
+            f"Unable to download file '{blobs_prefix}' from run {run.id}"
+        ) from ex
     return destination
 
 
-def download_run_outputs_by_prefix(blobs_prefix: Path,
-                                   destination: Path,
-                                   run: Run) -> None:
+def download_run_outputs_by_prefix(
+    blobs_prefix: Path, destination: Path, run: Run
+) -> None:
     """
@@ -291,19 +324,25 @@ def download_run_outputs_by_prefix(blobs_prefix: Path,
     :param destination: Local path to save the downloaded blobs to.
     """
     prefix_str = str((fixed_paths.DEFAULT_AML_UPLOAD_DIR / blobs_prefix).as_posix())
-    logging.info(f"Downloading multiple files from run {run.id}: {prefix_str} -> {str(destination)}")
+    logging.info(
+        f"Downloading multiple files from run {run.id}: {prefix_str} -> {str(destination)}"
+    )
     # There is a download_files function, but that can time out when downloading several large checkpoints file
     # (120sec timeout for all files).
     for file in run.get_file_names():
         if file.startswith(prefix_str):
-            target_path = file[len(prefix_str):]
+            target_path = file[len(prefix_str) :]
             if target_path.startswith("/"):
                 target_path = target_path[1:]
             logging.info(f"Downloading {file}")
-            run.download_file(file, str(destination / target_path), _validate_checksum=True)
+            run.download_file(
+                file, str(destination / target_path), _validate_checksum=True
+            )
         else:
-            logging.warning(f"Skipping file {file}, because the desired prefix {prefix_str} is not aligned with "
-                            f"the folder structure")
+            logging.warning(
+                f"Skipping file {file}, because the desired prefix {prefix_str} is not aligned with "
+                f"the folder structure"
+            )
@@ -314,10 +353,9 @@ def is_running_on_azure_agent() -> bool:
     return bool(os.environ.get("AGENT_OS", None))
 
 
-def get_comparison_baseline_paths(outputs_folder: Path,
-                                  blob_path: Path, run: Run,
-                                  dataset_csv_file_name: str) -> \
-        Tuple[Optional[Path], Optional[Path]]:
+def get_comparison_baseline_paths(
+    outputs_folder: Path, blob_path: Path, run: Run, dataset_csv_file_name: str
+) -> Tuple[Optional[Path], Optional[Path]]:
     run_rec_id = run.id
     # We usually find dataset.csv in the same directory as metrics.csv, but we sometimes
     # have to look higher up.
@@ -328,21 +366,29 @@ def get_comparison_baseline_paths(outputs_folder: Path,
     for blob_path_parent in step_up_directories(blob_path):
         try:
             comparison_dataset_path = download_run_output_file(
-                blob_path_parent / dataset_csv_file_name, destination_folder, run)
+                blob_path_parent / dataset_csv_file_name, destination_folder, run
+            )
             break
         except (ValueError, UserErrorException):
-            logging.warning(f"cannot find {dataset_csv_file_name} at {blob_path_parent} in {run_rec_id}")
+            logging.warning(
+                f"cannot find {dataset_csv_file_name} at {blob_path_parent} in {run_rec_id}"
+            )
         except NotADirectoryError:
            logging.warning(f"{blob_path_parent} is not a directory")
            break
     if comparison_dataset_path is None:
-        logging.warning(f"cannot find {dataset_csv_file_name} at or above {blob_path} in {run_rec_id}")
+        logging.warning(
+            f"cannot find {dataset_csv_file_name} at or above {blob_path} in {run_rec_id}"
+        )
     # Look for epoch_NNN/Test/metrics.csv
     try:
         comparison_metrics_path = download_run_output_file(
-            blob_path / SUBJECT_METRICS_FILE_NAME, destination_folder, run)
+            blob_path / SUBJECT_METRICS_FILE_NAME, destination_folder, run
+        )
     except (ValueError, UserErrorException):
-        logging.warning(f"cannot find {SUBJECT_METRICS_FILE_NAME} at {blob_path} in {run_rec_id}")
+        logging.warning(
+            f"cannot find {SUBJECT_METRICS_FILE_NAME} at {blob_path} in {run_rec_id}"
+        )
     return (comparison_dataset_path, comparison_metrics_path)
@@ -357,3 +403,11 @@ def step_up_directories(path: Path) -> Generator[Path, None, None]:
         if parent == path:
             break
         path = parent
+
+
+def get_default_azure_config_json_path() -> Path:
+    """
+    Gets the path to the project's default Azure config JSON file.
+    """
+    azure_config_json_path = fixed_paths.repository_root_directory() / "config.json"
+    return azure_config_json_path
diff --git a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
index f12ac1467..c95efcc82 100644
--- a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
+++ b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
@@ -8,7 +8,7 @@
 import os
 from monai.transforms import Compose
 from pytorch_lightning.callbacks.model_checkpoint import ModelCheckpoint
-from InnerEyePrivate.Common import fixed_paths
+from InnerEye.Common import fixed_paths
 from InnerEye.ML.Histopathology.datamodules.panda_module import PandaTilesDataModule
 from InnerEye.Azure.azure_util import get_default_azure_config_json_path
 from InnerEye.ML.Histopathology.datasets.panda_tiles_dataset import PandaTilesDataset

From 5c4f65696f5b57d14157e0581b22ba02da8c449f Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Mon, 13 Dec 2021 20:43:29 +0000
Subject: [PATCH 08/15] more fixes

---
 .../ML/configs/histo_configs/classification/DeepSMILEPanda.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
index c95efcc82..fed0e808c 100644
--- a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
+++ b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
@@ -34,7 +34,7 @@ def __init__(self, **kwargs: Any) -> None:
             pooling_type=GatedAttentionLayer.__name__,
             # declared in DatasetParams:
             local_dataset=Path("/tmp/datasets/PANDA_tiles"),
-            # azure_dataset_id="PANDA_tiles",
+            azure_dataset_id="PANDA_tiles",
             # To mount the dataset instead of downloading in AML, pass --use_dataset_mount in the CLI
             # declared in TrainerParams:
             num_epochs=200,

From fc0342acad03be93577457346819d15b0d31a970 Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Tue, 14 Dec 2021 10:20:07 +0000
Subject: [PATCH 09/15] fix mypy

---
 .../classification/DeepSMILECrck.py           |  79 ++++++++----
 .../classification/DeepSMILEPanda.py          |   4 +-
 .../ML/histopathology/models/test_deepmil.py | 121 +++++++++++-------
 3 files changed, 125 insertions(+), 79 deletions(-)

diff --git a/InnerEye/ML/configs/histo_configs/classification/DeepSMILECrck.py b/InnerEye/ML/configs/histo_configs/classification/DeepSMILECrck.py
index a2c1900f0..df2394f68 100644
--- a/InnerEye/ML/configs/histo_configs/classification/DeepSMILECrck.py
+++ b/InnerEye/ML/configs/histo_configs/classification/DeepSMILECrck.py
@@ -23,11 +23,22 @@
 from InnerEye.Common import fixed_paths
 from InnerEye.ML.configs.histo_configs.classification.BaseMIL import BaseMIL
 from InnerEye.ML.Histopathology.datamodules.base_module import TilesDataModule
-from InnerEye.ML.Histopathology.datamodules.tcga_crck_module import TcgaCrckTilesDataModule
-from InnerEye.ML.Histopathology.models.encoders import (HistoSSLEncoder, ImageNetEncoder,
-                                                        ImageNetSimCLREncoder, InnerEyeSSLEncoder)
-from InnerEye.ML.Histopathology.models.transforms import EncodeTilesBatchd, LoadTilesBatchd
-from InnerEye.ML.Histopathology.datasets.tcga_crck_tiles_dataset import TcgaCrck_TilesDataset
+from InnerEye.ML.Histopathology.datamodules.tcga_crck_module import (
+    TcgaCrckTilesDataModule,
+)
+from InnerEye.ML.Histopathology.models.encoders import (
+    HistoSSLEncoder,
+    ImageNetEncoder,
+    ImageNetSimCLREncoder,
+    InnerEyeSSLEncoder,
+)
+from InnerEye.ML.Histopathology.models.transforms import (
+    EncodeTilesBatchd,
+    LoadTilesBatchd,
+)
+from InnerEye.ML.Histopathology.datasets.tcga_crck_tiles_dataset import (
+    TcgaCrck_TilesDataset,
+)
 
 
 class DeepSMILECrck(BaseMIL):
@@ -36,21 +47,17 @@ def __init__(self, **kwargs: Any) -> None:
         default_kwargs = dict(
             # declared in BaseMIL:
             pooling_type=GatedAttentionLayer.__name__,
-
             # declared in DatasetParams:
             local_dataset=Path("/tmp/datasets/TCGA-CRCk"),
             azure_dataset_id="TCGA-CRCk",
             # To mount the dataset instead of downloading in AML, pass --use_dataset_mount in the CLI
-
             # declared in TrainerParams:
             num_epochs=16,
             recovery_checkpoint_save_interval=16,
             recovery_checkpoints_save_last_k=-1,
-
             # declared in WorkflowParams:
             number_of_cross_validation_splits=5,
             cross_validation_split_index=0,
-
             # declared in OptimizerParams:
             l_rate=5e-4,
             weight_decay=1e-4,
@@ -60,33 +67,45 @@ def __init__(self, **kwargs: Any) -> None:
         super().__init__(**default_kwargs)
 
         self.best_checkpoint_filename = "checkpoint_max_val_auroc"
-        self.best_checkpoint_filename_with_suffix = self.best_checkpoint_filename + ".ckpt"
+        self.best_checkpoint_filename_with_suffix = (
+            self.best_checkpoint_filename + ".ckpt"
+        )
         self.checkpoint_folder_path = "outputs/checkpoints/"
-        best_checkpoint_callback = ModelCheckpoint(dirpath=self.checkpoint_folder_path,
-                                                   monitor='val/auroc',
-                                                   filename=self.best_checkpoint_filename,
-                                                   auto_insert_metric_name=False,
-                                                   mode='max')
+        best_checkpoint_callback = ModelCheckpoint(
+            dirpath=self.checkpoint_folder_path,
+            monitor="val/auroc",
+            filename=self.best_checkpoint_filename,
+            auto_insert_metric_name=False,
+            mode="max",
+        )
         self.callbacks = best_checkpoint_callback
 
     @property
     def cache_dir(self) -> Path:
-        return Path(f"/tmp/innereye_cache/{self.__class__.__name__}-{self.encoder_type}/")
+        return Path(
+            f"/tmp/innereye_cache1/{self.__class__.__name__}-{self.encoder_type}/"
+        )
 
     def get_data_module(self) -> TilesDataModule:
         image_key = TcgaCrck_TilesDataset.IMAGE_COLUMN
-        transform = Compose([LoadTilesBatchd(image_key, progress=True),
-                             EncodeTilesBatchd(image_key, self.encoder)])
-        return TcgaCrckTilesDataModule(root_path=self.local_dataset,
-                                       max_bag_size=self.max_bag_size,
-                                       batch_size=self.batch_size,
-                                       transform=transform,
-                                       cache_mode=self.cache_mode,
-                                       save_precache=self.save_precache,
-                                       cache_dir=self.cache_dir,
-                                       number_of_cross_validation_splits=self.number_of_cross_validation_splits,
-                                       cross_validation_split_index=self.cross_validation_split_index)
+        transform = Compose(
+            [
+                LoadTilesBatchd(image_key, progress=True),
+                EncodeTilesBatchd(image_key, self.encoder),
+            ]
+        )
+        return TcgaCrckTilesDataModule(
+            root_path=self.local_dataset,
+            max_bag_size=self.max_bag_size,
+            batch_size=self.batch_size,
+            transform=transform,
+            cache_mode=self.cache_mode,
+            save_precache=self.save_precache,
+            cache_dir=self.cache_dir,
+            number_of_cross_validation_splits=self.number_of_cross_validation_splits,
+            cross_validation_split_index=self.cross_validation_split_index,
+        )
 
     def get_trainer_arguments(self) -> Dict[str, Any]:
         # These arguments will be passed through to the Lightning trainer.
@@ -98,7 +117,11 @@ def get_path_to_best_checkpoint(self) -> Path:
         was applied there.
         """
         # absolute path is required for registering the model.
-        return fixed_paths.repository_root_directory() / self.checkpoint_folder_path / self.best_checkpoint_filename_with_suffix
+        return (
+            fixed_paths.repository_root_directory()
+            / self.checkpoint_folder_path
+            / self.best_checkpoint_filename_with_suffix
+        )
 
 
 class TcgaCrckImageNetMIL(DeepSMILECrck):
diff --git a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
index fed0e808c..f42c42362 100644
--- a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
+++ b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
@@ -68,7 +68,7 @@ def __init__(self, **kwargs: Any) -> None:
     @property
     def cache_dir(self) -> Path:
         return Path(
-            f"/tmp/innereye_cache/{self.__class__.__name__}-{self.encoder_type}/"
+            f"/tmp/innereye_cache1/{self.__class__.__name__}-{self.encoder_type}/"
         )
 
     def setup(self) -> None:
@@ -94,7 +94,7 @@ def get_data_module(self) -> PandaTilesDataModule:
             ]
         )
         return PandaTilesDataModule(
-            root_path=self.local_dataset,
+            root_path=self.local_dataset,  # noqa
             max_bag_size=self.max_bag_size,
             batch_size=self.batch_size,
             transform=transform,
diff --git a/Tests/ML/histopathology/models/test_deepmil.py b/Tests/ML/histopathology/models/test_deepmil.py
index 6b50bf3b2..04d86e1b4 100644
--- a/Tests/ML/histopathology/models/test_deepmil.py
+++ b/Tests/ML/histopathology/models/test_deepmil.py
@@ -4,7 +4,7 @@
 #  ------------------------------------------------------------------------------------------
 
 import os
-from typing import Callable, Dict, List, Type
+from typing import Callable, Dict, List, Type  # noqa
 
 import pytest
 from torch import Tensor, argmax, nn, rand, randint, randn, round, stack, allclose
 from torchvision.models import resnet18
 
-from health_ml.networks.layers.attention_layers import AttentionLayer, GatedAttentionLayer
+from health_ml.networks.layers.attention_layers import (
+    AttentionLayer,
+    GatedAttentionLayer,
+)
 
 from InnerEye.ML.lightning_container import LightningContainer
-from InnerEye.ML.configs.histo_configs.classification.DeepSMILECrck import TcgaCrckImageNetMIL
+from InnerEye.ML.configs.histo_configs.classification.DeepSMILECrck import (
+    TcgaCrckImageNetMIL,
+)
-from InnerEye.ML.configs.histo_configs.classification.DeepSMILEPanda import PandaImageNetMIL
+from InnerEye.ML.configs.histo_configs.classification.DeepSMILEPanda import (
+    PandaImageNetMIL,
+)
 from InnerEye.ML.Histopathology.datamodules.base_module import TilesDataModule
-from InnerEye.ML.Histopathology.datasets.default_paths import TCGA_CRCK_DATASET_DIR, PANDA_TILES_DATASET_DIR
+from InnerEye.ML.Histopathology.datasets.default_paths import (
+    TCGA_CRCK_DATASET_DIR,
+    PANDA_TILES_DATASET_DIR,
+)
 from InnerEye.ML.Histopathology.models.deepmil import DeepMILModule
 from InnerEye.ML.Histopathology.models.encoders import ImageNetEncoder, TileEncoder
 from InnerEye.ML.Histopathology.utils.naming import ResultsKey
@@ -32,23 +42,27 @@ def get_supervised_imagenet_encoder() -> TileEncoder:
 @pytest.mark.parametrize("max_bag_size", [1, 7])
 @pytest.mark.parametrize("pool_hidden_dim", [1, 5])
 @pytest.mark.parametrize("pool_out_dim", [1, 6])
-def test_lightningmodule(n_classes: int,
-                         pooling_layer: Callable[[int, int, int], nn.Module],
-                         batch_size: int,
-                         max_bag_size: int,
-                         pool_hidden_dim: int,
-                         pool_out_dim: int) -> None:
+def test_lightningmodule(
+    n_classes: int,
+    pooling_layer: Callable[[int, int, int], nn.Module],
+    batch_size: int,
+    max_bag_size: int,
+    pool_hidden_dim: int,
+    pool_out_dim: int,
+) -> None:
     assert n_classes > 0
     # hard-coded here to avoid test explosion; correctness of other encoders is tested elsewhere
     encoder = get_supervised_imagenet_encoder()
-    module = DeepMILModule(encoder=encoder,
-                           label_column='label',
-                           n_classes=n_classes,
-                           pooling_layer=pooling_layer,
-                           pool_hidden_dim=pool_hidden_dim,
-                           pool_out_dim=pool_out_dim)
+    module = DeepMILModule(
+        encoder=encoder,
+        label_column="label",
+        n_classes=n_classes,
+        pooling_layer=pooling_layer,
+        pool_hidden_dim=pool_hidden_dim,
+        pool_out_dim=pool_out_dim,
+    )
 
     bag_images = rand([batch_size, max_bag_size, *module.encoder.input_dim])
     bag_labels_list = []
@@ -58,7 +72,7 @@ def test_lightningmodule(
         if n_classes > 1:
             labels = randint(n_classes, size=(max_bag_size,))
         else:
-            labels = randint(n_classes+1, size=(max_bag_size,))
+            labels = randint(n_classes + 1, size=(max_bag_size,))
         bag_labels_list.append(module.get_bag_label(labels))
         logit, attn = module(bag)
         assert logit.shape == (1, n_classes)
@@ -94,15 +108,19 @@ def test_lightningmodule(
     assert preds.shape[0] == batch_size
 
     for metric_name, metric_object in module.train_metrics.items():
-        if (batch_size > 1) or (not metric_name == 'auroc'):
+        if (batch_size > 1) or (not metric_name == "auroc"):
             score = metric_object(preds.view(-1, 1), bag_labels.view(-1, 1))
             assert score >= 0 and score <= 1
 
 
 def move_batch_to_expected_device(batch: Dict[str, List], use_gpu: bool) -> Dict:
-    device = 'cuda' if use_gpu else 'cpu'
-    return {key: [value.to(device) if isinstance(value, Tensor) else value for value in values]
-            for key, values in batch.items()}
+    device = "cuda" if use_gpu else "cpu"
+    return {
+        key: [
+            value.to(device) if isinstance(value, Tensor) else value for value in values
+        ]
+        for key, values in batch.items()
+    }
 
 
 CONTAINER_DATASET_DIR = {
@@ -111,14 +129,15 @@ def move_batch_to_expected_device(batch: Dict[str, List], use_gpu: bool) -> Dict
 }
 
 
-@pytest.mark.parametrize("container_type", [PandaImageNetMIL,
-                                            TcgaCrckImageNetMIL])
+@pytest.mark.parametrize("container_type", [PandaImageNetMIL, TcgaCrckImageNetMIL])
 @pytest.mark.parametrize("use_gpu", [True, False])
 def test_container(container_type: Type[LightningContainer], use_gpu: bool) -> None:
     dataset_dir = CONTAINER_DATASET_DIR[container_type]
     if not os.path.isdir(dataset_dir):
-        pytest.skip(f"Dataset for container {container_type.__name__} "
-                    f"is unavailable: {dataset_dir}")
+        pytest.skip(
+            f"Dataset for container {container_type.__name__} "
+            f"is unavailable: {dataset_dir}"
+        )
     container = container_type()
     container.setup()
 
@@ -132,10 +151,10 @@ def test_container(container_type: Type[LightningContainer], use_gpu: bool) -> N
     for batch_idx, batch in enumerate(train_data_loader):
         batch = move_batch_to_expected_device(batch, use_gpu)
         loss = module.training_step(batch, batch_idx)
-        loss.retain_grad()
-        loss.backward()
-        assert loss.grad is not None
-        assert loss.shape == ()
+        loss.retain_grad()  # noqa
+        loss.backward()  # noqa
+        assert loss.grad is not None  # noqa
+        assert loss.shape == ()  # noqa
         assert isinstance(loss, Tensor)
         break
 
     val_data_loader = data_module.val_dataloader()
     for batch_idx, batch in enumerate(val_data_loader):
         batch = move_batch_to_expected_device(batch, use_gpu)
         loss = module.validation_step(batch, batch_idx)
-        assert loss.shape == ()
+        assert loss.shape == ()  # noqa
         assert isinstance(loss, Tensor)
         break
 
     test_data_loader = data_module.test_dataloader()
     for batch_idx, batch in enumerate(test_data_loader):
         batch = move_batch_to_expected_device(batch, use_gpu)
         outputs_dict = module.test_step(batch, batch_idx)
-        loss = outputs_dict[ResultsKey.LOSS]
+        loss = outputs_dict[ResultsKey.LOSS]  # noqa
         assert loss.shape == ()
         assert isinstance(loss, Tensor)
         break
 
 
 def test_class_weights_binary() -> None:
     class_weights = Tensor([0.5, 3.5])
     n_classes = 1
-    module = DeepMILModule(encoder=get_supervised_imagenet_encoder(),
-                           label_column='label',
-                           n_classes=n_classes,
-                           pooling_layer=AttentionLayer,
-                           pool_hidden_dim=5,
-                           pool_out_dim=1,
-                           class_weights=class_weights)
+    module = DeepMILModule(
+        encoder=get_supervised_imagenet_encoder(),
+        label_column="label",
+        n_classes=n_classes,
+        pooling_layer=AttentionLayer,
+        pool_hidden_dim=5,
+        pool_out_dim=1,
+        class_weights=class_weights,
+    )
     logits = Tensor(randn(1, n_classes))
-    bag_label = randint(n_classes+1, size=(1,))
+    bag_label = randint(n_classes + 1, size=(1,))
 
-    pos_weight = Tensor([class_weights[1]/(class_weights[0]+1e-5)])
+    pos_weight = Tensor([class_weights[1] / (class_weights[0] + 1e-5)])
     loss_weighted = module.loss_fn(logits.squeeze(1), bag_label.float())
     criterion_unweighted = nn.BCEWithLogitsLoss()
     loss_unweighted = criterion_unweighted(logits.squeeze(1), bag_label.float())
     if bag_label.item() == 1:
-        assert allclose(loss_weighted, pos_weight*loss_unweighted)
+        assert allclose(loss_weighted, pos_weight * loss_unweighted)
     else:
         assert allclose(loss_weighted, loss_unweighted)
 
 
 def test_class_weights_multiclass() -> None:
     class_weights = Tensor([0.33, 0.33, 0.33])
     n_classes = 3
-    module = DeepMILModule(encoder=get_supervised_imagenet_encoder(),
-                           label_column='label',
-                           n_classes=n_classes,
-                           pooling_layer=AttentionLayer,
-                           pool_hidden_dim=5,
-                           pool_out_dim=1,
-                           class_weights=class_weights)
+    module = DeepMILModule(
+        encoder=get_supervised_imagenet_encoder(),
+        label_column="label",
+        n_classes=n_classes,
+        pooling_layer=AttentionLayer,
+        pool_hidden_dim=5,
+        pool_out_dim=1,
+        class_weights=class_weights,
+    )
     logits = Tensor(randn(1, n_classes))
     bag_label = randint(n_classes, size=(1,))

From 028fcd8b0518caa885ff8ff558804507e48b9a09 Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Tue, 14 Dec 2021 10:21:49 +0000
Subject: [PATCH 10/15] removing black formatting, it adds too much noise

---
 .pre-commit-config.yaml | 6 ------
 1 file changed, 6 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 342c8dfc7..b3778fa5b 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -27,9 +27,3 @@ repos:
   rev: v1.5.7
   hooks:
   - id: autopep8
-
-- repo: https://github.com/ambv/black
-  rev: 21.9b0
-  hooks:
-  - id: black
-    language_version: python3.7

From fe770c6a54566f701fa50f24f75e33651cbd7a0b Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Tue, 14 Dec 2021 14:11:38 +0000
Subject: [PATCH 11/15] moving checkpoint name into separate file

---
 .../ML/configs/histo_configs/classification/DeepSMILEPanda.py | 3 ++-
 InnerEye/ML/configs/histo_configs/run_ids.py                  | 1 +
 2 files changed, 3 insertions(+), 1 deletion(-)
 create mode 100644 InnerEye/ML/configs/histo_configs/run_ids.py

diff --git a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
index f42c42362..0fbd940bf 100644
--- a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
+++ b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
@@ -24,6 +24,7 @@
     InnerEyeSSLEncoder,
 )
 from InnerEye.ML.configs.histo_configs.classification.BaseMIL import BaseMIL
+from InnerEye.ML.configs.histo_configs.run_ids import innereye_ssl_checkpoint
 from health_azure.utils import CheckpointDownloader
@@ -75,7 +76,7 @@ def setup(self) -> None:
         if self.encoder_type == InnerEyeSSLEncoder.__name__:
             self.downloader = CheckpointDownloader(
                 azure_config_json_path=get_default_azure_config_json_path(),
-                run_recovery_id="hsharma_panda_explore:hsharma_panda_explore_1638437076_357167ae",
+                run_recovery_id=innereye_ssl_checkpoint,
                 checkpoint_filename="last.ckpt",
                 download_dir="outputs/",
             )
diff --git a/InnerEye/ML/configs/histo_configs/run_ids.py b/InnerEye/ML/configs/histo_configs/run_ids.py
new file mode 100644
index 000000000..0c9ca2163
--- /dev/null
+++ b/InnerEye/ML/configs/histo_configs/run_ids.py
@@ -0,0 +1 @@
+innereye_ssl_checkpoint = "hsharma_panda_explore:hsharma_panda_explore_1638437076_357167ae"

From 862825a7320eb6e195d29526d86ed760b3e2bbfa Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Tue, 14 Dec 2021 14:30:09 +0000
Subject: [PATCH 12/15] fix linting

---
 InnerEye/ML/Histopathology/datamodules/panda_module.py     | 5 ++++-
 .../configs/histo_configs/classification/DeepSMILEPanda.py | 2 +-
 Tests/ML/histopathology/models/test_deepmil.py             | 2 +-
 3 files changed, 6 insertions(+), 3 deletions(-)

diff --git a/InnerEye/ML/Histopathology/datamodules/panda_module.py b/InnerEye/ML/Histopathology/datamodules/panda_module.py
index c28073a25..64b974ca6 100644
--- a/InnerEye/ML/Histopathology/datamodules/panda_module.py
+++ b/InnerEye/ML/Histopathology/datamodules/panda_module.py
@@ -3,7 +3,7 @@
 #  Licensed under the MIT License (MIT). See LICENSE in the repo root for license information.
 #  ------------------------------------------------------------------------------------------
 
-from typing import Tuple
+from typing import Tuple, Any
 
 from InnerEye.ML.Histopathology.datamodules.base_module import TilesDataModule
 from InnerEye.ML.Histopathology.datasets.panda_tiles_dataset import PandaTilesDataset
@@ -15,6 +15,9 @@ class PandaTilesDataModule(TilesDataModule):
     Method get_splits() returns the train, val, test splits from the PANDA dataset
     """
 
+    def __init__(self, **kwargs: Any) -> None:
+        super().__init__(**kwargs)
+
     def get_splits(self) -> Tuple[PandaTilesDataset, PandaTilesDataset, PandaTilesDataset]:
         dataset = PandaTilesDataset(self.root_path)
         splits = DatasetSplits.from_proportions(dataset.dataset_df.reset_index(),
diff --git a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
index 0fbd940bf..1ebeaeaa5 100644
--- a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
+++ b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
@@ -95,7 +95,7 @@ def get_data_module(self) -> PandaTilesDataModule:
             ]
         )
         return PandaTilesDataModule(
-            root_path=self.local_dataset,  # noqa
+            root_path=self.local_dataset,
             max_bag_size=self.max_bag_size,
             batch_size=self.batch_size,
             transform=transform,
diff --git a/Tests/ML/histopathology/models/test_deepmil.py b/Tests/ML/histopathology/models/test_deepmil.py
index 04d86e1b4..1f367a715 100644
--- a/Tests/ML/histopathology/models/test_deepmil.py
+++ b/Tests/ML/histopathology/models/test_deepmil.py
@@ -141,7 +141,7 @@ def test_container(container_type: Type[LightningContainer], use_gpu: bool) -> N
     container = container_type()
     container.setup()
 
-    data_module: TilesDataModule = container.get_data_module()
+    data_module: TilesDataModule = container.get_data_module()  # noqa
     data_module.max_bag_size = 10
     module = container.create_model()
     if use_gpu:

From ec4f5823ffba4b44f37c58055f7c35730a3d5a42 Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Tue, 14 Dec 2021 14:36:18 +0000
Subject: [PATCH 13/15] feedback from Max

---
 InnerEye/ML/Histopathology/models/deepmil.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/InnerEye/ML/Histopathology/models/deepmil.py b/InnerEye/ML/Histopathology/models/deepmil.py
index 757364660..e42eacb84 100644
--- a/InnerEye/ML/Histopathology/models/deepmil.py
+++ b/InnerEye/ML/Histopathology/models/deepmil.py
@@ -3,6 +3,7 @@
 #  Licensed under the MIT License (MIT). See LICENSE in the repo root for license information.
 #  ------------------------------------------------------------------------------------------
 
+import logging
 from pathlib import Path
 import pandas as pd
 import numpy as np
@@ -201,10 +202,14 @@ def _shared_step(self, batch: Dict, batch_idx: int, stage: str) -> Dict[ResultsK
                         ResultsKey.PROB: probs, ResultsKey.PRED_LABEL: preds,
                         ResultsKey.TRUE_LABEL: bag_labels, ResultsKey.BAG_ATTN: bag_attn_list,
                         ResultsKey.IMAGE: batch[TilesDataset.IMAGE_COLUMN]})
+
         if (TilesDataset.TILE_X_COLUMN in batch.keys()) and (TilesDataset.TILE_Y_COLUMN in batch.keys()):
             results.update({ResultsKey.TILE_X: batch[TilesDataset.TILE_X_COLUMN],
                             ResultsKey.TILE_Y: batch[TilesDataset.TILE_Y_COLUMN]}
                            )
+        else:
+            logging.warning("Coordinates not found in batch. If this is not expected check your input tiles dataset.")
+
         return results

From 18e18de247bb01e7155d757d1089351fd4317f1b Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Tue, 14 Dec 2021 14:47:16 +0000
Subject: [PATCH 14/15] using get_workspace from himl_azure

---
 InnerEye/Azure/azure_util.py                        | 12 ++----------
 .../histo_configs/classification/DeepSMILEPanda.py  | 10 ++++++----
 2 files changed, 8 insertions(+), 14 deletions(-)

diff --git a/InnerEye/Azure/azure_util.py b/InnerEye/Azure/azure_util.py
index c361af861..856c9f747 100644
--- a/InnerEye/Azure/azure_util.py
+++ b/InnerEye/Azure/azure_util.py
@@ -251,7 +251,7 @@ def strip_prefix(string: str, prefix: str) -> str:
     :return: Input string with prefix removed.
     """
     if string.startswith(prefix):
-        return string[len(prefix) :]
+        return string[len(prefix):]
     return string
@@ -331,7 +331,7 @@ def download_run_outputs_by_prefix(
     # (120sec timeout for all files).
     for file in run.get_file_names():
         if file.startswith(prefix_str):
-            target_path = file[len(prefix_str) :]
+            target_path = file[len(prefix_str):]
             if target_path.startswith("/"):
                 target_path = target_path[1:]
             logging.info(f"Downloading {file}")
@@ -403,11 +403,3 @@ def step_up_directories(path: Path) -> Generator[Path, None, None]:
         if parent == path:
             break
         path = parent
-
-
-def get_default_azure_config_json_path() -> Path:
-    """
-    Gets the path to the project's default Azure config JSON file.
-    """
-    azure_config_json_path = fixed_paths.repository_root_directory() / "config.json"
-    return azure_config_json_path
diff --git a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
index 1ebeaeaa5..17f61921f 100644
--- a/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
+++ b/InnerEye/ML/configs/histo_configs/classification/DeepSMILEPanda.py
@@ -8,11 +8,14 @@
 import os
 from monai.transforms import Compose
 from pytorch_lightning.callbacks.model_checkpoint import ModelCheckpoint
+
+from health_azure.utils import CheckpointDownloader
+from health_azure.utils import get_workspace
+from health_ml.networks.layers.attention_layers import GatedAttentionLayer
 from InnerEye.Common import fixed_paths
 from InnerEye.ML.Histopathology.datamodules.panda_module import PandaTilesDataModule
-from InnerEye.Azure.azure_util import get_default_azure_config_json_path
 from InnerEye.ML.Histopathology.datasets.panda_tiles_dataset import PandaTilesDataset
-from health_ml.networks.layers.attention_layers import GatedAttentionLayer
+
 from InnerEye.ML.Histopathology.models.transforms import (
     EncodeTilesBatchd,
     LoadTilesBatchd,
 )
@@ -25,7 +28,6 @@
 )
 from InnerEye.ML.configs.histo_configs.classification.BaseMIL import BaseMIL
 from InnerEye.ML.configs.histo_configs.run_ids import innereye_ssl_checkpoint
-from health_azure.utils import CheckpointDownloader
@@ -75,7 +77,7 @@ def cache_dir(self) -> Path:
     def setup(self) -> None:
         if self.encoder_type == InnerEyeSSLEncoder.__name__:
             self.downloader = CheckpointDownloader(
-                azure_config_json_path=get_default_azure_config_json_path(),
+                azure_config_json_path=get_workspace(),
                 run_recovery_id=innereye_ssl_checkpoint,
                 checkpoint_filename="last.ckpt",
                 download_dir="outputs/",
             )

From 35b5bde760223b99d72a28c2c0a9bd8435844b04 Mon Sep 17 00:00:00 2001
From: vsalvatelli
Date: Tue, 14 Dec 2021 15:23:28 +0000
Subject: [PATCH 15/15] trying to fix types in test_deepmil

---
 Tests/ML/histopathology/models/test_deepmil.py | 29 ++++++++++++-------
 1 file changed, 18 insertions(+), 11 deletions(-)

diff --git a/Tests/ML/histopathology/models/test_deepmil.py b/Tests/ML/histopathology/models/test_deepmil.py
index 1f367a715..797b3080c 100644
--- a/Tests/ML/histopathology/models/test_deepmil.py
+++ b/Tests/ML/histopathology/models/test_deepmil.py
@@ -17,10 +17,10 @@
 from InnerEye.ML.lightning_container import LightningContainer
 from InnerEye.ML.configs.histo_configs.classification.DeepSMILECrck import (
-    TcgaCrckImageNetMIL,
+    DeepSMILECrck,
 )
 from InnerEye.ML.configs.histo_configs.classification.DeepSMILEPanda import (
-    PandaImageNetMIL,
+    DeepSMILEPanda,
 )
 from InnerEye.ML.Histopathology.datamodules.base_module import TilesDataModule
 from InnerEye.ML.Histopathology.datasets.default_paths import (
@@ -124,12 +124,13 @@ def move_batch_to_expected_device(batch: Dict[str, List], use_gpu: bool) -> Dict
 
 CONTAINER_DATASET_DIR = {
-    PandaImageNetMIL: PANDA_TILES_DATASET_DIR,
-    TcgaCrckImageNetMIL: TCGA_CRCK_DATASET_DIR,
+    DeepSMILEPanda: PANDA_TILES_DATASET_DIR,
+    DeepSMILECrck: TCGA_CRCK_DATASET_DIR,
 }
 
 
-@pytest.mark.parametrize("container_type", [PandaImageNetMIL, TcgaCrckImageNetMIL])
+@pytest.mark.parametrize("container_type", [DeepSMILEPanda,
+                                            DeepSMILECrck])
 @pytest.mark.parametrize("use_gpu", [True, False])
 def test_container(container_type: Type[LightningContainer], use_gpu: bool) -> None:
     dataset_dir = CONTAINER_DATASET_DIR[container_type]
     if not os.path.isdir(dataset_dir):
         pytest.skip(
             f"Dataset for container {container_type.__name__} "
             f"is unavailable: {dataset_dir}"
         )
-    container = container_type()
+    if container_type is DeepSMILECrck:
+        container = DeepSMILECrck(encoder_type=ImageNetEncoder.__name__)
+    elif container_type is DeepSMILEPanda:
+        container = DeepSMILEPanda(encoder_type=ImageNetEncoder.__name__)
+    else:
+        container = container_type()
+
     container.setup()
 
-    data_module: TilesDataModule = container.get_data_module()  # noqa
+    data_module: TilesDataModule = container.get_data_module()  # type: ignore
     data_module.max_bag_size = 10
     module = container.create_model()
     if use_gpu:
@@ -151,10 +158,10 @@ def test_container(container_type: Type[LightningContainer], use_gpu: bool) -> N
     for batch_idx, batch in enumerate(train_data_loader):
         batch = move_batch_to_expected_device(batch, use_gpu)
         loss = module.training_step(batch, batch_idx)
-        loss.retain_grad()  # noqa
-        loss.backward()  # noqa
-        assert loss.grad is not None  # noqa
-        assert loss.shape == ()  # noqa
+        loss.retain_grad()
+        loss.backward()
+        assert loss.grad is not None
+        assert loss.shape == ()
         assert isinstance(loss, Tensor)
         break
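Taken together, the parametrized test above doubles as a usage recipe for the new PANDA config. A minimal smoke-test sketch outside pytest, mirroring test_container(); it assumes the tiles dataset is present under /tmp/datasets/PANDA_tiles and that a CUDA device is available, since DeepSMILEPanda.setup() moves the encoder to GPU:

    from torch import Tensor
    from InnerEye.ML.configs.histo_configs.classification.DeepSMILEPanda import DeepSMILEPanda
    from InnerEye.ML.Histopathology.models.encoders import ImageNetEncoder

    container = DeepSMILEPanda(encoder_type=ImageNetEncoder.__name__)
    container.setup()                      # builds the ImageNet tile encoder (on GPU)
    data_module = container.get_data_module()
    data_module.max_bag_size = 10          # small bags keep the check fast
    module = container.create_model().cuda()
    batch = next(iter(data_module.train_dataloader()))
    batch = {key: [v.cuda() if isinstance(v, Tensor) else v for v in values]
             for key, values in batch.items()}  # same device handling as the test helper
    loss = module.training_step(batch, 0)
    print(float(loss))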