Project-MONAI
diff --git a/‎.gitignore
Lines changed: 10 additions & 0 deletions b/‎.gitignore
Lines changed: 10 additions & 0 deletions
diff --git a/‎3d_classification/densenet_training_array.ipynb
Lines changed: 59 additions & 32 deletions b/‎3d_classification/densenet_training_array.ipynb
Lines changed: 59 additions & 32 deletions
diff --git a/‎federated_learning/breast_density_challenge/.dockerignore
Lines changed: 3 additions & 0 deletions b/‎federated_learning/breast_density_challenge/.dockerignore
Lines changed: 3 additions & 0 deletions
diff --git a/‎federated_learning/breast_density_challenge/.gitignore
Lines changed: 12 additions & 0 deletions b/‎federated_learning/breast_density_challenge/.gitignore
Lines changed: 12 additions & 0 deletions
diff --git a/‎federated_learning/breast_density_challenge/Dockerfile
Lines changed: 36 additions & 0 deletions b/‎federated_learning/breast_density_challenge/Dockerfile
Lines changed: 36 additions & 0 deletions
diff --git a/‎federated_learning/breast_density_challenge/README.md
Lines changed: 176 additions & 0 deletions b/‎federated_learning/breast_density_challenge/README.md
Lines changed: 176 additions & 0 deletions
@@ -138,3 +138,13 @@ tests/testing_data/*Hippocampus*
 # Ignore torch saves
 */torch/runs
 logs
+*/runs
+lightning_logs
+
+# ignore automatically created files
+*.ts
+nohup.out
+deepgrow/ignite/_image.nii.gz
+*.zip
+deployment/bentoml/mednist_classifier_bentoml.py
+deployment/ray/mednist_classifier_start.py
@@ -131,40 +131,17 @@
     }
    ],
    "source": [
-    "# set this in your environment or previous cell to wherever IXI is downloaded and extracted\n",
+    "# Set data directory\n",
     "directory = os.environ.get(\"MONAI_DATA_DIRECTORY\")\n",
-    "\n",
-    "if directory is None:\n",
-    "    resource = \"http://biomedic.doc.ic.ac.uk/brain-development/downloads/IXI/IXI-T1.tar\"\n",
-    "    md5 = \"34901a0593b41dd19c1a1f746eac2d58\"\n",
-    "\n",
-    "    root_dir = tempfile.mkdtemp()\n",
-    "\n",
-    "    dataset_dir = os.path.join(root_dir, \"ixi\")\n",
-    "    tarfile_name = f\"{dataset_dir}.tar\"\n",
-    "\n",
-    "    download_and_extract(resource, tarfile_name, dataset_dir, md5)\n",
-    "else:\n",
-    "    root_dir = directory\n",
-    "\n",
+    "root_dir = tempfile.mkdtemp() if directory is None else directory\n",
     "print(root_dir)"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": 4,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "<class 'torch.Tensor'> torch.Size([3, 1, 96, 96, 96]) tensor([[1., 0.],\n",
-      "        [1., 0.],\n",
-      "        [1., 0.]]) torch.Size([3, 2])\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
     "# IXI dataset as a demo, downloadable from https://brain-development.org/ixi-dataset/\n",
     "images = [\n",
@@ -195,8 +172,58 @@
     "\n",
     "# Represent labels in one-hot format for binary classifier training,\n",
     "# BCEWithLogitsLoss requires target to have same shape as input\n",
-    "labels = torch.nn.functional.one_hot(torch.as_tensor(labels)).float()\n",
+    "labels = torch.nn.functional.one_hot(torch.as_tensor(labels)).float()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "ixi.tar: 100%|██████████| 4.51G/4.51G [08:19<00:00, 9.70MB/s]   \n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "2022-05-04 12:23:06,530 - INFO - Downloaded: /mnt/data/rbrown/Documents/Data/MONAI/ixi.tar\n",
+      "2022-05-04 12:23:13,734 - INFO - Verified 'ixi.tar', md5: 34901a0593b41dd19c1a1f746eac2d58.\n",
+      "2022-05-04 12:23:13,735 - INFO - Writing into directory: /mnt/data/rbrown/Documents/Data/MONAI/ixi.\n"
+     ]
+    }
+   ],
+   "source": [
+    "if not os.path.isfile(images[0]):\n",
+    "    resource = \"http://biomedic.doc.ic.ac.uk/brain-development/downloads/IXI/IXI-T1.tar\"\n",
+    "    md5 = \"34901a0593b41dd19c1a1f746eac2d58\"\n",
     "\n",
+    "    dataset_dir = os.path.join(root_dir, \"ixi\")\n",
+    "    tarfile_name = f\"{dataset_dir}.tar\"\n",
+    "\n",
+    "    download_and_extract(resource, tarfile_name, dataset_dir, md5)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "<class 'torch.Tensor'> torch.Size([3, 1, 96, 96, 96]) tensor([[1., 0.],\n",
+      "        [1., 0.],\n",
+      "        [1., 0.]]) torch.Size([3, 2])\n"
+     ]
+    }
+   ],
+   "source": [
     "# Define transforms\n",
     "train_transforms = Compose([ScaleIntensity(), AddChannel(), Resize((96, 96, 96)), RandRotate90(), EnsureType()])\n",
     "\n",
@@ -220,7 +247,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": 7,
    "metadata": {},
    "outputs": [
     {
@@ -367,7 +394,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": 8,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -395,7 +422,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": 9,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -405,7 +432,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": 10,
    "metadata": {
     "scrolled": true,
     "tags": []
@@ -462,7 +489,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
+   "execution_count": 11,
    "metadata": {},
    "outputs": [],
    "source": [
 
@@ -0,0 +1,3 @@
+# Ignore the following files/folders during docker build
+
+__pycache__/
@@ -0,0 +1,12 @@
+# IDE
+.idea/
+
+# artifacts
+poc/
+*.pyc
+result_*
+*.pth
+logs
+
+# example data
+*preprocessed*
@@ -0,0 +1,36 @@
+# use python base image
+FROM python:3.8.10
+ENV DEBIAN_FRONTEND noninteractive
+
+# specify the server FQDN as commandline argument
+ARG server_fqdn
+RUN echo "Setting up FL workspace wit FQDN: ${server_fqdn}"
+
+# add your code to container
+COPY code /code
+
+# add code to path
+ENV PYTHONPATH=${PYTHONPATH}:"/code"
+
+# install dependencies
+# RUN python -m pip install --upgrade pip
+RUN pip3 install tensorboard sklearn torchvision
+RUN pip3 install monai==0.8.1
+RUN pip3 install nvflare==2.0.16
+
+# mount nvflare from source
+#RUN pip install tenseal
+#WORKDIR /code
+#RUN git clone https://github.com/NVIDIA/NVFlare.git
+#ENV PYTHONPATH=${PYTHONPATH}:"/code/NVFlare"
+
+# download pretrained weights
+ENV TORCH_HOME=/opt/torch
+RUN python3 /code/pt/utils/download_model.py --model_url=https://download.pytorch.org/models/resnet18-f37072fd.pth
+
+# prepare FL workspace
+WORKDIR /code
+RUN sed -i "s|{SERVER_FQDN}|${server_fqdn}|g" fl_project.yml
+RUN python3 -m nvflare.lighter.provision -p fl_project.yml
+RUN cp -r workspace/fl_project/prod_00 fl_workspace
+RUN mv fl_workspace/${server_fqdn} fl_workspace/server
@@ -0,0 +1,176 @@
+## MammoFL_MICCAI2022
+
+Reference implementation for
+[ACR-NVIDIA-NCI Breast Density FL challenge](http://BreastDensityFL.acr.org).
+
+Held in conjunction with [MICCAI 2022](https://conferences.miccai.org/2022/en/).
+
+
+------------------------------------------------
+## 1. Run Training using [NVFlare](https://github.com/NVIDIA/NVFlare) reference implementation
+
+We provide a minimal example of how to implement Federated Averaging using [NVFlare 2.0](https://github.com/NVIDIA/NVFlare) and [MONAI](https://monai.io/) to train
+ a breast density prediction model with ResNet18.
+
+### 1.1 Download example data
+Follow the steps described in [./data/README.md](./data/README.md) to download an example breast density mammography dataset.
+Note, the data used in the actual challenge will be different. We do however follow the same preprocessing steps and
+use the same four BI-RADS breast density classes for prediction, See [./code/pt/utils/preprocess_dicomdir.py](./code/pt/utils/preprocess_dicomdir.py) for details.
+
+We provide a set of random data splits. Please download them using
+```
+python3 ./code/pt/utils/download_datalists_and_predictions.py
+```
+After download, they will be available as `./data/dataset_blinded_site-*.json` which follows the same format as what
+will be used in the challenge.
+Please do not modify the data list filenames in the configs as they will be the same during the challenge.
+
+Note, the location of the dataset and data lists will be given by the system.
+Do not change the locations given in [config_fed_client.json](./code/configs/mammo_fedavg/config/config_fed_client.json):
+```
+  "DATASET_ROOT": "/data/preprocessed",
+  "DATALIST_PREFIX": "/data/dataset_blinded_",
+```
+
+### 1.2 Build container
+The argument specifies the FQDN (Fully Qualified Domain Name) of the FL server. Use `localhost` when simulating FL on your machine.
+```
+./build_docker.sh localhost
+```
+Note, all code and pretrained models need to be included in the docker image.
+The virtual machines running the containers will not have public internet access during training.
+For an example, please see the `download_model.py` used to download ImageNet pretrained weights in this example.
+
+The Dockerfile will be submitted using the [MedICI platform](https://www.medici-challenges.org).
+For detailed instructions, see the [challenge website](http://BreastDensityFL.acr.org).
+
+### 1.3 Run server and clients containers, and start training
+Run all commands at once using. Note this will also create separate logs under `./logs`
+```
+./run_all_fl.sh
+```
+Note, the GPU index to use for each client is specified inside `run_all_fl.sh`.
+See the individual `run_docker_site-*.sh` commands described below.
+Note, the server script will automatically kill all running container used in this example
+and final results will be placed under `./result_server`.
+
+(optional) Run each command in a separate terminals to get site-specific printouts in separate windows.
+
+The argument for each shell script specifies the GPU index to be used.
+```
+./run_docker_server.sh
+./run_docker_site-1.sh 0
+./run_docker_site-2.sh 1
+./run_docker_site-3.sh 0
+```
+
+### 1.4 (Optional) Visualize training using TensorBoard
+After training completed, the training curves can be visualized using
+```
+tensorboard --logdir=./result_server
+```
+A visualization of the global accuracy and [Kappa](https://scikit-learn.org/stable/modules/generated/sklearn.metrics.cohen_kappa_score.html) validation scores for each site with the provided example data is shown below.
+The current setup runs on a machine with two NVIDIA GPUs with 12GB memory each.
+The runtime for this experiment is about 45 minutes.
+You can adjust the argument to the `run_docker_site-*.sh` scripts to specify different
+GPU indices if needed in your environment.
+
+![](./figs/example_data_val_global_acc_kappa.png)
+
+### 1.5 (Optional) Kill all containers
+If you didn't use `run_all_fl.sh`, all containers can be killed by running
+```
+docker kill server site-1 site-2 site-3
+```
+
+
+------------------------------------------------
+## 2. Modify the FL algorithm
+
+You can modify and extend the provided example code under [./code/pt](./code/pt).
+
+You could use other components available at [NVFlare](https://github.com/NVIDIA/NVFlare)
+or enhance the training pipeline using your custom code or features of other libraries.
+
+See the [NVFlare examples](https://github.com/NVIDIA/NVFlare/tree/main/examples) for features that could be utilized in this challenge.
+
+### 2.1 Debugging the learning algorithm
+
+The example NVFlare `Learner` class is implemented at [./code/pt/learners/mammo_learner.py](./code/pt/learners/mammo_learner.py).
+You can debug the file using the `MockClientEngine` as shown in the script by running
+```
+python3 code/pt/learners/mammo_learner.py
+```
+Furthermore, you can test it inside the container, by first running
+```
+./run_docker_debug.sh
+```
+Note, set `inside_container = True` to reflect the changed filepaths inside the container.
+
+
+------------------------------------------------
+## 3. Bring your own FL framework
+If you would like to use your own FL framework to participate in the challenge,
+please modify the Dockerfile accordingly to include all the dependencies.
+
+Your container needs to provide the following scripts that implement the starting of server, clients, and finalizing of the server.
+They will be executed by the system in the following order.
+
+### 3.1 start server
+```
+/code/start_server.sh
+```
+
+### 3.2 start each client (in parallel)
+```
+/code/start_site-1.sh
+/code/start_site-2.sh
+/code/start_site-3.sh
+```
+
+### 3.3 finalize the server
+```
+/code/finalize_server.sh
+```
+For an example on how the challenge system will execute these commands, see the provided `run_docker*.sh` scripts.
+
+### 3.4 Communication
+The communication channels for FL will be restricted to the ports specified in [fl_project.yml](./code/fl_project.yml).
+Your FL framework will also need those ports for implementing the communication.
+
+### 3.5 Results
+Results will need to be written to `/result/predictions.json`.
+Please follow the format produced by the reference implementation at [./result_server_example/predictions.json](./result_server_example/predictions.json)
+(available after running `python3 ./code/pt/utils/download_datalists_and_predictions.py`)
+The code is expected to return a json file containing at least list of image names and prediction probabilities for each breast density class
+for the global model (should be named `SRV_best_FL_global_model.pt`).
+```
+{
+	"site-1": {
+		"SRV_best_FL_global_model.pt": {
+            ...
+			"test_probs": [{
+				"image": "Calc-Test_P_00643_LEFT_MLO.npy",
+				"probs": [0.005602597258985043, 0.7612965703010559, 0.23040543496608734, 0.0026953918859362602]
+			}, {
+			...
+    },
+	"site-2": {
+		"SRV_best_FL_global_model.pt": {
+            ...
+			"test_probs": [{
+				"image": "Calc-Test_P_00643_LEFT_MLO.npy",
+				"probs": [0.005602597258985043, 0.7612965703010559, 0.23040543496608734, 0.0026953918859362602]
+			}, {
+			...
+    },
+	"site-3": {
+		"SRV_best_FL_global_model.pt": {
+            ...
+			"test_probs": [{
+				"image": "Calc-Test_P_00643_LEFT_MLO.npy",
+				"probs": [0.005602597258985043, 0.7612965703010559, 0.23040543496608734, 0.0026953918859362602]
+			}, {
+			...
+    }
+```
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+# Ignore the following files/folders during docker build`
	`2`	`+`
	`3`	`+__pycache__/`