Project-MONAI
diff --git a/‎automatic_mixed_precision.ipynb
Lines changed: 63 additions & 48 deletions b/‎automatic_mixed_precision.ipynb
Lines changed: 63 additions & 48 deletions
diff --git a/‎brats_segmentation_3d.ipynb
Lines changed: 35 additions & 8 deletions b/‎brats_segmentation_3d.ipynb
Lines changed: 35 additions & 8 deletions
diff --git a/‎cache_dataset_speed.ipynb
Lines changed: 41 additions & 14 deletions b/‎cache_dataset_speed.ipynb
Lines changed: 41 additions & 14 deletions
@@ -115,7 +115,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": 2,
    "metadata": {},
    "outputs": [
     {
@@ -143,7 +143,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": 3,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -165,7 +165,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": 4,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -185,7 +185,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": 5,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -225,7 +225,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": 6,
    "metadata": {
     "scrolled": true
    },
@@ -349,44 +349,52 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 14,
+   "execution_count": 8,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Tue Aug 11 05:17:40 2020       \r\n",
-      "+-----------------------------------------------------------------------------+\r\n",
-      "| NVIDIA-SMI 440.44       Driver Version: 440.44       CUDA Version: 10.2     |\r\n",
-      "|-------------------------------+----------------------+----------------------+\r\n",
-      "| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |\r\n",
-      "| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |\r\n",
-      "|===============================+======================+======================|\r\n",
-      "|   0  Tesla V100-PCIE...  Off  | 00000000:02:00.0 Off |                    0 |\r\n",
-      "| N/A   38C    P0    36W / 250W |   3329MiB / 32510MiB |      0%      Default |\r\n",
-      "+-------------------------------+----------------------+----------------------+\r\n",
-      "|   1  Tesla V100-PCIE...  Off  | 00000000:03:00.0 Off |                    0 |\r\n",
-      "| N/A   40C    P0    38W / 250W |   4722MiB / 32510MiB |      0%      Default |\r\n",
-      "+-------------------------------+----------------------+----------------------+\r\n",
-      "                                                                               \r\n",
-      "+-----------------------------------------------------------------------------+\r\n",
-      "| Processes:                                                       GPU Memory |\r\n",
-      "|  GPU       PID   Type   Process name                             Usage      |\r\n",
-      "|=============================================================================|\r\n",
-      "+-----------------------------------------------------------------------------+\r\n"
+      "Tesla V100-PCIE-32GB\n",
+      "|===========================================================================|\n",
+      "|                  PyTorch CUDA memory summary, device ID 0                 |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "|            CUDA OOMs: 0            |        cudaMalloc retries: 0         |\n",
+      "|===========================================================================|\n",
+      "|        Metric         | Cur Usage  | Peak Usage | Tot Alloc  | Tot Freed  |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| Allocated memory      |       0 B  |    1152 MB |  200906 MB |  200906 MB |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| Active memory         |       0 B  |    1152 MB |  200906 MB |  200906 MB |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| GPU reserved memory   |    2112 MB |    2112 MB |    2112 MB |       0 B  |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| Non-releasable memory |       0 B  |  455384 KB |  100324 MB |  100324 MB |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| Allocations           |       0    |     609    |   30778    |   30778    |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| Active allocs         |       0    |     609    |   30778    |   30778    |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| GPU reserved segments |      58    |      58    |      58    |       0    |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| Non-releasable allocs |       0    |      73    |   20653    |   20653    |\n",
+      "|===========================================================================|\n",
+      "\n"
      ]
     }
    ],
    "source": [
-    "! nvidia-smi"
+    "print(torch.cuda.get_device_name(0))\n",
+    "print(torch.cuda.memory_summary(0, abbreviated=True))"
    ]
   },
   {
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "## Enable deterministic and train without AMP"
+    "## Enable deterministic and train without AMP\n",
+    "To measure the memory usage correctly, please restart the notebook and skip the AMP training above."
    ]
   },
   {
@@ -411,37 +419,44 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 16,
+   "execution_count": 8,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Tue Aug 11 05:20:12 2020       \r\n",
-      "+-----------------------------------------------------------------------------+\r\n",
-      "| NVIDIA-SMI 440.44       Driver Version: 440.44       CUDA Version: 10.2     |\r\n",
-      "|-------------------------------+----------------------+----------------------+\r\n",
-      "| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |\r\n",
-      "| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |\r\n",
-      "|===============================+======================+======================|\r\n",
-      "|   0  Tesla V100-PCIE...  Off  | 00000000:02:00.0 Off |                    0 |\r\n",
-      "| N/A   41C    P0    37W / 250W |   4579MiB / 32510MiB |      0%      Default |\r\n",
-      "+-------------------------------+----------------------+----------------------+\r\n",
-      "|   1  Tesla V100-PCIE...  Off  | 00000000:03:00.0 Off |                    0 |\r\n",
-      "| N/A   40C    P0    38W / 250W |   4722MiB / 32510MiB |      0%      Default |\r\n",
-      "+-------------------------------+----------------------+----------------------+\r\n",
-      "                                                                               \r\n",
-      "+-----------------------------------------------------------------------------+\r\n",
-      "| Processes:                                                       GPU Memory |\r\n",
-      "|  GPU       PID   Type   Process name                             Usage      |\r\n",
-      "|=============================================================================|\r\n",
-      "+-----------------------------------------------------------------------------+\r\n"
+      "Tesla V100-PCIE-32GB\n",
+      "|===========================================================================|\n",
+      "|                  PyTorch CUDA memory summary, device ID 0                 |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "|            CUDA OOMs: 0            |        cudaMalloc retries: 0         |\n",
+      "|===========================================================================|\n",
+      "|        Metric         | Cur Usage  | Peak Usage | Tot Alloc  | Tot Freed  |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| Allocated memory      |       0 B  |    1730 MB |  279807 MB |  279807 MB |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| Active memory         |       0 B  |    1730 MB |  279807 MB |  279807 MB |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| GPU reserved memory   |    3266 MB |    3266 MB |    3266 MB |       0 B  |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| Non-releasable memory |       0 B  |  630502 KB |  111299 MB |  111299 MB |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| Allocations           |       0    |     542    |   25170    |   25170    |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| Active allocs         |       0    |     542    |   25170    |   25170    |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| GPU reserved segments |      58    |      58    |      58    |       0    |\n",
+      "|---------------------------------------------------------------------------|\n",
+      "| Non-releasable allocs |       0    |      59    |   15985    |   15985    |\n",
+      "|===========================================================================|\n",
+      "\n"
      ]
     }
    ],
    "source": [
-    "! nvidia-smi"
+    "print(torch.cuda.get_device_name(0))\n",
+    "print(torch.cuda.memory_summary(0, abbreviated=True))"
    ]
   },
   {
 
@@ -77,11 +77,33 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 2,
    "metadata": {
     "tags": []
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "MONAI version: 0.1.0+318.ga2cd842\n",
+      "Python version: 3.6.9 |Anaconda, Inc.| (default, Jul 30 2019, 19:07:31)  [GCC 7.3.0]\n",
+      "Numpy version: 1.18.1\n",
+      "Pytorch version: 1.6.0\n",
+      "\n",
+      "Optional dependencies:\n",
+      "Pytorch Ignite version: 0.3.0\n",
+      "Nibabel version: 3.0.1\n",
+      "scikit-image version: 0.15.0\n",
+      "Pillow version: 7.0.0\n",
+      "Tensorboard version: 2.1.0\n",
+      "\n",
+      "For details about installing the optional dependencies, please visit:\n",
+      "    https://docs.monai.io/en/latest/installation.html#installing-the-recommended-dependencies\n",
+      "\n"
+     ]
+    }
+   ],
    "source": [
     "# Copyright 2020 MONAI Consortium\n",
     "# Licensed under the Apache License, Version 2.0 (the \"License\");\n",
@@ -98,7 +120,6 @@
     "import shutil\n",
     "import tempfile\n",
     "\n",
-    "import IPython\n",
     "import matplotlib.pyplot as plt\n",
     "import numpy as np\n",
     "import torch\n",
@@ -142,11 +163,19 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 3,
    "metadata": {
     "tags": []
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "/workspace/data/medical\n"
+     ]
+    }
+   ],
    "source": [
     "directory = os.environ.get(\"MONAI_DATA_DIRECTORY\")\n",
     "root_dir = tempfile.mkdtemp() if directory is None else directory\n",
@@ -487,9 +516,7 @@
     "                f\"current epoch: {epoch + 1} current mean dice: {metric:.4f}\"\n",
     "                f\" tc: {metric_tc:.4f} wt: {metric_wt:.4f} et: {metric_et:.4f}\"\n",
     "                f\"\\nbest mean dice: {best_metric:.4f} at epoch: {best_metric_epoch}\"\n",
-    "            )\n",
-    "\n",
-    "    IPython.display.clear_output()"
+    "            )"
    ]
   },
   {
 
@@ -51,11 +51,33 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 1,
    "metadata": {
     "tags": []
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "MONAI version: 0.1.0+318.ga2cd842.dirty\n",
+      "Python version: 3.6.9 |Anaconda, Inc.| (default, Jul 30 2019, 19:07:31)  [GCC 7.3.0]\n",
+      "Numpy version: 1.18.1\n",
+      "Pytorch version: 1.6.0\n",
+      "\n",
+      "Optional dependencies:\n",
+      "Pytorch Ignite version: 0.3.0\n",
+      "Nibabel version: 3.0.1\n",
+      "scikit-image version: 0.15.0\n",
+      "Pillow version: 7.0.0\n",
+      "Tensorboard version: 2.1.0\n",
+      "\n",
+      "For details about installing the optional dependencies, please visit:\n",
+      "    https://docs.monai.io/en/latest/installation.html#installing-the-recommended-dependencies\n",
+      "\n"
+     ]
+    }
+   ],
    "source": [
     "# Copyright 2020 MONAI Consortium\n",
     "# Licensed under the Apache License, Version 2.0 (the \"License\");\n",
@@ -74,7 +96,6 @@
     "import tempfile\n",
     "import time\n",
     "\n",
-    "import IPython\n",
     "import matplotlib.pyplot as plt\n",
     "import torch\n",
     "\n",
@@ -115,11 +136,19 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 2,
    "metadata": {
     "tags": []
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "/workspace/data/medical\n"
+     ]
+    }
+   ],
    "source": [
     "directory = os.environ.get(\"MONAI_DATA_DIRECTORY\")\n",
     "root_dir = tempfile.mkdtemp() if directory is None else directory\n",
@@ -138,7 +167,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 3,
    "metadata": {
     "tags": []
    },
@@ -149,8 +178,8 @@
     "\n",
     "compressed_file = os.path.join(root_dir, \"Task09_Spleen.tar\")\n",
     "data_dir = os.path.join(root_dir, \"Task09_Spleen\")\n",
-    "\n",
-    "download_and_extract(resource, compressed_file, root_dir, md5)"
+    "if not os.path.exists(data_dir):\n",
+    "    download_and_extract(resource, compressed_file, root_dir, md5)"
    ]
   },
   {
@@ -359,8 +388,6 @@
     "        print(f\"time consuming of epoch {epoch + 1} is: {(time.time() - epoch_start):.4f}\")\n",
     "        epoch_times.append(time.time() - epoch_start)\n",
     "\n",
-    "        IPython.display.clear_output()\n",
-    "\n",
     "    print(\n",
     "        f\"train completed, best_metric: {best_metric:.4f} at epoch: {best_metric_epoch}\"\n",
     "        f\" total time: {(time.time() - total_start):.4f}\"\n",
@@ -507,16 +534,16 @@
     "\n",
     "plt.subplot(2, 2, 3)\n",
     "plt.title(\"Cache Epoch Average Loss\")\n",
-    "x = [i + 1 for i in range(len(epoch_loss_values))]\n",
-    "y = epoch_loss_values\n",
+    "x = [i + 1 for i in range(len(cache_epoch_loss_values))]\n",
+    "y = cache_epoch_loss_values\n",
     "plt.xlabel(\"epoch\")\n",
     "plt.grid(alpha=0.4, linestyle=\":\")\n",
     "plt.plot(x, y, color=\"green\")\n",
     "\n",
     "plt.subplot(2, 2, 4)\n",
     "plt.title(\"Cache Val Mean Dice\")\n",
-    "x = [i + 1 for i in range(len(metric_values))]\n",
-    "y = metric_values\n",
+    "x = [i + 1 for i in range(len(cache_metric_values))]\n",
+    "y = cache_metric_values\n",
     "plt.xlabel(\"epoch\")\n",
     "plt.grid(alpha=0.4, linestyle=\":\")\n",
     "plt.plot(x, y, color=\"green\")\n",