Project-MONAI
diff --git a/‎auto3dseg/notebooks/auto_runner.ipynb
Lines changed: 53 additions & 136 deletions b/‎auto3dseg/notebooks/auto_runner.ipynb
Lines changed: 53 additions & 136 deletions
@@ -10,10 +10,10 @@
     "\n",
     "Specifically, it will show the features below:\n",
     "1. Use `AutoRunner` with an input config file `input.yaml` example\n",
-    "2. How to prepare an `input.yaml`\n",
-    "3. How to configure the input/ouput folders\n",
+    "2. How to prepare the config file `input.yaml`\n",
+    "3. How to configure the paths for inputs, outputs, and intermediate results\n",
     "4. How to set the internal parameters of **Auto3DSeg** components\n",
-    "5. How to apply hyper parameter optimization\n",
+    "5. How to use a third-party hyper parameter optimization (HPO) package with `AutoRunner`\n",
     "\n",
     "## Setup environment"
    ]
@@ -36,18 +36,9 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "/opt/conda/lib/python3.8/site-packages/tqdm/auto.py:22: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
-      "  from .autonotebook import tqdm as notebook_tqdm\n"
-     ]
-    }
-   ],
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
    "source": [
     "import os\n",
     "import tempfile\n",
@@ -82,7 +73,7 @@
     "\n",
     "compressed_file = os.path.join(root_dir, msd_task + \".tar\")\n",
     "dataroot = os.path.join(root_dir, msd_task)\n",
-    "if os.path.exists(dataroot):\n",
+    "if not os.path.exists(dataroot):\n",
     "    download_and_extract(resource, compressed_file, root_dir)\n",
     "\n",
     "datalist_file = os.path.join(\"..\", \"tasks\", \"msd\", msd_task, \"msd_\" + msd_task.lower() + \"_folds.json\")"
@@ -97,19 +88,19 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": [
-    "data_src_cfg = {\n",
+    "input_cfg = {\n",
     "    \"name\": msd_task,  # optional, it is only for your own record\n",
     "    \"task\": \"segmentation\",  # optional, it is only for your own record\n",
     "    \"modality\": \"MRI\",  # required\n",
     "    \"datalist\": datalist_file,  # required\n",
     "    \"dataroot\": dataroot,  # required\n",
     "}\n",
     "input = './input.yaml'\n",
-    "ConfigParser.export_config_file(data_src_cfg, input)"
+    "ConfigParser.export_config_file(input_cfg, input)"
    ]
   },
   {
@@ -154,7 +145,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "runner = AutoRunner(input=data_src_cfg)\n",
+    "runner = AutoRunner(input=input_cfg)\n",
     "# runner.run()"
    ]
   },
@@ -169,21 +160,9 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "2022-10-18 08:11:37,812 - INFO - ./my_workspace does not exists. Creating...\n",
-      "2022-10-18 08:11:37,813 - INFO - ./my_workspace created to save all results\n",
-      "2022-10-18 08:11:37,815 - INFO - Loading ./input.yaml for AutoRunner and making a copy in /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/my_workspace/input.yaml\n",
-      "2022-10-18 08:11:37,818 - INFO - The output_dir is not specified. /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/my_workspace/ensemble_output will be used to save ensemble predictions\n",
-      "2022-10-18 08:11:37,819 - INFO - Directory /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/my_workspace/ensemble_output is created to save ensemble predictions\n"
-     ]
-    }
-   ],
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
    "source": [
     "runner = AutoRunner(work_dir='./my_workspace', input=input)\n",
     "# runner.run()"
@@ -203,19 +182,9 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "2022-10-18 08:11:37,936 - INFO - Work directory ./work_dir is used to save all results\n",
-      "2022-10-18 08:11:37,938 - INFO - Loading ./input.yaml for AutoRunner and making a copy in /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/input.yaml\n",
-      "2022-10-18 08:11:37,940 - INFO - The output_dir is not specified. /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/ensemble_output will be used to save ensemble predictions\n"
-     ]
-    }
-   ],
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
    "source": [
     "# This will restart from scratch and not use any cached results\n",
     "runner = AutoRunner(input=input, not_use_cache=True)\n",
@@ -238,19 +207,9 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "2022-10-18 08:11:38,055 - INFO - Work directory ./work_dir is used to save all results\n",
-      "2022-10-18 08:11:38,057 - INFO - Loading ./input.yaml for AutoRunner and making a copy in /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/input.yaml\n",
-      "2022-10-18 08:11:38,061 - INFO - Directory ./output_dir is created to save ensemble predictions\n"
-     ]
-    }
-   ],
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
    "source": [
     "runner = AutoRunner(input=input, output_dir='./output_dir')\n",
     "# runner.run()"
@@ -268,19 +227,9 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 10,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "2022-10-18 08:11:38,182 - INFO - Work directory ./work_dir is used to save all results\n",
-      "2022-10-18 08:11:38,186 - INFO - Loading ./input.yaml for AutoRunner and making a copy in /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/input.yaml\n",
-      "2022-10-18 08:11:38,194 - INFO - The output_dir is not specified. /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/ensemble_output will be used to save ensemble predictions\n"
-     ]
-    }
-   ],
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
    "source": [
     "runner = AutoRunner(input=input)\n",
     "runner.set_num_fold(num_fold=2)\n",
@@ -302,13 +251,16 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 12,
+   "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": [
-    "max_epochs = 2000\n",
+    "max_epochs = 2\n",
     "\n",
-    "num_gpus = 1 if \"multigpu\" in data_src_cfg and not data_src_cfg[\"multigpu\"] else torch.cuda.device_count()\n",
+    "# safeguard to ensure max_epochs is greater than or equal to 2\n",
+    "max_epochs = max(max_epochs, 2)\n",
+    "\n",
+    "num_gpus = 1 if \"multigpu\" in input_cfg and not input_cfg[\"multigpu\"] else torch.cuda.device_count()\n",
     "\n",
     "num_epoch = max_epochs\n",
     "num_images_per_batch = 2\n",
@@ -326,7 +278,7 @@
     "}\n",
     "runner = AutoRunner(input=input)\n",
     "runner.set_training_params(params=train_param)\n",
-    "# runner.run()\n"
+    "# runner.run()"
    ]
   },
   {
@@ -340,19 +292,9 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 13,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "2022-10-18 08:11:38,613 - INFO - Work directory ./work_dir is used to save all results\n",
-      "2022-10-18 08:11:38,615 - INFO - Loading ./input.yaml for AutoRunner and making a copy in /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/input.yaml\n",
-      "2022-10-18 08:11:38,618 - INFO - The output_dir is not specified. /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/ensemble_output will be used to save ensemble predictions\n"
-     ]
-    }
-   ],
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
    "source": [
     "runner = AutoRunner(input=input)\n",
     "runner.set_ensemble_method(ensemble_method_name=\"AlgoEnsembleBestByFold\")\n",
@@ -368,19 +310,9 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 14,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "2022-10-18 08:11:38,783 - INFO - Work directory ./work_dir is used to save all results\n",
-      "2022-10-18 08:11:38,784 - INFO - Loading ./input.yaml for AutoRunner and making a copy in /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/input.yaml\n",
-      "2022-10-18 08:11:38,786 - INFO - The output_dir is not specified. /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/ensemble_output will be used to save ensemble predictions\n"
-     ]
-    }
-   ],
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
    "source": [
     "# set model ensemble method\n",
     "pred_params = {\n",
@@ -397,30 +329,25 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "## Train model with HPO (NNI Grid-search)\n",
+    "## Train model with HPO\n",
     "\n",
     "**Auto3DSeg** supports hyper parameter optimization (HPO) via `NNI` and `Optuna` backends.\n",
+    "If you would like to use `Optuna`, please check the [notebook](hpo_optuna.ipynb) for detailed usage.\n",
+    "\n",
+    "Here we demonstrate the HPO option with `NNI` by Microsoft.\n",
+    "Please install it via `pip install nni` if you would like to run HPO with it in this tutorial and have not already done so at the beginning of the notebook.\n",
     "AutoRunner supports `NNI` backend with a grid search method via automatically generating a the `NNI` config and run `nnictl` commands in subprocess.\n",
     "\n",
-    "Note: to run the HPO, you need to ensure the development environment has `nni` package.\n",
-    "Please refer to the [MONAI Installation Guide](https://docs.monai.io/en/stable/installation.html#installing-the-recommended-dependencies) for how to install the recommended dependencies."
+    "## Use `AutoRunner` with `NNI` backend to perform grid-search\n",
+    "\n",
+    "After `runner.run()` is executed, `nni` will attempt to start a web service using port 8088 by default. If you are running the tutorial on a remote host, please make sure the port is available on the system."
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 15,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "2022-10-18 08:11:38,907 - INFO - Work directory ./work_dir is used to save all results\n",
-      "2022-10-18 08:11:38,908 - INFO - Loading ./input.yaml for AutoRunner and making a copy in /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/input.yaml\n",
-      "2022-10-18 08:11:38,910 - INFO - The output_dir is not specified. /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/ensemble_output will be used to save ensemble predictions\n"
-     ]
-    }
-   ],
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
    "source": [
     "runner = AutoRunner(input=input, hpo=True)\n",
     "search_space = {\"learning_rate\": {\"_type\": \"choice\", \"_value\": [0.0001, 0.001, 0.01, 0.1]}}\n",
@@ -451,19 +378,9 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 16,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "2022-10-18 08:11:39,042 - INFO - Work directory ./work_dir is used to save all results\n",
-      "2022-10-18 08:11:39,046 - INFO - Loading ./input.yaml for AutoRunner and making a copy in /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/input.yaml\n",
-      "2022-10-18 08:11:39,054 - INFO - The output_dir is not specified. /workspace/monai/tutorials-in-dev/auto3dseg/notebooks/work_dir/ensemble_output will be used to save ensemble predictions\n"
-     ]
-    }
-   ],
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
    "source": [
     "runner = AutoRunner(input=input, hpo=True)\n",
     "hpo_params = {\"maxTrialNumber\": 20}\n",
@@ -496,7 +413,7 @@
  ],
  "metadata": {
   "kernelspec": {
-   "display_name": "Python 3.8.10 64-bit",
+   "display_name": "Python 3.8.13 ('base')",
    "language": "python",
    "name": "python3"
   },
@@ -510,12 +427,12 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.8.10"
+   "version": "3.8.13"
   },
   "orig_nbformat": 4,
   "vscode": {
    "interpreter": {
-    "hash": "916dbcbb3f70747c44a77c7bcd40155683ae19c65e1c03b4aa3499c5328201f1"
+    "hash": "d4d1e4263499bec80672ea0156c357c1ee493ec2b1c70f0acce89fc37c4a6abe"
    }
   }
  },