Skip to content

Commit 43e9c9f

Browse files
committed
[DLMED] update for test
Signed-off-by: Nic Ma <[email protected]>
1 parent e8f8b26 commit 43e9c9f

File tree

3 files changed: +28 -14 lines changed

modules/bundles/spleen_segmentation/configs/train.json

Lines changed: 9 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -4,13 +4,12 @@
44
"$import os",
55
"$import ignite"
66
],
7-
"determinism": "$monai.utils.set_determinism(seed=123)",
8-
"cudnn_opt": "$setattr(torch.backends.cudnn, 'benchmark', True)",
9-
"device": "$torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')",
10-
"ckpt_dir": "/workspace/data/medical/tutorials/modules/bundles/spleen_segmentation/models",
7+
"bundle_root": "/workspace/data/medical/tutorials/modules/bundles/spleen_segmentation",
8+
"ckpt_dir": "$@bundle_root + '/models'",
119
"dataset_dir": "/workspace/data/medical/Task09_Spleen",
1210
"images": "$list(sorted(glob.glob(@dataset_dir + '/imagesTr/*.nii.gz')))",
1311
"labels": "$list(sorted(glob.glob(@dataset_dir + '/labelsTr/*.nii.gz')))",
12+
"device": "$torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')",
1413
"network_def": {
1514
"_target_": "UNet",
1615
"spatial_dims": 3,
@@ -143,7 +142,6 @@
143142
},
144143
"trainer": {
145144
"_target_": "SupervisedTrainer",
146-
"_requires_": ["@ddp_init", "@determinism", "@cudnn_opt"],
147145
"max_epochs": 100,
148146
"device": "@device",
149147
"train_data_loader": "@train#dataloader",
@@ -232,5 +230,10 @@
232230
"val_handlers": "@validate#handlers",
233231
"amp": true
234232
}
235-
}
233+
},
234+
"training": [
235+
"$monai.utils.set_determinism(seed=123)",
236+
"$setattr(torch.backends.cudnn, 'benchmark', True)",
237+
"$@train#trainer.run()"
238+
]
236239
}

modules/bundles/spleen_segmentation/configs/train_multi_gpu.json

Lines changed: 12 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -5,12 +5,9 @@
55
"$import ignite",
66
"$import torch.distributed as dist"
77
],
8-
"ddp_init": "$dist.init_process_group(backend='nccl', init_method='env://')",
9-
"determinism": "$monai.utils.set_determinism(seed=123)",
10-
"cudnn_opt": "$setattr(torch.backends.cudnn, 'benchmark', True)",
118
"device": "$torch.device(f'cuda:{dist.get_rank()}')",
12-
"set_device": "$torch.cuda.set_device(@device)",
13-
"ckpt_dir": "/workspace/data/medical/tutorials/modules/bundles/spleen_segmentation/models",
9+
"bundle_root": "/workspace/data/medical/tutorials/modules/bundles/spleen_segmentation",
10+
"ckpt_dir": "$@bundle_root + '/models'",
1411
"dataset_dir": "/workspace/data/medical/Task09_Spleen",
1512
"images": "$list(sorted(glob.glob(@dataset_dir + '/imagesTr/*.nii.gz')))",
1613
"labels": "$list(sorted(glob.glob(@dataset_dir + '/labelsTr/*.nii.gz')))",
@@ -160,7 +157,6 @@
160157
},
161158
"trainer": {
162159
"_target_": "SupervisedTrainer",
163-
"_requires_": ["@ddp_init", "@set_device", "@determinism", "@cudnn_opt"],
164160
"max_epochs": 100,
165161
"device": "@device",
166162
"train_data_loader": "@train#dataloader",
@@ -176,6 +172,7 @@
176172
},
177173
"validate": {
178174
"preprocessing": {
175+
179176
"_target_": "Compose",
180177
"transforms": [
181178
"%train#preprocessing#transforms#0",
@@ -256,5 +253,13 @@
256253
"val_handlers": "$@validate#handlers if dist.get_rank() > 0 else None",
257254
"amp": true
258255
}
259-
}
256+
},
257+
"training": [
258+
"$dist.init_process_group(backend='nccl', init_method='env://')",
259+
"$torch.cuda.set_device(@device)",
260+
"$monai.utils.set_determinism(seed=123)",
261+
"$setattr(torch.backends.cudnn, 'benchmark', True)",
262+
"$@train#trainer.run()",
263+
"$dist.destroy_process_group()"
264+
]
260265
}

modules/bundles/spleen_segmentation/docs/README.md

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,13 @@ Mean Dice = 0.96
2626
Execute training:
2727

2828
```
29-
python -m monai.bundle run "'train#trainer'" --meta_file configs/metadata.json --config_file configs/train.json --logging_file configs/logging.conf
29+
python -m monai.bundle run training --meta_file configs/metadata.json --config_file configs/train.json --logging_file configs/logging.conf
30+
```
31+
32+
Execute multi-GPU training:
33+
34+
```
35+
torchrun --nproc_per_node=2 -m monai.bundle run training --meta_file configs/metadata.json --config_file configs/train_multi_gpu.json --logging_file configs/logging.conf
3036
```
3137

3238
Execute inference:

0 commit comments

Comments
 (0)