|
336 | 336 | " model_config_filepath,\n",
|
337 | 337 | " \"--model_def\",\n",
|
338 | 338 | " model_def_filepath,\n",
|
| 339 | + " \"--num_gpus\",\n", |
| 340 | + " str(num_gpus),\n", |
339 | 341 | "]\n",
|
340 | 342 | "\n",
|
341 | 343 | "run_torchrun(module, module_args, num_gpus=num_gpus)"
|
|
457 | 459 | "INFO:training:[config] num_train_timesteps -> 1000.\n",
|
458 | 460 | "INFO:training:num_files_train: 2\n",
|
459 | 461 | "INFO:training:Training from scratch.\n",
|
460 |
| - "INFO:training:Scaling factor set to 0.89132159948349.\n", |
461 |
| - "INFO:training:scale_factor -> 0.89132159948349.\n", |
| 462 | + "INFO:training:Scaling factor set to 0.8903454542160034.\n", |
| 463 | + "INFO:training:scale_factor -> 0.8903454542160034.\n", |
462 | 464 | "INFO:training:torch.set_float32_matmul_precision -> highest.\n",
|
463 | 465 | "INFO:training:Epoch 1, lr 0.0001.\n",
|
464 |
| - "INFO:training:[2024-09-24 03:46:57] epoch 1, iter 1/2, loss: 0.7984, lr: 0.000100000000.\n", |
465 |
| - "INFO:training:[2024-09-24 03:46:58] epoch 1, iter 2/2, loss: 0.7911, lr: 0.000056250000.\n", |
466 |
| - "INFO:training:epoch 1 average loss: 0.7947.\n", |
| 466 | + "INFO:training:[2024-09-30 06:30:33] epoch 1, iter 1/2, loss: 0.7974, lr: 0.000100000000.\n", |
| 467 | + "INFO:training:[2024-09-30 06:30:33] epoch 1, iter 2/2, loss: 0.7939, lr: 0.000056250000.\n", |
| 468 | + "INFO:training:epoch 1 average loss: 0.7957.\n", |
467 | 469 | "INFO:training:Epoch 2, lr 2.5e-05.\n",
|
468 |
| - "INFO:training:[2024-09-24 03:46:59] epoch 2, iter 1/2, loss: 0.7910, lr: 0.000025000000.\n", |
469 |
| - "INFO:training:[2024-09-24 03:46:59] epoch 2, iter 2/2, loss: 0.7897, lr: 0.000006250000.\n", |
470 |
| - "INFO:training:epoch 2 average loss: 0.7903.\n", |
| 470 | + "INFO:training:[2024-09-30 06:30:35] epoch 2, iter 1/2, loss: 0.7902, lr: 0.000025000000.\n", |
| 471 | + "INFO:training:[2024-09-30 06:30:35] epoch 2, iter 2/2, loss: 0.7889, lr: 0.000006250000.\n", |
| 472 | + "INFO:training:epoch 2 average loss: 0.7895.\n", |
471 | 473 | "\n"
|
472 | 474 | ]
|
473 | 475 | }
|
|
484 | 486 | " model_config_filepath,\n",
|
485 | 487 | " \"--model_def\",\n",
|
486 | 488 | " model_def_filepath,\n",
|
| 489 | + " \"--num_gpus\",\n", |
| 490 | + " str(num_gpus),\n", |
487 | 491 | "]\n",
|
488 | 492 | "\n",
|
489 | 493 | "run_torchrun(module, module_args, num_gpus=num_gpus)"
|
|
518 | 522 | "output_type": "stream",
|
519 | 523 | "text": [
|
520 | 524 | "\n",
|
521 |
| - "INFO:inference:Using cuda:0 of 1 with random seed: 62801\n", |
| 525 | + "INFO:inference:Using cuda:0 of 1 with random seed: 93612\n", |
522 | 526 | "INFO:inference:[config] ckpt_filepath -> ./temp_work_dir/./models/diff_unet_ckpt.pt.\n",
|
523 |
| - "INFO:inference:[config] random_seed -> 62801.\n", |
| 527 | + "INFO:inference:[config] random_seed -> 93612.\n", |
524 | 528 | "INFO:inference:[config] output_prefix -> unet_3d.\n",
|
525 | 529 | "INFO:inference:[config] output_size -> (256, 256, 128).\n",
|
526 | 530 | "INFO:inference:[config] out_spacing -> (1.0, 1.0, 0.75).\n",
|
527 | 531 | "INFO:root:`controllable_anatomy_size` is not provided.\n",
|
528 | 532 | "INFO:inference:checkpoints ./temp_work_dir/./models/diff_unet_ckpt.pt loaded.\n",
|
529 |
| - "INFO:inference:scale_factor -> 0.89132159948349.\n", |
| 533 | + "INFO:inference:scale_factor -> 0.8903454542160034.\n", |
530 | 534 | "INFO:inference:num_downsample_level -> 4, divisor -> 4.\n",
|
531 | 535 | "INFO:inference:noise: cuda:0, torch.float32, <class 'torch.Tensor'>\n",
|
532 | 536 | "\n",
|
533 | 537 | " 0%| | 0/10 [00:00<?, ?it/s]\n",
|
534 |
| - " 10%|███████▍ | 1/10 [00:00<00:02, 3.62it/s]\n", |
535 |
| - " 40%|█████████████████████████████▌ | 4/10 [00:00<00:00, 12.53it/s]\n", |
536 |
| - " 80%|███████████████████████████████████████████████████████████▏ | 8/10 [00:00<00:00, 19.54it/s]\n", |
537 |
| - "100%|█████████████████████████████████████████████████████████████████████████| 10/10 [00:00<00:00, 18.16it/s]\n", |
538 |
| - "INFO:inference:Saved ./temp_work_dir/./predictions/unet_3d_seed62801_size256x256x128_spacing1.00x1.00x0.75_20240924034721.nii.gz.\n", |
| 538 | + " 10%|███████▍ | 1/10 [00:00<00:02, 3.48it/s]\n", |
| 539 | + " 40%|█████████████████████████████▌ | 4/10 [00:00<00:00, 12.23it/s]\n", |
| 540 | + " 80%|███████████████████████████████████████████████████████████▏ | 8/10 [00:00<00:00, 19.26it/s]\n", |
| 541 | + "100%|█████████████████████████████████████████████████████████████████████████| 10/10 [00:00<00:00, 17.80it/s]\n", |
| 542 | + "INFO:inference:Saved ./temp_work_dir/./predictions/unet_3d_seed93612_size256x256x128_spacing1.00x1.00x0.75_20240930063144_rank0.nii.gz.\n", |
539 | 543 | "\n"
|
540 | 544 | ]
|
541 | 545 | }
|
|
552 | 556 | " model_config_filepath,\n",
|
553 | 557 | " \"--model_def\",\n",
|
554 | 558 | " model_def_filepath,\n",
|
| 559 | + " \"--num_gpus\",\n", |
| 560 | + " str(num_gpus),\n", |
555 | 561 | "]\n",
|
556 | 562 | "\n",
|
557 | 563 | "run_torchrun(module, module_args, num_gpus=num_gpus)\n",
|
|
562 | 568 | ],
|
563 | 569 | "metadata": {
|
564 | 570 | "kernelspec": {
|
565 |
| - "display_name": "Python 3 (ipykernel)", |
| 571 | + "display_name": "Python 3", |
566 | 572 | "language": "python",
|
567 | 573 | "name": "python3"
|
568 | 574 | },
|
|
0 commit comments