project-monai committed on
Commit 7226a40 · verified · 1 Parent(s): 1414cb8

Upload lung_nodule_ct_detection version 0.6.9

.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ models/model.ts filter=lfs diff=lfs merge=lfs -text
LICENSE ADDED
@@ -0,0 +1,201 @@
1
+ Apache License
2
+ Version 2.0, January 2004
3
+ http://www.apache.org/licenses/
4
+
5
+ TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
6
+
7
+ 1. Definitions.
8
+
9
+ "License" shall mean the terms and conditions for use, reproduction,
10
+ and distribution as defined by Sections 1 through 9 of this document.
11
+
12
+ "Licensor" shall mean the copyright owner or entity authorized by
13
+ the copyright owner that is granting the License.
14
+
15
+ "Legal Entity" shall mean the union of the acting entity and all
16
+ other entities that control, are controlled by, or are under common
17
+ control with that entity. For the purposes of this definition,
18
+ "control" means (i) the power, direct or indirect, to cause the
19
+ direction or management of such entity, whether by contract or
20
+ otherwise, or (ii) ownership of fifty percent (50%) or more of the
21
+ outstanding shares, or (iii) beneficial ownership of such entity.
22
+
23
+ "You" (or "Your") shall mean an individual or Legal Entity
24
+ exercising permissions granted by this License.
25
+
26
+ "Source" form shall mean the preferred form for making modifications,
27
+ including but not limited to software source code, documentation
28
+ source, and configuration files.
29
+
30
+ "Object" form shall mean any form resulting from mechanical
31
+ transformation or translation of a Source form, including but
32
+ not limited to compiled object code, generated documentation,
33
+ and conversions to other media types.
34
+
35
+ "Work" shall mean the work of authorship, whether in Source or
36
+ Object form, made available under the License, as indicated by a
37
+ copyright notice that is included in or attached to the work
38
+ (an example is provided in the Appendix below).
39
+
40
+ "Derivative Works" shall mean any work, whether in Source or Object
41
+ form, that is based on (or derived from) the Work and for which the
42
+ editorial revisions, annotations, elaborations, or other modifications
43
+ represent, as a whole, an original work of authorship. For the purposes
44
+ of this License, Derivative Works shall not include works that remain
45
+ separable from, or merely link (or bind by name) to the interfaces of,
46
+ the Work and Derivative Works thereof.
47
+
48
+ "Contribution" shall mean any work of authorship, including
49
+ the original version of the Work and any modifications or additions
50
+ to that Work or Derivative Works thereof, that is intentionally
51
+ submitted to Licensor for inclusion in the Work by the copyright owner
52
+ or by an individual or Legal Entity authorized to submit on behalf of
53
+ the copyright owner. For the purposes of this definition, "submitted"
54
+ means any form of electronic, verbal, or written communication sent
55
+ to the Licensor or its representatives, including but not limited to
56
+ communication on electronic mailing lists, source code control systems,
57
+ and issue tracking systems that are managed by, or on behalf of, the
58
+ Licensor for the purpose of discussing and improving the Work, but
59
+ excluding communication that is conspicuously marked or otherwise
60
+ designated in writing by the copyright owner as "Not a Contribution."
61
+
62
+ "Contributor" shall mean Licensor and any individual or Legal Entity
63
+ on behalf of whom a Contribution has been received by Licensor and
64
+ subsequently incorporated within the Work.
65
+
66
+ 2. Grant of Copyright License. Subject to the terms and conditions of
67
+ this License, each Contributor hereby grants to You a perpetual,
68
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
69
+ copyright license to reproduce, prepare Derivative Works of,
70
+ publicly display, publicly perform, sublicense, and distribute the
71
+ Work and such Derivative Works in Source or Object form.
72
+
73
+ 3. Grant of Patent License. Subject to the terms and conditions of
74
+ this License, each Contributor hereby grants to You a perpetual,
75
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
76
+ (except as stated in this section) patent license to make, have made,
77
+ use, offer to sell, sell, import, and otherwise transfer the Work,
78
+ where such license applies only to those patent claims licensable
79
+ by such Contributor that are necessarily infringed by their
80
+ Contribution(s) alone or by combination of their Contribution(s)
81
+ with the Work to which such Contribution(s) was submitted. If You
82
+ institute patent litigation against any entity (including a
83
+ cross-claim or counterclaim in a lawsuit) alleging that the Work
84
+ or a Contribution incorporated within the Work constitutes direct
85
+ or contributory patent infringement, then any patent licenses
86
+ granted to You under this License for that Work shall terminate
87
+ as of the date such litigation is filed.
88
+
89
+ 4. Redistribution. You may reproduce and distribute copies of the
90
+ Work or Derivative Works thereof in any medium, with or without
91
+ modifications, and in Source or Object form, provided that You
92
+ meet the following conditions:
93
+
94
+ (a) You must give any other recipients of the Work or
95
+ Derivative Works a copy of this License; and
96
+
97
+ (b) You must cause any modified files to carry prominent notices
98
+ stating that You changed the files; and
99
+
100
+ (c) You must retain, in the Source form of any Derivative Works
101
+ that You distribute, all copyright, patent, trademark, and
102
+ attribution notices from the Source form of the Work,
103
+ excluding those notices that do not pertain to any part of
104
+ the Derivative Works; and
105
+
106
+ (d) If the Work includes a "NOTICE" text file as part of its
107
+ distribution, then any Derivative Works that You distribute must
108
+ include a readable copy of the attribution notices contained
109
+ within such NOTICE file, excluding those notices that do not
110
+ pertain to any part of the Derivative Works, in at least one
111
+ of the following places: within a NOTICE text file distributed
112
+ as part of the Derivative Works; within the Source form or
113
+ documentation, if provided along with the Derivative Works; or,
114
+ within a display generated by the Derivative Works, if and
115
+ wherever such third-party notices normally appear. The contents
116
+ of the NOTICE file are for informational purposes only and
117
+ do not modify the License. You may add Your own attribution
118
+ notices within Derivative Works that You distribute, alongside
119
+ or as an addendum to the NOTICE text from the Work, provided
120
+ that such additional attribution notices cannot be construed
121
+ as modifying the License.
122
+
123
+ You may add Your own copyright statement to Your modifications and
124
+ may provide additional or different license terms and conditions
125
+ for use, reproduction, or distribution of Your modifications, or
126
+ for any such Derivative Works as a whole, provided Your use,
127
+ reproduction, and distribution of the Work otherwise complies with
128
+ the conditions stated in this License.
129
+
130
+ 5. Submission of Contributions. Unless You explicitly state otherwise,
131
+ any Contribution intentionally submitted for inclusion in the Work
132
+ by You to the Licensor shall be under the terms and conditions of
133
+ this License, without any additional terms or conditions.
134
+ Notwithstanding the above, nothing herein shall supersede or modify
135
+ the terms of any separate license agreement you may have executed
136
+ with Licensor regarding such Contributions.
137
+
138
+ 6. Trademarks. This License does not grant permission to use the trade
139
+ names, trademarks, service marks, or product names of the Licensor,
140
+ except as required for reasonable and customary use in describing the
141
+ origin of the Work and reproducing the content of the NOTICE file.
142
+
143
+ 7. Disclaimer of Warranty. Unless required by applicable law or
144
+ agreed to in writing, Licensor provides the Work (and each
145
+ Contributor provides its Contributions) on an "AS IS" BASIS,
146
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
147
+ implied, including, without limitation, any warranties or conditions
148
+ of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
149
+ PARTICULAR PURPOSE. You are solely responsible for determining the
150
+ appropriateness of using or redistributing the Work and assume any
151
+ risks associated with Your exercise of permissions under this License.
152
+
153
+ 8. Limitation of Liability. In no event and under no legal theory,
154
+ whether in tort (including negligence), contract, or otherwise,
155
+ unless required by applicable law (such as deliberate and grossly
156
+ negligent acts) or agreed to in writing, shall any Contributor be
157
+ liable to You for damages, including any direct, indirect, special,
158
+ incidental, or consequential damages of any character arising as a
159
+ result of this License or out of the use or inability to use the
160
+ Work (including but not limited to damages for loss of goodwill,
161
+ work stoppage, computer failure or malfunction, or any and all
162
+ other commercial damages or losses), even if such Contributor
163
+ has been advised of the possibility of such damages.
164
+
165
+ 9. Accepting Warranty or Additional Liability. While redistributing
166
+ the Work or Derivative Works thereof, You may choose to offer,
167
+ and charge a fee for, acceptance of support, warranty, indemnity,
168
+ or other liability obligations and/or rights consistent with this
169
+ License. However, in accepting such obligations, You may act only
170
+ on Your own behalf and on Your sole responsibility, not on behalf
171
+ of any other Contributor, and only if You agree to indemnify,
172
+ defend, and hold each Contributor harmless for any liability
173
+ incurred by, or claims asserted against, such Contributor by reason
174
+ of your accepting any such warranty or additional liability.
175
+
176
+ END OF TERMS AND CONDITIONS
177
+
178
+ APPENDIX: How to apply the Apache License to your work.
179
+
180
+ To apply the Apache License to your work, attach the following
181
+ boilerplate notice, with the fields enclosed by brackets "[]"
182
+ replaced with your own identifying information. (Don't include
183
+ the brackets!) The text should be enclosed in the appropriate
184
+ comment syntax for the file format. We also recommend that a
185
+ file or class name and description of purpose be included on the
186
+ same "printed page" as the copyright notice for easier
187
+ identification within third-party archives.
188
+
189
+ Copyright [yyyy] [name of copyright owner]
190
+
191
+ Licensed under the Apache License, Version 2.0 (the "License");
192
+ you may not use this file except in compliance with the License.
193
+ You may obtain a copy of the License at
194
+
195
+ http://www.apache.org/licenses/LICENSE-2.0
196
+
197
+ Unless required by applicable law or agreed to in writing, software
198
+ distributed under the License is distributed on an "AS IS" BASIS,
199
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
200
+ See the License for the specific language governing permissions and
201
+ limitations under the License.
configs/evaluate.json ADDED
@@ -0,0 +1,50 @@
1
+ {
2
+ "test_datalist": "$monai.data.load_decathlon_datalist(@data_list_file_path, is_segmentation=True, data_list_key='validation', base_dir=@dataset_dir)",
3
+ "validate#dataset": {
4
+ "_target_": "Dataset",
5
+ "data": "$@test_datalist",
6
+ "transform": "@validate#preprocessing"
7
+ },
8
+ "validate#key_metric": {
9
+ "val_coco": {
10
+ "_target_": "scripts.cocometric_ignite.IgniteCocoMetric",
11
+ "coco_metric_monai": "$monai.apps.detection.metrics.coco.COCOMetric(classes=['nodule'], iou_list=[0.1], max_detection=[100])",
12
+ "output_transform": "$monai.handlers.from_engine(['pred', 'label'])",
13
+ "box_key": "box",
14
+ "label_key": "label",
15
+ "pred_score_key": "label_scores",
16
+ "reduce_scalar": false
17
+ }
18
+ },
19
+ "validate#handlers": [
20
+ {
21
+ "_target_": "CheckpointLoader",
22
+ "load_path": "$@ckpt_dir + '/model.pt'",
23
+ "load_dict": {
24
+ "model": "@network"
25
+ }
26
+ },
27
+ {
28
+ "_target_": "StatsHandler",
29
+ "iteration_log": false
30
+ },
31
+ {
32
+ "_target_": "MetricsSaver",
33
+ "save_dir": "@output_dir",
34
+ "metrics": [
35
+ "val_coco"
36
+ ],
37
+ "metric_details": [
38
+ "val_coco"
39
+ ],
40
+ "batch_transform": "$lambda x: [xx['image'].meta for xx in x]",
41
+ "summary_ops": "*"
42
+ }
43
+ ],
44
+ "initialize": [
45
+ "$setattr(torch.backends.cudnn, 'benchmark', True)"
46
+ ],
47
+ "run": [
48
+ "$@validate#evaluator.run()"
49
+ ]
50
+ }
configs/inference.json ADDED
@@ -0,0 +1,221 @@
1
+ {
2
+ "whether_raw_luna16": false,
3
+ "whether_resampled_luna16": "$(not @whether_raw_luna16)",
4
+ "imports": [
5
+ "$import glob",
6
+ "$import numpy",
7
+ "$import os"
8
+ ],
9
+ "bundle_root": ".",
10
+ "image_key": "image",
11
+ "ckpt_dir": "$@bundle_root + '/models'",
12
+ "output_dir": "$@bundle_root + '/eval'",
13
+ "output_filename": "result_luna16_fold0.json",
14
+ "data_list_file_path": "$@bundle_root + '/LUNA16_datasplit/dataset_fold0.json'",
15
+ "dataset_dir": "/datasets/LUNA16_Images_resample",
16
+ "test_datalist": "$monai.data.load_decathlon_datalist(@data_list_file_path, is_segmentation=True, data_list_key='validation', base_dir=@dataset_dir)",
17
+ "device": "$torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')",
18
+ "amp": true,
19
+ "load_pretrain": true,
20
+ "spatial_dims": 3,
21
+ "num_classes": 1,
22
+ "force_sliding_window": false,
23
+ "size_divisible": [
24
+ 16,
25
+ 16,
26
+ 8
27
+ ],
28
+ "infer_patch_size": [
29
+ 512,
30
+ 512,
31
+ 192
32
+ ],
33
+ "anchor_generator": {
34
+ "_target_": "monai.apps.detection.utils.anchor_utils.AnchorGeneratorWithAnchorShape",
35
+ "feature_map_scales": [
36
+ 1,
37
+ 2,
38
+ 4
39
+ ],
40
+ "base_anchor_shapes": [
41
+ [
42
+ 6,
43
+ 8,
44
+ 4
45
+ ],
46
+ [
47
+ 8,
48
+ 6,
49
+ 5
50
+ ],
51
+ [
52
+ 10,
53
+ 10,
54
+ 6
55
+ ]
56
+ ]
57
+ },
58
+ "backbone": "$monai.networks.nets.resnet.resnet50(spatial_dims=3,n_input_channels=1,conv1_t_stride=[2,2,1],conv1_t_size=[7,7,7])",
59
+ "feature_extractor": "$monai.apps.detection.networks.retinanet_network.resnet_fpn_feature_extractor(@backbone,3,False,[1,2],None)",
60
+ "network_def": {
61
+ "_target_": "RetinaNet",
62
+ "spatial_dims": "@spatial_dims",
63
+ "num_classes": "@num_classes",
64
+ "num_anchors": 3,
65
+ "feature_extractor": "@feature_extractor",
66
+ "size_divisible": "@size_divisible",
67
+ "use_list_output": false
68
+ },
69
+ "network": "$@network_def.to(@device)",
70
+ "detector": {
71
+ "_target_": "RetinaNetDetector",
72
+ "network": "@network",
73
+ "anchor_generator": "@anchor_generator",
74
+ "debug": false,
75
+ "spatial_dims": "@spatial_dims",
76
+ "num_classes": "@num_classes",
77
+ "size_divisible": "@size_divisible"
78
+ },
79
+ "detector_ops": [
80
+ "[email protected]_target_keys(box_key='box', label_key='label')",
81
+ "[email protected]_box_selector_parameters(score_thresh=0.02,topk_candidates_per_level=1000,nms_thresh=0.22,detections_per_img=300)",
82
+ "[email protected]_sliding_window_inferer(roi_size=@infer_patch_size,overlap=0.25,sw_batch_size=1,mode='constant',device='cpu')"
83
+ ],
84
+ "preprocessing": {
85
+ "_target_": "Compose",
86
+ "transforms": [
87
+ {
88
+ "_target_": "LoadImaged",
89
+ "keys": "@image_key",
90
+ "_disabled_": "@whether_raw_luna16"
91
+ },
92
+ {
93
+ "_target_": "LoadImaged",
94
+ "keys": "@image_key",
95
+ "reader": "itkreader",
96
+ "affine_lps_to_ras": true,
97
+ "_disabled_": "@whether_resampled_luna16"
98
+ },
99
+ {
100
+ "_target_": "EnsureChannelFirstd",
101
+ "keys": "@image_key"
102
+ },
103
+ {
104
+ "_target_": "Orientationd",
105
+ "keys": "@image_key",
106
+ "axcodes": "RAS"
107
+ },
108
+ {
109
+ "_target_": "Spacingd",
110
+ "keys": "@image_key",
111
+ "pixdim": [
112
+ 0.703125,
113
+ 0.703125,
114
+ 1.25
115
+ ],
116
+ "_disabled_": "@whether_resampled_luna16"
117
+ },
118
+ {
119
+ "_target_": "ScaleIntensityRanged",
120
+ "keys": "@image_key",
121
+ "a_min": -1024.0,
122
+ "a_max": 300.0,
123
+ "b_min": 0.0,
124
+ "b_max": 1.0,
125
+ "clip": true
126
+ },
127
+ {
128
+ "_target_": "EnsureTyped",
129
+ "keys": "@image_key"
130
+ }
131
+ ]
132
+ },
133
+ "dataset": {
134
+ "_target_": "Dataset",
135
+ "data": "$@test_datalist",
136
+ "transform": "@preprocessing"
137
+ },
138
+ "dataloader": {
139
+ "_target_": "DataLoader",
140
+ "dataset": "@dataset",
141
+ "batch_size": 1,
142
+ "shuffle": false,
143
+ "num_workers": 4,
144
+ "collate_fn": "$monai.data.utils.no_collation"
145
+ },
146
+ "inferer": {
147
+ "_target_": "scripts.detection_inferer.RetinaNetInferer",
148
+ "detector": "@detector",
149
+ "force_sliding_window": "@force_sliding_window"
150
+ },
151
+ "postprocessing": {
152
+ "_target_": "Compose",
153
+ "transforms": [
154
+ {
155
+ "_target_": "ClipBoxToImaged",
156
+ "box_keys": "box",
157
+ "label_keys": "label",
158
+ "box_ref_image_keys": "@image_key",
159
+ "remove_empty": true
160
+ },
161
+ {
162
+ "_target_": "AffineBoxToWorldCoordinated",
163
+ "box_keys": "box",
164
+ "box_ref_image_keys": "@image_key",
165
+ "affine_lps_to_ras": true
166
+ },
167
+ {
168
+ "_target_": "ConvertBoxModed",
169
+ "box_keys": "box",
170
+ "src_mode": "xyzxyz",
171
+ "dst_mode": "cccwhd"
172
+ },
173
+ {
174
+ "_target_": "DeleteItemsd",
175
+ "keys": [
176
+ "@image_key"
177
+ ]
178
+ }
179
+ ]
180
+ },
181
+ "handlers": [
182
+ {
183
+ "_target_": "StatsHandler",
184
+ "iteration_log": false
185
+ },
186
+ {
187
+ "_target_": "scripts.detection_saver.DetectionSaver",
188
+ "output_dir": "@output_dir",
189
+ "filename": "@output_filename",
190
+ "batch_transform": "$lambda x: [xx['image'].meta for xx in x]",
191
+ "output_transform": "$lambda x: [@postprocessing({**xx['pred'],'image':xx['image']}) for xx in x]",
192
+ "pred_box_key": "box",
193
+ "pred_label_key": "label",
194
+ "pred_score_key": "label_scores"
195
+ }
196
+ ],
197
+ "evaluator": {
198
+ "_target_": "scripts.evaluator.DetectionEvaluator",
199
+ "_requires_": "@detector_ops",
200
+ "device": "@device",
201
+ "val_data_loader": "@dataloader",
202
+ "network": "@network",
203
+ "inferer": "@inferer",
204
+ "val_handlers": "@handlers",
205
+ "amp": "@amp"
206
+ },
207
+ "checkpointloader": {
208
+ "_target_": "CheckpointLoader",
209
+ "load_path": "$@bundle_root + '/models/model.pt'",
210
+ "load_dict": {
211
+ "model": "@network"
212
+ }
213
+ },
214
+ "initialize": [
215
+ "$setattr(torch.backends.cudnn, 'benchmark', True)",
216
+ "$@checkpointloader(@evaluator) if @load_pretrain else None"
217
+ ],
218
+ "run": [
219
+ "$@evaluator.run()"
220
+ ]
221
+ }
configs/inference_trt.json ADDED
@@ -0,0 +1,13 @@
1
+ {
2
+ "imports": [
3
+ "$import glob",
4
+ "$import os",
5
+ "$import torch_tensorrt"
6
+ ],
7
+ "force_sliding_window": true,
8
+ "network_def": "$torch.jit.load(@bundle_root + '/models/model_trt.ts')",
9
+ "evaluator#amp": false,
10
+ "initialize": [
11
+ "$setattr(torch.backends.cudnn, 'benchmark', True)"
12
+ ]
13
+ }
configs/logging.conf ADDED
@@ -0,0 +1,21 @@
1
+ [loggers]
2
+ keys=root
3
+
4
+ [handlers]
5
+ keys=consoleHandler
6
+
7
+ [formatters]
8
+ keys=fullFormatter
9
+
10
+ [logger_root]
11
+ level=INFO
12
+ handlers=consoleHandler
13
+
14
+ [handler_consoleHandler]
15
+ class=StreamHandler
16
+ level=INFO
17
+ formatter=fullFormatter
18
+ args=(sys.stdout,)
19
+
20
+ [formatter_fullFormatter]
21
+ format=%(asctime)s - %(name)s - %(levelname)s - %(message)s
configs/metadata.json ADDED
@@ -0,0 +1,107 @@
1
+ {
2
+ "schema": "https://github.com/Project-MONAI/MONAI-extra-test-data/releases/download/0.8.1/meta_schema_20240725.json",
3
+ "version": "0.6.9",
4
+ "changelog": {
5
+ "0.6.9": "update to huggingface hosting and fix missing dependencies",
6
+ "0.6.8": "update issue for IgniteInfo",
7
+ "0.6.7": "use monai 1.4 and update large files",
8
+ "0.6.6": "update to use monai 1.3.1",
9
+ "0.6.5": "remove notes for trt_export in readme",
10
+ "0.6.4": "add notes for trt_export in readme",
11
+ "0.6.3": "add load_pretrain flag for infer",
12
+ "0.6.2": "add checkpoint loader for infer",
13
+ "0.6.1": "fix format error",
14
+ "0.6.0": "remove meta_dict usage",
15
+ "0.5.9": "use monai 1.2.0",
16
+ "0.5.8": "update TRT memory requirement in readme",
17
+ "0.5.7": "add dataset dir example",
18
+ "0.5.6": "add the ONNX-TensorRT way of model conversion",
19
+ "0.5.5": "update retrained validation results and training curve",
20
+ "0.5.4": "add non-deterministic note",
21
+ "0.5.3": "adapt to BundleWorkflow interface",
22
+ "0.5.2": "black autofix format and add name tag",
23
+ "0.5.1": "modify dataset key name",
24
+ "0.5.0": "use detection inferer",
25
+ "0.4.5": "fixed some small changes with formatting in readme",
26
+ "0.4.4": "add data resource to readme",
27
+ "0.4.3": "update val patch size to avoid warning in monai 1.0.1",
28
+ "0.4.2": "update to use monai 1.0.1",
29
+ "0.4.1": "fix license Copyright error",
30
+ "0.4.0": "add support for raw images",
31
+ "0.3.0": "update license files",
32
+ "0.2.0": "unify naming",
33
+ "0.1.1": "add reference for LIDC dataset",
34
+ "0.1.0": "complete the model package"
35
+ },
36
+ "monai_version": "1.4.0",
37
+ "pytorch_version": "2.4.0",
38
+ "numpy_version": "1.24.4",
39
+ "required_packages_version": {
40
+ "nibabel": "5.2.1",
41
+ "pytorch-ignite": "0.4.11",
42
+ "torchvision": "0.19.0",
43
+ "tensorboard": "2.17.0"
44
+ },
45
+ "supported_apps": {},
46
+ "name": "Lung nodule CT detection",
47
+ "task": "CT lung nodule detection",
48
+ "description": "A pre-trained model for volumetric (3D) detection of the lung lesion from CT image on LUNA16 dataset",
49
+ "authors": "MONAI team",
50
+ "copyright": "Copyright (c) MONAI Consortium",
51
+ "data_source": "https://luna16.grand-challenge.org/Home/",
52
+ "data_type": "nibabel",
53
+ "image_classes": "1 channel data, CT at 0.703125 x 0.703125 x 1.25 mm",
54
+ "label_classes": "dict data, containing Nx6 box and Nx1 classification labels.",
55
+ "pred_classes": "dict data, containing Nx6 box, Nx1 classification labels, Nx1 classification scores.",
56
+ "eval_metrics": {
57
+ "mAP_IoU_0.10_0.50_0.05_MaxDet_100": 0.852,
58
+ "AP_IoU_0.10_MaxDet_100": 0.858,
59
+ "mAR_IoU_0.10_0.50_0.05_MaxDet_100": 0.998,
60
+ "AR_IoU_0.10_MaxDet_100": 1.0
61
+ },
62
+ "intended_use": "This is an example, not to be used for diagnostic purposes",
63
+ "references": [
64
+ "Lin, Tsung-Yi, et al. 'Focal loss for dense object detection.' ICCV 2017"
65
+ ],
66
+ "network_data_format": {
67
+ "inputs": {
68
+ "image": {
69
+ "type": "image",
70
+ "format": "magnitude",
71
+ "modality": "CT",
72
+ "num_channels": 1,
73
+ "spatial_shape": [
74
+ "16*n",
75
+ "16*n",
76
+ "8*n"
77
+ ],
78
+ "dtype": "float16",
79
+ "value_range": [
80
+ 0,
81
+ 1
82
+ ],
83
+ "is_patch_data": true,
84
+ "channel_def": {
85
+ "0": "image"
86
+ }
87
+ }
88
+ },
89
+ "outputs": {
90
+ "pred": {
91
+ "type": "object",
92
+ "format": "dict",
93
+ "dtype": "float16",
94
+ "num_channels": 1,
95
+ "spatial_shape": [
96
+ "n",
97
+ "n",
98
+ "n"
99
+ ],
100
+ "value_range": [
101
+ -10000,
102
+ 10000
103
+ ]
104
+ }
105
+ }
106
+ }
107
+ }
configs/train.json ADDED
@@ -0,0 +1,452 @@
1
+ {
2
+ "imports": [
3
+ "$import glob",
4
+ "$import os"
5
+ ],
6
+ "bundle_root": ".",
7
+ "ckpt_dir": "$@bundle_root + '/models'",
8
+ "output_dir": "$@bundle_root + '/eval'",
9
+ "data_list_file_path": "$@bundle_root + '/LUNA16_datasplit/dataset_fold0.json'",
10
+ "dataset_dir": "/datasets/LUNA16_Images_resample",
11
+ "train_datalist": "$monai.data.load_decathlon_datalist(@data_list_file_path, is_segmentation=True, data_list_key='training', base_dir=@dataset_dir)",
12
+ "device": "$torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')",
13
+ "epochs": 300,
14
+ "val_interval": 5,
15
+ "learning_rate": 0.01,
16
+ "amp": true,
17
+ "batch_size": 4,
18
+ "patch_size": [
19
+ 192,
20
+ 192,
21
+ 80
22
+ ],
23
+ "val_patch_size": [
24
+ 512,
25
+ 512,
26
+ 192
27
+ ],
28
+ "anchor_generator": {
29
+ "_target_": "monai.apps.detection.utils.anchor_utils.AnchorGeneratorWithAnchorShape",
30
+ "feature_map_scales": [
31
+ 1,
32
+ 2,
33
+ 4
34
+ ],
35
+ "base_anchor_shapes": [
36
+ [
37
+ 6,
38
+ 8,
39
+ 4
40
+ ],
41
+ [
42
+ 8,
43
+ 6,
44
+ 5
45
+ ],
46
+ [
47
+ 10,
48
+ 10,
49
+ 6
50
+ ]
51
+ ]
52
+ },
53
+ "backbone": "$monai.networks.nets.resnet.resnet50(spatial_dims=3,n_input_channels=1,conv1_t_stride=[2,2,1],conv1_t_size=[7,7,7])",
54
+ "feature_extractor": "$monai.apps.detection.networks.retinanet_network.resnet_fpn_feature_extractor(@backbone,3,False,[1,2],None)",
55
+ "network_def": {
56
+ "_target_": "RetinaNet",
57
+ "spatial_dims": 3,
58
+ "num_classes": 1,
59
+ "num_anchors": 3,
60
+ "feature_extractor": "@feature_extractor",
61
+ "size_divisible": [
62
+ 16,
63
+ 16,
64
+ 8
65
+ ]
66
+ },
67
+ "network": "$@network_def.to(@device)",
68
+ "detector": {
69
+ "_target_": "RetinaNetDetector",
70
+ "network": "@network",
71
+ "anchor_generator": "@anchor_generator",
72
+ "debug": false
73
+ },
74
+ "detector_ops": [
75
+ "[email protected]_atss_matcher(num_candidates=4, center_in_gt=False)",
76
+ "[email protected]_hard_negative_sampler(batch_size_per_image=64,positive_fraction=0.3,pool_size=20,min_neg=16)",
77
+ "[email protected]_target_keys(box_key='box', label_key='label')",
78
+ "[email protected]_box_selector_parameters(score_thresh=0.02,topk_candidates_per_level=1000,nms_thresh=0.22,detections_per_img=300)",
79
+ "[email protected]_sliding_window_inferer(roi_size=@val_patch_size,overlap=0.25,sw_batch_size=1,mode='constant',device='cpu')"
80
+ ],
81
+ "optimizer": {
82
+ "_target_": "torch.optim.SGD",
83
+ "params": "[email protected]()",
84
+ "lr": "@learning_rate",
85
+ "momentum": 0.9,
86
+ "weight_decay": 3e-05,
87
+ "nesterov": true
88
+ },
89
+ "after_scheduler": {
90
+ "_target_": "torch.optim.lr_scheduler.StepLR",
91
+ "optimizer": "@optimizer",
92
+ "step_size": 160,
93
+ "gamma": 0.1
94
+ },
95
+ "lr_scheduler": {
96
+ "_target_": "scripts.warmup_scheduler.GradualWarmupScheduler",
97
+ "optimizer": "@optimizer",
98
+ "multiplier": 1,
99
+ "total_epoch": 10,
100
+ "after_scheduler": "@after_scheduler"
101
+ },
102
+ "train": {
103
+ "preprocessing_transforms": [
104
+ {
105
+ "_target_": "LoadImaged",
106
+ "keys": "image"
107
+ },
108
+ {
109
+ "_target_": "EnsureChannelFirstd",
110
+ "keys": "image"
111
+ },
112
+ {
113
+ "_target_": "EnsureTyped",
114
+ "keys": [
115
+ "image",
116
+ "box"
117
+ ]
118
+ },
119
+ {
120
+ "_target_": "EnsureTyped",
121
+ "keys": "label",
122
+ "dtype": "$torch.long"
123
+ },
124
+ {
125
+ "_target_": "Orientationd",
126
+ "keys": "image",
127
+ "axcodes": "RAS"
128
+ },
129
+ {
130
+ "_target_": "ScaleIntensityRanged",
131
+ "keys": "image",
132
+ "a_min": -1024.0,
133
+ "a_max": 300.0,
134
+ "b_min": 0.0,
135
+ "b_max": 1.0,
136
+ "clip": true
137
+ },
138
+ {
139
+ "_target_": "ConvertBoxToStandardModed",
140
+ "box_keys": "box",
141
+ "mode": "cccwhd"
142
+ },
143
+ {
144
+ "_target_": "AffineBoxToImageCoordinated",
145
+ "box_keys": "box",
146
+ "box_ref_image_keys": "image",
147
+ "affine_lps_to_ras": true
148
+ }
149
+ ],
150
+ "random_transforms": [
151
+ {
152
+ "_target_": "RandCropBoxByPosNegLabeld",
153
+ "image_keys": "image",
154
+ "box_keys": "box",
155
+ "label_keys": "label",
156
+ "spatial_size": "@patch_size",
157
+ "whole_box": true,
158
+ "num_samples": "@batch_size",
159
+ "pos": 1,
160
+ "neg": 1
161
+ },
162
+ {
163
+ "_target_": "RandZoomBoxd",
164
+ "image_keys": "image",
165
+ "box_keys": "box",
166
+ "label_keys": "label",
167
+ "box_ref_image_keys": "image",
168
+ "prob": 0.2,
169
+ "min_zoom": 0.7,
170
+ "max_zoom": 1.4,
171
+ "padding_mode": "constant",
172
+ "keep_size": true
173
+ },
174
+ {
175
+ "_target_": "ClipBoxToImaged",
176
+ "box_keys": "box",
177
+ "label_keys": "label",
178
+ "box_ref_image_keys": "image",
179
+ "remove_empty": true
180
+ },
181
+ {
182
+ "_target_": "RandFlipBoxd",
183
+ "image_keys": "image",
184
+ "box_keys": "box",
185
+ "box_ref_image_keys": "image",
186
+ "prob": 0.5,
187
+ "spatial_axis": 0
188
+ },
189
+ {
190
+ "_target_": "RandFlipBoxd",
191
+ "image_keys": "image",
192
+ "box_keys": "box",
193
+ "box_ref_image_keys": "image",
194
+ "prob": 0.5,
195
+ "spatial_axis": 1
196
+ },
197
+ {
198
+ "_target_": "RandFlipBoxd",
199
+ "image_keys": "image",
200
+ "box_keys": "box",
201
+ "box_ref_image_keys": "image",
202
+ "prob": 0.5,
203
+ "spatial_axis": 2
204
+ },
205
+ {
206
+ "_target_": "RandRotateBox90d",
207
+ "image_keys": "image",
208
+ "box_keys": "box",
209
+ "box_ref_image_keys": "image",
210
+ "prob": 0.75,
211
+ "max_k": 3,
212
+ "spatial_axes": [
213
+ 0,
214
+ 1
215
+ ]
216
+ },
217
+ {
218
+ "_target_": "BoxToMaskd",
219
+ "box_keys": "box",
220
+ "label_keys": "label",
221
+ "box_mask_keys": "box_mask",
222
+ "box_ref_image_keys": "image",
223
+ "min_fg_label": 0,
224
+ "ellipse_mask": true
225
+ },
226
+ {
227
+ "_target_": "RandRotated",
228
+ "keys": [
229
+ "image",
230
+ "box_mask"
231
+ ],
232
+ "mode": [
233
+ "nearest",
234
+ "nearest"
235
+ ],
236
+ "prob": 0.2,
237
+ "range_x": 0.5236,
238
+ "range_y": 0.5236,
239
+ "range_z": 0.5236,
240
+ "keep_size": true,
241
+ "padding_mode": "zeros"
242
+ },
243
+ {
244
+ "_target_": "MaskToBoxd",
245
+ "box_keys": [
246
+ "box"
247
+ ],
248
+ "label_keys": [
249
+ "label"
250
+ ],
251
+ "box_mask_keys": [
252
+ "box_mask"
253
+ ],
254
+ "min_fg_label": 0
255
+ },
256
+ {
257
+ "_target_": "DeleteItemsd",
258
+ "keys": "box_mask"
259
+ },
260
+ {
261
+ "_target_": "RandGaussianNoised",
262
+ "keys": "image",
263
+ "prob": 0.1,
264
+ "mean": 0.0,
265
+ "std": 0.1
266
+ },
267
+ {
268
+ "_target_": "RandGaussianSmoothd",
269
+ "keys": "image",
270
+ "prob": 0.1,
271
+ "sigma_x": [
272
+ 0.5,
273
+ 1.0
274
+ ],
275
+ "sigma_y": [
276
+ 0.5,
277
+ 1.0
278
+ ],
279
+ "sigma_z": [
280
+ 0.5,
281
+ 1.0
282
+ ]
283
+ },
284
+ {
285
+ "_target_": "RandScaleIntensityd",
286
+ "keys": "image",
287
+ "factors": 0.25,
288
+ "prob": 0.15
289
+ },
290
+ {
291
+ "_target_": "RandShiftIntensityd",
292
+ "keys": "image",
293
+ "offsets": 0.1,
294
+ "prob": 0.15
295
+ },
296
+ {
297
+ "_target_": "RandAdjustContrastd",
298
+ "keys": "image",
299
+ "prob": 0.3,
300
+ "gamma": [
301
+ 0.7,
302
+ 1.5
303
+ ]
304
+ }
305
+ ],
306
+ "final_transforms": [
307
+ {
308
+ "_target_": "EnsureTyped",
309
+ "keys": [
310
+ "image",
311
+ "box"
312
+ ]
313
+ },
314
+ {
315
+ "_target_": "EnsureTyped",
316
+ "keys": "label",
317
+ "dtype": "$torch.long"
318
+ },
319
+ {
320
+ "_target_": "ToTensord",
321
+ "keys": [
322
+ "image",
323
+ "box",
324
+ "label"
325
+ ]
326
+ }
327
+ ],
328
+ "preprocessing": {
329
+ "_target_": "Compose",
330
+ "transforms": "$@train#preprocessing_transforms + @train#random_transforms + @train#final_transforms"
331
+ },
332
+ "dataset": {
333
+ "_target_": "Dataset",
334
+ "data": "$@train_datalist[: int(0.95 * len(@train_datalist))]",
335
+ "transform": "@train#preprocessing"
336
+ },
337
+ "dataloader": {
338
+ "_target_": "DataLoader",
339
+ "dataset": "@train#dataset",
340
+ "batch_size": 1,
341
+ "shuffle": true,
342
+ "num_workers": 4,
343
+ "collate_fn": "$monai.data.utils.no_collation"
344
+ },
345
+ "handlers": [
346
+ {
347
+ "_target_": "LrScheduleHandler",
348
+ "lr_scheduler": "@lr_scheduler",
349
+ "print_lr": true
350
+ },
351
+ {
352
+ "_target_": "ValidationHandler",
353
+ "validator": "@validate#evaluator",
354
+ "epoch_level": true,
355
+ "interval": "@val_interval"
356
+ },
357
+ {
358
+ "_target_": "StatsHandler",
359
+ "tag_name": "train_loss",
360
+ "output_transform": "$lambda x: monai.handlers.from_engine(['loss'], first=True)(x)[0]"
361
+ },
362
+ {
363
+ "_target_": "TensorBoardStatsHandler",
364
+ "log_dir": "@output_dir",
365
+ "tag_name": "train_loss",
366
+ "output_transform": "$lambda x: monai.handlers.from_engine(['loss'], first=True)(x)[0]"
367
+ }
368
+ ],
369
+ "trainer": {
370
+ "_target_": "scripts.trainer.DetectionTrainer",
371
+ "_requires_": "@detector_ops",
372
+ "max_epochs": "@epochs",
373
+ "device": "@device",
374
+ "train_data_loader": "@train#dataloader",
375
+ "detector": "@detector",
376
+ "optimizer": "@optimizer",
377
+ "train_handlers": "@train#handlers",
378
+ "amp": "@amp"
379
+ }
380
+ },
381
+ "validate": {
382
+ "preprocessing": {
383
+ "_target_": "Compose",
384
+ "transforms": "$@train#preprocessing_transforms + @train#final_transforms"
385
+ },
386
+ "dataset": {
387
+ "_target_": "Dataset",
388
+ "data": "$@train_datalist[int(0.95 * len(@train_datalist)): ]",
389
+ "transform": "@validate#preprocessing"
390
+ },
391
+ "dataloader": {
392
+ "_target_": "DataLoader",
393
+ "dataset": "@validate#dataset",
394
+ "batch_size": 1,
395
+ "shuffle": false,
396
+ "num_workers": 2,
397
+ "collate_fn": "$monai.data.utils.no_collation"
398
+ },
399
+ "inferer": {
400
+ "_target_": "scripts.detection_inferer.RetinaNetInferer",
401
+ "detector": "@detector"
402
+ },
403
+ "handlers": [
404
+ {
405
+ "_target_": "StatsHandler",
406
+ "iteration_log": false
407
+ },
408
+ {
409
+ "_target_": "TensorBoardStatsHandler",
410
+ "log_dir": "@output_dir",
411
+ "iteration_log": false
412
+ },
413
+ {
414
+ "_target_": "CheckpointSaver",
415
+ "save_dir": "@ckpt_dir",
416
+ "save_dict": {
417
+ "model": "@network"
418
+ },
419
+ "save_key_metric": true,
420
+ "key_metric_filename": "model.pt"
421
+ }
422
+ ],
423
+ "key_metric": {
424
+ "val_coco": {
425
+ "_target_": "scripts.cocometric_ignite.IgniteCocoMetric",
426
+ "coco_metric_monai": "$monai.apps.detection.metrics.coco.COCOMetric(classes=['nodule'], iou_list=[0.1], max_detection=[100])",
427
+ "output_transform": "$monai.handlers.from_engine(['pred', 'label'])",
428
+ "box_key": "box",
429
+ "label_key": "label",
430
+ "pred_score_key": "label_scores",
431
+ "reduce_scalar": true
432
+ }
433
+ },
434
+ "evaluator": {
435
+ "_target_": "scripts.evaluator.DetectionEvaluator",
436
+ "_requires_": "@detector_ops",
437
+ "device": "@device",
438
+ "val_data_loader": "@validate#dataloader",
439
+ "network": "@network",
440
+ "inferer": "@validate#inferer",
441
+ "key_val_metric": "@validate#key_metric",
442
+ "val_handlers": "@validate#handlers",
443
+ "amp": "@amp"
444
+ }
445
+ },
446
+ "initialize": [
447
+ "$monai.utils.set_determinism(seed=0)"
448
+ ],
449
+ "run": [
450
+ "$@train#trainer.run()"
451
+ ]
452
+ }
docs/README.md ADDED
@@ -0,0 +1,163 @@
1
+ # Model Overview
2
+ A pre-trained model for volumetric (3D) detection of lung nodules from CT images.
3
+
4
+ This model is trained on the LUNA16 dataset (https://luna16.grand-challenge.org/Home/) using RetinaNet (Lin, Tsung-Yi, et al. "Focal loss for dense object detection." ICCV 2017. https://arxiv.org/abs/1708.02002).
5
+
6
+ ![model workflow](https://developer.download.nvidia.com/assets/Clara/Images/monai_retinanet_detection_workflow.png)
7
+
8
+ ## Data
9
+ The dataset used in this example is LUNA16 (https://luna16.grand-challenge.org/Home/), which is based on the [LIDC-IDRI database](https://wiki.cancerimagingarchive.net/display/Public/LIDC-IDRI) [3,4,5].
10
+
11
+ LUNA16 is a public dataset for CT lung nodule detection. Given raw CT scans, the goal is to identify the locations of possible nodules and to assign each location a probability of being a nodule.
12
+
13
+ Disclaimer: We are not the host of the data. Please make sure to read the requirements and usage policies of the data and give credit to the authors of the dataset! We acknowledge the National Cancer Institute and the Foundation for the National Institutes of Health, and their critical role in the creation of the free publicly available LIDC/IDRI Database used in this study.
14
+
15
+ ### 10-fold data splitting
16
+ We follow the official 10-fold data splitting from LUNA16 challenge and generate data split json files using the script from [nnDetection](https://github.com/MIC-DKFZ/nnDetection/blob/main/projects/Task016_Luna/scripts/prepare.py).
17
+
18
+ Please download the resulting json files from https://github.com/Project-MONAI/MONAI-extra-test-data/releases/download/0.8.1/LUNA16_datasplit-20220615T233840Z-001.zip.
19
+
20
+ In these files, the values of "box" are the ground truth boxes in world coordinates.
21
+
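For illustration, the split files can be read with the same MONAI call used in `configs/train.json`; the sketch below assumes the json files sit under `./LUNA16_datasplit` and the resampled images under `/datasets/LUNA16_Images_resample` (both placeholders):

```python
# Sketch: inspect one entry of the LUNA16 fold-0 data split (paths are placeholders).
from monai.data import load_decathlon_datalist

datalist = load_decathlon_datalist(
    "./LUNA16_datasplit/dataset_fold0.json",
    is_segmentation=True,
    data_list_key="training",
    base_dir="/datasets/LUNA16_Images_resample",
)
# Each entry carries an image path plus world-coordinate "box" and "label" arrays.
print(datalist[0]["image"], datalist[0]["box"], datalist[0]["label"])
```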
22
+ ### Data resampling
23
+ The raw CT images in LUNA16 have a variety of voxel sizes. The first step is to resample them to a common voxel size.
24
+ In this model, we resampled them to 0.703125 x 0.703125 x 1.25 mm.
25
+
26
+ Please follow the instructions in Section 3.1 of https://github.com/Project-MONAI/tutorials/tree/main/detection to do the resampling; a rough sketch is shown below.
27
+
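A minimal sketch of that resampling with MONAI transforms, assuming the target spacing above; the tutorial's official script remains the reference, and the file paths here are placeholders:

```python
# Sketch: resample one LUNA16 CT volume to the spacing used by this bundle.
from monai import transforms as mt

resample = mt.Compose(
    [
        mt.LoadImaged(keys="image"),
        mt.EnsureChannelFirstd(keys="image"),
        mt.Orientationd(keys="image", axcodes="RAS"),
        mt.Spacingd(keys="image", pixdim=(0.703125, 0.703125, 1.25), mode="bilinear"),
        mt.SaveImaged(keys="image", output_dir="./LUNA16_Images_resample", output_postfix="", resample=False),
    ]
)
resample({"image": "path/to/original_scan.mhd"})  # placeholder input path
```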
28
+ ### Data download
29
+ The original mhd/raw data can be downloaded from [LUNA16](https://luna16.grand-challenge.org/Home/). The original DICOM data can be downloaded from the [LIDC-IDRI database](https://wiki.cancerimagingarchive.net/display/Public/LIDC-IDRI) [3,4,5]. You will need to resample the original data before training.
30
+
31
+ Alternatively, we provide [resampled nifti images](https://drive.google.com/drive/folders/1JozrufA1VIZWJIc5A1EMV3J4CNCYovKK?usp=share_link) and a copy of [original mhd/raw images](https://drive.google.com/drive/folders/1-enN4eNEnKmjltevKg3W2V-Aj0nriQWE?usp=share_link) from [LUNA16](https://luna16.grand-challenge.org/Home/) for users to download.
32
+
33
+ ## Training configuration
34
+ The training was performed with the following:
35
+
36
+ - GPU: at least 16 GB of GPU memory; 32 GB is required when exporting the TRT model
37
+ - Actual Model Input: 192 x 192 x 80
38
+ - AMP: True
39
+ - Optimizer: SGD (as configured in `configs/train.json`)
40
+ - Learning Rate: 1e-2
41
+ - Loss: BCE loss and L1 loss
42
+
43
+ ### Input
44
+ 1 channel
45
+ - List of 3D CT patches
46
+
47
+ ### Output
48
+ In Training Mode: A dictionary of classification and box regression loss.
49
+
50
+ In Evaluation Mode: A list of dictionaries of predicted box, classification label, and classification score.
51
+
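Roughly, the two forms look like this (hypothetical values; the prediction keys follow `pred_box_key`, `pred_label_key` and `pred_score_key` used in the configs, and the loss keys assume MONAI's `RetinaNetDetector` defaults):

```python
# Training mode: a dictionary of losses (key names assumed from RetinaNetDetector defaults).
train_output = {"classification": 0.37, "box_regression": 0.12}

# Evaluation mode: one dictionary per input image, with Nx6 boxes and Nx1 labels/scores.
eval_output = [
    {
        "box": [[102.1, 88.4, 60.0, 110.5, 95.2, 66.3]],
        "label": [0],            # 0 = nodule
        "label_scores": [0.91],
    }
]
```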
52
+ ## Performance
53
+ The COCO metric is used to evaluate the performance of the model. The pre-trained model was trained and validated on data fold 0. It achieves mAP=0.852, mAR=0.998, AP(IoU=0.1)=0.858, and AR(IoU=0.1)=1.0.
54
+
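For reference, a sketch of how such COCO metrics are computed with MONAI, mirroring `scripts/cocometric_ignite.py`; the boxes, labels and scores below are made-up values:

```python
# Sketch: compute the COCO metric for one image with made-up boxes.
import numpy as np
from monai.apps.detection.metrics.coco import COCOMetric
from monai.apps.detection.metrics.matching import matching_batch
from monai.data import box_utils

coco_metric = COCOMetric(classes=["nodule"], iou_list=[0.1], max_detection=[100])
results = matching_batch(
    iou_fn=box_utils.box_iou,
    iou_thresholds=coco_metric.iou_thresholds,
    pred_boxes=[np.array([[10.0, 10.0, 10.0, 20.0, 20.0, 20.0]])],
    pred_classes=[np.array([0])],
    pred_scores=[np.array([0.9])],
    gt_boxes=[np.array([[11.0, 11.0, 11.0, 21.0, 21.0, 21.0]])],
    gt_classes=[np.array([0])],
)
metric_dict = coco_metric(results)[0]  # e.g. {"mAP_IoU_0.10_0.50_0.05_MaxDet_100": ..., ...}
print(metric_dict)
```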
55
+ Please note that this bundle is non-deterministic because of the max pooling layer used in the network. Therefore, reproducing the training process may not yield exactly the same performance.
56
+ Please refer to https://pytorch.org/docs/stable/notes/randomness.html#reproducibility for more details about reproducibility.
57
+
58
+ #### Training Loss
59
+ ![A graph showing the detection train loss](https://developer.download.nvidia.com/assets/Clara/Images/monai_retinanet_detection_train_loss_v2.png)
60
+
61
+ #### Validation Accuracy
62
+ The validation accuracy in this curve is the mean of mAP, mAR, AP(IoU=0.1), and AR(IoU=0.1) of the COCO metric.
63
+
64
+ ![A graph showing the detection val accuracy](https://developer.download.nvidia.com/assets/Clara/Images/monai_retinanet_detection_val_acc_v2.png)
65
+
66
+ #### TensorRT speedup
67
+ The `lung_nodule_ct_detection` bundle supports acceleration with TensorRT through the ONNX-TensorRT method. The table below displays the speedup ratios observed on an A100 80G GPU. Please note that when using the TensorRT model for inference, the `force_sliding_window` parameter in the `inference.json` file must be set to `true` (the override in `configs/inference_trt.json` already does this). This ensures that the bundle uses the `SlidingWindowInferer` during inference and keeps the network's input spatial size fixed. Otherwise, an input whose spatial size is smaller than `infer_patch_size` would change the network's input spatial size.
68
+
69
+ | method | torch_fp32(ms) | torch_amp(ms) | trt_fp32(ms) | trt_fp16(ms) | speedup amp | speedup fp32 | speedup fp16 | amp vs fp16|
70
+ | :---: | :---: | :---: | :---: | :---: | :---: | :---: | :---: | :---: |
71
+ | model computation | 7449.84 | 996.08 | 976.67 | 626.90 | 7.63 | 7.63 | 11.88 | 1.56 |
72
+ | end2end | 36458.26 | 7259.35 | 6420.60 | 4698.34 | 5.02 | 5.68 | 7.76 | 1.55 |
73
+
74
+ Where:
75
+ - `model computation` refers to the model's inference on a random input, excluding preprocessing and postprocessing
76
+ - `end2end` means running the bundle end-to-end with the TensorRT-based model.
77
+ - `torch_fp32` and `torch_amp` are for the PyTorch models with or without `amp` mode.
78
+ - `trt_fp32` and `trt_fp16` are for the TensorRT based models converted in corresponding precision.
79
+ - `speedup amp`, `speedup fp32` and `speedup fp16` are the speedup ratios of corresponding models versus the PyTorch float32 model
80
+ - `amp vs fp16` is the speedup ratio between the PyTorch amp model and the TensorRT float16 based model.
81
+
82
+ Currently, the only available method to accelerate this model is through ONNX-TensorRT. However, the Torch-TensorRT method is under development and will be available in the near future.
83
+
84
+ This result is benchmarked under:
85
+ - TensorRT: 8.5.3+cuda11.8
86
+ - Torch-TensorRT Version: 1.4.0
87
+ - CPU Architecture: x86-64
88
+ - OS: ubuntu 20.04
89
+ - Python version: 3.8.10
90
+ - CUDA version: 12.0
91
+ - GPU models and configuration: A100 80G
92
+
93
+ ## MONAI Bundle Commands
94
+ In addition to the Pythonic APIs, a few command line interfaces (CLI) are provided to interact with the bundle. The CLI supports flexible use cases, such as overriding configs at runtime and predefining arguments in a file.
95
+
96
+ For more detailed usage instructions, visit the [MONAI Bundle Configuration Page](https://docs.monai.io/en/latest/config_syntax.html).
97
+
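For the Pythonic route, a training run can be sketched with `monai.bundle.ConfigWorkflow` under the default bundle layout (an assumption here; the CLI commands below remain the reference):

```python
# Sketch: rough Python equivalent of `python -m monai.bundle run --config_file configs/train.json`.
from monai.bundle import ConfigWorkflow

workflow = ConfigWorkflow(
    workflow_type="train",
    config_file="configs/train.json",
    logging_file="configs/logging.conf",
    meta_file="configs/metadata.json",
)
workflow.initialize()
workflow.run()
workflow.finalize()
```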
98
+ #### Execute training:
99
+
100
+ ```
101
+ python -m monai.bundle run --config_file configs/train.json
102
+ ```
103
+
104
+ Please note that if the default dataset path in the bundle config files has not been modified to the actual path, you can override it at runtime using `--dataset_dir`:
105
+
106
+ ```
107
+ python -m monai.bundle run --config_file configs/train.json --dataset_dir <actual dataset path>
108
+ ```
109
+
110
+ #### Override the `train` config to execute evaluation with the trained model:
111
+
112
+ ```
113
+ python -m monai.bundle run --config_file "['configs/train.json','configs/evaluate.json']"
114
+ ```
115
+
116
+ #### Execute inference on resampled LUNA16 images by setting `"whether_raw_luna16": false` in `inference.json`:
117
+
118
+ ```
119
+ python -m monai.bundle run --config_file configs/inference.json
120
+ ```
121
+ With the same command, we can execute inference on original LUNA16 images by setting `"whether_raw_luna16": true` in `inference.json`. Remember to also set `"data_list_file_path": "$@bundle_root + '/LUNA16_datasplit/mhd_original/dataset_fold0.json'"` and change `"dataset_dir"`.
122
+
123
+ Note that in inference.json, the "LoadImaged" transform in "preprocessing" and the "AffineBoxToWorldCoordinated" transform in "postprocessing" both have `"affine_lps_to_ras": true`.
124
+ This setting depends on the input images; LUNA16 needs `"affine_lps_to_ras": true`.
125
+ Your own inference dataset may instead require `"affine_lps_to_ras": false`.
126
+
127
+ #### Export checkpoint to TensorRT based models with fp32 or fp16 precision
128
+
129
+ ```bash
130
+ python -m monai.bundle trt_export --net_id network_def --filepath models/model_trt.ts --ckpt_file models/model.pt --meta_file configs/metadata.json --config_file configs/inference.json --precision <fp32/fp16> --input_shape "[1, 1, 512, 512, 192]" --use_onnx "True" --use_trace "True" --onnx_output_names "['output_0', 'output_1', 'output_2', 'output_3', 'output_4', 'output_5']" --network_def#use_list_output "True"
131
+ ```
132
+
133
+ #### Execute inference with the TensorRT model
134
+
135
+ ```
136
+ python -m monai.bundle run --config_file "['configs/inference.json', 'configs/inference_trt.json']"
137
+ ```
138
+
139
+ # References
140
+ [1] Lin, Tsung-Yi, et al. "Focal loss for dense object detection." ICCV 2017. https://arxiv.org/abs/1708.02002
141
+
142
+ [2] Baumgartner and Jaeger et al. "nnDetection: A self-configuring method for medical object detection." MICCAI 2021. https://arxiv.org/pdf/2106.00817.pdf
143
+
144
+ [3] Armato III, S. G., McLennan, G., Bidaut, L., McNitt-Gray, M. F., Meyer, C. R., Reeves, A. P., Zhao, B., Aberle, D. R., Henschke, C. I., Hoffman, E. A., Kazerooni, E. A., MacMahon, H., Van Beek, E. J. R., Yankelevitz, D., Biancardi, A. M., Bland, P. H., Brown, M. S., Engelmann, R. M., Laderach, G. E., Max, D., Pais, R. C. , Qing, D. P. Y. , Roberts, R. Y., Smith, A. R., Starkey, A., Batra, P., Caligiuri, P., Farooqi, A., Gladish, G. W., Jude, C. M., Munden, R. F., Petkovska, I., Quint, L. E., Schwartz, L. H., Sundaram, B., Dodd, L. E., Fenimore, C., Gur, D., Petrick, N., Freymann, J., Kirby, J., Hughes, B., Casteele, A. V., Gupte, S., Sallam, M., Heath, M. D., Kuhn, M. H., Dharaiya, E., Burns, R., Fryd, D. S., Salganicoff, M., Anand, V., Shreter, U., Vastagh, S., Croft, B. Y., Clarke, L. P. (2015). Data From LIDC-IDRI [Data set]. The Cancer Imaging Archive. https://doi.org/10.7937/K9/TCIA.2015.LO9QL9SX
145
+
146
+ [4] Armato SG 3rd, McLennan G, Bidaut L, McNitt-Gray MF, Meyer CR, Reeves AP, Zhao B, Aberle DR, Henschke CI, Hoffman EA, Kazerooni EA, MacMahon H, Van Beeke EJ, Yankelevitz D, Biancardi AM, Bland PH, Brown MS, Engelmann RM, Laderach GE, Max D, Pais RC, Qing DP, Roberts RY, Smith AR, Starkey A, Batrah P, Caligiuri P, Farooqi A, Gladish GW, Jude CM, Munden RF, Petkovska I, Quint LE, Schwartz LH, Sundaram B, Dodd LE, Fenimore C, Gur D, Petrick N, Freymann J, Kirby J, Hughes B, Casteele AV, Gupte S, Sallamm M, Heath MD, Kuhn MH, Dharaiya E, Burns R, Fryd DS, Salganicoff M, Anand V, Shreter U, Vastagh S, Croft BY. The Lung Image Database Consortium (LIDC) and Image Database Resource Initiative (IDRI): A completed reference database of lung nodules on CT scans. Medical Physics, 38: 915--931, 2011. DOI: https://doi.org/10.1118/1.3528204
147
+
148
+ [5] Clark, K., Vendt, B., Smith, K., Freymann, J., Kirby, J., Koppel, P., Moore, S., Phillips, S., Maffitt, D., Pringle, M., Tarbox, L., & Prior, F. (2013). The Cancer Imaging Archive (TCIA): Maintaining and Operating a Public Information Repository. Journal of Digital Imaging, 26(6), 1045–1057. https://doi.org/10.1007/s10278-013-9622-7
149
+
150
+ # License
151
+ Copyright (c) MONAI Consortium
152
+
153
+ Licensed under the Apache License, Version 2.0 (the "License");
154
+ you may not use this file except in compliance with the License.
155
+ You may obtain a copy of the License at
156
+
157
+ http://www.apache.org/licenses/LICENSE-2.0
158
+
159
+ Unless required by applicable law or agreed to in writing, software
160
+ distributed under the License is distributed on an "AS IS" BASIS,
161
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
162
+ See the License for the specific language governing permissions and
163
+ limitations under the License.
docs/data_license.txt ADDED
@@ -0,0 +1,11 @@
1
+ Third Party Licenses
2
+ -----------------------------------------------------------------------
3
+
4
+ /*********************************************************************/
5
+ i. LUng Nodule Analysis 2016
6
+ https://luna16.grand-challenge.org/Home/
7
+ https://creativecommons.org/licenses/by/4.0/
8
+
9
+ ii. Lung Image Database Consortium image collection (LIDC-IDRI)
10
+ https://wiki.cancerimagingarchive.net/display/Public/LIDC-IDRI
11
+ https://creativecommons.org/licenses/by/3.0/
models/model.pt ADDED
@@ -0,0 +1,3 @@
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5e79231466adae93a6fe8e8594029e9add142914e223b879aa0343bb2402d01
3
+ size 83709381
models/model.ts ADDED
@@ -0,0 +1,3 @@
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68afd1ed4be8d01196d575d13931dab24cc50d46a74528a47d54496ba29e2583
3
+ size 83784539
scripts/__init__.py ADDED
@@ -0,0 +1,14 @@
1
+ # Copyright (c) MONAI Consortium
2
+ # Licensed under the Apache License, Version 2.0 (the "License");
3
+ # you may not use this file except in compliance with the License.
4
+ # You may obtain a copy of the License at
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ # Unless required by applicable law or agreed to in writing, software
7
+ # distributed under the License is distributed on an "AS IS" BASIS,
8
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
9
+ # See the License for the specific language governing permissions and
10
+ # limitations under the License.
11
+
12
+ # from .evaluator import EnsembleEvaluator, Evaluator, SupervisedEvaluator
13
+ # from .multi_gpu_supervised_trainer import create_multigpu_supervised_evaluator, create_multigpu_supervised_trainer
14
+ from .trainer import DetectionTrainer
scripts/cocometric_ignite.py ADDED
@@ -0,0 +1,111 @@
1
+ from typing import Callable, Dict, Sequence, Union
2
+
3
+ import torch
4
+ from ignite.metrics.metric import Metric, reinit__is_reduced, sync_all_reduce
5
+ from monai.apps.detection.metrics.coco import COCOMetric
6
+ from monai.apps.detection.metrics.matching import matching_batch
7
+ from monai.data import box_utils
8
+
9
+ from .utils import detach_to_numpy
10
+
11
+
12
+ class IgniteCocoMetric(Metric):
13
+ def __init__(
14
+ self,
15
+ coco_metric_monai: Union[None, COCOMetric] = None,
16
+ box_key="box",
17
+ label_key="label",
18
+ pred_score_key="label_scores",
19
+ output_transform: Callable = lambda x: x,
20
+ device: Union[str, torch.device, None] = None,
21
+ reduce_scalar: bool = True,
22
+ ):
23
+ r"""
24
+ Computes coco detection metric in Ignite.
25
+
26
+ Args:
27
+ coco_metric_monai: the coco metric in monai.
28
+ If not given, will assume COCOMetric(classes=[0], iou_list=[0.1], max_detection=[100])
29
+ box_key: box key in the ground truth target dict and prediction dict.
30
+ label_key: classification label key in the ground truth target dict and prediction dict.
31
+ pred_score_key: classification score key in the prediction dict.
32
+ output_transform: A callable that is used to transform the Engine’s
33
+ process_function’s output into the form expected by the metric.
34
+ device: specifies which device updates are accumulated on.
35
+ Setting the metric’s device to be the same as your update arguments ensures
36
+ the update method is non-blocking. By default, CPU.
37
+ reduce_scalar: if True, will return the average of the coco metric values;
38
+ if False, will return a dictionary of coco metric values.
39
+
40
+ Examples:
41
+ To use with ``Engine`` and ``process_function``,
42
+ simply attach the metric instance to the engine.
43
+ The output of the engine's ``process_function`` needs to be in format of
44
+ ``(y_pred, y)`` or ``{'y_pred': y_pred, 'y': y, ...}``.
45
+ For more information on how metric works with :class:`~ignite.engine.engine.Engine`,
46
+ visit :ref:`attach-engine`.
47
+ .. include:: defaults.rst
48
+ :start-after: :orphan:
49
+ .. testcode::
50
+ coco = IgniteCocoMetric()
51
+ coco.attach(default_evaluator, 'coco')
52
+ preds = [
53
+ {
54
+ 'box': torch.Tensor([[1,1,1,2,2,2]]),
55
+ 'label':torch.Tensor([0]),
56
+ 'label_scores':torch.Tensor([0.8])
57
+ }
58
+ ]
59
+ target = [{'box': torch.Tensor([[1,1,1,2,2,2]]), 'label':torch.Tensor([0])}]
60
+ state = default_evaluator.run([[preds, target]])
61
+ print(state.metrics['coco'])
62
+ .. testoutput::
63
+ 1.0...
64
+ .. versionadded:: 0.4.3
65
+ """
66
+ self.box_key = box_key
67
+ self.label_key = label_key
68
+ self.pred_score_key = pred_score_key
69
+ if coco_metric_monai is None:
70
+ self.coco_metric = COCOMetric(classes=[0], iou_list=[0.1], max_detection=[100])
71
+ else:
72
+ self.coco_metric = coco_metric_monai
73
+ self.reduce_scalar = reduce_scalar
74
+
75
+ if device is None:
76
+ device = torch.device("cpu")
77
+ super(IgniteCocoMetric, self).__init__(output_transform=output_transform, device=device)
78
+
79
+ @reinit__is_reduced
80
+ def reset(self) -> None:
81
+ self.val_targets_all = []
82
+ self.val_outputs_all = []
83
+
84
+ @reinit__is_reduced
85
+ def update(self, output: Sequence[Dict]) -> None:
86
+ y_pred, y = output[0], output[1]
87
+ self.val_outputs_all += y_pred
88
+ self.val_targets_all += y
89
+
90
+ @sync_all_reduce("val_targets_all", "val_outputs_all")
91
+ def compute(self) -> float:
92
+ self.val_outputs_all = detach_to_numpy(self.val_outputs_all)
93
+ self.val_targets_all = detach_to_numpy(self.val_targets_all)
94
+
95
+ results_metric = matching_batch(
96
+ iou_fn=box_utils.box_iou,
97
+ iou_thresholds=self.coco_metric.iou_thresholds,
98
+ pred_boxes=[val_data_i[self.box_key] for val_data_i in self.val_outputs_all],
99
+ pred_classes=[val_data_i[self.label_key] for val_data_i in self.val_outputs_all],
100
+ pred_scores=[val_data_i[self.pred_score_key] for val_data_i in self.val_outputs_all],
101
+ gt_boxes=[val_data_i[self.box_key] for val_data_i in self.val_targets_all],
102
+ gt_classes=[val_data_i[self.label_key] for val_data_i in self.val_targets_all],
103
+ )
104
+ val_epoch_metric_dict = self.coco_metric(results_metric)[0]
105
+
106
+ if self.reduce_scalar:
107
+ val_epoch_metric = val_epoch_metric_dict.values()
108
+ val_epoch_metric = sum(val_epoch_metric) / len(val_epoch_metric)
109
+ return val_epoch_metric
110
+ else:
111
+ return val_epoch_metric_dict
scripts/detection_inferer.py ADDED
@@ -0,0 +1,66 @@
 
1
+ # Copyright (c) MONAI Consortium
2
+ # Licensed under the Apache License, Version 2.0 (the "License");
3
+ # you may not use this file except in compliance with the License.
4
+ # You may obtain a copy of the License at
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ # Unless required by applicable law or agreed to in writing, software
7
+ # distributed under the License is distributed on an "AS IS" BASIS,
8
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
9
+ # See the License for the specific language governing permissions and
10
+ # limitations under the License.
11
+
12
+ from typing import Any, List, Union
13
+
14
+ import numpy as np
15
+ import torch
16
+ from monai.apps.detection.networks.retinanet_detector import RetinaNetDetector
17
+ from monai.inferers.inferer import Inferer
18
+ from torch import Tensor
19
+
20
+
21
+ class RetinaNetInferer(Inferer):
22
+ """
23
+ RetinaNet inferer that takes a RetinaNetDetector as input.
24
+
25
+ Args:
26
+ detector: the RetinaNetDetector that converts network output BxCxMxN or BxCxMxNxP
27
+ feature maps into boxes and classification scores.
28
+ force_sliding_window: whether to force using a SlidingWindowInferer to do the inference.
29
+ If False, will check the input spatial size to decide whether to simply
30
+ forward the network or to use SlidingWindowInferer.
31
+ If True, will force using SlidingWindowInferer to do the inference.
32
+ args: other optional args to be passed to detector.
33
+ kwargs: other optional keyword args to be passed to detector.
34
+ """
35
+
36
+ def __init__(self, detector: RetinaNetDetector, force_sliding_window: bool = False) -> None:
37
+ Inferer.__init__(self)
38
+ self.detector = detector
39
+ self.sliding_window_size = None
40
+ self.force_sliding_window = force_sliding_window
41
+ if self.detector.inferer is not None:
42
+ if hasattr(self.detector.inferer, "roi_size"):
43
+ self.sliding_window_size = np.prod(self.detector.inferer.roi_size)
44
+
45
+ def __call__(self, inputs: Union[List[Tensor], Tensor], network: torch.nn.Module, *args: Any, **kwargs: Any):
46
+ """Unified callable function API of Inferers.
47
+ Args:
48
+ inputs: model input data for inference.
49
+ network: target detection network to execute inference.
50
+ supports callable that fullfilles requirements of network in
51
+ monai.apps.detection.networks.retinanet_detector.RetinaNetDetector``
52
+ args: optional args to be passed to ``network``.
53
+ kwargs: optional keyword args to be passed to ``network``.
54
+ """
55
+ self.detector.network = network
56
+ self.detector.training = self.detector.network.training
57
+
58
+ # if image smaller than sliding window roi size, no need to use sliding window inferer
59
+ # use sliding window inferer only when image is large
60
+ use_inferer = (
61
+ self.force_sliding_window
62
+ or self.sliding_window_size is not None
63
+ and not all([data_i[0, ...].numel() < self.sliding_window_size for data_i in inputs])
64
+ )
65
+
66
+ return self.detector(inputs, *args, use_inferer=use_inferer, **kwargs)
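
A note on the `use_inferer` expression above: because Python's `and` binds more tightly than `or`, it is equivalent to the explicitly parenthesized form below, i.e. sliding-window inference is used either when forced, or when at least one input image contains more voxels than the configured ROI:

    use_inferer = self.force_sliding_window or (
        self.sliding_window_size is not None
        and not all(data_i[0, ...].numel() < self.sliding_window_size for data_i in inputs)
    )
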
scripts/detection_saver.py ADDED
@@ -0,0 +1,126 @@
1
+ # Copyright (c) MONAI Consortium
2
+ # Licensed under the Apache License, Version 2.0 (the "License");
3
+ # you may not use this file except in compliance with the License.
4
+ # You may obtain a copy of the License at
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ # Unless required by applicable law or agreed to in writing, software
7
+ # distributed under the License is distributed on an "AS IS" BASIS,
8
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
9
+ # See the License for the specific language governing permissions and
10
+ # limitations under the License.
11
+
12
+ import json
13
+ import os
14
+ import warnings
15
+ from typing import TYPE_CHECKING, Callable, Optional
16
+
17
+ from monai.handlers.classification_saver import ClassificationSaver
18
+ from monai.utils import IgniteInfo, evenly_divisible_all_gather, min_version, optional_import, string_list_all_gather
19
+
20
+ from .utils import detach_to_numpy
21
+
22
+ idist, _ = optional_import("ignite", IgniteInfo.OPT_IMPORT_VERSION, min_version, "distributed")
23
+ Events, _ = optional_import("ignite.engine", IgniteInfo.OPT_IMPORT_VERSION, min_version, "Events")
24
+ if TYPE_CHECKING:
25
+ from ignite.engine import Engine
26
+ else:
27
+ Engine, _ = optional_import("ignite.engine", IgniteInfo.OPT_IMPORT_VERSION, min_version, "Engine")
28
+
29
+
30
+ class DetectionSaver(ClassificationSaver):
31
+ """
32
+ Event handler triggered on completing every iteration to save the detection predictions as a json file.
33
+ If running in distributed data parallel, only saves the json file on the specified rank.
34
+
35
+ """
36
+
37
+ def __init__(
38
+ self,
39
+ output_dir: str = "./",
40
+ filename: str = "predictions.json",
41
+ overwrite: bool = True,
42
+ batch_transform: Callable = lambda x: x,
43
+ output_transform: Callable = lambda x: x,
44
+ name: Optional[str] = None,
45
+ save_rank: int = 0,
46
+ pred_box_key: str = "box",
47
+ pred_label_key: str = "label",
48
+ pred_score_key: str = "label_scores",
49
+ ) -> None:
50
+ """
51
+ Args:
52
+ output_dir: if `saver=None`, output json file directory.
53
+ filename: if `saver=None`, name of the saved json file.
54
+ overwrite: if `saver=None`, whether to overwrite existing file content; if True,
55
+ will clear the file before saving. Otherwise, will append new content to the file.
56
+ batch_transform: a callable that is used to extract the `meta_data` dictionary of
57
+ the input images from `ignite.engine.state.batch`. the purpose is to get the input
58
+ filenames from the `meta_data` and store with classification results together.
59
+ `engine.state` and `batch_transform` inherit from the ignite concept:
60
+ https://pytorch.org/ignite/concepts.html#state, explanation and usage example are in the tutorial:
61
+ https://github.com/Project-MONAI/tutorials/blob/master/modules/batch_output_transform.ipynb.
62
+ output_transform: a callable that is used to extract the model prediction data from
63
+ `ignite.engine.state.output`. the first dimension of its output will be treated as
64
+ the batch dimension. each item in the batch will be saved individually.
65
+ `engine.state` and `output_transform` inherit from the ignite concept:
66
+ https://pytorch.org/ignite/concepts.html#state, explanation and usage example are in the tutorial:
67
+ https://github.com/Project-MONAI/tutorials/blob/master/modules/batch_output_transform.ipynb.
68
+ name: identifier of logging.logger to use, defaulting to `engine.logger`.
69
+ save_rank: only the handler on specified rank will save to json file in multi-gpus validation,
70
+ default to 0.
71
+ pred_box_key: box key in the prediction dict.
72
+ pred_label_key: classification label key in the prediction dict.
73
+ pred_score_key: classification score key in the prediction dict.
74
+
75
+ """
76
+ super().__init__(
77
+ output_dir=output_dir,
78
+ filename=filename,
79
+ overwrite=overwrite,
80
+ batch_transform=batch_transform,
81
+ output_transform=output_transform,
82
+ name=name,
83
+ save_rank=save_rank,
84
+ saver=None,
85
+ )
86
+ self.pred_box_key = pred_box_key
87
+ self.pred_label_key = pred_label_key
88
+ self.pred_score_key = pred_score_key
89
+
90
+ def _finalize(self, _engine: Engine) -> None:
91
+ """
92
+ All-gather detection results from all ranks and save them to a json file.
93
+
94
+ Args:
95
+ _engine: Ignite Engine, unused argument.
96
+ """
97
+ ws = idist.get_world_size()
98
+ if self.save_rank >= ws:
99
+ raise ValueError("target save rank is greater than the distributed group size.")
100
+
101
+ # self._outputs is supposed to be a list of dict
102
+ # self._outputs[i] should have at least three keys: pred_box_key, pred_label_key, pred_score_key
103
+ # self._filenames is supposed to be a list of str
104
+ outputs = self._outputs
105
+ filenames = self._filenames
106
+ if ws > 1:
107
+ outputs = evenly_divisible_all_gather(outputs, concat=False)
108
+ filenames = string_list_all_gather(filenames)
109
+
110
+ if len(filenames) != len(outputs):
111
+ warnings.warn(f"filenames length: {len(filenames)} doesn't match outputs length: {len(outputs)}.")
112
+
113
+ # save to json file only in the expected rank
114
+ if idist.get_rank() == self.save_rank:
115
+ results = [
116
+ {
117
+ self.pred_box_key: detach_to_numpy(o[self.pred_box_key]).tolist(),
118
+ self.pred_label_key: detach_to_numpy(o[self.pred_label_key]).tolist(),
119
+ self.pred_score_key: detach_to_numpy(o[self.pred_score_key]).tolist(),
120
+ "image": f,
121
+ }
122
+ for o, f in zip(outputs, filenames)
123
+ ]
124
+
125
+ with open(os.path.join(self.output_dir, self.filename), "w") as outfile:
126
+ json.dump(results, outfile, indent=4)
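
With the default keys, the saved `predictions.json` is a list with one record per input image. An illustrative (made-up) entry, assuming a single predicted box:

    [
        {
            "box": [[1.0, 1.0, 1.0, 2.0, 2.0, 2.0]],
            "label": [0],
            "label_scores": [0.8],
            "image": "example_image.nii.gz"
        }
    ]
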
scripts/evaluator.py ADDED
@@ -0,0 +1,173 @@
1
+ # Copyright (c) MONAI Consortium
2
+ # Licensed under the Apache License, Version 2.0 (the "License");
3
+ # you may not use this file except in compliance with the License.
4
+ # You may obtain a copy of the License at
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ # Unless required by applicable law or agreed to in writing, software
7
+ # distributed under the License is distributed on an "AS IS" BASIS,
8
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
9
+ # See the License for the specific language governing permissions and
10
+ # limitations under the License.
11
+
12
+ from __future__ import annotations
13
+
14
+ from typing import TYPE_CHECKING, Any, Callable, Dict, Iterable, List, Optional, Sequence, Tuple, Union
15
+
16
+ import torch
17
+ from monai.apps.detection.networks.retinanet_detector import RetinaNetDetector
18
+ from monai.engines.evaluator import SupervisedEvaluator
19
+ from monai.engines.utils import IterationEvents, default_metric_cmp_fn
20
+ from monai.transforms import Transform
21
+ from monai.utils import ForwardMode, IgniteInfo, min_version, optional_import
22
+ from monai.utils.enums import CommonKeys as Keys
23
+ from torch.utils.data import DataLoader
24
+
25
+ from .detection_inferer import RetinaNetInferer
26
+
27
+ if TYPE_CHECKING:
28
+ from ignite.engine import Engine, EventEnum
29
+ from ignite.metrics import Metric
30
+ else:
31
+ Engine, _ = optional_import("ignite.engine", IgniteInfo.OPT_IMPORT_VERSION, min_version, "Engine")
32
+ Metric, _ = optional_import("ignite.metrics", IgniteInfo.OPT_IMPORT_VERSION, min_version, "Metric")
33
+ EventEnum, _ = optional_import("ignite.engine", IgniteInfo.OPT_IMPORT_VERSION, min_version, "EventEnum")
34
+
35
+ __all__ = ["DetectionEvaluator"]
36
+
37
+
38
+ def detection_prepare_val_batch(
39
+ batchdata: List[Dict[str, torch.Tensor]],
40
+ device: Optional[Union[str, torch.device]] = None,
41
+ non_blocking: bool = False,
42
+ **kwargs,
43
+ ) -> Union[Tuple[torch.Tensor, Optional[torch.Tensor]], torch.Tensor]:
44
+ """
45
+ Default function to prepare the data for current iteration.
46
+ Args `batchdata`, `device`, `non_blocking` refer to the ignite API:
47
+ https://pytorch.org/ignite/v0.4.8/generated/ignite.engine.create_supervised_trainer.html.
48
+ `kwargs` supports other args for `Tensor.to()` API.
49
+ Returns:
50
+ image, label(optional).
51
+ """
52
+ inputs = [
53
+ batch_data_i["image"].to(device=device, non_blocking=non_blocking, **kwargs) for batch_data_i in batchdata
54
+ ]
55
+
56
+ if isinstance(batchdata[0].get(Keys.LABEL), torch.Tensor):
57
+ targets = [
58
+ dict(
59
+ label=batch_data_i["label"].to(device=device, non_blocking=non_blocking, **kwargs),
60
+ box=batch_data_i["box"].to(device=device, non_blocking=non_blocking, **kwargs),
61
+ )
62
+ for batch_data_i in batchdata
63
+ ]
64
+ return (inputs, targets)
65
+ return inputs, None
66
+
67
+
68
+ class DetectionEvaluator(SupervisedEvaluator):
69
+ """
70
+ Supervised detection evaluation method with image and label, inherits from ``SupervisedEvaluator`` and ``Workflow``.
71
+ Args:
72
+ device: an object representing the device on which to run.
73
+ val_data_loader: Ignite engine uses data_loader to run; must be Iterable, typically a torch.DataLoader.
74
+ network: detector to evaluate in the evaluator, should be regular PyTorch `torch.nn.Module`.
75
+ epoch_length: number of iterations for one epoch, default to `len(val_data_loader)`.
76
+ non_blocking: if True and this copy is between CPU and GPU, the copy may occur asynchronously
77
+ with respect to the host. For other cases, this argument has no effect.
78
+ prepare_batch: function to parse expected data (usually `image`, `label` and other network args)
79
+ from `engine.state.batch` for every iteration, for more details please refer to:
80
+ https://pytorch.org/ignite/generated/ignite.engine.create_supervised_trainer.html.
81
+ iteration_update: the callable function for every iteration, expect to accept `engine`
82
+ and `engine.state.batch` as inputs, return data will be stored in `engine.state.output`.
83
+ if not provided, use `self._iteration()` instead. for more details please refer to:
84
+ https://pytorch.org/ignite/generated/ignite.engine.engine.Engine.html.
85
+ inferer: inference method that execute model forward on input data, like: SlidingWindow, etc.
86
+ postprocessing: execute additional transformation for the model output data.
87
+ Typically, several Tensor based transforms composed by `Compose`.
88
+ key_val_metric: compute metric when every iteration completed, and save average value to
89
+ engine.state.metrics when epoch completed. key_val_metric is the main metric to compare and save the
90
+ checkpoint into files.
91
+ additional_metrics: more Ignite metrics that also attach to Ignite Engine.
92
+ metric_cmp_fn: function to compare current key metric with previous best key metric value,
93
+ it must accept 2 args (current_metric, previous_best) and return a bool result: if `True`, will update
94
+ `best_metric` and `best_metric_epoch` with current metric and epoch, default to `greater than`.
95
+ val_handlers: every handler is a set of Ignite Event-Handlers, must have `attach` function, like:
96
+ CheckpointHandler, StatsHandler, etc.
97
+ amp: whether to enable auto-mixed-precision evaluation, default is False.
98
+ mode: model forward mode during evaluation, should be 'eval' or 'train',
99
+ which maps to `model.eval()` or `model.train()`, default to 'eval'.
100
+ event_names: additional custom ignite events that will register to the engine.
101
+ new events can be a list of str or `ignite.engine.events.EventEnum`.
102
+ event_to_attr: a dictionary to map an event to a state attribute, then add to `engine.state`.
103
+ for more details, check: https://pytorch.org/ignite/generated/ignite.engine.engine.Engine.html
104
+ #ignite.engine.engine.Engine.register_events.
105
+ decollate: whether to decollate the batch-first data to a list of data after model computation,
106
+ recommend `decollate=True` when `postprocessing` uses components from `monai.transforms`.
107
+ default to `True`.
108
+ to_kwargs: dict of other args for `prepare_batch` API when converting the input data, except for
109
+ `device`, `non_blocking`.
110
+ amp_kwargs: dict of the args for `torch.cuda.amp.autocast()` API, for more details:
111
+ https://pytorch.org/docs/stable/amp.html#torch.cuda.amp.autocast.
112
+ """
113
+
114
+ def __init__(
115
+ self,
116
+ device: torch.device,
117
+ val_data_loader: Iterable | DataLoader,
118
+ network: RetinaNetDetector,
119
+ epoch_length: int | None = None,
120
+ non_blocking: bool = False,
121
+ prepare_batch: Callable = detection_prepare_val_batch,
122
+ iteration_update: Callable[[Engine, Any], Any] | None = None,
123
+ inferer: RetinaNetInferer | None = None,
124
+ postprocessing: Transform | None = None,
125
+ key_val_metric: dict[str, Metric] | None = None,
126
+ additional_metrics: dict[str, Metric] | None = None,
127
+ metric_cmp_fn: Callable = default_metric_cmp_fn,
128
+ val_handlers: Sequence | None = None,
129
+ amp: bool = False,
130
+ mode: ForwardMode | str = ForwardMode.EVAL,
131
+ event_names: list[str | EventEnum] | None = None,
132
+ event_to_attr: dict | None = None,
133
+ decollate: bool = True,
134
+ to_kwargs: dict | None = None,
135
+ amp_kwargs: dict | None = None,
136
+ ) -> None:
137
+ super().__init__(
138
+ device=device,
139
+ val_data_loader=val_data_loader,
140
+ network=network,
141
+ epoch_length=epoch_length,
142
+ non_blocking=non_blocking,
143
+ prepare_batch=prepare_batch,
144
+ iteration_update=iteration_update,
145
+ inferer=inferer,
146
+ postprocessing=postprocessing,
147
+ key_val_metric=key_val_metric,
148
+ additional_metrics=additional_metrics,
149
+ metric_cmp_fn=metric_cmp_fn,
150
+ val_handlers=val_handlers,
151
+ amp=amp,
152
+ mode=mode,
153
+ event_names=event_names,
154
+ event_to_attr=event_to_attr,
155
+ decollate=decollate,
156
+ to_kwargs=to_kwargs,
157
+ amp_kwargs=amp_kwargs,
158
+ )
159
+
160
+ def _register_decollate(self):
161
+ """
162
+ Register the decollate operation for batch data, will execute after model forward and loss forward.
163
+ """
164
+
165
+ @self.on(IterationEvents.MODEL_COMPLETED)
166
+ def _decollate_data(engine: Engine) -> None:
167
+ output_list = []
168
+ for i in range(len(engine.state.output[Keys.IMAGE])):
169
+ output_list.append({})
170
+ for k in engine.state.output.keys():
171
+ if engine.state.output[k] is not None:
172
+ output_list[i][k] = engine.state.output[k][i]
173
+ engine.state.output = output_list
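
A hedged wiring sketch of the evaluator together with the other components added in this commit; `detector` and `val_loader` are assumed to exist (normally they are built from the bundle configs), and the import paths assume `scripts` is importable as a package:

    import torch
    from scripts.detection_inferer import RetinaNetInferer
    from scripts.detection_saver import DetectionSaver
    from scripts.evaluator import DetectionEvaluator

    evaluator = DetectionEvaluator(
        device=torch.device("cuda:0"),
        val_data_loader=val_loader,    # assumed: yields dicts with "image", "box", "label"
        network=detector,              # assumed: a configured RetinaNetDetector
        inferer=RetinaNetInferer(detector),
        # IgniteCocoMetric is defined earlier in this commit; its output_transform should be
        # adapted to the engine output format used by the bundle configs.
        key_val_metric={"val_coco": IgniteCocoMetric()},
        val_handlers=[DetectionSaver(output_dir="./", filename="predictions.json")],
    )
    evaluator.run()
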
scripts/trainer.py ADDED
@@ -0,0 +1,228 @@
1
+ # Copyright (c) MONAI Consortium
2
+ # Licensed under the Apache License, Version 2.0 (the "License");
3
+ # you may not use this file except in compliance with the License.
4
+ # You may obtain a copy of the License at
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ # Unless required by applicable law or agreed to in writing, software
7
+ # distributed under the License is distributed on an "AS IS" BASIS,
8
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
9
+ # See the License for the specific language governing permissions and
10
+ # limitations under the License.
11
+
12
+ from __future__ import annotations
13
+
14
+ from typing import TYPE_CHECKING, Any, Callable, Dict, Iterable, List, Optional, Sequence, Tuple, Union
15
+
16
+ import torch
17
+ from monai.engines.trainer import Trainer
18
+ from monai.engines.utils import IterationEvents, default_metric_cmp_fn
19
+ from monai.inferers import Inferer
20
+ from monai.transforms import Transform
21
+ from monai.utils import IgniteInfo, min_version, optional_import
22
+ from monai.utils.enums import CommonKeys as Keys
23
+ from torch.optim.optimizer import Optimizer
24
+ from torch.utils.data import DataLoader
25
+
26
+ if TYPE_CHECKING:
27
+ from ignite.engine import Engine, EventEnum
28
+ from ignite.metrics import Metric
29
+ else:
30
+ Engine, _ = optional_import("ignite.engine", IgniteInfo.OPT_IMPORT_VERSION, min_version, "Engine")
31
+ Metric, _ = optional_import("ignite.metrics", IgniteInfo.OPT_IMPORT_VERSION, min_version, "Metric")
32
+ EventEnum, _ = optional_import("ignite.engine", IgniteInfo.OPT_IMPORT_VERSION, min_version, "EventEnum")
33
+
34
+ __all__ = ["DetectionTrainer"]
35
+
36
+
37
+ def detection_prepare_batch(
38
+ batchdata: List[Dict[str, torch.Tensor]],
39
+ device: Optional[Union[str, torch.device]] = None,
40
+ non_blocking: bool = False,
41
+ **kwargs,
42
+ ) -> Union[Tuple[torch.Tensor, Optional[torch.Tensor]], torch.Tensor]:
43
+ """
44
+ Default function to prepare the data for current iteration.
45
+ Args `batchdata`, `device`, `non_blocking` refer to the ignite API:
46
+ https://pytorch.org/ignite/v0.4.8/generated/ignite.engine.create_supervised_trainer.html.
47
+ `kwargs` supports other args for `Tensor.to()` API.
48
+ Returns:
49
+ image, label(optional).
50
+ """
51
+ inputs = [
52
+ batch_data_ii["image"].to(device=device, non_blocking=non_blocking, **kwargs)
53
+ for batch_data_i in batchdata
54
+ for batch_data_ii in batch_data_i
55
+ ]
56
+
57
+ if isinstance(batchdata[0][0].get(Keys.LABEL), torch.Tensor):
58
+ targets = [
59
+ dict(
60
+ label=batch_data_ii["label"].to(device=device, non_blocking=non_blocking, **kwargs),
61
+ box=batch_data_ii["box"].to(device=device, non_blocking=non_blocking, **kwargs),
62
+ )
63
+ for batch_data_i in batchdata
64
+ for batch_data_ii in batch_data_i
65
+ ]
66
+ return (inputs, targets)
67
+ return inputs, None
68
+
69
+
70
+ class DetectionTrainer(Trainer):
71
+ """
72
+ Supervised detection training method with image and label, inherits from ``Trainer`` and ``Workflow``.
73
+ Args:
74
+ device: an object representing the device on which to run.
75
+ max_epochs: the total epoch number for trainer to run.
76
+ train_data_loader: Ignite engine uses data_loader to run; must be Iterable or a torch.DataLoader.
77
+ detector: detector to train in the trainer, should be regular PyTorch `torch.nn.Module`.
78
+ optimizer: the optimizer associated to the detector, should be regular PyTorch optimizer from `torch.optim`
79
+ or its subclass.
80
+ epoch_length: number of iterations for one epoch, default to `len(train_data_loader)`.
81
+ non_blocking: if True and this copy is between CPU and GPU, the copy may occur asynchronously
82
+ with respect to the host. For other cases, this argument has no effect.
83
+ prepare_batch: function to parse expected data (usually `image`,`box`, `label` and other detector args)
84
+ from `engine.state.batch` for every iteration, for more details please refer to:
85
+ https://pytorch.org/ignite/generated/ignite.engine.create_supervised_trainer.html.
86
+ iteration_update: the callable function for every iteration, expect to accept `engine`
87
+ and `engine.state.batch` as inputs, return data will be stored in `engine.state.output`.
88
+ if not provided, use `self._iteration()` instead. for more details please refer to:
89
+ https://pytorch.org/ignite/generated/ignite.engine.engine.Engine.html.
90
+ inferer: inference method that execute model forward on input data, like: SlidingWindow, etc.
91
+ postprocessing: execute additional transformation for the model output data.
92
+ Typically, several Tensor based transforms composed by `Compose`.
93
+ key_train_metric: compute metric when every iteration completed, and save average value to
94
+ engine.state.metrics when epoch completed. key_train_metric is the main metric to compare and save the
95
+ checkpoint into files.
96
+ additional_metrics: more Ignite metrics that also attach to Ignite Engine.
97
+ metric_cmp_fn: function to compare current key metric with previous best key metric value,
98
+ it must accept 2 args (current_metric, previous_best) and return a bool result: if `True`, will update
99
+ `best_metric` and `best_metric_epoch` with current metric and epoch, default to `greater than`.
100
+ train_handlers: every handler is a set of Ignite Event-Handlers, must have `attach` function, like:
101
+ CheckpointHandler, StatsHandler, etc.
102
+ amp: whether to enable auto-mixed-precision training, default is False.
103
+ event_names: additional custom ignite events that will register to the engine.
104
+ new events can be a list of str or `ignite.engine.events.EventEnum`.
105
+ event_to_attr: a dictionary to map an event to a state attribute, then add to `engine.state`.
106
+ for more details, check: https://pytorch.org/ignite/generated/ignite.engine.engine.Engine.html
107
+ #ignite.engine.engine.Engine.register_events.
108
+ decollate: whether to decollate the batch-first data to a list of data after model computation,
109
+ recommend `decollate=True` when `postprocessing` uses components from `monai.transforms`.
110
+ default to `True`.
111
+ optim_set_to_none: when calling `optimizer.zero_grad()`, instead of setting to zero, set the grads to None.
112
+ more details: https://pytorch.org/docs/stable/generated/torch.optim.Optimizer.zero_grad.html.
113
+ to_kwargs: dict of other args for `prepare_batch` API when converting the input data, except for
114
+ `device`, `non_blocking`.
115
+ amp_kwargs: dict of the args for `torch.cuda.amp.autocast()` API, for more details:
116
+ https://pytorch.org/docs/stable/amp.html#torch.cuda.amp.autocast.
117
+ """
118
+
119
+ def __init__(
120
+ self,
121
+ device: torch.device,
122
+ max_epochs: int,
123
+ train_data_loader: Iterable | DataLoader,
124
+ detector: torch.nn.Module,
125
+ optimizer: Optimizer,
126
+ epoch_length: int | None = None,
127
+ non_blocking: bool = False,
128
+ prepare_batch: Callable = detection_prepare_batch,
129
+ iteration_update: Callable[[Engine, Any], Any] | None = None,
130
+ inferer: Inferer | None = None,
131
+ postprocessing: Transform | None = None,
132
+ key_train_metric: dict[str, Metric] | None = None,
133
+ additional_metrics: dict[str, Metric] | None = None,
134
+ metric_cmp_fn: Callable = default_metric_cmp_fn,
135
+ train_handlers: Sequence | None = None,
136
+ amp: bool = False,
137
+ event_names: list[str | EventEnum] | None = None,
138
+ event_to_attr: dict | None = None,
139
+ decollate: bool = True,
140
+ optim_set_to_none: bool = False,
141
+ to_kwargs: dict | None = None,
142
+ amp_kwargs: dict | None = None,
143
+ ) -> None:
144
+ super().__init__(
145
+ device=device,
146
+ max_epochs=max_epochs,
147
+ data_loader=train_data_loader,
148
+ epoch_length=epoch_length,
149
+ non_blocking=non_blocking,
150
+ prepare_batch=prepare_batch,
151
+ iteration_update=iteration_update,
152
+ postprocessing=postprocessing,
153
+ key_metric=key_train_metric,
154
+ additional_metrics=additional_metrics,
155
+ metric_cmp_fn=metric_cmp_fn,
156
+ handlers=train_handlers,
157
+ amp=amp,
158
+ event_names=event_names,
159
+ event_to_attr=event_to_attr,
160
+ decollate=decollate,
161
+ to_kwargs=to_kwargs,
162
+ amp_kwargs=amp_kwargs,
163
+ )
164
+
165
+ self.detector = detector
166
+ self.optimizer = optimizer
167
+ self.optim_set_to_none = optim_set_to_none
168
+
169
+ def _iteration(self, engine, batchdata: dict[str, torch.Tensor]):
170
+ """
171
+ Callback function for the Supervised Training processing logic of 1 iteration in Ignite Engine.
172
+ Return below items in a dictionary:
173
+ - IMAGE: image Tensor data for model input, already moved to device.
174
+ - LABEL: ground-truth targets (boxes and labels) corresponding to the images, already moved to device.
175
+ - the classification loss and box regression loss, stored under the detector's ``cls_key`` and ``box_reg_key``.
176
+ - LOSS: weighted sum of the classification and box regression losses.
177
+ Args:
178
+ engine: `DetectionTrainer` to execute operation for an iteration.
179
+ batchdata: input data for this iteration, usually can be dictionary or tuple of Tensor data.
180
+ Raises:
181
+ ValueError: When ``batchdata`` is None.
182
+ """
183
+
184
+ if batchdata is None:
185
+ raise ValueError("Must provide batch data for current iteration.")
186
+
187
+ batch = engine.prepare_batch(batchdata, engine.state.device, engine.non_blocking, **engine.to_kwargs)
188
+ if len(batch) == 2:
189
+ inputs, targets = batch
190
+ args: tuple = ()
191
+ kwargs: dict = {}
192
+ else:
193
+ inputs, targets, args, kwargs = batch
194
+ # put iteration outputs into engine.state
195
+ engine.state.output = {Keys.IMAGE: inputs, Keys.LABEL: targets}
196
+
197
+ def _compute_pred_loss(w_cls: float = 1.0, w_box_reg: float = 1.0):
198
+ """
199
+ Args:
200
+ w_cls: weight of classification loss
201
+ w_box_reg: weight of box regression loss
202
+ """
203
+ outputs = engine.detector(inputs, targets)
204
+ engine.state.output[engine.detector.cls_key] = outputs[engine.detector.cls_key]
205
+ engine.state.output[engine.detector.box_reg_key] = outputs[engine.detector.box_reg_key]
206
+ engine.state.output[Keys.LOSS] = (
207
+ w_cls * outputs[engine.detector.cls_key] + w_box_reg * outputs[engine.detector.box_reg_key]
208
+ )
209
+ engine.fire_event(IterationEvents.LOSS_COMPLETED)
210
+
211
+ engine.detector.train()
212
+ engine.optimizer.zero_grad(set_to_none=engine.optim_set_to_none)
213
+
214
+ if engine.amp and engine.scaler is not None:
215
+ with torch.cuda.amp.autocast(**engine.amp_kwargs):
216
+ inputs = [img.to(torch.float16) for img in inputs]
217
+ _compute_pred_loss()
218
+ engine.scaler.scale(engine.state.output[Keys.LOSS]).backward()
219
+ engine.fire_event(IterationEvents.BACKWARD_COMPLETED)
220
+ engine.scaler.step(engine.optimizer)
221
+ engine.scaler.update()
222
+ else:
223
+ _compute_pred_loss()
224
+ engine.state.output[Keys.LOSS].backward()
225
+ engine.fire_event(IterationEvents.BACKWARD_COMPLETED)
226
+ engine.optimizer.step()
227
+
228
+ return engine.state.output
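
Note that `detection_prepare_batch` above expects a nested batch (one inner list of patch-level dicts per image, which it flattens), while the evaluator's `detection_prepare_val_batch` expects a flat list of per-image dicts. A small illustrative sketch with made-up shapes:

    import torch
    from scripts.evaluator import detection_prepare_val_batch
    from scripts.trainer import detection_prepare_batch

    # trainer: list (batch) of lists (patches per image) of dicts
    train_batch = [
        [{"image": torch.rand(1, 192, 192, 80), "box": torch.rand(2, 6), "label": torch.tensor([0, 0])}],
        [{"image": torch.rand(1, 192, 192, 80), "box": torch.rand(1, 6), "label": torch.tensor([0])}],
    ]
    train_inputs, train_targets = detection_prepare_batch(train_batch, device="cpu")

    # evaluator: flat list of per-image dicts
    val_batch = [{"image": torch.rand(1, 512, 512, 200), "box": torch.rand(3, 6), "label": torch.tensor([0, 0, 0])}]
    val_inputs, val_targets = detection_prepare_val_batch(val_batch, device="cpu")
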
scripts/utils.py ADDED
@@ -0,0 +1,26 @@
1
+ from typing import Dict, List, Union
2
+
3
+ import numpy as np
4
+ import torch
5
+
6
+
7
+ def detach_to_numpy(data: Union[List, Dict, torch.Tensor]) -> Union[List, Dict, torch.Tensor]:
8
+ """
9
+ Recursively detach tensors in ``data`` and convert them to numpy arrays.
10
+ """
11
+ if isinstance(data, torch.Tensor):
12
+ return data.cpu().detach().numpy() # pytype: disable=attribute-error
13
+
14
+ elif isinstance(data, np.ndarray):
15
+ return data
16
+
17
+ elif isinstance(data, list):
18
+ return [detach_to_numpy(d) for d in data]
19
+
20
+ elif isinstance(data, dict):
21
+ for k in data.keys():
22
+ data[k] = detach_to_numpy(data[k])
23
+ return data
24
+
25
+ else:
26
+ raise ValueError("data should be tensor, numpy array, dict, or list.")
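
A tiny usage sketch of the helper above:

    import torch

    out = detach_to_numpy({"box": torch.tensor([[1.0, 1.0, 1.0, 2.0, 2.0, 2.0]]), "scores": [torch.tensor(0.8)]})
    # out["box"] is now a numpy array of shape (1, 6); out["scores"] is a list containing a 0-d numpy array
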
scripts/warmup_scheduler.py ADDED
@@ -0,0 +1,89 @@
1
+ # Copyright (c) MONAI Consortium
2
+ # Licensed under the Apache License, Version 2.0 (the "License");
3
+ # you may not use this file except in compliance with the License.
4
+ # You may obtain a copy of the License at
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ # Unless required by applicable law or agreed to in writing, software
7
+ # distributed under the License is distributed on an "AS IS" BASIS,
8
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
9
+ # See the License for the specific language governing permissions and
10
+ # limitations under the License.
11
+
12
+ """
13
+ This script is adapted from
14
+ https://github.com/ildoonet/pytorch-gradual-warmup-lr/blob/master/warmup_scheduler/scheduler.py
15
+ """
16
+
17
+ from torch.optim.lr_scheduler import ReduceLROnPlateau, _LRScheduler
18
+
19
+
20
+ class GradualWarmupScheduler(_LRScheduler):
21
+ """Gradually warms up (increases) the learning rate in the optimizer.
22
+ Proposed in 'Accurate, Large Minibatch SGD: Training ImageNet in 1 Hour'.
23
+
24
+ Args:
25
+ optimizer (Optimizer): Wrapped optimizer.
26
+ multiplier: target learning rate = base lr * multiplier if multiplier > 1.0.
27
+ if multiplier = 1.0, lr starts from 0 and ends up with the base_lr.
28
+ total_epoch: the target learning rate is reached gradually at total_epoch.
29
+ after_scheduler: after total_epoch, use this scheduler (e.g. ReduceLROnPlateau).
30
+ """
31
+
32
+ def __init__(self, optimizer, multiplier, total_epoch, after_scheduler=None):
33
+ self.multiplier = multiplier
34
+ if self.multiplier < 1.0:
35
+ raise ValueError("multiplier should be greater than or equal to 1.")
36
+ self.total_epoch = total_epoch
37
+ self.after_scheduler = after_scheduler
38
+ self.finished = False
39
+ super(GradualWarmupScheduler, self).__init__(optimizer)
40
+
41
+ def get_lr(self):
42
+ self.last_epoch = max(1, self.last_epoch) # to avoid epoch=0 thus lr=0
43
+ if self.last_epoch > self.total_epoch:
44
+ if self.after_scheduler:
45
+ if not self.finished:
46
+ self.after_scheduler.base_lrs = [base_lr * self.multiplier for base_lr in self.base_lrs]
47
+ self.finished = True
48
+ return self.after_scheduler.get_last_lr()
49
+ return [base_lr * self.multiplier for base_lr in self.base_lrs]
50
+
51
+ if self.multiplier == 1.0:
52
+ return [base_lr * (float(self.last_epoch) / self.total_epoch) for base_lr in self.base_lrs]
53
+ else:
54
+ return [
55
+ base_lr * ((self.multiplier - 1.0) * self.last_epoch / self.total_epoch + 1.0)
56
+ for base_lr in self.base_lrs
57
+ ]
58
+
59
+ def step_reduce_lr_on_plateau(self, metrics, epoch=None):
60
+ if epoch is None:
61
+ epoch = self.last_epoch + 1
62
+ self.last_epoch = (
63
+ epoch if epoch != 0 else 1
64
+ ) # ReduceLROnPlateau is called at the end of epoch, whereas others are called at beginning
65
+ if self.last_epoch <= self.total_epoch:
66
+ warmup_lr = [
67
+ base_lr * ((self.multiplier - 1.0) * self.last_epoch / self.total_epoch + 1.0)
68
+ for base_lr in self.base_lrs
69
+ ]
70
+ for param_group, lr in zip(self.optimizer.param_groups, warmup_lr):
71
+ param_group["lr"] = lr
72
+ else:
73
+ if epoch is None:
74
+ self.after_scheduler.step(metrics, None)
75
+ else:
76
+ self.after_scheduler.step(metrics, epoch - self.total_epoch)
77
+
78
+ def step(self, epoch=None, metrics=None):
79
+ if not isinstance(self.after_scheduler, ReduceLROnPlateau):
80
+ if self.finished and self.after_scheduler:
81
+ if epoch is None:
82
+ self.after_scheduler.step(None)
83
+ else:
84
+ self.after_scheduler.step(epoch - self.total_epoch)
85
+ self._last_lr = self.after_scheduler.get_last_lr()
86
+ else:
87
+ return super(GradualWarmupScheduler, self).step(epoch)
88
+ else:
89
+ self.step_reduce_lr_on_plateau(metrics, epoch)
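
A hedged usage sketch of the warm-up scheduler defined above; the model, optimizer, and epoch counts are illustrative only:

    import torch
    from torch.optim.lr_scheduler import StepLR

    model = torch.nn.Linear(4, 2)
    optimizer = torch.optim.SGD(model.parameters(), lr=1e-2)

    # ramp the lr linearly from ~0 up to the base lr (1e-2) over the first 10 epochs, then defer to StepLR
    scheduler = GradualWarmupScheduler(
        optimizer,
        multiplier=1.0,
        total_epoch=10,
        after_scheduler=StepLR(optimizer, step_size=30, gamma=0.1),
    )
    for epoch in range(40):
        # ... one epoch of training with `optimizer` ...
        scheduler.step()
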