Source code for InnerEye.ML.configs.segmentation.HeadAndNeckBase

#  ------------------------------------------------------------------------------------------
#  Copyright (c) Microsoft Corporation. All rights reserved.
#  Licensed under the MIT License (MIT). See LICENSE in the repo root for license information.
#  ------------------------------------------------------------------------------------------
import random
from typing import Any, List, Optional

import pandas as pd

from InnerEye.Common.type_annotations import TupleInt3
from InnerEye.ML.config import MixtureLossComponent, PhotometricNormalizationMethod, SegmentationLoss, \
    SegmentationModelBase, SliceExclusionRule, SummedProbabilityRule, equally_weighted_classes
from InnerEye.ML.deep_learning_config import OptimizerType
from InnerEye.ML.utils.model_metadata_util import generate_random_colours_list
from InnerEye.ML.utils.split_dataset import DatasetSplits

RANDOM_COLOUR_GENERATOR = random.Random(0)


[docs]class HeadAndNeckBase(SegmentationModelBase):
    """
    Head and Neck radiotherapy image segmentation model.

    This configuration needs to be supplied with a value for azure_dataset_id that refers to your
    dataset. You may also supply a value for num_structures, feature_channels or any other feature. For example,
    with the appropriate dataset, this would build the model whose results are reported in the `InnerEye team's
    paper <https://pubmed.ncbi.nlm.nih.gov/33252691/>`_::

        class HeadAndNeckPaper(HeadAndNeckBase):
            def __init__(self):
                super().__init__(
                    azure_dataset_id="foo_bar_baz",
                    num_structures=10
                )

    """

    def __init__(self,
                 ground_truth_ids: List[str],
                 ground_truth_ids_display_names: Optional[List[str]] = None,
                 colours: Optional[List[TupleInt3]] = None,
                 fill_holes: Optional[List[bool]] = None,
                 roi_interpreted_types: Optional[List[str]] = None,
                 class_weights: Optional[List[float]] = None,
                 slice_exclusion_rules: Optional[List[SliceExclusionRule]] = None,
                 summed_probability_rules: Optional[List[SummedProbabilityRule]] = None,
                 num_feature_channels: Optional[int] = None,
                 **kwargs: Any) -> None:
        """
        Creates a new instance of the class.

        :param ground_truth_ids: List of ground truth ids.
        :param ground_truth_ids_display_names: Optional list of ground truth id display names. If
            present then must be of the same length as ground_truth_ids.

        :param colours: Optional list of colours. If
            present then must be of the same length as ground_truth_ids.

        :param fill_holes: Optional list of fill hole flags. If
            present then must be of the same length as ground_truth_ids.

        :param roi_interpreted_types: Optional list of roi_interpreted_types. If
            present then must be of the same length as ground_truth_ids.

        :param class_weights: Optional list of class weights. If
            present then must be of the same length as ground_truth_ids + 1.

        :param slice_exclusion_rules: Optional list of SliceExclusionRules.
        :param summed_probability_rules: Optional list of SummedProbabilityRule.
        :param num_feature_channels: Optional number of feature channels.
        :param kwargs: Additional arguments that will be passed through to the SegmentationModelBase constructor.
        """
        # Number of training epochs
        num_epochs = 120
        num_structures = len(ground_truth_ids)
        colours = colours or generate_random_colours_list(RANDOM_COLOUR_GENERATOR, num_structures)
        fill_holes = fill_holes or [True] * num_structures
        roi_interpreted_types = roi_interpreted_types or ["ORGAN"] * num_structures
        ground_truth_ids_display_names = ground_truth_ids_display_names or [f"zz_{x}" for x in ground_truth_ids]
        # The amount of GPU memory required increases with both the number of structures and the
        # number of feature channels. The following is a sensible default to avoid out-of-memory,
        # but you can override is by passing in another (singleton list) value for feature_channels
        # from a subclass.
        num_feature_channels = num_feature_channels or (32 if num_structures <= 20 else 26)
        bg_weight = 0.02 if len(ground_truth_ids) > 1 else 0.25
        class_weights = class_weights or equally_weighted_classes(ground_truth_ids, background_weight=bg_weight)
        # In case of vertical overlap between brainstem and spinal_cord, we separate them
        # by converting brainstem voxels to cord, as the latter is clinically more sensitive.
        # We do the same to separate SPC and MPC; in this case, the direction of change is unimportant,
        # so we choose SPC-to-MPC arbitrarily.
        slice_exclusion_rules = slice_exclusion_rules or []
        summed_probability_rules = summed_probability_rules or []
        super().__init__(
            should_validate=False,  # we'll validate after kwargs are added
            num_epochs=num_epochs,
            architecture="UNet3D",
            kernel_size=3,
            train_batch_size=1,
            inference_batch_size=1,
            feature_channels=[num_feature_channels],
            crop_size=(96, 288, 288),
            test_crop_size=(144, 512, 512),
            inference_stride_size=(72, 256, 256),
            image_channels=["ct"],
            norm_method=PhotometricNormalizationMethod.CtWindow,
            level=50,
            window=600,
            l_rate=1e-3,
            min_l_rate=1e-5,
            l_rate_polynomial_gamma=0.9,
            optimizer_type=OptimizerType.Adam,
            opt_eps=1e-4,
            adam_betas=(0.9, 0.999),
            momentum=0.9,
            use_mixed_precision=True,
            use_model_parallel=True,
            monitoring_interval_seconds=0,
            num_dataload_workers=2,
            loss_type=SegmentationLoss.Mixture,
            mixture_loss_components=[MixtureLossComponent(0.5, SegmentationLoss.Focal, 0.2),
                                     MixtureLossComponent(0.5, SegmentationLoss.SoftDice, 0.1)],
            ground_truth_ids=ground_truth_ids,
            ground_truth_ids_display_names=ground_truth_ids_display_names,
            largest_connected_component_foreground_classes=ground_truth_ids,
            colours=colours,
            fill_holes=fill_holes,
            roi_interpreted_types=roi_interpreted_types,
            class_weights=class_weights,
            slice_exclusion_rules=slice_exclusion_rules,
            summed_probability_rules=summed_probability_rules,
        )
        self.add_and_validate(kwargs)

[docs]    def get_model_train_test_dataset_splits(self, dataset_df: pd.DataFrame) -> DatasetSplits:
        return DatasetSplits.from_proportions(dataset_df, proportion_train=0.8, proportion_val=0.05,
                                              proportion_test=0.15,
                                              random_seed=0)