-
Notifications
You must be signed in to change notification settings - Fork 3
Expand file tree
/
Copy pathpredict.py
More file actions
294 lines (255 loc) · 12.5 KB
/
predict.py
File metadata and controls
294 lines (255 loc) · 12.5 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
import os
import random
import time
from typing import Dict, List, Optional, Union
import monai.transforms as mt
import numpy as np
import torch
import typer
from autopet3.datacentric.utils import SimpleParser, get_file_dict_nn, read_split
from autopet3.fixed.dynunet import NNUnet
from autopet3.fixed.evaluation import AutoPETMetricAggregator
from autopet3.fixed.utils import plot_results
from omegaconf import OmegaConf
from tqdm import tqdm
# Typer CLI application; subcommands are registered below via @app.command().
app = typer.Typer()
class PredictModel:
    """Ensemble predictor for AutoPET CT/PET segmentation.

    The PredictModel class is responsible for preprocessing input data, loading and evaluating
    models, and making predictions using an ensemble of models. It also supports test-time
    augmentation (TTA) for improved predictions. The class can run the prediction pipeline on
    CT and PET image files, save the output, and optionally evaluate the results.

    Example Usage:
        # Create an instance of PredictModel
        model_paths = ["model1.ckpt", "model2.ckpt", "model3.ckpt"]
        predictor = PredictModel(model_paths, sw_batch_size=6, tta=True, random_flips=2)

        # Run the prediction pipeline
        ct_file_path = "ct_image.nii.gz"
        pet_file_path = "pet_image.nii.gz"
        label = "label_image.nii.gz"
        save_path = "output_folder"
        metrics = predictor.run(ct_file_path, pet_file_path, label=label, save_path=save_path, verbose=True)
    """

    def __init__(self, model_paths: List[str], sw_batch_size: int = 6, tta: bool = False, random_flips: int = 0):
        """Initialize the class with the given parameters.

        Args:
            model_paths (List[str]): List of model checkpoint paths forming the ensemble.
            sw_batch_size (int, optional): Sliding-window batch size for the model. Defaults to 6.
            tta (bool, optional): Flag for test-time augmentation. Defaults to False.
            random_flips (int, optional): Number of randomly sampled flips used for TTA;
                0 means apply all flip combinations. Defaults to 0.

        Returns:
            None
        """
        self.ckpts = model_paths
        self.transform = None  # unused placeholder; transforms are built inside preprocess()
        self.sw_batch_size = sw_batch_size
        self.tta = tta
        # All non-empty subsets of the spatial axes (dims 2, 3, 4 of an N,C,D,H,W tensor).
        self.tta_flips = [[2], [3], [4], [2, 3], [2, 4], [3, 4], [2, 3, 4]]
        # Clamp to the number of available flip combinations (7).
        self.random_flips = np.clip(random_flips, 0, len(self.tta_flips))

    @staticmethod
    def preprocess(input: Dict[str, str]) -> torch.Tensor:
        """Preprocess the input data by applying a series of transformations to the CT and PET images.

        Args:
            input (Dict[str, str]): A dictionary with keys "ct" and "pet" mapping to image file paths.

        Returns:
            torch.Tensor: The preprocessed 2-channel (CT, PET) volume with a leading batch dimension.
        """
        # Intensity windows and normalization statistics for CT and PET images
        # (presumably estimated on the AutoPET training set — TODO confirm).
        ct_percentiles = (-832.062744140625, 1127.758544921875)
        ct_norm = torch.Tensor((107.73438968591431, 286.34403119451997))
        pet_percentiles = (1.0433332920074463, 51.211158752441406)
        pet_norm = torch.Tensor((7.063827929027176, 7.960414805306728))
        # Target voxel spacing for resampling the images.
        spacing = (2.0364201068878174, 2.03642010688781740, 3.0)
        # Define a list of transforms
        keys = ["ct", "pet"]
        transforms = [
            mt.LoadImaged(keys=keys),
            mt.EnsureChannelFirstd(keys=keys),
            mt.EnsureTyped(keys=keys),
            mt.Orientationd(keys=keys, axcodes="LAS"),
            mt.Spacingd(
                keys=keys,
                pixdim=spacing,
                mode="bilinear",
            ),
            # The next four transforms map each modality into [0, 1] and then straight back to
            # its original range; since both steps use clip=True, the net effect is clipping
            # the intensities to the percentile window while keeping the original units.
            mt.ScaleIntensityRanged(
                keys=["ct"], a_min=ct_percentiles[0], a_max=ct_percentiles[1], b_min=0, b_max=1, clip=True
            ),
            mt.ScaleIntensityRanged(
                keys=["pet"], a_min=pet_percentiles[0], a_max=pet_percentiles[1], b_min=0, b_max=1, clip=True
            ),
            mt.ScaleIntensityRanged(
                keys=["ct"], a_min=0, a_max=1, b_min=ct_percentiles[0], b_max=ct_percentiles[1], clip=True
            ),
            mt.ScaleIntensityRanged(
                keys=["pet"], a_min=0, a_max=1, b_min=pet_percentiles[0], b_max=pet_percentiles[1], clip=True
            ),
            # Standard z-score normalization per modality with the fixed statistics above.
            mt.NormalizeIntensityd(keys=["ct"], subtrahend=ct_norm[0], divisor=ct_norm[1]),
            mt.NormalizeIntensityd(keys=["pet"], subtrahend=pet_norm[0], divisor=pet_norm[1]),
            # Stack CT and PET into a single 2-channel "image" tensor.
            mt.ConcatItemsd(keys=keys, name="image", dim=0),
            # NOTE(review): EnsureTyped already appeared earlier; this second pass plus
            # ToTensord looks redundant but is kept as-is.
            mt.EnsureTyped(keys=keys),
            mt.ToTensord(keys=keys),
        ]
        # Compose and apply the transforms, add batch dimension
        transform = mt.Compose(transforms)
        output = transform(input)["image"][None, ...]
        return output

    def load_and_evaluate_model(self, model_path: str, input: torch.Tensor) -> torch.Tensor:
        """Load a model from a given path and evaluate it on the input tensor.

        Args:
            model_path (str): The path to the model checkpoint.
            input (torch.Tensor): The input tensor for evaluation.

        Returns:
            torch.Tensor: Sigmoid probabilities predicted by this single model.
        """
        net = NNUnet.load_from_checkpoint(model_path, sw_batch_size=self.sw_batch_size)
        net.eval()
        net.cuda()  # NOTE(review): assumes a CUDA device is available — no CPU fallback
        # bfloat16 autocast reduces memory/time during sliding-window inference.
        with torch.no_grad(), torch.autocast(device_type="cuda", dtype=torch.bfloat16):
            if self.tta:
                pred = self.tta_inference(net, input)
            else:
                pred = net.forward_logits(input)
        # Convert logits to probabilities before ensembling.
        return torch.sigmoid(pred)

    def predict_ensemble(self, input: torch.Tensor) -> torch.Tensor:
        """Predict the class label for the given input using an ensemble of models.

        Args:
            input (torch.Tensor): The input tensor to be predicted.

        Returns:
            torch.Tensor: Boolean mask from thresholding the mean ensemble probability at 0.5.
        """
        # Models are loaded one at a time (memory-friendly) and their probabilities averaged.
        predictions = [self.load_and_evaluate_model(model, input) for model in self.ckpts]
        averaged_predictions = torch.mean(torch.stack(predictions), dim=0)
        return torch.ge(averaged_predictions, 0.5)

    def tta_inference(self, model: NNUnet, input: torch.Tensor) -> torch.Tensor:
        """Perform test-time augmentation (TTA) inference on the given model and input tensor.

        Runs the model on the unmodified input plus a set of flipped variants — flipping each
        prediction back to the original orientation before accumulating — and returns the
        averaged logits.

        Args:
            model (NNUnet): The model to perform inference on.
            input (torch.Tensor): The input tensor to be augmented and evaluated.

        Returns:
            torch.Tensor: Logits averaged over the identity pass and all applied flips.
        """
        prediction = model.forward_logits(input)
        # random_flips == 0 -> use every flip combination; otherwise sample a random subset.
        if self.random_flips == 0:
            flips_to_apply = self.tta_flips
        else:
            flips_to_apply = random.sample(self.tta_flips, self.random_flips)
        for flip_idx in flips_to_apply:
            # Flip input, predict, then flip the prediction back (flip is an involution).
            prediction += self.flip(model.forward_logits(self.flip(input, flip_idx)), flip_idx)
        prediction /= len(flips_to_apply) + 1  # +1 accounts for the unflipped prediction
        return prediction

    @staticmethod
    def flip(data: torch.Tensor, axis: List[int]) -> torch.Tensor:
        """Flip `data` along the given dimensions."""
        return torch.flip(data, dims=axis)

    def run(
        self,
        ct_file_path: str,
        pet_file_path: str,
        label: Optional[str] = None,
        save_path: Optional[str] = None,
        verbose: bool = False,
    ) -> Union[int, dict]:
        """Run the prediction pipeline on the given CT and PET image files.

        Args:
            ct_file_path (str): The path to the CT image file.
            pet_file_path (str): The path to the PET image file.
            label (str, optional): The path to the ground truth label image file. Defaults to None.
            save_path (str, optional): The path to save the output image. Defaults to None.
            verbose (bool, optional): Whether to print the timings. Defaults to False.

        Returns:
            int: 0 if the pipeline is successfully run, or dict containing the metrics if
            evaluation (a label) is enabled.

        This function performs the following steps:
        1. Preprocessing: loads the PET image (kept as the geometry reference) and applies
           preprocessing to the CT and PET images.
        2. Prediction: predicts the output using the model ensemble (with TTA if enabled).
        3. Save Output: resamples the prediction to match the reference image and saves it
           as a NIfTI file when `save_path` is given.
        4. Evaluation (optional): if a label image is provided, computes metrics against it
           and returns them (timings are not printed in this branch).
        5. Print Timings: prints timings for preprocessing, prediction, saving, and total time.
        """
        start_time = time.time()

        # Preprocessing — the raw PET image defines the grid the prediction is resampled to.
        reference = mt.LoadImage()(pet_file_path)
        data = self.preprocess({"ct": ct_file_path, "pet": pet_file_path})
        preprocessing_time = time.time() - start_time

        # Prediction
        start_prediction = time.time()
        prediction = self.predict_ensemble(data.cuda())
        prediction_time = time.time() - start_prediction

        # Resample the binary mask back onto the original PET grid and optionally save it.
        start_saving = time.time()
        output = mt.ResampleToMatch()(prediction[0], reference[None, ...], mode="nearest")
        if save_path is not None:
            mt.SaveImage(
                output_dir=save_path,
                output_ext=".nii.gz",
                output_postfix="pred",
                separate_folder=False,
                output_dtype=np.uint8,
            )(output[0])
        saving_time = time.time() - start_saving

        # Evaluation — only when a ground-truth label path is provided.
        if label is not None:
            ground_truth = mt.LoadImage()(label)
            test_aggregator = AutoPETMetricAggregator()
            test_aggregator(output[0], ground_truth)
            metrics = test_aggregator.compute()
            # Multiply the FP/FN voxel counts by the voxel volume (pixdim product / 1000 -> ml).
            volume = np.prod(reference.meta["pixdim"][1:4]) / 1000
            metrics = {
                "dice_score": metrics["dice_score"],
                "fp_volume": metrics["false_positives"] * volume,
                "fn_volume": metrics["false_negatives"] * volume,
            }
            if verbose:
                plot_results(output[0], ground_truth)
                print("Spacing:", reference.meta["pixdim"][1:4])
                print(metrics)
            return metrics

        if verbose:
            total_time = time.time() - start_time
            print(f"Data preprocessing time: {preprocessing_time} seconds")
            print(f"Prediction time: {prediction_time} seconds")
            print(f"Saving time: {saving_time} seconds")
            print(f"Total time: {total_time} seconds")
        return 0
@app.command()
def infer(
    ct_file_path: str,
    pet_file_path: str,
    label: Optional[str] = None,
    save_path: Optional[str] = None,
    verbose: bool = False,
    model_paths: List[str] = typer.Argument(..., help="Paths to the model checkpoints"),
    sw_batch_size: int = 6,
    tta: bool = False,
    random_flips: int = 0,
):
    """Run ensemble inference on a single CT/PET pair and echo the result.

    Prints 0 on plain inference, or the metrics dict when a ground-truth label is supplied.
    """
    predictor = PredictModel(model_paths, sw_batch_size, tta, random_flips)
    outcome = predictor.run(ct_file_path, pet_file_path, label, save_path, verbose)
    typer.echo(outcome)
@app.command()
def evaluate(
    config: str = "config/test_predict.yml",
    sw_batch_size: int = 6,
    tta: bool = False,
    random_flips: int = 0,
    result_path: Optional[str] = "test/",
):
    """Predict every validation case of a config's split and log metrics to a results file."""
    cfg = OmegaConf.load(config)
    ckpt = cfg.model.ckpt_path
    model_paths = [ckpt] if isinstance(ckpt, str) else ckpt
    predictor = PredictModel(model_paths, sw_batch_size=sw_batch_size, tta=tta, random_flips=random_flips)
    results_parser = SimpleParser(os.path.join(result_path, "results_tta.json"))
    split = read_split(cfg.data.splits_file, cfg.data.fold)
    val_files = get_file_dict_nn(cfg.data.data_dir, split["val"], suffix=".nii.gz")
    for case in tqdm(val_files, desc="Predicting"):
        metrics = predictor.run(str(case["ct"]), str(case["pet"]), label=str(case["label"]), verbose=False)
        results_parser.write(case, metrics)
# Script entry point: dispatch to the `infer` or `evaluate` subcommand.
if __name__ == "__main__":
    app()
# example
# python predict.py infer "test/data/imagesTr/psma_95b833d46f153cd2_2017-11-18_0000.nii.gz"
# "test/data/imagesTr/psma_95b833d46f153cd2_2017-11-18_0001.nii.gz" --model-paths "test/epoch=581_fold0.ckpt"
# --save-path test/ --verbose