|
@@ -0,0 +1,134 @@
|
|
|
|
|
"""Inspect ensemble evaluation results stored in a NetCDF dataset.

Loads per-model predictions and labels, then prints: every image sorted by
ensemble confidence, overall and per-model accuracies, top-K ensemble
accuracies, and the most confidently incorrect predictions.
"""
import xarray as xr
import numpy as np
import sys
import os

sys.path.append(
    os.path.abspath(os.path.join(os.path.dirname(__file__), ".."))
)  # to allow imports from parent directory
from utils.config import config
import pathlib as pl

import colorama as clr

# Evaluation results file lives under the configured output directory.
model_dataset_path = pl.Path(config["output"]["path"]) / "model_evaluation_results.nc"
array = xr.open_dataset(model_dataset_path)  # type: ignore
|
|
|
|
|
+
|
|
|
|
|
+
|
|
|
|
|
# Per-model prediction scores and ground-truth labels from the dataset.
predictions: xr.DataArray = array["predictions"]
labels: xr.DataArray = array["labels"]

# Ensemble score: average the per-model predictions.
avg_predictions = predictions.mean(dim="model")

# Order images from highest to lowest ensemble confidence for the positive
# class (img_class=1); negating the scores makes argsort produce that order.
positive_confidence = avg_predictions.sel(img_class=1).values
sorted_indices = np.argsort(-positive_confidence)
sorted_avg_predictions = avg_predictions.isel(img_id=sorted_indices)
sorted_labels = labels.isel(img_id=sorted_indices)
|
|
|
|
|
+
|
|
|
|
|
# Print out all predictions with their labels
top_n = sorted_avg_predictions.sizes[
    "img_id"
]  # Change this value to print more or fewer
print(
    clr.Fore.CYAN
    + f"Top {top_n} Predictions (Confidence for Positive Class):"
    + clr.Style.RESET_ALL
)
# Hoisted out of the loop: the positive-class slice is loop-invariant.
sorted_positive = sorted_avg_predictions.sel(img_class=1)
for i in range(top_n):
    confidence = sorted_positive.isel(img_id=i).item()
    # Use .item() (not .values): a 0-d ndarray rejects alignment format
    # specs like "<3" on recent NumPy, and .item() matches how
    # `confidence` is extracted above.
    label = sorted_labels.isel(img_id=i, label=1).item()

    # Predicted positive iff confidence >= 0.5 (fixed threshold).
    correctness = (
        "CORRECT"
        if (confidence >= 0.5 and label == 1) or (confidence < 0.5 and label == 0)
        else "INCORRECT"
    )
    color = clr.Fore.GREEN if correctness == "CORRECT" else clr.Fore.RED
    print(
        f"Image ID: {sorted_avg_predictions.img_id.isel(img_id=i).item():<8}, "
        f"Confidence: {confidence:.4f}, "
        f"Label: {label:<3}, " + color + f"{correctness:<9}" + clr.Style.RESET_ALL
    )
|
|
|
|
|
+
|
|
|
|
|
+
|
|
|
|
|
# Calculate overall accuracy
# Binary decision at a fixed 0.5 threshold on the ensemble's positive-class
# score, compared against the positive (label=1) column of the labels.
predicted_positive = avg_predictions.sel(img_class=1) >= 0.5
true_positive = labels.sel(label=1) == 1
agreement = predicted_positive == true_positive
correct_predictions = agreement.sum().item()
total_predictions = len(avg_predictions.img_id)
# Guard against an empty dataset instead of dividing by zero.
if total_predictions > 0:
    overall_accuracy = correct_predictions / total_predictions
else:
    overall_accuracy = 0.0
print(
    clr.Fore.MAGENTA
    + f"\nOverall Accuracy (Threshold 0.5): {overall_accuracy:.4f}"
    + clr.Style.RESET_ALL
)
|
|
|
|
|
+
|
|
|
|
|
+
|
|
|
|
|
# Then go through all individual models and print out their accuracies for comparison, sorted from highest to lowest
model_accuracies = []
for model_idx in predictions.coords["model"].values:
    # Same 0.5 threshold as used for the ensemble above.
    model_positive = predictions.sel(model=model_idx).sel(img_class=1) >= 0.5
    n_correct = (model_positive == true_positive).sum().item()
    model_accuracies.append(
        (model_idx, n_correct / total_predictions if total_predictions > 0 else 0.0)
    )

# Sort by accuracy
model_accuracies.sort(key=lambda pair: pair[1], reverse=True)
print(
    clr.Fore.CYAN
    + "\nIndividual Model Accuracies (Threshold 0.5):"
    + clr.Style.RESET_ALL
)
for model_idx, accuracy in model_accuracies:
    print(f"Model {int(model_idx):<3}: Accuracy: {accuracy:.4f}")
|
|
|
|
|
+
|
|
|
|
|
+
|
|
|
|
|
# Then calculate the average accuracy if we were to ensemble the top K models, for K=1 to total number of models
total_models = len(predictions.coords["model"].values)
ensemble_accuracies = []
# model_accuracies is already sorted best-first, so a prefix of length k of
# this list is exactly the top-k models.
ranked_models = [model_id for model_id, _ in model_accuracies]
for k in range(1, total_models + 1):
    ensemble_preds = predictions.sel(model=ranked_models[:k]).mean(dim="model")
    ensemble_positive = ensemble_preds.sel(img_class=1) >= 0.5
    n_correct = (ensemble_positive == true_positive).sum().item()
    ensemble_accuracies.append(
        (k, n_correct / total_predictions if total_predictions > 0 else 0.0)
    )
print(
    clr.Fore.CYAN
    + "\nEnsemble Accuracies for Top K Models (Threshold 0.5):"
    + clr.Style.RESET_ALL
)
for k, accuracy in ensemble_accuracies:
    print(f"Top {k:<3} Models: Ensemble Accuracy: {accuracy:.4f}")
|
|
|
|
|
+
|
|
|
|
|
+
|
|
|
|
|
# Finally, identify the top 5 most confidently incorrect predictions
incorrect_predictions = []
# Hoisted out of the loop: the positive-class slice is loop-invariant.
positive_scores = avg_predictions.sel(img_class=1)
for i in range(len(avg_predictions.img_id)):
    confidence = positive_scores.isel(img_id=i).item()
    # Use .item() (not .values): a 0-d ndarray rejects alignment format
    # specs like "<3" in the f-string below on recent NumPy, and .item()
    # matches how `confidence` is extracted.
    label = labels.isel(img_id=i, label=1).item()
    predicted_label = 1 if confidence >= 0.5 else 0
    if predicted_label != label:
        incorrect_predictions.append((i, confidence, label))
# Sort by confidence, i.e. by distance of the score from the 0.5 threshold.
incorrect_predictions.sort(key=lambda x: -abs(x[1] - 0.5))
top_incorrect = incorrect_predictions[:5]
print(
    clr.Fore.YELLOW
    + "\nTop 5 Most Confident Incorrect Predictions:"
    + clr.Style.RESET_ALL
)
for i, confidence, label in top_incorrect:
    predicted_label = 1 if confidence >= 0.5 else 0
    print(
        f"Image ID: {avg_predictions.img_id.isel(img_id=i).item():<8}, "
        f"Confidence: {confidence:.4f}, "
        f"Predicted Label: {predicted_label:<3}, "
        f"True Label: {label:<3}"
    )
|