
Finished model training and evaluation

Nicholas Schense committed 4 days ago
Commit db8827e3fe
6 changed files with 216 additions and 45 deletions
  1. config.toml (+8 -8)
  2. data/dataset.py (+5 -1)
  3. evaluate_models.py (+128 -0)
  4. generate_statistics.py (+2 -0)
  5. train_model.py (+61 -26)
  6. utils/training.py (+12 -10)

+ 8 - 8
config.toml

@@ -1,7 +1,7 @@
 [data]
-mri_files_path = "/data/data_wnx1/_Data/AlzheimersDL/CNN+RNN-2class-1cnn+data/PET_volumes_customtemplate_float32/"
+mri_files_path = "../data/PET_volumes_customtemplate_float32/"
 xls_file_path = "LP_ADNIMERGE.csv"
-seed = 1
+seed = 42
 data_splits = [0.7, 0.2, 0.1] # train, validation, test
 image_channels = 1
 clin_data_channels = 2
@@ -9,12 +9,12 @@ num_classes = 2 # AD, NL
 
 
 [training]
-device = "cuda:1" # "cpu", "cuda", "mps"
+device = "cuda:0" # "cpu", "cuda", "mps"
 batch_size = 32
-ensemble_size = 5
-droprate = 0.1
-learning_rate = 0.001
-num_epochs = 10
+ensemble_size = 50
+droprate = 0.05
+learning_rate = 0.0001
+num_epochs = 30
 
 [output]
-path = "../models/5x10/"
+path = "../models/Full_Ensemble(50x30)/"

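utils/config.py itself is not part of this commit, so how config.toml reaches the scripts is not shown. Below is a minimal hypothetical sketch of such a loader, assuming Python 3.11+ (for the stdlib tomllib) and a config.toml at the repository root; neither assumption is confirmed by the diff.

# utils/config.py -- hypothetical sketch, not the module in this repository
import pathlib as pl
import tomllib  # stdlib TOML parser, Python 3.11+

# Load config.toml from the repository root into a plain dict so callers
# can do config["training"]["batch_size"], config["output"]["path"], etc.
_config_path = pl.Path(__file__).resolve().parent.parent / "config.toml"
with _config_path.open("rb") as f:
    config = tomllib.load(f)
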
+ 5 - 1
data/dataset.py

@@ -104,8 +104,12 @@ def load_adni_data_from_file(
 
         if "AD" in filename:
             file_expected_class = torch.tensor([1.0, 0.0])
-        elif "CN" in filename:
+        elif "NL" in filename:
             file_expected_class = torch.tensor([0.0, 1.0])
+        else:
+            raise ValueError(
+                f"Filename {filename} does not contain a valid class identifier (AD or NL)."
+            )
 
         mri_data_unstacked.append(file_mri_data)
         expected_classes_unstacked.append(file_expected_class)

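The new else branch makes the label mapping strict, matching the AD/NL naming noted in config.toml (num_classes = 2 # AD, NL): previously, a filename containing neither tag would silently reuse file_expected_class from the preceding loop iteration, or raise a NameError on the first file. Restated as a standalone helper (label_from_filename is a hypothetical name; the logic mirrors the hunk above):

import torch

def label_from_filename(filename: str) -> torch.Tensor:
    """Map a scan filename to a one-hot label: AD -> [1, 0], NL -> [0, 1]."""
    if "AD" in filename:
        return torch.tensor([1.0, 0.0])
    if "NL" in filename:
        return torch.tensor([0.0, 1.0])
    raise ValueError(
        f"Filename {filename} does not contain a valid class identifier (AD or NL)."
    )
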
+ 128 - 0
evaluate_models.py

@@ -0,0 +1,128 @@
+# This program evaluates every model on the combined validation and test set, then saves the results to a netcdf file.
+
+import torch
+import xarray as xr
+from torch.utils.data import DataLoader
+import numpy as np
+
+
+# Config
+from model.cnn import CNN3D
+from utils.config import config
+import pathlib as pl
+import pandas as pd
+import json
+
+
+# Custom modules
+from data.dataset import (
+    load_adni_data_from_file,
+    divide_dataset,
+    initalize_dataloaders,
+    ADNIDataset,
+)
+
+mri_files = pl.Path(config["data"]["mri_files_path"]).glob("*.nii")
+xls_file = pl.Path(config["data"]["xls_file_path"])
+
+
+def xls_pre(df: pd.DataFrame) -> pd.DataFrame:
+    """
+    Preprocess the Excel DataFrame.
+    This function can be customized to filter or modify the DataFrame as needed.
+    """
+
+    data = df[["Image Data ID", "Sex", "Age (current)"]]
+    data["Sex"] = data["Sex"].str.strip()  # type: ignore
+    data = data.replace({"M": 0, "F": 1})  # type: ignore
+    data = data.set_index("Image Data ID")  # type: ignore  # assign the result: set_index is not in-place
+
+    return data
+
+
+dataset = load_adni_data_from_file(
+    mri_files, xls_file, device=config["training"]["device"], xls_preprocessor=xls_pre
+)
+
+# Divide the dataset into training, validation, and test sets, using the same seed as in training
+with open(pl.Path(config["output"]["path"]) / "config.json") as f:
+    training_config = json.load(f)
+    try:
+        loaded_seed = int(training_config["data"]["seed"])
+    except (ValueError, KeyError) as e:
+        print(
+            f"Warning: No previous seed found for dataset division, using seed from config. Error: {e}"
+        )
+        loaded_seed = config["data"]["seed"]
+
+
+datasets = divide_dataset(dataset, config["data"]["data_splits"], seed=loaded_seed)
+
+
+# Initialize the dataloaders
+train_loader, val_loader, test_loader = initalize_dataloaders(
+    datasets, batch_size=config["training"]["batch_size"]
+)
+
+
+# Combine validation and test sets for final evaluation
+combined_loader: DataLoader[ADNIDataset] = torch.utils.data.DataLoader(
+    torch.utils.data.ConcatDataset([val_loader.dataset, test_loader.dataset]),
+    batch_size=1,
+    shuffle=False,
+)
+
+
+# 50 models are too large to load into memory at once, so we will load and evaluate them one at a time
+model_dir = pl.Path(config["output"]["path"])
+model_files = sorted(model_dir.glob("model_run_*.pt"))
+
+placeholder = np.zeros(
+    (len(model_files), len(combined_loader), config["data"]["num_classes"]),
+    dtype=np.float32,
+)  # Placeholder for results
+
+placeholder[:] = np.nan  # Fill with NaNs for easier identification of missing data
+dimensions = ["model", "batch", "img_class"]
+coords = {
+    "model": [int(mf.stem.split("_")[2]) for mf in model_files],
+    "batch": list(range(len(combined_loader))),
+    "img_class": list(range(config["data"]["num_classes"])),
+}
+
+results = xr.DataArray(placeholder, coords=coords, dims=dimensions)
+
+for model_file in model_files:
+    model_num = int(model_file.stem.split("_")[2])
+    print(f"Evaluating model {model_num}...")
+
+    # Load the model state
+    model = (
+        CNN3D(
+            image_channels=config["data"]["image_channels"],
+            clin_data_channels=config["data"]["clin_data_channels"],
+            num_classes=config["data"]["num_classes"],
+            droprate=config["training"]["droprate"],
+        )
+        .float()
+        .to(config["training"]["device"])
+    )
+
+    model.load_state_dict(
+        torch.load(model_file, map_location=config["training"]["device"]), strict=False
+    )
+    model.eval()
+
+    with torch.no_grad():
+        for batch_idx, (mri_batch, xls_batch, labels_batch) in enumerate(
+            combined_loader
+        ):
+            outputs = model((mri_batch.float(), xls_batch.float()))
+            probabilities = outputs.cpu().numpy()[0, :]  # type: ignore
+
+            results.loc[model_num, batch_idx, :] = probabilities  # type: ignore
+
+# Save results to netcdf file
+output_path = pl.Path(config["output"]["path"]) / "model_evaluation_results.nc"
+results.to_netcdf(output_path, mode="w")  # type: ignore
+print(f"Results saved to {output_path}")

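Because the results array is pre-filled with NaN, gaps left by a crashed or partially evaluated model remain detectable after the fact. A minimal sanity-check sketch, assuming the repo's utils.config and the file written above; the check itself is illustrative, not part of the commit:

import pathlib as pl
import xarray as xr
from utils.config import config

# Re-open the saved probabilities and flag any slots that were never written.
results = xr.open_dataarray(
    pl.Path(config["output"]["path"]) / "model_evaluation_results.nc"
)
missing = results.isnull().any(dim="img_class")  # True where a slot is still NaN
if missing.any():
    bad_models = results["model"].values[missing.any(dim="batch").values]
    print(f"Models with missing evaluations: {bad_models}")
else:
    print("All models fully evaluated.")
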
+ 2 - 0
generate_statistics.py

@@ -0,0 +1,2 @@
+import xarray as xr
+from utils.config import config

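generate_statistics.py is only an import stub so far. Purely as an illustration of where it could go, here is a sketch that ensemble-averages the probabilities saved by evaluate_models.py; the mean/std aggregation is an assumption about intent, not something this commit implements.

import pathlib as pl
import xarray as xr
from utils.config import config

# Aggregate per-model probabilities across the 50-member ensemble.
results = xr.open_dataarray(
    pl.Path(config["output"]["path"]) / "model_evaluation_results.nc"
)
mean_probs = results.mean(dim="model")          # average prediction per sample
std_probs = results.std(dim="model")            # disagreement across the ensemble
predicted = mean_probs.argmax(dim="img_class")  # 0 = AD, 1 = NL (per dataset.py)
print(predicted.values)
print(f"max ensemble std: {float(std_probs.max()):.4f}")
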
+ 61 - 26
train_model.py

@@ -3,11 +3,13 @@ import torch.nn as nn
 import torch
 import torch.optim as optim
 
+
 # Config
 from utils.config import config
 import pathlib as pl
 import pandas as pd
 import json
+import sqlite3 as sql
 
 
 # Custom modules
@@ -88,6 +90,12 @@ for run_num in range(config["training"]["ensemble_size"]):
         .to(config["training"]["device"])
     )
 
+    # Set up intermediate model directory
+    intermediate_model_dir = pl.Path(config["output"]["path"]) / "intermediate_models"
+    if not intermediate_model_dir.exists():
+        intermediate_model_dir.mkdir(parents=True, exist_ok=True)
+    print(f"Intermediate models will be saved to {intermediate_model_dir}")
+
     # Set up the optimizer and loss function
     optimizer = optim.Adam(model.parameters(), lr=config["training"]["learning_rate"])
     criterion = nn.BCELoss()
@@ -100,7 +108,7 @@ for run_num in range(config["training"]["ensemble_size"]):
         optimizer=optimizer,
         criterion=criterion,
         num_epochs=config["training"]["num_epochs"],
-        learning_rate=config["training"]["learning_rate"],
+        output_path=pl.Path(config["output"]["path"]),
     )
 
     # Test model
@@ -120,33 +128,60 @@ for run_num in range(config["training"]["ensemble_size"]):
     torch.save(model.state_dict(), model_save_path)
     print(f"Model saved to {model_save_path}")
 
-    # Save the training history
-    history_save_path = (
-        pl.Path(config["output"]["path"]) / f"history_run_{run_num + 1}.nc"
-    )
+    # Save test results and history by appending to the sql database
+    results_save_path = pl.Path(config["output"]["path"]) / "results.sqlite"
+    with sql.connect(results_save_path) as conn:
+        # Create results table if it doesn't exist
+        conn.execute(
+            """
+            CREATE TABLE IF NOT EXISTS results (
+                run INTEGER PRIMARY KEY,
+                test_loss REAL,
+                test_accuracy REAL
+            )
+            """
+        )
+        # Insert the results
+        conn.execute(
+            """
+            INSERT INTO results (run, test_loss, test_accuracy)
+            VALUES (?, ?, ?)
+            """,
+            (run_num + 1, test_loss, test_acc),
+        )
 
-    history.to_netcdf(history_save_path, mode="w")  # type: ignore
-    print(f"Training history saved to {history_save_path}")
-
-    # Save test results by appending to the results file
-    test_results_save_path = pl.Path(config["output"]["path"]) / f"results.json"
-    with open(test_results_save_path, "r+") as f:
-        try:
-            results = json.load(f)
-        except json.JSONDecodeError:
-            # If the file is empty or not a valid JSON, initialize an empty list
-            print("No previous results found, initializing results list.")
-            results = []
-
-        results.append(  # type: ignore
-            {
-                "run": run_num + 1,
-                "test_loss": test_loss,
-                "test_accuracy": test_acc,
-            }
+        # Create a new table for the run history
+        conn.execute(
+            f"""
+            CREATE TABLE IF NOT EXISTS history_run_{run_num + 1} (
+                epoch INTEGER PRIMARY KEY,
+                train_loss REAL,
+                val_loss REAL,
+                train_acc REAL,
+                val_acc REAL
+            )
+            """
         )
-        f.seek(0)
-        json.dump(results, f, indent=4)
+        # Insert the history
+        for epoch, row in history.iterrows():
+            values = (
+                epoch,
+                float(row["train_loss"]),
+                float(row["val_loss"]),
+                float(row["train_acc"]),
+                float(row["val_acc"]),
+            )
+
+            conn.execute(
+                f"""
+                INSERT INTO history_run_{run_num + 1} (epoch, train_loss, val_loss, train_acc, val_acc)
+                VALUES (?, ?, ?, ?, ?)
+                """,
+                values,  # type: ignore
+            )
+
+        conn.commit()
+    print(f"Results and history saved to {results_save_path}")
     print(f"Run {run_num + 1}/{config['training']['ensemble_size']} completed\n")
 
 # Completion message

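The schema above makes the metrics straightforward to query back out, and unlike the old read-modify-write JSON file, each INSERT is transactional and the run PRIMARY KEY rejects accidental duplicate run numbers. A minimal read-back sketch using pandas; table and column names come from the CREATE statements above, and the bare results.sqlite path is shortened for illustration (the script writes it under the configured output path):

import sqlite3 as sql
import pandas as pd

# Read the per-run test metrics and one run's epoch-by-epoch history.
with sql.connect("results.sqlite") as conn:
    runs = pd.read_sql("SELECT run, test_loss, test_accuracy FROM results", conn)
    history_1 = pd.read_sql("SELECT * FROM history_run_1 ORDER BY epoch", conn)

print(runs.sort_values("test_accuracy", ascending=False).head())
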
+ 12 - 10
utils/training.py

@@ -6,6 +6,8 @@ from data.dataset import ADNIDataset
 from typing import Tuple
 from tqdm import tqdm
 import numpy as np
+import pathlib as pl
+import pandas as pd
 
 type TrainMetrics = Tuple[
     float, float, float, float
@@ -122,8 +124,8 @@ def train_model(
     optimizer: torch.optim.Optimizer,
     criterion: nn.Module,
     num_epochs: int,
-    learning_rate: float,
-) -> Tuple[nn.Module, xr.DataArray]:
+    output_path: pl.Path,
+) -> Tuple[nn.Module, pd.DataFrame]:
     """
     Trains the model using the provided training and validation data loaders.
 
@@ -168,18 +170,18 @@ def train_model(
         # If we are at 25, 50, or 75% of the epochs, save the model
         if num_epochs > 4:
             if (epoch + 1) % (num_epochs // 4) == 0:
-                torch.save(model.state_dict(), f"model_epoch_{epoch + 1}.pth")
+                model_save_path = (
+                    output_path / "intermediate_models" / f"model_epoch_{epoch + 1}.pt"
+                )
+                torch.save(model.state_dict(), model_save_path)
                 print(f"Model saved at epoch {epoch + 1}")
 
     # return the trained model and the training history
 
-    history = xr.DataArray(
-        data=nhist,
-        dims=["epoch", "metric"],
-        coords={
-            "epoch": range(num_epochs),
-            "metric": ["train_loss", "val_loss", "train_acc", "val_acc"],
-        },
+    history = pd.DataFrame(
+        data=nhist.astype(np.float32),
+        columns=["train_loss", "val_loss", "train_acc", "val_acc"],
+        index=np.arange(1, num_epochs + 1),
     )
 
     return model, history
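
train_model now returns a plain DataFrame indexed by epoch (1..num_epochs) instead of an xarray DataArray, which makes quick diagnostic plots trivial. A self-contained sketch with stand-in data, assuming matplotlib is installed (it is not imported anywhere in this commit):

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt

# Stand-in for the DataFrame train_model now returns (index = epoch 1..30).
rng = np.random.default_rng(42)
history = pd.DataFrame(
    rng.random((30, 4)).astype(np.float32),
    columns=["train_loss", "val_loss", "train_acc", "val_acc"],
    index=np.arange(1, 31),
)

fig, (ax_loss, ax_acc) = plt.subplots(1, 2, figsize=(10, 4))
history[["train_loss", "val_loss"]].plot(ax=ax_loss, title="BCE loss")
history[["train_acc", "val_acc"]].plot(ax=ax_acc, title="Accuracy")
ax_loss.set_xlabel("epoch")
ax_acc.set_xlabel("epoch")
plt.tight_layout()
plt.show()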