diff --git a/fetus-event-detection-classification/experiments.json b/fetus-event-detection-classification/experiments.json
new file mode 100644
index 0000000..d3defc4
--- /dev/null
+++ b/fetus-event-detection-classification/experiments.json
@@ -0,0 +1,74 @@
+[
+    {
+        "name": "all_dataset_k1",
+        "k_fold": 1,
+        "dataset_type": "all",
+        "oversampling": false,
+        "undersampling": false,
+        "epochs": 50,
+        "path": "~/Documents/womb-wise-data"
+    },
+    {
+        "name": "fetus_dataset_k1",
+        "k_fold": 1,
+        "dataset_type": "fetus",
+        "oversampling": false,
+        "undersampling": false,
+        "epochs": 50,
+        "path": "~/Documents/womb-wise-data"
+    },
+    {
+        "name": "mother_dataset_k1",
+        "k_fold": 1,
+        "dataset_type": "mother",
+        "oversampling": false,
+        "undersampling": false,
+        "epochs": 50,
+        "path": "~/Documents/womb-wise-data"
+    },
+    {
+        "name": "fetus_mother_dataset_k1",
+        "k_fold": 1,
+        "dataset_type": "fetus-mother",
+        "oversampling": false,
+        "undersampling": false,
+        "epochs": 50,
+        "path": "~/Documents/womb-wise-data"
+    },
+    {
+        "name": "mother_fetus_dataset_k1",
+        "k_fold": 1,
+        "dataset_type": "mother-fetus",
+        "oversampling": false,
+        "undersampling": false,
+        "epochs": 50,
+        "path": "~/Documents/womb-wise-data"
+    },
+    {
+        "name": "all_dataset_k5",
+        "k_fold": 5,
+        "dataset_type": "all",
+        "oversampling": false,
+        "undersampling": false,
+        "epochs": 50,
+        "path": "~/Documents/womb-wise-data"
+    },
+    {
+        "name": "fetus_dataset_k5",
+        "k_fold": 5,
+        "dataset_type": "fetus",
+        "oversampling": false,
+        "undersampling": false,
+        "epochs": 50,
+        "path": "~/Documents/womb-wise-data"
+    },
+    {
+        "name": "mother_dataset_k5",
+        "k_fold": 5,
+        "dataset_type": "mother",
+        "oversampling": false,
+        "undersampling": false,
+        "epochs": 50,
+        "path": "~/Documents/womb-wise-data"
+    }
+]
\ No newline at end of file
diff --git a/fetus-event-detection-classification/src/experiments.py b/fetus-event-detection-classification/src/experiments.py
new file mode 100644
index 0000000..ba42ecd
--- /dev/null
+++ b/fetus-event-detection-classification/src/experiments.py
@@ -0,0 +1,83 @@
+import json
+import os
+
+
+def create_experiments(experiments_path, base_path):
+    if os.path.exists(experiments_path):
+        with open(experiments_path, "r") as f:
+            return json.load(f)
+
+    experiments = [
+        {
+            "name": "all_dataset_k1",
+            "k_fold": 1,
+            "dataset_type": "all",
+            "oversampling": False,
+            "undersampling": False,
+            "epochs": 50,
+        },
+        {
+            "name": "fetus_dataset_k1",
+            "k_fold": 1,
+            "dataset_type": "fetus",
+            "oversampling": False,
+            "undersampling": False,
+            "epochs": 50,
+        },
+        {
+            "name": "mother_dataset_k1",
+            "k_fold": 1,
+            "dataset_type": "mother",
+            "oversampling": False,
+            "undersampling": False,
+            "epochs": 50,
+        },
+        {
+            "name": "fetus_mother_dataset_k1",
+            "k_fold": 1,
+            "dataset_type": "fetus-mother",
+            "oversampling": False,
+            "undersampling": False,
+            "epochs": 50,
+        },
+        {
+            "name": "mother_fetus_dataset_k1",
+            "k_fold": 1,
+            "dataset_type": "mother-fetus",
+            "oversampling": False,
+            "undersampling": False,
+            "epochs": 50,
+        },
+        {
+            "name": "all_dataset_k5",
+            "k_fold": 5,
+            "dataset_type": "all",
+            "oversampling": False,
+            "undersampling": False,
+            "epochs": 50,
+        },
+        {
+            "name": "fetus_dataset_k5",
+            "k_fold": 5,
+            "dataset_type": "fetus",
+            "oversampling": False,
+            "undersampling": False,
+            "epochs": 50,
+        },
+        {
+            "name": "mother_dataset_k5",
+            "k_fold": 5,
+            "dataset_type": "mother",
+            "oversampling": False,
+            "undersampling": False,
+            "epochs": 50,
+        },
+    ]
+
+    for experiment in experiments:
+        experiment["path"] = base_path
+
+    with open(experiments_path, "w") as f:
+        json.dump(experiments, f, indent=4)
+
+    return experiments
diff --git a/fetus-event-detection-classification/src/main.py b/fetus-event-detection-classification/src/main.py
index cc0c968..259ccfd 100755
--- a/fetus-event-detection-classification/src/main.py
+++ b/fetus-event-detection-classification/src/main.py
@@ -9,18 +9,17 @@ import torch.nn as nn
 import torch.optim as optim
 from torch.utils.data import Dataset, DataLoader
 import seaborn as sns
-import argparse
 from imblearn.over_sampling import RandomOverSampler
 from imblearn.under_sampling import RandomUnderSampler
 from collections import Counter
 from sklearn.model_selection import StratifiedKFold
 from sklearn.model_selection import train_test_split
-from datetime import datetime
 
 from load_dataset import get_dataset
 from model import SimpleLSTM
 from training import training_loop
 from validation import validation
+from experiments import create_experiments
 
 warnings.simplefilter(action="ignore", category=FutureWarning)
@@ -53,8 +52,6 @@ def setup_model_training(
         optimizer, mode="min", factor=0.1, patience=25
     )
 
-    # criterion = nn.CrossEntropyLoss()
-    # criterion = nn.BCELoss()
     criterion = nn.BCEWithLogitsLoss()
 
     return (model, optimizer, scheduler, criterion)
@@ -161,112 +158,31 @@ class FetusDataset(Dataset):
         x = self.data[idx]["data"]
         y = self.data[idx]["label"]
 
-        # Conversione del tipo di dato
         x = x.astype(np.float32)
         y = np.eye(self.classes)[y]
 
-        # Conversione in tensori
         x = torch.tensor(x, dtype=torch.float32)
         y = torch.tensor(y, dtype=torch.int32)
 
-        # Gestione di valori NaN o infiniti
         x = torch.nan_to_num(
             x
-        )  # Sostituisce NaN con 0 e valori infiniti con numeri molto grandi o piccoli
+        )
 
-        # Normalizzazione solo durante il training
        if self.train:
             mean = x.mean()
             std = x.std()
 
-            # Normalizzazione condizionale (solo se std > 0)
             if std > 0:
                 x = (x - mean) / std
 
         return x, y
 
 
-def createArgParser():
-    parser = argparse.ArgumentParser(description="Womb Wise")
-    parser.add_argument(
-        "-rd",
-        "--reload-dataset",
-        action="store_true",
-        help="Reload the dataset",
-    )
-
-    # path to the dataset
-    parser.add_argument(
-        "-p",
-        "--path",
-        action="store",
-        help="Path to the dataset",
-        default="~/Documents/womb-wise-data",
-    )
-
-    # epoch
-    parser.add_argument(
-        "-e",
-        "--epochs",
-        action="store",
-        help="Number of epochs",
-        default=10,
-    )
-
-    parser.add_argument(
-        "-k",
-        "--kfold",
-        action="store",
-        help="Number of folds for kfold cross validation",
-        default=1,
-    )
-
-    parser.add_argument(
-        "-o",
-        "--oversampling",
-        action="store_true",
-        help="Apply oversampling",
-    )
-
-    parser.add_argument(
-        "-u",
-        "--undersampling",
-        action="store_true",
-        help="Apply undersampling",
-    )
-
-    parser.add_argument(
-        "-d",
-        "--dataset",
-        action="store",
-        default="all",
-        choices=["all", "fetus", "mother", "fetus-mother", "mother-fetus"],
-        help="Choose the dataset: all, fetus, mother or train with mother and test with fetus or viceversa",
-    )
-
-    args = parser.parse_args()
-
-    print(
-        f"""
-        ARGS:
-        \n
-        reload-dataset: {args.reload_dataset}
-        path: {args.path}
-        epochs: {args.epochs}
-        kfold: {args.kfold}
-        oversampling: {args.oversampling}
-        undersampling: {args.undersampling}
-        dataset: {args.dataset}
-        """
-    )
-    return args
-
-
 if __name__ == "__main__":
+    BASE_PATH = "~/Documents/womb-wise-data"
     CLASSES = ["baseline", "opcl", "yawn"]
     FEATURE_SIZE = 10
     SERIES_LENGTH = 60
-    # SINGLE_FRAME_LENGTH = FEATURE_SIZE * SERIES_LENGTH
     BATCH_SIZE = 4
     WEIGHT_DECAY = 1e-5
     LEARNING_RATE = 1e-3
@@ -275,29 +191,8 @@ if __name__ == "__main__":
     DROP_OUT = 0.0
     NUM_LAYERS = 2
     EPS = 1e-7
+    EARLY_STOPPING = True
 
-    TEST_NAME = "0_k1_all"
-    # TEST_NAME = "1_k1_fetus"
-    # TEST_NAME = "2_k1_mother"
-    # TEST_NAME = "3_k1_mother_fetus"
-    # TEST_NAME = "4_k1_fetus_mother"
-    # TEST_NAME = "5_k5_all"
-    # TEST_NAME = "6_k5_fetus"
-    # TEST_NAME = "7_k5_mother"
-
-    if not os.path.exists("output/" + TEST_NAME):
-        os.makedirs("output/" + TEST_NAME)
-
-    if not os.path.exists("output/" + TEST_NAME + "/weights"):
-        os.makedirs("output/" + TEST_NAME + "/weights")
-
-    if not os.path.exists("output/" + TEST_NAME + "/confusion_matrix"):
-        os.makedirs("output/" + TEST_NAME + "/confusion_matrix")
-
-    if not os.path.exists("output/" + TEST_NAME + "/metrics"):
-        os.makedirs("output/" + TEST_NAME + "/metrics")
-
-    # fix the seed
     seed = 42
     np.random.seed(seed)
     torch.manual_seed(seed)
@@ -305,392 +200,198 @@ if __name__ == "__main__":
     torch.cuda.manual_seed_all(seed)
 
     device = get_device()
-    args = createArgParser()
-    PATH = args.path
-    EPOCHS = int(args.epochs)
-    K_FOLD = int(args.kfold)
-    OVER_SAMPLING = args.oversampling
-    UNDER_SAMPLING = args.undersampling
-    EARLY_STOPPING = True
-    DATASET_TYPE = args.dataset
+    experiments = create_experiments("experiments.json", BASE_PATH)
+    for experiment in experiments:
+        TEST_NAME = experiment["name"]
+        K_FOLD = experiment["k_fold"]
+        OVER_SAMPLING = experiment["oversampling"]
+        UNDER_SAMPLING = experiment["undersampling"]
+        DATASET_TYPE = experiment["dataset_type"]
+        EPOCHS = experiment["epochs"]
+        PATH = experiment["path"]
+        print(f"Running experiment: {TEST_NAME}")
 
-    if os.path.exists("dataset.csv") and args.reload_dataset is False:
-        dataset = pd.read_csv("dataset.csv")
-        mother = pd.read_csv("mother.csv")
-        fetus = pd.read_csv("fetus.csv")
-    else:
-        baseline_fetus = get_dataset(
-            PATH +"/Ultrasound_Scans/tracked_frames/",
-            "baseline",
-        )
-        yawn_fetus = get_dataset(
-            PATH + "/Ultrasound_Scans/tracked_frames/",
-            "yawn",
-        )
-        opcl_fetus = get_dataset(
-            PATH + "/Ultrasound_Scans/tracked_frames/",
-            "opcl",
-        )
+        if not os.path.exists("output/" + TEST_NAME):
+            os.makedirs("output/" + TEST_NAME)
 
-        fetus = pd.concat([baseline_fetus, yawn_fetus, opcl_fetus])
+        if not os.path.exists("output/" + TEST_NAME + "/weights"):
+            os.makedirs("output/" + TEST_NAME + "/weights")
 
-        baseline_mother = get_dataset(
-            PATH + "/Mothers_videos/Tracked/",
-            "baseline",
-        )
-        yawn_mother = get_dataset(
-            PATH + "/Mothers_videos/Tracked/",
-            "yawn",
-        )
-        opcl_mother = get_dataset(
-            PATH + "/Mothers_videos/Tracked/",
-            "opcl",
-        )
+        if not os.path.exists("output/" + TEST_NAME + "/confusion_matrix"):
+            os.makedirs("output/" + TEST_NAME + "/confusion_matrix")
 
-        mother = pd.concat([baseline_mother, yawn_mother, opcl_mother])
-        fetus["type"] = "fetus"
-        mother["type"] = "mother"
-
-        fetus.to_csv("fetus.csv")
-        mother.to_csv("mother.csv")
-
-        dataset = pd.concat([mother, fetus])
-        dataset.to_csv("dataset.csv")
-
-
-
-    mother = mother.drop(columns=["top_bottom_distance"])
-    fetus = fetus.drop(columns=["top_bottom_distance"])
-    dataset = dataset.drop(columns=["top_bottom_distance"])
-    grouped_dataset = dataset.groupby(["label", "frame", "test", "type"])
-    grouped_mother = mother.groupby(["label", "frame", "test"])
-    grouped_fetus = fetus.groupby(["label", "frame", "test"])
-
-    data: List[Dict[np.ndarray, int]] = []
-    mother_data: List[Dict[np.ndarray, int]] = []
-    fetus_data: List[Dict[np.ndarray, int]] = []
-
-    for name, group in grouped_mother:
-        label = group["label"]
-        frame = group["frame"]
group["frame"] - test = group["test"] - - group = group.drop(columns=["test", "frame", "label", "type"]) - - group.set_index("image_name", inplace=True) - - if group.columns[0] == "Unnamed: 0": - group = group.drop(columns=["Unnamed: 0"]) - - group = group.to_numpy() - - if group.shape[0] < SERIES_LENGTH: - group = np.vstack( - [group, np.zeros((SERIES_LENGTH - group.shape[0], FEATURE_SIZE))] - ) - - elif group.shape[0] > SERIES_LENGTH: - group = group[:SERIES_LENGTH] - - group = group.astype(np.float32) - - label = CLASSES.index(label.iat[0]) - mother_data.append( - { - "data": group, - "label": label, - } - ) - - for name, group in grouped_fetus: - label = group["label"] - frame = group["frame"] - test = group["test"] - - group = group.drop(columns=["test", "frame", "label", "type"]) - - group.set_index("image_name", inplace=True) - - if group.columns[0] == "Unnamed: 0": - group = group.drop(columns=["Unnamed: 0"]) - - group = group.to_numpy() - - if group.shape[0] < SERIES_LENGTH: - group = np.vstack( - [group, np.zeros((SERIES_LENGTH - group.shape[0], FEATURE_SIZE))] - ) - - elif group.shape[0] > SERIES_LENGTH: - group = group[:SERIES_LENGTH] - - group = group.astype(np.float32) - - label = CLASSES.index(label.iat[0]) - fetus_data.append( - { - "data": group, - "label": label, - } - ) - - for name, group in grouped_dataset: - label = group["label"] - frame = group["frame"] - test = group["test"] - data_type = group["type"] - - group = group.drop(columns=["test", "frame", "label", "type"]) - - group.set_index("image_name", inplace=True) - - if group.columns[0] == "Unnamed: 0": - group = group.drop(columns=["Unnamed: 0"]) - - group = group.to_numpy() - - if group.shape[0] < SERIES_LENGTH: - group = np.vstack( - [group, np.zeros((SERIES_LENGTH - group.shape[0], FEATURE_SIZE))] - ) - - elif group.shape[0] > SERIES_LENGTH: - group = group[:SERIES_LENGTH] - - group = group.astype(np.float32) - - label = CLASSES.index(label.iat[0]) - data.append( - { - "data": group, - "label": label, - } - ) - - if K_FOLD == 1: - - x_all = [d["data"] for d in data] - y_all = [d["label"] for d in data] - - x_mother = [d["data"] for d in mother_data] - y_mother = [d["label"] for d in mother_data] - - x_fetus = [d["data"] for d in fetus_data] - y_fetus = [d["label"] for d in fetus_data] - - (train_loader_all, test_loader_all) = create_loaders( - x_all, - y_all, - data, - over=OVER_SAMPLING, - under=UNDER_SAMPLING, - classes=CLASSES, - batch_size=BATCH_SIZE, - ) - - (train_loader_mother, test_loader_mother) = create_loaders( - x_mother, - y_mother, - mother_data, - over=OVER_SAMPLING, - under=UNDER_SAMPLING, - classes=CLASSES, - batch_size=BATCH_SIZE, - ) - - (train_loader_fetus, test_loader_fetus) = create_loaders( - x_fetus, - y_fetus, - fetus_data, - over=OVER_SAMPLING, - under=UNDER_SAMPLING, - classes=CLASSES, - batch_size=BATCH_SIZE, - ) - - (model, optimizer, scheduler, criterion) = setup_model_training( - input_size=FEATURE_SIZE, - hidden_size=HIDDEN_SIZE, - num_layers=NUM_LAYERS, - num_classes=len(CLASSES), - sequence_length=SERIES_LENGTH, - device=device, - lr=LEARNING_RATE, - weight_decay=WEIGHT_DECAY, - eps=EPS, - ) - - if DATASET_TYPE == "all": - train_loader = train_loader_all - test_loader = test_loader_all - - elif DATASET_TYPE == "fetus": - train_loader = train_loader_fetus - test_loader = test_loader_fetus - - elif DATASET_TYPE == "mother": - train_loader = train_loader_mother - test_loader = test_loader_mother - - elif DATASET_TYPE == "fetus-mother": - train_loader = train_loader_fetus - 
-
-        elif DATASET_TYPE == "mother-fetus":
-            train_loader = train_loader_mother
-            test_loader = test_loader_fetus
+        if not os.path.exists("output/" + TEST_NAME + "/metrics"):
+            os.makedirs("output/" + TEST_NAME + "/metrics")
 
+        if os.path.exists("dataset.csv") and os.path.exists("mother.csv") and os.path.exists("fetus.csv"):
+            dataset = pd.read_csv("dataset.csv")
+            mother = pd.read_csv("mother.csv")
+            fetus = pd.read_csv("fetus.csv")
         else:
-            Exception("Invalid dataset type")
+            baseline_fetus = get_dataset(
+                PATH + "/Ultrasound_Scans/tracked_frames/",
+                "baseline",
+            )
+            yawn_fetus = get_dataset(
+                PATH + "/Ultrasound_Scans/tracked_frames/",
+                "yawn",
+            )
+            opcl_fetus = get_dataset(
+                PATH + "/Ultrasound_Scans/tracked_frames/",
+                "opcl",
+            )
 
-        trained_model = training_loop(
-            model=model,
-            train_loader=train_loader,
-            test_loader=test_loader,
-            optimizer=optimizer,
-            scheduler=scheduler,
-            criterion=criterion,
-            device=device,
-            epochs=EPOCHS,
-            early_stopping=EARLY_STOPPING,
-            log_dir="output/" + TEST_NAME + "/metrics",
-        )
+            fetus = pd.concat([baseline_fetus, yawn_fetus, opcl_fetus])
 
-        loss, conf_matrix, classification_rep = validation(
-            trained_model,
-            test_loader,
-            criterion,
-            device,
-        )
+            baseline_mother = get_dataset(
+                PATH + "/Mothers_videos/Tracked/",
+                "baseline",
+            )
+            yawn_mother = get_dataset(
+                PATH + "/Mothers_videos/Tracked/",
+                "yawn",
+            )
+            opcl_mother = get_dataset(
+                PATH + "/Mothers_videos/Tracked/",
+                "opcl",
+            )
 
-        # save classification report to a file
-        df = pd.DataFrame(classification_rep).transpose()
-        df.to_csv("output/" + TEST_NAME + "/metrics/classification_report.csv")
+            mother = pd.concat([baseline_mother, yawn_mother, opcl_mother])
+            fetus["type"] = "fetus"
+            mother["type"] = "mother"
 
-        torch.save(
-            trained_model.state_dict(),
-            "output/" + TEST_NAME + "/weights/model.pth",
-        )
+            fetus.to_csv("fetus.csv")
+            mother.to_csv("mother.csv")
 
-        plt.figure(figsize=(19.20, 10.80))
-        plt.title("Confusion Matrix")
-        sns.heatmap(
-            conf_matrix,
-            annot=True,
-            fmt=".2f",
-            xticklabels=["Baseline", "Opcl", "Yawn"],
-            yticklabels=["Baseline", "Opcl", "Yawn"],
-            cmap="viridis",
-        )
+            dataset = pd.concat([mother, fetus])
+            dataset.to_csv("dataset.csv")
 
-        plt.xlabel("Predicted")
-        plt.ylabel("Actual")
+        mother = mother.drop(columns=["top_bottom_distance"])
+        fetus = fetus.drop(columns=["top_bottom_distance"])
+        dataset = dataset.drop(columns=["top_bottom_distance"])
+        grouped_dataset = dataset.groupby(["label", "frame", "test", "type"])
+        grouped_mother = mother.groupby(["label", "frame", "test"])
+        grouped_fetus = fetus.groupby(["label", "frame", "test"])
 
-        plt.savefig("output/" + TEST_NAME + "/confusion_matrix/confusion_matrix.png")
+        data: List[Dict[np.ndarray, int]] = []
+        mother_data: List[Dict[np.ndarray, int]] = []
+        fetus_data: List[Dict[np.ndarray, int]] = []
 
-        plt.figure(figsize=(19.20, 10.80))
-        plt.title("Confusion Matrix Percentage")
-        conf_matrix_percent = conf_matrix.astype('float') / conf_matrix.sum(axis=1)[:, np.newaxis] * 100
-        sns.heatmap(
-            conf_matrix_percent,
-            annot=True,
-            fmt=".2f",
-            xticklabels=["Baseline", "Opcl", "Yawn"],
-            yticklabels=["Baseline", "Opcl", "Yawn"],
-            cmap="viridis",
-        )
+        for name, group in grouped_mother:
+            label = group["label"]
+            frame = group["frame"]
+            test = group["test"]
 
-        plt.xlabel("Predicted")
-        plt.ylabel("Actual")
+            group = group.drop(columns=["test", "frame", "label", "type"])
 
-        plt.savefig("output/" + TEST_NAME + "/confusion_matrix/confusion_matrix_percentage.png")
+            group.set_index("image_name", inplace=True)
-    else:
-        x_all = [d["data"] for d in data]
-        y_all = [d["label"] for d in data]
+            if group.columns[0] == "Unnamed: 0":
+                group = group.drop(columns=["Unnamed: 0"])
 
-        x_mother = [d["data"] for d in mother_data]
-        y_mother = [d["label"] for d in mother_data]
+            group = group.to_numpy()
 
-        x_fetus = [d["data"] for d in fetus_data]
-        y_fetus = [d["label"] for d in fetus_data]
+            if group.shape[0] < SERIES_LENGTH:
+                group = np.vstack(
+                    [group, np.zeros(
+                        (SERIES_LENGTH - group.shape[0], FEATURE_SIZE))]
+                )
 
-        (train_loader_all, test_loader_all) = create_loaders(
-            x_all,
-            y_all,
-            data,
-            over=OVER_SAMPLING,
-            under=UNDER_SAMPLING,
-            classes=CLASSES,
-            batch_size=BATCH_SIZE,
-        )
+            elif group.shape[0] > SERIES_LENGTH:
+                group = group[:SERIES_LENGTH]
 
-        (train_loader_mother, test_loader_mother) = create_loaders(
-            x_mother,
-            y_mother,
-            mother_data,
-            over=OVER_SAMPLING,
-            under=UNDER_SAMPLING,
-            classes=CLASSES,
-            batch_size=BATCH_SIZE,
-        )
+            group = group.astype(np.float32)
 
-        (train_loader_fetus, test_loader_fetus) = create_loaders(
-            x_fetus,
-            y_fetus,
-            fetus_data,
-            over=OVER_SAMPLING,
-            under=UNDER_SAMPLING,
-            classes=CLASSES,
-            batch_size=BATCH_SIZE,
-        )
+            label = CLASSES.index(label.iat[0])
+            mother_data.append(
+                {
+                    "data": group,
+                    "label": label,
+                }
+            )
 
-        (model, optimizer, scheduler, criterion) = setup_model_training(
-            input_size=FEATURE_SIZE,
-            hidden_size=HIDDEN_SIZE,
-            num_layers=NUM_LAYERS,
-            num_classes=len(CLASSES),
-            sequence_length=SERIES_LENGTH,
-            device=device,
-            lr=LEARNING_RATE,
-            weight_decay=WEIGHT_DECAY,
-            eps=EPS,
-        )
+        for name, group in grouped_fetus:
+            label = group["label"]
+            frame = group["frame"]
+            test = group["test"]
 
-        kf = StratifiedKFold(n_splits=K_FOLD, shuffle=True, random_state=seed)
-        model_index = 0
+            group = group.drop(columns=["test", "frame", "label", "type"])
 
-        x = None
-        y = None
+            group.set_index("image_name", inplace=True)
 
-        if DATASET_TYPE == "all":
-            x = [d["data"] for d in data]
-            y = [d["label"] for d in data]
-        elif DATASET_TYPE == "fetus":
-            x = [d["data"] for d in fetus_data]
-            y = [d["label"] for d in fetus_data]
-        elif DATASET_TYPE == "mother":
-            x = [d["data"] for d in mother_data]
-            y = [d["label"] for d in mother_data]
+            if group.columns[0] == "Unnamed: 0":
+                group = group.drop(columns=["Unnamed: 0"])
 
-        # TODO: HOW TO HANDLE THIS CASES? for the mixed training and validation
-        else:
-            Exception("Invalid dataset type")
-
-        for train_index, test_index in kf.split(X=x, y=y):
-            train_data = [data[i] for i in train_index]
-            test_data = [data[i] for i in test_index]
-
-            data = train_data + test_data
-
-            x = [d["data"] for d in train_data]
-            y = [d["label"] for d in train_data]
-
-            (train_loader, test_loader) = create_loaders(
-                x,
-                y,
+            group = group.to_numpy()
+
+            if group.shape[0] < SERIES_LENGTH:
+                group = np.vstack(
+                    [group, np.zeros(
+                        (SERIES_LENGTH - group.shape[0], FEATURE_SIZE))]
+                )
+
+            elif group.shape[0] > SERIES_LENGTH:
+                group = group[:SERIES_LENGTH]
+
+            group = group.astype(np.float32)
+
+            label = CLASSES.index(label.iat[0])
+            fetus_data.append(
+                {
+                    "data": group,
+                    "label": label,
+                }
+            )
+
+        for name, group in grouped_dataset:
+            label = group["label"]
+            frame = group["frame"]
+            test = group["test"]
+            data_type = group["type"]
+
+            group = group.drop(columns=["test", "frame", "label", "type"])
+
+            group.set_index("image_name", inplace=True)
+
+            if group.columns[0] == "Unnamed: 0":
+                group = group.drop(columns=["Unnamed: 0"])
+
+            group = group.to_numpy()
+
+            if group.shape[0] < SERIES_LENGTH:
+                group = np.vstack(
+                    [group, np.zeros(
+                        (SERIES_LENGTH - group.shape[0], FEATURE_SIZE))]
+                )
+
+            elif group.shape[0] > SERIES_LENGTH:
+                group = group[:SERIES_LENGTH]
+
+            group = group.astype(np.float32)
+
+            label = CLASSES.index(label.iat[0])
+            data.append(
+                {
+                    "data": group,
+                    "label": label,
+                }
+            )
+
+        if K_FOLD == 1:
+            x_all = [d["data"] for d in data]
+            y_all = [d["label"] for d in data]
+
+            x_mother = [d["data"] for d in mother_data]
+            y_mother = [d["label"] for d in mother_data]
+
+            x_fetus = [d["data"] for d in fetus_data]
+            y_fetus = [d["label"] for d in fetus_data]
+
+            (train_loader_all, test_loader_all) = create_loaders(
+                x_all,
+                y_all,
                 data,
                 over=OVER_SAMPLING,
                 under=UNDER_SAMPLING,
@@ -698,6 +399,26 @@ if __name__ == "__main__":
                 classes=CLASSES,
                 batch_size=BATCH_SIZE,
             )
 
+            (train_loader_mother, test_loader_mother) = create_loaders(
+                x_mother,
+                y_mother,
+                mother_data,
+                over=OVER_SAMPLING,
+                under=UNDER_SAMPLING,
+                classes=CLASSES,
+                batch_size=BATCH_SIZE,
+            )
+
+            (train_loader_fetus, test_loader_fetus) = create_loaders(
+                x_fetus,
+                y_fetus,
+                fetus_data,
+                over=OVER_SAMPLING,
+                under=UNDER_SAMPLING,
+                classes=CLASSES,
+                batch_size=BATCH_SIZE,
+            )
+
             (model, optimizer, scheduler, criterion) = setup_model_training(
                 input_size=FEATURE_SIZE,
                 hidden_size=HIDDEN_SIZE,
@@ -710,6 +431,29 @@ if __name__ == "__main__":
                 eps=EPS,
             )
 
+            if DATASET_TYPE == "all":
+                train_loader = train_loader_all
+                test_loader = test_loader_all
+
+            elif DATASET_TYPE == "fetus":
+                train_loader = train_loader_fetus
+                test_loader = test_loader_fetus
+
+            elif DATASET_TYPE == "mother":
+                train_loader = train_loader_mother
+                test_loader = test_loader_mother
+
+            elif DATASET_TYPE == "fetus-mother":
+                train_loader = train_loader_fetus
+                test_loader = test_loader_mother
+
+            elif DATASET_TYPE == "mother-fetus":
+                train_loader = train_loader_mother
+                test_loader = test_loader_fetus
+
+            else:
+                Exception("Invalid dataset type")
+
             trained_model = training_loop(
                 model=model,
                 train_loader=train_loader,
@@ -720,7 +464,7 @@ if __name__ == "__main__":
                 device=device,
                 epochs=EPOCHS,
                 early_stopping=EARLY_STOPPING,
-                log_dir="output/" + TEST_NAME + "/metrics/" + f"{model_index}",
+                log_dir="output/" + TEST_NAME + "/metrics",
             )
 
             loss, conf_matrix, classification_rep = validation(
@@ -730,20 +474,15 @@ if __name__ == "__main__":
                 device,
             )
 
-            # save classification report to a file
             df = pd.DataFrame(classification_rep).transpose()
-            df.to_csv(
-                "output/"
-                + TEST_NAME
-                + "/metrics/classification_report_"
-                + str(model_index)
-                + ".csv"
-            )
+            df.to_csv("output/" + TEST_NAME +
+                      "/metrics/classification_report.csv")
 
             torch.save(
                 trained_model.state_dict(),
-                "output/" + TEST_NAME + "/weights/model_" + str(model_index) + ".pth",
+                "output/" + TEST_NAME + "/weights/model.pth",
             )
+
             plt.figure(figsize=(19.20, 10.80))
             plt.title("Confusion Matrix")
             sns.heatmap(
@@ -757,16 +496,14 @@ if __name__ == "__main__":
             plt.xlabel("Predicted")
             plt.ylabel("Actual")
 
-            plt.savefig(
-                "output/"
-                + TEST_NAME
-                + "/confusion_matrix/confusion_matrix_"
-                + str(model_index)
-                + ".png"
-            )
-            conf_matrix_percent = conf_matrix.astype('float') / conf_matrix.sum(axis=1)[:, np.newaxis] * 100
+
+            plt.savefig("output/" + TEST_NAME +
+                        "/confusion_matrix/confusion_matrix.png")
+
             plt.figure(figsize=(19.20, 10.80))
             plt.title("Confusion Matrix Percentage")
+            conf_matrix_percent = conf_matrix.astype(
+                'float') / conf_matrix.sum(axis=1)[:, np.newaxis] * 100
             sns.heatmap(
                 conf_matrix_percent,
                 annot=True,
@@ -778,11 +515,189 @@ if __name__ == "__main__":
             plt.xlabel("Predicted")
             plt.ylabel("Actual")
-            plt.savefig(
-                "output/"
-                + TEST_NAME
-                + "/confusion_matrix/confusion_matrix_percentage_"
-                + str(model_index)
-                + ".png"
+
+            plt.savefig("output/" + TEST_NAME +
+                        "/confusion_matrix/confusion_matrix_percentage.png")
+
+        else:
+            x_all = [d["data"] for d in data]
+            y_all = [d["label"] for d in data]
+
+            x_mother = [d["data"] for d in mother_data]
+            y_mother = [d["label"] for d in mother_data]
+
+            x_fetus = [d["data"] for d in fetus_data]
+            y_fetus = [d["label"] for d in fetus_data]
+
+            (train_loader_all, test_loader_all) = create_loaders(
+                x_all,
+                y_all,
+                data,
+                over=OVER_SAMPLING,
+                under=UNDER_SAMPLING,
+                classes=CLASSES,
+                batch_size=BATCH_SIZE,
             )
-            model_index += 1
+
+            (train_loader_mother, test_loader_mother) = create_loaders(
+                x_mother,
+                y_mother,
+                mother_data,
+                over=OVER_SAMPLING,
+                under=UNDER_SAMPLING,
+                classes=CLASSES,
+                batch_size=BATCH_SIZE,
+            )
+
+            (train_loader_fetus, test_loader_fetus) = create_loaders(
+                x_fetus,
+                y_fetus,
+                fetus_data,
+                over=OVER_SAMPLING,
+                under=UNDER_SAMPLING,
+                classes=CLASSES,
+                batch_size=BATCH_SIZE,
+            )
+
+            (model, optimizer, scheduler, criterion) = setup_model_training(
+                input_size=FEATURE_SIZE,
+                hidden_size=HIDDEN_SIZE,
+                num_layers=NUM_LAYERS,
+                num_classes=len(CLASSES),
+                sequence_length=SERIES_LENGTH,
+                device=device,
+                lr=LEARNING_RATE,
+                weight_decay=WEIGHT_DECAY,
+                eps=EPS,
+            )
+
+            kf = StratifiedKFold(
+                n_splits=K_FOLD, shuffle=True, random_state=seed)
+            model_index = 0
+
+            x = None
+            y = None
+
+            if DATASET_TYPE == "all":
+                x = [d["data"] for d in data]
+                y = [d["label"] for d in data]
+            elif DATASET_TYPE == "fetus":
+                x = [d["data"] for d in fetus_data]
+                y = [d["label"] for d in fetus_data]
+            elif DATASET_TYPE == "mother":
+                x = [d["data"] for d in mother_data]
+                y = [d["label"] for d in mother_data]
+
+            # TODO: HOW TO HANDLE THIS CASES? for the mixed training and validation
+            else:
+                Exception("Invalid dataset type")
+
+            for train_index, test_index in kf.split(X=x, y=y):
+                train_data = [data[i] for i in train_index]
+                test_data = [data[i] for i in test_index]
+
+                data = train_data + test_data
+
+                x = [d["data"] for d in train_data]
+                y = [d["label"] for d in train_data]
+
+                (train_loader, test_loader) = create_loaders(
+                    x,
+                    y,
+                    data,
+                    over=OVER_SAMPLING,
+                    under=UNDER_SAMPLING,
+                    classes=CLASSES,
+                    batch_size=BATCH_SIZE,
+                )
+
+                (model, optimizer, scheduler, criterion) = setup_model_training(
+                    input_size=FEATURE_SIZE,
+                    hidden_size=HIDDEN_SIZE,
+                    num_layers=NUM_LAYERS,
+                    num_classes=len(CLASSES),
+                    sequence_length=SERIES_LENGTH,
+                    device=device,
+                    lr=LEARNING_RATE,
+                    weight_decay=WEIGHT_DECAY,
+                    eps=EPS,
+                )
+
+                trained_model = training_loop(
+                    model=model,
+                    train_loader=train_loader,
+                    test_loader=test_loader,
+                    optimizer=optimizer,
+                    scheduler=scheduler,
+                    criterion=criterion,
+                    device=device,
+                    epochs=EPOCHS,
+                    early_stopping=EARLY_STOPPING,
+                    log_dir="output/" + TEST_NAME +
+                    "/metrics/" + f"{model_index}",
+                )
+
+                loss, conf_matrix, classification_rep = validation(
+                    trained_model,
+                    test_loader,
+                    criterion,
+                    device,
+                )
+
+                df = pd.DataFrame(classification_rep).transpose()
+                df.to_csv(
+                    "output/"
+                    + TEST_NAME
+                    + "/metrics/classification_report_"
+                    + str(model_index)
+                    + ".csv"
+                )
+
+                torch.save(
+                    trained_model.state_dict(),
+                    "output/" + TEST_NAME + "/weights/model_" +
+                    str(model_index) + ".pth",
+                )
+                plt.figure(figsize=(19.20, 10.80))
+                plt.title("Confusion Matrix")
+                sns.heatmap(
+                    conf_matrix,
+                    annot=True,
+                    fmt=".2f",
+                    xticklabels=["Baseline", "Opcl", "Yawn"],
+                    yticklabels=["Baseline", "Opcl", "Yawn"],
+                    cmap="viridis",
+                )
+
+                plt.xlabel("Predicted")
+                plt.ylabel("Actual")
+                plt.savefig(
+                    "output/"
+                    + TEST_NAME
+                    + "/confusion_matrix/confusion_matrix_"
+                    + str(model_index)
+                    + ".png"
+                )
+                conf_matrix_percent = conf_matrix.astype(
+                    'float') / conf_matrix.sum(axis=1)[:, np.newaxis] * 100
+                plt.figure(figsize=(19.20, 10.80))
+                plt.title("Confusion Matrix Percentage")
+                sns.heatmap(
+                    conf_matrix_percent,
+                    annot=True,
+                    fmt=".2f",
+                    xticklabels=["Baseline", "Opcl", "Yawn"],
+                    yticklabels=["Baseline", "Opcl", "Yawn"],
+                    cmap="viridis",
+                )
+
+                plt.xlabel("Predicted")
+                plt.ylabel("Actual")
+                plt.savefig(
+                    "output/"
+                    + TEST_NAME
+                    + "/confusion_matrix/confusion_matrix_percentage_"
+                    + str(model_index)
+                    + ".png"
+                )
+                model_index += 1