diff --git a/generate_new_lesions/generate_histograms.py b/generate_new_lesions/generate_histograms.py
deleted file mode 100644
index 5c5401e1..00000000
--- a/generate_new_lesions/generate_histograms.py
+++ /dev/null
@@ -1,161 +0,0 @@
-"""
-Generate histograms of the images from the pathology and healthy datasets.
-
-Example:
-    python generate_histograms.py
-    -dir-pathology
-    ~/data/sci-zurich-nnunet/Dataset525_tSCILesionsZurich/imagesTr
-    -dir-healthy
-    ~/data/data-multi-subject-nnunet/Dataset526_SpineGenericMultiSubject/imagesTr/
-
-"""
-
-import os
-import argparse
-
-import pandas as pd
-import numpy as np
-import seaborn as sns
-import matplotlib.pyplot as plt
-
-from spinalcordtoolbox.image import Image
-
-
-def get_parser():
-    parser = argparse.ArgumentParser()
-    parser.add_argument("-dir-pathology", default="imagesTr", type=str, required=True,
-                        help="Path to raw images from pathology dataset (i.e. SCI-Zurich)")
-    parser.add_argument("-dir-healthy", default="imagesTr", type=str, required=True,
-                        help="Path to raw images from the healthy dataset (i.e. Spine Generic Multi)")
-
-    return parser
-
-
-def create_histogram(dir_path, title):
-
-    # get all subjects
-    cases = os.listdir(dir_path)
-    # remove '.DS_Store' from the list
-    if '.DS_Store' in cases:
-        cases.remove('.DS_Store')
-
-    # Initialize dictionaries to store histograms for individual subjects
-    dict_hist = dict()
-    dict_hist_sc = dict()
-    dict_hist_lesion = dict()
-
-    # Initialize the figure
-    fig, axs = plt.subplots(1, 2, tight_layout=True)
-    # Loop across all subjects
-    for i, sub in enumerate(cases, 1):
-
-        print(f'Processing subject {i}/{len(cases)}')
-
-        # Whole image
-        path_image = os.path.join(dir_path, sub)
-        im = Image(path_image)
-        # Get numpy array
-        im_data = im.data
-        # Normalize images to range 0 and 1
-        im_data = (im_data - np.min(im_data)) / (np.max(im_data) - np.min(im_data))
-
-        # Spinal cord only
-        path_mask = os.path.join(dir_path.replace('imagesTr', 'masksTr'), sub)
-        # Remove _0000 from the filename
-        path_mask = path_mask.replace('_0000', '')
-        im_mask = Image(path_mask)
-        # Get numpy array
-        im_mask_data = im_mask.data
-
-        # Lesion (available only for sci-zurich dataset)
-        if 'sub-zh' in sub:
-            path_lesion = os.path.join(dir_path.replace('imagesTr', 'labelsTr'), sub)
-            # Remove _0000 from the filename
-            path_lesion = path_lesion.replace('_0000', '')
-            im_lesion = Image(path_lesion)
-            # Get numpy array
-            im_lesion_data = im_lesion.data
-
-        # Check if im_data and im_mask_data have the same shape
-        if im_data.shape == im_mask_data.shape:
-
-            # Whole image
-            # Get histogram using np.histogram
-            hist, bin_edges = np.histogram(im_data, bins=50, range=(0, 1))
-            # Store histogram in dictionary
-            dict_hist[sub] = hist
-
-            # Spinal cord only
-            if 'sub-zh' in sub:
-                im_data_sc = im_data[(im_mask_data > 0) & (im_lesion_data == 0)]
-            else:
-                im_data_sc = im_data[im_mask_data > 0]
-            # Get histogram using np.histogram
-            hist_sc, bin_edges = np.histogram(im_data_sc, bins=50, range=(0, 1))
-            # Store histogram in dictionary
-            dict_hist_sc[sub] = hist_sc
-
-            # Lesion (available only for sci-zurich dataset)
-            if 'sub-zh' in sub:
-                im_data_lesion = im_data[im_lesion_data > 0]
-                # Get histogram using np.histogram
-                hist_lesion, bin_edges = np.histogram(im_data_lesion, bins=50, range=(0, 1))
-                # Store histogram in dictionary
-                dict_hist_lesion[sub] = hist_lesion
-
-            # Plot histograms
-            axs[0].hist(im_data.flatten(), bins=50, histtype='step', range=(0, 1), alpha=0.6)
-            axs[0].set_title('Whole image')
-            axs[1].hist(im_data_sc.flatten(), bins=50, histtype='step', range=(0, 1), alpha=0.6)
-            axs[1].set_title('Spinal cord only')
-        else:
-            print(f'Skipping subject {sub} because image and SC mask have different shapes.')
-
-    # Compute mean histogram across subjects
-    hist_mean = pd.DataFrame.from_dict(dict_hist, orient='index').mean()
-    hist_sc_mean = pd.DataFrame.from_dict(dict_hist_sc, orient='index').mean()
-    if 'sub-zh' in sub:
-        hist_lesion_mean = pd.DataFrame.from_dict(dict_hist_lesion, orient='index').mean()
-
-    # # Plot using sns.distplot
-    # sns.displot(pd.DataFrame.from_dict(dict_hist, orient='index'), bins=50, kind="kde")
-    # sns.distplot(hist_mean, bins=50, ax=axs[0])
-    # sns.distplot(hist_sc_mean, bins=50, ax=axs[1])
-
-    axs[0].plot(bin_edges[:-1], hist_mean, label='Mean histogram', color='red', linewidth=2)
-    axs[1].plot(bin_edges[:-1], hist_sc_mean, label='Mean histogram SC', color='red', linewidth=2)
-    if 'sub-zh' in sub:
-        axs[1].plot(bin_edges[:-1], hist_lesion_mean, label='Mean histogram lesion', color='blue', linewidth=2)
-
-    # Add legend
-    axs[0].legend()
-    axs[1].legend()
-
-    # Adjust ylim for axs[1]
-    axs[1].set_ylim([0, 0.3 * np.max(hist_sc_mean)])
-
-    # Add master title
-    fig.suptitle(title)
-
-    # Save figure
-    plt.savefig('histogram_' + title + '.png')
-    print('Histogram saved as histogram_' + title + '.png')
-    # Close figure
-    plt.close()
-
-
-def main():
-    # Parse the command line arguments
-    parser = get_parser()
-    args = parser.parse_args()
-
-    # Expand user (i.e. ~) in paths
-    args.dir_healthy = os.path.expanduser(args.dir_healthy)
-    args.dir_pathology = os.path.expanduser(args.dir_pathology)
-
-    create_histogram(args.dir_pathology, 'patho')
-    create_histogram(args.dir_healthy, 'healthy')
-
-
-if __name__ == '__main__':
-    main()
diff --git a/generate_new_lesions/generate_new_lesion.py b/generate_new_lesions/generate_new_lesion.py
deleted file mode 100644
index f8cebbde..00000000
--- a/generate_new_lesions/generate_new_lesion.py
+++ /dev/null
@@ -1,508 +0,0 @@
-"""
-Take lesion from subject_b and insert it into subject_a
-
-Activate SCT conda environment:
-    source ${SCT_DIR}/python/etc/profile.d/conda.sh
-    conda activate venv_sct
-
-Run:
-    python generate_new_lesion.py
-
-nnUNet data structure is required.
-TODO: switch to BIDS?
-"""
-import os
-import sys
-import time
-import argparse
-import numpy as np
-from scipy.ndimage import binary_dilation, generate_binary_structure
-import nibabel as nib
-
-from spinalcordtoolbox.image import Image, zeros_like
-from spinalcordtoolbox.resampling import resample_nib
-
-from utils import get_centerline, get_lesion_volume, keep_largest_component, fetch_subject_and_session, \
-    generate_histogram
-
-# TODO: Check out Diffusion models for synthesizing new images + lesions 
-
-
-def get_parser():
-    parser = argparse.ArgumentParser()
-    parser.add_argument("-num", default=100, type=int, help="Total number of newly generated subjects. Default: 100")
-    parser.add_argument("-dir-pathology", default="imagesTr", type=str,
-                        help="Path to raw images from pathology dataset (i.e. SCI-Zurich)")
-    parser.add_argument("-dir-lesions", default="labelsTr", type=str,
-                        help="Path to lesion labels from pathology dataset (i.e. SCI-Zurich)")
-    parser.add_argument("-dir-masks-pathology", default="masksTr", type=str,
-                        help="Path to SC masks from pathology dataset (i.e. SCI-Zurich)")
-    parser.add_argument("-dir-healthy", default="imagesTr", type=str,
-                        help="Path to raw images from the healthy dataset (i.e. Spine Generic Multi)")
-    parser.add_argument("-dir-masks-healthy", default="masksTr", type=str,
-                        help="Path to SC masks from healthy dataset (i.e. Spine Generic Multi)")
-    parser.add_argument("-dir-save", default="labelsTr", type=str,
-                        help="Path to save new lesion samples")
-    parser.add_argument("-seed", default=99, type=int, help="Random seed used for subject mixing. Default: 99")
-    parser.add_argument("-resample", default=False, action='store_true',
-                        help="Resample the augmented images to the resolution of pathological dataset. Default: False")
-    parser.add_argument("-qc", default=False, action='store_true', help="Perform QC using sct_qc. Default: False")
-    parser.add_argument("-histogram", default=False, action='store_true', help="Create histograms. Default: False")
-    parser.add_argument("-min-lesion-vol", "--min-lesion-volume", default=200, type=float,
-                        help="Minimum lesion volume in mm^3. Default: 200")
-    # parser.add_argument("--mask_save_path", "-mask-pth", default="mask", type=str,
-    #                     help="Path to save carved masks")
-
-    return parser
-
-
-def insert_lesion(im_augmented, im_augmented_lesion, im_patho_data, im_patho_sc_dil_data, im_patho_lesion_data, 
-                  im_healthy_sc_data, coords, new_position, lesion_sc_ratio_patho):
-    """"
-    Insert lesion from the bounding box to the im_augmented
-    """
-    # Get bounding box coordinates
-    x0, y0, z0 = coords.min(axis=0)
-    x1, y1, z1 = coords.max(axis=0) + 1  # slices are exclusive at the top
-
-    # Get coordinates where to insert the lesion
-    x, y, z = new_position
-
-    # TODO - take angle of the centerline into account when projecting the lesion
-    # TODO for Nathan - rewrite this without 3 loops
-
-    for x_step, x_cor in enumerate(range(x0, x1)):
-        for y_step, y_cor in enumerate(range(y0, y1)):
-            for z_step, z_cor in enumerate(range(z0, z1)):
-                # Check that dimensions do not overflow
-                if x + x_step >= im_augmented.shape[0] or y + y_step >= im_augmented.shape[1] or z + z_step >= im_augmented.shape[2]:
-                    continue
-                
-                # Insert only voxels corresponding to the lesion mask
-                # Also make sure that the new lesion is not projected outside of the SC
-                if im_patho_lesion_data[x_cor, y_cor, z_cor] > 0 and im_healthy_sc_data[x + x_step, y + y_step, z + z_step] > 0:
-                    # # Lesion inserted into the target image
-                    # im_augmented[x + x_step, y + y_step, z + z_step] = im_patho_data[x_cor, y_cor, z_cor] * intensity_ratio_scs   # original
-
-                    # Simply copy the lesion voxels
-                    im_augmented[x + x_step, y + y_step, z + z_step] = im_patho_data[x_cor, y_cor, z_cor]
-                                                            
-                    # Lesion mask
-                    im_augmented_lesion[x + x_step, y + y_step, z + z_step] = im_patho_lesion_data[x_cor, y_cor, z_cor]
-
-
-    # dilate the augmented lesion mask same as before
-    im_augmented_lesion_dilated = im_augmented_lesion.copy()
-    im_augmented_lesion_dilated = binary_dilation(im_augmented_lesion_dilated, structure=generate_binary_structure(3, 5), iterations=3)
-    # extract only the dilated region of the lesion from the healthy SC
-    im_healthy_sc_dil_data = im_healthy_sc_data * im_augmented_lesion_dilated
-    # print(f"non zero elements in healthy SC after dilation: {np.count_nonzero(im_healthy_sc_data)}")
-
-    # TODO: check whether this is the same as multiplying element-wise
-    # compute the intensity ratio of the SCs of the patho and healthy image
-    # intensity_ratio_scs = np.mean(im_augmented[im_healthy_sc_dil_data > 0]) / np.mean(im_patho_data[im_patho_sc_dil_data > 0])  # with lesion
-    intensity_ratio_scs = np.mean(im_augmented[(im_healthy_sc_dil_data > 0) & (im_augmented_lesion == 0)]) / \
-                                    np.mean(im_patho_data[(im_patho_sc_dil_data > 0) & (im_patho_lesion_data == 0)])  # without lesion
-    # print(f"Mean Intensity ratio of augmented/patho SC: {intensity_ratio_scs}")
-
-    # modify the augmented lesion voxels with the intensity ratio
-    im_augmented[im_augmented_lesion > 0] = im_augmented[im_augmented_lesion > 0] * intensity_ratio_scs
-
-    # compute the lesion/SC intensity ratio in the augmented image
-    # lesion_sc_ratio_augmented = np.mean(im_augmented[im_augmented_lesion > 0]) / np.mean(im_augmented[im_healthy_sc_dil_data > 0])
-    lesion_sc_ratio_augmented = np.mean(im_augmented[im_augmented_lesion > 0]) / np.mean(im_augmented[(im_healthy_sc_dil_data > 0) & (im_augmented_lesion == 0)])
-    print(f"Mean Lesion/SC Intensity Ratio of Augmented Subject (AFTER LESION INSERTION): {lesion_sc_ratio_augmented}")
-
-    # modify the intensity ratio of augmented lesion to be similar to that of the patho lesion
-    im_augmented[im_augmented_lesion > 0] = im_augmented[im_augmented_lesion > 0] * lesion_sc_ratio_patho / lesion_sc_ratio_augmented
-
-    # recompute the lesion/SC intensity ratio in the augmented image
-    lesion_sc_ratio_augmented = np.mean(im_augmented[im_augmented_lesion > 0]) / np.mean(im_augmented[(im_healthy_sc_dil_data > 0) & (im_augmented_lesion == 0)])
-    print(f"Mean Lesion/SC Intensity Ratio of Augmented Subject (AFTER INTENSITY MODIFICATION): {lesion_sc_ratio_augmented}")
-
-    return im_augmented, im_augmented_lesion, im_healthy_sc_dil_data
-
-
-def generate_new_sample(sub_healthy, sub_patho, args, index):
-
-    """
-    Load pathological subject image, spinal cord segmentation, and lesion mask
-    """
-    # Construct paths
-    path_image_patho = os.path.join(args.dir_pathology, sub_patho + '_0000.nii.gz')
-    path_label_patho = os.path.join(args.dir_lesions, sub_patho + '.nii.gz')
-    path_mask_sc_patho = os.path.join(args.dir_masks_pathology, sub_patho + '.nii.gz')
-
-    # Load image_patho, label_patho, and mask_sc_patho
-    im_patho = Image(path_image_patho)
-    im_patho_sc = Image(path_mask_sc_patho)
-    im_patho_lesion = Image(path_label_patho)
-
-    im_patho_orientation_native = im_patho.orientation
-    print(f"Pathological subject {path_image_patho}: {im_patho_orientation_native}, {im_patho.dim[0:3]}, {im_patho.dim[4:7]}")
-    # TODO: consider reorienting back to native orientation
-
-    # Reorient to RPI
-    im_patho.change_orientation("RPI")
-    im_patho_sc.change_orientation("RPI")
-    im_patho_lesion.change_orientation("RPI")
-    print("Reoriented to RPI")
-
-    # Get numpy arrays
-    im_patho_data = im_patho.data
-    im_patho_sc_data = im_patho_sc.data
-    im_patho_lesion_data = im_patho_lesion.data
-
-    # Check if image and spinal cord mask have the same shape, if not, skip this subject
-    if im_patho_data.shape != im_patho_sc_data.shape:
-        print("WARNING: image_patho and label_patho have different shapes --> skipping subject\n")
-        return False
-
-    # Check if lesion volume is less than X mm^3, if yes, skip this subject
-    im_patho_lesion_vol = get_lesion_volume(im_patho_lesion_data, im_patho.dim[4:7], debug=False)
-    if im_patho_lesion_vol < args.min_lesion_volume:
-        print("WARNING: lesion volume is too small --> skipping subject\n")
-        return False
-
-
-    """
-    Load healthy subject image and spinal cord segmentation
-    """
-    # Construct paths
-    path_image_healthy = os.path.join(args.dir_healthy, sub_healthy + '_0000.nii.gz')
-    path_mask_sc_healthy = os.path.join(args.dir_masks_healthy, sub_healthy + '.nii.gz')
-
-    # Load image_healthy and mask_sc
-    im_healthy = Image(path_image_healthy)
-    im_healthy_sc = Image(path_mask_sc_healthy)
-
-    im_healthy_orientation_native = im_healthy.orientation
-    print(f"Healthy subject {path_image_healthy}: {im_healthy_orientation_native}, {im_healthy.dim[0:3]}, {im_healthy.dim[4:7]}")
-
-    # Reorient to RPI
-    im_healthy.change_orientation("RPI")
-    im_healthy_sc.change_orientation("RPI")
-    print("Reoriented to RPI")
-
-
-    """
-    Resample healthy subject image and spinal cord mask to the spacing of pathology subject
-    """
-    if args.resample:
-        # Resample healthy subject to the spacing of pathology subject
-        # print(f'Resampling healthy subject image and SC mask to the spacing of pathology subject ({path_image_patho}).')
-
-        # print(f'Before resampling - Image Shape: {im_healthy.dim[0:3]}, Image Resolution: {im_healthy.dim[4:7]}')
-        # new_lesion_vol = get_lesion_volume(new_lesion.data, new_lesion.dim[4:7], debug=False)
-        # print(f'Lesion volume before resampling: {new_lesion_vol} mm3')
-
-        # Fetch voxel size of pathology subject (will be used for resampling)
-        # Note: get_zooms() is nibabel function that returns voxel size in mm (same as SCT's im_patho.dim[4:7])
-        im_patho_voxel_size = im_patho.header.get_zooms()
-
-        # Resample
-        # Note: we cannot use 'image_dest=' option because we do not want to introduce padding or cropping
-        im_healthy = resample_nib(im_healthy, new_size=im_patho_voxel_size, new_size_type='mm', interpolation='linear')
-        # new_lesion = resample_nib(new_lesion, new_size=im_patho_voxel_size, new_size_type='mm', interpolation='linear')
-        im_healthy_sc = resample_nib(im_healthy_sc, new_size=im_patho_voxel_size, new_size_type='mm', interpolation='linear')
-        # new_sc = resample_nib(new_sc, new_size=im_patho_voxel_size, new_size_type='mm', interpolation='linear')
-
-        print(f'After resampling - Image Shape: {im_healthy.dim[0:3]}, Image Resolution: {im_healthy.dim[4:7]}')
-
-    # Get numpy arrays
-    im_healthy_data = im_healthy.data
-    im_healthy_sc_data = im_healthy_sc.data
-
-    # Check if image and spinal cord mask have the same shape, if not, skip this subject
-    if im_healthy_data.shape != im_healthy_sc_data.shape:
-        print("Warning: image_healthy and mask_sc have different shapes --> skipping subject")
-        return False
-
-    # # normalize images to range 0 and 1 using min-max normalization
-    # im_healthy_data = (im_healthy_data - np.min(im_healthy_data)) / (np.max(im_healthy_data) - np.min(im_healthy_data))
-    # im_patho_data = (im_patho_data - np.min(im_patho_data)) / (np.max(im_patho_data) - np.min(im_patho_data))
-    # normalize with Z-score
-    im_healthy_data = (im_healthy_data - np.mean(im_healthy_data)) / (np.std(im_healthy_data) + 1e-8)
-    im_patho_data = (im_patho_data - np.mean(im_patho_data)) / (np.std(im_patho_data) + 1e-8)
-
-    # first, try equalizing the histograms of the two images using SC masks
-    # im_healthy_data[im_healthy_sc_data > 0] = exposure.match_histograms(im_healthy_data[im_healthy_sc_data > 0], 
-    #                                                                     im_patho_data[im_patho_sc_data > 0], channel_axis=-1)
-
-    # # match histogram of healthy image to pathological image
-    # print(im_patho_data.shape)
-    # im_healthy_data_matched = match_histogram_3D(source_volume=im_healthy_data, target_volume=im_patho_data)
-    # im_healthy_data_matched_nii = nib.Nifti1Image(im_healthy_data_matched, im_healthy.affine, im_healthy.header)
-    # nib.save(im_healthy_data_matched_nii, os.path.join(args.dir_save.replace("labelsTr", "intermediate_niftis"),
-    #                                                      f"{sub_healthy}_hist-matched.nii.gz"))
-
-    """
-    Get intensity ratio between healthy and pathological SC and normalize images.
-    The ratio is used to multiply the lesion in the healthy image.
-    """    
-    # First, compute the ratio of intensities between lesion and SC in the pathological image
-    # Extract SC mask in the neighbourhood of the lesion
-    # print(f"non zero elements in patho SC before dilation: {np.count_nonzero(im_patho_sc_data)}")
-    # print(f"non zero elements in lesion: {np.count_nonzero(im_patho_lesion_data)}")
-    im_patho_lesion_data_dilated = binary_dilation(im_patho_lesion_data, structure=generate_binary_structure(3, 5), iterations=3)
-    im_patho_sc_dil_data = im_patho_sc_data * im_patho_lesion_data_dilated
-    
-    # lesion_sc_ratio_patho = np.mean(im_patho_data[im_patho_lesion_data > 0]) / np.mean(im_patho_data[im_patho_sc_dil_data > 0])    # with lesion
-    lesion_sc_ratio_patho = np.mean(im_patho_data[im_patho_lesion_data > 0]) / np.mean(im_patho_data[(im_patho_sc_dil_data > 0) & (im_patho_lesion_data == 0)])    # without lesion
-    print(f"Mean lesion/SC Intensity Ratio of Patho Subject {sub_patho}: {lesion_sc_ratio_patho}")
-    # Make sure the intensity ratio is always > 1 (i.e. the lesion is always brighter than the healthy SC)
-    if lesion_sc_ratio_patho < 1:
-        lesion_sc_ratio_patho = 1 / lesion_sc_ratio_patho
-        print(f"Mean lesion/SC Intensity Ratio of Patho Subject {sub_patho} (after inversion): {lesion_sc_ratio_patho}")
-
-    """
-    Main logic - copy lesion from pathological image to healthy image
-    """
-    # Initialize Image instances for the new target and lesion
-    im_augmented = zeros_like(im_healthy)
-    im_augmented_lesion = zeros_like(im_healthy)
-
-    # Create a copy of the healthy SC mask. The mask will have the proper output name and will be saved under masksTr
-    # folder. The mask is useful for lesion QC (using sct_qc) or nnU-Net region-based training
-    # (https://github.com/MIC-DKFZ/nnUNet/blob/master/documentation/region_based_training.md)
-    new_sc = im_healthy_sc.copy()
-
-    # Create 3D bounding box around non-zero pixels (i.e., around the lesion)
-    lesion_coords = np.argwhere(im_patho_lesion_data > 0)
-
-    # Get centerline from healthy SC seg. The centerline is used to project the lesion from the pathological image
-    healthy_centerline = get_centerline(im_healthy_sc_data)
-    # Make sure that the z-axis is at the max of the SC mask so that it is not mapped on the brainstem
-    healthy_centerline_cropped = healthy_centerline[round(len(healthy_centerline)*0.1):
-                                                    round(len(healthy_centerline)*0.75)]
-    # TODO: Check what's the origin - bottom left or top left. Because using 0.25-0.9 seems to place lesions at the 
-    # top levels but 0.1-0.75 does not do so
-
-    # Select random coordinate on the centerline
-    # index is used to have different seed for every subject to have different lesion positions across different subjects
-    rng = np.random.default_rng(args.seed + index)
-
-    # NOTE: This loop is required because the lesion from the original patho image could be cropped if it is going
-    # outside of the SC in the healthy image. So, the loop continues until the lesion inserted in the healthy image
-    # is greater than args.min_lesion_volume
-    i = 0
-    while True:
-        # Initialize numpy arrays with the same shape as the healthy image
-        im_augmented_data = np.copy(im_healthy_data)
-        im_augmented_lesion_data = np.zeros_like(im_healthy_data)
-
-        # New position for the lesion
-        new_position = healthy_centerline_cropped[rng.integers(0, len(healthy_centerline_cropped) - 1)]
-        print(f"Trying to insert lesion at {new_position}")
-
-        # Insert lesion from the bounding box to the im_augmented
-        im_augmented_data, im_augmented_lesion_data, im_healthy_sc_dil_data = insert_lesion(im_augmented_data, im_augmented_lesion_data, im_patho_data,
-                                                         im_patho_sc_dil_data, im_patho_lesion_data, im_healthy_sc_data,
-                                                         lesion_coords, new_position, lesion_sc_ratio_patho)
-
-        # Inserted lesion can be divided into several parts (due to the crop by the healthy SC mask and SC curvature).
-        # In such case, keep only the largest part.
-        # NOTE: im_augmented_lesion_data could still be empty if the coordinates of lesion bbox are overflowing out of healthy SC, 
-        # essentially never reaching the second if statement in insert_lesion() function. As a result, we get 
-        # "ValueError: attempt to get argmax of an empty sequence" error in keep_largest_component() function.
-        # So, check if im_augmented_lesion_data is empty and if so, try again (with a different position)
-        if not im_augmented_lesion_data.any():
-            print(f"Lesion inserted at {new_position} is empty. Trying again...")
-            continue
-        
-        im_augmented_lesion_data = keep_largest_component(im_augmented_lesion_data)
-        # Insert back intensity values from the original healthy image everywhere where the lesion is zero. In other
-        # words, keep only the largest part of the lesion and replace the rest with the original healthy image.
-        im_augmented_data[im_augmented_lesion_data == 0] = im_healthy_data[im_augmented_lesion_data == 0]
-
-        # Check if inserted lesion is larger then min_lesion_volume
-        # NOTE: we are doing this check because the lesion can smaller due to crop by the spinal cord mask
-        lesion_vol = get_lesion_volume(im_augmented_lesion_data, im_augmented_lesion.dim[4:7], debug=False)
-        if lesion_vol > args.min_lesion_volume:
-            print(f"Lesion inserted at {new_position}")
-            break
-
-        if i == 10:
-            print(f"WARNING: Tried 10 times to insert lesion but failed. Skipping this subject...")
-            return False
-        i += 1
-
-    # # Revert the histogram matching
-    # im_augmented_data = match_histogram_3D(im_augmented_data, target_volume=im_healthy_data)
-    # im_augmented_data_nii = nib.Nifti1Image(im_augmented_data, im_healthy.affine, im_healthy.header)
-    # nib.save(im_augmented_data_nii, os.path.join(args.dir_save.replace("labelsTr", "intermediate_niftis"),
-    #                                                 f"{sub_healthy}_hist-revert.nii.gz"))
-
-    # Insert newly created target and lesion into Image instances
-    im_augmented.data = im_augmented_data
-    im_augmented_lesion.data = im_augmented_lesion_data
-
-    # Add a final check to ensure that the im_augmented_lesion is not empty
-    if np.sum(im_augmented_lesion.data) == 0:
-        print(f"WARNING: (augmented) im_augmented_lesion is empty. Check code again. Gracefully exiting....")
-        sys.exit(1)
-
-    # Convert i to string and add 3 leading zeros
-    s = str(index).zfill(3)
-
-    """
-    Save im_augmented and im_augmented_lesion
-    """
-    # Get subject and session IDs from the healthy image
-    subjectID_healthy, sessionID_healthy, _ = fetch_subject_and_session(sub_healthy)
-    # Get subject and session IDs from the patho image
-    subjectID_patho, sessionID_patho, _ = fetch_subject_and_session(sub_patho)
-
-    if sessionID_patho is None:
-        subject_name_out = subjectID_healthy + '_' + subjectID_patho + '_' + s
-    # NOTE: Zurich also has sessions (e.g. sub-zh11_ses-01)
-    else:
-        subject_name_out = subjectID_healthy + '_' + subjectID_patho + '_' + sessionID_patho + '_' + s
-
-    if args.histogram:
-        # Generate healthy-patho pair histogram
-        generate_histogram(im_healthy_data, im_healthy_sc_data, im_healthy_sc_dil_data,
-                           im_patho_data, im_patho_sc_data, im_patho_sc_dil_data, im_patho_lesion_data,
-                           im_augmented_data, im_augmented_lesion_data, new_sc.data,
-                           sub_healthy, sub_patho, subject_name_out,
-                           output_dir=args.dir_save.replace("labelsTr", "histograms"))
-
-    if subjectID_patho.startswith('sub-zh'):
-        qc_plane = 'sagittal'
-    else:
-        qc_plane = 'axial'
-
-    im_augmented_path = os.path.join(args.dir_healthy, subject_name_out + '_0000.nii.gz')
-    im_augmented_lesion_path = os.path.join(args.dir_save, subject_name_out + '.nii.gz')
-    new_sc_path = os.path.join(args.dir_masks_healthy, subject_name_out + '.nii.gz')
-
-    im_augmented.save(im_augmented_path)
-    print(f'Saving {im_augmented_path}; {im_augmented.orientation, im_augmented.dim[4:7]}')
-    im_augmented_lesion.save(im_augmented_lesion_path)
-    print(f'Saving {im_augmented_lesion_path}; {im_augmented_lesion.orientation, im_augmented_lesion.dim[4:7]}')
-    new_sc.save(new_sc_path)
-    print(f'Saving {new_sc_path}; {new_sc.orientation, new_sc.dim[4:7]}')
-    print('')
-
-    # Generate QC
-    if args.qc:
-        # Binarize im_augmented_lesion (sct_qc supports only binary masks)
-        im_augmented_lesion_bin_path = im_augmented_lesion_path.replace('.nii.gz', '_bin.nii.gz')
-        os.system(f'sct_maths -i {im_augmented_lesion_path} -bin 0 -o {im_augmented_lesion_bin_path}')
-        # Example: sct_qc -i t2.nii.gz -s t2_seg.nii.gz -d t2_lesion.nii.gz -p sct_deepseg_lesion -plane axial
-        os.system(f'sct_qc -i {im_augmented_path} -s {new_sc_path} -d {im_augmented_lesion_bin_path} -p sct_deepseg_lesion '
-                  f'-plane {qc_plane} -qc {args.dir_save.replace("labelsTr", "qc")} -qc-subject {subject_name_out}')
-        # Remove binarized lesion
-        os.remove(im_augmented_lesion_bin_path)
-
-    return True
-
-
-def main():
-    # Parse the command line arguments
-    parser = get_parser()
-    args = parser.parse_args()
-
-    # Expand user (i.e. ~) in paths
-    args.dir_healthy = os.path.expanduser(args.dir_healthy)
-    args.dir_masks_healthy = os.path.expanduser(args.dir_masks_healthy)
-    args.dir_pathology = os.path.expanduser(args.dir_pathology)
-    args.dir_lesions = os.path.expanduser(args.dir_lesions)
-    args.dir_masks_pathology = os.path.expanduser(args.dir_masks_pathology)
-    args.dir_save = os.path.expanduser(args.dir_save)
-
-    # get all pathology cases
-    # TODO - maybe could be changed to args.dir_pathology
-    cases_patho = os.listdir(args.dir_lesions)
-    # remove '.DS_Store' from Cases list
-    if '.DS_Store' in cases_patho:
-        cases_patho.remove('.DS_Store')
-    simple_cases_patho = [case.split('.')[0] for i, case in enumerate(cases_patho) if 'Mix' not in case]
-    cases_patho = simple_cases_patho
-
-    # get all healthy cases
-    # TODO - maybe could be changed to args.dir_healthy
-    cases_healthy = os.listdir(args.dir_masks_healthy)
-    # remove '.DS_Store' from Cases list
-    if '.DS_Store' in cases_healthy:
-        cases_healthy.remove('.DS_Store')
-    simple_cases_healthy = [case.split('.')[0] for i, case in enumerate(cases_healthy) if 'Mix' not in case]
-    cases_healthy = simple_cases_healthy
-
-    # Check if number of samples to generate is not larger than the number of available subjects
-    # Because we want to use each healthy subject only once
-    if args.num > len(cases_healthy):
-        sys.exit(f"Number of samples to generate ({args.num}) is larger than the number of available "
-                 f"subjects ({len(cases_patho)})")
-
-    """
-    Mix pathology and healthy subjects
-    """
-    print("Random seed: ", args.seed)
-    rng = np.random.default_rng(args.seed)
-    # Get random indices for pathology and healthy subjects
-    patho_random_list = rng.choice(len(cases_patho), args.num*2) # *2 because we need same number of patho and healthy
-    healthy_random_list = rng.choice(len(cases_healthy), args.num, replace=False)
-
-    # Duplicate healthy list (we need more subjects because some pair might be skipped, for example due to no lesion)
-    healthy_random_list = np.tile(healthy_random_list, 2)
-
-    # Combine both lists
-    rand_index = np.vstack((patho_random_list, healthy_random_list))
-    # Keep only unique combinations (to avoid mixing the same subjects)
-    rand_index = np.unique(rand_index, axis=1)
-    # np.unique sorts the array, so we need to shuffle it again
-    rng.shuffle(rand_index.T)
-
-    num_of_samples_generated = 0
-
-    """
-    Start generating new samples
-    """
-    for i in range(len(rand_index[0])):
-
-        # wait 0.1 seconds to avoid print overlapping
-        time.sleep(0.1)
-
-        rand_index_patho = rand_index[0][i]
-        rand_index_healthy = rand_index[1][i]
-
-        sub_patho = cases_patho[rand_index_patho]
-        sub_healthy = cases_healthy[rand_index_healthy]
-
-        # SCI-Zurich example where lesion is only slight hyperintense
-        # sub_patho = 'sub-zh37_ses-01_029'
-        # sub_healthy = 'sub-tokyoIngenia05_213'
-        
-        # NOTE: sub-5740 in SCI-Colorado has a weird contrast range when viewed on FSLeyes. It is 
-        # causing in the augmentation, hence it is skipped for now.
-        if 'sub-5740' in sub_patho:
-            print("Encountered sub-5740, skipping...")
-            continue
-
-        # Strip .nii.gz from the subject name
-        sub_healthy = sub_healthy.replace('.nii.gz', '')
-        sub_patho = sub_patho.replace('.nii.gz', '')
-
-        print(f"\nHealthy subject: {sub_healthy}, Patho subject: {sub_patho}")
-
-        # If augmentation is done successfully (True is returned), break the loop and continue to the next sample
-        # If augmentation is not done successfully (False is returned), continue the while loop and try again
-        if generate_new_sample(sub_healthy=sub_healthy, sub_patho=sub_patho, args=args, index=i):
-            num_of_samples_generated += 1
-            print('-' * 50)
-            print(f"Number of samples generated: {num_of_samples_generated}/{args.num}")
-            print('-' * 50)
-
-        # If we have generated the required number of samples, break the for loop
-        if num_of_samples_generated == args.num:
-            break
-
-        # wait 0.1 seconds to avoid print overlapping
-        time.sleep(0.1)
-
-    print("\nFinished generating new samples!")
-
-
-if __name__ == '__main__':
-    main()
diff --git a/generate_new_lesions/utils.py b/generate_new_lesions/utils.py
deleted file mode 100644
index cd67e286..00000000
--- a/generate_new_lesions/utils.py
+++ /dev/null
@@ -1,200 +0,0 @@
-import os
-import re
-import numpy as np
-
-import matplotlib.pyplot as plt
-
-from scipy import ndimage
-from skimage import measure
-from spinalcordtoolbox.image import Image, zeros_like
-import skimage.exposure as exposure
-
-
-def coefficient_of_variation(masked_image):
-    return np.std(masked_image, ddof=1) / np.mean(masked_image) * 100
-
-
-def save_image_to_nifti(im, im_path, im_name):
-    """
-    Save image to nifti file
-    """
-    if not os.path.exists(im_path):
-        os.makedirs(im_path, exist_ok=True)
-    im_nifti = Image(im)
-    # im_nifti.setFileName(os.path.join(im_path, im_name))
-    im_nifti.save(os.path.join(im_path, im_name))
-
-
-def get_centerline(im_healthy_sc_data):
-    # Get centerline of the healthy SC
-    # for each slice in the mask_sc, get the center coordinate of the z-axis
-    num_z_slices = im_healthy_sc_data.shape[2]
-    healthy_centerline = list()
-    for z in range(num_z_slices):
-        x, y = ndimage.center_of_mass(im_healthy_sc_data[:, :, z])
-        # check if not nan (because spinal cord mask covers only spinal cord, not the whole image and all slices)
-        if not np.isnan(x) and not np.isnan(y):
-            healthy_centerline.append((round(x), round(y), z))
-
-    return healthy_centerline
-
-
-def get_lesion_volume(im_patho_lesion_data, voxel_dims, debug=False):
-    # Compute volume
-    nonzero_voxel_count = np.count_nonzero(im_patho_lesion_data)
-    voxel_size = np.prod(voxel_dims)
-    nonzero_voxel_volume = nonzero_voxel_count * voxel_size
-
-    if debug:
-        print("Voxel size = {}".format(voxel_size))
-        print("Number of non-zero voxels = {}".format(nonzero_voxel_count))
-        print(f"Volume of non-zero voxels = {nonzero_voxel_volume:.2f} mm^3")
-
-    return nonzero_voxel_volume
-
-
-def keep_largest_component(new_lesion_data):
-    """
-    Keep only the largest connected component in the lesion mask
-    """
-    # Get connected components
-    labels = measure.label(new_lesion_data)
-    # Get number of connected components
-    num_components = labels.max()
-    # Get size of each connected component
-    component_sizes = np.bincount(labels.ravel())
-    # Get largest connected component
-    largest_component = np.argmax(component_sizes[1:]) + 1
-    # Keep only the largest connected component
-    new_lesion_data[labels != largest_component] = 0
-
-    return new_lesion_data
-
-
-def fetch_subject_and_session(filename_path):
-    """
-    Get subject ID, session ID and filename from the input BIDS-compatible filename or file path
-    The function works both on absolute file path as well as filename
-    More about BIDS - https://bids-specification.readthedocs.io/en/stable/04-modality-specific-files/01-magnetic-resonance-imaging-data.html#anatomy-imaging-data
-    :param filename_path: input nifti filename (e.g., sub-001_ses-01_T1w.nii.gz) or file path
-    (e.g., /home/user/MRI/bids/sub-001/ses-01/anat/sub-001_ses-01_T1w.nii.gz
-    :return: subjectID: subject ID (e.g., sub-001)
-    :return: sessionID: session ID (e.g., ses-01)
-    :return: filename: nii filename (e.g., sub-001_ses-01_T1w.nii.gz)
-    """
-
-    _, filename = os.path.split(filename_path)              # Get just the filename (i.e., remove the path)
-    subject = re.search('sub-(.*?)[_/]', filename_path)     # [_/] slash or underscore
-    subjectID = subject.group(0)[:-1] if subject else None    # [:-1] removes the last underscore or slash
-    session = re.findall(r'ses-..', filename_path)
-    sessionID = session[0] if session else None               # Return None if there is no session
-    # REGEX explanation
-    # \d - digit
-    # \d? - no or one occurrence of digit
-    # *? - match the previous element as few times as possible (zero or more times)
-    # . - any character
-
-    return subjectID, sessionID, filename
-
-
-def generate_histogram(im_healthy_data, im_healthy_sc_data, im_healthy_sc_dil_data,
-                       im_patho_data, im_patho_sc_data, im_patho_sc_dil_data, im_patho_lesion_data,
-                       im_augmented_data, im_augmented_lesion_data, new_sc_data,
-                       sub_healthy, sub_patho, subject_name_out,
-                       output_dir):
-    """
-    Generate healthy-patho pair histogram for the whole image and for their SCs
-    :param im_healthy_data: healthy image data
-    :param im_healthy_sc_data: healthy image SC data
-    :param im_patho_data: patho image data
-    :param im_patho_sc_data: patho image SC data
-    :param im_patho_lesion_data: patho image lesion data
-    :param figure_path: path to save the figure
-    """
-
-    # Check if directory exists, if not create it
-    if not os.path.exists(output_dir):
-        os.makedirs(output_dir)
-    figure_path = output_dir + f"/{subject_name_out}_histogram.png"
-
-    # Create 1x2 subplots
-    fig, axs = plt.subplots(1, 1, tight_layout=True, figsize=(7, 4))
-    # # Whole images
-    # axs[0].hist(im_healthy_data.flatten(), bins=50, range=(0, 1), label=f'Healthy subject ({sub_healthy})',
-    #             alpha=0.3, histtype='step', linewidth=3, color='green')
-    # axs[0].hist(im_patho_data.flatten(), bins=50, range=(0, 1), label=f'Patho subject ({sub_patho})',
-    #             alpha=0.3, histtype='step', linewidth=3, color='red')
-    # axs[0].hist(im_augmented_data.flatten(), bins=50, range=(0, 1), label=f'Augmented subject ({subject_name_out})',
-    #             alpha=0.3, histtype='step', linewidth=3, color='blue')
-    # axs[0].set_title('Whole image')
-
-    # Spinal cords only
-    # Healthy SC
-    # axs[1].hist(im_healthy_data[im_healthy_sc_data > 0].flatten(), bins=50, range=(0, 1),
-    #             label=f'Healthy SC ({sub_healthy})', alpha=0.3, histtype='step', linewidth=3, color='green')
-    # # Patho SC minus lesion
-    # axs[1].hist(im_patho_data[(im_patho_sc_data > 0) & (im_patho_lesion_data == 0)].flatten(), bins=50, range=(0, 1),
-    #             label=f'Patho SC ({sub_patho})', alpha=0.3, histtype='step', linewidth=3, color='red')
-    # Patho SC dilated minus lesion
-    axs.hist(im_patho_data[(im_patho_sc_dil_data > 0) & (im_patho_lesion_data == 0)].flatten(), bins=50, range=None, #(0, 1),
-                label=f'Patho SC dilated ({sub_patho})', alpha=0.9, histtype='step', linewidth=3, color='green')
-    # Augmented SC dilated minus lesion
-    axs.hist(im_augmented_data[(im_healthy_sc_dil_data > 0) & (im_augmented_lesion_data == 0)].flatten(), bins=50, range=None, # (0, 1),
-                label=f'Augmented SC dilated ({subject_name_out})', alpha=0.7, histtype='step', linewidth=3, color='blue')
-    # Lesion only
-    axs.hist(im_patho_data[im_patho_lesion_data > 0].flatten(), bins=50, range=None, #(0, 1),
-                label=f'Patho lesion ({sub_patho})', alpha=0.9, histtype='step', linewidth=3, color='lightgreen')
-    # Augmented lesion only
-    axs.hist(im_augmented_data[im_augmented_lesion_data > 0].flatten(), bins=50, range=None, #(0, 1),
-                label=f'Augmented lesion ({subject_name_out})', alpha=0.9, histtype='step', linewidth=3, color='lightblue')
-    axs.set_title('Spinal cord only')
-
-    # Add legend to top right corner and decrease font size
-    axs.legend(loc='upper right', prop={'size': 8})
-    # axs[1].legend(loc='upper right', prop={'size': 8})
-    # Add x labels
-    axs.set_xlabel('Normalized Intensity')
-    # axs[1].set_xlabel('Normalized Intensity')
-    # Add y labels
-    axs.set_ylabel('Count')
-    # axs[1].set_ylabel('Count')
-    # Save plot
-    plt.savefig(figure_path, dpi=300)
-    print(f"Saved histogram to {figure_path}")
-    # Close plot
-    plt.close(fig)
-
-
-# helper functions for histogram matching
-def match_histogram(source_slice, target_slice):
-    matched_slice = exposure.match_histograms(source_slice, target_slice)
-    return matched_slice
-
-def match_histogram_3D(source_volume, target_volume):
-
-    # # Resample the volumes to a common shape
-    # common_shape = (
-    #     max(source_volume.shape[0], target_volume.shape[0]),
-    #     max(source_volume.shape[1], target_volume.shape[1]),
-    #     max(source_volume.shape[2], target_volume.shape[2])
-    #     )
-    # print(f"Common shape: {common_shape}")
-    
-    # # source_volume_resampled = zoom(source_volume, np.array(common_shape) / np.array(source_volume.shape))
-    # source_volume_resampled = zoom(source_volume, np.array(target_volume.shape) / np.array(source_volume.shape))
-    # print(f"Source volume resampled shape: {source_volume_resampled.shape}")
-    # # target_volume_resampled = zoom(target_volume, np.array(common_shape) / np.array(target_volume.shape))
-    # # print(f"Target volume resampled shape: {target_volume_resampled.shape}")
-    
-    # Perform histogram matching for each slice in the resampled volumes
-    matched_volume = np.empty_like(source_volume)
-    # for z in range(common_shape[2]):
-    for z in range(source_volume.shape[0]):
-        # matched_volume_resampled[..., z] = match_histogram(source_volume_resampled[..., z], target_volume_resampled[..., z])
-        matched_volume[z, ...] = match_histogram(source_volume[z, ...], target_volume[z, ...])
-    
-    # Rescale the matched volume back to the original shape
-    # matched_volume = zoom(matched_volume_resampled, source_volume.shape / common_shape)
-    # matched_volume = zoom(matched_volume_resampled, np.array(target_volume.shape) / np.array(common_shape))
-    
-    return matched_volume