Source code for src.helpers.utilities

import argparse
import json
import pprint

import matplotlib as mpl
from sklearn import metrics

from src.data_model.data_model import *

LOGGER = logging.getLogger(__name__)


# *================================= metrics =================================*
[docs]def get_iou_score(y_true: np.array, y_pred: np.array) -> float:
    """
    Calculates the Intersection over Union score given a mask and a prediction.

    :param y_true: the true mask corresponding to the prediction
    :param y_pred: the prediction
    :return: IoU
    """
    intersection = np.logical_and(y_true, y_pred)
    union = np.logical_or(y_true, y_pred)
    iou_score = np.sum(intersection) / np.sum(union)

    return iou_score


[docs]def classification_report(predictions: List[np.array],
                          masks: List[np.array],
                          save_path: str = None) -> pd.DataFrame:
    """
    Generates a classification report by comparing each mask and prediction
    in the input list of predictions and masks. If a save path is provided
    then the classification report is saved. The metrics returned in the
    report are: IoU, AUC_PR, Precision, Recall, F1, Accuracy, FN, FP, TN,
    and TP.

    :param predictions: a list of predictions
    :param masks: a list of masks corresponding to the predictions
    :param save_path: the output path to saved the classifcation report
    :return: a classification report df
    """
    metric_df = pd.DataFrame({"IoU": [], "Precision": [], "Recall": [],
                              "F1": [], "Accuracy": [], "AUC_PR": [],
                              "FN": [], "FP": [], "TN": [], "TP": []})

    with tqdm(total=len(predictions), file=sys.stdout) as pbar:
        for pred, mask in zip(predictions, masks):
            # grab the original image and reconstructed image
            y_true = mask.round().flatten()
            y_pred = pred.flatten()

            avg_pr = metrics.average_precision_score(y_true, y_pred)

            y_pred = y_pred.round()

            tn, fp, fn, tp = metrics.confusion_matrix(y_true, y_pred,
                                                      labels=[0,1]).ravel()
            iou = get_iou_score(y_true, y_pred)

            # set values to 0 if there are no true positives
            if tp > 0:
                precision = tp / (tp + fp)
                recall = tp / (tp + fn)
                f1 = tp / (tp + 0.5 * (fn + fp))
            else:
                precision = 0
                recall = 0
                f1 = 0

            d = {"IoU": iou,
                 "AUC_PR": avg_pr,
                 "Precision": precision,
                 "Recall": recall,
                 "F1": f1,
                 "Accuracy": (tp + tn) / (tp + fn + tn + fp),
                 "FN": fn,
                 "FP": fp,
                 "TN": tn,
                 "TP": tp}

            metric_df = metric_df.append(d, ignore_index=True)

            pbar.update(1)

        if save_path:
            metric_df.to_csv(save_path)

    return metric_df


# *=============================== data model ================================*
[docs]def create_file_name(output_folder_path, output_file_name, i,
                     placeholder_size):
    """
    Creates the output folder path if it doesn't exist. The input number,
    i, is zero padded according to the placeholder size and appended to
    the output filename. This filename is appended to the output folder path
    and returned.

    :param output_folder_path: the output folder path
    :param output_file_name: the filename to which the zero-padded number
     must be appended
    :param i: the number to zero pad
    :param placeholder_size: determines how much to zero pad i; i.e. if
     placeholder size is 3 and i =1, the number used in the filename will be 001
    :return: an output file path
    """
    Path(output_folder_path).mkdir(parents=True, exist_ok=True)

    file_name, extension = \
        str.rsplit(output_file_name, ".", 1)
    final_file_name = f"{file_name}_{i:0{placeholder_size}}.{extension}"
    final_file_name = os.path.join(output_folder_path, final_file_name)

    return final_file_name


[docs]def trim_image_array(image_array: np.array,
                     output_size: int,
                     axis: str,
                     trim_dir: int) -> np.array:
    """
    Trims an image, either from the start or the end, along a single axis.

    :param image_array: the input image
    :param output_size: the output size of the image; i.e. informs how much
     of the image to trim
    :param axis: one of either "x", "y" or both
    :param trim_dir: the trim direction, either -1 or 1; 1 trims from the
     start of the image and -1 trims from the end
    :return: the trimmed image
    """
    image_shape = image_array.shape

    if axis not in ["x", "y"]:
        raise ValueError("Please input one of 'x', 'y' as the axis")

    if trim_dir not in [-1, 1]:
        raise ValueError("Please input one of -1 or 1 as the trim "
                         "direction")

    if axis == "y":
        diff = image_shape[0] - output_size
    if axis == "x":
        diff = image_shape[1] - output_size
        image_array = image_array.transpose()

    if trim_dir == 1:
        # exclude the first x_diff columns
        image_array = image_array[diff:, :]
    if trim_dir == -1:
        # exclude the last x_diff rows
        image_array = image_array[:-diff, :]

    if axis == "x":
        image_array = image_array.transpose()

    return image_array


# *================================== plots ==================================*
[docs]def update_plot_format(default: bool = False) -> None:
    """
    Updates the matplotlib RC. This function can also be used to set the rc
    back to the default configuration.

    :param default: whether to set the RC to the custom config or to the
     default config
    :return: None
    """
    if default:
        mpl.rcParams.update(mpl.rcParamsDefault)
    else:
        # Project specific params
        LOGGER.info(
            "Note these changes will apply the entire session, please run  "
            "this function with `default = True` to restore default "
            "matplotlib settings")
        mpl.rcParams['lines.linewidth'] = 3
        mpl.rcParams['axes.spines.top'] = False
        mpl.rcParams['axes.spines.right'] = False
        mpl.rcParams['axes.linewidth'] = 1.5
        mpl.rcParams['xtick.labelsize'] = 12
        mpl.rcParams['ytick.labelsize'] = 12


# *================================= dataset =================================*
[docs]def create_subfolders(path: Path, folder: str) -> None:
    """
    Creates leaf and mask subfolders at the given base path and folder.

    :param path: base path
    :param folder: the folder in the path under which the subfolders should
     be created
    :return: None
    """
    path.joinpath(folder, "leaves").mkdir(parents=True,
                                          exist_ok=True)
    path.joinpath(folder, "masks").mkdir(parents=True,
                                         exist_ok=True)


# *============================== all __main__ ===============================*
[docs]def create_sequence_objects(sequence_input: Dict):
    """
    Creates a list of LeafSequence and MaskSequence objects.

    :param sequence_input: a dict with the details of how the sequence
     should be created; this dict can control in which mode the sequence
     objects are created in
    :return: a list of LeafSequence and a list MaskSequence objects
    """
    lseqs = []
    mseqs = []

    leaf_dict = sequence_input["leaves"]["input"]
    if leaf_dict is not None:
        leaf_keys = list(leaf_dict.keys())
        for vals in zip(*list(leaf_dict.values())):
            kwargs = {key: val for key, val in zip(leaf_keys, vals)}
            lseqs.append(LeafSequence(**kwargs))

    mask_dict = sequence_input["masks"]["input"]
    if mask_dict is not None:
        mask_keys = list(mask_dict.keys())
        for vals in zip(*list(mask_dict.values())):
            kwargs = {key: val for key, val in zip(mask_keys, vals)}
            mseqs.append(MaskSequence(**kwargs))

    return lseqs, mseqs


[docs]def load_image_objects(seq_objects,
                       load_images: bool = False,
                       **kwargs) -> None:
    """
    Creates image object for each sequence object in a list of sequence
    objects. No object is return but the sequence objects are mutated.

    :param seq_objects: the list of sequence objects whose images need to be
     created
    :param load_images: whether image arrays for the created objects should
     be loaded
    :param kwargs: kwargs for loading image, if load_images is true
    :return: None
    """
    LOGGER.info(f"Creating image objects for "
                f"{seq_objects[0].__class__.__name__}")

    for seq in seq_objects:
        LOGGER.info(f"Creating {seq.num_files} objects")
        seq.load_extracted_images(load_image=load_images, **kwargs)


# *============================ package __main__ =============================*
# *------------------------------- procedures --------------------------------*
[docs]def trim_sequence_images(seq_objects,
                         x_size_dir_list: List[Tuple[int, int]] = None,
                         y_size_dir_list: List[Tuple[int, int]] = None,
                         overwrite: bool = False,
                         **kwargs) -> None:
    """
    Trims either a images in a list MaskSequence or LeafSequence objects. No
    object is returned but the trim images are saved.

    :param seq_objects: either a list of MaskSequence or LeafSequence objects
    :param y_size_dir_list: a list of tuples; each tuple is in the format of
     (output size, trim_direction), where trim direction is either 1 or -1,
     which indicates to trim from either the top or bottom respectively
    :param x_size_dir_list: a list of tuples; each tuple is in the format of
     (output size, trim_direction), where trim direction is either 1 or -1,
     which indicates to trim from either the left or right respectively
    :param overwrite: whether tiles that exist at the same file path should
     be overwritten
    :param kwargs: kwargs for loading the images in the sequence object
    :return: None
    """
    for seq, x_size_dir, y_size_dir in \
            zip(seq_objects, x_size_dir_list, y_size_dir_list):
        seq.load_image_array(**kwargs)

        seq.trim_image_sequence(x_size_dir, y_size_dir, overwrite)

        seq.unload_extracted_images()


# *-------------------------------- argparse ---------------------------------*
[docs]def parse_arguments() -> argparse.Namespace:
    """
     Argument parser

    :return: An argparse namespace
    """
    parser = argparse.ArgumentParser("Perform operations using the "
                                     "plant-image-segmentation code base")

    parser.add_argument(
        "-i", "--interactive", action="store_true", default=False,
        help="flag to run the script in interactive mode")

    parser.add_argument("-j", "--json_path", metavar="\b", type=str,
                        help="path to input parameters for an action")

    subparsers = parser.add_subparsers(
        title="actions", description='possible actions using this module')

    parser.add_argument("-fj", "--filepath_json", metavar="\b", type=str,
                        help="path to a JSON file with the required "
                             "parameters to create LeafSequence and "
                             "MaskSequence objects")

    parser_extract_images = subparsers.add_parser("extract_images",
                                                  help="extraction help")
    parser_extract_images.set_defaults(which='extract_images')

    parser_extract_images.add_argument(
        "--leaf_output_path", "-lo", metavar="\b",
        help="output paths, if the paths are in the input json enter "
             "\"same\"")

    parser_extract_images.add_argument(
        "--mask_output_path", "-mo", metavar="\b",
        help="output paths, if the paths are in the input json enter "
             "\"same\"")

    parser_extract_images.add_argument(
        "--overwrite", "-o", action="store_true", default=False,
        help="overwrite existing images, note this flag is applied to both "
             "mask and leaf images")

    parser_extract_images.add_argument(
        "--binarise", "-b", action="store_true", default=False,
        help="save binary masks")

    parser_extract_tiles = subparsers.add_parser("extract_tiles",
                                                 help="extraction help")
    parser_extract_tiles.set_defaults(which="extract_tiles")

    parser_extract_tiles.add_argument("-sx", "--stride_x", metavar="\b",
                                      type=int, help="x stride size")
    parser_extract_tiles.add_argument("-sy", "--stride_y", metavar="\b",
                                      type=int, help="y stride size")
    parser_extract_tiles.add_argument("-lx", "--length_x", metavar="\b",
                                      type=int, help="tile x length")
    parser_extract_tiles.add_argument("-ly", "--length_y", metavar="\b",
                                      type=int, help="tile y length")

    parser_extract_tiles.add_argument(
        "--leaf_output_path", "-lo", metavar="\b",
        help="output paths, if you want to use "
             "the default path enter  \"default\", if the paths are in "
             "the input json enter  \"same\"")

    parser_extract_tiles.add_argument(
        "--mask_output_path", "-mo", metavar="\b",
        help="output paths, if you want to use "
             "the default path enter  \"default\", if the paths are in "
             "the input json enter  \"same\"")

    parser_extract_tiles.add_argument(
        "--overwrite", "-o", action="store_true", default=False,
        help="overwrite existing images, note this flag is applied to both "
             "mask and leaf images")

    parser_trim_sequence = subparsers.add_parser(
        "trim_sequence", help="trims every image in an image sequence ")
    parser_trim_sequence.set_defaults(which='trim_sequence')

    parser_trim_sequence.add_argument(
        "--mask", "-m", action="store_true", default=False,
        help="whether the mask sequence should be trimmed, default is for "
             "the leaf sequence to be trimmed")
    parser_trim_sequence.add_argument(
        "--y_size_dir", "-ysd", metavar="\b",
        help="y output size and direction to be passed in as a tuple, "
             "where a 1 or -1 indicated to trim either top or bottom "
             "respectively")
    parser_trim_sequence.add_argument(
        "--x_size_dir", "-xsd", metavar="\b",
        help="x output size and direction to be passed in as a tuple, "
             "where a 1 or -1 indicated to trim either left or right "
             "respectively")
    parser_trim_sequence.add_argument(
        "--overwrite", "-o", action="store_true", default=False,
        help="whether or not the image being trimmed should be overwritten")

    parser_plot_profile = subparsers.add_parser(
        "plot_profile", help="plot an embolism profile")
    parser_plot_profile.set_defaults(which="plot_profile")
    parser_plot_profile.add_argument(
        "--output_path", "-o", type=str, metavar="\b", help="The plot output "
                                                            "path")
    parser_plot_profile.add_argument(
        "--show", "-s", action="store_true", help="flag indicating if the "
                                                  "plot should be shown")
    parser_plot_profile.add_argument(
        "--leaf_names", "-ln", type=str, metavar="\b",
        help="leaf names to be used in plot title")

    parser_plot_embolism_counts = subparsers.add_parser(
        "plot_embolism_counts", help="plot the embolism count profile for a "
                                     "dataset")
    parser_plot_embolism_counts.set_defaults(which="plot_embolism_counts")
    parser_plot_embolism_counts.add_argument(
        "--output_path", "-o", type=str, metavar="\b", help="The plot output "
                                                            "path")
    parser_plot_embolism_counts.add_argument(
        "--show", "-s", action="store_true", help="flag indicating if the "
                                                  "plot should be shown")
    parser_plot_embolism_counts.add_argument(
        "--leaf_names", "-ln", type=str, metavar="\b",
        help="leaf names to be used in plot title")
    parser_plot_embolism_counts.add_argument(
        "--tile", "-t", action="store_true",
        help="indicates if the plot should be created using tiles")
    parser_plot_embolism_counts.add_argument(
        "--leaf_embolism_only", "-leo", action="store_true",
        help="should only full leaves with embolisms be used")
    parser_plot_embolism_counts.add_argument(
        "--percent", "-p", action="store_true",
        help="should the plot y-axis be expressed as a percent")

    parser_eda_df = subparsers.add_parser(
        "eda_df", help="extract an eda dataframe")
    parser_eda_df.set_defaults(which="eda_df")

    parser_eda_df.add_argument(
        "csv_output_path", help="output paths, if the paths are in the input "
                                "json enter \"same\"")
    parser_eda_df.add_argument("--tiles", "-t", action="store_true")

    parser_databunch_df = subparsers.add_parser(
        "databunch_df", help="extract an databunch dataframe")
    parser_databunch_df.set_defaults(which="databunch_df")

    parser_databunch_df.add_argument(
        "csv_output_path", help="output paths, if the paths are in the input"
                                " json enter \"same\"")

    parser_databunch_df.add_argument("--tiles", "-t", action="store_true")
    parser_databunch_df.add_argument("--tile_embolism_only", "-teo",
                                     action="store_true",
                                     help="should only tiles with embolisms "
                                          "be used")
    parser_databunch_df.add_argument(
        "--leaf_embolism_only", "-leo", action="store_true",
        help="should only full leaves with embolisms be used")

    parser_prediction = subparsers.add_parser(
        "predict", help="generate predictions using a saved model")
    parser_prediction.set_defaults(which="predict")
    parser_prediction.add_argument(
        "--model_path", "-mp", type=str, metavar="\b",
        help="the path to the saved model weights to restore")
    parser_prediction.add_argument(
        "--threshold", "-t", type=str, metavar="\b",
        help="classification threshold to determine if a pixel is an embolism "
             "or not.")
    parser_prediction.add_argument(
        "--csv_path", "-cp", type=str, metavar="\b",
        help="csv path of where the classification report should be saved; "
             "this flag determines if a classification report is generated")
    parser_prediction.add_argument(
        "--leaf_shape", "-ls", type=str, metavar="\b",
        help="leaf shape, please separate each number by a ';'")

    parser_dataset = subparsers.add_parser(
        "create_dataset", help="create a dataset for model training")
    parser_dataset.set_defaults(which="create_dataset")
    parser_dataset.add_argument(
        "--dataset_path", "-dp", type=str, metavar="\b",
        help="the path where the dataset should be created,including the "
             "dataset name")
    parser_dataset.add_argument(
        "--downsample_split", "-ds", type=float, metavar="\b",
        help="the fraction of non-embolism images to remove")
    parser_dataset.add_argument(
        "--test_split", "-ts", type=float, metavar="\b",
        help="the fraction of the data to use for a test set")
    parser_dataset.add_argument(
        "--val_split", "-vs", type=float, metavar="\b",
        help="the fraction of the data to use for a val set")

    # TODO: add either or to lolo and test split
    parser_dataset.add_argument(
        "--lolo", "-l", type=int, metavar="\b",
        help="the leaf to leave out for the test set")

    parser_dataset = subparsers.add_parser(
        "augment_dataset", help="augment a dataset for model training")
    parser_dataset.set_defaults(which="augment_dataset")

    args = parser.parse_args()
    return args


# *--------------------------- interactive prompt ----------------------------*
[docs]def print_options_dict(output_dict: Dict) -> None:
    """
    Print a formatted version of the results of the output dict generated by
    the input prompt

    :param output_dict: the output dict to print
    :return: None
    """
    print(f"\nYour chosen configuration is:\n")
    for i, (key, val) in enumerate(output_dict.items()):
        if i == 0:
            num = "  "
        else:
            num = str(i) + "."
        if isinstance(val, dict):
            print_str = "\n" + pprint.pformat(val) + "\n"
        else:
            print_str = val

        print(f"{num} {(' '.join(key.split('_'))).capitalize() :<20}:"
              f" {print_str}")


[docs]def requirements(operation: int) -> None:
    """
    Used to add the requirements for a particular operation to the input
    prompt.

    :param operation: the operation whose requirements should be printed
    :return: None
    """
    if operation == 8:
         print("\nNote:"
               "\n - Only one of either Mask or Leaf sequences can be trimmed "
               "at a time")
    if operation == 9:
        print("\nRequirements:"
              "\n - This action currently only works using the default "
              "chips-<> object locations; that is the chips-<> folder "
              "should be in the parent folder of where your mask and "
              "leaf images respectively."
              "\n - All mask tiles and leaf tiles must have the same "
              "extension respectively.")
    if operation == 10:
        print("\nNote: Only embolism leaves will be augmented"
              "\nRequirements:"
              "\n - The dataset folder structure should follow the default "
              "structure, which is created when using option 9 (above)."
              "\n -  Please ensure that the following format is followed in "
              "the images to be augmented: "
              "<name>_<image_number>_<tile_number>; this is required both "
              "for linking and for naming")


[docs]def interactive_prompt() -> Dict:
    """
    Interactive prompt which allows users to interact with the code base.
    The results are returned as a dict. There is an option, through the
    prompt, to save the input as a json to be used again.

    :return: None
    """
    happy = False
    options_list = set((-1,))
    operation_names = ["extract_images", "extract_tiles", "plot_profile",
                       "plot_embolism_counts", "eda_df", "databunch_df",
                       "predict", "trim_sequence", "create_dataset",
                       "augment_dataset"]

    while not happy:
        if -1 in options_list:
            output_dict = {}

            print("* What action would you like to take?\n"
                  "------------ Extraction ------------\n"
                  " 1. Extract images\n"
                  " 2. Extract tiles\n"
                  "------------- Plotting -------------\n"
                  " 3. Plot embolism profile\n"
                  " 4. Plot embolism count barplot\n"
                  "--------------- EDA ----------------\n"
                  " 5. EDA DataFrame\n"
                  " 6. DataBunch DataFrame\n"
                  "------------ Prediction ------------\n"
                  " 7. Tensorflow Model\n"
                  "------------- General --------------\n"
                  " 8. Trim sequence\n"
                  "------------- Dataset --------------\n"
                  " 9. Create Dataset\n"
                  "10. Augment Dataset"
                  )

            operation = int(input("Please select your operation: "))
            output_dict["which"] = operation_names[operation - 1]

            # Include the max of all options: 1 - 11
            # This is the number of unique questions
            options_list.update(range(1, 11))

            options_list.remove(-1)
        print("Please separate multiple answers by a ';'. NOTE: the individual"
              "file paths cannot contain semi-colons")

        requirements(operation)

        if 1 in options_list:
            leaf_input_path = input(
                "\n1. Where are the leaf images that you would like to"
                " use?\nPlease include the filename pattern if"
                " necessary\n(Leave this blank to skip)\nAnswer: ")

            output_dict["leaves"] = {
                "input": {"folder_path": [], "filename_pattern": []},
                "format": {}}

            # capture leave format, questions depends on whether leaves have
            # been extracted. Grouped with option 1
            if operation == 1:
                print("\nWould you like to shift the leaves by 256 before "
                      "extracting?\n"
                      "   Options:\n"
                      "   0: No\n"
                      "   1: Yes")
                leaves_format = int(input("Please choose a number: "))

                output_dict["leaves"]["format"]["shift_256"] = (
                        leaves_format == 1)
            else:
                print("\nWould you like to load your image in a specific "
                      "format?\n"
                      "Note: if this is left blank, the images will be loaded "
                      "in their default format\n"
                      "   Options:\n"
                      "   0: uint8\n"
                      "   1: shifted -256 (don't chose this option unless "
                      "images were shifted by +256 when saved)")

                leaves_format = input("Please choose a number: ")
                if leaves_format == "":
                    leaves_format = None
                else:
                    leaves_format = int(leaves_format)

                if leaves_format == 0:
                    output_dict["leaves"]["format"]["transform_uint8"] = True
                elif leaves_format == 1:
                    output_dict["leaves"]["format"]["shift_256"] = True

            if leaf_input_path:
                for path in leaf_input_path.split(";"):
                    folder_path, filename = path.rsplit("/", 1)
                    output_dict["leaves"]["input"]["folder_path"].append(
                        folder_path + "/")
                    output_dict["leaves"]["input"]["filename_pattern"].append(
                        filename)

            options_list.remove(1)

        if 2 in options_list:
            mask_input_path = input(
                "\n2. Where are the mask images that you would like to"
                " use include the filename pattern if"
                " necessary\n(Leave this blank to skip)\nAnswer: ")

            if operation == 1:
                output_dict["masks"] = {
                    "input": {"mpf_path": mask_input_path.split(";")}}
            else:
                output_dict["masks"] = {
                    "input": {"folder_path": [], "filename_pattern": []}}

                if mask_input_path:
                    for path in mask_input_path.split(";"):
                        folder_path, filename = path.rsplit("/", 1)
                        output_dict["masks"]["input"]["folder_path"].append(
                            folder_path + "/")
                        output_dict["masks"]["input"][
                            "filename_pattern"].append(filename)

                options_list.remove(2)

        if operation == 1 or operation == 2:
            if 3 in options_list:
                if leaf_input_path:
                    leaf_output_path = input(
                        "\n3. Where do you want to save the extracted leaves."
                        "\n   Please also include the file name."
                        "\nAnswer: ")

                    output_dict["leaf_output_path"] = leaf_output_path
                else:
                    print("\nYou did not enter a leaf directory, so question 3"
                          " will be skipped.")
                    output_dict["leaf_output_path"] = None

                options_list.remove(3)

            if 4 in options_list:
                if mask_input_path:
                    mask_output_path = input(
                        "\n4. Where do you want to save the extracted masks."
                        "\n   Please also include the file name."
                        "\nAnswer: ")

                    output_dict["mask_output_path"] = mask_output_path
                else:
                    print("\nYou did not enter a mask directory, so question 4"
                          " will be skipped.")

                    output_dict["mask_output_path"] = None

                options_list.remove(4)

            if 5 in options_list:
                print("\n5. Would you like to overwrite any existing "
                      "extracted images?\n"
                      "   Options:\n"
                      "   0: False\n"
                      "   1: True")
                overwrite = input("Please choose a number: ")
                overwrite = int(overwrite) == 1

                output_dict["overwrite"] = overwrite

                options_list.remove(5)

        if operation == 1:
            if 6 in options_list:
                if mask_input_path:
                    print("\n6. Would you like to save binarised masks - i.e."
                          " pixel values as 0, 1?\n"
                          "   Options:\n"
                          "   0: False\n"
                          "   1: True")
                    binarise = input("Please choose a number: ")
                    binarise = int(binarise) == 1

                    output_dict["binarise"] = binarise
                else:
                    print("\nYou did not enter a mask directory, so question 6"
                          " will be skipped.")

                    output_dict["binarise"] = None

                options_list.remove(6)

        if operation == 2:
            if 6 in options_list:
                sx = input("\n6. Please enter the size of the x stride: ")

                output_dict["stride_x"] = int(sx)

                options_list.remove(6)

            if 7 in options_list:
                sy = input("\n7. Please enter the size of the y stride: ")

                output_dict["stride_y"] = int(sy)

                options_list.remove(7)

            if 8 in options_list:
                lx = input("\n8. Please enter the width of the tile"
                           " (x length): ")

                output_dict["length_x"] = int(lx)

                options_list.remove(8)

            if 9 in options_list:
                ly = input("\n9. Please enter the length of the tile"
                           " (y length): ")

                output_dict["length_y"] = int(ly)

                options_list.remove(9)

        if operation == 3 or operation == 4:
            if 3 in options_list:
                output_path = input(
                    "\n3. Please enter the image output paths, enter a"
                    " path, including the filename, for each image."
                    "\nAnswer: ")

                output_dict["output_path"] = output_path

                options_list.remove(3)

            if 4 in options_list:
                leaf_names = input(
                    "\n4. What leaf names should be used in the plot "
                    "title?\nPlease enter a name per leaf: ")

                output_dict["leaf_names"] = leaf_names

                options_list.remove(4)

            if 5 in options_list:
                print("\n5. Would you like to display the plot before exiting"
                      " the script?\n"
                      "   Options:\n"
                      "   0: No\n"
                      "   1: Yes")
                show = input("Please choose a number: ")
                show = int(show) == 1

                output_dict["show"] = show

                options_list.remove(5)

        if operation == 4:
            if 6 in options_list:
                print("\n6. Should only leaves with embolisms be used?\n"
                      "   Options:\n"
                      "   0: No\n"
                      "   1: Yes")
                leo = input("Please choose a number: ")
                leo = int(leo) == 1

                output_dict["leaf_embolism_only"] = leo

                options_list.remove(6)

            if 7 in options_list:
                print("\n7. Would you like to create the plot using image "
                      "tiles\n"
                      "   Options:\n"
                      "   0: No\n"
                      "   1: Yes")
                tile = input("Please choose a number: ")
                tile = int(tile) == 1

                output_dict["tile"] = tile

                options_list.remove(7)

            if 8 in options_list:
                print("\n8. Should the y-axis scale use percentages?\n"
                      "   Options:\n"
                      "   0: No\n"
                      "   1: Yes")
                percent = input("Please choose a number: ")
                percent = int(percent) == 1

                output_dict["percent"] = percent

                options_list.remove(8)

        if operation == 5 or operation == 6:
            if 3 in options_list:
                csv_output_path = input(
                    "\n3. Where do you want to save the csv output?."
                    "\n   Please also include the file name."
                    "\nAnswer: ")

                output_dict["csv_output_path"] = csv_output_path

                options_list.remove(3)

            if 4 in options_list:
                print("\n4. Would you like to create the data frame using"
                      " tiles\n"
                      "   Options:\n"
                      "   0: No\n"
                      "   1: Yes")
                tiles = input("Please choose a number: ")
                tiles = int(tiles) == 1

                output_dict["tiles"] = tiles

                options_list.remove(4)

            if 5 in options_list and operation == 5:
                print("\n5. Please choose which fields you would like included"
                      " in the EDA DataFrame\n"
                      "Options:\n"
                      "0: Linked filename\n"
                      "1: Unique range\n"
                      "2: Embolism percent\n"
                      "3: Intersection\n"
                      "4: Has embolism\n")

                eda_options = input("Choose the relevant number(s) separated"
                                    " by a ';' : ").split(";")

                output_dict["eda_df_options"] = {"linked_filename": False,
                                                 "unique_range": False,
                                                 "embolism_percent": False,
                                                 "intersection": False,
                                                 "has_embolism": False}

                eda_df_options = list(output_dict["eda_df_options"])

                for option in eda_options:
                    output_dict["eda_df_options"][
                        eda_df_options[int(option)]] = True

                options_list.remove(5)

        if operation == 6:
            if 5 in options_list:
                print("\n5. Should only leaves with embolisms be used?\n"
                      "   Options:\n"
                      "   0: No\n"
                      "   1: Yes")
                leo = input("Please choose a number: ")
                leo = int(leo) == 1

                output_dict["leaf_embolism_only"] = leo

                options_list.remove(5)

            if 6 in options_list:
                if tiles:
                    print("\n6. Should only tiles with embolisms be used?\n"
                          "   Options:\n"
                          "   0: No\n"
                          "   1: Yes")
                    teo = input("Please choose a number: ")
                    teo = int(teo) == 1
                else:
                    teo = False

                output_dict["tile_embolism_only"] = teo

                options_list.remove(6)

        if operation == 7:
            if 3 in options_list:
                model_path = input("\n3. Please provide the model weights "
                                   "path: ")

                output_dict["model_path"] = model_path

                options_list.remove(3)

            if 4 in options_list:
                leaf_shape = input("\n4. Please enter the leaf image shape: ")

                output_dict["leaf_shape"] = leaf_shape

                options_list.remove(4)

            if 5 in options_list:
                threshold = input(
                    "\n5. Please enter the classification threshold to "
                    "determine if a pixel is an embolism or not."
                    "\n(Leave this blank to use 0.5) \nAnswer: ")

                if not threshold:
                    threshold = 0.5

                output_dict["threshold"] = float(threshold)

                options_list.remove(5)

            if 6 in options_list:
                csv_path = input(
                    "\n6 Please provide a .csv save path if you would "
                    "like to generate a classification report."
                    "\n(Leave this blank to skip)\nAnswer: ")

                output_dict["csv_path"] = csv_path

                options_list.remove(6)

        if operation == 8:
            if 3 in options_list:
                ysd = input(
                    "\n3. What is the y output size and directions?"
                    "\n   Note, for direction, a 1 or -1 indicates to trim"
                    " either the top or bottom respectively."
                    "\n Leave this blank to skip."
                    "\nPlease provide your answer as a tuple, and please"
                    " separate these answers by a ';' (if no trimming is "
                    "required for a particular sequence answer 'None'): ")

                if ysd == "":
                    ysd = None

                output_dict["y_size_dir"] = ysd

                options_list.remove(3)

            if 4 in options_list:
                xsd = input(
                    "\n4. What is the x output size and directions?"
                    "\n   Note, for direction, a 1 or -1 indicates to trim"
                    " either the left or right respectively."
                    "\n Leave this blank to skip."
                    "\nPlease provide your answer as a tuple, and please"
                    " separate these answers by a ';' (if no trimming is "
                    "required for a particular sequence answer 'None'): ")

                if xsd == "":
                    xsd = None

                output_dict["x_size_dir"] = xsd

                options_list.remove(4)

            if 5 in options_list:
                print("\n5. Would you like to overwrite any existing "
                      "extracted images?\n"
                      "   Options:\n"
                      "   0: False\n"
                      "   1: True")
                overwrite = input("Please choose a number: ")
                overwrite = int(overwrite) == 1

                output_dict["overwrite"] = overwrite

                options_list.remove(5)

            if 6 in options_list:
                print("\n6. Would you like to trim mask images (instead of "
                      "leaf images)?\n"
                      "   Options:\n"
                      "   0: No\n"
                      "   1: Yes")
                trim_masks = input("Please choose a number: ")
                trim_masks = int(trim_masks) == 1

                output_dict["mask"] = trim_masks

                options_list.remove(6)

        if operation == 9:
            if 3 in options_list:
                dataset_path = input(
                    "\n3. Where would you like to save the dataset? "
                    "\nPlease provide a path, including the dataset name"
                    "\nAnswer: ")

                output_dict["dataset_path"] = dataset_path

            if 4 in options_list:
                downsample_split = input(
                    "\n4. What fraction of the non-embolism samples would you "
                    "like to remove? "
                    "\n Please enter a value between 0 and <1; enter 0 for no "
                    "downsampling."
                    "\nAnswer: ")

                output_dict["downsample_split"] = float(downsample_split)

            if 5 in options_list:
                val_split = input(
                    "\n5. What fraction of the data would you like to use "
                    "for a validation set ? "
                    "\n Please enter a value between 0 and <1; enter 0 for no "
                    "validation set."
                    "\nAnswer: ")

                output_dict["val_split"] = float(val_split)


            if 6 in options_list:
                test_split = input(
                    "\n6. What fraction of the data would you like to use "
                    "for a test set? "
                    "\n Please enter a value between 0 and <1; enter 0 for no "
                    "test set."
                    "\n If you want to use a complete leaf as a test set, "
                    "please enter 0 and answer the next question."
                    "\nAnswer: ")

                output_dict["test_split"] = float(test_split)

            if 7 in options_list:
                lolo = input(
                    "\n7. If you would like to use a complete leaf for the "
                    "test test, please provide the number of the leaf in "
                    "from questions 1 and 2; i.e. the position of the leaf "
                    "in your entry string." 
                    "\n Note: the count starts at 1"
                    "\n Leave this blank to skip"
                    "\nAnswer: ")

                output_dict["lolo"] = lolo

        if operation not in list(range(1, 11)):
            raise ValueError("Please choose an option from the input list")

        print_options_dict(output_dict)

        options_list = input(
            "\nIf you are satisfied with this configurations, please enter 0."
            "\nIf not, please enter the number(s) of the options you would"
            " like to change.\nTo restart please enter -1."
            "\nSeparate multiple options by a ';' : ")
        options_list = set([int(choice) for choice in options_list.split(";")])

        if len(options_list) == 1 and 0 in options_list:
            happy = True
        elif 0 in options_list:
            print("\nYou entered options in addition to 0, so 0 will be "
                  "removed")
            options_list.remove(0)

    save_path = input("\nIf you would like to save this configuration"
                      " please enter the full json file name, including"
                      " the file path: ")

    if save_path:
        with open(save_path, 'w') as file:
            json.dump(output_dict, file)

    return output_dict
# *===========================================================================*