Source code for metamorphic_relations.Results

import numpy as np
import matplotlib.pyplot as plt
import json
from tabulate import tabulate

from metamorphic_relations.Info import Info


[docs]class Results:
    """
    Create an object to store and manipulate the results given multiple sets of metamorphic relations (MRs)

    :param original_results: the results using the original data
    :param GMR_results: the results when augmenting the data with generic MRs (GMRs)
    :param DSMR_results: the results when augmenting the data with domain specific MRs (DSMRs)
    :param all_MR_results: the results when augmenting the data with GMRs and DSMRs
    :param individual_results: a list of results from individual MRs
    """

    def __init__(self, original_results: Info = None, GMR_results: Info = None, DSMR_results: Info = None,
                 all_MR_results: Info = None, individual_results: list[Info] = None):

        self.original_results = original_results
        self.GMR_results = GMR_results
        self.DSMR_results = DSMR_results
        self.all_MR_results = all_MR_results
        self.individual_results = individual_results

[docs]    def graph(self, set_name: str = "", train_f1s: bool = False, test_f1s: bool = True, original_counts: bool = True,
              show_sets: tuple[bool, bool, bool, bool] = (True, True, True, True)):
        """
        Graphs the results of the deep learning with MRs

        :param set_name: the name of the set trained, to be used in the title
        :param train_f1s: choose whether to show the train F1 scores
        :param test_f1s: choose whether to show the test F1 scores
        :param original_counts: choose whether to show the F1 scores against the number of original training elements or the actual counts (number of training elements after the MRs)
        :param show_sets: the sets of results to show of ["original_results", "GMR_results", "DSMR_results", "all_MR_results"]. E.g. [True, False, True, False] shows ["original_results", "DSMR_results"]
        """

        if not train_f1s and not test_f1s:
            raise Exception("Must choose to show either the training or testing results")
        if train_f1s and test_f1s:
            raise Exception("Cannot choose to show both the training and testing results together")
        if len(show_sets) != 4:
            raise Exception("show_sets must have four boolean values")

        legend = ["Unaltered Data", "Data + Generic MRs", "Data + Domain Specific MRs",
                  "Data + Generic & Domain Specific MRs"]
        legend = np.array(legend)[np.array(show_sets)]

        xs = []
        ys = []

        title = set_name + " "
        y_label = ""

        if original_counts:
            title += "Original Number of Data Points vs "
            x_label = "Number of given Data Points of Original Set"
            xs += self.get_forall_sets(show_sets, lambda x: x.original_count)
        else:
            title += "Actual Number of Data Points vs "
            x_label = "Number of given Data Points after MRs Applied"
            xs += self.get_forall_sets(show_sets, lambda x: x.actual_count)

        if train_f1s:
            title += "Train F1"
            y_label = "Train Macro F1 Score"
            ys += self.get_forall_sets(show_sets, lambda x: x.train_f1)
        elif test_f1s:
            title += "Test F1"
            y_label = "Test Macro F1 Score"
            ys += self.get_forall_sets(show_sets, lambda x: x.test_f1)

        plt.title(title)
        plt.xlabel(x_label)
        plt.ylabel(y_label)
        plt.xscale("log", base=2)
        [plt.scatter(xs[i], ys[i]) for i in range(len(xs))]
        plt.legend(legend)
        plt.show()

[docs]    def graph_all(self, set_name: str = ""):
        """
        Graphs the train and test results using original and actual counts

        :param set_name: the name of the set trained, to be used in all the graph titles
        """

        self.graph(set_name=set_name, train_f1s=True, test_f1s=False)
        self.graph(set_name=set_name)
        self.graph(set_name=set_name, train_f1s=True, test_f1s=False, original_counts=False)
        self.graph(set_name=set_name, original_counts=False)

[docs]    def print_individual(self):
        """
        Prints the individual results as a table
        """

        if self.individual_results is None:
            raise Exception("No individual results")

        table = [["No MRs", self.original_results.actual_count[0], round(self.original_results.train_f1[0], 4),
                  round(self.original_results.test_f1[0], 4)]]

        for result in self.individual_results:
            table.append(
                (result.name, result.actual_count[0], round(result.train_f1[0], 4), round(result.test_f1[0], 4)))

        table = sorted(table, key=lambda x: x[3], reverse=True)

        print(tabulate(table, headers=["MR Name", "Data Count", "Train F1", "Test F1"]))

[docs]    def get_forall_sets(self, is_set: tuple[bool, bool, bool, bool] = (True, True, True, True), get_set_function=None) -> list:
        """
        For all sets of results which are not None call a function

        :param is_set: the sets of results to use of ["original_results", "GMR_results", "DSMR_results", "all_MR_results"]. E.g. [True, False, True, False] uses ["original_results", "DSMR_results"]
        :param function get_set_function: the function to be used with the result sets
        :return: the results of the function for each non None set
        """

        if len(is_set) != 4:
            raise Exception("is_set must have four boolean values")

        results = []

        if is_set[0] and self.original_results is not None:
            results.append(get_set_function(self.original_results))

        if is_set[1] and self.GMR_results is not None:
            results.append(get_set_function(self.GMR_results))

        if is_set[2] and self.DSMR_results is not None:
            results.append(get_set_function(self.DSMR_results))

        if is_set[3] and self.all_MR_results is not None:
            results.append(get_set_function(self.all_MR_results))

        return results

[docs]    def write_to_file(self, filename: str) -> str:
        """
        Writes the results to a file

        :param filename: the file (or path) to write the data to
        :return: a string representation of the Results object
        """

        text = {"original_results": Results.get_JSON(self.original_results),
                "GMR_results": Results.get_JSON(self.GMR_results),
                "DSMR_results": Results.get_JSON(self.DSMR_results),
                "all_MR_results": Results.get_JSON(self.all_MR_results)}

        if self.individual_results is None:
            text["individual_results"] = "None"
        else:
            text["individual_results"] = ';'.join([Results.get_JSON(i) for i in self.individual_results])

        text = json.dumps(text)

        with open(filename, 'w') as file:
            file.write(text)

        return text

[docs]    @staticmethod
    def read_from_file(filename: str):
        """
        Reads results from a file in the Results class json format

        :param filename: the file (or path) to read the data from
        :return: a Results object
        :rtype: Results
        """

        file = open(filename, "r")

        text = file.read()

        str_results = json.loads(text)

        original_results = Info.from_JSON(str_results["original_results"])
        GMR_results = Info.from_JSON(str_results["GMR_results"])
        DSMR_results = Info.from_JSON(str_results["DSMR_results"])
        all_MR_results = Info.from_JSON(str_results["all_MR_results"])
        individual_results_list = str_results["individual_results"].split(";")
        individual_results = [Info.from_JSON(s) for s in individual_results_list]

        results = Results(original_results, GMR_results, DSMR_results, all_MR_results, individual_results)

        return results

[docs]    @staticmethod
    def get_JSON(info: Info | list[Info] = None) -> str:
        """

        :param info: the Info or list of Info objects to convert
        :return: None or a string in JSON form for the object
        """

        if info is None:
            return "None"
        else:
            return info.to_JSON()