
calculation

check_properties(*args)

Checks which of the arguments have values (are neither None nor empty) and returns the fraction that do.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `args` | `list` | All the arguments. | `()` |

Returns:

| Type | Description |
| --- | --- |
| `float` | The fraction (mean) of arguments that have values. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 191-203
def check_properties(*args):
    """
    Check if all the arguments have values.

    Args:
        args (list): All the arguments.

    Returns:
        float: The mean of arguments that have values.
    """

    result = map(lambda x: x is not None and x != "", args)
    return np.mean(list(result))
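
A minimal usage sketch (the values passed here are hypothetical; any argument that is `None` or an empty string counts as missing):

```python
from nebula.addons.trustworthiness.calculation import check_properties

# Two of the four arguments below have values, so the result is 0.5.
ratio = check_properties("epsilon", None, 0.5, "")
print(ratio)  # 0.5
```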

get_avg_loss_accuracy(loss_files, accuracy_files)

Calculates the mean loss and mean accuracy of the nodes' models.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `loss_files` | `list` | Files that contain the loss of the nodes' models. | *required* |
| `accuracy_files` | `list` | Files that contain the accuracies of the nodes' models. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `tuple` | 3-tuple: the mean loss of the models, the mean accuracy of the models, and the standard deviation of the accuracies. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 325-357
def get_avg_loss_accuracy(loss_files, accuracy_files):
    """
    Calculates the mean accuracy and loss models of the nodes.

    Args:
        loss_files (list): Files that contain the loss of the models of the nodes.
        accuracy_files (list): Files that contain the acurracies of the models of the nodes.

    Returns:
        3-tupla: The mean loss of the models, the mean accuracies of the models, the standard deviation of the accuracies of the models.
    """
    total_accuracy = 0
    total_loss = 0
    number_files = len(loss_files)
    accuracies = []

    for file_loss, file_accuracy in zip(loss_files, accuracy_files, strict=False):
        with open(file_loss) as f:
            loss = f.read()

        with open(file_accuracy) as f:
            accuracy = f.read()

        total_loss += float(loss)
        total_accuracy += float(accuracy)
        accuracies.append(float(accuracy))

    avg_loss = total_loss / number_files
    avg_accuracy = total_accuracy / number_files

    # stdev needs at least two data points; fall back to 0.0 for a single node
    std_accuracy = statistics.stdev(accuracies) if len(accuracies) > 1 else 0.0

    return avg_loss, avg_accuracy, std_accuracy
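
A usage sketch with two synthetic nodes; each file is assumed to hold a single plain-text number, as the function expects:

```python
import os
import tempfile

from nebula.addons.trustworthiness.calculation import get_avg_loss_accuracy

tmpdir = tempfile.mkdtemp()
loss_files, accuracy_files = [], []
for i, (loss, acc) in enumerate([(0.40, 0.91), (0.50, 0.89)]):
    loss_path = os.path.join(tmpdir, f"loss_{i}.txt")
    acc_path = os.path.join(tmpdir, f"accuracy_{i}.txt")
    with open(loss_path, "w") as f:
        f.write(str(loss))
    with open(acc_path, "w") as f:
        f.write(str(acc))
    loss_files.append(loss_path)
    accuracy_files.append(acc_path)

avg_loss, avg_accuracy, std_accuracy = get_avg_loss_accuracy(loss_files, accuracy_files)
print(avg_loss, avg_accuracy, std_accuracy)  # 0.45 0.9 ~0.014
```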

get_bytes_models(models_files)

Calculates the mean size in bytes of the nodes' final models.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `models_files` | `list` | List of final models. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `float` | The mean size of the models in bytes. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 267-287
def get_bytes_models(models_files):
    """
    Calculates the mean bytes of the final models of the nodes.

    Args:
        models_files (list): List of final models.

    Returns:
        float: The mean bytes of the models.
    """

    total_models_size = 0
    number_models = len(models_files)

    for file in models_files:
        model_size = os.path.getsize(file)
        total_models_size += model_size

    avg_model_size = total_models_size / number_models

    return avg_model_size
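
A sketch with two dummy model files (hypothetical paths; any files on disk work, since only `os.path.getsize` is used):

```python
import os
import tempfile

from nebula.addons.trustworthiness.calculation import get_bytes_models

tmpdir = tempfile.mkdtemp()
models_files = []
for i, size in enumerate([1000, 3000]):
    path = os.path.join(tmpdir, f"model_{i}.pt")
    with open(path, "wb") as f:
        f.write(b"\x00" * size)
    models_files.append(path)

print(get_bytes_models(models_files))  # 2000.0
```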

get_bytes_sent_recv(bytes_sent_files, bytes_recv_files)

Calculates the total and mean bytes sent and received by the nodes.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `bytes_sent_files` | `list` | Files that contain the bytes sent by the nodes. | *required* |
| `bytes_recv_files` | `list` | Files that contain the bytes received by the nodes. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `tuple` | 4-tuple: the total bytes sent, the total bytes received, the mean bytes sent, and the mean bytes received by the nodes. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 290-322
def get_bytes_sent_recv(bytes_sent_files, bytes_recv_files):
    """
    Calculates the mean bytes sent and received of the nodes.

    Args:
        bytes_sent_files (list): Files that contain the bytes sent of the nodes.
        bytes_recv_files (list): Files that contain the bytes received of the nodes.

    Returns:
        4-tupla: The total bytes sent, the total bytes received, the mean bytes sent and the mean bytes received of the nodes.
    """
    total_upload_bytes = 0
    total_download_bytes = 0
    number_files = len(bytes_sent_files)

    for file_bytes_sent, file_bytes_recv in zip(bytes_sent_files, bytes_recv_files, strict=False):
        with open(file_bytes_sent) as f:
            bytes_sent = f.read()

        with open(file_bytes_recv) as f:
            bytes_recv = f.read()

        total_upload_bytes += int(bytes_sent)
        total_download_bytes += int(bytes_recv)

    avg_upload_bytes = total_upload_bytes / number_files
    avg_download_bytes = total_download_bytes / number_files
    return (
        total_upload_bytes,
        total_download_bytes,
        avg_upload_bytes,
        avg_download_bytes,
    )
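
A sketch along the same lines as the previous examples; each file holds a single integer byte count:

```python
import os
import tempfile

from nebula.addons.trustworthiness.calculation import get_bytes_sent_recv

tmpdir = tempfile.mkdtemp()
sent_files, recv_files = [], []
for i, (sent, recv) in enumerate([(100, 400), (300, 600)]):
    sent_path = os.path.join(tmpdir, f"sent_{i}.txt")
    recv_path = os.path.join(tmpdir, f"recv_{i}.txt")
    with open(sent_path, "w") as f:
        f.write(str(sent))
    with open(recv_path, "w") as f:
        f.write(str(recv))
    sent_files.append(sent_path)
    recv_files.append(recv_path)

total_sent, total_recv, avg_sent, avg_recv = get_bytes_sent_recv(sent_files, recv_files)
print(total_sent, total_recv, avg_sent, avg_recv)  # 400 1000 200.0 500.0
```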

get_clever_score(model, test_sample, nb_classes, learning_rate)

Calculates the CLEVER (Cross Lipschitz Extreme Value for nEtwork Robustness) score.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `model` | `object` | The model. | *required* |
| `test_sample` | `object` | One test sample to calculate the CLEVER score. | *required* |
| `nb_classes` | `int` | The number of classes of the model. | *required* |
| `learning_rate` | `float` | The learning rate of the model. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `float` | The CLEVER score. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 400-439
def get_clever_score(model, test_sample, nb_classes, learning_rate):
    """
    Calculates the CLEVER score.

    Args:
        model (object): The model.
        test_sample (object): One test sample to calculate the CLEVER score.
        nb_classes (int): The nb_classes of the model.
        learning_rate (float): The learning rate of the model.

    Returns:
        float: The CLEVER score.
    """

    images, _ = test_sample
    background = images[-1]

    criterion = nn.CrossEntropyLoss()
    optimizer = optim.Adam(model.parameters(), learning_rate)

    # Create the ART classifier
    classifier = PyTorchClassifier(
        model=model,
        loss=criterion,
        optimizer=optimizer,
        input_shape=(1, 28, 28),
        nb_classes=nb_classes,
    )

    # Estimate the untargeted CLEVER score from 10 batches of 5 random
    # perturbations within an L2 ball of radius R_L2 around the input.
    score_untargeted = clever_u(
        classifier,
        background.numpy(),
        10,  # nb_batches
        5,  # batch_size
        R_L2,  # radius of the maximum perturbation
        norm=2,
        pool_factor=3,
        verbose=False,
    )
    return score_untargeted
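
A hedged sketch with a toy classifier; the function hard-codes a `(1, 28, 28)` input shape, so the sample must match it (MNIST-like data is assumed, and the random tensors below are placeholders, not a real evaluation set):

```python
import torch
from torch import nn

from nebula.addons.trustworthiness.calculation import get_clever_score

model = nn.Sequential(nn.Flatten(), nn.Linear(28 * 28, 10))  # toy stand-in
test_sample = (torch.rand(32, 1, 28, 28), torch.randint(0, 10, (32,)))

# Only the last image of the batch is used as the evaluated input.
score = get_clever_score(model, test_sample, nb_classes=10, learning_rate=1e-3)
print(score)
```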

get_cv(list=None, std=None, mean=None)

Get the coefficient of variation.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `list` | `list` | List for which the coefficient of variation will be calculated. | `None` |
| `std` | `float` | Standard deviation of a list. | `None` |
| `mean` | `float` | Mean of a list. | `None` |

Returns:

| Type | Description |
| --- | --- |
| `float` | The calculated coefficient of variation. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 206-224
def get_cv(list=None, std=None, mean=None):
    """
    Get the coefficient of variation.

    Args:
        list (list): List in which the coefficient of variation will be calculated.
        std (float): Standard deviation of a list.
        mean (float): Mean of a list.

    Returns:
        float: The coefficient of variation calculated.
    """
    if std is not None and mean is not None:
        return std / mean

    if list is not None:
        return np.std(list) / np.mean(list)

    return 0
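
Both call styles, using hypothetical numbers (note that the list form uses the population standard deviation via `np.std`):

```python
from nebula.addons.trustworthiness.calculation import get_cv

print(get_cv(list=[2.0, 4.0, 6.0]))  # np.std / np.mean ~= 0.408
print(get_cv(std=0.05, mean=0.90))   # 0.0555...
```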

get_elapsed_time(scenario)

Calculates the elapsed time during the execution of the scenario.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `scenario` | `object` | The scenario record; fields 1 and 2 hold the start and end timestamps. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `float` | The elapsed time in minutes. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 246-264
def get_elapsed_time(scenario):
    """
    Calculates the elapsed time during the execution of the scenario.

    Args:
        scenario (object): The scenario record; fields 1 and 2 hold the start and end timestamps.

    Returns:
        float: The elapsed time in minutes.
    """
    start_time = scenario[1]
    end_time = scenario[2]

    start_date = datetime.strptime(start_time, "%d/%m/%Y %H:%M:%S")
    end_date = datetime.strptime(end_time, "%d/%m/%Y %H:%M:%S")

    elapsed_time = (end_date - start_date).total_seconds() / 60

    return elapsed_time
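
A sketch with a hypothetical scenario record; only fields 1 and 2 are read, and they must use the `%d/%m/%Y %H:%M:%S` format:

```python
from nebula.addons.trustworthiness.calculation import get_elapsed_time

scenario = ("my_scenario", "01/01/2024 10:00:00", "01/01/2024 10:45:00")
print(get_elapsed_time(scenario))  # 45.0 (minutes)
```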

get_feature_importance_cv(model, test_sample)

Calculates the coefficient of variation of the feature importance.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `model` | `object` | The model. | *required* |
| `test_sample` | `object` | One test sample to calculate the feature importance. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `float` | The coefficient of variation of the feature importance. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 360-397
def get_feature_importance_cv(model, test_sample):
    """
    Calculates the coefficient of variation of the feature importance.

    Args:
        model (object): The model.
        test_sample (object): One test sample to calculate the feature importance.

    Returns:
        float: The coefficient of variation of the feature importance.
    """

    try:
        cv = 0
        batch_size = 10
        device = "cpu"

        if isinstance(model, torch.nn.Module):
            batched_data, _ = test_sample

            n = batch_size
            m = math.floor(0.8 * n)

            background = batched_data[:m].to(device)
            test_data = batched_data[m:n].to(device)

            e = shap.DeepExplainer(model, background)
            shap_values = e.shap_values(test_data)
            if shap_values is not None and len(shap_values) > 0:
                sums = np.array([shap_values[i].sum() for i in range(len(shap_values))])
                abs_sums = np.absolute(sums)
                cv = variation(abs_sums)
    except Exception as e:
        logger.warning(f"Could not compute feature importance CV with shap: {e}")
        cv = 1
    if math.isnan(cv):
        cv = 1
    return cv
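
A hedged sketch with a toy model; the function splits the hard-coded batch of 10 samples into 8 SHAP background samples and 2 test samples, so the batch should hold at least 10 items (the random tensors are placeholders):

```python
import torch
from torch import nn

from nebula.addons.trustworthiness.calculation import get_feature_importance_cv

model = nn.Sequential(nn.Flatten(), nn.Linear(28 * 28, 10))  # toy stand-in
test_sample = (torch.rand(10, 1, 28, 28), torch.randint(0, 10, (10,)))

print(get_feature_importance_cv(model, test_sample))  # 1 if shap fails
```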

get_global_privacy_risk(dp, epsilon, n)

Calculates the global privacy risk by epsilon and the number of clients.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `dp` | `bool` | Indicates whether differential privacy is used. | *required* |
| `epsilon` | `int` | The epsilon value. | *required* |
| `n` | `int` | The number of clients in the scenario. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `float` | The global privacy risk. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 227-243
def get_global_privacy_risk(dp, epsilon, n):
    """
    Calculates the global privacy risk by epsilon and the number of clients.

    Args:
        dp (bool): Indicates if differential privacy is used or not.
        epsilon (int): The epsilon value.
        n (int): The number of clients in the scenario.

    Returns:
        float: The global privacy risk.
    """

    if dp is True and isinstance(epsilon, numbers.Number):
        return 1 / (1 + (n - 1) * math.pow(e, -epsilon))
    else:
        return 1
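
The risk follows 1 / (1 + (n - 1) * e^(-epsilon)), so it grows with epsilon and shrinks as more clients participate; without differential privacy it is pinned to 1. For example:

```python
from nebula.addons.trustworthiness.calculation import get_global_privacy_risk

print(get_global_privacy_risk(True, 1, 10))      # 1 / (1 + 9 * e^-1) ~= 0.232
print(get_global_privacy_risk(False, None, 10))  # 1, no differential privacy
```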

get_map_value_score(score_key, score_map)

Finds the score by the score_key in the score_map and returns the value.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `score_key` | `string` | The key to look up in the score_map. | *required* |
| `score_map` | `dict` | The score map defined in the eval_metrics.json file. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `float` | The score obtained from the score_map. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 94-110
def get_map_value_score(score_key, score_map):
    """
    Finds the score by the score_key in the score_map and returns the value.

    Args:
        score_key (string): The key to look up in the score_map.
        score_map (dict): The score map defined in the eval_metrics.json file.

    Returns:
        float: The score obtained from the score_map.
    """
    score = 0
    if score_map is None:
        logger.warning("Score map is missing")
    else:
        score = score_map[score_key]
    return score
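
A sketch with a hypothetical score map (in practice the map comes from the eval_metrics.json file):

```python
from nebula.addons.trustworthiness.calculation import get_map_value_score

score_map = {"cross_entropy": 0.8, "mse": 0.5}  # hypothetical entries
print(get_map_value_score("cross_entropy", score_map))  # 0.8
print(get_map_value_score("anything", None))            # 0, logs a warning
```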

get_mapped_score(score_key, score_map)

Finds the score by the score_key in the score_map.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `score_key` | `string` | The key to look up in the score_map. | *required* |
| `score_map` | `dict` | The score map defined in the eval_metrics.json file. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `float` | The normalized score in [0, 1]. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 28-49
def get_mapped_score(score_key, score_map):
    """
    Finds the score by the score_key in the score_map.

    Args:
        score_key (string): The key to look up in the score_map.
        score_map (dict): The score map defined in the eval_metrics.json file.

    Returns:
        float: The normalized score in [0, 1].
    """
    score = 0
    if score_map is None:
        logger.warning("Score map is missing")
    else:
        keys = list(score_map.keys())
        scores = list(score_map.values())
        normalized_scores = get_normalized_scores(scores)
        normalized_score_map = dict(zip(keys, normalized_scores, strict=False))
        score = normalized_score_map.get(score_key, np.nan)

    return score
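
Unlike get_map_value_score, the map's values are min-max normalized before the lookup. A sketch with a hypothetical map:

```python
from nebula.addons.trustworthiness.calculation import get_mapped_score

score_map = {"fedavg": 2, "krum": 3, "trimmedmean": 4}  # hypothetical entries
print(get_mapped_score("krum", score_map))     # (3 - 2) / (4 - 2) = 0.5
print(get_mapped_score("unknown", score_map))  # nan, key not in the map
```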

get_normalized_scores(scores)

Calculates the normalized scores of a list.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `scores` | `list` | The values that will be normalized. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `list` | The normalized list. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 52-63
def get_normalized_scores(scores):
    """
    Calculates the normalized scores of a list.

    Args:
        scores (list): The values that will be normalized.

    Returns:
        list: The normalized list.
    """
    # Min-max normalization; note this divides by zero if all scores are equal.
    normalized = [(x - np.min(scores)) / (np.max(scores) - np.min(scores)) for x in scores]
    return normalized
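
Min-max normalization maps the smallest score to 0 and the largest to 1:

```python
from nebula.addons.trustworthiness.calculation import get_normalized_scores

print(get_normalized_scores([10, 20, 40]))  # [0.0, 0.333..., 1.0]
```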

get_range_score(value, ranges, direction='asc')

Maps the value to a range and gets the score by the range and direction.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `value` | `int` | The input score. | *required* |
| `ranges` | `list` | The ranges defined. | *required* |
| `direction` | `string` | 'asc' means higher ranges yield higher scores; 'desc' means the opposite. | `'asc'` |

Returns:

| Type | Description |
| --- | --- |
| `float` | The normalized score in [0, 1]. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 66-91
def get_range_score(value, ranges, direction="asc"):
    """
    Maps the value to a range and gets the score by the range and direction.

    Args:
        value (int): The input score.
        ranges (list): The ranges defined.
        direction (string): 'asc' means higher ranges yield higher scores; 'desc' means the opposite.

    Returns:
        float: The normalized score in [0, 1].
    """

    if not isinstance(value, (int, float)):
        logger.warning("Input value is not a number")
        logger.warning(f"{value}")
        return 0
    else:
        score = 0
        if ranges is None:
            logger.warning("Score ranges are missing")
        else:
            total_bins = len(ranges) + 1
            bin_index = np.digitize(value, ranges, right=True)
            score = 1 - (bin_index / total_bins) if direction == "desc" else bin_index / total_bins
        return score
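
With hypothetical bin edges, `np.digitize` places the value into one of `len(ranges) + 1` bins, and the bin index is normalized by the number of bins:

```python
from nebula.addons.trustworthiness.calculation import get_range_score

ranges = [10, 100, 1000]  # hypothetical bin edges, 4 bins in total
print(get_range_score(5, ranges))             # bin 0 of 4 -> 0.0
print(get_range_score(2000, ranges))          # bin 3 of 4 -> 0.75
print(get_range_score(2000, ranges, "desc"))  # 1 - 0.75 = 0.25
```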

get_scaled_score(value, scale, direction)

Maps a score of a specific scale into the scale between zero and one.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `value` | `int or float` | The raw value of the metric. | *required* |
| `scale` | `list` | List containing the minimum and maximum values the value can fall between. | *required* |
| `direction` | `str` | 'asc' means higher values yield higher scores; 'desc' means the opposite. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `float` | The normalized score in [0, 1]. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 141-174
def get_scaled_score(value, scale: list, direction: str):
    """
    Maps a score of a specific scale into the scale between zero and one.

    Args:
        value (int or float): The raw value of the metric.
        scale (list): List containing the minimum and maximum values the value can fall between.
        direction (str): 'asc' means higher values yield higher scores; 'desc' means the opposite.

    Returns:
        float: The normalized score in [0, 1].
    """

    score = 0
    try:
        value_min, value_max = scale[0], scale[1]
    except Exception:
        logger.warning("Score minimum or score maximum is missing. The minimum has been set to 0 and the maximum to 1")
        value_min, value_max = 0, 1
    if value is None:
        logger.warning("Score value is missing. Set value to zero")
    else:
        low, high = 0, 1
        if value >= value_max:
            score = 1
        elif value <= value_min:
            score = 0
        else:
            diff = value_max - value_min
            diffScale = high - low
            score = (float(value) - value_min) * (float(diffScale) / diff) + low
        if direction == "desc":
            score = high - score

    return score
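
Linear scaling between the two scale endpoints, with clipping at both ends:

```python
from nebula.addons.trustworthiness.calculation import get_scaled_score

print(get_scaled_score(60, [50, 100], "asc"))   # (60 - 50) / 50 = 0.2
print(get_scaled_score(60, [50, 100], "desc"))  # 1 - 0.2 = 0.8
print(get_scaled_score(200, [50, 100], "asc"))  # clipped to 1
```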

get_true_score(value, direction)

Returns 1 minus the value if direction is 'desc'; otherwise returns the value.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `value` | `int` | The input score. | *required* |
| `direction` | `string` | 'asc' means higher values yield higher scores; 'desc' means the opposite. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `float` | The score obtained. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 113-138
def get_true_score(value, direction):
    """
    Returns 1 minus the value if direction is 'desc', otherwise returns the value.

    Args:
        value (int): The input score.
        direction (string): 'asc' means higher values yield higher scores; 'desc' means the opposite.

    Returns:
        float: The score obtained.
    """

    if value is True:
        return 1
    elif value is False:
        return 0
    else:
        if not isinstance(value, (int, float)):
            logger.warning("Input value is not a number")
            logger.warning(f"{value}.")
            return 0
        else:
            if direction == "desc":
                return 1 - value
            else:
                return value
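
Booleans map directly to 1 and 0; numeric values are inverted when direction is 'desc':

```python
from nebula.addons.trustworthiness.calculation import get_true_score

print(get_true_score(True, "asc"))  # 1
print(get_true_score(0.3, "desc"))  # 1 - 0.3 = 0.7
print(get_true_score(0.3, "asc"))   # 0.3
```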

get_value(value)

Get the value of a metric.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `value` | `float` | The value of the metric. | *required* |

Returns:

| Type | Description |
| --- | --- |
| `float` | The value of the metric. |

Source code in nebula/addons/trustworthiness/calculation.py, lines 177-188
def get_value(value):
    """
    Get the value of a metric.

    Args:
        value (float): The value of the metric.

    Returns:
        float: The value of the metric.
    """

    return value

stop_emissions_tracking_and_save(tracker, outdir, emissions_file, role, workload, sample_size=0)

Stops the CodeCarbon emissions tracker and appends the relevant information to the emissions.csv file.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| `tracker` | `object` | The emissions tracker object holding information. | *required* |
| `outdir` | `str` | The path of the output directory of the experiment. | *required* |
| `emissions_file` | `str` | The path to the emissions file. | *required* |
| `role` | `str` | Either client or server depending on the role. | *required* |
| `workload` | `str` | Either aggregation or training depending on the workload. | *required* |
| `sample_size` | `int` | The number of samples used for training; 0 if the workload is aggregation. | `0` |
Source code in nebula/addons/trustworthiness/calculation.py, lines 442-505
def stop_emissions_tracking_and_save(
    tracker: EmissionsTracker,
    outdir: str,
    emissions_file: str,
    role: str,
    workload: str,
    sample_size: int = 0,
):
    """
    Stops the CodeCarbon emissions tracker and appends the relevant information to the emissions.csv file.

    Args:
        tracker (object): The emissions tracker object holding information.
        outdir (str): The path of the output directory of the experiment.
        emissions_file (str): The path to the emissions file.
        role (str): Either client or server depending on the role.
        workload (str): Either aggregation or training depending on the workload.
        sample_size (int): The number of samples used for training; 0 if the workload is aggregation.
    """

    tracker.stop()

    emissions_file = os.path.join(outdir, emissions_file)

    if exists(emissions_file):
        df = pd.read_csv(emissions_file)
    else:
        df = pd.DataFrame(
            columns=[
                "role",
                "energy_grid",
                "emissions",
                "workload",
                "CPU_model",
                "GPU_model",
                "CPU_used",
                "GPU_used",
                "energy_consumed",
                "sample_size",
            ]
        )
    try:
        # Grid carbon intensity in gCO2eq/kWh (emissions in kg, energy in kWh)
        energy_grid = (tracker.final_emissions_data.emissions / tracker.final_emissions_data.energy_consumed) * 1000
        df = pd.concat(
            [
                df,
                pd.DataFrame({
                    "role": role,
                    "energy_grid": [energy_grid],
                    "emissions": [tracker.final_emissions_data.emissions],
                    "workload": workload,
                    "CPU_model": tracker.final_emissions_data.cpu_model
                    if tracker.final_emissions_data.cpu_model
                    else "None",
                    "GPU_model": tracker.final_emissions_data.gpu_model
                    if tracker.final_emissions_data.gpu_model
                    else "None",
                    "CPU_used": True if tracker.final_emissions_data.cpu_energy else False,
                    "GPU_used": True if tracker.final_emissions_data.gpu_energy else False,
                    "energy_consumed": tracker.final_emissions_data.energy_consumed,
                    "sample_size": sample_size,
                }),
            ],
            ignore_index=True,
        )
        df.to_csv(emissions_file, encoding="utf-8", index=False)
    except Exception as e:
        logger.warning(e)
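
A hedged end-to-end sketch with CodeCarbon (the directory, file name, and tracker configuration below are hypothetical; the tracker must have been started so that final_emissions_data is populated, and the function itself calls tracker.stop()):

```python
import os

from codecarbon import EmissionsTracker

from nebula.addons.trustworthiness.calculation import stop_emissions_tracking_and_save

outdir = "/tmp/experiment"  # hypothetical output directory
os.makedirs(outdir, exist_ok=True)

tracker = EmissionsTracker(log_level="error")  # hypothetical configuration
tracker.start()

# ... run the training workload being measured ...

stop_emissions_tracking_and_save(
    tracker,
    outdir=outdir,
    emissions_file="emissions.csv",
    role="client",
    workload="training",
    sample_size=1024,
)
```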