This part of the project documentation focuses on an information-oriented approach. Use it as a reference for the technical implementation of the mlpForecaster project code.

evaluate_point_forecast

evaluate_point_forecast(outputs)

Evaluates point forecasts by computing daily pointwise metrics.

Parameters:

outputs (dict) –

A dictionary containing the true values, predicted values, and associated metadata. Expected keys: 'true' (ndarray): The true values. 'loc' (ndarray): The predicted values. 'index' (ndarray): The timestamps for each prediction. 'targets' (list): The names of the target variables.

Returns:

tuple –

A tuple containing: - pd_metrics (dict): DataFrame of combined metrics for each target variable. - split_metrics (dict): Dictionary of metrics split by target variable. - logs (dict): Any additional logs generated during the evaluation.

Source code in mlpforecast/metrics/deterministic.py

def evaluate_point_forecast(outputs):
    """
    Evaluates point forecasts by computing daily pointwise metrics.

    Args:
        outputs (dict): A dictionary containing the true values, predicted values, and associated metadata.
            Expected keys:
                'true' (ndarray): The true values.
                'loc' (ndarray): The predicted values.
                'index' (ndarray): The timestamps for each prediction.
                'targets' (list): The names of the target variables.

    Returns:
        (tuple): A tuple containing:
            - pd_metrics (dict): DataFrame of combined metrics for each target variable.
            - split_metrics (dict): Dictionary of metrics split by target variable.
            - logs (dict): Any additional logs generated during the evaluation.
    """
    pd_metrics = pd.DataFrame()
    for i in range(len(outputs["true"])):
        metrics = []

        for j in range(outputs["true"].shape[-1]):
            true = outputs["true"][i, :, j]
            pred = outputs["loc"][i, :, j]

            point_scores = get_daily_pointwise_metrics(pred, true, None)
            point_scores.insert(0, "target", outputs["targets"][j])
            metrics.append(point_scores)

        metrics_df = pd.concat(metrics)
        df = pd.DataFrame(outputs["index"][i], columns=["Date"])
        df["Date"] = pd.to_datetime(df["Date"], unit="ns")
        metrics_df.insert(0, "timestamp", df.Date.dt.round("D").unique()[-1])
        pd_metrics = pd.concat([pd_metrics, metrics_df], axis=0)
    pd_metrics.set_index("timestamp", inplace=True)

    return pd_metrics

get_nbias

get_nbias(y, y_hat, axis=0)

Calculates the normalized bias (NBias) between the true values and predicted values.

NBias is defined as the sum of the difference between the true values and predicted values, normalized by the sum of the true and predicted values.

Parameters:

y (ndarray) –

The true values.
y_hat (ndarray) –

The predicted values.
axis (int, default: 0 ) –

The axis along which to compute the NBias. Default is 0.

Returns:

float –

The normalized bias value.

Source code in mlpforecast/metrics/deterministic.py

def get_nbias(y, y_hat, axis=0):
    """
    Calculates the normalized bias (NBias) between the true values and predicted values.

    NBias is defined as the sum of the difference between the true values and predicted values,
    normalized by the sum of the true and predicted values.

    Args:
        y (ndarray): The true values.
        y_hat (ndarray): The predicted values.
        axis (int, optional): The axis along which to compute the NBias. Default is 0.

    Returns:
        (float): The normalized bias value.
    """
    epsilon = np.finfo(np.float64).eps  # Small value to avoid division by zero
    scale = y + y_hat  # Sum of true and predicted values
    nbias = (y - y_hat) / np.maximum(scale, epsilon)  # Normalized bias calculation
    output_errors = nbias
    return np.sum(
        output_errors, axis=axis
    )  # Sum of output errors along the specified axis

get_pointwise_metrics

get_pointwise_metrics(
    pred: array, true: array, target_range: float = None
)

Calculate pointwise metrics

Parameters:

pred (array) –

predicted values
true (array) –

true values
target_range (float, default: None ) –

range of the target variable

Returns:

dict –

pointwise metrics

Source code in mlpforecast/metrics/deterministic.py

def get_pointwise_metrics(pred: np.array, true: np.array, target_range: float = None):
    """
    Calculate pointwise metrics

    Args:
        pred (np.array): predicted values
        true (np.array): true values
        target_range (float): range of the target variable

    Returns:
        (dict): pointwise metrics

    """
    assert pred.ndim == 1, "pred must be 1-dimensional"
    assert true.ndim == 1, "pred must be 1-dimensional"
    assert pred.shape == true.shape, "pred and true must have the same shape"
    target_range = true.max() - true.min() if target_range is None else target_range

    mse = mean_squared_error(true, pred)
    rmse = np.sqrt(mean_squared_error(true, pred))
    nrmse = min(rmse / target_range, 1)
    mae = mean_absolute_error(true, pred)
    mape = mean_absolute_percentage_error(true, pred)
    corr = np.corrcoef(true, pred)[0, 1]
    max_res = max_error(pred, true)
    d2_err = d2_absolute_error_score(pred, true)
    nbias = get_nbias(true, pred)
    corr = np.corrcoef(true, pred)[0, 1]
    r2 = r2_score(pred, true)
    smape = get_smape(true, pred)

    return {
        "MSE": mse,
        "RMSE": rmse,
        "NRMSE": nrmse,
        "MAE": mae,
        "MAPE(%)": mape * 100,
        "CORR": corr,
        "MAX-error": max_res,
        "D2-error": d2_err,
        "NBIAS": nbias,
        "R2-error": r2,
        "SMAPE(%)": smape * 100,
    }

get_smape

get_smape(y, y_hat, axis=0)

Calculates the Symmetric Mean Absolute Percentage Error (SMAPE) between the true values and predicted values.

SMAPE is defined as the average of the absolute percentage errors, normalized by the sum of the absolute values of the true and predicted values.

Parameters:

y (ndarray) –

The true values.
y_hat (ndarray) –

The predicted values.
axis (int, default: 0 ) –

The axis along which to compute the SMAPE. Default is 0.

Returns:

float –

The symmetric mean absolute percentage error value.

Source code in mlpforecast/metrics/deterministic.py

def get_smape(y, y_hat, axis=0):
    """
    Calculates the Symmetric Mean Absolute Percentage Error (SMAPE) between the true values and predicted values.

    SMAPE is defined as the average of the absolute percentage errors, normalized by the sum of the absolute values of
    the true and predicted values.

    Args:
        y (ndarray): The true values.
        y_hat (ndarray): The predicted values.
        axis (int, optional): \
              The axis along which to compute the SMAPE. Default is 0.

    Returns:
        (float): The symmetric mean absolute percentage error value.
    """
    epsilon = np.finfo(np.float64).eps
    # Small value to avoid division by zero
    scale = np.abs(y) + np.abs(y_hat)
    # Sum of absolute true and predicted values
    output_errors = 2 * (
        np.abs(y - y_hat) / np.maximum(scale, epsilon)
    )  # SMAPE calculation
    return np.average(output_errors, axis=axis)