PyPI - tsadmetrics - Versions diffs - 0.1.0__py3-none-any.whl - Mend

tsadmetrics 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11) hide show

tsadmetrics/__init__.py +17 -0
tsadmetrics/binary_metrics.py +962 -0
tsadmetrics/metric_utils.py +320 -0
tsadmetrics/non_binary_metrics.py +92 -0
tsadmetrics/py.typed +0 -0
tsadmetrics/ts_aware_utils.py +2 -0
tsadmetrics/utils.py +42 -0
tsadmetrics-0.1.0.dist-info/METADATA +10 -0
tsadmetrics-0.1.0.dist-info/RECORD +11 -0
tsadmetrics-0.1.0.dist-info/WHEEL +5 -0
tsadmetrics-0.1.0.dist-info/top_level.txt +1 -0

tsadmetrics/metric_utils.py ADDED Viewed

@@ -0,0 +1,320 @@
+import numpy as np
+from _tsadeval.metrics import Binary_anomalies, pointwise_to_full_series, segmentwise_to_full_series, DelayThresholdedPointAdjust
+def get_tp_tn_fp_fn_point_wise(y_true: np.array,y_pred: np.array):
+    """Count point-wise confusion-matrix entries for two label sequences.
+
+    The sequences are compared pairwise. A true label equal to 1 is treated
+    as the positive class; any other true label is treated as negative.
+
+    Returns:
+        Tuple ``(TP, TN, FP, FN)`` of integer counts.
+    """
+    counts = {"TP": 0, "TN": 0, "FP": 0, "FN": 0}
+    for actual, predicted in zip(y_true, y_pred):
+        is_positive = actual == 1
+        if actual == predicted:
+            outcome = "TP" if is_positive else "TN"
+        else:
+            outcome = "FN" if is_positive else "FP"
+        counts[outcome] += 1
+    return counts["TP"], counts["TN"], counts["FP"], counts["FN"]
+def get_events(y_true,anomaly=True):
+    """Return the maximal runs of one label as inclusive ``(start, end)`` index pairs.
+
+    Parameters:
+        y_true: Sequence of labels.
+        anomaly: When True, runs of label 1 are collected; otherwise runs of label 0.
+
+    Returns:
+        List of ``(start_index, end_index)`` tuples in order of appearance.
+    """
+    target = 1 if anomaly else 0
+    events = []
+    run_start = None
+    for idx, label in enumerate(y_true):
+        if label == target:
+            # Entering (or continuing) a run of the target label.
+            if run_start is None:
+                run_start = idx
+            continue
+        if run_start is not None:
+            # A different label closes the run that was open.
+            events.append((run_start, idx - 1))
+            run_start = None
+    if run_start is not None:
+        # The sequence ended while a run was still open.
+        events.append((run_start, len(y_true) - 1))
+    return events
+def calculate_intersection(event1, event2):
+    """Return the inclusive overlap ``[start, end]`` of two events, or None if they are disjoint.
+
+    Each event is indexed as ``event[0]`` (start) and ``event[1]`` (end).
+    """
+    overlap = [max(event1[0], event2[0]), min(event1[1], event2[1])]
+    # An empty overlap shows up as a start that lies past the end.
+    return overlap if overlap[0] <= overlap[1] else None
+def get_tp_tn_fp_fn_point_adjusted(y_true: np.array,y_pred: np.array):
+    """Compute point-adjusted confusion counts.
+
+    TN and FP are the point-wise counts. TP and FN are counted per true
+    anomaly event: when at least one predicted anomaly point falls inside the
+    event, every point of the event counts as TP, otherwise every point
+    counts as FN.
+
+    Parameters:
+        y_true: Ground-truth labels (1 marks an anomaly).
+        y_pred: Predicted labels (1 marks an anomaly).
+
+    Returns:
+        Tuple ``(TP, TN, FP, FN)``.
+    """
+    _, TN, FP, _ = get_tp_tn_fp_fn_point_wise(y_true, y_pred)
+    TP = 0
+    FN = 0
+    y_true_events = get_events(y_true, anomaly=True)
+    y_pred_events = get_events(y_pred, anomaly=True)
+    i_pred = 0
+    for start, end in y_true_events:
+        # Drop predicted events that end before this true event begins; events
+        # are ordered, so they cannot overlap any later true event either.
+        while i_pred < len(y_pred_events) and y_pred_events[i_pred][1] < start:
+            i_pred += 1
+        event_size = end - start + 1
+        # The current predicted event ends at or after `start`, so it overlaps
+        # as soon as it begins no later than `end`. The comparison is inclusive
+        # so that a prediction touching only the last point of the event (or a
+        # single-point event) is still detected.
+        if i_pred < len(y_pred_events) and y_pred_events[i_pred][0] <= end:
+            TP += event_size
+        else:
+            FN += event_size
+    return TP, TN, FP, FN
+def get_tp_tn_fp_fn_delay_th_point_adjusted(y_true: np.array,y_pred: np.array,k: int):
+    """Compute point-adjusted confusion counts with a detection-delay threshold.
+
+    TN and FP are the point-wise counts. A true anomaly event counts entirely
+    as TP when its first predicted anomaly point lies fewer than ``k`` steps
+    after the start of the event; otherwise the whole event counts as FN.
+
+    Parameters:
+        y_true: Ground-truth labels (1 marks an anomaly).
+        y_pred: Predicted labels (1 marks an anomaly).
+        k: Exclusive upper bound on the accepted delay, in time steps.
+
+    Returns:
+        Tuple ``(TP, TN, FP, FN)``.
+    """
+    _, TN, FP, _ = get_tp_tn_fp_fn_point_wise(y_true, y_pred)
+    TP = 0
+    FN = 0
+    y_true_events = get_events(y_true, anomaly=True)
+    y_pred_events = get_events(y_pred, anomaly=True)
+    i_pred = 0
+    for start, end in y_true_events:
+        # Only predicted events that end before this true event are discarded.
+        # One that overlaps too late stays available, because it may also
+        # cover a following true event.
+        while i_pred < len(y_pred_events) and y_pred_events[i_pred][1] < start:
+            i_pred += 1
+        event_size = end - start + 1
+        detected = False
+        # Inclusive bound: a prediction starting on the last point still overlaps.
+        if i_pred < len(y_pred_events) and y_pred_events[i_pred][0] <= end:
+            # The first overlapping predicted event gives the earliest hit.
+            first_hit = max(start, y_pred_events[i_pred][0])
+            detected = first_hit - start < k
+        if detected:
+            TP += event_size
+        else:
+            FN += event_size
+    return TP, TN, FP, FN
+def get_tp_tn_fp_fn_point_adjusted_at_k(y_true: np.array,y_pred: np.array, k: float):
+    """Compute point-adjusted confusion counts with a minimum-coverage requirement.
+
+    TN and FP are the point-wise counts. A true anomaly event counts entirely
+    as TP when some predicted anomaly event overlaps at least a fraction ``k``
+    of it; otherwise the whole event counts as FN.
+
+    Parameters:
+        y_true: Ground-truth labels (1 marks an anomaly).
+        y_pred: Predicted labels (1 marks an anomaly).
+        k: Minimum ratio (overlap length / event length) required for detection.
+
+    Returns:
+        Tuple ``(TP, TN, FP, FN)``.
+    """
+    _, TN, FP, _ = get_tp_tn_fp_fn_point_wise(y_true, y_pred)
+    TP = 0
+    FN = 0
+    y_true_events = get_events(y_true, anomaly=True)
+    y_pred_events = get_events(y_pred, anomaly=True)
+    i_pred = 0
+    for start, end in y_true_events:
+        # Discard predicted events that end before this true event begins.
+        while i_pred < len(y_pred_events) and y_pred_events[i_pred][1] < start:
+            i_pred += 1
+        event_size = end - start + 1
+        detected = False
+        # Scan the overlapping predicted events with a separate cursor, so a
+        # prediction that fails the coverage test here is not lost for a
+        # following true event it may also overlap.
+        j = i_pred
+        while j < len(y_pred_events) and y_pred_events[j][0] <= end:
+            overlap = min(end, y_pred_events[j][1]) - max(start, y_pred_events[j][0]) + 1
+            if overlap / event_size >= k:
+                detected = True
+                break
+            j += 1
+        if detected:
+            TP += event_size
+        else:
+            FN += event_size
+    return TP, TN, FP, FN
+def get_tp_tn_fp_fn_latency_sparsity_aw(y_true: np.array, y_pred: np.array, ni: int):
+    # Computes (TP, TN, FP, FN) after grouping the series into windows of `ni`
+    # points and scoring one label/prediction pair per window.
+    # When ni == 1 the window loop below does not run (it requires step > 1)
+    # and the counts are taken point-wise on the untouched copies instead.
+    # One row per window of `ni` points.
+    batched_shape = (int(np.ceil(y_pred.shape[0] / ni)), 1)
+    label_batch = np.zeros(batched_shape)
+    pred_batch = np.zeros(batched_shape)
+    # Work on copies so the caller's arrays are not modified.
+    actual = np.copy(y_true)
+    predict = np.copy(y_pred)
+    detect_state = False  # triggered when a True anomaly is detected by model
+    anomaly_batch_count = 0
+    # i indexes points in the series, i_ni indexes rows of the batch arrays.
+    i, i_ni = 0, 0
+    step = ni
+    while i < len(y_true) and step > 1:
+        j = min(i + step, len(y_true))  # end of ni (batch) starting at i
+        # Adjust step size if needed
+        if step > 2 and actual[i:j].sum() > 1:
+            if np.diff(np.where(actual[i:j])).max() > 1:  # if it finds an interruption in the true label continuity
+                # NOTE(review): the reduced step is capped at 2 by min(); if it
+                # drops to 1 or 0 the while condition ends the loop after this
+                # iteration - confirm this early exit is intended.
+                step = min(int((j - i) / 2), 2)  # reduce step size
+                # A shorter window adds one more row to both batch arrays.
+                label_batch = np.append(label_batch, [[0]], axis=0)
+                pred_batch = np.append(pred_batch, [[0]], axis=0)  # increase size
+                j = i + step
+            else:
+                step = ni
+        else:
+            step = ni
+        # Start rolling window scoring
+        if actual[i:j].max():  # If label = T
+            if not actual[i]:  # if first value is normal
+                detect_state = False
+            s = actual[i:j].argmax()  # this is the index of the first occurrence
+            if detect_state:  # if anomaly was previously detected by model
+                anomaly_batch_count += 1
+                # Mark the window as a hit and set the predictions from the
+                # first true anomaly point to the end of the window.
+                pred_batch[i_ni], label_batch[i_ni], predict[i + s:j] = 1, 1, 1
+            elif predict[i:j].max():  # if alert was detected with T
+                detect_state = True  # turn on detection state
+                anomaly_batch_count += 1
+                pred_batch[i_ni], label_batch[i_ni], predict[i + s:j] = 1, 1, 1
+            else:
+                # Anomalous window with no alert: label set, prediction left at 0.
+                detect_state = False
+                label_batch[i_ni] = 1
+        else:
+            detect_state = False
+            if predict[i:j].max():  # if False positive
+                pred_batch[i_ni] = 1
+        i += step
+        i_ni += 1
+    if ni == 1:
+        return get_tp_tn_fp_fn_point_wise(actual, predict)
+    # Otherwise score the per-window labels and predictions point-wise.
+    return get_tp_tn_fp_fn_point_wise(label_batch.flatten().astype(int), pred_batch.flatten().astype(int))
+def get_tp_fp_fn_segment_wise(y_true: np.array,y_pred: np.array):
+    """Count segment-level TP, FP and FN from two label sequences.
+
+    * TP: true anomaly events that overlap a predicted anomaly event.
+    * FN: true anomaly events that are not counted as TP.
+    * FP: predicted anomaly events that overlap a true normal event.
+
+    Both counts use one forward pass over ordered events, so each event is
+    counted at most once.
+
+    Returns:
+        Tuple ``(TP, FP, FN)``.
+    """
+    true_anomalies = get_events(y_true)
+    pred_anomalies = get_events(y_pred)
+    true_normals = get_events(y_true, False)
+    # True positives: walk the true events once across all predicted events.
+    TP = 0
+    cursor = 0
+    for pred_start, pred_end in pred_anomalies:
+        while cursor < len(true_anomalies):
+            true_start, true_end = true_anomalies[cursor]
+            if true_start > pred_end:
+                # This true event belongs to a later predicted event.
+                break
+            if true_end >= pred_start:
+                TP += 1
+            cursor += 1
+    FN = len(true_anomalies) - TP
+    # False positives: walk the predicted events once across all normal events.
+    FP = 0
+    cursor = 0
+    for normal_start, normal_end in true_normals:
+        while cursor < len(pred_anomalies):
+            pred_start, pred_end = pred_anomalies[cursor]
+            if pred_start > normal_end:
+                break
+            if pred_end >= normal_start:
+                FP += 1
+            cursor += 1
+    return TP, FP, FN
+def is_full_series(length: int, anomalies: np.array):
+    """Tell whether `anomalies` is one-dimensional with exactly `length` entries, e.g. [1 0 1 1 0]."""
+    if len(anomalies.shape) != 1:
+        return False
+    return len(anomalies) == length
+def is_pointwise(length: int, anomalies: np.array):
+    """Tell whether `anomalies` is one-dimensional with fewer than `length` entries, e.g. [0 2 3]."""
+    if len(anomalies.shape) != 1:
+        return False
+    return len(anomalies) < length
+def is_segmentwise(length: int, anomalies: np.array):
+    """Tell whether `anomalies` is two-dimensional, e.g. [[0 0] [2 3]]; `length` is not consulted."""
+    dimensions = anomalies.shape
+    return len(dimensions) == 2
+def transform_to_full_series(length: int, anomalies: np.array):
+    """Convert an anomaly description to a full-length series.
+
+    The representation is picked by shape: a 1-D array of `length` entries is
+    returned unchanged, a shorter 1-D array is passed to
+    ``pointwise_to_full_series`` and a 2-D array to
+    ``segmentwise_to_full_series``.
+
+    Raises:
+        ValueError: If `anomalies` matches none of the three representations.
+    """
+    if is_full_series(length, anomalies):
+        return anomalies
+    # is_pointwise takes (length, anomalies); calling it with `anomalies`
+    # alone raised TypeError before the point-wise branch could run.
+    elif is_pointwise(length, anomalies):
+        return pointwise_to_full_series(anomalies, length)
+    elif is_segmentwise(length, anomalies):
+        return segmentwise_to_full_series(anomalies, length)
+    else:
+        raise ValueError(f"Illegal shape of anomalies:\n{anomalies}")
+def counting_method(y_true: np.array, y_pred: np.array, k: int):
+    """Return the four counts ``(em, da, ma, fa)`` for a prediction.
+
+    * em: points where both the true and the predicted label are 1.
+    * fa: points where the true label is 0 and the predicted label is 1.
+    * da: ``tp`` of ``DelayThresholdedPointAdjust`` (built with delay ``k``) minus ``em``.
+    * ma: ``fn`` of the same ``DelayThresholdedPointAdjust`` object.
+
+    NOTE(review): the names presumably stand for exact match, detected
+    anomaly, missed anomaly and false alarm - confirm against the callers.
+    """
+    em = 0
+    fa = 0
+    for gt, pa in zip(y_true, y_pred):
+        if pa == 1:
+            if gt == 1:
+                em += 1
+            elif gt == 0:
+                fa += 1
+    adjusted = DelayThresholdedPointAdjust(len(y_true), y_true, y_pred, k=k)
+    da = adjusted.tp - em
+    ma = adjusted.fn
+    return em, da, ma, fa
+#Range Based utils
+def cardinality(n_intersections,mode):
+    """Return the cardinality factor for a given number of intersections.
+
+    ``'one'`` always yields 1. ``'reciprocal'`` yields ``1 / n_intersections``
+    as a float, or 1 when there are no intersections.
+
+    Raises:
+        Exception: If `mode` is neither ``'one'`` nor ``'reciprocal'``.
+    """
+    if mode == 'one':
+        return 1
+    if mode != 'reciprocal':
+        raise Exception("Error, wrong cardinality mode.")
+    return 1 if n_intersections == 0 else float(1/n_intersections)
+def size(anomaly_range, overlap_set, position, bias):
+    """Return the bias-weighted fraction of an anomaly range covered by an overlap.
+
+    Every point of `anomaly_range` gets the weight ``position(i, length, bias)``,
+    with ``i`` running from 1 to the range length. The result is the weight
+    lying inside `overlap_set` divided by the total weight.
+
+    Parameters:
+        anomaly_range: Inclusive ``(start, end)`` of the anomaly.
+        overlap_set: Inclusive ``(start, end)`` of the overlap, or None when there is none.
+        position: Callable ``(i, anomaly_length, bias)`` giving the weight of point ``i``.
+        bias: Bias name forwarded to `position`.
+
+    Returns:
+        0 when `overlap_set` is None, otherwise the weighted coverage ratio.
+    """
+    # Identity test: `== None` is evaluated elementwise on array-like overlaps
+    # and then fails when used as a condition.
+    if overlap_set is None:
+        return 0
+    anomaly_length = anomaly_range[1] - anomaly_range[0] + 1
+    my_value = 0
+    max_value = 0
+    for i in range(1, anomaly_length + 1):
+        bias_value = position(i, anomaly_length, bias)
+        max_value += bias_value
+        # i is 1-based, so the absolute index of this point is start + i - 1.
+        if overlap_set[0] <= anomaly_range[0] + i - 1 <= overlap_set[1]:
+            my_value += bias_value
+    return my_value / max_value
+def position(i, anomaly_length,bias):
+    """Return the positional weight of the 1-based point `i` in an anomaly of `anomaly_length` points.
+
+    * ``'flat'``: every point weighs 1.
+    * ``'front-end'``: weight decreases from `anomaly_length` down to 1.
+    * ``'back-end'``: weight increases from 1 up to `anomaly_length`.
+    * ``'middle'``: weight rises up to the midpoint and falls afterwards.
+
+    Raises:
+        Exception: If `bias` is none of the four names above.
+    """
+    if bias == 'flat':
+        return 1
+    if bias == 'front-end':
+        return anomaly_length - i + 1
+    if bias == 'back-end':
+        return i
+    if bias == 'middle':
+        return i if i <= anomaly_length / 2 else anomaly_length - i + 1
+    raise Exception("Error, wrong bias value.")

tsadmetrics/non_binary_metrics.py ADDED Viewed

@@ -0,0 +1,92 @@
+import numpy as np
+from _tsadeval.metrics import *
+from .metric_utils import transform_to_full_series
+from sklearn.metrics import auc
+from .binary_metrics import point_adjusted_precision, point_adjusted_recall, segment_wise_precision, segment_wise_recall
+from pate.PATE_metric import PATE
+def precision_at_k(y_true : np.array ,y_anomaly_scores:  np.array):
+    """Return the score reported by ``PatK_pw`` for the given labels and anomaly scores."""
+    return PatK_pw(y_true, y_anomaly_scores).get_score()
+def auc_roc_pw(y_true : np.array ,y_anomaly_scores:  np.array):
+    """Return the score reported by ``AUC_ROC`` for the given labels and anomaly scores."""
+    return AUC_ROC(y_true, y_anomaly_scores).get_score()
+def auc_pr_pw(y_true : np.array ,y_anomaly_scores:  np.array):
+    """Return the score reported by ``AUC_PR_pw`` for the given labels and anomaly scores."""
+    return AUC_PR_pw(y_true, y_anomaly_scores).get_score()
+def auc_pr_pa(y_true: np.array, y_anomaly_scores: np.array):
+    """Return the area under the point-adjusted precision-recall curve.
+
+    Every distinct score except the smallest is used as a threshold, from
+    highest to lowest. Scores at or above the threshold become label 1 and
+    are rated with ``point_adjusted_precision`` / ``point_adjusted_recall``.
+    The curve is anchored at (recall 0, precision 1) and (recall 1,
+    precision 0) before integrating with ``sklearn.metrics.auc``.
+    """
+    descending_scores = np.unique(y_anomaly_scores)[::-1]
+    # Curve points stored as (recall, precision), starting at the left anchor.
+    curve = [(0, 1)]
+    for threshold in descending_scores[:-1]:
+        labels = (y_anomaly_scores >= threshold).astype(int)
+        precision = point_adjusted_precision(y_true, labels)
+        recall = point_adjusted_recall(y_true, labels)
+        curve.append((recall, precision))
+    curve.append((1, 0))
+    recalls = [point[0] for point in curve]
+    precisions = [point[1] for point in curve]
+    return auc(recalls, precisions)
+def auc_pr_sw(y_true: np.array, y_anomaly_scores: np.array):
+    """Return the area under the segment-wise precision-recall curve.
+
+    Every distinct score except the smallest is used as a threshold, from
+    highest to lowest. Scores at or above the threshold become label 1 and
+    are rated with ``segment_wise_precision`` / ``segment_wise_recall``.
+    The curve is anchored at (recall 0, precision 1) and (recall 1,
+    precision 0) before integrating with ``sklearn.metrics.auc``.
+    """
+    descending_scores = np.unique(y_anomaly_scores)[::-1]
+    # Curve points stored as (recall, precision), starting at the left anchor.
+    curve = [(0, 1)]
+    for threshold in descending_scores[:-1]:
+        labels = (y_anomaly_scores >= threshold).astype(int)
+        precision = segment_wise_precision(y_true, labels)
+        recall = segment_wise_recall(y_true, labels)
+        curve.append((recall, precision))
+    curve.append((1, 0))
+    recalls = [point[0] for point in curve]
+    precisions = [point[1] for point in curve]
+    return auc(recalls, precisions)
+def vus_roc(y_true : np.array ,y_anomaly_scores:  np.array, window=4):
+    """Return the score reported by ``VUS_ROC``, passing `window` as its ``max_window``."""
+    return VUS_ROC(y_true, y_anomaly_scores, max_window=window).get_score()
+def vus_pr(y_true : np.array ,y_anomaly_scores:  np.array,  window=4):
+    """Return the score reported by ``VUS_PR``, passing `window` as its ``max_window``."""
+    return VUS_PR(y_true, y_anomaly_scores, max_window=window).get_score()
+def real_pate(y_true: np.array, y_anomaly_scores: np.array, early: int, delay: int):
+    """
+    Compute the PATE score for anomaly scores on a time series.
+    Thin wrapper that forwards its arguments to ``pate.PATE_metric.PATE`` with ``binary_scores=False``.
+    Parameters:
+    y_true (np.array): The ground truth binary labels for the time series data.
+    y_anomaly_scores (np.array): The anomaly scores for the time series data (passed on as non-binary scores).
+    early (int): Forwarded to PATE as its third positional argument (presumably the early-detection range in time steps - confirm against the PATE documentation).
+    delay (int): Forwarded to PATE as its fourth positional argument (presumably the delayed-detection range in time steps - confirm against the PATE documentation).
+    Returns:
+    The value returned by ``PATE``.
+    """
+    pate_score = PATE(y_true, y_anomaly_scores, early, delay, binary_scores=False)
+    return pate_score

tsadmetrics/py.typed ADDED Viewed

File without changes

tsadmetrics/ts_aware_utils.py ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ from .metric_utils import get_events
2	+

tsadmetrics/utils.py ADDED Viewed

@@ -0,0 +1,42 @@
+import numpy as np
+import pandas as pd
+def compute_metrics(y_true: np.array,y_pred: np.array,metrics: list, metrics_params: dict, is_anomaly_score = False):
+    """
+    Computes the specified metrics for the given true and predicted values.
+    Parameters:
+    - y_true (np.array): True labels.
+    - y_pred (np.array): Predicted labels or scores.
+    - metrics (list): List of (metric_name, metric_function) pairs. Each function is called as metric_function(y_true, y_pred, **params).
+    - metrics_params (dict): Maps a metric name to the keyword arguments for its function. Metrics without an entry get no extra arguments.
+    - is_anomaly_score (bool): If True, the inputs are validated as values in the range [0, 1]. Otherwise they must be binary labels.
+    Returns:
+    - metrics_df (DataFrame): One row per metric with the columns 'metric_name' and 'metric_value'.
+    Raises:
+    - ValueError: If the inputs fail the validation selected by is_anomaly_score.
+    """
+    true_values = np.asarray(y_true)
+    pred_values = np.asarray(y_pred)
+    if not is_anomaly_score:
+        # Check that y_true and y_pred contain only 0 and 1. Membership is tested
+        # instead of equality with [0, 1] so that a constant series (for example
+        # a prediction without any anomaly) is still accepted.
+        if not (np.isin(true_values, [0, 1]).all() and np.isin(pred_values, [0, 1]).all()):
+            raise ValueError("y_true and y_pred must be binary labels (0 or 1) when is_anomaly_score is False. Which is the default.")
+    else:
+        # Check that every value lies in [0, 1]. This branch used to repeat the
+        # binary-label test, which rejected any real-valued score.
+        true_in_range = bool(np.all((true_values >= 0) & (true_values <= 1)))
+        pred_in_range = bool(np.all((pred_values >= 0) & (pred_values <= 1)))
+        if not (true_in_range and pred_in_range):
+            raise ValueError("y_true and y_pred must be anomaly scores in range [0,1] when is_anomaly_score is True.")
+    results = {}
+    for metric_name, metric_func in metrics:
+        # The caller's original objects are passed on, not the validated copies.
+        results[metric_name] = metric_func(y_true, y_pred, **metrics_params.get(metric_name, {}))
+    # Lists are used instead of dict views so the column construction does
+    # not depend on how pandas handles view objects.
+    metrics_df = pd.DataFrame({
+        'metric_name': list(results.keys()),
+        'metric_value': list(results.values()),
+    })
+    return metrics_df

tsadmetrics-0.1.0.dist-info/METADATA ADDED Viewed

@@ -0,0 +1,10 @@
+Metadata-Version: 2.1
+Name: tsadmetrics
+Version: 0.1.0
+Summary: Librería para evaluación de detección de anomalías en series temporales
+Home-page: https://github.com/pathsko/TSADmetrics
+Author: Pedro Rafael Velasco Priego
+Author-email: Pedro Rafael Velasco Priego <i12veprp@uco.es>
+Requires-Python: >=3.6
+Description-Content-Type: text/markdown

tsadmetrics-0.1.0.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,11 @@
+tsadmetrics/__init__.py,sha256=sETF4u0XMjY-1h2RJb7GyEAngvQ1e62RC7TolT-cKJ0,1571
+tsadmetrics/binary_metrics.py,sha256=6yp4Dqg0_M_bJvyoWVgjAr4rLnGIDzHd7CzCRKqJVso,37739
+tsadmetrics/metric_utils.py,sha256=HtcgQ3sqnfoOQ-QnDctNiaRGDXRuFvGzMGhoS2HWYIg,10476
+tsadmetrics/non_binary_metrics.py,sha256=2F_qsV7wf-IMAB158uA9U0DC5l2apTAyK6XPN2roI7k,2895
+tsadmetrics/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+tsadmetrics/ts_aware_utils.py,sha256=RbgSAVLWeMtA0ZrvBw-_lT0b0ygFn9a1TxSW5cQAwmg,31
+tsadmetrics/utils.py,sha256=G0yWxgTZ9MBzyB0XDLrO2TMwmtm4hssDp5Sr0CG9FqY,1834
+tsadmetrics-0.1.0.dist-info/METADATA,sha256=uJkICqyBIEcjkBuDUrj_28MGzwmUCBepr8wYU3ob3eY,350
+tsadmetrics-0.1.0.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
+tsadmetrics-0.1.0.dist-info/top_level.txt,sha256=rRMFvkwJRUuenl0__YY_3BNr-rkdhAdj28iICkpC5a4,12
+tsadmetrics-0.1.0.dist-info/RECORD,,

tsadmetrics-0.1.0.dist-info/WHEEL ADDED Viewed

@@ -0,0 +1,5 @@
+Wheel-Version: 1.0
+Generator: setuptools (75.3.2)
+Root-Is-Purelib: true
+Tag: py3-none-any

tsadmetrics-0.1.0.dist-info/top_level.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+ tsadmetrics