Initial commit - ACME demo version

2026-02-04 11:08:21 +01:00
commit 1bb0765766
180 changed files with 52249 additions and 0 deletions
--- a/backend/beyond_metrics/dimensions/OperationalPerformance.py
+++ b/backend/beyond_metrics/dimensions/OperationalPerformance.py
@@ -0,0 +1,716 @@
+from __future__ import annotations
+
+from dataclasses import dataclass
+from typing import Any, Dict, List
+
+import numpy as np
+import pandas as pd
+import matplotlib.pyplot as plt
+from matplotlib.axes import Axes
+import math
+
+REQUIRED_COLUMNS_OP: List[str] = [
+    "interaction_id",
+    "datetime_start",
+    "queue_skill",
+    "channel",
+    "duration_talk",
+    "hold_time",
+    "wrap_up_time",
+    "agent_id",
+    "transfer_flag",
+]
+
+
+@dataclass
+class OperationalPerformanceMetrics:
+    """
+    Dimensión: RENDIMIENTO OPERACIONAL Y DE SERVICIO
+
+    Propósito: medir el balance entre rapidez (eficiencia) y calidad de resolución,
+    más la variabilidad del servicio.
+
+    Requiere como mínimo:
+    - interaction_id
+    - datetime_start
+    - queue_skill
+    - channel
+    - duration_talk (segundos)
+    - hold_time (segundos)
+    - wrap_up_time (segundos)
+    - agent_id
+    - transfer_flag (bool/int)
+
+    Columnas opcionales:
+    - is_resolved (bool/int)      -> para FCR
+    - abandoned_flag (bool/int)   -> para tasa de abandono
+    - customer_id / caller_id     -> para reincidencia y repetición de canal
+    - logged_time (segundos)      -> para occupancy_rate
+    """
+
+    df: pd.DataFrame
+
+    # Benchmarks / parámetros de normalización (puedes ajustarlos)
+    AHT_GOOD: float = 300.0     # 5 min
+    AHT_BAD: float = 900.0      # 15 min
+    VAR_RATIO_GOOD: float = 1.2 # P90/P50 ~1.2 muy estable
+    VAR_RATIO_BAD: float = 3.0  # P90/P50 >=3 muy inestable
+
+    def __post_init__(self) -> None:
+        self._validate_columns()
+        self._prepare_data()
+
+    # ------------------------------------------------------------------ #
+    # Helpers internos
+    # ------------------------------------------------------------------ #
+    def _validate_columns(self) -> None:
+        missing = [c for c in REQUIRED_COLUMNS_OP if c not in self.df.columns]
+        if missing:
+            raise ValueError(
+                f"Faltan columnas obligatorias para OperationalPerformanceMetrics: {missing}"
+            )
+
+    def _prepare_data(self) -> None:
+        df = self.df.copy()
+
+        # Tipos
+        df["datetime_start"] = pd.to_datetime(df["datetime_start"], errors="coerce")
+
+        for col in ["duration_talk", "hold_time", "wrap_up_time"]:
+            df[col] = pd.to_numeric(df[col], errors="coerce")
+
+        # Handle Time
+        df["handle_time"] = (
+            df["duration_talk"].fillna(0)
+            + df["hold_time"].fillna(0)
+            + df["wrap_up_time"].fillna(0)
+        )
+
+        # v3.0: Filtrar NOISE y ZOMBIE para cálculos de variabilidad
+        # record_status: 'VALID', 'NOISE', 'ZOMBIE', 'ABANDON'
+        # Para AHT/CV solo usamos 'VALID' (excluye noise, zombie, abandon)
+        if "record_status" in df.columns:
+            df["record_status"] = df["record_status"].astype(str).str.strip().str.upper()
+            # Crear máscara para registros válidos: SOLO "VALID"
+            # Excluye explícitamente NOISE, ZOMBIE, ABANDON y cualquier otro valor
+            df["_is_valid_for_cv"] = df["record_status"] == "VALID"
+
+            # Log record_status breakdown for debugging
+            status_counts = df["record_status"].value_counts()
+            valid_count = int(df["_is_valid_for_cv"].sum())
+            print(f"[OperationalPerformance] Record status breakdown:")
+            print(f"   Total rows: {len(df)}")
+            for status, count in status_counts.items():
+                print(f"   - {status}: {count}")
+            print(f"   VALID rows for AHT calculation: {valid_count}")
+        else:
+            # Legacy data sin record_status: incluir todo
+            df["_is_valid_for_cv"] = True
+            print(f"[OperationalPerformance] No record_status column - using all {len(df)} rows")
+
+        # Normalización básica
+        df["queue_skill"] = df["queue_skill"].astype(str).str.strip()
+        df["channel"] = df["channel"].astype(str).str.strip()
+        df["agent_id"] = df["agent_id"].astype(str).str.strip()
+
+        # Flags opcionales convertidos a bool cuando existan
+        for flag_col in ["is_resolved", "abandoned_flag", "transfer_flag"]:
+            if flag_col in df.columns:
+                df[flag_col] = df[flag_col].astype(int).astype(bool)
+
+        # customer_id: usamos customer_id si existe, si no caller_id
+        if "customer_id" in df.columns:
+            df["customer_id"] = df["customer_id"].astype(str)
+        elif "caller_id" in df.columns:
+            df["customer_id"] = df["caller_id"].astype(str)
+        else:
+            df["customer_id"] = None
+
+        # logged_time opcional
+        # Normalizamos logged_time: siempre será una serie float con NaN si no existe
+        df["logged_time"] = pd.to_numeric(df.get("logged_time", np.nan), errors="coerce")
+
+
+        self.df = df
+
+    @property
+    def is_empty(self) -> bool:
+        return self.df.empty
+
+    # ------------------------------------------------------------------ #
+    # AHT y variabilidad
+    # ------------------------------------------------------------------ #
+    def aht_distribution(self) -> Dict[str, float]:
+        """
+        Devuelve P10, P50, P90 del AHT y el ratio P90/P50 como medida de variabilidad.
+
+        v3.0: Filtra NOISE y ZOMBIE para el cálculo de variabilidad.
+        Solo usa registros con record_status='valid' o sin status (legacy).
+        """
+        # Filtrar solo registros válidos para cálculo de variabilidad
+        df_valid = self.df[self.df["_is_valid_for_cv"] == True]
+        ht = df_valid["handle_time"].dropna().astype(float)
+        if ht.empty:
+            return {}
+
+        p10 = float(np.percentile(ht, 10))
+        p50 = float(np.percentile(ht, 50))
+        p90 = float(np.percentile(ht, 90))
+        ratio = float(p90 / p50) if p50 > 0 else float("nan")
+
+        return {
+            "p10": round(p10, 2),
+            "p50": round(p50, 2),
+            "p90": round(p90, 2),
+            "p90_p50_ratio": round(ratio, 3),
+        }
+
+    def talk_hold_acw_p50_by_skill(self) -> pd.DataFrame:
+        """
+        P50 de talk_time, hold_time y wrap_up_time por skill.
+
+        Incluye queue_skill como columna (no solo índice) para que
+        el frontend pueda hacer lookup por nombre de skill.
+        """
+        df = self.df
+
+        def perc(s: pd.Series, q: float) -> float:
+            s = s.dropna().astype(float)
+            if s.empty:
+                return float("nan")
+            return float(np.percentile(s, q))
+
+        grouped = df.groupby("queue_skill")
+        result = pd.DataFrame(
+            {
+                "talk_p50": grouped["duration_talk"].apply(lambda s: perc(s, 50)),
+                "hold_p50": grouped["hold_time"].apply(lambda s: perc(s, 50)),
+                "acw_p50": grouped["wrap_up_time"].apply(lambda s: perc(s, 50)),
+            }
+        )
+        # Reset index to include queue_skill as column for frontend lookup
+        return result.round(2).sort_index().reset_index()
+
+    # ------------------------------------------------------------------ #
+    # FCR, escalación, abandono, reincidencia, repetición canal
+    # ------------------------------------------------------------------ #
+    def fcr_rate(self) -> float:
+        """
+        FCR (First Contact Resolution).
+
+        Prioridad 1: Usar fcr_real_flag del CSV si existe
+        Prioridad 2: Calcular como 100 - escalation_rate
+        """
+        df = self.df
+        total = len(df)
+        if total == 0:
+            return float("nan")
+
+        # Prioridad 1: Usar fcr_real_flag si existe
+        if "fcr_real_flag" in df.columns:
+            col = df["fcr_real_flag"]
+            # Normalizar a booleano
+            if col.dtype == "O":
+                fcr_mask = (
+                    col.astype(str)
+                       .str.strip()
+                       .str.lower()
+                       .isin(["true", "t", "1", "yes", "y", "si", "sí"])
+                )
+            else:
+                fcr_mask = pd.to_numeric(col, errors="coerce").fillna(0) > 0
+
+            fcr_count = int(fcr_mask.sum())
+            fcr = (fcr_count / total) * 100.0
+            return float(max(0.0, min(100.0, round(fcr, 2))))
+
+        # Prioridad 2: Fallback a 100 - escalation_rate
+        try:
+            esc = self.escalation_rate()
+        except Exception:
+            esc = float("nan")
+
+        if esc is not None and not math.isnan(esc):
+            fcr = 100.0 - esc
+            return float(max(0.0, min(100.0, round(fcr, 2))))
+
+        return float("nan")
+
+
+    def escalation_rate(self) -> float:
+        """
+        % de interacciones que requieren escalación (transfer_flag == True).
+        """
+        df = self.df
+        total = len(df)
+        if total == 0:
+            return float("nan")
+
+        escalated = df["transfer_flag"].sum()
+        return float(round(escalated / total * 100, 2))
+
+    def abandonment_rate(self) -> float:
+        """
+        % de interacciones abandonadas.
+
+        Busca en orden: is_abandoned, abandoned_flag, abandoned
+        Si ninguna columna existe, devuelve NaN.
+        """
+        df = self.df
+        total = len(df)
+        if total == 0:
+            return float("nan")
+
+        # Buscar columna de abandono en orden de prioridad
+        abandon_col = None
+        for col_name in ["is_abandoned", "abandoned_flag", "abandoned"]:
+            if col_name in df.columns:
+                abandon_col = col_name
+                break
+
+        if abandon_col is None:
+            return float("nan")
+
+        col = df[abandon_col]
+
+        # Normalizar a booleano
+        if col.dtype == "O":
+            abandon_mask = (
+                col.astype(str)
+                   .str.strip()
+                   .str.lower()
+                   .isin(["true", "t", "1", "yes", "y", "si", "sí"])
+            )
+        else:
+            abandon_mask = pd.to_numeric(col, errors="coerce").fillna(0) > 0
+
+        abandoned = int(abandon_mask.sum())
+        return float(round(abandoned / total * 100, 2))
+
+    def high_hold_time_rate(self, threshold_seconds: float = 60.0) -> float:
+        """
+        % de interacciones con hold_time > threshold (por defecto 60s).
+
+        Proxy de complejidad: si el agente tuvo que poner en espera al cliente
+        más de 60 segundos, probablemente tuvo que consultar/investigar.
+        """
+        df = self.df
+        total = len(df)
+        if total == 0:
+            return float("nan")
+
+        hold_times = df["hold_time"].fillna(0)
+        high_hold_count = (hold_times > threshold_seconds).sum()
+
+        return float(round(high_hold_count / total * 100, 2))
+
+    def recurrence_rate_7d(self) -> float:
+        """
+        % de clientes que vuelven a contactar en < 7 días para el MISMO skill.
+
+        Se basa en customer_id (o caller_id si no hay customer_id) + queue_skill.
+        Calcula:
+        - Para cada combinación cliente + skill, ordena por datetime_start
+        - Si hay dos contactos consecutivos separados < 7 días (mismo cliente, mismo skill),
+          cuenta como "recurrente"
+        - Tasa = nº clientes recurrentes / nº total de clientes
+
+        NOTA: Solo cuenta como recurrencia si el cliente llama por el MISMO skill.
+        Un cliente que llama a "Ventas" y luego a "Soporte" NO es recurrente.
+        """
+
+        df = self.df.dropna(subset=["datetime_start"]).copy()
+
+        # Normalizar identificador de cliente
+        if "customer_id" not in df.columns:
+            if "caller_id" in df.columns:
+                df["customer_id"] = df["caller_id"]
+            else:
+                # No hay identificador de cliente -> no se puede calcular
+                return float("nan")
+
+        df = df.dropna(subset=["customer_id"])
+        if df.empty:
+            return float("nan")
+
+        # Ordenar por cliente + skill + fecha
+        df = df.sort_values(["customer_id", "queue_skill", "datetime_start"])
+
+        # Diferencia de tiempo entre contactos consecutivos por cliente Y skill
+        # Esto asegura que solo contamos recontactos del mismo cliente para el mismo skill
+        df["delta"] = df.groupby(["customer_id", "queue_skill"])["datetime_start"].diff()
+
+        # Marcamos los contactos que ocurren a menos de 7 días del anterior (mismo skill)
+        recurrence_mask = df["delta"] < pd.Timedelta(days=7)
+
+        # Nº de clientes que tienen al menos un contacto recurrente (para cualquier skill)
+        recurrent_customers = df.loc[recurrence_mask, "customer_id"].nunique()
+        total_customers = df["customer_id"].nunique()
+
+        if total_customers == 0:
+            return float("nan")
+
+        rate = recurrent_customers / total_customers * 100.0
+        return float(round(rate, 2))
+
+
+    def repeat_channel_rate(self) -> float:
+        """
+        % de reincidencias (<7 días) en las que el cliente usa el MISMO canal.
+
+        Si no hay customer_id/caller_id o solo un contacto por cliente, devuelve NaN.
+        """
+        df = self.df.dropna(subset=["datetime_start"]).copy()
+        if df["customer_id"].isna().all():
+            return float("nan")
+
+        df = df.sort_values(["customer_id", "datetime_start"])
+        df["next_customer"] = df["customer_id"].shift(-1)
+        df["next_datetime"] = df["datetime_start"].shift(-1)
+        df["next_channel"] = df["channel"].shift(-1)
+
+        same_customer = df["customer_id"] == df["next_customer"]
+        within_7d = (df["next_datetime"] - df["datetime_start"]) < pd.Timedelta(days=7)
+
+        recurrent_mask = same_customer & within_7d
+        if not recurrent_mask.any():
+            return float("nan")
+
+        same_channel = df["channel"] == df["next_channel"]
+        same_channel_recurrent = (recurrent_mask & same_channel).sum()
+        total_recurrent = recurrent_mask.sum()
+
+        return float(round(same_channel_recurrent / total_recurrent * 100, 2))
+
+    # ------------------------------------------------------------------ #
+    # Occupancy
+    # ------------------------------------------------------------------ #
+    def occupancy_rate(self) -> float:
+        """
+        Tasa de ocupación:
+
+        occupancy = sum(handle_time) / sum(logged_time) * 100.
+
+        Requiere columna 'logged_time'. Si no existe o es todo 0, devuelve NaN.
+        """
+        df = self.df
+        if "logged_time" not in df.columns:
+            return float("nan")
+
+        logged = df["logged_time"].fillna(0)
+        handle = df["handle_time"].fillna(0)
+
+        total_logged = logged.sum()
+        if total_logged == 0:
+            return float("nan")
+
+        occ = handle.sum() / total_logged
+        return float(round(occ * 100, 2))
+
+    # ------------------------------------------------------------------ #
+    # Score de rendimiento 0-10
+    # ------------------------------------------------------------------ #
+    def performance_score(self) -> Dict[str, float]:
+        """
+        Calcula un score 0-10 combinando:
+        - AHT (bajo es mejor)
+        - FCR (alto es mejor)
+        - Variabilidad (P90/P50, bajo es mejor)
+        - Otros factores (ocupación / escalación)
+
+        Fórmula:
+        score = 0.4 * (10 - AHT_norm) +
+                0.3 * FCR_norm +
+                0.2 * (10 - Var_norm) +
+                0.1 * Otros_score
+
+        Donde *_norm son valores en escala 0-10.
+        """
+        dist = self.aht_distribution()
+        if not dist:
+            return {"score": float("nan")}
+
+        p50 = dist["p50"]
+        ratio = dist["p90_p50_ratio"]
+
+        # AHT_normalized: 0 (mejor) a 10 (peor)
+        aht_norm = self._scale_to_0_10(p50, self.AHT_GOOD, self.AHT_BAD)
+        # FCR_normalized: 0-10 directamente desde % (0-100)
+        fcr_pct = self.fcr_rate()
+        fcr_norm = fcr_pct / 10.0 if not np.isnan(fcr_pct) else 0.0
+        # Variabilidad_normalized: 0 (ratio bueno) a 10 (ratio malo)
+        var_norm = self._scale_to_0_10(ratio, self.VAR_RATIO_GOOD, self.VAR_RATIO_BAD)
+
+        # Otros factores: combinamos ocupación (ideal ~80%) y escalación (ideal baja)
+        occ = self.occupancy_rate()
+        esc = self.escalation_rate()
+
+        other_score = self._compute_other_factors_score(occ, esc)
+
+        score = (
+            0.4 * (10.0 - aht_norm)
+            + 0.3 * fcr_norm
+            + 0.2 * (10.0 - var_norm)
+            + 0.1 * other_score
+        )
+
+        # Clamp 0-10
+        score = max(0.0, min(10.0, score))
+
+        return {
+            "score": round(score, 2),
+            "aht_norm": round(aht_norm, 2),
+            "fcr_norm": round(fcr_norm, 2),
+            "var_norm": round(var_norm, 2),
+            "other_score": round(other_score, 2),
+        }
+
+    def _scale_to_0_10(self, value: float, good: float, bad: float) -> float:
+        """
+        Escala linealmente un valor:
+        - good -> 0
+        - bad  -> 10
+        Con saturación fuera de rango.
+        """
+        if np.isnan(value):
+            return 5.0  # neutro
+
+        if good == bad:
+            return 5.0
+
+        if good < bad:
+            # Menor es mejor
+            if value <= good:
+                return 0.0
+            if value >= bad:
+                return 10.0
+            return 10.0 * (value - good) / (bad - good)
+        else:
+            # Mayor es mejor
+            if value >= good:
+                return 0.0
+            if value <= bad:
+                return 10.0
+            return 10.0 * (good - value) / (good - bad)
+
+    def _compute_other_factors_score(self, occ_pct: float, esc_pct: float) -> float:
+        """
+        Otros factores (0-10) basados en:
+        - ocupación ideal alrededor de 80%
+        - tasa de escalación ideal baja (<10%)
+        """
+        # Ocupación: 0 penalización si está entre 75-85, se penaliza fuera
+        if np.isnan(occ_pct):
+            occ_penalty = 5.0
+        else:
+            deviation = abs(occ_pct - 80.0)
+            occ_penalty = min(10.0, deviation / 5.0 * 2.0)  # cada 5 puntos se suman 2, máx 10
+        occ_score = max(0.0, 10.0 - occ_penalty)
+
+        # Escalación: 0-10 donde 0% -> 10 puntos, >=40% -> 0
+        if np.isnan(esc_pct):
+            esc_score = 5.0
+        else:
+            if esc_pct <= 0:
+                esc_score = 10.0
+            elif esc_pct >= 40:
+                esc_score = 0.0
+            else:
+                esc_score = 10.0 * (1.0 - esc_pct / 40.0)
+
+        # Media simple de ambos
+        return (occ_score + esc_score) / 2.0
+
+    # ------------------------------------------------------------------ #
+    # Plots
+    # ------------------------------------------------------------------ #
+    def plot_aht_boxplot_by_skill(self) -> Axes:
+        """
+        Boxplot del AHT por skill (P10-P50-P90 visual).
+        """
+        df = self.df.copy()
+
+        if df.empty or "handle_time" not in df.columns:
+            fig, ax = plt.subplots()
+            ax.text(0.5, 0.5, "Sin datos de AHT", ha="center", va="center")
+            ax.set_axis_off()
+            return ax
+
+        df = df.dropna(subset=["handle_time"])
+        if df.empty:
+            fig, ax = plt.subplots()
+            ax.text(0.5, 0.5, "AHT no disponible", ha="center", va="center")
+            ax.set_axis_off()
+            return ax
+
+        fig, ax = plt.subplots(figsize=(8, 4))
+        df.boxplot(column="handle_time", by="queue_skill", ax=ax, showfliers=False)
+
+        ax.set_xlabel("Skill / Cola")
+        ax.set_ylabel("AHT (segundos)")
+        ax.set_title("Distribución de AHT por skill")
+        plt.suptitle("")
+        plt.xticks(rotation=45, ha="right")
+        ax.grid(axis="y", alpha=0.3)
+
+        return ax
+
+    def plot_resolution_funnel_by_skill(self) -> Axes:
+        """
+        Funnel / barras apiladas de Talk + Hold + ACW por skill (P50).
+
+        Permite ver el equilibrio de tiempos por skill.
+        """
+        p50 = self.talk_hold_acw_p50_by_skill()
+        if p50.empty:
+            fig, ax = plt.subplots()
+            ax.text(0.5, 0.5, "Sin datos para funnel", ha="center", va="center")
+            ax.set_axis_off()
+            return ax
+
+        fig, ax = plt.subplots(figsize=(10, 4))
+
+        skills = p50.index
+        talk = p50["talk_p50"]
+        hold = p50["hold_p50"]
+        acw = p50["acw_p50"]
+
+        x = np.arange(len(skills))
+
+        ax.bar(x, talk, label="Talk P50")
+        ax.bar(x, hold, bottom=talk, label="Hold P50")
+        ax.bar(x, acw, bottom=talk + hold, label="ACW P50")
+
+        ax.set_xticks(x)
+        ax.set_xticklabels(skills, rotation=45, ha="right")
+        ax.set_ylabel("Segundos")
+        ax.set_title("Funnel de resolución (P50) por skill")
+        ax.legend()
+        ax.grid(axis="y", alpha=0.3)
+
+        return ax
+
+    # ------------------------------------------------------------------ #
+    # Métricas por skill (para consistencia frontend cached/fresh)
+    # ------------------------------------------------------------------ #
+    def metrics_by_skill(self) -> List[Dict[str, Any]]:
+        """
+        Calcula métricas operacionales por skill:
+        - transfer_rate: % de interacciones con transfer_flag == True
+        - abandonment_rate: % de interacciones abandonadas
+        - fcr_tecnico: 100 - transfer_rate (sin transferencia)
+        - fcr_real: % sin transferencia Y sin recontacto 7d (si hay datos)
+        - volume: número de interacciones
+
+        Devuelve una lista de dicts, uno por skill, para que el frontend
+        tenga acceso a las métricas reales por skill (no estimadas).
+        """
+        df = self.df
+        if df.empty:
+            return []
+
+        results = []
+
+        # Detectar columna de abandono
+        abandon_col = None
+        for col_name in ["is_abandoned", "abandoned_flag", "abandoned"]:
+            if col_name in df.columns:
+                abandon_col = col_name
+                break
+
+        # Detectar columna de repeat_call_7d para FCR real
+        repeat_col = None
+        for col_name in ["repeat_call_7d", "repeat_7d", "is_repeat_7d"]:
+            if col_name in df.columns:
+                repeat_col = col_name
+                break
+
+        for skill, group in df.groupby("queue_skill"):
+            total = len(group)
+            if total == 0:
+                continue
+
+            # Transfer rate
+            if "transfer_flag" in group.columns:
+                transfer_count = group["transfer_flag"].sum()
+                transfer_rate = float(round(transfer_count / total * 100, 2))
+            else:
+                transfer_rate = 0.0
+
+            # FCR Técnico = 100 - transfer_rate
+            fcr_tecnico = float(round(100.0 - transfer_rate, 2))
+
+            # Abandonment rate
+            abandonment_rate = 0.0
+            if abandon_col:
+                col = group[abandon_col]
+                if col.dtype == "O":
+                    abandon_mask = (
+                        col.astype(str)
+                           .str.strip()
+                           .str.lower()
+                           .isin(["true", "t", "1", "yes", "y", "si", "sí"])
+                    )
+                else:
+                    abandon_mask = pd.to_numeric(col, errors="coerce").fillna(0) > 0
+                abandoned = int(abandon_mask.sum())
+                abandonment_rate = float(round(abandoned / total * 100, 2))
+
+            # FCR Real (sin transferencia Y sin recontacto 7d)
+            fcr_real = fcr_tecnico  # default to fcr_tecnico if no repeat data
+            if repeat_col and "transfer_flag" in group.columns:
+                repeat_data = group[repeat_col]
+                if repeat_data.dtype == "O":
+                    repeat_mask = (
+                        repeat_data.astype(str)
+                           .str.strip()
+                           .str.lower()
+                           .isin(["true", "t", "1", "yes", "y", "si", "sí"])
+                    )
+                else:
+                    repeat_mask = pd.to_numeric(repeat_data, errors="coerce").fillna(0) > 0
+
+                # FCR Real: no transfer AND no repeat
+                fcr_real_mask = (~group["transfer_flag"]) & (~repeat_mask)
+                fcr_real_count = fcr_real_mask.sum()
+                fcr_real = float(round(fcr_real_count / total * 100, 2))
+
+            # AHT Mean (promedio de handle_time sobre registros válidos)
+            # Filtramos solo registros 'valid' (excluye noise/zombie) para consistencia
+            if "_is_valid_for_cv" in group.columns:
+                valid_records = group[group["_is_valid_for_cv"]]
+            else:
+                valid_records = group
+
+            if len(valid_records) > 0 and "handle_time" in valid_records.columns:
+                aht_mean = float(round(valid_records["handle_time"].mean(), 2))
+            else:
+                aht_mean = 0.0
+
+            # AHT Total (promedio de handle_time sobre TODOS los registros)
+            # Incluye NOISE, ZOMBIE, ABANDON - solo para información/comparación
+            if len(group) > 0 and "handle_time" in group.columns:
+                aht_total = float(round(group["handle_time"].mean(), 2))
+            else:
+                aht_total = 0.0
+
+            # Hold Time Mean (promedio de hold_time sobre registros válidos)
+            # Consistente con fresh path que usa MEAN, no P50
+            if len(valid_records) > 0 and "hold_time" in valid_records.columns:
+                hold_time_mean = float(round(valid_records["hold_time"].mean(), 2))
+            else:
+                hold_time_mean = 0.0
+
+            results.append({
+                "skill": str(skill),
+                "volume": int(total),
+                "transfer_rate": transfer_rate,
+                "abandonment_rate": abandonment_rate,
+                "fcr_tecnico": fcr_tecnico,
+                "fcr_real": fcr_real,
+                "aht_mean": aht_mean,
+                "aht_total": aht_total,
+                "hold_time_mean": hold_time_mean,
+            })
+
+        return results