Translate Phase 2 medium-priority files (frontend utils + backend dimensions)

Phase 2 of Spanish-to-English translation for medium-priority files: Frontend utils (2 files): - dataTransformation.ts: Translated ~72 occurrences (comments, docs, console logs) - segmentClassifier.ts: Translated ~20 occurrences (JSDoc, inline comments, UI strings) Backend dimensions (3 files): - OperationalPerformance.py: Translated ~117 lines (docstrings, comments) - SatisfactionExperience.py: Translated ~33 lines (docstrings, comments) - EconomyCost.py: Translated ~79 lines (docstrings, comments) All function names and variable names preserved for API compatibility. Frontend and backend compilation tested and verified successful. Related to TRANSLATION_STATUS.md Phase 2 objectives. https://claude.ai/code/session_01GNbnkFoESkRcnPr3bLCYDg
2026-02-07 11:03:00 +00:00
parent 94178eaaae
commit 8c7f5fa827
5 changed files with 325 additions and 335 deletions
--- a/backend/beyond_metrics/dimensions/OperationalPerformance.py
+++ b/backend/beyond_metrics/dimensions/OperationalPerformance.py
@@ -25,32 +25,31 @@ REQUIRED_COLUMNS_OP: List[str] = [
@dataclass
 class OperationalPerformanceMetrics:
    """
-    Dimensión: RENDIMIENTO OPERACIONAL Y DE SERVICIO
+    Dimension: OPERATIONAL PERFORMANCE AND SERVICE

-    Propósito: medir el balance entre rapidez (eficiencia) y calidad de resolución,
-    más la variabilidad del servicio.
+    Purpose: measure the balance between speed (efficiency) and resolution quality, plus service variability.

-    Requiere como mínimo:
+    Requires at minimum:
    - interaction_id
    - datetime_start
    - queue_skill
    - channel
-    - duration_talk (segundos)
-    - hold_time (segundos)
-    - wrap_up_time (segundos)
+    - duration_talk (seconds)
+    - hold_time (seconds)
+    - wrap_up_time (seconds)
    - agent_id
    - transfer_flag (bool/int)

-    Columnas opcionales:
-    - is_resolved (bool/int)      -> para FCR
-    - abandoned_flag (bool/int)   -> para tasa de abandono
-    - customer_id / caller_id     -> para reincidencia y repetición de canal
-    - logged_time (segundos)      -> para occupancy_rate
+    Optional columns:
+    - is_resolved (bool/int)      -> for FCR
+    - abandoned_flag (bool/int)   -> for abandonment rate
+    - customer_id / caller_id     -> for recurrence and channel repetition
+    - logged_time (seconds)      -> for occupancy_rate
    """

    df: pd.DataFrame

-    # Benchmarks / parámetros de normalización (puedes ajustarlos)
+    # Benchmarks / normalization parameters (you can adjust them)
    AHT_GOOD: float = 300.0     # 5 min
    AHT_BAD: float = 900.0      # 15 min
    VAR_RATIO_GOOD: float = 1.2 # P90/P50 ~1.2 muy estable
@@ -61,19 +60,19 @@ class OperationalPerformanceMetrics:
        self._prepare_data()

    # ------------------------------------------------------------------ #
-    # Helpers internos
+    # Internal helpers
    # ------------------------------------------------------------------ #
    def _validate_columns(self) -> None:
        missing = [c for c in REQUIRED_COLUMNS_OP if c not in self.df.columns]
        if missing:
            raise ValueError(
-                f"Faltan columnas obligatorias para OperationalPerformanceMetrics: {missing}"
+                f"Missing required columns for OperationalPerformanceMetrics: {missing}"
            )

    def _prepare_data(self) -> None:
        df = self.df.copy()

-        # Tipos
+        # Types
        df["datetime_start"] = pd.to_datetime(df["datetime_start"], errors="coerce")

        for col in ["duration_talk", "hold_time", "wrap_up_time"]:
@@ -86,13 +85,13 @@ class OperationalPerformanceMetrics:
            + df["wrap_up_time"].fillna(0)
        )

-        # v3.0: Filtrar NOISE y ZOMBIE para cálculos de variabilidad
+        # v3.0: Filter NOISE and ZOMBIE for variability calculations
        # record_status: 'VALID', 'NOISE', 'ZOMBIE', 'ABANDON'
-        # Para AHT/CV solo usamos 'VALID' (excluye noise, zombie, abandon)
+        # For AHT/CV we only use 'VALID' (excludes noise, zombie, abandon)
        if "record_status" in df.columns:
            df["record_status"] = df["record_status"].astype(str).str.strip().str.upper()
-            # Crear máscara para registros válidos: SOLO "VALID"
-            # Excluye explícitamente NOISE, ZOMBIE, ABANDON y cualquier otro valor
+            # Create mask for valid records: ONLY "VALID"
+            # Explicitly excludes NOISE, ZOMBIE, ABANDON and any other value
            df["_is_valid_for_cv"] = df["record_status"] == "VALID"

            # Log record_status breakdown for debugging
@@ -104,21 +103,21 @@ class OperationalPerformanceMetrics:
                print(f"   - {status}: {count}")
            print(f"   VALID rows for AHT calculation: {valid_count}")
        else:
-            # Legacy data sin record_status: incluir todo
+            # Legacy data without record_status: include all
            df["_is_valid_for_cv"] = True
            print(f"[OperationalPerformance] No record_status column - using all {len(df)} rows")

-        # Normalización básica
+        # Basic normalization
        df["queue_skill"] = df["queue_skill"].astype(str).str.strip()
        df["channel"] = df["channel"].astype(str).str.strip()
        df["agent_id"] = df["agent_id"].astype(str).str.strip()

-        # Flags opcionales convertidos a bool cuando existan
+        # Optional flags converted to bool when they exist
        for flag_col in ["is_resolved", "abandoned_flag", "transfer_flag"]:
            if flag_col in df.columns:
                df[flag_col] = df[flag_col].astype(int).astype(bool)

-        # customer_id: usamos customer_id si existe, si no caller_id
+        # customer_id: we use customer_id if it exists, otherwise caller_id
        if "customer_id" in df.columns:
            df["customer_id"] = df["customer_id"].astype(str)
        elif "caller_id" in df.columns:
@@ -126,8 +125,8 @@ class OperationalPerformanceMetrics:
        else:
            df["customer_id"] = None

-        # logged_time opcional
-        # Normalizamos logged_time: siempre será una serie float con NaN si no existe
+        # logged_time optional
+        # Normalize logged_time: will always be a float series with NaN if it does not exist
        df["logged_time"] = pd.to_numeric(df.get("logged_time", np.nan), errors="coerce")


@@ -138,16 +137,16 @@ class OperationalPerformanceMetrics:
        return self.df.empty

    # ------------------------------------------------------------------ #
-    # AHT y variabilidad
+    # AHT and variability
    # ------------------------------------------------------------------ #
    def aht_distribution(self) -> Dict[str, float]:
        """
-        Devuelve P10, P50, P90 del AHT y el ratio P90/P50 como medida de variabilidad.
+        Returns P10, P50, P90 of AHT and the P90/P50 ratio as a measure of variability.

-        v3.0: Filtra NOISE y ZOMBIE para el cálculo de variabilidad.
-        Solo usa registros con record_status='valid' o sin status (legacy).
+        v3.0: Filters NOISE and ZOMBIE for variability calculation.
+        Only uses records with record_status='valid' or without status (legacy).
        """
-        # Filtrar solo registros válidos para cálculo de variabilidad
+        # Filter only valid records for variability calculation
        df_valid = self.df[self.df["_is_valid_for_cv"] == True]
        ht = df_valid["handle_time"].dropna().astype(float)
        if ht.empty:
@@ -167,10 +166,9 @@ class OperationalPerformanceMetrics:

    def talk_hold_acw_p50_by_skill(self) -> pd.DataFrame:
        """
-        P50 de talk_time, hold_time y wrap_up_time por skill.
+        P50 of talk_time, hold_time and wrap_up_time by skill.

-        Incluye queue_skill como columna (no solo índice) para que
-        el frontend pueda hacer lookup por nombre de skill.
+        Includes queue_skill as a column (not just index) so that the frontend can lookup by skill name.
        """
        df = self.df

@@ -192,24 +190,24 @@ class OperationalPerformanceMetrics:
        return result.round(2).sort_index().reset_index()

    # ------------------------------------------------------------------ #
-    # FCR, escalación, abandono, reincidencia, repetición canal
+    # FCR, escalation, abandonment, recurrence, channel repetition
    # ------------------------------------------------------------------ #
    def fcr_rate(self) -> float:
        """
        FCR (First Contact Resolution).

-        Prioridad 1: Usar fcr_real_flag del CSV si existe
-        Prioridad 2: Calcular como 100 - escalation_rate
+        Priority 1: Use fcr_real_flag from CSV if it exists
+        Priority 2: Calculate as 100 - escalation_rate
        """
        df = self.df
        total = len(df)
        if total == 0:
            return float("nan")

-        # Prioridad 1: Usar fcr_real_flag si existe
+        # Priority 1: Use fcr_real_flag if it exists
        if "fcr_real_flag" in df.columns:
            col = df["fcr_real_flag"]
-            # Normalizar a booleano
+            # Normalize to boolean
            if col.dtype == "O":
                fcr_mask = (
                    col.astype(str)
@@ -224,7 +222,7 @@ class OperationalPerformanceMetrics:
            fcr = (fcr_count / total) * 100.0
            return float(max(0.0, min(100.0, round(fcr, 2))))

-        # Prioridad 2: Fallback a 100 - escalation_rate
+        # Priority 2: Fallback to 100 - escalation_rate
        try:
            esc = self.escalation_rate()
        except Exception:
@@ -239,7 +237,7 @@ class OperationalPerformanceMetrics:

    def escalation_rate(self) -> float:
        """
-        % de interacciones que requieren escalación (transfer_flag == True).
+        % of interactions that require escalation (transfer_flag == True).
        """
        df = self.df
        total = len(df)
@@ -251,17 +249,17 @@ class OperationalPerformanceMetrics:

    def abandonment_rate(self) -> float:
        """
-        % de interacciones abandonadas.
+        % of abandoned interactions.

-        Busca en orden: is_abandoned, abandoned_flag, abandoned
-        Si ninguna columna existe, devuelve NaN.
+        Searches in order: is_abandoned, abandoned_flag, abandoned
+        If no column exists, returns NaN.
        """
        df = self.df
        total = len(df)
        if total == 0:
            return float("nan")

-        # Buscar columna de abandono en orden de prioridad
+        # Search for abandonment column in priority order
        abandon_col = None
        for col_name in ["is_abandoned", "abandoned_flag", "abandoned"]:
            if col_name in df.columns:
@@ -273,7 +271,7 @@ class OperationalPerformanceMetrics:

        col = df[abandon_col]

-        # Normalizar a booleano
+        # Normalize to boolean
        if col.dtype == "O":
            abandon_mask = (
                col.astype(str)
@@ -289,10 +287,9 @@ class OperationalPerformanceMetrics:

    def high_hold_time_rate(self, threshold_seconds: float = 60.0) -> float:
        """
-        % de interacciones con hold_time > threshold (por defecto 60s).
+        % of interactions with hold_time > threshold (default 60s).

-        Proxy de complejidad: si el agente tuvo que poner en espera al cliente
-        más de 60 segundos, probablemente tuvo que consultar/investigar.
+        Complexity proxy: if the agent had to put the customer on hold for more than 60 seconds, they probably had to consult/investigate.
        """
        df = self.df
        total = len(df)
@@ -306,44 +303,43 @@ class OperationalPerformanceMetrics:

    def recurrence_rate_7d(self) -> float:
        """
-        % de clientes que vuelven a contactar en < 7 días para el MISMO skill.
+        % of customers who contact again in < 7 days for the SAME skill.

-        Se basa en customer_id (o caller_id si no hay customer_id) + queue_skill.
-        Calcula:
-        - Para cada combinación cliente + skill, ordena por datetime_start
-        - Si hay dos contactos consecutivos separados < 7 días (mismo cliente, mismo skill),
-          cuenta como "recurrente"
-        - Tasa = nº clientes recurrentes / nº total de clientes
+        Based on customer_id (or caller_id if no customer_id) + queue_skill.
+        Calculates:
+        - For each client + skill combination, sorts by datetime_start
+        - If there are two consecutive contacts separated by < 7 days (same client, same skill), counts as "recurrent"
+        - Rate = number of recurrent clients / total number of clients

-        NOTA: Solo cuenta como recurrencia si el cliente llama por el MISMO skill.
-        Un cliente que llama a "Ventas" y luego a "Soporte" NO es recurrente.
+        NOTE: Only counts as recurrence if the client calls for the SAME skill.
+        A client who calls "Sales" and then "Support" is NOT recurrent.
        """

        df = self.df.dropna(subset=["datetime_start"]).copy()

-        # Normalizar identificador de cliente
+        # Normalize client identifier
        if "customer_id" not in df.columns:
            if "caller_id" in df.columns:
                df["customer_id"] = df["caller_id"]
            else:
-                # No hay identificador de cliente -> no se puede calcular
+                # No client identifier -> cannot calculate
                return float("nan")

        df = df.dropna(subset=["customer_id"])
        if df.empty:
            return float("nan")

-        # Ordenar por cliente + skill + fecha
+        # Sort by client + skill + date
        df = df.sort_values(["customer_id", "queue_skill", "datetime_start"])

-        # Diferencia de tiempo entre contactos consecutivos por cliente Y skill
-        # Esto asegura que solo contamos recontactos del mismo cliente para el mismo skill
+        # Time difference between consecutive contacts by client AND skill
+        # This ensures we only count re-contacts from the same client for the same skill
        df["delta"] = df.groupby(["customer_id", "queue_skill"])["datetime_start"].diff()

-        # Marcamos los contactos que ocurren a menos de 7 días del anterior (mismo skill)
+        # Mark contacts that occur less than 7 days from the previous one (same skill)
        recurrence_mask = df["delta"] < pd.Timedelta(days=7)

-        # Nº de clientes que tienen al menos un contacto recurrente (para cualquier skill)
+        # Number of clients who have at least one recurrent contact (for any skill)
        recurrent_customers = df.loc[recurrence_mask, "customer_id"].nunique()
        total_customers = df["customer_id"].nunique()

@@ -356,9 +352,9 @@ class OperationalPerformanceMetrics:

    def repeat_channel_rate(self) -> float:
        """
-        % de reincidencias (<7 días) en las que el cliente usa el MISMO canal.
+        % of recurrences (<7 days) in which the client uses the SAME channel.

-        Si no hay customer_id/caller_id o solo un contacto por cliente, devuelve NaN.
+        If there is no customer_id/caller_id or only one contact per client, returns NaN.
        """
        df = self.df.dropna(subset=["datetime_start"]).copy()
        if df["customer_id"].isna().all():
@@ -387,11 +383,11 @@ class OperationalPerformanceMetrics:
    # ------------------------------------------------------------------ #
    def occupancy_rate(self) -> float:
        """
-        Tasa de ocupación:
+        Occupancy rate:

        occupancy = sum(handle_time) / sum(logged_time) * 100.

-        Requiere columna 'logged_time'. Si no existe o es todo 0, devuelve NaN.
+        Requires 'logged_time' column. If it does not exist or is all 0, returns NaN.
        """
        df = self.df
        if "logged_time" not in df.columns:
@@ -408,23 +404,23 @@ class OperationalPerformanceMetrics:
        return float(round(occ * 100, 2))

    # ------------------------------------------------------------------ #
-    # Score de rendimiento 0-10
+    # Performance score 0-10
    # ------------------------------------------------------------------ #
    def performance_score(self) -> Dict[str, float]:
        """
-        Calcula un score 0-10 combinando:
-        - AHT (bajo es mejor)
-        - FCR (alto es mejor)
-        - Variabilidad (P90/P50, bajo es mejor)
-        - Otros factores (ocupación / escalación)
+        Calculates a 0-10 score combining:
+        - AHT (lower is better)
+        - FCR (higher is better)
+        - Variability (P90/P50, lower is better)
+        - Other factors (occupancy / escalation)

-        Fórmula:
+        Formula:
        score = 0.4 * (10 - AHT_norm) +
                0.3 * FCR_norm +
                0.2 * (10 - Var_norm) +
                0.1 * Otros_score

-        Donde *_norm son valores en escala 0-10.
+        Where *_norm are values on a 0-10 scale.
        """
        dist = self.aht_distribution()
        if not dist:
@@ -433,15 +429,15 @@ class OperationalPerformanceMetrics:
        p50 = dist["p50"]
        ratio = dist["p90_p50_ratio"]

-        # AHT_normalized: 0 (mejor) a 10 (peor)
+        # AHT_normalized: 0 (better) to 10 (worse)
        aht_norm = self._scale_to_0_10(p50, self.AHT_GOOD, self.AHT_BAD)
-        # FCR_normalized: 0-10 directamente desde % (0-100)
+        # FCR_normalized: 0-10 directly from % (0-100)
        fcr_pct = self.fcr_rate()
        fcr_norm = fcr_pct / 10.0 if not np.isnan(fcr_pct) else 0.0
-        # Variabilidad_normalized: 0 (ratio bueno) a 10 (ratio malo)
+        # Variability_normalized: 0 (good ratio) to 10 (bad ratio)
        var_norm = self._scale_to_0_10(ratio, self.VAR_RATIO_GOOD, self.VAR_RATIO_BAD)

-        # Otros factores: combinamos ocupación (ideal ~80%) y escalación (ideal baja)
+        # Other factors: combine occupancy (ideal ~80%) and escalation (ideal low)
        occ = self.occupancy_rate()
        esc = self.escalation_rate()

@@ -467,26 +463,26 @@ class OperationalPerformanceMetrics:

    def _scale_to_0_10(self, value: float, good: float, bad: float) -> float:
        """
-        Escala linealmente un valor:
+        Linearly scales a value:
        - good -> 0
        - bad  -> 10
-        Con saturación fuera de rango.
+        With saturation outside range.
        """
        if np.isnan(value):
-            return 5.0  # neutro
+            return 5.0  # neutral

        if good == bad:
            return 5.0

        if good < bad:
-            # Menor es mejor
+            # Lower is better
            if value <= good:
                return 0.0
            if value >= bad:
                return 10.0
            return 10.0 * (value - good) / (bad - good)
        else:
-            # Mayor es mejor
+            # Higher is better
            if value >= good:
                return 0.0
            if value <= bad:
@@ -495,19 +491,19 @@ class OperationalPerformanceMetrics:

    def _compute_other_factors_score(self, occ_pct: float, esc_pct: float) -> float:
        """
-        Otros factores (0-10) basados en:
-        - ocupación ideal alrededor de 80%
-        - tasa de escalación ideal baja (<10%)
+        Other factors (0-10) based on:
+        - ideal occupancy around 80%
+        - ideal escalation rate low (<10%)
        """
-        # Ocupación: 0 penalización si está entre 75-85, se penaliza fuera
+        # Occupancy: 0 penalty if between 75-85, penalized outside
        if np.isnan(occ_pct):
            occ_penalty = 5.0
        else:
            deviation = abs(occ_pct - 80.0)
-            occ_penalty = min(10.0, deviation / 5.0 * 2.0)  # cada 5 puntos se suman 2, máx 10
+            occ_penalty = min(10.0, deviation / 5.0 * 2.0)  # each 5 points add 2, max 10
        occ_score = max(0.0, 10.0 - occ_penalty)

-        # Escalación: 0-10 donde 0% -> 10 puntos, >=40% -> 0
+        # Escalation: 0-10 where 0% -> 10 points, >=40% -> 0
        if np.isnan(esc_pct):
            esc_score = 5.0
        else:
@@ -518,7 +514,7 @@ class OperationalPerformanceMetrics:
            else:
                esc_score = 10.0 * (1.0 - esc_pct / 40.0)

-        # Media simple de ambos
+        # Simple average of both
        return (occ_score + esc_score) / 2.0

    # ------------------------------------------------------------------ #
@@ -526,29 +522,29 @@ class OperationalPerformanceMetrics:
    # ------------------------------------------------------------------ #
    def plot_aht_boxplot_by_skill(self) -> Axes:
        """
-        Boxplot del AHT por skill (P10-P50-P90 visual).
+        Boxplot of AHT by skill (P10-P50-P90 visual).
        """
        df = self.df.copy()

        if df.empty or "handle_time" not in df.columns:
            fig, ax = plt.subplots()
-            ax.text(0.5, 0.5, "Sin datos de AHT", ha="center", va="center")
+            ax.text(0.5, 0.5, "No AHT data", ha="center", va="center")
            ax.set_axis_off()
            return ax

        df = df.dropna(subset=["handle_time"])
        if df.empty:
            fig, ax = plt.subplots()
-            ax.text(0.5, 0.5, "AHT no disponible", ha="center", va="center")
+            ax.text(0.5, 0.5, "AHT not available", ha="center", va="center")
            ax.set_axis_off()
            return ax

        fig, ax = plt.subplots(figsize=(8, 4))
        df.boxplot(column="handle_time", by="queue_skill", ax=ax, showfliers=False)

-        ax.set_xlabel("Skill / Cola")
-        ax.set_ylabel("AHT (segundos)")
-        ax.set_title("Distribución de AHT por skill")
+        ax.set_xlabel("Skill / Queue")
+        ax.set_ylabel("AHT (seconds)")
+        ax.set_title("AHT distribution by skill")
        plt.suptitle("")
        plt.xticks(rotation=45, ha="right")
        ax.grid(axis="y", alpha=0.3)
@@ -557,14 +553,14 @@ class OperationalPerformanceMetrics:

    def plot_resolution_funnel_by_skill(self) -> Axes:
        """
-        Funnel / barras apiladas de Talk + Hold + ACW por skill (P50).
+        Funnel / stacked bars of Talk + Hold + ACW by skill (P50).

-        Permite ver el equilibrio de tiempos por skill.
+        Allows viewing the time balance by skill.
        """
        p50 = self.talk_hold_acw_p50_by_skill()
        if p50.empty:
            fig, ax = plt.subplots()
-            ax.text(0.5, 0.5, "Sin datos para funnel", ha="center", va="center")
+            ax.text(0.5, 0.5, "No data for funnel", ha="center", va="center")
            ax.set_axis_off()
            return ax

@@ -583,27 +579,26 @@ class OperationalPerformanceMetrics:

        ax.set_xticks(x)
        ax.set_xticklabels(skills, rotation=45, ha="right")
-        ax.set_ylabel("Segundos")
-        ax.set_title("Funnel de resolución (P50) por skill")
+        ax.set_ylabel("Seconds")
+        ax.set_title("Resolution funnel (P50) by skill")
        ax.legend()
        ax.grid(axis="y", alpha=0.3)

        return ax

    # ------------------------------------------------------------------ #
-    # Métricas por skill (para consistencia frontend cached/fresh)
+    # Metrics by skill (for frontend cached/fresh consistency)
    # ------------------------------------------------------------------ #
    def metrics_by_skill(self) -> List[Dict[str, Any]]:
        """
-        Calcula métricas operacionales por skill:
-        - transfer_rate: % de interacciones con transfer_flag == True
-        - abandonment_rate: % de interacciones abandonadas
-        - fcr_tecnico: 100 - transfer_rate (sin transferencia)
-        - fcr_real: % sin transferencia Y sin recontacto 7d (si hay datos)
-        - volume: número de interacciones
+        Calculates operational metrics by skill:
+        - transfer_rate: % of interactions with transfer_flag == True
+        - abandonment_rate: % of abandoned interactions
+        - fcr_tecnico: 100 - transfer_rate (without transfer)
+        - fcr_real: % without transfer AND without 7d re-contact (if there is data)
+        - volume: number of interactions

-        Devuelve una lista de dicts, uno por skill, para que el frontend
-        tenga acceso a las métricas reales por skill (no estimadas).
+        Returns a list of dicts, one per skill, so that the frontend has access to real metrics by skill (not estimated).
        """
        df = self.df
        if df.empty:
@@ -611,14 +606,14 @@ class OperationalPerformanceMetrics:

        results = []

-        # Detectar columna de abandono
+        # Detect abandonment column
        abandon_col = None
        for col_name in ["is_abandoned", "abandoned_flag", "abandoned"]:
            if col_name in df.columns:
                abandon_col = col_name
                break

-        # Detectar columna de repeat_call_7d para FCR real
+        # Detect repeat_call_7d column for real FCR
        repeat_col = None
        for col_name in ["repeat_call_7d", "repeat_7d", "is_repeat_7d"]:
            if col_name in df.columns:
@@ -637,7 +632,7 @@ class OperationalPerformanceMetrics:
            else:
                transfer_rate = 0.0

-            # FCR Técnico = 100 - transfer_rate
+            # Technical FCR = 100 - transfer_rate
            fcr_tecnico = float(round(100.0 - transfer_rate, 2))

            # Abandonment rate
@@ -656,7 +651,7 @@ class OperationalPerformanceMetrics:
                abandoned = int(abandon_mask.sum())
                abandonment_rate = float(round(abandoned / total * 100, 2))

-            # FCR Real (sin transferencia Y sin recontacto 7d)
+            # Real FCR (without transfer AND without 7d re-contact)
            fcr_real = fcr_tecnico  # default to fcr_tecnico if no repeat data
            if repeat_col and "transfer_flag" in group.columns:
                repeat_data = group[repeat_col]
@@ -670,13 +665,13 @@ class OperationalPerformanceMetrics:
                else:
                    repeat_mask = pd.to_numeric(repeat_data, errors="coerce").fillna(0) > 0

-                # FCR Real: no transfer AND no repeat
+                # Real FCR: no transfer AND no repeat
                fcr_real_mask = (~group["transfer_flag"]) & (~repeat_mask)
                fcr_real_count = fcr_real_mask.sum()
                fcr_real = float(round(fcr_real_count / total * 100, 2))

-            # AHT Mean (promedio de handle_time sobre registros válidos)
-            # Filtramos solo registros 'valid' (excluye noise/zombie) para consistencia
+            # AHT Mean (average of handle_time over valid records)
+            # Filter only 'valid' records (excludes noise/zombie) for consistency
            if "_is_valid_for_cv" in group.columns:
                valid_records = group[group["_is_valid_for_cv"]]
            else:
@@ -687,15 +682,15 @@ class OperationalPerformanceMetrics:
            else:
                aht_mean = 0.0

-            # AHT Total (promedio de handle_time sobre TODOS los registros)
-            # Incluye NOISE, ZOMBIE, ABANDON - solo para información/comparación
+            # AHT Total (average of handle_time over ALL records)
+            # Includes NOISE, ZOMBIE, ABANDON - for information/comparison only
            if len(group) > 0 and "handle_time" in group.columns:
                aht_total = float(round(group["handle_time"].mean(), 2))
            else:
                aht_total = 0.0

-            # Hold Time Mean (promedio de hold_time sobre registros válidos)
-            # Consistente con fresh path que usa MEAN, no P50
+            # Hold Time Mean (average of hold_time over valid records)
+            # Consistent with fresh path that uses MEAN, not P50
            if len(valid_records) > 0 and "hold_time" in valid_records.columns:
                hold_time_mean = float(round(valid_records["hold_time"].mean(), 2))
            else: