npm - cdp-edge - Versions diffs - 2.0.4 → 2.0.5 - Mend

cdp-edge 2.0.4 → 2.0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (21) hide show

package/dist/commands/install.js +1 -1
package/dist/commands/setup.js +326 -111
package/extracted-skill/tracking-events-generator/INTEGRACAO-COMPLETA.md +89 -0
package/extracted-skill/tracking-events-generator/MELHORIAS-IMPLEMENTADAS.md +101 -0
package/extracted-skill/tracking-events-generator/agents/devops-agent.md +11 -0
package/extracted-skill/tracking-events-generator/agents/intelligence-agent.md +27 -0
package/extracted-skill/tracking-events-generator/agents/master-orchestrator.md +1 -1
package/extracted-skill/tracking-events-generator/knowledge-base.md +172 -0
package/package.json +1 -1
package/server-edge-tracker/INSTALAR.md +27 -3
package/server-edge-tracker/SEGMENTATION-DOCS.md +69 -0
package/server-edge-tracker/index.js +11 -0
package/server-edge-tracker/migrate-v7.sql +64 -0
package/server-edge-tracker/modules/dispatch/meta.js +16 -0
package/server-edge-tracker/modules/intelligence.js +120 -3
package/server-edge-tracker/modules/ml/logistic.js +195 -0
package/server-edge-tracker/modules/ml/ltv.js +100 -0
package/server-edge-tracker/modules/ml/matchquality.js +176 -0
package/server-edge-tracker/schema-indexes.sql +7 -7
package/server-edge-tracker/worker.js +395 -4
package/server-edge-tracker/wrangler.toml +13 -0

package/server-edge-tracker/modules/intelligence.js CHANGED Viewed

@@ -6,6 +6,9 @@
 import { sha256 } from './utils.js';
 import { getHealthMetrics, generateDailyReport, logIntelligence } from './db.js';
 import { sendCallMeBot } from './dispatch/whatsapp.js';
+import { autoDecideAbWinner } from './ml/ltv.js';
+import { analyzeMatchQuality, alertMatchQuality, purgeOldMatchQualityLogs } from './ml/matchquality.js';
+import { trainLogisticRegression, extractFeatures, saveWeights, LTV_WEIGHTS_KV_KEY } from './ml/logistic.js';
 // ── Versões esperadas das APIs ────────────────────────────────────────────────
 const EXPECTED_API_VERSIONS = {
@@ -77,6 +80,62 @@ export async function auditErrorRates(env, runType) {
   return alerts;
 }
+// ── Train the LTV model (logistic regression on real D1 data) ────────────────
+/**
+ * Trains the LTV conversion model and stores it as the active one.
+ *
+ * Reads up to 5000 leads created in the last 90 days, labels a lead 1 when a
+ * purchase event exists for the same user after the lead was created, trains
+ * the logistic regression, persists it through saveWeights and removes the
+ * cached weights from KV.
+ *
+ * @param {object} env - Worker bindings; uses env.DB and, when present, env.GEO_CACHE.
+ * @returns {Promise<object>} `{ trained, samples, accuracy, positiveRate }` on success,
+ *   `{ skipped, samples? }` when training did not run, `{ error }` when something threw.
+ */
+export async function trainLtvModel(env) {
+  if (!env.DB) return { skipped: 'DB não disponível' };
+  try {
+    // Leads plus a conversion label (confirmed purchase after the lead date)
+    const rows = await env.DB.prepare(`
+      SELECT
+        l.utm_source,
+        l.utm_medium,
+        l.engagement_score,
+        l.intention_level,
+        CAST(julianday('now') - julianday(l.created_at) AS INTEGER) AS days_since_lead,
+        CASE WHEN l.email IS NOT NULL AND l.email != '' THEN 1 ELSE 0 END AS has_email,
+        CASE WHEN l.phone IS NOT NULL AND l.phone != '' THEN 1 ELSE 0 END AS has_phone,
+        CASE WHEN (l.country = 'br' OR l.country = 'BR' OR l.country IS NULL) THEN 1 ELSE 0 END AS is_br,
+        CAST(strftime('%H', l.created_at) AS INTEGER) AS hour,
+        CASE WHEN EXISTS (
+          SELECT 1 FROM events e
+          WHERE e.user_id = l.user_id
+            AND e.event_name IN ('Purchase', 'purchase', 'PURCHASE')
+            AND e.created_at > l.created_at
+        ) THEN 1 ELSE 0 END AS label
+      FROM leads l
+      WHERE l.created_at >= datetime('now', '-90 days')
+      LIMIT 5000
+    `).all();
+    const dataset = (rows.results || []).map(row => ({
+      features: extractFeatures(row),
+      label:    row.label || 0,
+    }));
+    const model = trainLogisticRegression(dataset);
+    if (!model) {
+      console.log('[LTV Train] Dados insuficientes para treinar modelo');
+      return { skipped: 'dados insuficientes', samples: dataset.length };
+    }
+    await saveWeights(env.DB, model);
+    // Invalidate the KV cache so the next requests load the new model.
+    // Awaited so the delete has finished before this function returns; a KV
+    // failure is logged but must not fail a training run that already saved.
+    if (env.GEO_CACHE) {
+      try {
+        await env.GEO_CACHE.delete(LTV_WEIGHTS_KV_KEY);
+      } catch (cacheErr) {
+        console.warn('[LTV Train] Falha ao invalidar cache KV:', cacheErr.message);
+      }
+    }
+    console.log(`[LTV Train] Modelo treinado: ${dataset.length} samples, accuracy=${(model.accuracy * 100).toFixed(1)}%, positive_rate=${(model.positiveRate * 100).toFixed(1)}%`);
+    return { trained: true, samples: dataset.length, accuracy: model.accuracy, positiveRate: model.positiveRate };
+  } catch (err) {
+    console.error('[LTV Train] Erro:', err.message);
+    return { error: err.message };
+  }
+}
 // ── Runner principal do Intelligence Agent ────────────────────────────────────
 export async function runIntelligenceAgent(env, runType) {
   console.log(`[Intelligence Agent] Iniciando ${runType}`);
@@ -97,7 +156,61 @@ export async function runIntelligenceAgent(env, runType) {
     console.warn(`[Intelligence Agent] ${errorAlerts.length} alertas de taxa de erro enviados`);
   }
-  // 4. Auditoria mensal adicional
+  // 4. Treinar modelo LTV (toda semana)
+  const ltvTrainResult = await trainLtvModel(env);
+  if (ltvTrainResult.trained) {
+    console.log(`[Intelligence Agent] LTV model treinado: accuracy=${(ltvTrainResult.accuracy * 100).toFixed(1)}%`);
+    if (env.DB) {
+      await logIntelligence(env.DB, runType, 'ltv', 'model_training', 'ok',
+        `accuracy=${(ltvTrainResult.accuracy * 100).toFixed(1)}%`, null,
+        `Modelo LTV re-treinado com ${ltvTrainResult.samples} amostras`
+      ).catch(() => {});
+    }
+  } else {
+    console.log(`[Intelligence Agent] LTV model: ${ltvTrainResult.skipped || ltvTrainResult.error || 'sem dados'}`);
+  }
+  // 5. Auto-decisão de winner no A/B LTV Test
+  try {
+    const abResult = await autoDecideAbWinner(env);
+    if (abResult?.decided) {
+      console.log(`[Intelligence Agent] A/B LTV winner auto-decidido: test_id=${abResult.test_id}, winner=${abResult.winner_name}`);
+      await sendIntelligenceAlert(env, 'info',
+        `A/B LTV Test — Winner Declarado Automaticamente`,
+        `🏆 Vencedor: ${abResult.winner_name}\n📈 Melhoria: +${abResult.improvement?.toFixed(1) ?? '?'}pp vs controle\n🆔 Test ID: ${abResult.test_id}\n\n✅ Prompt vencedor ativado automaticamente`
+      );
+      if (env.DB) {
+        await logIntelligence(env.DB, runType, 'ltv', 'ab_auto_winner', 'ok',
+          abResult.winner_name, null,
+          `A/B winner auto-decidido: test ${abResult.test_id}, melhoria ${abResult.improvement?.toFixed(1)}pp`
+        ).catch(() => {});
+      }
+    }
+  } catch (err) {
+    console.error('[Intelligence Agent] A/B auto-decide error:', err.message);
+  }
+  // 6. Match Quality — análise + alertas
+  try {
+    const mqAnalysis = await analyzeMatchQuality(env);
+    if (mqAnalysis) {
+      console.log(`[Intelligence Agent] Match Quality: score=${mqAnalysis.composite_score ?? 0}%, alerts=${mqAnalysis.alerts?.length ?? 0}`);
+      await alertMatchQuality(env, mqAnalysis);
+      if (env.DB && mqAnalysis.total > 0) {
+        await logIntelligence(env.DB, runType, 'meta', 'match_quality', mqAnalysis.alerts?.length > 0 ? 'warning' : 'ok',
+          `${mqAnalysis.composite_score ?? 0}%`, '45%',
+          `Match quality 2h: email=${mqAnalysis.email_rate ?? 0}%, fbp=${mqAnalysis.fbp_rate ?? 0}%, score=${mqAnalysis.composite_score ?? 0}%`
+        ).catch(() => {});
+      }
+    }
+  } catch (err) {
+    console.error('[Intelligence Agent] Match quality analysis error:', err.message);
+  }
+  // 7. Auditoria mensal adicional
   if (runType === 'monthly_audit') {
     if (env.DB) {
       try {
@@ -115,14 +228,18 @@ export async function runIntelligenceAgent(env, runType) {
       } catch (err) {
         console.error('LTV audit error:', err.message);
       }
+      // Purge de logs antigos de match quality (> 30 dias)
+      await purgeOldMatchQualityLogs(env.DB);
+      console.log('[Intelligence Agent] Match quality logs antigos purgados');
     }
   }
-  // 5. Customer Match sync semanal
+  // 8. Customer Match sync semanal
   const cmResult = await syncMetaCustomAudience(env);
   console.log(`[Intelligence Agent] Customer Match Meta: sent=${cmResult?.sent ?? 0}, received=${cmResult?.num_received ?? 0}`);
-  console.log(`[Intelligence Agent] ${runType} concluído`);
+  console.log(`[Intelligence Agent] ${runType} concluído — LTV model, A/B auto-decide, match quality, customer match`);
 }
 // ── syncMetaCustomAudience — D1 → Meta Custom Audiences ─────────────────────

package/server-edge-tracker/modules/ml/logistic.js ADDED Viewed

@@ -0,0 +1,195 @@
+/**
+ * CDP Edge — Logistic Regression (pure JS, sem deps externas)
+ * Treina modelo de predição de conversão com dados reais do D1.
+ *
+ * Features usadas (todas normalizadas 0-1):
+ *   utm_source, engagement_score, intention_level, recency,
+ *   has_email, has_phone, is_br, hour_normalized
+ */
+// ── Feature Engineering ───────────────────────────────────────────────────────
+// Score per traffic source, keyed by the lower-cased, trimmed utm_source.
+const UTM_SCORES = {
+  facebook: 0.90, instagram: 0.90, meta: 0.90,
+  google:   0.82, youtube:   0.82,
+  tiktok:   0.75,
+  email:    0.68, sms: 0.68,
+  organic:  0.30,
+  direct:   0.20,
+};
+// Score per intention level, keyed by the lower-cased, trimmed intention_level.
+const INTENTION_SCORES = {
+  comprador:   1.00, high_intent: 1.00,
+  interessado: 0.60,
+  nurture:     0.30,
+  curioso:     0.15,
+};
+// Reads an own key of a score table; inherited keys such as "constructor"
+// (reachable through request-supplied strings) resolve to undefined.
+function lookupScore(table, key) {
+  return Object.prototype.hasOwnProperty.call(table, key) ? table[key] : undefined;
+}
+// Clamps a number into [0, 1]; NaN becomes 0 so it cannot poison the model math.
+function clamp01(value) {
+  if (Number.isNaN(value)) return 0;
+  return Math.min(1, Math.max(0, value));
+}
+/**
+ * Builds the 8-value feature vector used for training and inference.
+ * Order: utm_score, engagement, intention, recency, has_email, has_phone, is_br, hour.
+ *
+ * @param {object} row - Fields read: utm_source, engagement_score, intention_level,
+ *   days_since_lead, has_email, has_phone, is_br, hour.
+ * @returns {number[]} Eight numbers, each within 0-1.
+ */
+export function extractFeatures(row) {
+  const src       = String(row.utm_source || '').toLowerCase().trim();
+  const intention = String(row.intention_level || '').toLowerCase().trim();
+  const daysSince = row.days_since_lead || 0;
+  // Hour 0 (midnight) is a real value; only a missing or unparseable hour
+  // falls back to the neutral default of 12.
+  const parsedHour = Number.parseFloat(row.hour);
+  const hour       = Number.isNaN(parsedHour) ? 12 : parsedHour;
+  return [
+    lookupScore(UTM_SCORES, src) ?? (src ? 0.10 : 0.05),        // utm_score
+    clamp01((row.engagement_score || 0) / 5),                   // engagement (0-5 → 0-1)
+    lookupScore(INTENTION_SCORES, intention) ?? 0,              // intention
+    clamp01(1 - daysSince / 90),                                // recency (0 = 90 days ago, 1 = today)
+    row.has_email    ? 1 : 0,                                   // has_email
+    row.has_phone    ? 1 : 0,                                   // has_phone
+    row.is_br        ? 1 : 0,                                   // is_br
+    clamp01(hour / 23),                                         // hour normalized (0-23 → 0-1)
+  ];
+}
+// ── Sigmoid ───────────────────────────────────────────────────────────────────
+// Logistic function; inputs beyond ±20 return the saturated value directly.
+function sigmoid(z) {
+  if (z > 20) {
+    return 1;
+  }
+  return z < -20 ? 0 : 1 / (1 + Math.exp(-z));
+}
+// Weighted sum over the features; a missing or falsy weight counts as 0.
+function dot(weights, features) {
+  let total = 0;
+  features.forEach((value, index) => {
+    total += (weights[index] || 0) * value;
+  });
+  return total;
+}
+// ── Training ──────────────────────────────────────────────────────────────────
+/**
+ * Trains a logistic regression with batch gradient descent and L2 regularization.
+ *
+ * Returns null when the dataset has fewer than 50 samples or when the share of
+ * positive labels is below `minPositiveRate`.
+ *
+ * @param {Array<{features: number[], label: number}>} dataset
+ * @param {{ iterations?: number, learningRate?: number, lambda?: number, minPositiveRate?: number }} opts
+ *   iterations (default 200), learningRate (default 0.1), lambda (L2 strength,
+ *   default 0.01; 0 disables regularization), minPositiveRate (default 0.03).
+ * @returns {{ bias, weights, accuracy, positiveRate, sampleSize, threshold, featureNames, trainedAt } | null}
+ */
+export function trainLogisticRegression(dataset, opts = {}) {
+  if (!dataset || dataset.length < 50) {
+    return null; // not enough data
+  }
+  const iterations   = opts.iterations   || 200;
+  const learningRate = opts.learningRate || 0.1;
+  // `??` rather than `||`: an explicit lambda of 0 is a valid request for no
+  // regularization and must not be replaced by the default.
+  const lambda          = opts.lambda ?? 0.01; // L2 regularization
+  const minPositiveRate = opts.minPositiveRate ?? 0.03;
+  const nFeatures    = dataset[0].features.length;
+  const n            = dataset.length;
+  let bias    = 0;
+  let weights = new Array(nFeatures).fill(0);
+  const positives = dataset.filter(d => d.label === 1).length;
+  const positiveRate = positives / n;
+  // Below the minimum positive share (3% by default) there is too little
+  // purchase data to train on.
+  if (positiveRate < minPositiveRate) return null;
+  for (let iter = 0; iter < iterations; iter++) {
+    let dBias    = 0;
+    const dWeights = new Array(nFeatures).fill(0);
+    for (const { features, label } of dataset) {
+      const z     = dot(weights, features) + bias;
+      const pred  = sigmoid(z);
+      const error = pred - label;
+      dBias += error;
+      for (let j = 0; j < nFeatures; j++) {
+        dWeights[j] += error * features[j];
+      }
+    }
+    bias -= learningRate * (dBias / n);
+    for (let j = 0; j < nFeatures; j++) {
+      // L2: penalizes large weights to limit overfitting
+      weights[j] -= learningRate * ((dWeights[j] / n) + lambda * weights[j]);
+    }
+  }
+  // Accuracy is measured on the training set itself. With few positives the
+  // decision threshold is lowered (never below 0.3) instead of using 0.5.
+  let correct = 0;
+  const threshold = positiveRate > 0.3 ? 0.5 : Math.max(0.3, positiveRate * 1.5);
+  for (const { features, label } of dataset) {
+    const z    = dot(weights, features) + bias;
+    const pred = sigmoid(z) >= threshold ? 1 : 0;
+    if (pred === label) correct++;
+  }
+  const accuracy = correct / n;
+  return {
+    bias,
+    weights,
+    accuracy,
+    positiveRate,
+    sampleSize: n,
+    threshold,
+    featureNames: ['utm_score', 'engagement', 'intention', 'recency', 'has_email', 'has_phone', 'is_br', 'hour'],
+    trainedAt: new Date().toISOString(),
+  };
+}
+// ── Inference ─────────────────────────────────────────────────────────────────
+/**
+ * Scores a feature vector with trained weights.
+ * @param {{ bias, weights, threshold }} model - Only `weights` and `bias` are read.
+ * @param {number[]} features
+ * @returns {number} Conversion probability as a rounded integer, 0-100.
+ */
+export function predictWithWeights(model, features) {
+  const probability = sigmoid(dot(model.weights, features) + model.bias);
+  const percent = probability * 100;
+  return Math.round(percent);
+}
+// ── Persistence helpers ───────────────────────────────────────────────────────
+export const LTV_WEIGHTS_KV_KEY = 'ltv_weights_active';
+/**
+ * Loads the active model, trying the KV cache first and D1 second.
+ * A model read from D1 is written back to KV (7-day TTL) without waiting.
+ *
+ * @param {object} env - Worker bindings; uses env.GEO_CACHE and env.DB when present.
+ * @returns {Promise<object|null>} The stored model, or null when none can be loaded.
+ */
+export async function loadActiveWeights(env) {
+  const kv = env.GEO_CACHE;
+  // 1. KV cache; any read failure falls through to D1
+  if (kv) {
+    try {
+      const fromCache = await kv.get(LTV_WEIGHTS_KV_KEY, 'json');
+      if (fromCache?.weights?.length) return fromCache;
+    } catch {}
+  }
+  // 2. Fallback: D1
+  const db = env.DB;
+  if (!db) return null;
+  try {
+    const active = await db.prepare(
+      `SELECT weights_json FROM ltv_model_weights WHERE is_active = 1 ORDER BY trained_at DESC LIMIT 1`
+    ).first();
+    const serialized = active?.weights_json;
+    if (!serialized) return null;
+    const model = JSON.parse(serialized);
+    // Warm the KV cache for the next requests (fire-and-forget)
+    const cacheable = Boolean(kv) && Boolean(model?.weights?.length);
+    if (cacheable) {
+      kv.put(LTV_WEIGHTS_KV_KEY, JSON.stringify(model), { expirationTtl: 604800 }).catch(() => {});
+    }
+    return model;
+  } catch {
+    return null;
+  }
+}
+/**
+ * Stores a trained model as the single active row of ltv_model_weights.
+ *
+ * The "deactivate previous" and "insert new" statements are sent together
+ * through DB.batch when the binding offers it (D1 runs a batch as one
+ * transaction), so a failed insert cannot leave the table without an active
+ * model. Without batch support the two statements run one after the other.
+ *
+ * @param {object} DB - D1 database binding.
+ * @param {object} model - Result of trainLogisticRegression; stored whole as JSON.
+ * @returns {Promise<void>} Does nothing when DB or model is missing.
+ */
+export async function saveWeights(DB, model) {
+  if (!DB || !model) return;
+  const now = new Date().toISOString();
+  // Deactivate the previous model
+  const deactivate = DB.prepare(`UPDATE ltv_model_weights SET is_active = 0 WHERE is_active = 1`);
+  // Insert the new one as active
+  const insert = DB.prepare(`
+    INSERT INTO ltv_model_weights (trained_at, is_active, sample_size, positive_rate, accuracy, weights_json)
+    VALUES (?, 1, ?, ?, ?, ?)
+  `).bind(
+    now,
+    model.sampleSize,
+    model.positiveRate,
+    model.accuracy,
+    JSON.stringify(model),
+  );
+  if (typeof DB.batch === 'function') {
+    await DB.batch([deactivate, insert]);
+    return;
+  }
+  await deactivate.run();
+  await insert.run();
+}

package/server-edge-tracker/modules/ml/ltv.js CHANGED Viewed

@@ -3,11 +3,43 @@
  * predictLtv, getLtvAbVariation, recordAbAssignment, handlers /api/ltv/*
  */
+import { extractFeatures, predictWithWeights, loadActiveWeights } from './logistic.js';
 // Cache key para o teste ativo (KV — evita hit no D1 a cada request /track)
 const AB_LTV_CACHE_KEY = 'ab_ltv_active_test';
 // ── predictLtv — Heurística em 5 dimensões (0-100 pts) ───────────────────────
 export async function predictLtv(env, payload, request, customSystemPrompt = null) {
+  // ── Tentar modelo treinado (regressão logística real) ─────────────────────
+  // Se existir modelo ativo no KV/D1, usa-o em vez da heurística manual.
+  // Fallback automático para heurística se modelo não disponível.
+  try {
+    const model = await loadActiveWeights(env);
+    if (model?.weights?.length) {
+      const hour    = new Date().getUTCHours();
+      const country = (payload.country || request?.cf?.country || '').toUpperCase();
+      const features = extractFeatures({
+        utm_source:      payload.utmSource,
+        engagement_score: parseFloat(payload.engagementScore || 0),
+        intention_level: payload.intentionLevel,
+        days_since_lead: 0,  // evento atual = recência máxima
+        has_email:       !!payload.email,
+        has_phone:       !!payload.phone,
+        is_br:           country === 'BR',
+        hour,
+      });
+      const score100 = predictWithWeights(model, features);
+      const ltvClass    = score100 >= 70 ? 'High' : score100 >= 40 ? 'Medium' : 'Low';
+      const ltvMultiplier = score100 >= 70 ? 3.5 : score100 >= 40 ? 1.8 : 0.8;
+      const productValue  = payload.value ? parseFloat(payload.value) : 0;
+      const baseValue     = productValue > 0 ? productValue : 197;
+      const predictedValue = Math.round(baseValue * ltvMultiplier * 100) / 100;
+      return { score: score100, class: ltvClass, value: predictedValue, source: 'model' };
+    }
+  } catch { /* fallback para heurística */ }
   let score = 0;
   // 1. Engajamento browser (0–30)
@@ -318,3 +350,71 @@ export async function handleLtvAbTestWinner(env, request, headers) {
     return new Response(JSON.stringify({ error: err.message }), { status: 500, headers });
   }
 }
+// ── autoDecideAbWinner — declares the A/B winner automatically (cron) ────────
+// Criteria: every variation has at least min_sample assignments
+//           AND the best accuracy_score beats the control by >= 5pp
+/**
+ * Picks the winner of the most recent running LTV A/B test when the criteria
+ * above are met, marks the test completed and clears the cached active test.
+ *
+ * accuracy_score values are compared as fractions (0.05 = 5pp).
+ *
+ * @param {object} env - Worker bindings; uses env.DB and, when present, env.GEO_CACHE.
+ * @returns {Promise<object>} `{ decided: false, reason }` when nothing was declared.
+ *   Otherwise `{ decided: true, test_id, test_name, winner_id, winner_name,
+ *   improvement, improvement_label, is_control_winner, winning_prompt }`, where
+ *   `improvement` is the gain over the control in percentage points as a number
+ *   (one decimal) and `improvement_label` is the same value formatted as "+X.Xpp".
+ */
+export async function autoDecideAbWinner(env) {
+  if (!env.DB) return { decided: false, reason: 'no_db' };
+  // Smallest accuracy_score gap (as a fraction) that declares a winner.
+  const MIN_DIFF = 0.05;
+  // Tolerance so an exact 5pp gap is not lost to float error (0.35 - 0.30 < 0.05).
+  const EPSILON = 1e-9;
+  const scoreOf = v => parseFloat(v.accuracy_score || 0);
+  try {
+    // Most recent running test
+    const test = await env.DB.prepare(
+      `SELECT id, name, min_sample, status FROM ltv_ab_tests WHERE status = 'running' ORDER BY id DESC LIMIT 1`
+    ).first();
+    if (!test) return { decided: false, reason: 'no_running_test' };
+    // Performance of each variation
+    const perf = await env.DB.prepare(
+      `SELECT * FROM v_ab_test_performance WHERE test_id = ?`
+    ).bind(test.id).all();
+    const variations = perf.results || [];
+    if (variations.length < 2) return { decided: false, reason: 'insufficient_variations' };
+    // Every variation needs enough assignments
+    const allReady = variations.every(v => (v.total_assigned || 0) >= test.min_sample);
+    if (!allReady) {
+      const minAssigned = Math.min(...variations.map(v => v.total_assigned || 0));
+      return { decided: false, reason: `sample_insufficient (${minAssigned}/${test.min_sample})` };
+    }
+    // Best variation (scores compared as numbers) and the control
+    const best    = variations.reduce((a, b) => scoreOf(b) > scoreOf(a) ? b : a);
+    const control = variations.find(v => v.is_control) || variations[0];
+    const diff    = scoreOf(best) - scoreOf(control);
+    // Below the margin no winner is declared and the test keeps running
+    if (diff < MIN_DIFF - EPSILON) {
+      return { decided: false, reason: `difference_too_small (${(diff * 100).toFixed(1)}pp < 5pp)` };
+    }
+    // Declare the winner
+    await env.DB.prepare(
+      `UPDATE ltv_ab_tests SET winner_id = ?, status = 'completed', completed_at = datetime('now') WHERE id = ?`
+    ).bind(best.variation_id, test.id).run();
+    if (env.GEO_CACHE) await env.GEO_CACHE.delete(AB_LTV_CACHE_KEY);
+    console.log(`[AB-LTV] Winner auto-declarado: teste ${test.id}, variação "${best.variation_name}" (+${(diff * 100).toFixed(1)}pp)`);
+    // Numeric so that callers can format it themselves (`improvement.toFixed(1)`)
+    const improvement = Number((diff * 100).toFixed(1));
+    return {
+      decided:       true,
+      test_id:       test.id,
+      test_name:     test.name,
+      winner_id:     best.variation_id,
+      winner_name:   best.variation_name,
+      improvement,
+      improvement_label: `+${(diff * 100).toFixed(1)}pp`,
+      is_control_winner: best.variation_id === control.variation_id,
+      winning_prompt: best.system_prompt || null,
+    };
+  } catch (err) {
+    console.error('[AB-LTV] autoDecide error:', err.message);
+    return { decided: false, reason: err.message };
+  }
+}

package/server-edge-tracker/modules/ml/matchquality.js ADDED Viewed

@@ -0,0 +1,176 @@
+/**
+ * CDP Edge — Match Quality (Fase 5)
+ * Rastreia qualidade dos dados enviados ao Meta CAPI.
+ * Detecta degradação e alerta via CallMeBot.
+ * Tenta auto-correção onde possível.
+ */
+import { sendCallMeBot } from '../dispatch/whatsapp.js';
+// ── Alert thresholds ──────────────────────────────────────────────────────────
+const THRESHOLDS = {
+  email_rate_min:   0.40,  // < 40% of events carrying an email → alert
+  fbp_rate_min:     0.30,  // < 30% carrying the fbp cookie → alert
+  composite_min:    0.45,  // < 45% composite score → critical alert
+  min_events_alert: 10,    // minimum number of events in the last 2h before any alert fires
+};
+// ── Quality log (called from meta.js on every dispatch) ──────────────────────
+/**
+ * Writes one row of presence flags (0/1) for an event into match_quality_log.
+ * Failures are swallowed so that logging can never block the dispatch.
+ *
+ * @param {object} DB - D1 database binding; nothing happens when it is missing.
+ * @param {string} eventName
+ * @param {object} payload - Fields read: email, phone, fbp, fbc, userId.
+ * @param {{ email?: boolean, utm?: boolean }} recovered - Recovery flags for this event.
+ */
+export async function logMatchQuality(DB, eventName, payload, recovered = {}) {
+  if (!DB) return;
+  const flag = value => (value ? 1 : 0);
+  try {
+    const statement = DB.prepare(`
+      INSERT INTO match_quality_log (
+        event_name, has_email, has_phone, has_fbp, has_fbc, has_external_id,
+        was_email_recovered, was_utm_restored
+      ) VALUES (?,?,?,?,?,?,?,?)
+    `);
+    const bound = statement.bind(
+      eventName,
+      flag(payload.email),
+      flag(payload.phone),
+      flag(payload.fbp),
+      flag(payload.fbc),
+      flag(payload.userId),
+      flag(recovered.email),
+      flag(recovered.utm),
+    );
+    await bound.run();
+  } catch { /* never block the dispatch */ }
+}
+// ── Payload auto-correction ───────────────────────────────────────────────────
+/**
+ * Fills missing identifiers on the payload from the stored user profile.
+ * The lookup only runs when the payload has a userId but no email; the payload
+ * object is modified in place.
+ *
+ * @param {object} env - Worker bindings; uses env.DB.
+ * @param {object} payload - Event payload (email, phone, fbp, fbc, userId, utmRestored).
+ * @returns {Promise<{ payload: object, recovered: { email: boolean, utm: boolean } }>}
+ */
+export async function autoEnrichPayload(env, payload) {
+  const recovered = { email: false, utm: false };
+  if (!env.DB) return { payload, recovered };
+  // 1. Recover email/fbp/fbc/phone from the profile stored for this userId
+  const needsLookup = !payload.email && payload.userId;
+  if (needsLookup) {
+    try {
+      const profile = await env.DB.prepare(
+        `SELECT email, fbp, fbc, phone FROM user_profiles WHERE user_id = ? LIMIT 1`
+      ).bind(payload.userId).first();
+      if (profile) {
+        if (profile.email && !payload.email) {
+          payload.email   = profile.email;
+          recovered.email = true;
+        }
+        // Remaining identifiers are copied only where the payload has none
+        for (const field of ['fbp', 'fbc', 'phone']) {
+          if (profile[field] && !payload[field]) {
+            payload[field] = profile[field];
+          }
+        }
+      }
+    } catch {}
+  }
+  // 2. UTM restoration is reported by the payload itself (payload.utmRestored)
+  recovered.utm = payload.utmRestored ? true : false;
+  return { payload, recovered };
+}
+// ── Quality analysis (called by the cron) ────────────────────────────────────
+/**
+ * Aggregates match_quality_log over the last 2 hours and derives alerts.
+ *
+ * @param {object} env - Worker bindings; uses env.DB.
+ * @returns {Promise<object|null>} null without a DB or when the query fails;
+ *   `{ total, alerts: [] }` when there are fewer events than
+ *   THRESHOLDS.min_events_alert; otherwise the aggregated row (rates in
+ *   percent) plus an `alerts` array of `{ type, metric, message, severity? }`.
+ */
+export async function analyzeMatchQuality(env) {
+  if (!env.DB) return null;
+  try {
+    const row = await env.DB.prepare(`
+      SELECT
+        COUNT(*)                             AS total,
+        ROUND(AVG(has_email)       * 100, 1) AS email_rate,
+        ROUND(AVG(has_phone)       * 100, 1) AS phone_rate,
+        ROUND(AVG(has_fbp)         * 100, 1) AS fbp_rate,
+        ROUND(AVG(has_fbc)         * 100, 1) AS fbc_rate,
+        ROUND(AVG(has_external_id) * 100, 1) AS ext_id_rate,
+        ROUND(AVG(was_email_recovered) * 100, 1) AS email_recovered_rate,
+        ROUND((AVG(has_email)*0.4 + AVG(has_fbp)*0.3 + AVG(has_phone)*0.2 + AVG(has_fbc)*0.1) * 100, 1) AS composite_score
+      FROM match_quality_log
+      WHERE logged_at >= datetime('now', '-2 hours')
+    `).first();
+    if (!row || row.total < THRESHOLDS.min_events_alert) return { total: row?.total || 0, alerts: [] };
+    // A missing rate counts as 0, both for the comparison and in the text,
+    // so a message never reads "null%".
+    const emailRate = row.email_rate || 0;
+    const fbpRate   = row.fbp_rate || 0;
+    const composite = row.composite_score || 0;
+    const alerts = [];
+    if (emailRate < THRESHOLDS.email_rate_min * 100) {
+      alerts.push({
+        type:    'email_low',
+        metric:  `email_rate: ${emailRate}%`,
+        message: `Taxa de email baixa: ${emailRate}% (mínimo: ${THRESHOLDS.email_rate_min * 100}%)`,
+      });
+    }
+    if (fbpRate < THRESHOLDS.fbp_rate_min * 100) {
+      // Rounded to one decimal: a float subtraction can leave trailing noise
+      const fbpMissing = Number((100 - fbpRate).toFixed(1));
+      alerts.push({
+        type:    'fbp_low',
+        metric:  `fbp_rate: ${fbpRate}%`,
+        message: `Cookie fbp ausente em ${fbpMissing}% dos eventos — verificar cdpTrack.js`,
+      });
+    }
+    if (composite < THRESHOLDS.composite_min * 100) {
+      alerts.push({
+        type:    'composite_critical',
+        metric:  `composite: ${composite}%`,
+        message: `Score composto de match quality crítico: ${composite}%`,
+        severity: 'critical',
+      });
+    }
+    return { ...row, alerts };
+  } catch (err) {
+    console.error('[MatchQuality] analyze error:', err.message);
+    return null;
+  }
+}
+// ── Alert via CallMeBot ───────────────────────────────────────────────────────
+/**
+ * Sends a match-quality summary through sendCallMeBot when the analysis
+ * carries at least one alert; otherwise does nothing.
+ *
+ * @param {object} env - Worker bindings, passed through to sendCallMeBot.
+ * @param {object|null} analysis - Result of analyzeMatchQuality.
+ * @returns {Promise<void>}
+ */
+export async function alertMatchQuality(env, analysis) {
+  // Also covers an analysis object that has no alerts array at all
+  if (!analysis?.alerts?.length) return;
+  const hasCritical = analysis.alerts.some(a => a.severity === 'critical');
+  const icon        = hasCritical ? '🚨' : '⚠️';
+  // The pass/fail marks use the same limits that produce the alerts
+  const emailMin  = THRESHOLDS.email_rate_min * 100;
+  const fbpMin    = THRESHOLDS.fbp_rate_min * 100;
+  const emailRate = analysis.email_rate ?? 0;
+  const fbpRate   = analysis.fbp_rate ?? 0;
+  const lines = [
+    `${icon} CDP Edge — Match Quality Alert`,
+    ``,
+    `📊 Últimas 2h (${analysis.total} eventos):`,
+    `  Email:     ${emailRate}% ${emailRate < emailMin ? '❌' : '✅'}`,
+    `  fbp:       ${fbpRate}% ${fbpRate < fbpMin ? '❌' : '✅'}`,
+    `  Score:     ${analysis.composite_score ?? 0}%`,
+    ``,
+    `🔍 Problemas:`,
+    ...analysis.alerts.map(a => `  · ${a.message}`),
+    ``,
+    `🛠 Ações automáticas já ativas:`,
+    `  · Identity Graph recovery: ${analysis.email_recovered_rate ?? 0}% emails recuperados`,
+    `  · UTM Resurrection ativa`,
+    ``,
+    new Date().toLocaleString('pt-BR', { timeZone: 'America/Sao_Paulo' }),
+  ];
+  await sendCallMeBot(env, lines.join('\n'));
+}
+// ── Periodic purge (monthly) ──────────────────────────────────────────────────
+/**
+ * Deletes match_quality_log rows older than 30 days.
+ * A failure is logged and not rethrown, so the calling job keeps running.
+ *
+ * @param {object} DB - D1 database binding; nothing happens when it is missing.
+ * @returns {Promise<void>}
+ */
+export async function purgeOldMatchQualityLogs(DB) {
+  if (!DB) return;
+  try {
+    await DB.prepare(
+      `DELETE FROM match_quality_log WHERE logged_at < datetime('now', '-30 days')`
+    ).run();
+  } catch (err) {
+    // Logged so a failed purge is visible instead of passing silently
+    console.error('[MatchQuality] purge error:', err.message);
+  }
+}

package/server-edge-tracker/schema-indexes.sql CHANGED Viewed

@@ -46,13 +46,13 @@ CREATE INDEX IF NOT EXISTS idx_profiles_email_updated
 -- ── fraud_signals: dashboard e alertas ───────────────────────────────────────
--- handleFraudAlerts: filtra por ip + período
-CREATE INDEX IF NOT EXISTS idx_fraud_ip_created
-  ON fraud_signals(ip_address, created_at DESC);
+-- handleFraudAlerts: filtra por ip + período (coluna: detected_at)
+CREATE INDEX IF NOT EXISTS idx_fraud_ip_detected
+  ON fraud_signals(ip_address, detected_at DESC);
 -- handleFraudStats: fraud_score >= threshold ordenado por data
-CREATE INDEX IF NOT EXISTS idx_fraud_score_created
-  ON fraud_signals(fraud_score DESC, created_at DESC);
+CREATE INDEX IF NOT EXISTS idx_fraud_score_detected
+  ON fraud_signals(fraud_score DESC, detected_at DESC);
 -- ── ltv_ab_assignments: resultados de A/B test ───────────────────────────────
@@ -62,6 +62,6 @@ CREATE INDEX IF NOT EXISTS idx_ab_testid_class
 -- ── ml_segment_members: join com leads para bidding ─────────────────────────
--- handleBiddingRecommend: segment_id lookup
+-- handleBiddingRecommend: segment_id lookup (coluna: assigned_at)
 CREATE INDEX IF NOT EXISTS idx_seg_members_segid
-  ON ml_segment_members(segment_id, joined_at DESC);
+  ON ml_segment_members(cluster_id, assigned_at DESC);