npm - @saulwade/swl-ses - Versions diffs - 1.5.1 → 1.5.2 - Mend

@saulwade/swl-ses 1.5.1 → 1.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (133) hide show

package/CLAUDE.md +225 -209
package/README.md +561 -561
package/agentes/arquitecto-swl.md +33 -1
package/agentes/nemesis-auditor-swl.md +59 -19
package/bin/swl-mcp-server.js +214 -214
package/comandos/swl/.evolved.json +22 -22
package/comandos/swl/contribuir.md +233 -233
package/comandos/swl/nemesis.md +230 -56
package/gateway/lib/event-channel.js +191 -191
package/habilidades/backend-production-resilience/SKILL.md +288 -288
package/habilidades/benchmark-memoria/SKILL.md +186 -186
package/habilidades/diagrama-arquitectura/assets/template.html +276 -276
package/habilidades/doubt-driven-review/SKILL.md +171 -171
package/habilidades/doubt-driven-review/recursos/EXAMPLES.md +130 -130
package/habilidades/ejecutar-task-iterativo/SKILL.md +278 -278
package/habilidades/eval-framework/SKILL.md +212 -212
package/habilidades/feynman-auditor-swl/SKILL.md +123 -123
package/habilidades/feynman-auditor-swl/recursos/preguntas-language-agnostic.md +108 -108
package/habilidades/harness-claude-code/SKILL.md +299 -299
package/habilidades/infra-github-actions/SKILL.md +166 -166
package/habilidades/legacy-code-rescue/SKILL.md +267 -267
package/habilidades/manejo-errores/.evolved.json +8 -8
package/habilidades/meta-skills-estandar/SKILL.md +207 -4
package/habilidades/meta-skills-estandar/recursos/convencion-examples.md +93 -93
package/habilidades/meta-skills-estandar/recursos/skills-as-agents.md +163 -163
package/habilidades/nemesis-evaluacion-json/SKILL.md +266 -0
package/habilidades/nemesis-redistribuir/SKILL.md +341 -0
package/habilidades/node-experto/SKILL.md +94 -4
package/habilidades/patrones-python/SKILL.md +229 -229
package/habilidades/patrones-python/recursos/patrones-avanzados.md +469 -469
package/habilidades/planear-fase/SKILL.md +319 -319
package/habilidades/protocolo-revision-swl/SKILL.md +350 -276
package/habilidades/release-semver/.evolved.json +8 -8
package/habilidades/state-inconsistency-auditor-swl/SKILL.md +166 -166
package/habilidades/state-inconsistency-auditor-swl/recursos/coupled-state-patterns.md +147 -147
package/habilidades/tdd-workflow/SKILL.md +121 -4
package/habilidades/testing-python/SKILL.md +340 -340
package/habilidades/web-fetcher-routing/SKILL.md +75 -75
package/hooks/check-update.js +31 -3
package/hooks/claudemd-bloat-detector.js +161 -161
package/hooks/lib/agent-routing.js +107 -107
package/hooks/lib/auto-consolidator.js +335 -335
package/hooks/lib/error-classifier.js +308 -308
package/hooks/lib/merkle-audit.js +96 -96
package/hooks/lib/provenance-tracker.js +191 -191
package/hooks/lib/rate-limit-tracker.js +253 -253
package/hooks/lib/resource-quota.js +122 -122
package/hooks/lib/retry-jitter.js +165 -165
package/hooks/lib/security-net.js +201 -201
package/hooks/lib/skill-auditor.js +588 -588
package/hooks/lib/sync-status.js +228 -228
package/hooks/lib/taint-tracker.js +107 -107
package/hooks/lib/text-similarity.js +241 -241
package/hooks/lib/toon-compressor.js +245 -245
package/hooks/registro-turnos.js +209 -209
package/hooks/sugerir-regenerar-inventario.js +170 -170
package/hooks/validar-formato-post-subagente.js +140 -140
package/hooks/validar-memoria-hook.js +218 -218
package/instintos/prompt-appendices.yaml +57 -57
package/manifiestos/agent-output-schemas.json +57 -57
package/manifiestos/modulos.json +1324 -1321
package/manifiestos/skills-lock.json +1114 -1114
package/package.json +2 -2
package/plantillas/auditor-veto-template.md +105 -105
package/plantillas/github-workflows/README.md +47 -47
package/plantillas/github-workflows/release-please.yml +44 -44
package/plantillas/github-workflows/swl-ci.yml +107 -107
package/plantillas/github-workflows/swl-security.yml +51 -51
package/plugin.json +353 -351
package/reglas/analisis-previo-tareas-grandes.md +172 -172
package/reglas/arreglar-al-detectar.md +147 -147
package/reglas/fragmentos-compartidos.md +152 -152
package/reglas/harness-claude-code.md +213 -213
package/reglas/registro-componentes-nuevos.md +192 -0
package/reglas/usar-context7.md +226 -226
package/schemas/diary-entry.schema.json +80 -80
package/scripts/actualizar.js +110 -1
package/scripts/audit-tools/audit-history.js +330 -330
package/scripts/audit-tools/bundle-tracker.js +290 -290
package/scripts/audit-tools/canary-monitor.js +352 -352
package/scripts/audit-tools/code-profiler.js +605 -605
package/scripts/audit-tools/dep-doctor.js +320 -320
package/scripts/audit-tools/env-validator.js +206 -206
package/scripts/audit-tools/lib/fs-walk.js +48 -48
package/scripts/audit-tools/lib/output.js +23 -23
package/scripts/audit-tools/migration-checker.js +392 -392
package/scripts/audit-tools/pentest-scanner.js +1436 -1436
package/scripts/benchmark-memoria.js +167 -167
package/scripts/configurar-branch-protection.js +418 -418
package/scripts/derivar-feature-list.js +489 -489
package/scripts/detectar-aprendizajes-duplicados.js +151 -151
package/scripts/doctor.js +27 -0
package/scripts/field-report.js +199 -199
package/scripts/generar-checklists-consolidados.js +273 -273
package/scripts/generar-inventario.js +420 -420
package/scripts/generar-matriz-lenguajes.js +271 -271
package/scripts/lib/artefactos-python.js +43 -43
package/scripts/lib/benchmark-metrics.js +160 -160
package/scripts/lib/budget-enforcer.js +252 -252
package/scripts/lib/configurar-ci.js +380 -380
package/scripts/lib/contadores-inventario.js +217 -217
package/scripts/lib/detectar-stack-detallado.js +307 -307
package/scripts/lib/diary-entry.js +234 -234
package/scripts/lib/eval-metrics-store.js +218 -218
package/scripts/lib/eval-quality.js +171 -171
package/scripts/lib/eval-schemas.js +144 -144
package/scripts/lib/eval-self-correct.js +106 -106
package/scripts/lib/eval-validator.js +185 -185
package/scripts/lib/expandir-targets.js +71 -71
package/scripts/lib/jaccard-similarity.js +98 -98
package/scripts/lib/longmemeval-runner.js +125 -125
package/scripts/lib/mcp_config.py +127 -0
package/scripts/lib/npm-version.js +261 -261
package/scripts/lib/paquetes-conocidos.js +50 -50
package/scripts/lib/prompt-builder.js +264 -264
package/scripts/lib/rrf-fusion.js +175 -175
package/scripts/lib/scoring-instintos.js +277 -277
package/scripts/lib/semantic-search.js +252 -252
package/scripts/lib/toml-merge.js +204 -204
package/scripts/lib/transformadores/codex.js +375 -375
package/scripts/lib/transformadores/cursor.js +359 -359
package/scripts/limpiar-artefactos-python.js +131 -131
package/scripts/mcp-orchestrator.py +8 -18
package/scripts/mcp-pool-manager.py +12 -23
package/scripts/mcp-server/README.md +170 -170
package/scripts/mcp-server/auth.js +105 -105
package/scripts/mcp-server/cache.js +106 -106
package/scripts/mcp-server/telemetry.js +78 -78
package/scripts/migrar-csv-a-array.js +168 -168
package/scripts/migrar-fase-dominio.js +201 -201
package/scripts/publicar.js +511 -511
package/scripts/run-eval.js +141 -141
package/scripts/validar-userland-vacio.js +110 -110

package/scripts/lib/expandir-targets.js CHANGED Viewed

@@ -1,71 +1,71 @@
-'use strict';
-/**
- * Expansión de --target (CSV) y --all-runtimes para multi-target install.
- *
- * ADR-0019 Sub-fase 2.5.
- *
- * Extraído de bin/swl-ses.js para permitir tests unitarios. NUNCA debe tener
- * side effects fuera de logging — solo manipula la lista de strings.
- *
- * @module scripts/lib/expandir-targets
- */
-const { listarRuntimesInstalables, RUNTIMES } = require('./detectar-runtime');
-/**
- * Expande las opciones del CLI a un array de target IDs.
- *
- * Reglas:
- *  - `all_runtimes` tiene prioridad sobre `target`. Si ambos vienen, se loggea
- *    aviso (vía `logger.warn`) y se usa `all_runtimes`.
- *  - `target='a,b,c'` → ['a','b','c'].
- *  - `target='claude'` → ['claude'].
- *  - Sin nada → ['claude'] (default histórico, backward-compat).
- *  - Duplicados se deduplican preservando el primer orden.
- *  - Targets desconocidos se omiten con aviso (logger.warn).
- *
- * @param {object} opciones - Objeto con `target` (string|undefined) y `all_runtimes` (bool).
- * @param {object} [logger] - Sustituible para tests. Default console.
- * @returns {{ targets: string[], omitidos: string[], errores: string[] }}
- */
-function expandirTargets(opciones, logger) {
-  const log = logger || console;
-  const omitidos = [];
-  const errores = [];
-  let candidatos;
-  if (opciones.all_runtimes) {
-    if (opciones.target && typeof opciones.target === 'string') {
-      log.warn && log.warn('[expandir-targets] --all-runtimes tiene prioridad sobre --target; se ignora --target.');
-    }
-    candidatos = listarRuntimesInstalables();
-  } else if (typeof opciones.target === 'string' && opciones.target.includes(',')) {
-    candidatos = opciones.target.split(',').map(s => s.trim()).filter(Boolean);
-  } else if (typeof opciones.target === 'string' && opciones.target.length > 0) {
-    candidatos = [opciones.target.trim()];
-  } else {
-    candidatos = ['claude']; // backward-compat
-  }
-  const visto = new Set();
-  const targets = [];
-  for (const t of candidatos) {
-    if (visto.has(t)) continue;
-    visto.add(t);
-    if (!RUNTIMES[t]) {
-      log.warn && log.warn(`[expandir-targets] Target desconocido omitido: "${t}". Disponibles: ${Object.keys(RUNTIMES).join(', ')}`);
-      omitidos.push(t);
-      continue;
-    }
-    targets.push(t);
-  }
-  if (targets.length === 0) {
-    errores.push('Ningún target válido tras expansión.');
-  }
-  return { targets, omitidos, errores };
-}
-module.exports = { expandirTargets };
+'use strict';
+/**
+ * Expansión de --target (CSV) y --all-runtimes para multi-target install.
+ *
+ * ADR-0019 Sub-fase 2.5.
+ *
+ * Extraído de bin/swl-ses.js para permitir tests unitarios. NUNCA debe tener
+ * side effects fuera de logging — solo manipula la lista de strings.
+ *
+ * @module scripts/lib/expandir-targets
+ */
+const { listarRuntimesInstalables, RUNTIMES } = require('./detectar-runtime');
/**
 * Expands the CLI options into a list of target IDs.
 *
 * Rules:
 *  - `all_runtimes` takes priority over `target`. When both are given, a
 *    warning is logged through `logger.warn` and `target` is ignored.
 *  - `target='a,b,c'` → ['a','b','c'] (entries are trimmed, empty ones dropped).
 *  - `target='claude'` → ['claude'].
 *  - Nothing given → ['claude'] (historical default, backward-compat).
 *  - Duplicates are removed, keeping first-seen order.
 *  - Unknown targets are skipped with a warning and reported in `omitidos`.
 *    Only OWN keys of `RUNTIMES` count as known, so inherited names such as
 *    `constructor`, `toString` or `__proto__` are rejected.
 *
 * @param {object} [opciones] - Object with `target` (string|undefined) and
 *   `all_runtimes` (bool). A null/undefined value is treated as `{}`.
 * @param {object} [logger] - Replaceable for tests. Defaults to `console`.
 * @returns {{ targets: string[], omitidos: string[], errores: string[] }}
 *   `errores` holds one message when no valid target is left.
 */
function expandirTargets(opciones, logger) {
  const opts = opciones || {};
  const log = logger || console;
  // The logger may be a minimal stub without `warn`; stay silent in that case.
  const avisar = (mensaje) => {
    if (typeof log.warn === 'function') log.warn(mensaje);
  };
  // Own-key lookup: a plain `RUNTIMES[id]` would also find Object.prototype members.
  const esConocido = (id) =>
    Object.prototype.hasOwnProperty.call(RUNTIMES, id) && Boolean(RUNTIMES[id]);

  const omitidos = [];
  const errores = [];

  let candidatos;
  if (opts.all_runtimes) {
    if (opts.target && typeof opts.target === 'string') {
      avisar('[expandir-targets] --all-runtimes tiene prioridad sobre --target; se ignora --target.');
    }
    candidatos = listarRuntimesInstalables();
  } else if (typeof opts.target === 'string' && opts.target.includes(',')) {
    candidatos = opts.target.split(',').map((s) => s.trim()).filter(Boolean);
  } else if (typeof opts.target === 'string' && opts.target.length > 0) {
    candidatos = [opts.target.trim()];
  } else {
    candidatos = ['claude']; // backward-compat
  }

  const visto = new Set();
  const targets = [];
  for (const t of candidatos) {
    if (visto.has(t)) continue;
    visto.add(t);
    if (!esConocido(t)) {
      avisar(`[expandir-targets] Target desconocido omitido: "${t}". Disponibles: ${Object.keys(RUNTIMES).join(', ')}`);
      omitidos.push(t);
      continue;
    }
    targets.push(t);
  }

  if (targets.length === 0) {
    errores.push('Ningún target válido tras expansión.');
  }
  return { targets, omitidos, errores };
}
+module.exports = { expandirTargets };

package/scripts/lib/jaccard-similarity.js CHANGED Viewed

@@ -1,98 +1,98 @@
-'use strict';
-/**
- * jaccard-similarity.js — Métrica de Jaccard sobre conjuntos de tokens.
- *
- * Patrón adoptado de `temp/agentmemory-main/src/functions/auto-forget.ts`
- * para detectar memorias contradictorias/duplicadas con vocabulario compartido.
- *
- * Jaccard(A, B) = |A ∩ B| / |A ∪ B|
- *
- * Propiedades:
- *   - Rango [0, 1]: 0 = sin overlap, 1 = idénticos.
- *   - Simétrico: J(A, B) = J(B, A).
- *   - Independiente de longitudes absolutas (ambos cortos pueden ser 1.0).
- *
- * Sin dependencias — Node stdlib only. Funciones puras.
- *
- * @module scripts/lib/jaccard-similarity
- */
-// ── constantes ────────────────────────────────────────────────────────────────
-/** Longitud mínima de un token para ser considerado significativo. */
-const MIN_TOKEN_LENGTH = 3;
-/** Stop words en español que se excluyen del análisis. */
-const STOP_WORDS = new Set([
-  'que', 'los', 'las', 'del', 'una', 'por', 'con', 'para', 'como',
-  'sin', 'mas', 'sus', 'lo', 'le', 'la', 'el', 'al', 'no', 'es',
-  'se', 'de', 'en', 'un', 'a', 'y', 'o', 'pero', 'cuando',
-  'donde', 'porque', 'desde', 'hasta', 'sobre', 'bajo', 'entre',
-  'esta', 'este', 'esto', 'esa', 'ese', 'eso', 'tras', 'durante',
-  'mediante', 'segun', 'asi', 'tan', 'ya', 'aun', 'aunque',
-  // English equivalents (frequently mixed in technical text)
-  'the', 'and', 'for', 'with', 'this', 'that', 'have', 'from',
-  'are', 'was', 'will', 'not', 'has', 'had', 'but', 'can',
-]);
-// ── funciones puras ───────────────────────────────────────────────────────────
-/**
- * Convierte un texto en un Set de tokens significativos (lowercase, sin stop
- * words, longitud mínima). Preserva acentos.
- *
- * @param {string} text
- * @returns {Set<string>}
- */
-function tokenize(text) {
-  if (!text || typeof text !== 'string') return new Set();
-  return new Set(
-    String(text)
-      .toLowerCase()
-      .replace(/[`*_~\[\](){}<>#"'\-.,;:!?\/\\]/g, ' ')
-      .split(/\s+/)
-      .filter(t => t.length >= MIN_TOKEN_LENGTH && !STOP_WORDS.has(t)),
-  );
-}
-/**
- * Jaccard similarity entre dos Sets.
- *
- * @param {Set} setA
- * @param {Set} setB
- * @returns {number} en [0, 1]
- */
-function jaccard(setA, setB) {
-  if (!(setA instanceof Set) || !(setB instanceof Set)) return 0;
-  if (setA.size === 0 && setB.size === 0) return 0;
-  if (setA.size === 0 || setB.size === 0) return 0;
-  let intersection = 0;
-  for (const token of setA) {
-    if (setB.has(token)) intersection++;
-  }
-  const union = setA.size + setB.size - intersection;
-  return union === 0 ? 0 : intersection / union;
-}
-/**
- * Conveniencia: jaccard sobre dos textos.
- *
- * @param {string} a
- * @param {string} b
- * @returns {number} en [0, 1]
- */
-function similarity(a, b) {
-  return jaccard(tokenize(a), tokenize(b));
-}
-// ── exports ───────────────────────────────────────────────────────────────────
-module.exports = {
-  tokenize,
-  jaccard,
-  similarity,
-  MIN_TOKEN_LENGTH,
-  STOP_WORDS,
-};
+'use strict';
+/**
+ * jaccard-similarity.js — Métrica de Jaccard sobre conjuntos de tokens.
+ *
+ * Patrón adoptado de `temp/agentmemory-main/src/functions/auto-forget.ts`
+ * para detectar memorias contradictorias/duplicadas con vocabulario compartido.
+ *
+ * Jaccard(A, B) = |A ∩ B| / |A ∪ B|
+ *
+ * Propiedades:
+ *   - Rango [0, 1]: 0 = sin overlap, 1 = idénticos.
+ *   - Simétrico: J(A, B) = J(B, A).
+ *   - Independiente de longitudes absolutas (ambos cortos pueden ser 1.0).
+ *
+ * Sin dependencias — Node stdlib only. Funciones puras.
+ *
+ * @module scripts/lib/jaccard-similarity
+ */
+// ── constantes ────────────────────────────────────────────────────────────────
/** Minimum length a token must have to be considered significant. */
const MIN_TOKEN_LENGTH = 3;
/**
 * Stop words excluded from the analysis (Spanish, plus common English ones).
 *
 * Tokens keep their accents, so words that are normally written with an
 * accent are listed in both spellings; otherwise correctly written text
 * ("según", "más", ...) would never match its unaccented entry.
 */
const STOP_WORDS = new Set([
  'que', 'los', 'las', 'del', 'una', 'por', 'con', 'para', 'como',
  'sin', 'mas', 'sus', 'lo', 'le', 'la', 'el', 'al', 'no', 'es',
  'se', 'de', 'en', 'un', 'a', 'y', 'o', 'pero', 'cuando',
  'donde', 'porque', 'desde', 'hasta', 'sobre', 'bajo', 'entre',
  'esta', 'este', 'esto', 'esa', 'ese', 'eso', 'tras', 'durante',
  'mediante', 'segun', 'asi', 'tan', 'ya', 'aun', 'aunque',
  // Accented spellings of entries above
  'qué', 'cómo', 'más', 'cuándo', 'dónde', 'según', 'así', 'aún',
  // English equivalents (frequently mixed in technical text)
  'the', 'and', 'for', 'with', 'this', 'that', 'have', 'from',
  'are', 'was', 'will', 'not', 'has', 'had', 'but', 'can',
]);
+// ── funciones puras ───────────────────────────────────────────────────────────
/**
 * Converts a text into a Set of significant tokens.
 *
 * The text is lowercased, punctuation/markdown characters are replaced by
 * spaces, the result is split on whitespace, and tokens shorter than
 * `MIN_TOKEN_LENGTH` or present in `STOP_WORDS` are discarded. Accents are
 * preserved. The Spanish opening marks `¿` and `¡` are treated as punctuation
 * so that "¿cómo" and "cómo" yield the same token.
 *
 * @param {string} text
 * @returns {Set<string>} Empty Set for empty or non-string input.
 */
function tokenize(text) {
  if (!text || typeof text !== 'string') return new Set();
  const palabras = text
    .toLowerCase()
    .replace(/[`*_~\[\](){}<>#"'\-.,;:!?¿¡\/\\]/g, ' ')
    .split(/\s+/);
  return new Set(
    palabras.filter((t) => t.length >= MIN_TOKEN_LENGTH && !STOP_WORDS.has(t)),
  );
}
/**
 * Jaccard similarity between two Sets: |A ∩ B| / |A ∪ B|.
 *
 * Returns 0 when either argument is not a Set or when either Set is empty
 * (two empty Sets therefore also score 0, not 1).
 *
 * @param {Set} setA
 * @param {Set} setB
 * @returns {number} Value in [0, 1].
 */
function jaccard(setA, setB) {
  if (!(setA instanceof Set) || !(setB instanceof Set)) return 0;
  if (setA.size === 0 || setB.size === 0) return 0;

  // Walk the smaller Set and probe the larger one; the count is symmetric.
  const [menor, mayor] = setA.size <= setB.size ? [setA, setB] : [setB, setA];
  let intersection = 0;
  for (const token of menor) {
    if (mayor.has(token)) intersection += 1;
  }

  // Both Sets are non-empty here, so the union size is always >= 1.
  return intersection / (setA.size + setB.size - intersection);
}
/**
 * Convenience wrapper: tokenizes both texts and returns their Jaccard score.
 *
 * @param {string} a
 * @param {string} b
 * @returns {number} Value in [0, 1].
 */
function similarity(a, b) {
  const tokensA = tokenize(a);
  const tokensB = tokenize(b);
  return jaccard(tokensA, tokensB);
}
+// ── exports ───────────────────────────────────────────────────────────────────
+module.exports = {
+  tokenize,
+  jaccard,
+  similarity,
+  MIN_TOKEN_LENGTH,
+  STOP_WORDS,
+};

package/scripts/lib/longmemeval-runner.js CHANGED Viewed

@@ -1,125 +1,125 @@
-'use strict';
-/**
- * longmemeval-runner.js — Adapter que ejecuta queries del benchmark contra
- * `hooks/lib/memory-search` y devuelve métricas.
- *
- * Patrón adoptado de `temp/agentmemory-main/benchmark/longmemeval-bench.ts`.
- * Adaptado: en lugar de cargar haystack desde el dataset, usa el estado
- * actual del proyecto SWL (APRENDIZAJES.md, sesiones, instintos).
- *
- * El dataset es un JSONL donde cada línea es:
- * {
- *   "question_id":  "q-001",
- *   "question":     "texto libre de la query",
- *   "gold_ids":     ["apr-N", "ses-YYYY-MM-DD-HHMM"],
- *   "category":     "decision" | "patron" | "anti-patron" | "gotcha" | ...,
- *   "status":       "real" | "placeholder"
- * }
- *
- * @module scripts/lib/longmemeval-runner
- */
-const fs   = require('fs');
-const path = require('path');
-const memorySearch     = require('../../hooks/lib/memory-search');
-const benchmarkMetrics = require('./benchmark-metrics');
-// ── parser de dataset ─────────────────────────────────────────────────────────
-/**
- * Parsea un archivo JSONL del dataset.
- * @param {string} ruta
- * @returns {object[]}
- */
-function leerDataset(ruta) {
-  if (!fs.existsSync(ruta)) {
-    throw new Error(`Dataset no encontrado: ${ruta}`);
-  }
-  const contenido = fs.readFileSync(ruta, 'utf8');
-  const entries = [];
-  let lineNum = 0;
-  for (const linea of contenido.split('\n')) {
-    lineNum++;
-    if (!linea.trim()) continue;
-    if (linea.trim().startsWith('//')) continue; // comentarios
-    try {
-      entries.push(JSON.parse(linea));
-    } catch (err) {
-      throw new Error(`JSONL malformado en línea ${lineNum}: ${err.message}`);
-    }
-  }
-  return entries;
-}
-// ── ejecución de query individual ─────────────────────────────────────────────
-/**
- * Ejecuta una query del benchmark contra memoria SWL y compara con gold.
- *
- * @param {string} baseDir - Raíz del proyecto.
- * @param {object} entry - Una línea del dataset.
- * @param {object} [opts]
- * @param {number} [opts.limit=20] - Top-k a recuperar.
- * @returns {object} Métricas + ids retrieved + entry original.
- */
-function ejecutarEntry(baseDir, entry, opts = {}) {
-  const limit = opts.limit || 20;
-  const inicio = Date.now();
-  const resultados = memorySearch.search(baseDir, entry.question, { limit });
-  const latencyMs = Date.now() - inicio;
-  const retrievedIds = resultados.map(r => r.id);
-  const goldIds = Array.isArray(entry.gold_ids) ? entry.gold_ids : [];
-  const metricas = benchmarkMetrics.calcularMetricas(retrievedIds, goldIds);
-  return {
-    question_id: entry.question_id || 'unknown',
-    question: entry.question,
-    category: entry.category || null,
-    status: entry.status || 'unknown',
-    retrievedIds,
-    goldIds,
-    metricas,
-    latencyMs,
-  };
-}
-/**
- * Ejecuta el dataset completo y devuelve resultados + métricas agregadas.
- *
- * @param {string} baseDir
- * @param {string} datasetPath
- * @param {object} [opts]
- * @returns {{ entries: object[], promedio: object, dataset: object }}
- */
-function ejecutarDataset(baseDir, datasetPath, opts = {}) {
-  const entries = leerDataset(datasetPath);
-  const resultados = entries.map(e => ejecutarEntry(baseDir, e, opts));
-  const promedio = benchmarkMetrics.promediar(resultados.map(r => r.metricas));
-  // Estadísticas del dataset
-  const placeholderCount = entries.filter(e => e.status === 'placeholder').length;
-  const realCount = entries.filter(e => e.status === 'real').length;
-  const datasetMeta = {
-    total: entries.length,
-    real: realCount,
-    placeholder: placeholderCount,
-    significativo: realCount >= 30,
-  };
-  return {
-    entries: resultados,
-    promedio,
-    dataset: datasetMeta,
-  };
-}
-// ── exports ───────────────────────────────────────────────────────────────────
-module.exports = {
-  leerDataset,
-  ejecutarEntry,
-  ejecutarDataset,
-};
+'use strict';
+/**
+ * longmemeval-runner.js — Adapter que ejecuta queries del benchmark contra
+ * `hooks/lib/memory-search` y devuelve métricas.
+ *
+ * Patrón adoptado de `temp/agentmemory-main/benchmark/longmemeval-bench.ts`.
+ * Adaptado: en lugar de cargar haystack desde el dataset, usa el estado
+ * actual del proyecto SWL (APRENDIZAJES.md, sesiones, instintos).
+ *
+ * El dataset es un JSONL donde cada línea es:
+ * {
+ *   "question_id":  "q-001",
+ *   "question":     "texto libre de la query",
+ *   "gold_ids":     ["apr-N", "ses-YYYY-MM-DD-HHMM"],
+ *   "category":     "decision" | "patron" | "anti-patron" | "gotcha" | ...,
+ *   "status":       "real" | "placeholder"
+ * }
+ *
+ * @module scripts/lib/longmemeval-runner
+ */
+const fs   = require('fs');
+const path = require('path');
+const memorySearch     = require('../../hooks/lib/memory-search');
+const benchmarkMetrics = require('./benchmark-metrics');
+// ── parser de dataset ─────────────────────────────────────────────────────────
/**
 * Parses a JSONL dataset file into an array of entries.
 *
 * Blank lines and lines starting with `//` are skipped. Each remaining line
 * is trimmed before parsing, so surrounding whitespace, a trailing `\r`
 * (CRLF files) and a leading UTF-8 BOM do not break `JSON.parse`.
 *
 * @param {string} ruta - Path to the JSONL file.
 * @returns {object[]} Parsed entries, in file order.
 * @throws {Error} When the file does not exist, or when a line is not valid
 *   JSON (the message carries the 1-based line number; the original parse
 *   error is attached as `cause` where the runtime supports it).
 */
function leerDataset(ruta) {
  if (!fs.existsSync(ruta)) {
    throw new Error(`Dataset no encontrado: ${ruta}`);
  }
  const contenido = fs.readFileSync(ruta, 'utf8');
  const entries = [];
  const lineas = contenido.split('\n');
  for (let i = 0; i < lineas.length; i++) {
    // Parse the same trimmed text that the skip checks look at.
    const linea = lineas[i].trim();
    if (!linea) continue;
    if (linea.startsWith('//')) continue; // comment lines
    try {
      entries.push(JSON.parse(linea));
    } catch (err) {
      throw new Error(`JSONL malformado en línea ${i + 1}: ${err.message}`, { cause: err });
    }
  }
  return entries;
}
+// ── ejecución de query individual ─────────────────────────────────────────────
/**
 * Runs one benchmark query through `memorySearch.search` and scores the
 * retrieved ids against the entry's gold ids.
 *
 * @param {string} baseDir - Project root, passed through to the search.
 * @param {object} entry - One dataset line (`question`, `gold_ids`, ...).
 * @param {object} [opts]
 * @param {number} [opts.limit=20] - Top-k to retrieve (a falsy value falls back to 20).
 * @returns {object} `question_id`, `question`, `category`, `status`,
 *   `retrievedIds`, `goldIds`, `metricas` and `latencyMs` (wall-clock
 *   milliseconds spent inside the search call).
 */
function ejecutarEntry(baseDir, entry, opts = {}) {
  const topK = opts.limit || 20;

  // Time only the search call itself.
  const t0 = Date.now();
  const hallazgos = memorySearch.search(baseDir, entry.question, { limit: topK });
  const latencyMs = Date.now() - t0;

  const retrievedIds = hallazgos.map((hallazgo) => hallazgo.id);
  let goldIds = [];
  if (Array.isArray(entry.gold_ids)) {
    goldIds = entry.gold_ids;
  }
  const metricas = benchmarkMetrics.calcularMetricas(retrievedIds, goldIds);

  const questionId = entry.question_id || 'unknown';
  const category = entry.category || null;
  const status = entry.status || 'unknown';
  return {
    question_id: questionId,
    question: entry.question,
    category,
    status,
    retrievedIds,
    goldIds,
    metricas,
    latencyMs,
  };
}
/**
 * Runs every entry of a dataset file and returns the per-entry results plus
 * aggregated metrics and dataset statistics.
 *
 * @param {string} baseDir - Passed through to `ejecutarEntry`.
 * @param {string} datasetPath - JSONL file read with `leerDataset`.
 * @param {object} [opts] - Passed through to `ejecutarEntry`.
 * @returns {{ entries: object[], promedio: object, dataset: object }}
 *   `dataset` holds `total`, `real`, `placeholder` and `significativo`
 *   (true when there are at least 30 entries with status "real").
 */
function ejecutarDataset(baseDir, datasetPath, opts = {}) {
  const entries = leerDataset(datasetPath);

  const resultados = [];
  for (const entry of entries) {
    resultados.push(ejecutarEntry(baseDir, entry, opts));
  }
  const todasLasMetricas = resultados.map((resultado) => resultado.metricas);
  const promedio = benchmarkMetrics.promediar(todasLasMetricas);

  // Dataset statistics
  const contarPorStatus = (estado) =>
    entries.reduce((total, entry) => (entry.status === estado ? total + 1 : total), 0);
  const placeholder = contarPorStatus('placeholder');
  const real = contarPorStatus('real');

  return {
    entries: resultados,
    promedio,
    dataset: {
      total: entries.length,
      real,
      placeholder,
      significativo: real >= 30,
    },
  };
}
+// ── exports ───────────────────────────────────────────────────────────────────
+module.exports = {
+  leerDataset,
+  ejecutarEntry,
+  ejecutarDataset,
+};