@saulwade/swl-ses 1.4.0 → 1.4.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CLAUDE.md +4 -3
- package/README.md +15 -14
- package/agentes/nemesis-auditor-swl.md +161 -0
- package/bin/swl-mcp-server.js +187 -187
- package/comandos/swl/.evolved.json +22 -22
- package/comandos/swl/contribuir.md +233 -233
- package/comandos/swl/nemesis.md +122 -0
- package/comandos/swl/salud.md +34 -0
- package/comandos/swl/verificar.md +45 -0
- package/gateway/lib/event-channel.js +191 -191
- package/habilidades/backend-production-resilience/SKILL.md +288 -288
- package/habilidades/benchmark-memoria/SKILL.md +186 -186
- package/habilidades/diagrama-arquitectura/assets/template.html +276 -276
- package/habilidades/doubt-driven-review/SKILL.md +171 -171
- package/habilidades/doubt-driven-review/recursos/EXAMPLES.md +130 -130
- package/habilidades/eval-framework/SKILL.md +212 -212
- package/habilidades/feynman-auditor-swl/SKILL.md +123 -0
- package/habilidades/feynman-auditor-swl/recursos/preguntas-language-agnostic.md +108 -0
- package/habilidades/harness-claude-code/SKILL.md +299 -299
- package/habilidades/infra-github-actions/SKILL.md +166 -166
- package/habilidades/legacy-code-rescue/SKILL.md +267 -267
- package/habilidades/manejo-errores/.evolved.json +8 -8
- package/habilidades/meta-skills-estandar/recursos/convencion-examples.md +93 -93
- package/habilidades/meta-skills-estandar/recursos/skills-as-agents.md +163 -163
- package/habilidades/patrones-python/SKILL.md +229 -229
- package/habilidades/patrones-python/recursos/patrones-avanzados.md +469 -469
- package/habilidades/planear-fase/SKILL.md +319 -319
- package/habilidades/release-semver/.evolved.json +8 -8
- package/habilidades/state-inconsistency-auditor-swl/SKILL.md +166 -0
- package/habilidades/state-inconsistency-auditor-swl/recursos/coupled-state-patterns.md +147 -0
- package/habilidades/testing-python/SKILL.md +340 -340
- package/habilidades/web-fetcher-routing/SKILL.md +75 -0
- package/hooks/claudemd-bloat-detector.js +161 -161
- package/hooks/lib/agent-routing.js +107 -107
- package/hooks/lib/auto-consolidator.js +335 -335
- package/hooks/lib/error-classifier.js +308 -308
- package/hooks/lib/merkle-audit.js +96 -96
- package/hooks/lib/provenance-tracker.js +191 -191
- package/hooks/lib/rate-limit-tracker.js +253 -253
- package/hooks/lib/resource-quota.js +122 -122
- package/hooks/lib/retry-jitter.js +165 -165
- package/hooks/lib/security-net.js +201 -0
- package/hooks/lib/skill-auditor.js +588 -588
- package/hooks/lib/sync-status.js +228 -228
- package/hooks/lib/taint-tracker.js +107 -107
- package/hooks/lib/text-similarity.js +241 -241
- package/hooks/lib/toon-compressor.js +245 -245
- package/hooks/registro-turnos.js +209 -209
- package/hooks/sugerir-regenerar-inventario.js +170 -170
- package/hooks/validar-formato-post-subagente.js +140 -140
- package/hooks/validar-memoria-hook.js +218 -218
- package/instintos/prompt-appendices.yaml +57 -57
- package/manifiestos/agent-output-schemas.json +57 -57
- package/manifiestos/modulos.json +41 -6
- package/manifiestos/perfiles.json +2 -1
- package/manifiestos/skills-lock.json +30 -9
- package/package.json +2 -2
- package/plantillas/auditor-veto-template.md +105 -105
- package/plantillas/github-workflows/README.md +47 -47
- package/plantillas/github-workflows/release-please.yml +44 -44
- package/plantillas/github-workflows/swl-ci.yml +107 -107
- package/plantillas/github-workflows/swl-security.yml +51 -51
- package/plugin.json +10 -2
- package/reglas/analisis-previo-tareas-grandes.md +172 -172
- package/reglas/arreglar-al-detectar.md +147 -147
- package/reglas/fragmentos-compartidos.md +152 -152
- package/reglas/harness-claude-code.md +213 -213
- package/reglas/usar-context7.md +226 -226
- package/schemas/diary-entry.schema.json +80 -80
- package/scripts/audit-tools/audit-history.js +330 -0
- package/scripts/audit-tools/bundle-tracker.js +290 -0
- package/scripts/audit-tools/canary-monitor.js +352 -0
- package/scripts/audit-tools/code-profiler.js +605 -0
- package/scripts/audit-tools/dep-doctor.js +320 -0
- package/scripts/audit-tools/env-validator.js +206 -0
- package/scripts/audit-tools/lib/fs-walk.js +48 -0
- package/scripts/audit-tools/lib/output.js +23 -0
- package/scripts/audit-tools/migration-checker.js +392 -0
- package/scripts/audit-tools/pentest-scanner.js +1436 -0
- package/scripts/benchmark-memoria.js +167 -167
- package/scripts/configurar-branch-protection.js +418 -418
- package/scripts/detectar-aprendizajes-duplicados.js +151 -151
- package/scripts/field-report.js +199 -199
- package/scripts/generar-checklists-consolidados.js +273 -273
- package/scripts/generar-inventario.js +420 -420
- package/scripts/generar-matriz-lenguajes.js +271 -271
- package/scripts/lib/artefactos-python.js +43 -43
- package/scripts/lib/benchmark-metrics.js +160 -160
- package/scripts/lib/budget-enforcer.js +252 -252
- package/scripts/lib/configurar-ci.js +380 -380
- package/scripts/lib/contadores-inventario.js +217 -217
- package/scripts/lib/detectar-stack-detallado.js +307 -307
- package/scripts/lib/diary-entry.js +234 -234
- package/scripts/lib/eval-metrics-store.js +218 -218
- package/scripts/lib/eval-quality.js +171 -171
- package/scripts/lib/eval-schemas.js +144 -144
- package/scripts/lib/eval-self-correct.js +106 -106
- package/scripts/lib/eval-validator.js +185 -185
- package/scripts/lib/jaccard-similarity.js +98 -98
- package/scripts/lib/longmemeval-runner.js +125 -125
- package/scripts/lib/manifiestos.js +42 -1
- package/scripts/lib/npm-version.js +261 -261
- package/scripts/lib/paquetes-conocidos.js +50 -50
- package/scripts/lib/prompt-builder.js +264 -264
- package/scripts/lib/rrf-fusion.js +175 -175
- package/scripts/lib/scoring-instintos.js +277 -277
- package/scripts/lib/semantic-search.js +252 -252
- package/scripts/limpiar-artefactos-python.js +131 -131
- package/scripts/mcp-server/README.md +128 -128
- package/scripts/mcp-server/handlers.js +206 -206
- package/scripts/migrar-csv-a-array.js +168 -168
- package/scripts/migrar-fase-dominio.js +201 -201
- package/scripts/publicar.js +511 -511
- package/scripts/run-eval.js +141 -141
- package/scripts/validar-manifest.js +231 -195
- package/scripts/validar-userland-vacio.js +110 -110
package/scripts/run-eval.js
CHANGED
|
@@ -1,141 +1,141 @@
|
|
|
1
|
-
#!/usr/bin/env node
|
|
2
|
-
'use strict';
|
|
3
|
-
|
|
4
|
-
/**
|
|
5
|
-
* run-eval.js — CLI para ejecutar evaluaciones del eval framework.
|
|
6
|
-
*
|
|
7
|
-
* Uso:
|
|
8
|
-
* node scripts/run-eval.js <ruta-eval.json>
|
|
9
|
-
*
|
|
10
|
-
* Formato del archivo JSON de eval:
|
|
11
|
-
* {
|
|
12
|
-
* "functionId": "memoria-busqueda::search",
|
|
13
|
-
* "schemaName": "MEMORY_SEARCH_RESULT_SCHEMA", // opcional, valida output
|
|
14
|
-
* "qualityScorer": "scoreObservacion", // opcional, calcula calidad
|
|
15
|
-
* "input": { ... }, // datos de entrada
|
|
16
|
-
* "expectedKeys": ["id", "tipo", "titulo"], // opcional, valida presencia
|
|
17
|
-
* "output": { ... } // output a evaluar
|
|
18
|
-
* }
|
|
19
|
-
*
|
|
20
|
-
* Exit codes:
|
|
21
|
-
* 0 - eval pasa (valid: true)
|
|
22
|
-
* 1 - eval falla (valid: false) o error de I/O
|
|
23
|
-
* 2 - error de uso (argumentos inválidos)
|
|
24
|
-
*/
|
|
25
|
-
|
|
26
|
-
const fs = require('fs');
|
|
27
|
-
const path = require('path');
|
|
28
|
-
|
|
29
|
-
const schemas = require('./lib/eval-schemas');
|
|
30
|
-
const validator = require('./lib/eval-validator');
|
|
31
|
-
const quality = require('./lib/eval-quality');
|
|
32
|
-
const metricsStore = require('./lib/eval-metrics-store');
|
|
33
|
-
|
|
34
|
-
function uso() {
|
|
35
|
-
console.error('Uso: node scripts/run-eval.js <ruta-eval.json>');
|
|
36
|
-
console.error(' node scripts/run-eval.js --rebuild-aggregate');
|
|
37
|
-
process.exit(2);
|
|
38
|
-
}
|
|
39
|
-
|
|
40
|
-
function ejecutarEval(ruta) {
|
|
41
|
-
if (!fs.existsSync(ruta)) {
|
|
42
|
-
console.error(`Archivo no existe: ${ruta}`);
|
|
43
|
-
return 1;
|
|
44
|
-
}
|
|
45
|
-
|
|
46
|
-
let definicion;
|
|
47
|
-
try {
|
|
48
|
-
definicion = JSON.parse(fs.readFileSync(ruta, 'utf8'));
|
|
49
|
-
} catch (err) {
|
|
50
|
-
console.error(`Error parseando ${ruta}: ${err.message}`);
|
|
51
|
-
return 1;
|
|
52
|
-
}
|
|
53
|
-
|
|
54
|
-
const { functionId, schemaName, qualityScorer, output } = definicion;
|
|
55
|
-
if (!functionId || typeof functionId !== 'string') {
|
|
56
|
-
console.error('functionId requerido en el archivo de eval');
|
|
57
|
-
return 1;
|
|
58
|
-
}
|
|
59
|
-
|
|
60
|
-
const inicio = Date.now();
|
|
61
|
-
let valid = true;
|
|
62
|
-
let errors = [];
|
|
63
|
-
let qualityScore = null;
|
|
64
|
-
|
|
65
|
-
// Validar contra schema si se especifica
|
|
66
|
-
if (schemaName) {
|
|
67
|
-
const schema = schemas[schemaName];
|
|
68
|
-
if (!schema) {
|
|
69
|
-
console.error(`Schema desconocido: ${schemaName}. Disponibles: ${Object.keys(schemas).filter(k => k.endsWith('_SCHEMA')).join(', ')}`);
|
|
70
|
-
return 1;
|
|
71
|
-
}
|
|
72
|
-
const r = validator.validar(output, schema);
|
|
73
|
-
valid = valid && r.valid;
|
|
74
|
-
if (!r.valid) errors.push(...r.errors);
|
|
75
|
-
}
|
|
76
|
-
|
|
77
|
-
// Validar campos esperados si se especifican
|
|
78
|
-
if (Array.isArray(definicion.expectedKeys)) {
|
|
79
|
-
for (const key of definicion.expectedKeys) {
|
|
80
|
-
if (!output || !(key in output)) {
|
|
81
|
-
valid = false;
|
|
82
|
-
errors.push(`expectedKey faltante: ${key}`);
|
|
83
|
-
}
|
|
84
|
-
}
|
|
85
|
-
}
|
|
86
|
-
|
|
87
|
-
// Calcular quality score si se especifica
|
|
88
|
-
if (qualityScorer) {
|
|
89
|
-
const scorer = quality[qualityScorer];
|
|
90
|
-
if (typeof scorer !== 'function') {
|
|
91
|
-
console.error(`Quality scorer desconocido: ${qualityScorer}. Disponibles: ${Object.keys(quality).join(', ')}`);
|
|
92
|
-
return 1;
|
|
93
|
-
}
|
|
94
|
-
qualityScore = scorer(output);
|
|
95
|
-
}
|
|
96
|
-
|
|
97
|
-
const latencyMs = Date.now() - inicio;
|
|
98
|
-
const exito = valid;
|
|
99
|
-
|
|
100
|
-
// Persistir resultado
|
|
101
|
-
const baseDir = process.cwd();
|
|
102
|
-
metricsStore.registrar(baseDir, {
|
|
103
|
-
functionId,
|
|
104
|
-
latencyMs,
|
|
105
|
-
success: exito,
|
|
106
|
-
qualityScore,
|
|
107
|
-
metadata: { schemaName, qualityScorer, evalFile: path.basename(ruta) },
|
|
108
|
-
});
|
|
109
|
-
|
|
110
|
-
// Reportar
|
|
111
|
-
console.log(JSON.stringify({
|
|
112
|
-
functionId,
|
|
113
|
-
valid,
|
|
114
|
-
errors: errors.length > 0 ? errors : undefined,
|
|
115
|
-
qualityScore,
|
|
116
|
-
latencyMs,
|
|
117
|
-
}, null, 2));
|
|
118
|
-
|
|
119
|
-
return valid ? 0 : 1;
|
|
120
|
-
}
|
|
121
|
-
|
|
122
|
-
function main() {
|
|
123
|
-
const args = process.argv.slice(2);
|
|
124
|
-
if (args.length === 0) uso();
|
|
125
|
-
|
|
126
|
-
if (args[0] === '--rebuild-aggregate') {
|
|
127
|
-
const r = metricsStore.reconstruirAgregado(process.cwd());
|
|
128
|
-
console.log(`Agregado reconstruido: ${r.rebuilt} eventos, ${r.functions} funciones únicas.`);
|
|
129
|
-
process.exit(0);
|
|
130
|
-
}
|
|
131
|
-
|
|
132
|
-
process.exit(ejecutarEval(args[0]));
|
|
133
|
-
}
|
|
134
|
-
|
|
135
|
-
if (require.main === module) {
|
|
136
|
-
main();
|
|
137
|
-
}
|
|
138
|
-
|
|
139
|
-
module.exports = {
|
|
140
|
-
ejecutarEval,
|
|
141
|
-
};
|
|
1
|
+
#!/usr/bin/env node
|
|
2
|
+
'use strict';
|
|
3
|
+
|
|
4
|
+
/**
|
|
5
|
+
* run-eval.js — CLI para ejecutar evaluaciones del eval framework.
|
|
6
|
+
*
|
|
7
|
+
* Uso:
|
|
8
|
+
* node scripts/run-eval.js <ruta-eval.json>
|
|
9
|
+
*
|
|
10
|
+
* Formato del archivo JSON de eval:
|
|
11
|
+
* {
|
|
12
|
+
* "functionId": "memoria-busqueda::search",
|
|
13
|
+
* "schemaName": "MEMORY_SEARCH_RESULT_SCHEMA", // opcional, valida output
|
|
14
|
+
* "qualityScorer": "scoreObservacion", // opcional, calcula calidad
|
|
15
|
+
* "input": { ... }, // datos de entrada
|
|
16
|
+
* "expectedKeys": ["id", "tipo", "titulo"], // opcional, valida presencia
|
|
17
|
+
* "output": { ... } // output a evaluar
|
|
18
|
+
* }
|
|
19
|
+
*
|
|
20
|
+
* Exit codes:
|
|
21
|
+
* 0 - eval pasa (valid: true)
|
|
22
|
+
* 1 - eval falla (valid: false) o error de I/O
|
|
23
|
+
* 2 - error de uso (argumentos inválidos)
|
|
24
|
+
*/
|
|
25
|
+
|
|
26
|
+
const fs = require('fs');
|
|
27
|
+
const path = require('path');
|
|
28
|
+
|
|
29
|
+
const schemas = require('./lib/eval-schemas');
|
|
30
|
+
const validator = require('./lib/eval-validator');
|
|
31
|
+
const quality = require('./lib/eval-quality');
|
|
32
|
+
const metricsStore = require('./lib/eval-metrics-store');
|
|
33
|
+
|
|
34
|
+
function uso() {
|
|
35
|
+
console.error('Uso: node scripts/run-eval.js <ruta-eval.json>');
|
|
36
|
+
console.error(' node scripts/run-eval.js --rebuild-aggregate');
|
|
37
|
+
process.exit(2);
|
|
38
|
+
}
|
|
39
|
+
|
|
40
|
+
function ejecutarEval(ruta) {
|
|
41
|
+
if (!fs.existsSync(ruta)) {
|
|
42
|
+
console.error(`Archivo no existe: ${ruta}`);
|
|
43
|
+
return 1;
|
|
44
|
+
}
|
|
45
|
+
|
|
46
|
+
let definicion;
|
|
47
|
+
try {
|
|
48
|
+
definicion = JSON.parse(fs.readFileSync(ruta, 'utf8'));
|
|
49
|
+
} catch (err) {
|
|
50
|
+
console.error(`Error parseando ${ruta}: ${err.message}`);
|
|
51
|
+
return 1;
|
|
52
|
+
}
|
|
53
|
+
|
|
54
|
+
const { functionId, schemaName, qualityScorer, output } = definicion;
|
|
55
|
+
if (!functionId || typeof functionId !== 'string') {
|
|
56
|
+
console.error('functionId requerido en el archivo de eval');
|
|
57
|
+
return 1;
|
|
58
|
+
}
|
|
59
|
+
|
|
60
|
+
const inicio = Date.now();
|
|
61
|
+
let valid = true;
|
|
62
|
+
let errors = [];
|
|
63
|
+
let qualityScore = null;
|
|
64
|
+
|
|
65
|
+
// Validar contra schema si se especifica
|
|
66
|
+
if (schemaName) {
|
|
67
|
+
const schema = schemas[schemaName];
|
|
68
|
+
if (!schema) {
|
|
69
|
+
console.error(`Schema desconocido: ${schemaName}. Disponibles: ${Object.keys(schemas).filter(k => k.endsWith('_SCHEMA')).join(', ')}`);
|
|
70
|
+
return 1;
|
|
71
|
+
}
|
|
72
|
+
const r = validator.validar(output, schema);
|
|
73
|
+
valid = valid && r.valid;
|
|
74
|
+
if (!r.valid) errors.push(...r.errors);
|
|
75
|
+
}
|
|
76
|
+
|
|
77
|
+
// Validar campos esperados si se especifican
|
|
78
|
+
if (Array.isArray(definicion.expectedKeys)) {
|
|
79
|
+
for (const key of definicion.expectedKeys) {
|
|
80
|
+
if (!output || !(key in output)) {
|
|
81
|
+
valid = false;
|
|
82
|
+
errors.push(`expectedKey faltante: ${key}`);
|
|
83
|
+
}
|
|
84
|
+
}
|
|
85
|
+
}
|
|
86
|
+
|
|
87
|
+
// Calcular quality score si se especifica
|
|
88
|
+
if (qualityScorer) {
|
|
89
|
+
const scorer = quality[qualityScorer];
|
|
90
|
+
if (typeof scorer !== 'function') {
|
|
91
|
+
console.error(`Quality scorer desconocido: ${qualityScorer}. Disponibles: ${Object.keys(quality).join(', ')}`);
|
|
92
|
+
return 1;
|
|
93
|
+
}
|
|
94
|
+
qualityScore = scorer(output);
|
|
95
|
+
}
|
|
96
|
+
|
|
97
|
+
const latencyMs = Date.now() - inicio;
|
|
98
|
+
const exito = valid;
|
|
99
|
+
|
|
100
|
+
// Persistir resultado
|
|
101
|
+
const baseDir = process.cwd();
|
|
102
|
+
metricsStore.registrar(baseDir, {
|
|
103
|
+
functionId,
|
|
104
|
+
latencyMs,
|
|
105
|
+
success: exito,
|
|
106
|
+
qualityScore,
|
|
107
|
+
metadata: { schemaName, qualityScorer, evalFile: path.basename(ruta) },
|
|
108
|
+
});
|
|
109
|
+
|
|
110
|
+
// Reportar
|
|
111
|
+
console.log(JSON.stringify({
|
|
112
|
+
functionId,
|
|
113
|
+
valid,
|
|
114
|
+
errors: errors.length > 0 ? errors : undefined,
|
|
115
|
+
qualityScore,
|
|
116
|
+
latencyMs,
|
|
117
|
+
}, null, 2));
|
|
118
|
+
|
|
119
|
+
return valid ? 0 : 1;
|
|
120
|
+
}
|
|
121
|
+
|
|
122
|
+
function main() {
|
|
123
|
+
const args = process.argv.slice(2);
|
|
124
|
+
if (args.length === 0) uso();
|
|
125
|
+
|
|
126
|
+
if (args[0] === '--rebuild-aggregate') {
|
|
127
|
+
const r = metricsStore.reconstruirAgregado(process.cwd());
|
|
128
|
+
console.log(`Agregado reconstruido: ${r.rebuilt} eventos, ${r.functions} funciones únicas.`);
|
|
129
|
+
process.exit(0);
|
|
130
|
+
}
|
|
131
|
+
|
|
132
|
+
process.exit(ejecutarEval(args[0]));
|
|
133
|
+
}
|
|
134
|
+
|
|
135
|
+
if (require.main === module) {
|
|
136
|
+
main();
|
|
137
|
+
}
|
|
138
|
+
|
|
139
|
+
module.exports = {
|
|
140
|
+
ejecutarEval,
|
|
141
|
+
};
|