monomind 1.10.57 → 1.11.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (232) hide show
  1. package/.claude/agents/core/coordinator.md +71 -0
  2. package/.claude/agents/generated/case-analyst.md +50 -0
  3. package/.claude/agents/generated/copy-editor.md +45 -0
  4. package/.claude/agents/generated/court-reporter.md +50 -0
  5. package/.claude/agents/generated/defender.md +51 -0
  6. package/.claude/agents/generated/editor-in-chief.md +45 -0
  7. package/.claude/agents/generated/fact-checker.md +45 -0
  8. package/.claude/agents/generated/judge.md +51 -0
  9. package/.claude/agents/generated/prosecutor.md +51 -0
  10. package/.claude/agents/generated/reporter.md +45 -0
  11. package/.claude/commands/hooks/README.md +1 -1
  12. package/.claude/commands/hooks/overview.md +1 -1
  13. package/.claude/commands/mastermind/_repeat.md +1 -1
  14. package/.claude/commands/mastermind/do.md +3 -1
  15. package/.claude/commands/mastermind/help.md +2 -2
  16. package/.claude/commands/mastermind/master.md +39 -6
  17. package/.claude/commands/mastermind/memory.md +1 -1
  18. package/.claude/commands/memory/memory-search.md +2 -2
  19. package/.claude/commands/monitoring/status.md +1 -1
  20. package/.claude/commands/{browse.md → monobrowse.md} +2 -2
  21. package/.claude/commands/sparc.md +1 -1
  22. package/.claude/helpers/handlers/graph-status-handler.cjs +1 -1
  23. package/.claude/helpers/loop-tracker.cjs +1 -1
  24. package/.claude/scheduled_tasks.lock +1 -1
  25. package/.claude/skills/agent-browser-testing/SKILL.md +1 -1
  26. package/.claude/skills/hooks-automation/SKILL.md +0 -3
  27. package/.claude/skills/mastermind/build.md +1 -1
  28. package/.claude/skills/mastermind/code-quality-reviewer-prompt.md +60 -0
  29. package/.claude/skills/mastermind/content.md +1 -1
  30. package/.claude/skills/mastermind/createorg.md +79 -2
  31. package/.claude/skills/mastermind/design.md +3 -1
  32. package/.claude/skills/mastermind/finance.md +1 -1
  33. package/.claude/skills/mastermind/implementer-prompt.md +109 -0
  34. package/.claude/skills/mastermind/marketing.md +1 -1
  35. package/.claude/skills/mastermind/ops.md +1 -1
  36. package/.claude/skills/mastermind/plan.md +20 -2
  37. package/.claude/skills/mastermind/release.md +1 -1
  38. package/.claude/skills/mastermind/research.md +1 -1
  39. package/.claude/skills/mastermind/review.md +1 -1
  40. package/.claude/skills/mastermind/sales.md +1 -1
  41. package/.claude/skills/mastermind/spec-reviewer-prompt.md +63 -0
  42. package/.claude/skills/sparc-methodology/SKILL.md +3 -3
  43. package/.claude/skills/swarm-advanced/SKILL.md +1 -4
  44. package/.claude-plugin/README.md +1 -2
  45. package/.claude-plugin/docs/PLUGIN_SUMMARY.md +0 -1
  46. package/README.md +18 -32
  47. package/package.json +1 -1
  48. package/packages/@monomind/cli/README.md +18 -32
  49. package/packages/@monomind/cli/dist/src/agents/registry-builder.d.ts +1 -7
  50. package/packages/@monomind/cli/dist/src/agents/registry-builder.js +10 -6
  51. package/packages/@monomind/cli/dist/src/benchmarks/benchmark-runner.d.ts +59 -12
  52. package/packages/@monomind/cli/dist/src/benchmarks/benchmark-runner.js +67 -13
  53. package/packages/@monomind/cli/dist/src/benchmarks/pretrain/index.d.ts +0 -13
  54. package/packages/@monomind/cli/dist/src/commands/agent-wasm.d.ts +2 -2
  55. package/packages/@monomind/cli/dist/src/commands/agent-wasm.js +5 -5
  56. package/packages/@monomind/cli/dist/src/commands/agent.js +1 -6
  57. package/packages/@monomind/cli/dist/src/commands/analyze.d.ts +1 -1
  58. package/packages/@monomind/cli/dist/src/commands/analyze.js +8 -18
  59. package/packages/@monomind/cli/dist/src/commands/doctor.js +53 -3
  60. package/packages/@monomind/cli/dist/src/commands/embeddings.js +9 -33
  61. package/packages/@monomind/cli/dist/src/commands/hooks.js +24 -76
  62. package/packages/@monomind/cli/dist/src/commands/index.d.ts +4 -6
  63. package/packages/@monomind/cli/dist/src/commands/index.js +8 -15
  64. package/packages/@monomind/cli/dist/src/commands/init.js +2 -2
  65. package/packages/@monomind/cli/dist/src/commands/issues.js +16 -11
  66. package/packages/@monomind/cli/dist/src/commands/memory.js +6 -6
  67. package/packages/@monomind/cli/dist/src/commands/migrate.js +1 -2
  68. package/packages/@monomind/cli/dist/src/commands/monograph.js +18 -11
  69. package/packages/@monomind/cli/dist/src/commands/monovector/backup.d.ts +11 -0
  70. package/packages/@monomind/cli/dist/src/commands/{ruvector → monovector}/backup.js +25 -25
  71. package/packages/@monomind/cli/dist/src/commands/monovector/benchmark.d.ts +11 -0
  72. package/packages/@monomind/cli/dist/src/commands/{ruvector → monovector}/benchmark.js +14 -14
  73. package/packages/@monomind/cli/dist/src/commands/monovector/import.d.ts +18 -0
  74. package/packages/@monomind/cli/dist/src/commands/{ruvector → monovector}/import.js +21 -21
  75. package/packages/@monomind/cli/dist/src/commands/{ruvector → monovector}/index.d.ts +6 -6
  76. package/packages/@monomind/cli/dist/src/commands/{ruvector → monovector}/index.js +22 -22
  77. package/packages/@monomind/cli/dist/src/commands/monovector/init.d.ts +11 -0
  78. package/packages/@monomind/cli/dist/src/commands/{ruvector → monovector}/init.js +36 -36
  79. package/packages/@monomind/cli/dist/src/commands/monovector/migrate.d.ts +11 -0
  80. package/packages/@monomind/cli/dist/src/commands/{ruvector → monovector}/migrate.js +16 -16
  81. package/packages/@monomind/cli/dist/src/commands/{ruvector → monovector}/optimize.d.ts +2 -2
  82. package/packages/@monomind/cli/dist/src/commands/{ruvector → monovector}/optimize.js +10 -10
  83. package/packages/@monomind/cli/dist/src/commands/monovector/setup.d.ts +18 -0
  84. package/packages/@monomind/cli/dist/src/commands/{ruvector → monovector}/setup.js +77 -77
  85. package/packages/@monomind/cli/dist/src/commands/{ruvector → monovector}/status.d.ts +2 -2
  86. package/packages/@monomind/cli/dist/src/commands/{ruvector → monovector}/status.js +34 -34
  87. package/packages/@monomind/cli/dist/src/commands/neural.d.ts +1 -1
  88. package/packages/@monomind/cli/dist/src/commands/neural.js +31 -608
  89. package/packages/@monomind/cli/dist/src/commands/performance.js +7 -10
  90. package/packages/@monomind/cli/dist/src/commands/plugins.js +3 -4
  91. package/packages/@monomind/cli/dist/src/commands/process.js +5 -12
  92. package/packages/@monomind/cli/dist/src/commands/progress.js +16 -16
  93. package/packages/@monomind/cli/dist/src/commands/route.d.ts +2 -2
  94. package/packages/@monomind/cli/dist/src/commands/route.js +23 -23
  95. package/packages/@monomind/cli/dist/src/commands/status.js +0 -3
  96. package/packages/@monomind/cli/dist/src/commands/swarm.js +2 -3
  97. package/packages/@monomind/cli/dist/src/config-adapter.js +27 -0
  98. package/packages/@monomind/cli/dist/src/consensus/audit-writer.d.ts +44 -17
  99. package/packages/@monomind/cli/dist/src/dlq/dlq-replayer.d.ts +1 -1
  100. package/packages/@monomind/cli/dist/src/index.js +5 -5
  101. package/packages/@monomind/cli/dist/src/init/claudemd-generator.js +10 -14
  102. package/packages/@monomind/cli/dist/src/init/executor.js +17 -27
  103. package/packages/@monomind/cli/dist/src/init/helpers-generator.js +2 -2
  104. package/packages/@monomind/cli/dist/src/init/types.d.ts +1 -1
  105. package/packages/@monomind/cli/dist/src/mcp-client.js +1 -7
  106. package/packages/@monomind/cli/dist/src/mcp-server.js +9 -1
  107. package/packages/@monomind/cli/dist/src/mcp-tools/agent-tools.js +1 -52
  108. package/packages/@monomind/cli/dist/src/mcp-tools/analyze-tools.js +5 -5
  109. package/packages/@monomind/cli/dist/src/mcp-tools/browser-tools.d.ts +1 -1
  110. package/packages/@monomind/cli/dist/src/mcp-tools/browser-tools.js +6 -5
  111. package/packages/@monomind/cli/dist/src/mcp-tools/coordination-tools.d.ts +1 -1
  112. package/packages/@monomind/cli/dist/src/mcp-tools/coordination-tools.js +51 -54
  113. package/packages/@monomind/cli/dist/src/mcp-tools/daa-tools.d.ts +1 -1
  114. package/packages/@monomind/cli/dist/src/mcp-tools/embeddings-tools.js +10 -10
  115. package/packages/@monomind/cli/dist/src/mcp-tools/guidance-tools.js +0 -24
  116. package/packages/@monomind/cli/dist/src/mcp-tools/hooks-tools.js +189 -480
  117. package/packages/@monomind/cli/dist/src/mcp-tools/index.d.ts +0 -2
  118. package/packages/@monomind/cli/dist/src/mcp-tools/index.js +0 -2
  119. package/packages/@monomind/cli/dist/src/mcp-tools/monograph-compat.d.ts +334 -0
  120. package/packages/@monomind/cli/dist/src/mcp-tools/monograph-compat.js +1108 -0
  121. package/packages/@monomind/cli/dist/src/mcp-tools/monograph-tools.js +76 -34
  122. package/packages/@monomind/cli/dist/src/mcp-tools/neural-tools.d.ts +1 -1
  123. package/packages/@monomind/cli/dist/src/mcp-tools/neural-tools.js +2 -2
  124. package/packages/@monomind/cli/dist/src/mcp-tools/ruvllm-tools.d.ts +2 -2
  125. package/packages/@monomind/cli/dist/src/mcp-tools/ruvllm-tools.js +3 -3
  126. package/packages/@monomind/cli/dist/src/mcp-tools/terminal-tools.d.ts +1 -1
  127. package/packages/@monomind/cli/dist/src/mcp-tools/terminal-tools.js +29 -19
  128. package/packages/@monomind/cli/dist/src/mcp-tools/wasm-agent-tools.d.ts +1 -1
  129. package/packages/@monomind/cli/dist/src/mcp-tools/wasm-agent-tools.js +2 -2
  130. package/packages/@monomind/cli/dist/src/memory/intelligence.js +14 -8
  131. package/packages/@monomind/cli/dist/src/memory/memory-bridge.d.ts +17 -2
  132. package/packages/@monomind/cli/dist/src/memory/memory-bridge.js +76 -23
  133. package/packages/@monomind/cli/dist/src/memory/memory-initializer.d.ts +2 -2
  134. package/packages/@monomind/cli/dist/src/memory/memory-initializer.js +37 -39
  135. package/packages/@monomind/cli/dist/src/monovector/capabilities.d.ts +34 -0
  136. package/packages/@monomind/cli/dist/src/monovector/capabilities.js +37 -0
  137. package/packages/@monomind/cli/dist/src/monovector/command-outcomes.d.ts +37 -0
  138. package/packages/@monomind/cli/dist/src/monovector/command-outcomes.js +87 -0
  139. package/packages/@monomind/cli/dist/src/monovector/coverage-router.d.ts +103 -0
  140. package/packages/@monomind/cli/dist/src/monovector/coverage-router.js +337 -0
  141. package/packages/@monomind/cli/dist/src/monovector/coverage-tools.d.ts +14 -0
  142. package/packages/@monomind/cli/dist/src/monovector/coverage-tools.js +112 -0
  143. package/packages/@monomind/cli/dist/src/{ruvector → monovector}/diff-classifier.d.ts +2 -2
  144. package/packages/@monomind/cli/dist/src/monovector/index.d.ts +61 -0
  145. package/packages/@monomind/cli/dist/src/monovector/index.js +67 -0
  146. package/packages/@monomind/cli/dist/src/monovector/init-state.d.ts +35 -0
  147. package/packages/@monomind/cli/dist/src/monovector/init-state.js +36 -0
  148. package/packages/@monomind/cli/dist/src/monovector/route-outcomes.d.ts +55 -0
  149. package/packages/@monomind/cli/dist/src/monovector/route-outcomes.js +137 -0
  150. package/packages/@monomind/cli/dist/src/parser.js +3 -3
  151. package/packages/@monomind/cli/dist/src/plugins/store/discovery.js +0 -31
  152. package/packages/@monomind/cli/dist/src/production/circuit-breaker.d.ts +26 -6
  153. package/packages/@monomind/cli/dist/src/production/error-handler.d.ts +55 -30
  154. package/packages/@monomind/cli/dist/src/production/index.d.ts +3 -20
  155. package/packages/@monomind/cli/dist/src/production/index.js +3 -15
  156. package/packages/@monomind/cli/dist/src/production/monitoring.d.ts +54 -34
  157. package/packages/@monomind/cli/dist/src/production/monitoring.js +12 -14
  158. package/packages/@monomind/cli/dist/src/production/rate-limiter.d.ts +64 -19
  159. package/packages/@monomind/cli/dist/src/production/rate-limiter.js +5 -5
  160. package/packages/@monomind/cli/dist/src/production/retry.js +4 -2
  161. package/packages/@monomind/cli/dist/src/services/claim-service.d.ts +50 -59
  162. package/packages/@monomind/cli/dist/src/services/claim-service.js +83 -50
  163. package/packages/@monomind/cli/dist/src/services/config-file-manager.js +8 -1
  164. package/packages/@monomind/cli/dist/src/services/worker-daemon.js +4 -0
  165. package/packages/@monomind/cli/dist/src/types.d.ts +13 -0
  166. package/packages/@monomind/cli/package.json +13 -13
  167. package/packages/@monomind/guidance/dist/index.d.ts +1 -1
  168. package/packages/@monomind/guidance/dist/index.js +1 -1
  169. package/packages/@monomind/guidance/package.json +1 -2
  170. package/scripts/build-monovector.sh +10 -0
  171. package/scripts/publish-monovector.sh +20 -0
  172. package/.claude/commands/monomind/adr.md +0 -11
  173. package/.claude/commands/monomind/budget.md +0 -7
  174. package/.claude/commands/monomind/createtask.md +0 -277
  175. package/.claude/commands/monomind/do.md +0 -498
  176. package/.claude/commands/monomind/graph-status.md +0 -7
  177. package/.claude/commands/monomind/help.md +0 -118
  178. package/.claude/commands/monomind/idea.md +0 -273
  179. package/.claude/commands/monomind/improve.md +0 -352
  180. package/.claude/commands/monomind/loops.md +0 -7
  181. package/.claude/commands/monomind/memory.md +0 -230
  182. package/.claude/commands/monomind/repeat.md +0 -257
  183. package/.claude/commands/monomind/review.md +0 -317
  184. package/.claude/commands/monomind/specialagents.md +0 -125
  185. package/.claude/commands/monomind/swarm.md +0 -161
  186. package/.claude/commands/monomind/understand.md +0 -139
  187. package/.claude/commands/training/README.md +0 -39
  188. package/.claude/commands/training/neural-patterns.md +0 -73
  189. package/.claude/commands/training/neural-train.md +0 -79
  190. package/packages/@monomind/cli/dist/src/commands/appliance-advanced.d.ts +0 -9
  191. package/packages/@monomind/cli/dist/src/commands/appliance-advanced.js +0 -238
  192. package/packages/@monomind/cli/dist/src/commands/appliance.d.ts +0 -8
  193. package/packages/@monomind/cli/dist/src/commands/appliance.js +0 -406
  194. package/packages/@monomind/cli/dist/src/commands/ruvector/backup.d.ts +0 -11
  195. package/packages/@monomind/cli/dist/src/commands/ruvector/benchmark.d.ts +0 -11
  196. package/packages/@monomind/cli/dist/src/commands/ruvector/import.d.ts +0 -18
  197. package/packages/@monomind/cli/dist/src/commands/ruvector/init.d.ts +0 -11
  198. package/packages/@monomind/cli/dist/src/commands/ruvector/migrate.d.ts +0 -11
  199. package/packages/@monomind/cli/dist/src/commands/ruvector/setup.d.ts +0 -18
  200. package/packages/@monomind/cli/dist/src/ruvector/agent-wasm.d.ts +0 -182
  201. package/packages/@monomind/cli/dist/src/ruvector/agent-wasm.js +0 -316
  202. package/packages/@monomind/cli/dist/src/ruvector/ast-analyzer.d.ts +0 -67
  203. package/packages/@monomind/cli/dist/src/ruvector/ast-analyzer.js +0 -277
  204. package/packages/@monomind/cli/dist/src/ruvector/coverage-router.d.ts +0 -160
  205. package/packages/@monomind/cli/dist/src/ruvector/coverage-router.js +0 -539
  206. package/packages/@monomind/cli/dist/src/ruvector/coverage-tools.d.ts +0 -33
  207. package/packages/@monomind/cli/dist/src/ruvector/coverage-tools.js +0 -157
  208. package/packages/@monomind/cli/dist/src/ruvector/enhanced-model-router.d.ts +0 -146
  209. package/packages/@monomind/cli/dist/src/ruvector/enhanced-model-router.js +0 -551
  210. package/packages/@monomind/cli/dist/src/ruvector/flash-attention.d.ts +0 -195
  211. package/packages/@monomind/cli/dist/src/ruvector/flash-attention.js +0 -643
  212. package/packages/@monomind/cli/dist/src/ruvector/graph-analyzer.d.ts +0 -187
  213. package/packages/@monomind/cli/dist/src/ruvector/graph-analyzer.js +0 -929
  214. package/packages/@monomind/cli/dist/src/ruvector/index.d.ts +0 -67
  215. package/packages/@monomind/cli/dist/src/ruvector/index.js +0 -88
  216. package/packages/@monomind/cli/dist/src/ruvector/lora-adapter.d.ts +0 -218
  217. package/packages/@monomind/cli/dist/src/ruvector/lora-adapter.js +0 -455
  218. package/packages/@monomind/cli/dist/src/ruvector/model-router.d.ts +0 -222
  219. package/packages/@monomind/cli/dist/src/ruvector/model-router.js +0 -512
  220. package/packages/@monomind/cli/dist/src/ruvector/moe-router.d.ts +0 -213
  221. package/packages/@monomind/cli/dist/src/ruvector/moe-router.js +0 -649
  222. package/packages/@monomind/cli/dist/src/ruvector/q-learning-router.d.ts +0 -217
  223. package/packages/@monomind/cli/dist/src/ruvector/q-learning-router.js +0 -712
  224. package/packages/@monomind/cli/dist/src/ruvector/ruvllm-wasm.d.ts +0 -179
  225. package/packages/@monomind/cli/dist/src/ruvector/ruvllm-wasm.js +0 -363
  226. package/packages/@monomind/cli/dist/src/ruvector/semantic-router.d.ts +0 -77
  227. package/packages/@monomind/cli/dist/src/ruvector/semantic-router.js +0 -178
  228. package/packages/@monomind/cli/dist/src/ruvector/vector-db.d.ts +0 -69
  229. package/packages/@monomind/cli/dist/src/ruvector/vector-db.js +0 -243
  230. package/packages/@monomind/cli/dist/src/services/ruvector-training.d.ts +0 -222
  231. package/packages/@monomind/cli/dist/src/services/ruvector-training.js +0 -696
  232. /package/packages/@monomind/cli/dist/src/{ruvector → monovector}/diff-classifier.js +0 -0
@@ -1,649 +0,0 @@
1
- /**
2
- * Mixture of Experts (MoE) Router for Dynamic Agent Routing
3
- *
4
- * Features:
5
- * - 8 expert slots for specialized agent types
6
- * - Gating network for soft expert selection (top-k)
7
- * - Online weight updates via reward signals
8
- * - Load balancing with auxiliary loss
9
- * - Weight persistence to .swarm/moe-weights.json
10
- *
11
- * Architecture:
12
- * - Input: 384-dim task embedding (from ONNX)
13
- * - Hidden: 128-dim layer with ReLU
14
- * - Output: 8-dim softmax weights
15
- *
16
- * @module moe-router
17
- */
18
- import { existsSync, mkdirSync, readFileSync, writeFileSync, renameSync } from 'fs';
19
- import { dirname, join } from 'path';
20
- /**
21
- * Expert names in order (index corresponds to expert slot)
22
- */
23
- export const EXPERT_NAMES = [
24
- 'coder',
25
- 'tester',
26
- 'reviewer',
27
- 'architect',
28
- 'security',
29
- 'performance',
30
- 'researcher',
31
- 'coordinator',
32
- ];
33
- /**
34
- * Number of experts (fixed at 8)
35
- */
36
- export const NUM_EXPERTS = 8;
37
- /**
38
- * Input dimension (384 from ONNX MiniLM-L6-v2)
39
- */
40
- export const INPUT_DIM = 384;
41
- /**
42
- * Hidden layer dimension
43
- */
44
- export const HIDDEN_DIM = 128;
45
- /**
46
- * Default configuration
47
- */
48
- const DEFAULT_CONFIG = {
49
- topK: 2,
50
- learningRate: 0.01,
51
- temperature: 1.0,
52
- loadBalanceCoef: 0.01,
53
- weightsPath: '.swarm/moe-weights.json',
54
- autoSaveInterval: 50,
55
- enableNoise: true,
56
- noiseStd: 0.1,
57
- };
58
- // ============================================================================
59
- // Matrix Operations
60
- // ============================================================================
61
- /**
62
- * Initialize weights using Xavier/Glorot initialization
63
- */
64
- function xavierInit(fanIn, fanOut) {
65
- const std = Math.sqrt(2.0 / (fanIn + fanOut));
66
- const weights = new Float32Array(fanIn * fanOut);
67
- for (let i = 0; i < weights.length; i++) {
68
- // Box-Muller transform for normal distribution
69
- const u1 = Math.random();
70
- const u2 = Math.random();
71
- const z = Math.sqrt(-2 * Math.log(u1 + 1e-8)) * Math.cos(2 * Math.PI * u2);
72
- weights[i] = z * std;
73
- }
74
- return weights;
75
- }
76
- /**
77
- * Matrix-vector multiplication: y = Wx
78
- * W is stored row-major: [rows * cols]
79
- */
80
- function matmul(W, x, rows, cols, out) {
81
- for (let i = 0; i < rows; i++) {
82
- let sum = 0;
83
- const rowOffset = i * cols;
84
- // 4x loop unrolling for SIMD-friendly access
85
- let j = 0;
86
- for (; j + 3 < cols; j += 4) {
87
- sum +=
88
- W[rowOffset + j] * x[j] +
89
- W[rowOffset + j + 1] * x[j + 1] +
90
- W[rowOffset + j + 2] * x[j + 2] +
91
- W[rowOffset + j + 3] * x[j + 3];
92
- }
93
- // Handle remainder
94
- for (; j < cols; j++) {
95
- sum += W[rowOffset + j] * x[j];
96
- }
97
- out[i] = sum;
98
- }
99
- }
100
- /**
101
- * Vector addition: y = x + b
102
- */
103
- function addBias(x, b, out) {
104
- for (let i = 0; i < x.length; i++) {
105
- out[i] = x[i] + b[i];
106
- }
107
- }
108
- /**
109
- * ReLU activation: y = max(0, x)
110
- */
111
- function relu(x, out) {
112
- for (let i = 0; i < x.length; i++) {
113
- out[i] = x[i] > 0 ? x[i] : 0;
114
- }
115
- }
116
- /**
117
- * Softmax with temperature: y_i = exp(x_i/T) / sum(exp(x_j/T))
118
- */
119
- function softmax(x, temperature, out) {
120
- // Find max for numerical stability
121
- let maxVal = x[0];
122
- for (let i = 1; i < x.length; i++) {
123
- if (x[i] > maxVal)
124
- maxVal = x[i];
125
- }
126
- // Compute exp and sum
127
- let sum = 0;
128
- for (let i = 0; i < x.length; i++) {
129
- out[i] = Math.exp((x[i] - maxVal) / temperature);
130
- sum += out[i];
131
- }
132
- // Normalize
133
- const invSum = 1.0 / (sum + 1e-8);
134
- for (let i = 0; i < x.length; i++) {
135
- out[i] *= invSum;
136
- }
137
- }
138
- /**
139
- * Compute entropy of distribution: H = -sum(p * log(p))
140
- */
141
- function entropy(p) {
142
- let h = 0;
143
- for (let i = 0; i < p.length; i++) {
144
- if (p[i] > 1e-8) {
145
- h -= p[i] * Math.log(p[i]);
146
- }
147
- }
148
- return h;
149
- }
150
- /**
151
- * Add Gaussian noise for exploration
152
- */
153
- function addNoise(x, std, out) {
154
- for (let i = 0; i < x.length; i++) {
155
- const u1 = Math.random();
156
- const u2 = Math.random();
157
- const z = Math.sqrt(-2 * Math.log(u1 + 1e-8)) * Math.cos(2 * Math.PI * u2);
158
- out[i] = x[i] + z * std;
159
- }
160
- }
161
- // ============================================================================
162
- // MoE Router Implementation
163
- // ============================================================================
164
- /**
165
- * Mixture of Experts Router
166
- *
167
- * Implements a two-layer gating network:
168
- * - Layer 1: Linear(384, 128) + ReLU
169
- * - Layer 2: Linear(128, 8) + Softmax
170
- *
171
- * Uses top-k expert selection with load balancing.
172
- */
173
- export class MoERouter {
174
- config;
175
- // Network weights (pre-allocated Float32Arrays)
176
- W1; // [HIDDEN_DIM x INPUT_DIM]
177
- b1; // [HIDDEN_DIM]
178
- W2; // [NUM_EXPERTS x HIDDEN_DIM]
179
- b2; // [NUM_EXPERTS]
180
- // Intermediate buffers (pre-allocated, no GC pressure)
181
- hidden; // [HIDDEN_DIM]
182
- hiddenWithBias; // [HIDDEN_DIM]
183
- hiddenActivated; // [HIDDEN_DIM]
184
- logits; // [NUM_EXPERTS]
185
- logitsWithBias; // [NUM_EXPERTS]
186
- noisyLogits; // [NUM_EXPERTS]
187
- probs; // [NUM_EXPERTS]
188
- // Gradient buffers for online learning
189
- gradW2; // [NUM_EXPERTS x HIDDEN_DIM]
190
- gradb2; // [NUM_EXPERTS]
191
- gradW1; // [HIDDEN_DIM x INPUT_DIM]
192
- gradb1; // [HIDDEN_DIM]
193
- gradHidden; // [HIDDEN_DIM]
194
- // Statistics
195
- routingCounts; // [NUM_EXPERTS]
196
- totalRoutings = 0;
197
- updateCount = 0;
198
- avgReward = 0;
199
- // Cache for last input (for gradient computation)
200
- lastInput = null;
201
- lastHiddenActivated = null;
202
- lastProbs = null;
203
- lastSelectedExperts = [];
204
- constructor(config = {}) {
205
- this.config = { ...DEFAULT_CONFIG, ...config };
206
- // Initialize weights
207
- this.W1 = xavierInit(INPUT_DIM, HIDDEN_DIM);
208
- this.b1 = new Float32Array(HIDDEN_DIM);
209
- this.W2 = xavierInit(HIDDEN_DIM, NUM_EXPERTS);
210
- this.b2 = new Float32Array(NUM_EXPERTS);
211
- // Pre-allocate intermediate buffers
212
- this.hidden = new Float32Array(HIDDEN_DIM);
213
- this.hiddenWithBias = new Float32Array(HIDDEN_DIM);
214
- this.hiddenActivated = new Float32Array(HIDDEN_DIM);
215
- this.logits = new Float32Array(NUM_EXPERTS);
216
- this.logitsWithBias = new Float32Array(NUM_EXPERTS);
217
- this.noisyLogits = new Float32Array(NUM_EXPERTS);
218
- this.probs = new Float32Array(NUM_EXPERTS);
219
- // Pre-allocate gradient buffers
220
- this.gradW2 = new Float32Array(NUM_EXPERTS * HIDDEN_DIM);
221
- this.gradb2 = new Float32Array(NUM_EXPERTS);
222
- this.gradW1 = new Float32Array(HIDDEN_DIM * INPUT_DIM);
223
- this.gradb1 = new Float32Array(HIDDEN_DIM);
224
- this.gradHidden = new Float32Array(HIDDEN_DIM);
225
- // Statistics
226
- this.routingCounts = new Float32Array(NUM_EXPERTS);
227
- }
228
- /**
229
- * Initialize router, loading persisted weights if available
230
- */
231
- async initialize() {
232
- await this.loadWeights();
233
- }
234
- /**
235
- * Route task to top-k experts based on embedding
236
- *
237
- * @param taskEmbedding - 384-dim task embedding from ONNX
238
- * @returns Routing result with selected experts and weights
239
- */
240
- route(taskEmbedding) {
241
- // Convert to Float32Array if needed
242
- const input = taskEmbedding instanceof Float32Array
243
- ? taskEmbedding
244
- : new Float32Array(taskEmbedding);
245
- // Validate input dimension
246
- if (input.length !== INPUT_DIM) {
247
- throw new Error(`Expected embedding dimension ${INPUT_DIM}, got ${input.length}`);
248
- }
249
- // Forward pass through gating network
250
- // Layer 1: Linear + ReLU
251
- matmul(this.W1, input, HIDDEN_DIM, INPUT_DIM, this.hidden);
252
- addBias(this.hidden, this.b1, this.hiddenWithBias);
253
- relu(this.hiddenWithBias, this.hiddenActivated);
254
- // Layer 2: Linear
255
- matmul(this.W2, this.hiddenActivated, NUM_EXPERTS, HIDDEN_DIM, this.logits);
256
- addBias(this.logits, this.b2, this.logitsWithBias);
257
- // Add noise for exploration if enabled
258
- if (this.config.enableNoise) {
259
- addNoise(this.logitsWithBias, this.config.noiseStd, this.noisyLogits);
260
- }
261
- else {
262
- this.noisyLogits.set(this.logitsWithBias);
263
- }
264
- // Softmax to get probabilities
265
- softmax(this.noisyLogits, this.config.temperature, this.probs);
266
- // Select top-k experts
267
- const expertIndices = this.selectTopK(this.probs, this.config.topK);
268
- // Compute load balance loss
269
- const loadBalanceLoss = this.computeLoadBalanceLoss();
270
- // Compute entropy
271
- const routingEntropy = entropy(this.probs);
272
- // Update statistics
273
- for (const idx of expertIndices) {
274
- this.routingCounts[idx]++;
275
- }
276
- this.totalRoutings++;
277
- // Cache for gradient computation
278
- this.lastInput = new Float32Array(input);
279
- this.lastHiddenActivated = new Float32Array(this.hiddenActivated);
280
- this.lastProbs = new Float32Array(this.probs);
281
- this.lastSelectedExperts = expertIndices;
282
- // Build result
283
- const totalWeight = expertIndices.reduce((sum, idx) => sum + this.probs[idx], 0);
284
- const experts = expertIndices.map((idx) => ({
285
- name: EXPERT_NAMES[idx],
286
- index: idx,
287
- weight: this.probs[idx] / (totalWeight + 1e-8), // Normalize weights
288
- score: this.probs[idx],
289
- }));
290
- return {
291
- experts,
292
- allScores: Array.from(this.probs),
293
- loadBalanceLoss,
294
- entropy: routingEntropy,
295
- };
296
- }
297
- /**
298
- * Update expert weights based on reward signal
299
- *
300
- * Uses REINFORCE-style gradient update:
301
- * gradient = reward * d_log_prob / d_weights
302
- *
303
- * @param expert - Expert that received the reward
304
- * @param reward - Reward signal (-1 to 1, positive = good)
305
- */
306
- updateExpertWeights(expert, reward) {
307
- const expertIdx = typeof expert === 'number' ? expert : EXPERT_NAMES.indexOf(expert);
308
- if (expertIdx < 0 || expertIdx >= NUM_EXPERTS) {
309
- console.warn(`[MoE] Invalid expert: ${expert}`);
310
- return;
311
- }
312
- if (!this.lastInput || !this.lastHiddenActivated || !this.lastProbs) {
313
- console.warn('[MoE] No cached forward pass for gradient computation');
314
- return;
315
- }
316
- // Clamp reward to [-1, 1]
317
- const clampedReward = Math.max(-1, Math.min(1, reward));
318
- // Compute gradients using REINFORCE
319
- // For softmax: d_log_p_i / d_logit_j = delta_ij - p_j
320
- // gradient = reward * (1 - p_expert) for selected expert
321
- // gradient = reward * (-p_j) for other experts
322
- // Clear gradient buffers
323
- this.gradW2.fill(0);
324
- this.gradb2.fill(0);
325
- this.gradW1.fill(0);
326
- this.gradb1.fill(0);
327
- this.gradHidden.fill(0);
328
- // Gradient w.r.t. logits (before softmax)
329
- for (let i = 0; i < NUM_EXPERTS; i++) {
330
- if (i === expertIdx) {
331
- this.gradb2[i] = clampedReward * (1 - this.lastProbs[i]);
332
- }
333
- else {
334
- this.gradb2[i] = clampedReward * (-this.lastProbs[i]);
335
- }
336
- }
337
- // Gradient w.r.t. W2: outer product of gradb2 and hiddenActivated
338
- for (let i = 0; i < NUM_EXPERTS; i++) {
339
- const rowOffset = i * HIDDEN_DIM;
340
- for (let j = 0; j < HIDDEN_DIM; j++) {
341
- this.gradW2[rowOffset + j] = this.gradb2[i] * this.lastHiddenActivated[j];
342
- }
343
- }
344
- // Backprop through W2 to get gradient w.r.t. hidden
345
- for (let j = 0; j < HIDDEN_DIM; j++) {
346
- let sum = 0;
347
- for (let i = 0; i < NUM_EXPERTS; i++) {
348
- sum += this.gradb2[i] * this.W2[i * HIDDEN_DIM + j];
349
- }
350
- this.gradHidden[j] = sum;
351
- }
352
- // Backprop through ReLU: gradient is 0 where activation was 0
353
- for (let j = 0; j < HIDDEN_DIM; j++) {
354
- if (this.lastHiddenActivated[j] <= 0) {
355
- this.gradHidden[j] = 0;
356
- }
357
- }
358
- // Gradient w.r.t. b1
359
- this.gradb1.set(this.gradHidden);
360
- // Gradient w.r.t. W1: outer product of gradHidden and input
361
- for (let i = 0; i < HIDDEN_DIM; i++) {
362
- const rowOffset = i * INPUT_DIM;
363
- for (let j = 0; j < INPUT_DIM; j++) {
364
- this.gradW1[rowOffset + j] = this.gradHidden[i] * this.lastInput[j];
365
- }
366
- }
367
- // Apply gradients with learning rate
368
- const lr = this.config.learningRate;
369
- for (let i = 0; i < this.W2.length; i++) {
370
- this.W2[i] += lr * this.gradW2[i];
371
- }
372
- for (let i = 0; i < this.b2.length; i++) {
373
- this.b2[i] += lr * this.gradb2[i];
374
- }
375
- for (let i = 0; i < this.W1.length; i++) {
376
- this.W1[i] += lr * this.gradW1[i];
377
- }
378
- for (let i = 0; i < this.b1.length; i++) {
379
- this.b1[i] += lr * this.gradb1[i];
380
- }
381
- // Update statistics
382
- this.updateCount++;
383
- this.avgReward = (this.avgReward * (this.updateCount - 1) + clampedReward) / this.updateCount;
384
- // Auto-save
385
- if (this.config.autoSaveInterval > 0 &&
386
- this.updateCount % this.config.autoSaveInterval === 0) {
387
- this.saveWeights().catch(() => { }); // Fire and forget
388
- }
389
- }
390
- /**
391
- * Get load balance statistics across all experts
392
- */
393
- getLoadBalance() {
394
- const counts = {};
395
- const utilization = {};
396
- const total = this.totalRoutings || 1;
397
- const idealUtilization = 1 / NUM_EXPERTS;
398
- for (let i = 0; i < NUM_EXPERTS; i++) {
399
- const name = EXPERT_NAMES[i];
400
- counts[name] = this.routingCounts[i];
401
- utilization[name] = this.routingCounts[i] / total;
402
- }
403
- // Compute Gini coefficient
404
- const gini = this.computeGiniCoefficient();
405
- // Compute coefficient of variation
406
- const mean = total / NUM_EXPERTS;
407
- let variance = 0;
408
- for (let i = 0; i < NUM_EXPERTS; i++) {
409
- variance += Math.pow(this.routingCounts[i] - mean, 2);
410
- }
411
- variance /= NUM_EXPERTS;
412
- const cv = Math.sqrt(variance) / (mean + 1e-8);
413
- return {
414
- utilization,
415
- totalRoutings: this.totalRoutings,
416
- routingCounts: counts,
417
- giniCoefficient: gini,
418
- coefficientOfVariation: cv,
419
- };
420
- }
421
- /**
422
- * Get router statistics
423
- */
424
- getStats() {
425
- return {
426
- totalRoutings: this.totalRoutings,
427
- updateCount: this.updateCount,
428
- avgReward: this.avgReward,
429
- topK: this.config.topK,
430
- temperature: this.config.temperature,
431
- learningRate: this.config.learningRate,
432
- giniCoefficient: this.computeGiniCoefficient(),
433
- };
434
- }
435
- /**
436
- * Reset all statistics and routing counts
437
- */
438
- resetStats() {
439
- this.routingCounts.fill(0);
440
- this.totalRoutings = 0;
441
- this.updateCount = 0;
442
- this.avgReward = 0;
443
- }
444
- /**
445
- * Load weights from persistence file
446
- */
447
- async loadWeights(path) {
448
- const weightsPath = path ? path : join(process.cwd(), this.config.weightsPath);
449
- try {
450
- if (!existsSync(weightsPath)) {
451
- return false;
452
- }
453
- const data = readFileSync(weightsPath, 'utf-8');
454
- const model = JSON.parse(data);
455
- // Validate version
456
- if (!model.version || !model.version.startsWith('1.')) {
457
- console.warn(`[MoE] Incompatible model version: ${model.version}`);
458
- return false;
459
- }
460
- // Load weights with dimension validation
461
- const w1 = new Float32Array(model.weights.W1.flat());
462
- const b1 = new Float32Array(model.weights.b1);
463
- const w2 = new Float32Array(model.weights.W2.flat());
464
- const b2 = new Float32Array(model.weights.b2);
465
- if (w1.length !== INPUT_DIM * HIDDEN_DIM || b1.length !== HIDDEN_DIM ||
466
- w2.length !== HIDDEN_DIM * NUM_EXPERTS || b2.length !== NUM_EXPERTS) {
467
- console.warn('[MoE] Weight dimensions mismatch — reinitializing');
468
- return false;
469
- }
470
- this.W1 = w1;
471
- this.b1 = b1;
472
- this.W2 = w2;
473
- this.b2 = b2;
474
- // Load stats
475
- this.updateCount = model.stats.updateCount || 0;
476
- this.avgReward = model.stats.avgReward || 0;
477
- this.routingCounts = new Float32Array(model.stats.routingCounts || new Array(NUM_EXPERTS).fill(0));
478
- this.totalRoutings = this.routingCounts.reduce((a, b) => a + b, 0);
479
- return true;
480
- }
481
- catch (err) {
482
- console.warn(`[MoE] Failed to load weights: ${err}`);
483
- return false;
484
- }
485
- }
486
- /**
487
- * Save weights to persistence file
488
- */
489
- async saveWeights(path) {
490
- const weightsPath = path ? path : join(process.cwd(), this.config.weightsPath);
491
- try {
492
- // Ensure directory exists
493
- const dir = dirname(weightsPath);
494
- if (!existsSync(dir)) {
495
- mkdirSync(dir, { recursive: true });
496
- }
497
- // Convert Float32Arrays to nested arrays for JSON
498
- const W1_2d = [];
499
- for (let i = 0; i < HIDDEN_DIM; i++) {
500
- W1_2d.push(Array.from(this.W1.slice(i * INPUT_DIM, (i + 1) * INPUT_DIM)));
501
- }
502
- const W2_2d = [];
503
- for (let i = 0; i < NUM_EXPERTS; i++) {
504
- W2_2d.push(Array.from(this.W2.slice(i * HIDDEN_DIM, (i + 1) * HIDDEN_DIM)));
505
- }
506
- const model = {
507
- version: '1.0.0',
508
- config: {
509
- topK: this.config.topK,
510
- temperature: this.config.temperature,
511
- learningRate: this.config.learningRate,
512
- loadBalanceCoef: this.config.loadBalanceCoef,
513
- },
514
- weights: {
515
- W1: W1_2d,
516
- b1: Array.from(this.b1),
517
- W2: W2_2d,
518
- b2: Array.from(this.b2),
519
- },
520
- stats: {
521
- updateCount: this.updateCount,
522
- routingCounts: Array.from(this.routingCounts),
523
- avgReward: this.avgReward,
524
- },
525
- metadata: {
526
- savedAt: new Date().toISOString(),
527
- expertNames: [...EXPERT_NAMES],
528
- },
529
- };
530
- const tmp = weightsPath + '.tmp';
531
- writeFileSync(tmp, JSON.stringify(model, null, 2));
532
- renameSync(tmp, weightsPath);
533
- return true;
534
- }
535
- catch (err) {
536
- console.warn(`[MoE] Failed to save weights: ${err}`);
537
- return false;
538
- }
539
- }
540
- /**
541
- * Reset weights to random initialization
542
- */
543
- resetWeights() {
544
- this.W1 = xavierInit(INPUT_DIM, HIDDEN_DIM);
545
- this.b1.fill(0);
546
- this.W2 = xavierInit(HIDDEN_DIM, NUM_EXPERTS);
547
- this.b2.fill(0);
548
- this.resetStats();
549
- }
550
- // ============================================================================
551
- // Private Methods
552
- // ============================================================================
553
- /**
554
- * Select top-k indices from probabilities
555
- */
556
- selectTopK(probs, k) {
557
- // Create index-value pairs and sort by value descending
558
- const pairs = [];
559
- for (let i = 0; i < probs.length; i++) {
560
- pairs.push([i, probs[i]]);
561
- }
562
- pairs.sort((a, b) => b[1] - a[1]);
563
- // Return top-k indices
564
- return pairs.slice(0, k).map((p) => p[0]);
565
- }
566
- /**
567
- * Compute load balance loss for regularization
568
- *
569
- * Uses auxiliary loss from Switch Transformer:
570
- * L_balance = N * sum(f_i * P_i)
571
- * where f_i = fraction of tokens routed to expert i
572
- * P_i = average routing probability to expert i
573
- */
574
- computeLoadBalanceLoss() {
575
- if (this.totalRoutings === 0)
576
- return 0;
577
- let loss = 0;
578
- for (let i = 0; i < NUM_EXPERTS; i++) {
579
- const fraction = this.routingCounts[i] / this.totalRoutings;
580
- const avgProb = this.probs[i]; // Current routing prob
581
- loss += fraction * avgProb;
582
- }
583
- return NUM_EXPERTS * loss * this.config.loadBalanceCoef;
584
- }
585
- /**
586
- * Compute Gini coefficient for load distribution
587
- */
588
- computeGiniCoefficient() {
589
- if (this.totalRoutings === 0)
590
- return 0;
591
- // Sort counts
592
- const sorted = Array.from(this.routingCounts).sort((a, b) => a - b);
593
- const n = sorted.length;
594
- const mean = this.totalRoutings / n;
595
- // Compute Gini using the formula: G = (2 * sum(i * x_i) - (n+1) * sum(x_i)) / (n * sum(x_i))
596
- let weightedSum = 0;
597
- for (let i = 0; i < n; i++) {
598
- weightedSum += (i + 1) * sorted[i];
599
- }
600
- const gini = (2 * weightedSum - (n + 1) * this.totalRoutings) /
601
- (n * this.totalRoutings + 1e-8);
602
- return Math.max(0, gini);
603
- }
604
- }
605
- // ============================================================================
606
- // Singleton Instance
607
- // ============================================================================
608
- let moeRouterInstance = null;
609
- let _moeInitPromise = null;
610
- /**
611
- * Get singleton MoE router instance
612
- *
613
- * @param config - Optional configuration (only used on first call)
614
- * @returns MoE router instance
615
- */
616
- export function getMoERouter(config) {
617
- if (!moeRouterInstance) {
618
- moeRouterInstance = new MoERouter(config);
619
- _moeInitPromise = moeRouterInstance.initialize().catch((err) => {
620
- console.warn('[MoE] Failed to initialize router:', err);
621
- });
622
- }
623
- return moeRouterInstance;
624
- }
625
- /**
626
- * Get singleton MoE router instance, waiting for initialization to complete
627
- *
628
- * @param config - Optional configuration (only used on first call)
629
- * @returns Promise resolving to fully initialized MoE router instance
630
- */
631
- export async function getMoERouterReady(config) {
632
- const router = getMoERouter(config);
633
- if (_moeInitPromise)
634
- await _moeInitPromise;
635
- return router;
636
- }
637
- /**
638
- * Reset singleton instance (for testing)
639
- */
640
- export function resetMoERouter() {
641
- moeRouterInstance = null;
642
- }
643
- /**
644
- * Factory function to create new router
645
- */
646
- export function createMoERouter(config) {
647
- return new MoERouter(config);
648
- }
649
- //# sourceMappingURL=moe-router.js.map