@jinn-network/client 0.1.8 → 0.1.9-canary.144d87d2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (397) hide show
  1. package/README.md +6 -0
  2. package/dist/adapters/mech/adapter.d.ts +21 -1
  3. package/dist/adapters/mech/adapter.js +77 -10
  4. package/dist/adapters/mech/adapter.js.map +1 -1
  5. package/dist/adapters/mech/contracts.js +62 -28
  6. package/dist/adapters/mech/contracts.js.map +1 -1
  7. package/dist/adapters/mech/safe-revert.d.ts +4 -0
  8. package/dist/adapters/mech/safe-revert.js +5 -1
  9. package/dist/adapters/mech/safe-revert.js.map +1 -1
  10. package/dist/adapters/mech/safe.js +5 -1
  11. package/dist/adapters/mech/safe.js.map +1 -1
  12. package/dist/adapters/mech/verdict-code.js +1 -1
  13. package/dist/adapters/mech/verdict-code.js.map +1 -1
  14. package/dist/api/bootstrap-endpoint.d.ts +1 -0
  15. package/dist/api/bootstrap-endpoint.js +1 -0
  16. package/dist/api/bootstrap-endpoint.js.map +1 -1
  17. package/dist/api/discovery-endpoint.d.ts +1 -0
  18. package/dist/api/discovery-endpoint.js +24 -0
  19. package/dist/api/discovery-endpoint.js.map +1 -1
  20. package/dist/api/fleet-build.d.ts +1 -7
  21. package/dist/api/fleet-build.js +0 -7
  22. package/dist/api/fleet-build.js.map +1 -1
  23. package/dist/api/gather-status.d.ts +8 -2
  24. package/dist/api/gather-status.js +29 -117
  25. package/dist/api/gather-status.js.map +1 -1
  26. package/dist/api/loop-completion-build.d.ts +79 -0
  27. package/dist/api/loop-completion-build.js +155 -0
  28. package/dist/api/loop-completion-build.js.map +1 -0
  29. package/dist/api/operator-artifacts-endpoint.js +1 -1
  30. package/dist/api/operator-artifacts-endpoint.js.map +1 -1
  31. package/dist/api/peers.js +2 -0
  32. package/dist/api/peers.js.map +1 -1
  33. package/dist/api/setup-endpoints.d.ts +32 -0
  34. package/dist/api/setup-endpoints.js +94 -24
  35. package/dist/api/setup-endpoints.js.map +1 -1
  36. package/dist/api/solvernets-endpoints.js +4 -1
  37. package/dist/api/solvernets-endpoints.js.map +1 -1
  38. package/dist/api/status-build.d.ts +43 -33
  39. package/dist/api/status-build.js +3 -26
  40. package/dist/api/status-build.js.map +1 -1
  41. package/dist/api/status-rollup-build.d.ts +0 -4
  42. package/dist/api/status-rollup-build.js +0 -4
  43. package/dist/api/status-rollup-build.js.map +1 -1
  44. package/dist/api/stop-hook.d.ts +1 -1
  45. package/dist/api/stop-hook.js +1 -1
  46. package/dist/api/stop-hook.js.map +1 -1
  47. package/dist/build-info.json +4 -4
  48. package/dist/build-meta.json +1 -1
  49. package/dist/cli/commands/codedigest-revert-check.js +6 -2
  50. package/dist/cli/commands/codedigest-revert-check.js.map +1 -1
  51. package/dist/cli/commands/doctor.d.ts +3 -0
  52. package/dist/cli/commands/doctor.js +37 -2
  53. package/dist/cli/commands/doctor.js.map +1 -1
  54. package/dist/cli/commands/eval.d.ts +87 -0
  55. package/dist/cli/commands/eval.js +481 -0
  56. package/dist/cli/commands/eval.js.map +1 -0
  57. package/dist/cli/commands/rewards.d.ts +2 -0
  58. package/dist/cli/commands/rewards.js +30 -3
  59. package/dist/cli/commands/rewards.js.map +1 -1
  60. package/dist/cli/commands/solver-nets.js +68 -0
  61. package/dist/cli/commands/solver-nets.js.map +1 -1
  62. package/dist/cli/commands/status.js +0 -1
  63. package/dist/cli/commands/status.js.map +1 -1
  64. package/dist/cli/index.js +2 -0
  65. package/dist/cli/index.js.map +1 -1
  66. package/dist/config.d.ts +102 -15
  67. package/dist/config.js +166 -19
  68. package/dist/config.js.map +1 -1
  69. package/dist/daemon/ai-units-gate.d.ts +6 -6
  70. package/dist/daemon/ai-units-gate.js +11 -10
  71. package/dist/daemon/ai-units-gate.js.map +1 -1
  72. package/dist/daemon/balance-topup-loop.js +3 -0
  73. package/dist/daemon/balance-topup-loop.js.map +1 -1
  74. package/dist/daemon/checkpoint-loop.js +2 -2
  75. package/dist/daemon/creator.d.ts +1 -0
  76. package/dist/daemon/creator.js +26 -14
  77. package/dist/daemon/creator.js.map +1 -1
  78. package/dist/daemon/daemon.d.ts +15 -0
  79. package/dist/daemon/daemon.js +78 -22
  80. package/dist/daemon/daemon.js.map +1 -1
  81. package/dist/daemon/eviction-loop.d.ts +7 -0
  82. package/dist/daemon/eviction-loop.js +19 -3
  83. package/dist/daemon/eviction-loop.js.map +1 -1
  84. package/dist/daemon/jinn-claim-loop.js +3 -0
  85. package/dist/daemon/jinn-claim-loop.js.map +1 -1
  86. package/dist/daemon/join-applier.d.ts +35 -0
  87. package/dist/daemon/join-applier.js +49 -0
  88. package/dist/daemon/join-applier.js.map +1 -0
  89. package/dist/daemon/loop-heartbeat.d.ts +34 -0
  90. package/dist/daemon/loop-heartbeat.js +39 -0
  91. package/dist/daemon/loop-heartbeat.js.map +1 -0
  92. package/dist/daemon/reward-claim-loop.js +4 -1
  93. package/dist/daemon/reward-claim-loop.js.map +1 -1
  94. package/dist/daemon/watchdog-loop.d.ts +84 -0
  95. package/dist/daemon/watchdog-loop.js +91 -0
  96. package/dist/daemon/watchdog-loop.js.map +1 -0
  97. package/dist/dashboard/assets/index-8tAiMbUV.css +1 -0
  98. package/dist/dashboard/assets/index-D6a-DfaM.js +171 -0
  99. package/dist/dashboard/index.html +2 -2
  100. package/dist/discovery/http.d.ts +17 -0
  101. package/dist/discovery/http.js +295 -25
  102. package/dist/discovery/http.js.map +1 -1
  103. package/dist/discovery/onchain.js +155 -1
  104. package/dist/discovery/onchain.js.map +1 -1
  105. package/dist/discovery/types.d.ts +106 -0
  106. package/dist/discovery/types.js +40 -0
  107. package/dist/discovery/types.js.map +1 -1
  108. package/dist/discovery/with-fallback.js +14 -0
  109. package/dist/discovery/with-fallback.js.map +1 -1
  110. package/dist/earning/bootstrap.d.ts +25 -0
  111. package/dist/earning/bootstrap.js +79 -28
  112. package/dist/earning/bootstrap.js.map +1 -1
  113. package/dist/earning/faucet.d.ts +1 -1
  114. package/dist/earning/faucet.js +2 -2
  115. package/dist/earning/faucet.js.map +1 -1
  116. package/dist/earning/safe-adapter.js +11 -0
  117. package/dist/earning/safe-adapter.js.map +1 -1
  118. package/dist/earning/stolas-claim.js +5 -5
  119. package/dist/earning/types.d.ts +1 -1
  120. package/dist/earning/types.js +1 -1
  121. package/dist/earning/types.js.map +1 -1
  122. package/dist/eval/eval-harness-run.d.ts +63 -0
  123. package/dist/eval/eval-harness-run.js +123 -0
  124. package/dist/eval/eval-harness-run.js.map +1 -0
  125. package/dist/eval/orchestrator.d.ts +224 -0
  126. package/dist/eval/orchestrator.js +250 -0
  127. package/dist/eval/orchestrator.js.map +1 -0
  128. package/dist/eval/paired.d.ts +68 -0
  129. package/dist/eval/paired.js +93 -0
  130. package/dist/eval/paired.js.map +1 -0
  131. package/dist/eval/resolve-slate-tasks.d.ts +35 -0
  132. package/dist/eval/resolve-slate-tasks.js +56 -0
  133. package/dist/eval/resolve-slate-tasks.js.map +1 -0
  134. package/dist/eval/screen-discovery.d.ts +22 -0
  135. package/dist/eval/screen-discovery.js +71 -0
  136. package/dist/eval/screen-discovery.js.map +1 -0
  137. package/dist/eval/screen-progress.d.ts +41 -0
  138. package/dist/eval/screen-progress.js +60 -0
  139. package/dist/eval/screen-progress.js.map +1 -0
  140. package/dist/eval/screen-runner.d.ts +30 -0
  141. package/dist/eval/screen-runner.js +289 -0
  142. package/dist/eval/screen-runner.js.map +1 -0
  143. package/dist/eval/screen.d.ts +107 -0
  144. package/dist/eval/screen.js +159 -0
  145. package/dist/eval/screen.js.map +1 -0
  146. package/dist/eval/slope.d.ts +29 -0
  147. package/dist/eval/slope.js +46 -0
  148. package/dist/eval/slope.js.map +1 -0
  149. package/dist/eval/train-sequence.d.ts +35 -0
  150. package/dist/eval/train-sequence.js +59 -0
  151. package/dist/eval/train-sequence.js.map +1 -0
  152. package/dist/eval/wilson.d.ts +45 -0
  153. package/dist/eval/wilson.js +48 -0
  154. package/dist/eval/wilson.js.map +1 -0
  155. package/dist/events/types.d.ts +1 -1
  156. package/dist/events/types.js +1 -1
  157. package/dist/events/types.js.map +1 -1
  158. package/dist/harnesses/engine/canonical-json.js +5 -3
  159. package/dist/harnesses/engine/canonical-json.js.map +1 -1
  160. package/dist/harnesses/engine/engine.d.ts +24 -0
  161. package/dist/harnesses/engine/engine.js +72 -9
  162. package/dist/harnesses/engine/engine.js.map +1 -1
  163. package/dist/harnesses/engine/packaging.js +1 -1
  164. package/dist/harnesses/engine/packaging.js.map +1 -1
  165. package/dist/harnesses/engine/persistence.d.ts +17 -0
  166. package/dist/harnesses/engine/persistence.js +28 -0
  167. package/dist/harnesses/engine/persistence.js.map +1 -1
  168. package/dist/harnesses/impls/claude-mcp-hyperliquid/mcp-tools.d.ts +1 -1
  169. package/dist/harnesses/impls/claude-mcp-hyperliquid/mcp-tools.js +1 -1
  170. package/dist/harnesses/impls/claude-mcp-hyperliquid/mcp-tools.js.map +1 -1
  171. package/dist/harnesses/impls/hermes-agent/adapter.d.ts +2 -0
  172. package/dist/harnesses/impls/hermes-agent/adapter.js +8 -5
  173. package/dist/harnesses/impls/hermes-agent/adapter.js.map +1 -1
  174. package/dist/harnesses/impls/hermes-agent/bootstrap.d.ts +1 -0
  175. package/dist/harnesses/impls/hermes-agent/bootstrap.js +6 -1
  176. package/dist/harnesses/impls/hermes-agent/bootstrap.js.map +1 -1
  177. package/dist/harnesses/impls/hermes-agent/harness.d.ts +17 -3
  178. package/dist/harnesses/impls/hermes-agent/harness.js +68 -5
  179. package/dist/harnesses/impls/hermes-agent/harness.js.map +1 -1
  180. package/dist/harnesses/impls/index.d.ts +2 -0
  181. package/dist/harnesses/impls/index.js +9 -0
  182. package/dist/harnesses/impls/index.js.map +1 -1
  183. package/dist/harnesses/impls/jinn-repo-evaluator/eval-runner.d.ts +34 -0
  184. package/dist/harnesses/impls/jinn-repo-evaluator/eval-runner.js +111 -0
  185. package/dist/harnesses/impls/jinn-repo-evaluator/eval-runner.js.map +1 -0
  186. package/dist/harnesses/impls/jinn-repo-evaluator/evaluator.d.ts +24 -0
  187. package/dist/harnesses/impls/jinn-repo-evaluator/evaluator.js +19 -0
  188. package/dist/harnesses/impls/jinn-repo-evaluator/evaluator.js.map +1 -0
  189. package/dist/harnesses/impls/jinn-repo-evaluator/harness.d.ts +64 -0
  190. package/dist/harnesses/impls/jinn-repo-evaluator/harness.js +125 -0
  191. package/dist/harnesses/impls/jinn-repo-evaluator/harness.js.map +1 -0
  192. package/dist/harnesses/impls/jinn-repo-evaluator/repro.d.ts +32 -0
  193. package/dist/harnesses/impls/jinn-repo-evaluator/repro.js +73 -0
  194. package/dist/harnesses/impls/jinn-repo-evaluator/repro.js.map +1 -0
  195. package/dist/harnesses/impls/learner/adapters/claude-code.js +5 -0
  196. package/dist/harnesses/impls/learner/adapters/claude-code.js.map +1 -1
  197. package/dist/harnesses/impls/learner/harness.d.ts +17 -1
  198. package/dist/harnesses/impls/learner/harness.js +51 -1
  199. package/dist/harnesses/impls/learner/harness.js.map +1 -1
  200. package/dist/harnesses/impls/learner/harvest.d.ts +2 -0
  201. package/dist/harnesses/impls/learner/harvest.js +51 -1
  202. package/dist/harnesses/impls/learner/harvest.js.map +1 -1
  203. package/dist/harnesses/impls/learner/plugin-path.js +1 -0
  204. package/dist/harnesses/impls/learner/plugin-path.js.map +1 -1
  205. package/dist/harnesses/impls/swe-rebench-v2-evaluator/harness.js +3 -1
  206. package/dist/harnesses/impls/swe-rebench-v2-evaluator/harness.js.map +1 -1
  207. package/dist/harnesses/impls/swe-rebench-v2-evaluator/index.d.ts +2 -2
  208. package/dist/harnesses/impls/swe-rebench-v2-evaluator/index.js +3 -1
  209. package/dist/harnesses/impls/swe-rebench-v2-evaluator/index.js.map +1 -1
  210. package/dist/harnesses/readiness-registry.d.ts +10 -0
  211. package/dist/harnesses/readiness-registry.js +13 -0
  212. package/dist/harnesses/readiness-registry.js.map +1 -1
  213. package/dist/harnesses/types.d.ts +14 -0
  214. package/dist/learner/revert-decision.d.ts +16 -1
  215. package/dist/learner/revert-decision.js +38 -18
  216. package/dist/learner/revert-decision.js.map +1 -1
  217. package/dist/learner/revert-stats.d.ts +14 -0
  218. package/dist/learner/revert-stats.js +42 -0
  219. package/dist/learner/revert-stats.js.map +1 -1
  220. package/dist/local-provider-url.d.ts +3 -0
  221. package/dist/local-provider-url.js +28 -0
  222. package/dist/local-provider-url.js.map +1 -0
  223. package/dist/main.js +94 -25
  224. package/dist/main.js.map +1 -1
  225. package/dist/mcp/operator-server.js +1 -1
  226. package/dist/mcp/operator-server.js.map +1 -1
  227. package/dist/mcp/server.js +1 -1
  228. package/dist/mcp/server.js.map +1 -1
  229. package/dist/plugins/learner/.claude-plugin/plugin.json +1 -1
  230. package/dist/plugins/learner/.codex-plugin/plugin.json +1 -1
  231. package/dist/plugins/learner/hooks/session-start +30 -1
  232. package/dist/plugins/learner/skills/learn/consolidator-prompt.md +4 -0
  233. package/dist/preflight/deployment-readiness.d.ts +147 -0
  234. package/dist/preflight/deployment-readiness.js +366 -0
  235. package/dist/preflight/deployment-readiness.js.map +1 -0
  236. package/dist/preflight/pidfile-liveness.d.ts +7 -1
  237. package/dist/preflight/pidfile-liveness.js +14 -0
  238. package/dist/preflight/pidfile-liveness.js.map +1 -1
  239. package/dist/rpc/transport.d.ts +43 -5
  240. package/dist/rpc/transport.js +131 -30
  241. package/dist/rpc/transport.js.map +1 -1
  242. package/dist/scripts/swe-rebench-v2-seed-pool.json +2 -1
  243. package/dist/solver-nets/registry.d.ts +19 -0
  244. package/dist/solver-nets/registry.js +95 -66
  245. package/dist/solver-nets/registry.js.map +1 -1
  246. package/dist/solver-types/_jinn-repo-pool.d.ts +27 -0
  247. package/dist/solver-types/_jinn-repo-pool.js +27 -0
  248. package/dist/solver-types/_jinn-repo-pool.js.map +1 -0
  249. package/dist/solver-types/_swe-rebench-v2-held-out-slate.d.ts +76 -0
  250. package/dist/solver-types/_swe-rebench-v2-held-out-slate.js +156 -0
  251. package/dist/solver-types/_swe-rebench-v2-held-out-slate.js.map +1 -0
  252. package/dist/solver-types/_swe-rebench-v2-pool-recovery.d.ts +81 -0
  253. package/dist/solver-types/_swe-rebench-v2-pool-recovery.js +116 -0
  254. package/dist/solver-types/_swe-rebench-v2-pool-recovery.js.map +1 -0
  255. package/dist/solver-types/_swe-rebench-v2-state.d.ts +9 -0
  256. package/dist/solver-types/_swe-rebench-v2-state.js +14 -0
  257. package/dist/solver-types/_swe-rebench-v2-state.js.map +1 -1
  258. package/dist/solver-types/_swe-rebench-v2-validated-pool.d.ts +30 -0
  259. package/dist/solver-types/_swe-rebench-v2-validated-pool.js +40 -0
  260. package/dist/solver-types/_swe-rebench-v2-validated-pool.js.map +1 -1
  261. package/dist/solver-types/index.js +2 -0
  262. package/dist/solver-types/index.js.map +1 -1
  263. package/dist/solver-types/jinn-repo-admit.d.ts +17 -0
  264. package/dist/solver-types/jinn-repo-admit.js +16 -0
  265. package/dist/solver-types/jinn-repo-admit.js.map +1 -0
  266. package/dist/solver-types/jinn-repo-auto.d.ts +60 -0
  267. package/dist/solver-types/jinn-repo-auto.js +163 -0
  268. package/dist/solver-types/jinn-repo-auto.js.map +1 -0
  269. package/dist/solver-types/jinn-repo-definition.d.ts +15 -0
  270. package/dist/solver-types/jinn-repo-definition.js +34 -0
  271. package/dist/solver-types/jinn-repo-definition.js.map +1 -0
  272. package/dist/solver-types/jinn-repo-extract.d.ts +16 -0
  273. package/dist/solver-types/jinn-repo-extract.js +32 -0
  274. package/dist/solver-types/jinn-repo-extract.js.map +1 -0
  275. package/dist/solver-types/jinn-repo.d.ts +21 -0
  276. package/dist/solver-types/jinn-repo.js +23 -0
  277. package/dist/solver-types/jinn-repo.js.map +1 -0
  278. package/dist/solver-types/learner-loop-test.js +1 -1
  279. package/dist/solver-types/learner-loop-test.js.map +1 -1
  280. package/dist/solver-types/slates/held-out-slate.swe-rebench-v2.v1.json +20 -0
  281. package/dist/solver-types/slates/held-out-slate.swe-rebench-v2.v2.json +19 -0
  282. package/dist/solver-types/slates/held-out-slate.swe-rebench-v2.v2.screening-report.json +628 -0
  283. package/dist/solver-types/solver-type.d.ts +8 -0
  284. package/dist/solver-types/swe-rebench-v2.d.ts +2 -0
  285. package/dist/solver-types/swe-rebench-v2.js +115 -10
  286. package/dist/solver-types/swe-rebench-v2.js.map +1 -1
  287. package/dist/solvernets/launched-record-dispatcher.d.ts +5 -0
  288. package/dist/solvernets/launched-record-dispatcher.js +8 -1
  289. package/dist/solvernets/launched-record-dispatcher.js.map +1 -1
  290. package/dist/solvernets/registry-client-erc8004.js +29 -37
  291. package/dist/solvernets/registry-client-erc8004.js.map +1 -1
  292. package/dist/solvernets/registry-client.d.ts +6 -0
  293. package/dist/solvernets/store.d.ts +1 -1
  294. package/dist/solvernets/store.js +8 -3
  295. package/dist/solvernets/store.js.map +1 -1
  296. package/dist/spend/ai-units-config.d.ts +10 -0
  297. package/dist/spend/ai-units-config.js +7 -1
  298. package/dist/spend/ai-units-config.js.map +1 -1
  299. package/dist/spend/ai-units.d.ts +51 -0
  300. package/dist/spend/ai-units.js +73 -0
  301. package/dist/spend/ai-units.js.map +1 -1
  302. package/dist/spend/record.js +12 -5
  303. package/dist/spend/record.js.map +1 -1
  304. package/dist/store/store.d.ts +91 -5
  305. package/dist/store/store.js +170 -7
  306. package/dist/store/store.js.map +1 -1
  307. package/dist/trajectory/harness-bundle-schema.d.ts +1 -1
  308. package/dist/trajectory/harness-bundle-schema.js +1 -1
  309. package/dist/trajectory/harness-bundle-schema.js.map +1 -1
  310. package/dist/trajectory/schema.d.ts +1 -1
  311. package/dist/trajectory/schema.js +1 -1
  312. package/dist/trajectory/schema.js.map +1 -1
  313. package/dist/trajectory/transcript-parsers/types.d.ts +1 -1
  314. package/dist/trajectory/transcript-parsers/types.js +1 -1
  315. package/dist/trajectory/transcript-parsers/types.js.map +1 -1
  316. package/dist/types/envelope.d.ts +1 -1
  317. package/dist/types/envelope.js +1 -1
  318. package/dist/types/envelope.js.map +1 -1
  319. package/dist/types/payloads/index.d.ts +1 -1
  320. package/dist/types/payloads/index.js +7 -1
  321. package/dist/types/payloads/index.js.map +1 -1
  322. package/dist/types/payloads/portfolio-v0.d.ts +1 -1
  323. package/dist/types/payloads/portfolio-v0.js +1 -1
  324. package/dist/types/payloads/portfolio-v0.js.map +1 -1
  325. package/dist/types/payloads/prediction-apy-v0.d.ts +1 -1
  326. package/dist/types/payloads/prediction-apy-v0.js +1 -1
  327. package/dist/types/payloads/prediction-apy-v0.js.map +1 -1
  328. package/dist/types/payloads/prediction-v0.d.ts +1 -1
  329. package/dist/types/payloads/prediction-v0.js +1 -1
  330. package/dist/types/payloads/prediction-v0.js.map +1 -1
  331. package/dist/types/portfolio.d.ts +1 -1
  332. package/dist/types/portfolio.js +1 -1
  333. package/dist/types/portfolio.js.map +1 -1
  334. package/dist/types/prediction-apy.d.ts +1 -1
  335. package/dist/types/prediction-apy.js +1 -1
  336. package/dist/types/prediction-apy.js.map +1 -1
  337. package/dist/types/prediction.d.ts +1 -1
  338. package/dist/types/prediction.js +1 -1
  339. package/dist/types/prediction.js.map +1 -1
  340. package/dist/types/session-provenance.d.ts +1 -1
  341. package/dist/types/session-provenance.js +1 -1
  342. package/dist/types/session-provenance.js.map +1 -1
  343. package/dist/types/task-document.d.ts +1 -1
  344. package/dist/types/task-document.js +1 -1
  345. package/dist/types/task-document.js.map +1 -1
  346. package/dist/types/task.d.ts +1 -1
  347. package/dist/types/task.js +1 -1
  348. package/dist/types/task.js.map +1 -1
  349. package/dist/types/window.d.ts +1 -1
  350. package/dist/types/window.js +1 -1
  351. package/dist/types/window.js.map +1 -1
  352. package/dist/vendor/@jinn-network/sdk/dist/checkpoint.d.ts +1 -1
  353. package/dist/vendor/@jinn-network/sdk/dist/checkpoint.js +1 -1
  354. package/dist/vendor/@jinn-network/sdk/dist/contracts.d.ts +3 -2
  355. package/dist/vendor/@jinn-network/sdk/dist/contracts.js +49 -0
  356. package/dist/vendor/@jinn-network/sdk/dist/jinn-repo.d.ts +44 -0
  357. package/dist/vendor/@jinn-network/sdk/dist/jinn-repo.js +25 -0
  358. package/dist/vendor/@jinn-network/sdk/dist/json-schema.d.ts +1 -1
  359. package/dist/vendor/@jinn-network/sdk/dist/json-schema.js +1 -1
  360. package/dist/vendor/@jinn-network/sdk/dist/payloads/jinn-repo.d.ts +38 -0
  361. package/dist/vendor/@jinn-network/sdk/dist/payloads/jinn-repo.js +22 -0
  362. package/dist/vendor/@jinn-network/sdk/dist/payloads/prediction-v1.d.ts +1 -1
  363. package/dist/vendor/@jinn-network/sdk/dist/payloads/prediction-v1.js +1 -1
  364. package/dist/vendor/@jinn-network/sdk/dist/payloads/session-derived.d.ts +1 -1
  365. package/dist/vendor/@jinn-network/sdk/dist/payloads/session-derived.js +1 -1
  366. package/dist/vendor/@jinn-network/sdk/dist/payloads/swe-rebench-v2.d.ts +109 -2
  367. package/dist/vendor/@jinn-network/sdk/dist/payloads/swe-rebench-v2.js +26 -2
  368. package/dist/vendor/@jinn-network/sdk/dist/prediction-v1.d.ts +1 -1
  369. package/dist/vendor/@jinn-network/sdk/dist/prediction-v1.js +1 -1
  370. package/dist/vendor/@jinn-network/sdk/dist/solvernets/jinn-repo.d.ts +4 -0
  371. package/dist/vendor/@jinn-network/sdk/dist/solvernets/jinn-repo.js +2 -0
  372. package/dist/vendor/@jinn-network/sdk/dist/solvernets/manifest-schema.d.ts +1 -1
  373. package/dist/vendor/@jinn-network/sdk/dist/solvernets/manifest-schema.js +1 -1
  374. package/dist/vendor/@jinn-network/sdk/dist/solvernets/swe-rebench-v2-held-out-slate.d.ts +65 -0
  375. package/dist/vendor/@jinn-network/sdk/dist/solvernets/swe-rebench-v2-held-out-slate.js +123 -0
  376. package/dist/vendor/@jinn-network/sdk/dist/solvernets/swe-rebench-v2.d.ts +2 -2
  377. package/dist/vendor/@jinn-network/sdk/dist/solvernets/swe-rebench-v2.js +1 -1
  378. package/dist/vendor/@jinn-network/sdk/dist/swe-rebench-v2.d.ts +1 -1
  379. package/dist/vendor/@jinn-network/sdk/dist/swe-rebench-v2.js +1 -1
  380. package/dist/vendor/@jinn-network/sdk/package.json +9 -1
  381. package/docker-compose.yml +3 -2
  382. package/package.json +23 -20
  383. package/plugins/jinn-repo-runtime/.claude-plugin/plugin.json +5 -0
  384. package/plugins/jinn-repo-runtime/.codex-plugin/plugin.json +39 -0
  385. package/plugins/jinn-repo-runtime/README.md +27 -0
  386. package/plugins/jinn-repo-runtime/hooks/hooks.json +16 -0
  387. package/plugins/jinn-repo-runtime/hooks/session-start +73 -0
  388. package/plugins/jinn-repo-runtime/jinn.plugin.json +11 -0
  389. package/plugins/jinn-repo-runtime/skills/task/SKILL.md +92 -0
  390. package/plugins/learner/.claude-plugin/plugin.json +1 -1
  391. package/plugins/learner/.codex-plugin/plugin.json +1 -1
  392. package/plugins/learner/hooks/session-start +30 -1
  393. package/plugins/learner/skills/learn/consolidator-prompt.md +4 -0
  394. package/plugins/swe-rebench-v2-runtime/hooks/hooks.json +16 -0
  395. package/plugins/swe-rebench-v2-runtime/hooks/session-start +74 -0
  396. package/dist/dashboard/assets/index-CzKxvMcU.css +0 -32
  397. package/dist/dashboard/assets/index-yVemxHot.js +0 -351
@@ -0,0 +1,19 @@
1
+ {
2
+ "comment": "BASELINE-FAILURE REGRESSION BENCHMARK (issue #986). Screened: gradeable at the current evalSemanticsVersion AND base claude-code/Haiku frozen fails 0/R (R≥3) AND a stronger Codex/GPT-5.5 prover passes ≥1 (proven headroom). Baseline 0% by construction. Held out from the generator train stream via the active-slate-version union. Content-addressed; scores comparable WITHIN this version only.",
3
+ "schemaVersion": "held-out-slate.v1",
4
+ "solverType": "swe-rebench-v2.v1",
5
+ "version": "v2",
6
+ "generatedAt": "2026-06-04T23:03:42.179Z",
7
+ "instanceIds": [
8
+ "agronholm__anyio-1134",
9
+ "astropy__astropy-19438",
10
+ "con__nwb2bids-347_interface",
11
+ "deepset-ai__haystack-9322",
12
+ "gidgethub__gidgethub-225",
13
+ "iris-hep__func_adl-199",
14
+ "MatterMiners__tardis-361",
15
+ "modelcontextprotocol__python-sdk-222",
16
+ "twisted__towncrier-687"
17
+ ],
18
+ "hash": "sha256:34bb8bfa5e85933e38706551d4afaec3adf4a6ad1c1c0e4d2132f2c47d43d039"
19
+ }
@@ -0,0 +1,628 @@
1
+ {
2
+ "generatedAt": "2026-06-04T23:03:42.179Z",
3
+ "evalSemanticsVersion": "4",
4
+ "baseCodeDigest": "sha256:e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
5
+ "R": 3,
6
+ "proverHarness": "claude-code",
7
+ "proverModel": "opus",
8
+ "heldOutTotal": 9,
9
+ "newThisRun": [
10
+ "deepset-ai__haystack-9322",
11
+ "gidgethub__gidgethub-225",
12
+ "iris-hep__func_adl-199",
13
+ "MatterMiners__tardis-361",
14
+ "modelcontextprotocol__python-sdk-222",
15
+ "twisted__towncrier-687",
16
+ "agronholm__anyio-1134"
17
+ ],
18
+ "carriedOver": [
19
+ "astropy__astropy-19438",
20
+ "con__nwb2bids-347_interface"
21
+ ],
22
+ "screened": [
23
+ {
24
+ "instance_id": "aallan__vera-662_interface",
25
+ "repo": "aallan",
26
+ "basePasses": 1,
27
+ "proverPassed": null,
28
+ "baseRuns": 1,
29
+ "gradeable": true,
30
+ "heldOut": false,
31
+ "reason": "base-passes"
32
+ },
33
+ {
34
+ "instance_id": "agentscope-ai__qwenpaw-3278",
35
+ "repo": "agentscope-ai",
36
+ "basePasses": 0,
37
+ "proverPassed": null,
38
+ "baseRuns": 1,
39
+ "gradeable": true,
40
+ "heldOut": false,
41
+ "reason": "base-unscorable",
42
+ "unscorableReason": "grade-error: swe-rebench-v2 eval could not grade the solution (patch_does_not_apply)"
43
+ },
44
+ {
45
+ "instance_id": "agronholm__anyio-1121",
46
+ "repo": "agronholm",
47
+ "basePasses": 1,
48
+ "proverPassed": null,
49
+ "baseRuns": 1,
50
+ "gradeable": true,
51
+ "heldOut": false,
52
+ "reason": "base-passes"
53
+ },
54
+ {
55
+ "instance_id": "apache__iceberg-python-3295",
56
+ "repo": "apache",
57
+ "basePasses": 1,
58
+ "proverPassed": null,
59
+ "baseRuns": 1,
60
+ "gradeable": true,
61
+ "heldOut": false,
62
+ "reason": "base-passes"
63
+ },
64
+ {
65
+ "instance_id": "astronomy-commons__hats-648",
66
+ "repo": "astronomy-commons",
67
+ "basePasses": 0,
68
+ "proverPassed": null,
69
+ "baseRuns": 2,
70
+ "gradeable": true,
71
+ "heldOut": false,
72
+ "reason": "base-unscorable",
73
+ "unscorableReason": "grade-error: swe-rebench-v2 eval could not grade the solution (patch_merge_conflict)"
74
+ },
75
+ {
76
+ "instance_id": "beever-ai__beever-atlas-102",
77
+ "repo": "beever-ai",
78
+ "basePasses": 1,
79
+ "proverPassed": null,
80
+ "baseRuns": 1,
81
+ "gradeable": true,
82
+ "heldOut": false,
83
+ "reason": "base-passes"
84
+ },
85
+ {
86
+ "instance_id": "cea-hpc__clustershell-592",
87
+ "repo": "cea-hpc",
88
+ "basePasses": 1,
89
+ "proverPassed": null,
90
+ "baseRuns": 1,
91
+ "gradeable": true,
92
+ "heldOut": false,
93
+ "reason": "base-passes"
94
+ },
95
+ {
96
+ "instance_id": "cneud__alto-tools-29",
97
+ "repo": "cneud",
98
+ "basePasses": 1,
99
+ "proverPassed": null,
100
+ "baseRuns": 1,
101
+ "gradeable": true,
102
+ "heldOut": false,
103
+ "reason": "base-passes"
104
+ },
105
+ {
106
+ "instance_id": "copier-org__copier-2646",
107
+ "repo": "copier-org",
108
+ "basePasses": 0,
109
+ "proverPassed": null,
110
+ "baseRuns": 1,
111
+ "gradeable": true,
112
+ "heldOut": false,
113
+ "reason": "base-unscorable",
114
+ "unscorableReason": "grade-error: swe-rebench-v2 eval could not grade the solution (patch_does_not_apply)"
115
+ },
116
+ {
117
+ "instance_id": "cpp-linter__cpp-linter-hooks-206_interface",
118
+ "repo": "cpp-linter",
119
+ "basePasses": 1,
120
+ "proverPassed": null,
121
+ "baseRuns": 1,
122
+ "gradeable": true,
123
+ "heldOut": false,
124
+ "reason": "base-passes"
125
+ },
126
+ {
127
+ "instance_id": "cs-si__eodag-2176",
128
+ "repo": "cs-si",
129
+ "basePasses": 0,
130
+ "proverPassed": false,
131
+ "baseRuns": 3,
132
+ "gradeable": true,
133
+ "heldOut": false,
134
+ "reason": "no-headroom"
135
+ },
136
+ {
137
+ "instance_id": "CWorthy-ocean__C-Star-227",
138
+ "repo": "CWorthy-ocean",
139
+ "basePasses": 0,
140
+ "proverPassed": false,
141
+ "baseRuns": 3,
142
+ "gradeable": true,
143
+ "heldOut": false,
144
+ "reason": "no-headroom"
145
+ },
146
+ {
147
+ "instance_id": "dagster-io__dagster-33605",
148
+ "repo": "dagster-io",
149
+ "basePasses": 1,
150
+ "proverPassed": null,
151
+ "baseRuns": 1,
152
+ "gradeable": true,
153
+ "heldOut": false,
154
+ "reason": "base-passes"
155
+ },
156
+ {
157
+ "instance_id": "databricks__dbt-databricks-1131",
158
+ "repo": "databricks",
159
+ "basePasses": 1,
160
+ "proverPassed": null,
161
+ "baseRuns": 1,
162
+ "gradeable": true,
163
+ "heldOut": false,
164
+ "reason": "base-passes"
165
+ },
166
+ {
167
+ "instance_id": "deepset-ai__haystack-9322",
168
+ "repo": "deepset-ai",
169
+ "basePasses": 0,
170
+ "proverPassed": true,
171
+ "baseRuns": 3,
172
+ "gradeable": true,
173
+ "heldOut": true,
174
+ "reason": "held-out"
175
+ },
176
+ {
177
+ "instance_id": "ets-labs__python-dependency-injector-886",
178
+ "repo": "ets-labs",
179
+ "basePasses": 1,
180
+ "proverPassed": null,
181
+ "baseRuns": 1,
182
+ "gradeable": true,
183
+ "heldOut": false,
184
+ "reason": "base-passes"
185
+ },
186
+ {
187
+ "instance_id": "facelessuser__pymdown-extensions-2651",
188
+ "repo": "facelessuser",
189
+ "basePasses": 1,
190
+ "proverPassed": null,
191
+ "baseRuns": 1,
192
+ "gradeable": true,
193
+ "heldOut": false,
194
+ "reason": "base-passes"
195
+ },
196
+ {
197
+ "instance_id": "fsspec__universal_pathlib-395",
198
+ "repo": "fsspec",
199
+ "basePasses": 0,
200
+ "proverPassed": false,
201
+ "baseRuns": 3,
202
+ "gradeable": true,
203
+ "heldOut": false,
204
+ "reason": "no-headroom"
205
+ },
206
+ {
207
+ "instance_id": "gidgethub__gidgethub-225",
208
+ "repo": "gidgethub",
209
+ "basePasses": 0,
210
+ "proverPassed": true,
211
+ "baseRuns": 3,
212
+ "gradeable": true,
213
+ "heldOut": true,
214
+ "reason": "held-out"
215
+ },
216
+ {
217
+ "instance_id": "googleapis__python-api-core-821",
218
+ "repo": "googleapis",
219
+ "basePasses": 1,
220
+ "proverPassed": null,
221
+ "baseRuns": 1,
222
+ "gradeable": true,
223
+ "heldOut": false,
224
+ "reason": "base-passes"
225
+ },
226
+ {
227
+ "instance_id": "hgrecco__pint-pandas-287",
228
+ "repo": "hgrecco",
229
+ "basePasses": 0,
230
+ "proverPassed": null,
231
+ "baseRuns": 1,
232
+ "gradeable": true,
233
+ "heldOut": false,
234
+ "reason": "base-unscorable",
235
+ "unscorableReason": "grade-error: swe-rebench-v2 eval could not grade the solution (patch_merge_conflict)"
236
+ },
237
+ {
238
+ "instance_id": "hiero-ledger__hiero-sdk-python-1914_interface",
239
+ "repo": "hiero-ledger",
240
+ "basePasses": 1,
241
+ "proverPassed": null,
242
+ "baseRuns": 1,
243
+ "gradeable": true,
244
+ "heldOut": false,
245
+ "reason": "base-passes"
246
+ },
247
+ {
248
+ "instance_id": "icloud-photos-downloader__icloud_photos_downloader-1060",
249
+ "repo": "icloud-photos-downloader",
250
+ "basePasses": 1,
251
+ "proverPassed": null,
252
+ "baseRuns": 1,
253
+ "gradeable": true,
254
+ "heldOut": false,
255
+ "reason": "base-passes"
256
+ },
257
+ {
258
+ "instance_id": "iluvcapra__pycmx-12",
259
+ "repo": "iluvcapra",
260
+ "basePasses": 1,
261
+ "proverPassed": null,
262
+ "baseRuns": 1,
263
+ "gradeable": true,
264
+ "heldOut": false,
265
+ "reason": "base-passes"
266
+ },
267
+ {
268
+ "instance_id": "instructlab__sdg-484",
269
+ "repo": "instructlab",
270
+ "basePasses": 0,
271
+ "proverPassed": null,
272
+ "baseRuns": 1,
273
+ "gradeable": true,
274
+ "heldOut": false,
275
+ "reason": "base-unscorable",
276
+ "unscorableReason": "grade-error: insufficient disk for swe-rebench eval: 39.9 GB free, need ≥ 40.0 GB"
277
+ },
278
+ {
279
+ "instance_id": "intel__code-base-investigator-178",
280
+ "repo": "intel",
281
+ "basePasses": 1,
282
+ "proverPassed": null,
283
+ "baseRuns": 1,
284
+ "gradeable": true,
285
+ "heldOut": false,
286
+ "reason": "base-passes"
287
+ },
288
+ {
289
+ "instance_id": "iris-hep__func_adl-199",
290
+ "repo": "iris-hep",
291
+ "basePasses": 0,
292
+ "proverPassed": true,
293
+ "baseRuns": 3,
294
+ "gradeable": true,
295
+ "heldOut": true,
296
+ "reason": "held-out"
297
+ },
298
+ {
299
+ "instance_id": "isledecomp__reccmp-142",
300
+ "repo": "isledecomp",
301
+ "basePasses": 1,
302
+ "proverPassed": null,
303
+ "baseRuns": 1,
304
+ "gradeable": true,
305
+ "heldOut": false,
306
+ "reason": "base-passes"
307
+ },
308
+ {
309
+ "instance_id": "jawah__niquests-277",
310
+ "repo": "jawah",
311
+ "basePasses": 1,
312
+ "proverPassed": null,
313
+ "baseRuns": 1,
314
+ "gradeable": true,
315
+ "heldOut": false,
316
+ "reason": "base-passes"
317
+ },
318
+ {
319
+ "instance_id": "jlowin__fastmcp-1425",
320
+ "repo": "jlowin",
321
+ "basePasses": 0,
322
+ "proverPassed": null,
323
+ "baseRuns": 1,
324
+ "gradeable": true,
325
+ "heldOut": false,
326
+ "reason": "base-unscorable",
327
+ "unscorableReason": "grade-error: swe-rebench-v2 eval could not grade the solution (patch_does_not_apply)"
328
+ },
329
+ {
330
+ "instance_id": "JonathonReinhart__scuba-269",
331
+ "repo": "JonathonReinhart",
332
+ "basePasses": 1,
333
+ "proverPassed": null,
334
+ "baseRuns": 1,
335
+ "gradeable": true,
336
+ "heldOut": false,
337
+ "reason": "base-passes"
338
+ },
339
+ {
340
+ "instance_id": "MatterMiners__tardis-361",
341
+ "repo": "MatterMiners",
342
+ "basePasses": 0,
343
+ "proverPassed": true,
344
+ "baseRuns": 3,
345
+ "gradeable": true,
346
+ "heldOut": true,
347
+ "reason": "held-out"
348
+ },
349
+ {
350
+ "instance_id": "mempalace__mempalace-1004",
351
+ "repo": "mempalace",
352
+ "basePasses": 0,
353
+ "proverPassed": false,
354
+ "baseRuns": 3,
355
+ "gradeable": true,
356
+ "heldOut": false,
357
+ "reason": "no-headroom"
358
+ },
359
+ {
360
+ "instance_id": "modelcontextprotocol__python-sdk-222",
361
+ "repo": "modelcontextprotocol",
362
+ "basePasses": 0,
363
+ "proverPassed": true,
364
+ "baseRuns": 3,
365
+ "gradeable": true,
366
+ "heldOut": true,
367
+ "reason": "held-out"
368
+ },
369
+ {
370
+ "instance_id": "movingpandas__movingpandas-444",
371
+ "repo": "movingpandas",
372
+ "basePasses": 0,
373
+ "proverPassed": false,
374
+ "baseRuns": 3,
375
+ "gradeable": true,
376
+ "heldOut": false,
377
+ "reason": "no-headroom"
378
+ },
379
+ {
380
+ "instance_id": "nesquena__hermes-webui-1818",
381
+ "repo": "nesquena",
382
+ "basePasses": 0,
383
+ "proverPassed": null,
384
+ "baseRuns": 3,
385
+ "gradeable": true,
386
+ "heldOut": false,
387
+ "reason": "base-unscorable",
388
+ "unscorableReason": "harness-error: [claude-code-learner] harvestOutput: typed payload /var/folders/2y/y3bmqdw55kx2jhq804chv76m0000gn/T/jinn-eval-work-Fv5BLa/.execute/solution-payload.json failed swe-rebench-v2.v1/solution validation. U"
389
+ },
390
+ {
391
+ "instance_id": "networkx__networkx-7804",
392
+ "repo": "networkx",
393
+ "basePasses": 1,
394
+ "proverPassed": null,
395
+ "baseRuns": 1,
396
+ "gradeable": true,
397
+ "heldOut": false,
398
+ "reason": "base-passes"
399
+ },
400
+ {
401
+ "instance_id": "oemof__tespy-921",
402
+ "repo": "oemof",
403
+ "basePasses": 1,
404
+ "proverPassed": null,
405
+ "baseRuns": 1,
406
+ "gradeable": true,
407
+ "heldOut": false,
408
+ "reason": "base-passes"
409
+ },
410
+ {
411
+ "instance_id": "python-scim__scim2-models-139_interface",
412
+ "repo": "python-scim",
413
+ "basePasses": 1,
414
+ "proverPassed": null,
415
+ "baseRuns": 2,
416
+ "gradeable": true,
417
+ "heldOut": false,
418
+ "reason": "base-passes"
419
+ },
420
+ {
421
+ "instance_id": "python-wheel-build__fromager-1106",
422
+ "repo": "python-wheel-build",
423
+ "basePasses": 1,
424
+ "proverPassed": null,
425
+ "baseRuns": 1,
426
+ "gradeable": true,
427
+ "heldOut": false,
428
+ "reason": "base-passes"
429
+ },
430
+ {
431
+ "instance_id": "qBraid__pyqasm-120",
432
+ "repo": "qBraid",
433
+ "basePasses": 1,
434
+ "proverPassed": null,
435
+ "baseRuns": 2,
436
+ "gradeable": true,
437
+ "heldOut": false,
438
+ "reason": "base-passes"
439
+ },
440
+ {
441
+ "instance_id": "raullenchai__rapid-mlx-289",
442
+ "repo": "raullenchai",
443
+ "basePasses": 1,
444
+ "proverPassed": null,
445
+ "baseRuns": 2,
446
+ "gradeable": true,
447
+ "heldOut": false,
448
+ "reason": "base-passes"
449
+ },
450
+ {
451
+ "instance_id": "RDFLib__pySHACL-285",
452
+ "repo": "RDFLib",
453
+ "basePasses": 1,
454
+ "proverPassed": null,
455
+ "baseRuns": 1,
456
+ "gradeable": true,
457
+ "heldOut": false,
458
+ "reason": "base-passes"
459
+ },
460
+ {
461
+ "instance_id": "stanfordnlp__dspy-9478_interface",
462
+ "repo": "stanfordnlp",
463
+ "basePasses": 1,
464
+ "proverPassed": null,
465
+ "baseRuns": 1,
466
+ "gradeable": true,
467
+ "heldOut": false,
468
+ "reason": "base-passes"
469
+ },
470
+ {
471
+ "instance_id": "tobymao__sqlglot-4563",
472
+ "repo": "tobymao",
473
+ "basePasses": 1,
474
+ "proverPassed": null,
475
+ "baseRuns": 1,
476
+ "gradeable": true,
477
+ "heldOut": false,
478
+ "reason": "base-passes"
479
+ },
480
+ {
481
+ "instance_id": "Toloka__crowd-kit-128",
482
+ "repo": "Toloka",
483
+ "basePasses": 1,
484
+ "proverPassed": null,
485
+ "baseRuns": 1,
486
+ "gradeable": true,
487
+ "heldOut": false,
488
+ "reason": "base-passes"
489
+ },
490
+ {
491
+ "instance_id": "twisted__towncrier-687",
492
+ "repo": "twisted",
493
+ "basePasses": 0,
494
+ "proverPassed": true,
495
+ "baseRuns": 3,
496
+ "gradeable": true,
497
+ "heldOut": true,
498
+ "reason": "held-out"
499
+ },
500
+ {
501
+ "instance_id": "ucfopen__canvasapi-716",
502
+ "repo": "ucfopen",
503
+ "basePasses": 1,
504
+ "proverPassed": null,
505
+ "baseRuns": 1,
506
+ "gradeable": true,
507
+ "heldOut": false,
508
+ "reason": "base-passes"
509
+ },
510
+ {
511
+ "instance_id": "unionai-oss__pandera-1898",
512
+ "repo": "unionai-oss",
513
+ "basePasses": 1,
514
+ "proverPassed": null,
515
+ "baseRuns": 1,
516
+ "gradeable": true,
517
+ "heldOut": false,
518
+ "reason": "base-passes"
519
+ },
520
+ {
521
+ "instance_id": "vprusso__toqito-1484_interface",
522
+ "repo": "vprusso",
523
+ "basePasses": 0,
524
+ "proverPassed": null,
525
+ "baseRuns": 1,
526
+ "gradeable": true,
527
+ "heldOut": false,
528
+ "reason": "base-unscorable",
529
+ "unscorableReason": "grade-error: swe-rebench-v2 eval could not grade the solution (patch_merge_conflict)"
530
+ },
531
+ {
532
+ "instance_id": "zopefoundation__Zope-1243",
533
+ "repo": "zopefoundation",
534
+ "basePasses": 1,
535
+ "proverPassed": null,
536
+ "baseRuns": 1,
537
+ "gradeable": true,
538
+ "heldOut": false,
539
+ "reason": "base-passes"
540
+ },
541
+ {
542
+ "instance_id": "agronholm__anyio-1134",
543
+ "repo": "agronholm",
544
+ "basePasses": 0,
545
+ "proverPassed": true,
546
+ "baseRuns": 3,
547
+ "gradeable": true,
548
+ "heldOut": true,
549
+ "reason": "held-out"
550
+ },
551
+ {
552
+ "instance_id": "databricks__dbt-databricks-1428",
553
+ "repo": "databricks",
554
+ "basePasses": 0,
555
+ "proverPassed": null,
556
+ "baseRuns": 2,
557
+ "gradeable": true,
558
+ "heldOut": false,
559
+ "reason": "base-unscorable",
560
+ "unscorableReason": "grade-error: swe-rebench-v2 eval could not grade the solution (patch_does_not_apply)"
561
+ },
562
+ {
563
+ "instance_id": "hiero-ledger__hiero-sdk-python-2007_interface",
564
+ "repo": "hiero-ledger",
565
+ "basePasses": 1,
566
+ "proverPassed": null,
567
+ "baseRuns": 1,
568
+ "gradeable": true,
569
+ "heldOut": false,
570
+ "reason": "base-passes"
571
+ },
572
+ {
573
+ "instance_id": "isledecomp__reccmp-166",
574
+ "repo": "isledecomp",
575
+ "basePasses": 0,
576
+ "proverPassed": null,
577
+ "baseRuns": 3,
578
+ "gradeable": true,
579
+ "heldOut": false,
580
+ "reason": "no-headroom",
581
+ "unscorableReason": "harness: agent produced no patch"
582
+ },
583
+ {
584
+ "instance_id": "movingpandas__movingpandas-447",
585
+ "repo": "movingpandas",
586
+ "basePasses": 0,
587
+ "proverPassed": null,
588
+ "baseRuns": 1,
589
+ "gradeable": true,
590
+ "heldOut": false,
591
+ "reason": "base-unscorable",
592
+ "unscorableReason": "harness: agent produced no patch"
593
+ },
594
+ {
595
+ "instance_id": "tobymao__sqlglot-4618",
596
+ "repo": "tobymao",
597
+ "basePasses": 0,
598
+ "proverPassed": null,
599
+ "baseRuns": 1,
600
+ "gradeable": true,
601
+ "heldOut": false,
602
+ "reason": "base-unscorable",
603
+ "unscorableReason": "harness: agent produced no patch"
604
+ },
605
+ {
606
+ "instance_id": "tobymao__sqlglot-4643",
607
+ "repo": "tobymao",
608
+ "basePasses": 0,
609
+ "proverPassed": null,
610
+ "baseRuns": 1,
611
+ "gradeable": true,
612
+ "heldOut": false,
613
+ "reason": "base-unscorable",
614
+ "unscorableReason": "harness: agent produced no patch"
615
+ },
616
+ {
617
+ "instance_id": "tobymao__sqlglot-7479",
618
+ "repo": "tobymao",
619
+ "basePasses": 0,
620
+ "proverPassed": null,
621
+ "baseRuns": 1,
622
+ "gradeable": true,
623
+ "heldOut": false,
624
+ "reason": "base-unscorable",
625
+ "unscorableReason": "harness: agent produced no patch"
626
+ }
627
+ ]
628
+ }
@@ -3,6 +3,7 @@
3
3
  * See jinn-mono-6q1.1.
4
4
  */
5
5
  import type { TaskGenerator } from '../tasks/sources.js';
6
+ import type { LoadedHeldOutSlate } from './_swe-rebench-v2-held-out-slate.js';
6
7
  /** Overlay fields merged into Task when posting from --spec-file. */
7
8
  export type ParsedSpecOverlay = {
8
9
  window: unknown;
@@ -46,6 +47,13 @@ export interface SolverTypeDefinition<GenConfig = unknown> {
46
47
  * Return `undefined` to skip (default for kinds without auto-gen or not enabled on testnet).
47
48
  */
48
49
  getTestnetAutoConfig?: (ctx: TestnetAutoContext) => GenConfig | undefined;
50
+ /**
51
+ * Load this SolverType's held-out eval slate at `version` (issue #817).
52
+ * Optional so a future eval orchestrator can compose over SolverTypes that
53
+ * define a slate; SolverTypes without one omit it. The slate is
54
+ * content-addressed and throws on hash mismatch or unknown version.
55
+ */
56
+ loadHeldOutSlate?: (version: string) => LoadedHeldOutSlate;
49
57
  ui?: {
50
58
  description: string;
51
59
  category: string;
@@ -40,6 +40,8 @@ export interface SweRebenchV2AutoConfig {
40
40
  export interface SweRebenchV2GeneratorStaticConfig {
41
41
  stateDir?: string;
42
42
  ipfsRegistryUrl?: string;
43
+ /** IPFS gateway for the fresh-volume pool-recovery fetch (#957). */
44
+ ipfsGatewayUrl?: string;
43
45
  agentEoa?: `0x${string}`;
44
46
  safeAddress?: `0x${string}`;
45
47
  agentPrivateKey?: `0x${string}`;