@researai/deepscientist 1.5.16 → 1.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (896)
  1. package/AGENTS.md +309 -130
  2. package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
  3. package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
  4. package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
  5. package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
  6. package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
  7. package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
  8. package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
  9. package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
  10. package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
  11. package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
  12. package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
  13. package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
  14. package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
  15. package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
  16. package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
  17. package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
  18. package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
  19. package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
  20. package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
  21. package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
  22. package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
  23. package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
  24. package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
  25. package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
  26. package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
  27. package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
  28. package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
  29. package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
  30. package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
  31. package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
  32. package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
  33. package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
  34. package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
  35. package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
  36. package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
  37. package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
  38. package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
  39. package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
  40. package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
  41. package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
  42. package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
  43. package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
  44. package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
  45. package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
  46. package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
  47. package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
  48. package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
  49. package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
  50. package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
  51. package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
  52. package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
  53. package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
  54. package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
  55. package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
  56. package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
  57. package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
  58. package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
  59. package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
  60. package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
  61. package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
  62. package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
  63. package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
  64. package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
  65. package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
  66. package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
  67. package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
  68. package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
  69. package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
  70. package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
  71. package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
  72. package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
  73. package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
  74. package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
  75. package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
  76. package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
  77. package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
  78. package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
  79. package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
  80. package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
  81. package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
  82. package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
  83. package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
  84. package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
  85. package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
  86. package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
  87. package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
  88. package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
  89. package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
  90. package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
  91. package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
  92. package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
  93. package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
  94. package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
  95. package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
  96. package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
  97. package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
  98. package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
  99. package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
  100. package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
  101. package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
  102. package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
  103. package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
  104. package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
  105. package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
  106. package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
  107. package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
  108. package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
  109. package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
  110. package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
  111. package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
  112. package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
  113. package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
  114. package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
  115. package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
  116. package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
  117. package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
  118. package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
  119. package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
  120. package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
  121. package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
  122. package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
  123. package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
  124. package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
  125. package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
  126. package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
  127. package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
  128. package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
  129. package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
  130. package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
  131. package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
  132. package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
  133. package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
  134. package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
  135. package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
  136. package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
  137. package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
  138. package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
  139. package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
  140. package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
  141. package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
  142. package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
  143. package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
  144. package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
  145. package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
  146. package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
  147. package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
  148. package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
  149. package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
  150. package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
  151. package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
  152. package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
  153. package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
  154. package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
  155. package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
  156. package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
  157. package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
  158. package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
  159. package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
  160. package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
  161. package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
  162. package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
  163. package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
  164. package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
  165. package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
  166. package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
  167. package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
  168. package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
  169. package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
  170. package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
  171. package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
  172. package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
  173. package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
  174. package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
  175. package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
  176. package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
  177. package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
  178. package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
  179. package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
  180. package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
  181. package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
  182. package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
  183. package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
  184. package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
  185. package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
  186. package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
  187. package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
  188. package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
  189. package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
  190. package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
  191. package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
  192. package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
  193. package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
  194. package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
  195. package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
  196. package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
  197. package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
  198. package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
  199. package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
  200. package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
  201. package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
  202. package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
  203. package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
  204. package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
  205. package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
  206. package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
  207. package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
  208. package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
  209. package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
  210. package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
  211. package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
  212. package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
  213. package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
  214. package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
  215. package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
  216. package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
  217. package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
  218. package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
  219. package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
  220. package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
  221. package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
  222. package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
  223. package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
  224. package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
  225. package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
  226. package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
  227. package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
  228. package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
  229. package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
  230. package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
  231. package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
  232. package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
  233. package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
  234. package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
  235. package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
  236. package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
  237. package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
  238. package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
  239. package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
  240. package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
  241. package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
  242. package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
  243. package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
  244. package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
  245. package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
  246. package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
  247. package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
  248. package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
  249. package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
  250. package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
  251. package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
  252. package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
  253. package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
  254. package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
  255. package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
  256. package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
  257. package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
  258. package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
  259. package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
  260. package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
  261. package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
  262. package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
  263. package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
  264. package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
  265. package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
  266. package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
  267. package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
  268. package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
  269. package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
  270. package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
  271. package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
  272. package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
  273. package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
  274. package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
  275. package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
  276. package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
  277. package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
  278. package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
  279. package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
  280. package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
  281. package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
  282. package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
  283. package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
  284. package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
  285. package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
  286. package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
  287. package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
  288. package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
  289. package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
  290. package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
  291. package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
  292. package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
  293. package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
  294. package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
  295. package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
  296. package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
  297. package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
  298. package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
  299. package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
  300. package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
  301. package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
  302. package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
  303. package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
  304. package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
  305. package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
  306. package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
  307. package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
  308. package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
  309. package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
  310. package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
  311. package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
  312. package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
  313. package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
  314. package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
  315. package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
  316. package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
  317. package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
  318. package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
  319. package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
  320. package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
  321. package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
  322. package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
  323. package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
  324. package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
  325. package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
  326. package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
  327. package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
  328. package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
  329. package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
  330. package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
  331. package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
  332. package/AISB/image/aisb.b10.climate_earth.svg +16 -0
  333. package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
  334. package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
  335. package/AISB/image/aisb.b2.agent_systems.svg +16 -0
  336. package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
  337. package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
  338. package/AISB/image/aisb.b5.math_proof.svg +16 -0
  339. package/AISB/image/aisb.b6.research_process.svg +16 -0
  340. package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
  341. package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
  342. package/AISB/image/aisb.b9.material_science.svg +16 -0
  343. package/README.md +196 -32
  344. package/bin/ds.js +924 -66
  345. package/docs/en/00_QUICK_START.md +195 -18
  346. package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
  347. package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
  348. package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
  349. package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
  350. package/docs/en/05_TUI_GUIDE.md +171 -2
  351. package/docs/en/07_MEMORY_AND_MCP.md +38 -2
  352. package/docs/en/09_DOCTOR.md +78 -7
  353. package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
  354. package/docs/en/11_LICENSE_AND_RISK.md +4 -0
  355. package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
  356. package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
  357. package/docs/en/15_CODEX_PROVIDER_SETUP.md +624 -180
  358. package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
  359. package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
  360. package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
  361. package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +386 -0
  362. package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
  363. package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
  364. package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
  365. package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
  366. package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
  367. package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
  368. package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
  369. package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
  370. package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
  371. package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
  372. package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
  373. package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
  374. package/docs/en/91_DEVELOPMENT.md +266 -0
  375. package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
  376. package/docs/en/README.md +48 -7
  377. package/docs/images/admin/admin-connectors-health-en.png +0 -0
  378. package/docs/images/admin/admin-controllers-en.png +0 -0
  379. package/docs/images/admin/admin-diagnostics-en.png +0 -0
  380. package/docs/images/admin/admin-errors-en.png +0 -0
  381. package/docs/images/admin/admin-issues-en.png +0 -0
  382. package/docs/images/admin/admin-logs-en.png +0 -0
  383. package/docs/images/admin/admin-quest-detail-en.png +0 -0
  384. package/docs/images/admin/admin-quests-en.png +0 -0
  385. package/docs/images/admin/admin-repairs-en.png +0 -0
  386. package/docs/images/admin/admin-runtime-en.png +0 -0
  387. package/docs/images/admin/admin-search-en.png +0 -0
  388. package/docs/images/admin/admin-stats-en.png +0 -0
  389. package/docs/images/admin/admin-summary-en.png +0 -0
  390. package/docs/images/connectors/connector-discord-en.png +0 -0
  391. package/docs/images/connectors/connector-feishu-en.png +0 -0
  392. package/docs/images/connectors/connector-lingzhu-en.png +0 -0
  393. package/docs/images/connectors/connector-qq-en.png +0 -0
  394. package/docs/images/connectors/connector-slack-en.png +0 -0
  395. package/docs/images/connectors/connector-telegram-en.png +0 -0
  396. package/docs/images/connectors/connector-weixin-en.png +0 -0
  397. package/docs/images/connectors/connector-whatsapp-en.png +0 -0
  398. package/docs/images/settings/settings-baselines-en.png +0 -0
  399. package/docs/images/settings/settings-config-en.png +0 -0
  400. package/docs/images/settings/settings-connectors-overview-en.png +0 -0
  401. package/docs/images/settings/settings-deepxiv-en.png +0 -0
  402. package/docs/images/settings/settings-mcp-servers-en.png +0 -0
  403. package/docs/images/settings/settings-plugins-en.png +0 -0
  404. package/docs/images/settings/settings-runners-en.png +0 -0
  405. package/docs/zh/00_QUICK_START.md +142 -18
  406. package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
  407. package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
  408. package/docs/zh/05_TUI_GUIDE.md +171 -2
  409. package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
  410. package/docs/zh/09_DOCTOR.md +54 -8
  411. package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
  412. package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
  413. package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
  414. package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
  415. package/docs/zh/15_CODEX_PROVIDER_SETUP.md +552 -181
  416. package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +384 -0
  417. package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
  418. package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
  419. package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
  420. package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
  421. package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
  422. package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
  423. package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
  424. package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
  425. package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
  426. package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
  427. package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
  428. package/docs/zh/README.md +33 -7
  429. package/install.sh +168 -20
  430. package/package.json +5 -1
  431. package/pyproject.toml +2 -1
  432. package/src/deepscientist/__init__.py +1 -1
  433. package/src/deepscientist/acp/envelope.py +13 -0
  434. package/src/deepscientist/admin/__init__.py +3 -0
  435. package/src/deepscientist/admin/charts.py +681 -0
  436. package/src/deepscientist/admin/logs.py +119 -0
  437. package/src/deepscientist/admin/repairs.py +217 -0
  438. package/src/deepscientist/admin/service.py +1310 -0
  439. package/src/deepscientist/admin/system_info.py +700 -0
  440. package/src/deepscientist/admin/tasks.py +465 -0
  441. package/src/deepscientist/admin/tool_metrics.py +600 -0
  442. package/src/deepscientist/artifact/guidance.py +8 -4
  443. package/src/deepscientist/artifact/schemas.py +115 -0
  444. package/src/deepscientist/artifact/service.py +4268 -260
  445. package/src/deepscientist/bash_exec/monitor.py +30 -3
  446. package/src/deepscientist/bash_exec/service.py +134 -1
  447. package/src/deepscientist/benchstore/__init__.py +4 -0
  448. package/src/deepscientist/benchstore/prompt_builder.py +224 -0
  449. package/src/deepscientist/benchstore/service.py +1716 -0
  450. package/src/deepscientist/bridges/connectors.py +8 -2
  451. package/src/deepscientist/channels/weixin_ilink.py +8 -1
  452. package/src/deepscientist/cli.py +92 -17
  453. package/src/deepscientist/codex_cli_compat.py +187 -74
  454. package/src/deepscientist/config/models.py +82 -11
  455. package/src/deepscientist/config/service.py +1077 -93
  456. package/src/deepscientist/connector/weixin_support.py +48 -17
  457. package/src/deepscientist/daemon/api/handlers.py +827 -235
  458. package/src/deepscientist/daemon/api/router.py +81 -1
  459. package/src/deepscientist/daemon/app.py +1512 -85
  460. package/src/deepscientist/diagnostics/__init__.py +6 -0
  461. package/src/deepscientist/diagnostics/runner_failures.py +277 -0
  462. package/src/deepscientist/doctor.py +407 -56
  463. package/src/deepscientist/evidence_packets.py +590 -0
  464. package/src/deepscientist/home.py +52 -4
  465. package/src/deepscientist/kimi_cli_compat.py +50 -0
  466. package/src/deepscientist/latex_runtime.py +2 -2
  467. package/src/deepscientist/mcp/context.py +2 -0
  468. package/src/deepscientist/mcp/schemas.py +114 -0
  469. package/src/deepscientist/mcp/server.py +1566 -126
  470. package/src/deepscientist/memory/service.py +203 -16
  471. package/src/deepscientist/process_control.py +8 -1
  472. package/src/deepscientist/prompts/builder.py +850 -88
  473. package/src/deepscientist/quest/__init__.py +2 -2
  474. package/src/deepscientist/quest/layout.py +12 -1
  475. package/src/deepscientist/quest/node_traces.py +10 -0
  476. package/src/deepscientist/quest/service.py +1852 -161
  477. package/src/deepscientist/quest/stage_views.py +1 -1
  478. package/src/deepscientist/runners/__init__.py +18 -0
  479. package/src/deepscientist/runners/base.py +89 -1
  480. package/src/deepscientist/runners/builtins.py +13 -1
  481. package/src/deepscientist/runners/claude.py +391 -0
  482. package/src/deepscientist/runners/codex.py +480 -35
  483. package/src/deepscientist/runners/codex_telemetry.py +127 -0
  484. package/src/deepscientist/runners/kimi.py +334 -0
  485. package/src/deepscientist/runners/metadata.py +68 -0
  486. package/src/deepscientist/runners/opencode.py +414 -0
  487. package/src/deepscientist/runners/runtime_overrides.py +100 -0
  488. package/src/deepscientist/runners/simple_cli.py +538 -0
  489. package/src/deepscientist/runtime_storage.py +303 -0
  490. package/src/deepscientist/shared.py +80 -16
  491. package/src/deepscientist/skills/installer.py +37 -0
  492. package/src/deepscientist/skills/registry.py +2 -0
  493. package/src/deepscientist/tinytex.py +2 -2
  494. package/src/deepscientist/tui.py +10 -3
  495. package/src/prompts/benchstore/system.md +77 -0
  496. package/src/prompts/connectors/qq.md +33 -2
  497. package/src/prompts/connectors/weixin.md +208 -23
  498. package/src/prompts/contracts/admin_ops.md +74 -0
  499. package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
  500. package/src/prompts/contracts/shared_interaction.md +5 -10
  501. package/src/prompts/start_setup/system.md +422 -0
  502. package/src/prompts/system.md +411 -304
  503. package/src/prompts/system_copilot.md +89 -0
  504. package/src/skills/analysis-campaign/SKILL.md +239 -578
  505. package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
  506. package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
  507. package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
  508. package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
  509. package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
  510. package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
  511. package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
  512. package/src/skills/baseline/SKILL.md +183 -461
  513. package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
  514. package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
  515. package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
  516. package/src/skills/baseline/references/baseline-plan-template.md +37 -76
  517. package/src/skills/baseline/references/boundary-cases.md +86 -0
  518. package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
  519. package/src/skills/baseline/references/comparability-contract.md +7 -12
  520. package/src/skills/baseline/references/operational-guidance.md +56 -0
  521. package/src/skills/baseline/references/route-selection.md +5 -25
  522. package/src/skills/decision/SKILL.md +113 -306
  523. package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
  524. package/src/skills/decision/references/operational-guidance.md +94 -0
  525. package/src/skills/decision/references/research-route-criteria.md +7 -8
  526. package/src/skills/decision/references/strategic-decision-template.md +13 -26
  527. package/src/skills/experiment/SKILL.md +132 -670
  528. package/src/skills/experiment/references/execution-playbook.md +374 -0
  529. package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
  530. package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
  531. package/src/skills/experiment/references/operational-guidance.md +108 -0
  532. package/src/skills/finalize/SKILL.md +62 -0
  533. package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
  534. package/src/skills/finalize/references/resume-packet-template.md +7 -0
  535. package/src/skills/idea/SKILL.md +228 -15
  536. package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
  537. package/src/skills/idea/references/current-board-packet-template.md +61 -0
  538. package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
  539. package/src/skills/idea/references/idea-generation-playbook.md +21 -0
  540. package/src/skills/idea/references/idea-thinking-flow.md +6 -0
  541. package/src/skills/idea/references/literature-survey-template.md +3 -0
  542. package/src/skills/idea/references/objective-contract-template.md +54 -0
  543. package/src/skills/idea/references/outline-seeding-example.md +56 -0
  544. package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
  545. package/src/skills/idea/references/related-work-playbook.md +75 -2
  546. package/src/skills/idea/references/research-history-playbook.md +114 -0
  547. package/src/skills/idea/references/selection-gate.md +58 -6
  548. package/src/skills/intake-audit/SKILL.md +43 -2
  549. package/src/skills/intake-audit/references/state-audit-template.md +10 -0
  550. package/src/skills/nature-data/SKILL.md +128 -0
  551. package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
  552. package/src/skills/nature-data/agents/openai.yaml +4 -0
  553. package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
  554. package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
  555. package/src/skills/nature-data/references/policy-principles.md +103 -0
  556. package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
  557. package/src/skills/nature-data/references/source-basis.md +54 -0
  558. package/src/skills/nature-data/references/statement-patterns.md +153 -0
  559. package/src/skills/nature-figure/SKILL.md +197 -0
  560. package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
  561. package/src/skills/nature-figure/agents/openai.yaml +4 -0
  562. package/src/skills/nature-figure/evals/evals.json +37 -0
  563. package/src/skills/nature-figure/references/api.md +428 -0
  564. package/src/skills/nature-figure/references/backend-selection.md +100 -0
  565. package/src/skills/nature-figure/references/chart-types.md +281 -0
  566. package/src/skills/nature-figure/references/common-patterns.md +349 -0
  567. package/src/skills/nature-figure/references/design-theory.md +436 -0
  568. package/src/skills/nature-figure/references/figure-contract.md +93 -0
  569. package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
  570. package/src/skills/nature-figure/references/qa-contract.md +119 -0
  571. package/src/skills/nature-figure/references/r-template-index.md +66 -0
  572. package/src/skills/nature-figure/references/r-workflow.md +161 -0
  573. package/src/skills/nature-figure/references/tutorials.md +250 -0
  574. package/src/skills/nature-paper2ppt/SKILL.md +507 -0
  575. package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
  576. package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
  577. package/src/skills/nature-polishing/SKILL.md +385 -0
  578. package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
  579. package/src/skills/nature-polishing/agents/openai.yaml +4 -0
  580. package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
  581. package/src/skills/nature-polishing/references/section-moves.md +240 -0
  582. package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
  583. package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
  584. package/src/skills/optimize/SKILL.md +177 -1568
  585. package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
  586. package/src/skills/optimize/references/candidate-board-template.md +13 -0
  587. package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
  588. package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
  589. package/src/skills/optimize/references/debug-response-template.md +29 -0
  590. package/src/skills/optimize/references/frontier-review-template.md +32 -0
  591. package/src/skills/optimize/references/fusion-playbook.md +36 -0
  592. package/src/skills/optimize/references/method-brief-template.md +73 -0
  593. package/src/skills/optimize/references/operational-guidance.md +621 -0
  594. package/src/skills/optimize/references/optimization-memory-template.md +30 -0
  595. package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
  596. package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
  597. package/src/skills/optimize/references/prompt-patterns.md +49 -0
  598. package/src/skills/paper-outline/SKILL.md +227 -0
  599. package/src/skills/paper-outline/references/outline-patterns.md +87 -0
  600. package/src/skills/paper-plot/SKILL.md +79 -0
  601. package/src/skills/paper-plot/agents/openai.yaml +4 -0
  602. package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
  603. package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
  604. package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
  605. package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
  606. package/src/skills/paper-plot/references/line_training_curve.md +44 -0
  607. package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
  608. package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
  609. package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
  610. package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
  611. package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
  612. package/src/skills/paper-plot/scripts/line_aime.py +94 -0
  613. package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
  614. package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
  615. package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
  616. package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
  617. package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
  618. package/src/skills/rebuttal/SKILL.md +9 -0
  619. package/src/skills/references/tool-usage-by-stage.md +438 -0
  620. package/src/skills/review/SKILL.md +105 -7
  621. package/src/skills/science/PROVENANCE.md +44 -0
  622. package/src/skills/science/SKILL.md +137 -0
  623. package/src/skills/science/references/artifact-science-tool.md +110 -0
  624. package/src/skills/science/references/claim-type-discipline.md +56 -0
  625. package/src/skills/science/references/domain-index.md +422 -0
  626. package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
  627. package/src/skills/science/references/package-check-playbook.md +64 -0
  628. package/src/skills/science/references/package-index.min.json +3616 -0
  629. package/src/skills/science/references/packages/abinit.md +80 -0
  630. package/src/skills/science/references/packages/acts.md +73 -0
  631. package/src/skills/science/references/packages/aiida-core.md +80 -0
  632. package/src/skills/science/references/packages/alamode.md +80 -0
  633. package/src/skills/science/references/packages/amuse.md +88 -0
  634. package/src/skills/science/references/packages/anndata.md +88 -0
  635. package/src/skills/science/references/packages/arbor.md +80 -0
  636. package/src/skills/science/references/packages/arc.md +73 -0
  637. package/src/skills/science/references/packages/astropy.md +88 -0
  638. package/src/skills/science/references/packages/astroquery.md +88 -0
  639. package/src/skills/science/references/packages/atomate2.md +80 -0
  640. package/src/skills/science/references/packages/atomsmltr.md +73 -0
  641. package/src/skills/science/references/packages/awkward.md +73 -0
  642. package/src/skills/science/references/packages/batman.md +88 -0
  643. package/src/skills/science/references/packages/biopython.md +88 -0
  644. package/src/skills/science/references/packages/bloqade.md +73 -0
  645. package/src/skills/science/references/packages/brian2.md +73 -0
  646. package/src/skills/science/references/packages/bullet3.md +73 -0
  647. package/src/skills/science/references/packages/calculix.md +80 -0
  648. package/src/skills/science/references/packages/cantera.md +73 -0
  649. package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
  650. package/src/skills/science/references/packages/ccdproc.md +88 -0
  651. package/src/skills/science/references/packages/celerite2.md +88 -0
  652. package/src/skills/science/references/packages/cellrank.md +73 -0
  653. package/src/skills/science/references/packages/cesm.md +80 -0
  654. package/src/skills/science/references/packages/chemicals.md +73 -0
  655. package/src/skills/science/references/packages/chempy.md +73 -0
  656. package/src/skills/science/references/packages/cirq.md +73 -0
  657. package/src/skills/science/references/packages/coffea.md +73 -0
  658. package/src/skills/science/references/packages/cp2k.md +88 -0
  659. package/src/skills/science/references/packages/custodian.md +80 -0
  660. package/src/skills/science/references/packages/dart.md +73 -0
  661. package/src/skills/science/references/packages/datamol.md +88 -0
  662. package/src/skills/science/references/packages/dd4hep.md +73 -0
  663. package/src/skills/science/references/packages/dealii.md +80 -0
  664. package/src/skills/science/references/packages/deepchem.md +88 -0
  665. package/src/skills/science/references/packages/delphes.md +73 -0
  666. package/src/skills/science/references/packages/devito.md +80 -0
  667. package/src/skills/science/references/packages/dftb.md +88 -0
  668. package/src/skills/science/references/packages/dftd4.md +88 -0
  669. package/src/skills/science/references/packages/dftk-jl.md +80 -0
  670. package/src/skills/science/references/packages/dolfinx.md +80 -0
  671. package/src/skills/science/references/packages/drake.md +73 -0
  672. package/src/skills/science/references/packages/dumux.md +73 -0
  673. package/src/skills/science/references/packages/elk.md +80 -0
  674. package/src/skills/science/references/packages/elmerfem.md +80 -0
  675. package/src/skills/science/references/packages/enzo-e.md +88 -0
  676. package/src/skills/science/references/packages/espresso.md +80 -0
  677. package/src/skills/science/references/packages/exoplanet.md +88 -0
  678. package/src/skills/science/references/packages/fairroot.md +73 -0
  679. package/src/skills/science/references/packages/fbpic.md +80 -0
  680. package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
  681. package/src/skills/science/references/packages/geant4.md +73 -0
  682. package/src/skills/science/references/packages/geosx.md +80 -0
  683. package/src/skills/science/references/packages/gprmax.md +80 -0
  684. package/src/skills/science/references/packages/gromacs.md +80 -0
  685. package/src/skills/science/references/packages/gwaslab.md +73 -0
  686. package/src/skills/science/references/packages/gz-sim.md +73 -0
  687. package/src/skills/science/references/packages/hail.md +88 -0
  688. package/src/skills/science/references/packages/hiphive.md +80 -0
  689. package/src/skills/science/references/packages/hoomd-blue.md +80 -0
  690. package/src/skills/science/references/packages/itensor.md +73 -0
  691. package/src/skills/science/references/packages/itensors-jl.md +73 -0
  692. package/src/skills/science/references/packages/jdftx.md +73 -0
  693. package/src/skills/science/references/packages/jobflow.md +80 -0
  694. package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
  695. package/src/skills/science/references/packages/kite.md +80 -0
  696. package/src/skills/science/references/packages/kratos.md +80 -0
  697. package/src/skills/science/references/packages/kwant.md +73 -0
  698. package/src/skills/science/references/packages/lammps.md +80 -0
  699. package/src/skills/science/references/packages/lightkurve.md +88 -0
  700. package/src/skills/science/references/packages/limix.md +73 -0
  701. package/src/skills/science/references/packages/maxwelllink.md +80 -0
  702. package/src/skills/science/references/packages/mcdc.md +73 -0
  703. package/src/skills/science/references/packages/meep.md +80 -0
  704. package/src/skills/science/references/packages/mfem.md +80 -0
  705. package/src/skills/science/references/packages/mitgcm.md +73 -0
  706. package/src/skills/science/references/packages/modflow6.md +73 -0
  707. package/src/skills/science/references/packages/molecool.md +73 -0
  708. package/src/skills/science/references/packages/mom6.md +73 -0
  709. package/src/skills/science/references/packages/moose.md +80 -0
  710. package/src/skills/science/references/packages/mpas-model.md +73 -0
  711. package/src/skills/science/references/packages/mujoco.md +73 -0
  712. package/src/skills/science/references/packages/mumax3.md +73 -0
  713. package/src/skills/science/references/packages/nekrs.md +80 -0
  714. package/src/skills/science/references/packages/nessi.md +73 -0
  715. package/src/skills/science/references/packages/nest-simulator.md +73 -0
  716. package/src/skills/science/references/packages/netket.md +73 -0
  717. package/src/skills/science/references/packages/neuron.md +73 -0
  718. package/src/skills/science/references/packages/nextflow.md +88 -0
  719. package/src/skills/science/references/packages/nwchem.md +88 -0
  720. package/src/skills/science/references/packages/openbabel.md +88 -0
  721. package/src/skills/science/references/packages/openems.md +80 -0
  722. package/src/skills/science/references/packages/openff-toolkit.md +88 -0
  723. package/src/skills/science/references/packages/openfoam-dev.md +80 -0
  724. package/src/skills/science/references/packages/openmc.md +73 -0
  725. package/src/skills/science/references/packages/openmm.md +80 -0
  726. package/src/skills/science/references/packages/openmoc.md +73 -0
  727. package/src/skills/science/references/packages/openmx.md +80 -0
  728. package/src/skills/science/references/packages/opensees.md +80 -0
  729. package/src/skills/science/references/packages/opensn.md +80 -0
  730. package/src/skills/science/references/packages/opm-simulators.md +73 -0
  731. package/src/skills/science/references/packages/oqupy.md +73 -0
  732. package/src/skills/science/references/packages/packmol.md +80 -0
  733. package/src/skills/science/references/packages/palabos.md +80 -0
  734. package/src/skills/science/references/packages/parflow.md +80 -0
  735. package/src/skills/science/references/packages/pennylane.md +88 -0
  736. package/src/skills/science/references/packages/perceval.md +73 -0
  737. package/src/skills/science/references/packages/phono3py.md +73 -0
  738. package/src/skills/science/references/packages/phonopy.md +73 -0
  739. package/src/skills/science/references/packages/photutils.md +88 -0
  740. package/src/skills/science/references/packages/picongpu.md +80 -0
  741. package/src/skills/science/references/packages/plink-ng.md +88 -0
  742. package/src/skills/science/references/packages/precice.md +73 -0
  743. package/src/skills/science/references/packages/psc.md +80 -0
  744. package/src/skills/science/references/packages/psi4.md +88 -0
  745. package/src/skills/science/references/packages/pybinding.md +73 -0
  746. package/src/skills/science/references/packages/pyfr.md +80 -0
  747. package/src/skills/science/references/packages/pyhf.md +73 -0
  748. package/src/skills/science/references/packages/pyiron_base.md +80 -0
  749. package/src/skills/science/references/packages/pylcp.md +73 -0
  750. package/src/skills/science/references/packages/pylith.md +80 -0
  751. package/src/skills/science/references/packages/pynbody.md +88 -0
  752. package/src/skills/science/references/packages/pysam.md +88 -0
  753. package/src/skills/science/references/packages/pyscf.md +88 -0
  754. package/src/skills/science/references/packages/q-e.md +73 -0
  755. package/src/skills/science/references/packages/qibo.md +73 -0
  756. package/src/skills/science/references/packages/qiskit.md +73 -0
  757. package/src/skills/science/references/packages/quantica-jl.md +73 -0
  758. package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
  759. package/src/skills/science/references/packages/quimb.md +73 -0
  760. package/src/skills/science/references/packages/qulacs.md +73 -0
  761. package/src/skills/science/references/packages/qutip.md +73 -0
  762. package/src/skills/science/references/packages/rdkit.md +88 -0
  763. package/src/skills/science/references/packages/rmg-py.md +73 -0
  764. package/src/skills/science/references/packages/root.md +73 -0
  765. package/src/skills/science/references/packages/scanpy.md +88 -0
  766. package/src/skills/science/references/packages/scikit-allel.md +88 -0
  767. package/src/skills/science/references/packages/scikit-bio.md +88 -0
  768. package/src/skills/science/references/packages/scqubits.md +73 -0
  769. package/src/skills/science/references/packages/scuff-em.md +80 -0
  770. package/src/skills/science/references/packages/scvi-tools.md +73 -0
  771. package/src/skills/science/references/packages/seissol.md +73 -0
  772. package/src/skills/science/references/packages/sfepy.md +80 -0
  773. package/src/skills/science/references/packages/sisl.md +73 -0
  774. package/src/skills/science/references/packages/smilei.md +80 -0
  775. package/src/skills/science/references/packages/snakemake.md +88 -0
  776. package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
  777. package/src/skills/science/references/packages/specutils.md +88 -0
  778. package/src/skills/science/references/packages/spglib.md +80 -0
  779. package/src/skills/science/references/packages/squidpy.md +88 -0
  780. package/src/skills/science/references/packages/starry.md +88 -0
  781. package/src/skills/science/references/packages/strawberryfields.md +73 -0
  782. package/src/skills/science/references/packages/su2.md +80 -0
  783. package/src/skills/science/references/packages/sunny-jl.md +73 -0
  784. package/src/skills/science/references/packages/sw4.md +73 -0
  785. package/src/skills/science/references/packages/swift.md +88 -0
  786. package/src/skills/science/references/packages/tdnegf.md +73 -0
  787. package/src/skills/science/references/packages/tenpy.md +73 -0
  788. package/src/skills/science/references/packages/thermo.md +73 -0
  789. package/src/skills/science/references/packages/tkwant.md +73 -0
  790. package/src/skills/science/references/packages/tvb-root.md +73 -0
  791. package/src/skills/science/references/packages/uproot5.md +73 -0
  792. package/src/skills/science/references/packages/vampire.md +80 -0
  793. package/src/skills/science/references/packages/wannier_tools.md +73 -0
  794. package/src/skills/science/references/packages/warpx.md +80 -0
  795. package/src/skills/science/references/packages/wrf.md +73 -0
  796. package/src/skills/science/references/packages/xtb.md +88 -0
  797. package/src/skills/science/references/packages/yt.md +73 -0
  798. package/src/skills/science/references/science-task-brief-template.md +71 -0
  799. package/src/skills/scout/SKILL.md +83 -425
  800. package/src/skills/scout/references/literature-scout-template.md +5 -24
  801. package/src/skills/scout/references/operational-guidance.md +191 -0
  802. package/src/skills/scout/references/paper-triage-playbook.md +11 -35
  803. package/src/skills/write/SKILL.md +744 -1246
  804. package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
  805. package/src/skills/write/references/oral_package_patterns.md +252 -0
  806. package/src/skills/write/references/oral_writing_principles.md +291 -0
  807. package/src/skills/write/references/section_rewrite_checklist.md +234 -0
  808. package/src/tui/dist/app/AppContainer.js +1314 -27
  809. package/src/tui/dist/components/Composer.js +26 -1
  810. package/src/tui/dist/components/ConfigScreen.js +2 -1
  811. package/src/tui/dist/components/InputPrompt.js +25 -9
  812. package/src/tui/dist/components/MainContent.js +18 -3
  813. package/src/tui/dist/components/QuestScreen.js +3 -2
  814. package/src/tui/dist/components/UtilityScreen.js +37 -0
  815. package/src/tui/dist/hooks/useSafeInput.js +10 -0
  816. package/src/tui/dist/index.js +13 -1
  817. package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
  818. package/src/tui/dist/lib/api.js +89 -1
  819. package/src/tui/package.json +1 -1
  820. package/src/ui/dist/assets/{AnalysisPlugin-DnSm0GZn.js → AnalysisPlugin-CA94NGmI.js} +1 -1
  821. package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
  822. package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
  823. package/src/ui/dist/assets/{CodeViewerPlugin-itb0tltR.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
  824. package/src/ui/dist/assets/{DocViewerPlugin-DqKkiCI6.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
  825. package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
  826. package/src/ui/dist/assets/{GitDiffViewerPlugin-DxL2ezFG.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
  827. package/src/ui/dist/assets/{GitSnapshotViewer-B_RQm1YZ.js → GitSnapshotViewer-CweA6VON.js} +2 -2
  828. package/src/ui/dist/assets/{ImageViewerPlugin-tHqlXY3n.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
  829. package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
  830. package/src/ui/dist/assets/{LatexPlugin-B495DTXC.js → LatexPlugin-BQjAaA5J.js} +4 -4
  831. package/src/ui/dist/assets/{MarkdownViewerPlugin-DG28-61B.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
  832. package/src/ui/dist/assets/{MarketplacePlugin-BiOGT-Kj.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
  833. package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
  834. package/src/ui/dist/assets/{NotebookEditor-CVsj8h_T.js → NotebookEditor-WFyd8Ybt.js} +23 -23
  835. package/src/ui/dist/assets/{PdfLoader-CASDQmxJ.js → PdfLoader-CLE5u5TS.js} +3 -3
  836. package/src/ui/dist/assets/{PdfMarkdownPlugin-BFhwoKsY.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
  837. package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
  838. package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
  839. package/src/ui/dist/assets/{TextViewerPlugin-CB4DYfWO.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
  840. package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
  841. package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
  842. package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
  843. package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
  844. package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
  845. package/src/ui/dist/assets/{code-DLC6G24T.js → code-DbsmSd3Y.js} +1 -1
  846. package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
  847. package/src/ui/dist/assets/{wrap-text-CwMn-iqb.js → file-jump-queue-DeQBikaw.js} +3 -3
  848. package/src/ui/dist/assets/{file-socket-Cu4Qln7Y.js → file-socket-DA5XIx88.js} +1 -1
  849. package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
  850. package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
  851. package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
  852. package/src/ui/dist/assets/{index-wQ7RIIRd.js → index-BsO46tJA.js} +1 -1
  853. package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
  854. package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
  855. package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
  856. package/src/ui/dist/assets/{project-sync-CsX08Qno.js → project-sync-DPmWKmKD.js} +1 -1
  857. package/src/ui/dist/assets/{zoom-out-R-GWEhzS.js → zoom-out-DAukFWen.js} +3 -3
  858. package/src/ui/dist/index.html +3 -3
  859. package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
  860. package/src/skills/baseline/references/memory-playbook.md +0 -40
  861. package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
  862. package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
  863. package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
  864. package/src/skills/write/references/paper-section-playbook.md +0 -64
  865. package/src/skills/write/references/reviewer-first-writing.md +0 -64
  866. package/src/skills/write/references/revision-checklist.md +0 -70
  867. package/src/skills/write/references/section-contracts.md +0 -82
  868. package/src/skills/write/references/sentence-level-proofing.md +0 -49
  869. package/src/ui/dist/assets/AiManusChatView-COFACy7V.js +0 -204
  870. package/src/ui/dist/assets/CliPlugin-CvwCmDQ5.js +0 -109
  871. package/src/ui/dist/assets/CodeEditorPlugin-cOqSa0xq.js +0 -2
  872. package/src/ui/dist/assets/GitCommitViewerPlugin-DVgNHBCS.js +0 -1
  873. package/src/ui/dist/assets/LabCopilotPanel-ClMbq5Yu.js +0 -14
  874. package/src/ui/dist/assets/LabPlugin-L_SuE8ow.js +0 -22
  875. package/src/ui/dist/assets/NotebookEditor-C-4Kt1p9.js +0 -81
  876. package/src/ui/dist/assets/PdfViewerPlugin-DcOzU9vd.js +0 -17
  877. package/src/ui/dist/assets/SearchPlugin-CHj7M58O.js +0 -16
  878. package/src/ui/dist/assets/VNCViewer-CjlbyCB3.js +0 -11
  879. package/src/ui/dist/assets/bot-CFkZY-JP.js +0 -6
  880. package/src/ui/dist/assets/chevron-up-Dq5ofbht.js +0 -6
  881. package/src/ui/dist/assets/file-content-Dv4LoZec.js +0 -1
  882. package/src/ui/dist/assets/file-diff-panel-Denq-lC3.js +0 -1
  883. package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
  884. package/src/ui/dist/assets/git-commit-horizontal-BUh6G52n.js +0 -6
  885. package/src/ui/dist/assets/image-B9HUUddG.js +0 -6
  886. package/src/ui/dist/assets/index-B2B1sg-M.js +0 -1
  887. package/src/ui/dist/assets/index-Cgla8biy.css +0 -33
  888. package/src/ui/dist/assets/index-DRyx7vAc.js +0 -1
  889. package/src/ui/dist/assets/index-Gbl53BNp.js +0 -2496
  890. package/src/ui/dist/assets/pdf-effect-queue-ZtnHFCAi.js +0 -6
  891. package/src/ui/dist/assets/popover-DL6h35vr.js +0 -1
  892. package/src/ui/dist/assets/select-DvmXt1yY.js +0 -11
  893. package/src/ui/dist/assets/sigma-7jpXazui.js +0 -6
  894. package/src/ui/dist/assets/trash-xA7kFt8i.js +0 -11
  895. package/src/ui/dist/assets/useCliAccess-DsMwDjOp.js +0 -1
  896. package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
@@ -0,0 +1,193 @@
1
+ schema_version: 1
2
+ id: aisb.t3.005_tsae
3
+ name: 'Temporal Sparse Autoencoders: Leveraging the Sequential Nature of Language
4
+ for Interpretability'
5
+ version: 0.1.0
6
+ one_line: Train temporal sparse autoencoders (T-SAEs) with a contrastive temporal-consistency
7
+ loss on LLM activations, then evaluate feature quality via SAEBench-style automated
8
+ interpretability scoring.
9
+ task_description: 'This benchmark requires training Temporal Sparse Autoencoders (T-SAEs)
10
+ that partition latent features into high-level (semantic, temporally consistent)
11
+ and low-level (syntactic, token-local) components using a contrastive loss over
12
+ adjacent-token activations from language models (Pythia-160m or Gemma-2-2b). The
13
+ T-SAE architecture extends Matryoshka BatchTopK SAEs with a temporal contrastive
14
+ term encouraging high-level features to remain stable across adjacent tokens in
15
+ a sequence. The primary execution route is: (1) train a T-SAE on model activations
16
+ extracted from the Pile dataset using dictionary_learning/dictionary_learning/train_temporal.py,
17
+ (2) evaluate reconstruction quality, sparsity, and temporal smoothness using dictionary_learning/dictionary_learning/eval_temporal.py,
18
+ and (3) compute automated interpretability scores by processing SAEBench-generated
19
+ explanation JSON files via src/process_sae_bench_autointerp.py. Downstream experiments
20
+ include probing for semantic/contextual/syntactic content, t-SNE visualization,
21
+ and an HH-RLHF alignment case study. Pretrained Gemma-2-2b T-SAE checkpoints with
22
+ 16384 features and pre-labeled explanations are available on HuggingFace, enabling
23
+ evaluation without retraining. The autointerp evaluation requires SAEBench (external)
24
+ to generate feature explanations using a judge LLM (Llama-3.3-70b-Instruct in the
25
+ paper). Training data streams from the Pile via HuggingFace datasets; no manual
26
+ dataset download is needed for the core route.
27
+
28
+ '
29
+ capability_tags:
30
+ - research_code_optimization
31
+ - mechanistic_interpretability
32
+ - sparse_autoencoders
33
+ - large_language_models
34
+ - evaluation
35
+ - contrastive_learning
36
+ - dictionary_learning
37
+ aisb_direction: T3
38
+ track_fit:
39
+ - paper_track
40
+ - benchmark_track
41
+ task_mode: experiment_driven
42
+ requires_execution: true
43
+ requires_paper: true
44
+ integrity_level: cas_plus_canary
45
+ snapshot_status: runnable
46
+ support_level: advanced
47
+ cost_band: high
48
+ time_band: 1d+
49
+ difficulty: hard
50
+ data_access: public
51
+ primary_outputs:
52
+ - autointerp_score
53
+ - sae_checkpoint
54
+ - interpretability_report
55
+ - probing_accuracy
56
+ - temporal_smoothness_metrics
57
+ launch_profiles:
58
+ - id: quick_check
59
+ label: Quick Check
60
+ description: 'Run a small T-SAE training pass on Pythia-160m with reduced steps
61
+ and a short eval to verify the pipeline end-to-end. Uses NeelNanda/pile-10k for
62
+ fast iteration.
63
+
64
+ '
65
+ - id: autointerp_eval
66
+ label: Autointerp Eval
67
+ description: 'Train temporal sparse autoencoders on full Pile data, generate feature
68
+ explanations via SAEBench with a judge LLM, and compute autointerp scores. This
69
+ is the paper-faithful route requiring external SAEBench and a 70B judge model.
70
+
71
+ '
72
+ - id: pretrained_eval
73
+ label: Pretrained Eval
74
+ description: 'Download the pretrained Gemma-2-2b T-SAE and bundled explanations
75
+ from HuggingFace, then run eval_temporal.py and process_sae_bench_autointerp.py
76
+ without retraining.
77
+
78
+ '
79
+ dataset_download:
80
+ primary_method: streaming
81
+ sources:
82
+ - kind: huggingface
83
+ url: https://huggingface.co/datasets/monology/pile-uncopyrighted
84
+ access: public
85
+ note: Primary training/eval data; streamed via HuggingFace datasets. No manual
86
+ download required.
87
+ - kind: huggingface
88
+ url: https://huggingface.co/datasets/NeelNanda/pile-10k
89
+ access: public
90
+ note: Small subset used for quick evaluation passes.
91
+ - kind: huggingface
92
+ url: https://huggingface.co/alex-oesterling/temporal-saes
93
+ access: public
94
+ note: Pretrained Gemma-2-2b T-SAE checkpoint (16384 features) with labeled explanations.json.
95
+ notes:
96
+ - Training data is streamed; disk usage is dominated by model weights and SAE checkpoints.
97
+ - Gemma-2-2b weights require HuggingFace access agreement.
98
+ credential_requirements:
99
+ mode: optional
100
+ items:
101
+ - HuggingFace token (required for gated models like Gemma-2-2b; optional for Pythia-160m)
102
+ - SAEBench access (external tool for generating feature explanations; not bundled)
103
+ notes:
104
+ - Rename example.env to .env and add HF_TOKEN if using Gemma-2-2b or customizing
105
+ HuggingFace paths.
106
+ - Autointerp evaluation requires running SAEBench externally with a judge LLM (paper
107
+ uses Llama-3.3-70B-Instruct).
108
+ resources:
109
+ minimum:
110
+ cpu_cores: 16
111
+ ram_gb: 64
112
+ disk_gb: 100
113
+ gpu_count: 1
114
+ gpu_vram_gb: 24
115
+ recommended:
116
+ cpu_cores: 32
117
+ ram_gb: 128
118
+ disk_gb: 200
119
+ gpu_count: 1
120
+ gpu_vram_gb: 48
121
+ environment:
122
+ python: '3.11'
123
+ cuda: '12.8'
124
+ pytorch: null
125
+ flash_attn: null
126
+ key_packages:
127
+ - poetry
128
+ - nnsight
129
+ - datasets
130
+ - dictionary_learning (bundled fork)
131
+ notes:
132
+ - Poetry-managed environment; run 'poetry install' to set up. Torch wheels are pulled
133
+ from the cu128 index.
134
+ - The dictionary_learning directory is a bundled fork of github.com/saprmarks/dictionary_learning.
135
+ - See pyproject.toml and poetry.lock for the full pinned dependency set.
136
+ risk_flags:
137
+ - external_eval_dependency
138
+ - large_model_weights
139
+ - judge_model_required
140
+ - some_experiments_under_construction
141
+ risk_notes:
142
+ - SAEBench is not bundled; autointerp evaluation requires cloning and running it separately
143
+ with a large judge LLM (70B parameter Llama-3.3 in the paper).
144
+ - Gemma-2-2b weights (~5 GB) must be downloaded and may require HuggingFace access
145
+ agreement.
146
+ - The full autointerp route requires hosting or API access to a 70B judge model, which
147
+ significantly increases cost.
148
+ - README marks "Sequence Interpretability (Figures 1 and 4)" and "Steering" experiments
149
+ as under construction.
150
+ - No benchmark execution was performed during the packaging pass; metrics are code-backed
151
+ but unverified at runtime.
152
+ recommended_when: 'Use this benchmark when you want a mechanistic-interpretability
153
+ task that combines SAE training with temporal-contrastive learning and automated
154
+ interpretability evaluation. Good fit for research on disentangling semantic vs.
155
+ syntactic features in LLM representations, or for optimizing SAE training pipelines
156
+ under structured priors.
157
+
158
+ '
159
+ not_recommended_when: 'Do not use this if you need a lightweight CPU-only benchmark,
160
+ cannot host LLM checkpoints (Pythia-160m minimum, Gemma-2-2b recommended) locally,
161
+ or lack GPU access. Avoid if you cannot run or access a large judge model for the
162
+ autointerp evaluation route.
163
+
164
+ '
165
+ paper:
166
+ title: 'Temporal Sparse Autoencoders: Leveraging the Sequential Nature of Language
167
+ for Interpretability'
168
+ authors:
169
+ - Usha Bhalla
170
+ - Alex Oesterling
171
+ - Claudio Mayrink Verdun
172
+ - Himabindu Lakkaraju
173
+ - Flavio P. Calmon
174
+ venue: arXiv preprint
175
+ year: 2025
176
+ url: https://arxiv.org/abs/2511.05541
177
+ download:
178
+ url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.005_tsae.zip
179
+ archive_type: zip
180
+ local_dir_name: paper-5-TSAE
181
+ provider: github_release
182
+ repo: ResearAI/DeepScientist
183
+ tag: aisb-v0.0.1
184
+ asset_name: aisb.t3.005_tsae.zip
185
+ sha256: f89d8100092417777d135fded098e3fb26a5f38ccdb300658138273924bf070e
186
+ size_bytes: 322370
187
+ commercial:
188
+ annual_fee: null
189
+ display:
190
+ palette_seed: amber-ink-latent
191
+ art_style: editorial-technical
192
+ accent_priority: high
193
+ image_path: ../image/005_aisb.t3.005_tsae.jpg
@@ -0,0 +1,139 @@
1
+ schema_version: 1
2
+ id: aisb.t3.005_tsae
3
+ name: 时间稀疏自编码器:利用语言的序列特性实现可解释性
4
+ version: 0.1.0
5
+ one_line: 在LLM激活上训练带有对比时间一致性损失的时间稀疏自编码器(T-SAE),然后通过SAEBench风格的自动化可解释性评分来评估特征质量。
6
+ task_description: 本基准测试需要训练时间稀疏自编码器(T-SAE),使用语言模型(Pythia-160m或Gemma-2-2b)相邻token激活上的对比损失,将潜在特征划分为高层级(语义、时间一致)和低层级(句法、token局部)组件。T-SAE架构通过时间对比项扩展了Matryoshka BatchTopK SAE,鼓励高层级特征在序列中的相邻token上保持稳定。主要执行流程为:(1)使用dictionary_learning/dictionary_learning/train_temporal.py从Pile数据集提取的模型激活上训练T-SAE,(2)使用dictionary_learning/dictionary_learning/eval_temporal.py评估重构质量、稀疏性和时间平滑性,(3)通过src/process_sae_bench_autointerp.py处理SAEBench生成的解释JSON文件来计算自动化可解释性评分。下游实验包括语义/上下文/句法内容的探测、t-SNE可视化和HH-RLHF对齐案例研究。预训练的Gemma-2-2b T-SAE检查点(16384特征)和带标签的解释可在HuggingFace上获取,无需重新训练即可评估。自动解释评估需要SAEBench(外部工具)使用评判LLM(论文中使用Llama-3.3-70B-Instruct)生成特征解释。训练数据通过HuggingFace datasets从Pile流式传输;核心流程无需手动下载数据集。
7
+ capability_tags:
8
+ - research_code_optimization
9
+ - mechanistic_interpretability
10
+ - sparse_autoencoders
11
+ - large_language_models
12
+ - evaluation
13
+ - contrastive_learning
14
+ - dictionary_learning
15
+ aisb_direction: T3
16
+ track_fit:
17
+ - paper_track
18
+ - benchmark_track
19
+ task_mode: experiment_driven
20
+ requires_execution: true
21
+ requires_paper: true
22
+ integrity_level: cas_plus_canary
23
+ snapshot_status: runnable
24
+ support_level: advanced
25
+ cost_band: high
26
+ time_band: 1d+
27
+ difficulty: hard
28
+ data_access: public
29
+ primary_outputs:
30
+ - autointerp_score
31
+ - sae_checkpoint
32
+ - interpretability_report
33
+ - probing_accuracy
34
+ - temporal_smoothness_metrics
35
+ launch_profiles:
36
+ - id: quick_check
37
+ label: 快速检查
38
+ description: 在Pythia-160m上运行小规模T-SAE训练,使用减少的步数和简短评估来验证端到端流程。使用NeelNanda/pile-10k进行快速迭代。
39
+ - id: autointerp_eval
40
+ label: 自动解释评估
41
+ description: 在完整Pile数据上训练时间稀疏自编码器,通过SAEBench和评判LLM生成特征解释,并计算自动解释分数。这是论文原始流程,需要外部SAEBench和70B评判模型。
42
+ - id: pretrained_eval
43
+ label: 预训练评估
44
+ description: 从HuggingFace下载预训练的Gemma-2-2b T-SAE和捆绑的解释,然后运行eval_temporal.py和process_sae_bench_autointerp.py,无需重新训练。
45
+ dataset_download:
46
+ primary_method: streaming
47
+ sources:
48
+ - kind: huggingface
49
+ url: https://huggingface.co/datasets/monology/pile-uncopyrighted
50
+ access: public
51
+ note: 主要训练/评估数据;通过HuggingFace datasets流式传输。无需手动下载。
52
+ - kind: huggingface
53
+ url: https://huggingface.co/datasets/NeelNanda/pile-10k
54
+ access: public
55
+ note: 用于快速评估的小规模子集。
56
+ - kind: huggingface
57
+ url: https://huggingface.co/alex-oesterling/temporal-saes
58
+ access: public
59
+ note: 预训练的Gemma-2-2b T-SAE检查点(16384特征)附带标签化的explanations.json。
60
+ notes:
61
+ - 训练数据以流式方式传输;磁盘使用主要由模型权重和SAE检查点占用。
62
+ - Gemma-2-2b权重需要HuggingFace访问协议。
63
+ credential_requirements:
64
+ mode: optional
65
+ items:
66
+ - HuggingFace令牌(用于Gemma-2-2b等门控模型必需;Pythia-160m可选)
67
+ - SAEBench访问权限(用于生成特征解释的外部工具;未捆绑)
68
+ notes:
69
+ - 如使用Gemma-2-2b或自定义HuggingFace路径,请将example.env重命名为.env并添加HF_TOKEN。
70
+ - 自动解释评估需要外部运行SAEBench并使用评判LLM(论文使用Llama-3.3-70B-Instruct)。
71
+ resources:
72
+ minimum:
73
+ cpu_cores: 16
74
+ ram_gb: 64
75
+ disk_gb: 100
76
+ gpu_count: 1
77
+ gpu_vram_gb: 24
78
+ recommended:
79
+ cpu_cores: 32
80
+ ram_gb: 128
81
+ disk_gb: 200
82
+ gpu_count: 1
83
+ gpu_vram_gb: 48
84
+ environment:
85
+ python: '3.11'
86
+ cuda: '12.8'
87
+ pytorch: null
88
+ flash_attn: null
89
+ key_packages:
90
+ - poetry
91
+ - nnsight
92
+ - datasets
93
+ - dictionary_learning (bundled fork)
94
+ notes:
95
+ - Poetry管理的环境;运行'poetry install'进行设置。Torch wheel包从cu128索引拉取。
96
+ - dictionary_learning目录是github.com/saprmarks/dictionary_learning的捆绑fork。
97
+ - 完整的固定依赖集请参见pyproject.toml和poetry.lock。
98
+ risk_flags:
99
+ - external_eval_dependency
100
+ - large_model_weights
101
+ - judge_model_required
102
+ - some_experiments_under_construction
103
+ risk_notes:
104
+ - SAEBench未捆绑;自动解释评估需要单独克隆和运行它,并使用大型评判LLM(论文中使用70B参数Llama-3.3)。
105
+ - Gemma-2-2b权重(约5 GB)必须下载,可能需要HuggingFace访问协议。
106
+ - 完整的自动解释路线需要托管或API访问70B评判模型,这会显著增加成本。
107
+ - README将"Sequence Interpretability (Figures 1 and 4)"(序列可解释性,图1和图4)和"Steering"(特征引导)实验标记为建设中。
108
+ - 打包过程中未执行基准测试;指标有代码支持但运行时未验证。
109
+ recommended_when: 当您需要一个结合SAE训练与时间对比学习和自动化可解释性评估的机制可解释性任务时使用此基准测试。非常适合研究LLM表征中语义与句法特征的解纠缠,或在结构化先验下优化SAE训练流程。
110
+ not_recommended_when: 如果您需要轻量级仅CPU基准测试、无法在本地托管LLM检查点(Pythia-160m最小,Gemma-2-2b推荐)或缺乏GPU访问,请勿使用。如果无法运行或访问大型评判模型进行自动解释评估路线,也应避免。
111
+ paper:
112
+ title: 'Temporal Sparse Autoencoders: Leveraging the Sequential Nature of Language
113
+ for Interpretability'
114
+ authors:
115
+ - Usha Bhalla
116
+ - Alex Oesterling
117
+ - Claudio Mayrink Verdun
118
+ - Himabindu Lakkaraju
119
+ - Flavio P. Calmon
120
+ venue: arXiv preprint
121
+ year: 2025
122
+ url: https://arxiv.org/abs/2511.05541
123
+ download:
124
+ url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.005_tsae.zip
125
+ archive_type: zip
126
+ local_dir_name: paper-5-TSAE
127
+ provider: github_release
128
+ repo: ResearAI/DeepScientist
129
+ tag: aisb-v0.0.1
130
+ asset_name: aisb.t3.005_tsae.zip
131
+ sha256: f89d8100092417777d135fded098e3fb26a5f38ccdb300658138273924bf070e
132
+ size_bytes: 322370
133
+ commercial:
134
+ annual_fee: null
135
+ display:
136
+ palette_seed: amber-ink-latent
137
+ art_style: editorial-technical
138
+ accent_priority: high
139
+ image_path: ../image/005_aisb.t3.005_tsae.jpg
@@ -0,0 +1,194 @@
1
+ schema_version: 1
2
+ id: aisb.t3.006_physense
3
+ name: 'PhySense: Sensor Placement Optimization for Accurate Physics Sensing'
4
+ version: 0.1.0
5
+ one_line: 'Two-stage flow-based physics-field reconstruction and sensor placement
6
+ optimization across turbulent-flow, sea-temperature, and car-aerodynamics benchmarks.
7
+
8
+ '
9
+ task_description: 'This benchmark implements PhySense, a synergistic two-stage framework
10
+ for physics sensing. Stage 1 trains a flow-matching generative model (DiT for regular
11
+ grids, Transolver for irregular meshes) with cross-attention to reconstruct dense
12
+ physical fields from sparse sensor observations at arbitrary placements. Stage 2
13
+ optimizes sensor positions via projected gradient descent under spatial constraints,
14
+ using reconstruction feedback to discover informative placements. The agent must
15
+ run training and inference across three bundled scientific domains: (1) Turbulent-Flow
16
+ (pipe simulation on regular grid), (2) Sea-Temperature (global SST reanalysis on
17
+ regular grid with land mask), and (3) Car-Aerodynamics (3D surface pressure on irregular
18
+ mesh). For each domain the snapshot provides both a base-model inference script
19
+ (random placement) and a walk inference script (optimized placement). Primary metrics
20
+ are relative L2 error and MSE loss; secondary output is the optimized sensor layout.
21
+ Data paths in inference scripts point to external locations that must be populated.
22
+ Pretrained checkpoints are expected under per-domain ./checkpoints/ directories.
23
+ No external evaluation service is required; all metrics are computed locally in
24
+ the inference scripts.
25
+
26
+ '
27
+ capability_tags:
28
+ - research_code_optimization
29
+ - physics_ml
30
+ - sensor_placement
31
+ - scientific_ml
32
+ - field_reconstruction
33
+ - flow_matching
34
+ - generative_models
35
+ aisb_direction: T3
36
+ track_fit:
37
+ - paper_track
38
+ - benchmark_track
39
+ task_mode: experiment_driven
40
+ requires_execution: true
41
+ requires_paper: true
42
+ integrity_level: cas_plus_canary
43
+ snapshot_status: runnable
44
+ support_level: advanced
45
+ cost_band: medium
46
+ time_band: 6-24h
47
+ difficulty: hard
48
+ data_access: public
49
+ primary_outputs:
50
+ - relative_l2
51
+ - mse_loss
52
+ - sensor_layout
53
+ launch_profiles:
54
+ - id: quick_check
55
+ label: Quick Check
56
+ description: 'Run a single-domain inference route (e.g. pipe_infer.py or sea_infer.py)
57
+ with a pretrained checkpoint to verify the pipeline produces relative_l2 and mse_loss.
58
+
59
+ '
60
+ - id: full_benchmark
61
+ label: Full Benchmark
62
+ description: 'Train base reconstruction models and run sensor placement optimization
63
+ across all three domains (Turbulent-Flow, Sea-Temperature, Car-Aerodynamics),
64
+ then evaluate both random-placement and optimized-placement reconstruction quality.
65
+
66
+ '
67
+ - id: placement_only
68
+ label: Placement Optimization Only
69
+ description: 'Starting from pretrained base models, run only the Stage 2 sensor
70
+ placement optimization (walk scripts) and compare against random-placement baselines.
71
+
72
+ '
73
+ dataset_download:
74
+ primary_method: mixed
75
+ sources:
76
+ - kind: github
77
+ url: https://github.com/thuml/PhySense
78
+ access: public
79
+ note: 'Source code repository. Data for each benchmark must be obtained separately;
80
+ see per-domain README files for download links.
81
+
82
+ '
83
+ notes:
84
+ - 'Sea-Temperature data is loaded from a hardcoded path (/workspace/mayuezhou/ddim/sea_data_large/)
85
+ in inference scripts. The agent must download the sea temperature .npy files and
86
+ update paths accordingly.
87
+
88
+ '
89
+ - 'Turbulent-Flow data is loaded via datasets/senseiver_dataloader.py; the underlying
90
+ data source must be obtained and placed in the expected location.
91
+
92
+ '
93
+ - 'Car-Aerodynamics uses DDP training scripts; data paths are configured via command-line
94
+ arguments in shell scripts under Car-Aerodynamics/scripts/.
95
+
96
+ '
97
+ - 'Total dataset size across all three domains is estimated at 20-60 GB depending
98
+ on resolution choices; exact sizes are not stated in the README.
99
+
100
+ '
101
+ credential_requirements:
102
+ mode: none
103
+ items: []
104
+ notes: []
105
+ resources:
106
+ minimum:
107
+ cpu_cores: 8
108
+ ram_gb: 32
109
+ disk_gb: 80
110
+ gpu_count: 1
111
+ gpu_vram_gb: 16
112
+ recommended:
113
+ cpu_cores: 16
114
+ ram_gb: 64
115
+ disk_gb: 150
116
+ gpu_count: 1
117
+ gpu_vram_gb: 24
118
+ environment:
119
+ python: '3.10'
120
+ cuda: '11.8'
121
+ pytorch: 2.1.0
122
+ key_packages:
123
+ - dotwiz
124
+ - pyyaml
125
+ - numpy
126
+ - matplotlib
127
+ notes:
128
+ - See requirements.txt for the full dependency set.
129
+ - 'Inference scripts use torch.cuda.amp.autocast and hardcode GPU device indices
130
+ (e.g. cuda:5, cuda:0). Adjust device IDs to match your hardware.
131
+
132
+ '
133
+ - 'Car-Aerodynamics uses DDP (DistributedDataParallel); multi-GPU may be needed
134
+ for training but single-GPU suffices for inference.
135
+
136
+ '
137
+ risk_flags:
138
+ - hardcoded_paths
139
+ - hardcoded_device_ids
140
+ - dataset_not_bundled
141
+ - checkpoint_not_verified
142
+ risk_notes:
143
+ - 'Inference scripts contain hardcoded absolute data paths (e.g. /workspace/mayuezhou/ddim/sea_data_large/)
144
+ and hardcoded CUDA device indices (torch.cuda.set_device(5)). These must be edited
145
+ before running.
146
+
147
+ '
148
+ - 'Pretrained checkpoints (e.g. pipe_best_base_model.pth, sea_best_base_model.pth,
149
+ pipe_50sensor_opt.pth) are expected under per-domain ./checkpoints/ directories.
150
+ Availability depends on the snapshot packaging; if missing, training must be run
151
+ first.
152
+
153
+ '
154
+ - 'No benchmark execution was performed during the packaging pass; metric values have
155
+ not been verified at runtime.
156
+
157
+ '
158
+ - 'The walk inference scripts (sensor placement optimization evaluation) require optimized
159
+ checkpoints that are produced only after Stage 2 training.
160
+
161
+ '
162
+ recommended_when: 'Use this benchmark when you want a scientific-ML task that combines
163
+ physics-field reconstruction with constrained sensor placement optimization, testing
164
+ generative modeling (flow matching) across heterogeneous physical domains with both
165
+ regular and irregular geometries.
166
+
167
+ '
168
+ not_recommended_when: 'Do not use this if you need a lightweight benchmark with minimal
169
+ storage, no iterative optimization loop, or no GPU requirement. Also not suitable
170
+ if you cannot modify hardcoded paths and device indices in the source scripts.
171
+
172
+ '
173
+ paper:
174
+ title: 'PhySense: Sensor Placement Optimization for Accurate Physics Sensing'
175
+ venue: NeurIPS 2025 Oral
176
+ year: 2025
177
+ url: https://arxiv.org/abs/2505.18190
178
+ download:
179
+ url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.006_physense.zip
180
+ archive_type: zip
181
+ local_dir_name: paper-6-PhySense
182
+ provider: github_release
183
+ repo: ResearAI/DeepScientist
184
+ tag: aisb-v0.0.1
185
+ asset_name: aisb.t3.006_physense.zip
186
+ sha256: b35419c897e1c56bad7037fc90249da8589f432ba58831550a257b99d19e8b6c
187
+ size_bytes: 94438
188
+ commercial:
189
+ annual_fee: null
190
+ display:
191
+ palette_seed: slate-cyan-fluid
192
+ art_style: scientific-visualization
193
+ accent_priority: high
194
+ image_path: ../image/006_aisb.t3.006_physense.jpg
@@ -0,0 +1,118 @@
1
+ schema_version: 1
2
+ id: aisb.t3.006_physense
3
+ name: 'PhySense:用于精确物理感知的传感器布局优化'
4
+ version: 0.1.0
5
+ one_line: '基于双阶段流匹配方法的物理场重建与传感器布局优化,涵盖湍流、海温及汽车空气动力学基准。'
6
+ task_description: '本基准实现了PhySense,一个协同式双阶段物理感知框架。第一阶段训练基于流匹配的条件生成模型(规则网格使用DiT,不规则网格使用Transolver),通过交叉注意力机制从稀疏传感器观测中重建稠密物理场,传感器可放置在任意位置。第二阶段在空间约束下通过投影梯度下降优化传感器位置,利用重建反馈发现信息量最大的放置方案。智能体需在三个捆绑的科学领域运行训练和推理:(1)湍流(规则网格管道模拟),(2)海温(带陆面掩码的规则网格全球海表温度再分析),(3)汽车空气动力学(不规则网格上的3D表面压力)。每个领域提供了基础模型推理脚本(随机放置)和walk推理脚本(优化放置)。主要指标为相对L2误差和MSE损失;次要输出为优化后的传感器布局。推理脚本中的数据路径指向外部位置,需自行填充数据。预训练检查点应存放在各领域的./checkpoints/目录下。无需外部评估服务,所有指标在推理脚本中本地计算。'
7
+ capability_tags:
8
+ - research_code_optimization
9
+ - physics_ml
10
+ - sensor_placement
11
+ - scientific_ml
12
+ - field_reconstruction
13
+ - flow_matching
14
+ - generative_models
15
+ aisb_direction: T3
16
+ track_fit:
17
+ - paper_track
18
+ - benchmark_track
19
+ task_mode: experiment_driven
20
+ requires_execution: true
21
+ requires_paper: true
22
+ integrity_level: cas_plus_canary
23
+ snapshot_status: runnable
24
+ support_level: advanced
25
+ cost_band: medium
26
+ time_band: 6-24h
27
+ difficulty: hard
28
+ data_access: public
29
+ primary_outputs:
30
+ - relative_l2
31
+ - mse_loss
32
+ - sensor_layout
33
+ launch_profiles:
34
+ - id: quick_check
35
+ label: 快速检查
36
+ description: '使用预训练检查点运行单领域推理(如pipe_infer.py或sea_infer.py),验证流水线能否输出relative_l2和mse_loss指标。'
37
+ - id: full_benchmark
38
+ label: 完整基准测试
39
+ description: '在全部三个领域(湍流、海温、汽车空气动力学)上训练基础重建模型并运行传感器布局优化,然后评估随机放置和优化放置两种方案的重建质量。'
40
+ - id: placement_only
41
+ label: 仅布局优化
42
+ description: '基于预训练基础模型,仅运行第二阶段传感器布局优化(walk脚本),并与随机放置基线进行对比。'
43
+ dataset_download:
44
+ primary_method: mixed
45
+ sources:
46
+ - kind: github
47
+ url: https://github.com/thuml/PhySense
48
+ access: public
49
+ note: '源代码仓库。各基准数据需单独获取,详见各领域README文件中的下载链接。'
50
+ notes:
51
+ - '海温数据从推理脚本中的硬编码路径(/workspace/mayuezhou/ddim/sea_data_large/)加载。智能体需下载海温.npy文件并相应更新路径。'
52
+ - '湍流数据通过datasets/senseiver_dataloader.py加载;需获取底层数据源并放置到预期位置。'
53
+ - '汽车空气动力学使用DDP训练脚本;数据路径通过Car-Aerodynamics/scripts/下shell脚本的命令行参数配置。'
54
+ - '三个领域的数据集总大小估计为20-60GB,取决于分辨率选择;README中未注明确切大小。'
55
+ credential_requirements:
56
+ mode: none
57
+ items: []
58
+ notes: []
59
+ resources:
60
+ minimum:
61
+ cpu_cores: 8
62
+ ram_gb: 32
63
+ disk_gb: 80
64
+ gpu_count: 1
65
+ gpu_vram_gb: 16
66
+ recommended:
67
+ cpu_cores: 16
68
+ ram_gb: 64
69
+ disk_gb: 150
70
+ gpu_count: 1
71
+ gpu_vram_gb: 24
72
+ environment:
73
+ python: '3.10'
74
+ cuda: '11.8'
75
+ pytorch: 2.1.0
76
+ key_packages:
77
+ - dotwiz
78
+ - pyyaml
79
+ - numpy
80
+ - matplotlib
81
+ notes:
82
+ - 完整依赖列表见requirements.txt。
83
+ - '推理脚本使用torch.cuda.amp.autocast并硬编码GPU设备索引(如cuda:5、cuda:0)。请根据您的硬件调整设备ID。'
84
+ - '汽车空气动力学使用DDP(DistributedDataParallel);训练可能需要多GPU,但推理仅需单GPU即可。'
85
+ risk_flags:
86
+ - hardcoded_paths
87
+ - hardcoded_device_ids
88
+ - dataset_not_bundled
89
+ - checkpoint_not_verified
90
+ risk_notes:
91
+ - '推理脚本包含硬编码的绝对数据路径(如/workspace/mayuezhou/ddim/sea_data_large/)和硬编码的CUDA设备索引(torch.cuda.set_device(5))。运行前必须编辑修改。'
92
+ - '预训练检查点(如pipe_best_base_model.pth、sea_best_base_model.pth、pipe_50sensor_opt.pth)应存放在各领域./checkpoints/目录下。是否可用取决于快照打包情况;如缺失需先运行训练。'
93
+ - '打包过程中未执行基准测试;指标值未经运行时验证。'
94
+ - 'walk推理脚本(传感器布局优化评估)需要优化后的检查点,该检查点仅在第二阶段训练后产生。'
95
+ recommended_when: '当您需要一项结合物理场重建与约束传感器布局优化的科学机器学习任务,且该任务需测试跨异构物理领域的生成式建模(流匹配)能力,涉及规则和不规则几何构型时,请使用此基准。'
96
+ not_recommended_when: '如果需要轻量级基准(存储需求小、无迭代优化循环、无GPU要求),请勿使用。此外,如无法修改源代码脚本中的硬编码路径和设备索引,也不适用。'
97
+ paper:
98
+ title: 'PhySense: Sensor Placement Optimization for Accurate Physics Sensing'
99
+ venue: NeurIPS 2025 Oral
100
+ year: 2025
101
+ url: https://arxiv.org/abs/2505.18190
102
+ download:
103
+ url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.006_physense.zip
104
+ archive_type: zip
105
+ local_dir_name: paper-6-PhySense
106
+ provider: github_release
107
+ repo: ResearAI/DeepScientist
108
+ tag: aisb-v0.0.1
109
+ asset_name: aisb.t3.006_physense.zip
110
+ sha256: b35419c897e1c56bad7037fc90249da8589f432ba58831550a257b99d19e8b6c
111
+ size_bytes: 94438
112
+ commercial:
113
+ annual_fee: null
114
+ display:
115
+ palette_seed: slate-cyan-fluid
116
+ art_style: scientific-visualization
117
+ accent_priority: high
118
+ image_path: ../image/006_aisb.t3.006_physense.jpg