@researai/deepscientist 1.5.17 → 1.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (894)
  1. package/AGENTS.md +309 -130
  2. package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
  3. package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
  4. package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
  5. package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
  6. package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
  7. package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
  8. package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
  9. package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
  10. package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
  11. package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
  12. package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
  13. package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
  14. package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
  15. package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
  16. package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
  17. package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
  18. package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
  19. package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
  20. package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
  21. package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
  22. package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
  23. package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
  24. package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
  25. package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
  26. package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
  27. package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
  28. package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
  29. package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
  30. package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
  31. package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
  32. package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
  33. package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
  34. package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
  35. package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
  36. package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
  37. package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
  38. package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
  39. package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
  40. package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
  41. package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
  42. package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
  43. package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
  44. package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
  45. package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
  46. package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
  47. package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
  48. package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
  49. package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
  50. package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
  51. package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
  52. package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
  53. package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
  54. package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
  55. package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
  56. package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
  57. package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
  58. package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
  59. package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
  60. package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
  61. package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
  62. package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
  63. package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
  64. package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
  65. package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
  66. package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
  67. package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
  68. package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
  69. package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
  70. package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
  71. package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
  72. package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
  73. package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
  74. package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
  75. package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
  76. package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
  77. package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
  78. package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
  79. package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
  80. package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
  81. package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
  82. package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
  83. package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
  84. package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
  85. package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
  86. package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
  87. package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
  88. package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
  89. package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
  90. package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
  91. package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
  92. package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
  93. package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
  94. package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
  95. package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
  96. package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
  97. package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
  98. package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
  99. package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
  100. package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
  101. package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
  102. package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
  103. package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
  104. package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
  105. package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
  106. package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
  107. package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
  108. package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
  109. package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
  110. package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
  111. package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
  112. package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
  113. package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
  114. package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
  115. package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
  116. package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
  117. package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
  118. package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
  119. package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
  120. package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
  121. package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
  122. package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
  123. package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
  124. package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
  125. package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
  126. package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
  127. package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
  128. package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
  129. package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
  130. package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
  131. package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
  132. package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
  133. package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
  134. package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
  135. package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
  136. package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
  137. package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
  138. package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
  139. package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
  140. package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
  141. package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
  142. package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
  143. package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
  144. package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
  145. package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
  146. package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
  147. package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
  148. package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
  149. package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
  150. package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
  151. package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
  152. package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
  153. package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
  154. package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
  155. package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
  156. package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
  157. package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
  158. package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
  159. package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
  160. package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
  161. package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
  162. package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
  163. package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
  164. package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
  165. package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
  166. package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
  167. package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
  168. package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
  169. package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
  170. package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
  171. package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
  172. package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
  173. package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
  174. package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
  175. package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
  176. package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
  177. package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
  178. package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
  179. package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
  180. package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
  181. package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
  182. package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
  183. package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
  184. package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
  185. package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
  186. package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
  187. package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
  188. package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
  189. package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
  190. package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
  191. package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
  192. package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
  193. package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
  194. package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
  195. package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
  196. package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
  197. package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
  198. package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
  199. package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
  200. package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
  201. package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
  202. package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
  203. package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
  204. package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
  205. package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
  206. package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
  207. package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
  208. package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
  209. package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
  210. package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
  211. package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
  212. package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
  213. package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
  214. package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
  215. package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
  216. package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
  217. package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
  218. package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
  219. package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
  220. package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
  221. package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
  222. package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
  223. package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
  224. package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
  225. package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
  226. package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
  227. package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
  228. package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
  229. package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
  230. package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
  231. package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
  232. package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
  233. package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
  234. package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
  235. package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
  236. package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
  237. package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
  238. package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
  239. package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
  240. package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
  241. package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
  242. package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
  243. package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
  244. package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
  245. package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
  246. package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
  247. package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
  248. package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
  249. package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
  250. package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
  251. package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
  252. package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
  253. package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
  254. package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
  255. package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
  256. package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
  257. package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
  258. package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
  259. package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
  260. package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
  261. package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
  262. package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
  263. package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
  264. package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
  265. package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
  266. package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
  267. package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
  268. package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
  269. package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
  270. package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
  271. package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
  272. package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
  273. package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
  274. package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
  275. package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
  276. package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
  277. package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
  278. package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
  279. package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
  280. package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
  281. package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
  282. package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
  283. package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
  284. package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
  285. package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
  286. package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
  287. package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
  288. package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
  289. package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
  290. package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
  291. package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
  292. package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
  293. package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
  294. package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
  295. package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
  296. package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
  297. package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
  298. package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
  299. package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
  300. package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
  301. package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
  302. package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
  303. package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
  304. package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
  305. package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
  306. package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
  307. package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
  308. package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
  309. package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
  310. package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
  311. package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
  312. package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
  313. package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
  314. package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
  315. package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
  316. package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
  317. package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
  318. package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
  319. package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
  320. package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
  321. package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
  322. package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
  323. package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
  324. package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
  325. package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
  326. package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
  327. package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
  328. package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
  329. package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
  330. package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
  331. package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
  332. package/AISB/image/aisb.b10.climate_earth.svg +16 -0
  333. package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
  334. package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
  335. package/AISB/image/aisb.b2.agent_systems.svg +16 -0
  336. package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
  337. package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
  338. package/AISB/image/aisb.b5.math_proof.svg +16 -0
  339. package/AISB/image/aisb.b6.research_process.svg +16 -0
  340. package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
  341. package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
  342. package/AISB/image/aisb.b9.material_science.svg +16 -0
  343. package/README.md +132 -11
  344. package/bin/ds.js +376 -49
  345. package/docs/en/00_QUICK_START.md +135 -18
  346. package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
  347. package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
  348. package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
  349. package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
  350. package/docs/en/05_TUI_GUIDE.md +171 -2
  351. package/docs/en/07_MEMORY_AND_MCP.md +38 -2
  352. package/docs/en/09_DOCTOR.md +64 -4
  353. package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
  354. package/docs/en/11_LICENSE_AND_RISK.md +4 -0
  355. package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
  356. package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
  357. package/docs/en/15_CODEX_PROVIDER_SETUP.md +622 -187
  358. package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
  359. package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
  360. package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
  361. package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
  362. package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
  363. package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
  364. package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
  365. package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
  366. package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
  367. package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
  368. package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
  369. package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
  370. package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
  371. package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
  372. package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
  373. package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
  374. package/docs/en/91_DEVELOPMENT.md +29 -0
  375. package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
  376. package/docs/en/README.md +44 -7
  377. package/docs/images/admin/admin-connectors-health-en.png +0 -0
  378. package/docs/images/admin/admin-controllers-en.png +0 -0
  379. package/docs/images/admin/admin-diagnostics-en.png +0 -0
  380. package/docs/images/admin/admin-errors-en.png +0 -0
  381. package/docs/images/admin/admin-issues-en.png +0 -0
  382. package/docs/images/admin/admin-logs-en.png +0 -0
  383. package/docs/images/admin/admin-quest-detail-en.png +0 -0
  384. package/docs/images/admin/admin-quests-en.png +0 -0
  385. package/docs/images/admin/admin-repairs-en.png +0 -0
  386. package/docs/images/admin/admin-runtime-en.png +0 -0
  387. package/docs/images/admin/admin-search-en.png +0 -0
  388. package/docs/images/admin/admin-stats-en.png +0 -0
  389. package/docs/images/admin/admin-summary-en.png +0 -0
  390. package/docs/images/connectors/connector-discord-en.png +0 -0
  391. package/docs/images/connectors/connector-feishu-en.png +0 -0
  392. package/docs/images/connectors/connector-lingzhu-en.png +0 -0
  393. package/docs/images/connectors/connector-qq-en.png +0 -0
  394. package/docs/images/connectors/connector-slack-en.png +0 -0
  395. package/docs/images/connectors/connector-telegram-en.png +0 -0
  396. package/docs/images/connectors/connector-weixin-en.png +0 -0
  397. package/docs/images/connectors/connector-whatsapp-en.png +0 -0
  398. package/docs/images/settings/settings-baselines-en.png +0 -0
  399. package/docs/images/settings/settings-config-en.png +0 -0
  400. package/docs/images/settings/settings-connectors-overview-en.png +0 -0
  401. package/docs/images/settings/settings-deepxiv-en.png +0 -0
  402. package/docs/images/settings/settings-mcp-servers-en.png +0 -0
  403. package/docs/images/settings/settings-plugins-en.png +0 -0
  404. package/docs/images/settings/settings-runners-en.png +0 -0
  405. package/docs/zh/00_QUICK_START.md +92 -17
  406. package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
  407. package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
  408. package/docs/zh/05_TUI_GUIDE.md +171 -2
  409. package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
  410. package/docs/zh/09_DOCTOR.md +39 -4
  411. package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
  412. package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
  413. package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
  414. package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
  415. package/docs/zh/15_CODEX_PROVIDER_SETUP.md +550 -188
  416. package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
  417. package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
  418. package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
  419. package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
  420. package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
  421. package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
  422. package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
  423. package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
  424. package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
  425. package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
  426. package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
  427. package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
  428. package/docs/zh/README.md +29 -7
  429. package/install.sh +122 -16
  430. package/package.json +4 -1
  431. package/pyproject.toml +2 -1
  432. package/src/deepscientist/__init__.py +1 -1
  433. package/src/deepscientist/acp/envelope.py +13 -0
  434. package/src/deepscientist/admin/__init__.py +3 -0
  435. package/src/deepscientist/admin/charts.py +681 -0
  436. package/src/deepscientist/admin/logs.py +119 -0
  437. package/src/deepscientist/admin/repairs.py +217 -0
  438. package/src/deepscientist/admin/service.py +1310 -0
  439. package/src/deepscientist/admin/system_info.py +700 -0
  440. package/src/deepscientist/admin/tasks.py +465 -0
  441. package/src/deepscientist/admin/tool_metrics.py +600 -0
  442. package/src/deepscientist/artifact/guidance.py +8 -4
  443. package/src/deepscientist/artifact/schemas.py +115 -0
  444. package/src/deepscientist/artifact/service.py +4268 -260
  445. package/src/deepscientist/bash_exec/monitor.py +30 -3
  446. package/src/deepscientist/bash_exec/service.py +134 -1
  447. package/src/deepscientist/benchstore/__init__.py +4 -0
  448. package/src/deepscientist/benchstore/prompt_builder.py +224 -0
  449. package/src/deepscientist/benchstore/service.py +1716 -0
  450. package/src/deepscientist/channels/weixin_ilink.py +8 -1
  451. package/src/deepscientist/cli.py +92 -17
  452. package/src/deepscientist/codex_cli_compat.py +2 -2
  453. package/src/deepscientist/config/models.py +82 -11
  454. package/src/deepscientist/config/service.py +927 -91
  455. package/src/deepscientist/connector/weixin_support.py +48 -17
  456. package/src/deepscientist/daemon/api/handlers.py +697 -210
  457. package/src/deepscientist/daemon/api/router.py +76 -1
  458. package/src/deepscientist/daemon/app.py +1054 -51
  459. package/src/deepscientist/diagnostics/runner_failures.py +147 -0
  460. package/src/deepscientist/doctor.py +212 -65
  461. package/src/deepscientist/evidence_packets.py +590 -0
  462. package/src/deepscientist/home.py +52 -4
  463. package/src/deepscientist/kimi_cli_compat.py +50 -0
  464. package/src/deepscientist/latex_runtime.py +2 -2
  465. package/src/deepscientist/mcp/context.py +2 -0
  466. package/src/deepscientist/mcp/schemas.py +114 -0
  467. package/src/deepscientist/mcp/server.py +1566 -126
  468. package/src/deepscientist/memory/service.py +203 -16
  469. package/src/deepscientist/process_control.py +8 -1
  470. package/src/deepscientist/prompts/builder.py +836 -92
  471. package/src/deepscientist/quest/__init__.py +2 -2
  472. package/src/deepscientist/quest/layout.py +12 -1
  473. package/src/deepscientist/quest/node_traces.py +10 -0
  474. package/src/deepscientist/quest/service.py +1430 -139
  475. package/src/deepscientist/quest/stage_views.py +1 -1
  476. package/src/deepscientist/runners/__init__.py +18 -0
  477. package/src/deepscientist/runners/base.py +89 -1
  478. package/src/deepscientist/runners/builtins.py +13 -1
  479. package/src/deepscientist/runners/claude.py +391 -0
  480. package/src/deepscientist/runners/codex.py +421 -21
  481. package/src/deepscientist/runners/codex_telemetry.py +127 -0
  482. package/src/deepscientist/runners/kimi.py +334 -0
  483. package/src/deepscientist/runners/metadata.py +68 -0
  484. package/src/deepscientist/runners/opencode.py +414 -0
  485. package/src/deepscientist/runners/runtime_overrides.py +100 -0
  486. package/src/deepscientist/runners/simple_cli.py +538 -0
  487. package/src/deepscientist/runtime_storage.py +303 -0
  488. package/src/deepscientist/shared.py +61 -16
  489. package/src/deepscientist/skills/installer.py +37 -0
  490. package/src/deepscientist/skills/registry.py +2 -0
  491. package/src/deepscientist/tinytex.py +2 -2
  492. package/src/deepscientist/tui.py +10 -3
  493. package/src/prompts/benchstore/system.md +77 -0
  494. package/src/prompts/connectors/qq.md +33 -2
  495. package/src/prompts/connectors/weixin.md +208 -23
  496. package/src/prompts/contracts/admin_ops.md +74 -0
  497. package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
  498. package/src/prompts/contracts/shared_interaction.md +5 -11
  499. package/src/prompts/start_setup/system.md +422 -0
  500. package/src/prompts/system.md +409 -315
  501. package/src/prompts/system_copilot.md +88 -12
  502. package/src/skills/analysis-campaign/SKILL.md +239 -578
  503. package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
  504. package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
  505. package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
  506. package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
  507. package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
  508. package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
  509. package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
  510. package/src/skills/baseline/SKILL.md +183 -461
  511. package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
  512. package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
  513. package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
  514. package/src/skills/baseline/references/baseline-plan-template.md +37 -76
  515. package/src/skills/baseline/references/boundary-cases.md +86 -0
  516. package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
  517. package/src/skills/baseline/references/comparability-contract.md +7 -12
  518. package/src/skills/baseline/references/operational-guidance.md +56 -0
  519. package/src/skills/baseline/references/route-selection.md +5 -25
  520. package/src/skills/decision/SKILL.md +113 -306
  521. package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
  522. package/src/skills/decision/references/operational-guidance.md +94 -0
  523. package/src/skills/decision/references/research-route-criteria.md +7 -8
  524. package/src/skills/decision/references/strategic-decision-template.md +13 -26
  525. package/src/skills/experiment/SKILL.md +132 -670
  526. package/src/skills/experiment/references/execution-playbook.md +374 -0
  527. package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
  528. package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
  529. package/src/skills/experiment/references/operational-guidance.md +108 -0
  530. package/src/skills/finalize/SKILL.md +62 -0
  531. package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
  532. package/src/skills/finalize/references/resume-packet-template.md +7 -0
  533. package/src/skills/idea/SKILL.md +228 -15
  534. package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
  535. package/src/skills/idea/references/current-board-packet-template.md +61 -0
  536. package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
  537. package/src/skills/idea/references/idea-generation-playbook.md +21 -0
  538. package/src/skills/idea/references/idea-thinking-flow.md +6 -0
  539. package/src/skills/idea/references/literature-survey-template.md +3 -0
  540. package/src/skills/idea/references/objective-contract-template.md +54 -0
  541. package/src/skills/idea/references/outline-seeding-example.md +56 -0
  542. package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
  543. package/src/skills/idea/references/related-work-playbook.md +75 -2
  544. package/src/skills/idea/references/research-history-playbook.md +114 -0
  545. package/src/skills/idea/references/selection-gate.md +58 -6
  546. package/src/skills/intake-audit/SKILL.md +43 -2
  547. package/src/skills/intake-audit/references/state-audit-template.md +10 -0
  548. package/src/skills/nature-data/SKILL.md +128 -0
  549. package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
  550. package/src/skills/nature-data/agents/openai.yaml +4 -0
  551. package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
  552. package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
  553. package/src/skills/nature-data/references/policy-principles.md +103 -0
  554. package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
  555. package/src/skills/nature-data/references/source-basis.md +54 -0
  556. package/src/skills/nature-data/references/statement-patterns.md +153 -0
  557. package/src/skills/nature-figure/SKILL.md +197 -0
  558. package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
  559. package/src/skills/nature-figure/agents/openai.yaml +4 -0
  560. package/src/skills/nature-figure/evals/evals.json +37 -0
  561. package/src/skills/nature-figure/references/api.md +428 -0
  562. package/src/skills/nature-figure/references/backend-selection.md +100 -0
  563. package/src/skills/nature-figure/references/chart-types.md +281 -0
  564. package/src/skills/nature-figure/references/common-patterns.md +349 -0
  565. package/src/skills/nature-figure/references/design-theory.md +436 -0
  566. package/src/skills/nature-figure/references/figure-contract.md +93 -0
  567. package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
  568. package/src/skills/nature-figure/references/qa-contract.md +119 -0
  569. package/src/skills/nature-figure/references/r-template-index.md +66 -0
  570. package/src/skills/nature-figure/references/r-workflow.md +161 -0
  571. package/src/skills/nature-figure/references/tutorials.md +250 -0
  572. package/src/skills/nature-paper2ppt/SKILL.md +507 -0
  573. package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
  574. package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
  575. package/src/skills/nature-polishing/SKILL.md +385 -0
  576. package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
  577. package/src/skills/nature-polishing/agents/openai.yaml +4 -0
  578. package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
  579. package/src/skills/nature-polishing/references/section-moves.md +240 -0
  580. package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
  581. package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
  582. package/src/skills/optimize/SKILL.md +177 -1568
  583. package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
  584. package/src/skills/optimize/references/candidate-board-template.md +13 -0
  585. package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
  586. package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
  587. package/src/skills/optimize/references/debug-response-template.md +29 -0
  588. package/src/skills/optimize/references/frontier-review-template.md +32 -0
  589. package/src/skills/optimize/references/fusion-playbook.md +36 -0
  590. package/src/skills/optimize/references/method-brief-template.md +73 -0
  591. package/src/skills/optimize/references/operational-guidance.md +621 -0
  592. package/src/skills/optimize/references/optimization-memory-template.md +30 -0
  593. package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
  594. package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
  595. package/src/skills/optimize/references/prompt-patterns.md +49 -0
  596. package/src/skills/paper-outline/SKILL.md +227 -0
  597. package/src/skills/paper-outline/references/outline-patterns.md +87 -0
  598. package/src/skills/paper-plot/SKILL.md +79 -0
  599. package/src/skills/paper-plot/agents/openai.yaml +4 -0
  600. package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
  601. package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
  602. package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
  603. package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
  604. package/src/skills/paper-plot/references/line_training_curve.md +44 -0
  605. package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
  606. package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
  607. package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
  608. package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
  609. package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
  610. package/src/skills/paper-plot/scripts/line_aime.py +94 -0
  611. package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
  612. package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
  613. package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
  614. package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
  615. package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
  616. package/src/skills/rebuttal/SKILL.md +9 -0
  617. package/src/skills/references/tool-usage-by-stage.md +438 -0
  618. package/src/skills/review/SKILL.md +105 -7
  619. package/src/skills/science/PROVENANCE.md +44 -0
  620. package/src/skills/science/SKILL.md +137 -0
  621. package/src/skills/science/references/artifact-science-tool.md +110 -0
  622. package/src/skills/science/references/claim-type-discipline.md +56 -0
  623. package/src/skills/science/references/domain-index.md +422 -0
  624. package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
  625. package/src/skills/science/references/package-check-playbook.md +64 -0
  626. package/src/skills/science/references/package-index.min.json +3616 -0
  627. package/src/skills/science/references/packages/abinit.md +80 -0
  628. package/src/skills/science/references/packages/acts.md +73 -0
  629. package/src/skills/science/references/packages/aiida-core.md +80 -0
  630. package/src/skills/science/references/packages/alamode.md +80 -0
  631. package/src/skills/science/references/packages/amuse.md +88 -0
  632. package/src/skills/science/references/packages/anndata.md +88 -0
  633. package/src/skills/science/references/packages/arbor.md +80 -0
  634. package/src/skills/science/references/packages/arc.md +73 -0
  635. package/src/skills/science/references/packages/astropy.md +88 -0
  636. package/src/skills/science/references/packages/astroquery.md +88 -0
  637. package/src/skills/science/references/packages/atomate2.md +80 -0
  638. package/src/skills/science/references/packages/atomsmltr.md +73 -0
  639. package/src/skills/science/references/packages/awkward.md +73 -0
  640. package/src/skills/science/references/packages/batman.md +88 -0
  641. package/src/skills/science/references/packages/biopython.md +88 -0
  642. package/src/skills/science/references/packages/bloqade.md +73 -0
  643. package/src/skills/science/references/packages/brian2.md +73 -0
  644. package/src/skills/science/references/packages/bullet3.md +73 -0
  645. package/src/skills/science/references/packages/calculix.md +80 -0
  646. package/src/skills/science/references/packages/cantera.md +73 -0
  647. package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
  648. package/src/skills/science/references/packages/ccdproc.md +88 -0
  649. package/src/skills/science/references/packages/celerite2.md +88 -0
  650. package/src/skills/science/references/packages/cellrank.md +73 -0
  651. package/src/skills/science/references/packages/cesm.md +80 -0
  652. package/src/skills/science/references/packages/chemicals.md +73 -0
  653. package/src/skills/science/references/packages/chempy.md +73 -0
  654. package/src/skills/science/references/packages/cirq.md +73 -0
  655. package/src/skills/science/references/packages/coffea.md +73 -0
  656. package/src/skills/science/references/packages/cp2k.md +88 -0
  657. package/src/skills/science/references/packages/custodian.md +80 -0
  658. package/src/skills/science/references/packages/dart.md +73 -0
  659. package/src/skills/science/references/packages/datamol.md +88 -0
  660. package/src/skills/science/references/packages/dd4hep.md +73 -0
  661. package/src/skills/science/references/packages/dealii.md +80 -0
  662. package/src/skills/science/references/packages/deepchem.md +88 -0
  663. package/src/skills/science/references/packages/delphes.md +73 -0
  664. package/src/skills/science/references/packages/devito.md +80 -0
  665. package/src/skills/science/references/packages/dftb.md +88 -0
  666. package/src/skills/science/references/packages/dftd4.md +88 -0
  667. package/src/skills/science/references/packages/dftk-jl.md +80 -0
  668. package/src/skills/science/references/packages/dolfinx.md +80 -0
  669. package/src/skills/science/references/packages/drake.md +73 -0
  670. package/src/skills/science/references/packages/dumux.md +73 -0
  671. package/src/skills/science/references/packages/elk.md +80 -0
  672. package/src/skills/science/references/packages/elmerfem.md +80 -0
  673. package/src/skills/science/references/packages/enzo-e.md +88 -0
  674. package/src/skills/science/references/packages/espresso.md +80 -0
  675. package/src/skills/science/references/packages/exoplanet.md +88 -0
  676. package/src/skills/science/references/packages/fairroot.md +73 -0
  677. package/src/skills/science/references/packages/fbpic.md +80 -0
  678. package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
  679. package/src/skills/science/references/packages/geant4.md +73 -0
  680. package/src/skills/science/references/packages/geosx.md +80 -0
  681. package/src/skills/science/references/packages/gprmax.md +80 -0
  682. package/src/skills/science/references/packages/gromacs.md +80 -0
  683. package/src/skills/science/references/packages/gwaslab.md +73 -0
  684. package/src/skills/science/references/packages/gz-sim.md +73 -0
  685. package/src/skills/science/references/packages/hail.md +88 -0
  686. package/src/skills/science/references/packages/hiphive.md +80 -0
  687. package/src/skills/science/references/packages/hoomd-blue.md +80 -0
  688. package/src/skills/science/references/packages/itensor.md +73 -0
  689. package/src/skills/science/references/packages/itensors-jl.md +73 -0
  690. package/src/skills/science/references/packages/jdftx.md +73 -0
  691. package/src/skills/science/references/packages/jobflow.md +80 -0
  692. package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
  693. package/src/skills/science/references/packages/kite.md +80 -0
  694. package/src/skills/science/references/packages/kratos.md +80 -0
  695. package/src/skills/science/references/packages/kwant.md +73 -0
  696. package/src/skills/science/references/packages/lammps.md +80 -0
  697. package/src/skills/science/references/packages/lightkurve.md +88 -0
  698. package/src/skills/science/references/packages/limix.md +73 -0
  699. package/src/skills/science/references/packages/maxwelllink.md +80 -0
  700. package/src/skills/science/references/packages/mcdc.md +73 -0
  701. package/src/skills/science/references/packages/meep.md +80 -0
  702. package/src/skills/science/references/packages/mfem.md +80 -0
  703. package/src/skills/science/references/packages/mitgcm.md +73 -0
  704. package/src/skills/science/references/packages/modflow6.md +73 -0
  705. package/src/skills/science/references/packages/molecool.md +73 -0
  706. package/src/skills/science/references/packages/mom6.md +73 -0
  707. package/src/skills/science/references/packages/moose.md +80 -0
  708. package/src/skills/science/references/packages/mpas-model.md +73 -0
  709. package/src/skills/science/references/packages/mujoco.md +73 -0
  710. package/src/skills/science/references/packages/mumax3.md +73 -0
  711. package/src/skills/science/references/packages/nekrs.md +80 -0
  712. package/src/skills/science/references/packages/nessi.md +73 -0
  713. package/src/skills/science/references/packages/nest-simulator.md +73 -0
  714. package/src/skills/science/references/packages/netket.md +73 -0
  715. package/src/skills/science/references/packages/neuron.md +73 -0
  716. package/src/skills/science/references/packages/nextflow.md +88 -0
  717. package/src/skills/science/references/packages/nwchem.md +88 -0
  718. package/src/skills/science/references/packages/openbabel.md +88 -0
  719. package/src/skills/science/references/packages/openems.md +80 -0
  720. package/src/skills/science/references/packages/openff-toolkit.md +88 -0
  721. package/src/skills/science/references/packages/openfoam-dev.md +80 -0
  722. package/src/skills/science/references/packages/openmc.md +73 -0
  723. package/src/skills/science/references/packages/openmm.md +80 -0
  724. package/src/skills/science/references/packages/openmoc.md +73 -0
  725. package/src/skills/science/references/packages/openmx.md +80 -0
  726. package/src/skills/science/references/packages/opensees.md +80 -0
  727. package/src/skills/science/references/packages/opensn.md +80 -0
  728. package/src/skills/science/references/packages/opm-simulators.md +73 -0
  729. package/src/skills/science/references/packages/oqupy.md +73 -0
  730. package/src/skills/science/references/packages/packmol.md +80 -0
  731. package/src/skills/science/references/packages/palabos.md +80 -0
  732. package/src/skills/science/references/packages/parflow.md +80 -0
  733. package/src/skills/science/references/packages/pennylane.md +88 -0
  734. package/src/skills/science/references/packages/perceval.md +73 -0
  735. package/src/skills/science/references/packages/phono3py.md +73 -0
  736. package/src/skills/science/references/packages/phonopy.md +73 -0
  737. package/src/skills/science/references/packages/photutils.md +88 -0
  738. package/src/skills/science/references/packages/picongpu.md +80 -0
  739. package/src/skills/science/references/packages/plink-ng.md +88 -0
  740. package/src/skills/science/references/packages/precice.md +73 -0
  741. package/src/skills/science/references/packages/psc.md +80 -0
  742. package/src/skills/science/references/packages/psi4.md +88 -0
  743. package/src/skills/science/references/packages/pybinding.md +73 -0
  744. package/src/skills/science/references/packages/pyfr.md +80 -0
  745. package/src/skills/science/references/packages/pyhf.md +73 -0
  746. package/src/skills/science/references/packages/pyiron_base.md +80 -0
  747. package/src/skills/science/references/packages/pylcp.md +73 -0
  748. package/src/skills/science/references/packages/pylith.md +80 -0
  749. package/src/skills/science/references/packages/pynbody.md +88 -0
  750. package/src/skills/science/references/packages/pysam.md +88 -0
  751. package/src/skills/science/references/packages/pyscf.md +88 -0
  752. package/src/skills/science/references/packages/q-e.md +73 -0
  753. package/src/skills/science/references/packages/qibo.md +73 -0
  754. package/src/skills/science/references/packages/qiskit.md +73 -0
  755. package/src/skills/science/references/packages/quantica-jl.md +73 -0
  756. package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
  757. package/src/skills/science/references/packages/quimb.md +73 -0
  758. package/src/skills/science/references/packages/qulacs.md +73 -0
  759. package/src/skills/science/references/packages/qutip.md +73 -0
  760. package/src/skills/science/references/packages/rdkit.md +88 -0
  761. package/src/skills/science/references/packages/rmg-py.md +73 -0
  762. package/src/skills/science/references/packages/root.md +73 -0
  763. package/src/skills/science/references/packages/scanpy.md +88 -0
  764. package/src/skills/science/references/packages/scikit-allel.md +88 -0
  765. package/src/skills/science/references/packages/scikit-bio.md +88 -0
  766. package/src/skills/science/references/packages/scqubits.md +73 -0
  767. package/src/skills/science/references/packages/scuff-em.md +80 -0
  768. package/src/skills/science/references/packages/scvi-tools.md +73 -0
  769. package/src/skills/science/references/packages/seissol.md +73 -0
  770. package/src/skills/science/references/packages/sfepy.md +80 -0
  771. package/src/skills/science/references/packages/sisl.md +73 -0
  772. package/src/skills/science/references/packages/smilei.md +80 -0
  773. package/src/skills/science/references/packages/snakemake.md +88 -0
  774. package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
  775. package/src/skills/science/references/packages/specutils.md +88 -0
  776. package/src/skills/science/references/packages/spglib.md +80 -0
  777. package/src/skills/science/references/packages/squidpy.md +88 -0
  778. package/src/skills/science/references/packages/starry.md +88 -0
  779. package/src/skills/science/references/packages/strawberryfields.md +73 -0
  780. package/src/skills/science/references/packages/su2.md +80 -0
  781. package/src/skills/science/references/packages/sunny-jl.md +73 -0
  782. package/src/skills/science/references/packages/sw4.md +73 -0
  783. package/src/skills/science/references/packages/swift.md +88 -0
  784. package/src/skills/science/references/packages/tdnegf.md +73 -0
  785. package/src/skills/science/references/packages/tenpy.md +73 -0
  786. package/src/skills/science/references/packages/thermo.md +73 -0
  787. package/src/skills/science/references/packages/tkwant.md +73 -0
  788. package/src/skills/science/references/packages/tvb-root.md +73 -0
  789. package/src/skills/science/references/packages/uproot5.md +73 -0
  790. package/src/skills/science/references/packages/vampire.md +80 -0
  791. package/src/skills/science/references/packages/wannier_tools.md +73 -0
  792. package/src/skills/science/references/packages/warpx.md +80 -0
  793. package/src/skills/science/references/packages/wrf.md +73 -0
  794. package/src/skills/science/references/packages/xtb.md +88 -0
  795. package/src/skills/science/references/packages/yt.md +73 -0
  796. package/src/skills/science/references/science-task-brief-template.md +71 -0
  797. package/src/skills/scout/SKILL.md +83 -425
  798. package/src/skills/scout/references/literature-scout-template.md +5 -24
  799. package/src/skills/scout/references/operational-guidance.md +191 -0
  800. package/src/skills/scout/references/paper-triage-playbook.md +11 -35
  801. package/src/skills/write/SKILL.md +744 -1246
  802. package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
  803. package/src/skills/write/references/oral_package_patterns.md +252 -0
  804. package/src/skills/write/references/oral_writing_principles.md +291 -0
  805. package/src/skills/write/references/section_rewrite_checklist.md +234 -0
  806. package/src/tui/dist/app/AppContainer.js +1314 -27
  807. package/src/tui/dist/components/Composer.js +26 -1
  808. package/src/tui/dist/components/ConfigScreen.js +2 -1
  809. package/src/tui/dist/components/InputPrompt.js +25 -9
  810. package/src/tui/dist/components/MainContent.js +18 -3
  811. package/src/tui/dist/components/QuestScreen.js +3 -2
  812. package/src/tui/dist/components/UtilityScreen.js +37 -0
  813. package/src/tui/dist/hooks/useSafeInput.js +10 -0
  814. package/src/tui/dist/index.js +13 -1
  815. package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
  816. package/src/tui/dist/lib/api.js +89 -1
  817. package/src/tui/package.json +1 -1
  818. package/src/ui/dist/assets/{AnalysisPlugin-BCKAfjba.js → AnalysisPlugin-CA94NGmI.js} +1 -1
  819. package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
  820. package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
  821. package/src/ui/dist/assets/{CodeViewerPlugin-CbaFRrUU.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
  822. package/src/ui/dist/assets/{DocViewerPlugin-DAjLVeQD.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
  823. package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
  824. package/src/ui/dist/assets/{GitDiffViewerPlugin-CQACjoAA.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
  825. package/src/ui/dist/assets/{GitSnapshotViewer-0r4nLPke.js → GitSnapshotViewer-CweA6VON.js} +2 -2
  826. package/src/ui/dist/assets/{ImageViewerPlugin-nBOmI2v_.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
  827. package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
  828. package/src/ui/dist/assets/{LatexPlugin-ZwtV8pIp.js → LatexPlugin-BQjAaA5J.js} +4 -4
  829. package/src/ui/dist/assets/{MarkdownViewerPlugin-DKqVfKyW.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
  830. package/src/ui/dist/assets/{MarketplacePlugin-BwxStZ9D.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
  831. package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
  832. package/src/ui/dist/assets/{NotebookEditor-DB9N_T9q.js → NotebookEditor-WFyd8Ybt.js} +3 -3
  833. package/src/ui/dist/assets/{PdfLoader-eWBONbQP.js → PdfLoader-CLE5u5TS.js} +3 -3
  834. package/src/ui/dist/assets/{PdfMarkdownPlugin-D22YOZL3.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
  835. package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
  836. package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
  837. package/src/ui/dist/assets/{TextViewerPlugin-C5xqeeUH.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
  838. package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
  839. package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
  840. package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
  841. package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
  842. package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
  843. package/src/ui/dist/assets/{code-WlFHE7z_.js → code-DbsmSd3Y.js} +1 -1
  844. package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
  845. package/src/ui/dist/assets/{wrap-text-BC-Hltpd.js → file-jump-queue-DeQBikaw.js} +3 -3
  846. package/src/ui/dist/assets/{file-socket-CfQPKQKj.js → file-socket-DA5XIx88.js} +1 -1
  847. package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
  848. package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
  849. package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
  850. package/src/ui/dist/assets/{index-CwNu1aH4.js → index-BsO46tJA.js} +1 -1
  851. package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
  852. package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
  853. package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
  854. package/src/ui/dist/assets/{project-sync-C9IdzdZW.js → project-sync-DPmWKmKD.js} +1 -1
  855. package/src/ui/dist/assets/{zoom-out-E_gaeAxL.js → zoom-out-DAukFWen.js} +3 -3
  856. package/src/ui/dist/index.html +3 -3
  857. package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
  858. package/src/skills/baseline/references/memory-playbook.md +0 -40
  859. package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
  860. package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
  861. package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
  862. package/src/skills/write/references/paper-section-playbook.md +0 -64
  863. package/src/skills/write/references/reviewer-first-writing.md +0 -64
  864. package/src/skills/write/references/revision-checklist.md +0 -70
  865. package/src/skills/write/references/section-contracts.md +0 -82
  866. package/src/skills/write/references/sentence-level-proofing.md +0 -49
  867. package/src/ui/dist/assets/AiManusChatView-Bv-Z8YpU.js +0 -204
  868. package/src/ui/dist/assets/CliPlugin-BCKcpc35.js +0 -109
  869. package/src/ui/dist/assets/CodeEditorPlugin-DbOfSJ8K.js +0 -2
  870. package/src/ui/dist/assets/GitCommitViewerPlugin-CIUqbUDO.js +0 -1
  871. package/src/ui/dist/assets/LabCopilotPanel-BHxOxF4z.js +0 -14
  872. package/src/ui/dist/assets/LabPlugin-BKoZGs95.js +0 -22
  873. package/src/ui/dist/assets/NotebookEditor-BEQhaQbt.js +0 -81
  874. package/src/ui/dist/assets/PdfViewerPlugin-c-RK9DLM.js +0 -17
  875. package/src/ui/dist/assets/SearchPlugin-CxF9ytAx.js +0 -16
  876. package/src/ui/dist/assets/VNCViewer-BoLGLnHz.js +0 -11
  877. package/src/ui/dist/assets/bot-DREQOxzP.js +0 -6
  878. package/src/ui/dist/assets/chevron-up-C9Qpx4DE.js +0 -6
  879. package/src/ui/dist/assets/file-content-BZMz3RYp.js +0 -1
  880. package/src/ui/dist/assets/file-diff-panel-CQhw0jS2.js +0 -1
  881. package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
  882. package/src/ui/dist/assets/git-commit-horizontal-DxZ8DCZh.js +0 -6
  883. package/src/ui/dist/assets/image-Bgl4VIyx.js +0 -6
  884. package/src/ui/dist/assets/index-BpV6lusQ.css +0 -33
  885. package/src/ui/dist/assets/index-CBNVuWcP.js +0 -2496
  886. package/src/ui/dist/assets/index-DrUnlf6K.js +0 -1
  887. package/src/ui/dist/assets/index-NW-h8VzN.js +0 -1
  888. package/src/ui/dist/assets/pdf-effect-queue-J8OnM0jE.js +0 -6
  889. package/src/ui/dist/assets/popover-CLc0pPP8.js +0 -1
  890. package/src/ui/dist/assets/select-Cs2PmzwL.js +0 -11
  891. package/src/ui/dist/assets/sigma-ClKcHAXm.js +0 -6
  892. package/src/ui/dist/assets/trash-DwpbFr3w.js +0 -11
  893. package/src/ui/dist/assets/useCliAccess-NQ8m0Let.js +0 -1
  894. package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
@@ -0,0 +1,212 @@
1
+ id: aisb.t3.097_wassersteintl
2
+ name: Wasserstein Transfer Learning
3
+ version: 0.1.0
4
+ one_line: Optimize Wasserstein-based transfer estimators for distributional learning
5
+ across source and target populations using Fréchet regression in the Wasserstein
6
+ space.
7
+ task_description: 'This packaged benchmark covers Wasserstein Transfer Learning (WaTL),
8
+ a novel transfer learning framework for regression models whose outputs are probability
9
+ distributions residing in the Wasserstein space. The method leverages knowledge
10
+ from multiple source domains to improve predictions in a target domain by intrinsically
11
+ incorporating the Wasserstein metric. The three-stage algorithm consists of: (1)
12
+ a weighted auxiliary estimator using global Fréchet regression for known informative
13
+ source subsets, (2) bias correction via gradient descent with cross-validated regularization,
14
+ and (3) projection onto the Wasserstein space, enforcing monotonicity via the OSQP solver.
15
+ Evaluation targets RMSPR (Root Mean Squared Prediction Risk) on mortality and physical
16
+ activity datasets, with per-test-point timing as a secondary metric.
17
+
18
+ '
19
+ task_mode: evaluation_driven
20
+ requires_execution: true
21
+ requires_paper: true
22
+ integrity_level: cas_plus_canary
23
+ snapshot_status: runnable
24
+ support_level: turnkey
25
+ time_band: 2-6h
26
+ cost_band: low
27
+ difficulty: medium
28
+ data_access: public
29
+ primary_outputs:
30
+ - rmspr
31
+ - time_ms_per_test_point
32
+ - transfer_learning_report
33
+ launch_profiles:
34
+ - id: simulation
35
+ label: Simulation Route
36
+ description: 'Run the packaged simulation experiment (Section 5 of paper) to validate
37
+ WaTL asymptotic properties. Uses global Fréchet regression with synthetic distributional
38
+ data.
39
+
40
+ '
41
+ command: Rscript Simulation/Simulation.R <M> <n_t> <seed> <setting> <tau>
42
+ arguments:
43
+ - name: M
44
+ description: Grid size for quantile functions
45
+ example: '100'
46
+ - name: n_t
47
+ description: Target sample size
48
+ example: 200-800
49
+ - name: seed
50
+ description: Random seed for reproducibility
51
+ example: '42'
52
+ - name: setting
53
+ description: Data generation setting (1 or 2)
54
+ example: '1'
55
+ - name: tau
56
+ description: Source sample multiplier
57
+ example: 100 or 200
58
+ - id: real_data
59
+ label: Real Data Route
60
+ description: 'Execute the real-world application with mortality or physical activity
61
+ data. Uses local Fréchet regression with OSQP monotonicity projection. Target
62
+ domain analysis with multiple source populations.
63
+
64
+ '
65
+ command: Rscript RealData/RealData.R <seed> <race> <M> <rate> <gender>
66
+ arguments:
67
+ - name: seed
68
+ description: Random seed for reproducibility
69
+ example: '42'
70
+ - name: race
71
+ description: Race index for target population (1=Black, 2=White)
72
+ example: '1'
73
+ - name: M
74
+ description: Grid size for quantile functions
75
+ example: '100'
76
+ - name: rate
77
+ description: Source data sampling rate (0-1)
78
+ example: '1.0'
79
+ - name: gender
80
+ description: Gender for stratification (0=Female, 1=Male)
81
+ example: '0'
82
+ - id: mortality_experiment
83
+ label: Mortality Experiment (RMSPR)
84
+ description: 'Primary end-to-end reproduction path for RMSPR metric using UN World
85
+ Population Prospects 2015 data. Target: Developed countries (45). Sources: Developing
86
+ countries (156). Computes per-test-point timing.
87
+
88
+ '
89
+ command: Rscript mortality_experiment2.R
90
+ notes: 'Uses wpp2015 R package for demographic data. Requires internet for package
91
+ installation. Reproduces Table 1 (Appendix A).
92
+
93
+ '
94
+ dataset_download:
95
+ primary_method: r_package
96
+ sources:
97
+ - name: wpp2015
98
+ description: UN World Population Prospects 2015 mortality data
99
+ package: wpp2015
100
+ - name: NHANES
101
+ description: National Health and Nutrition Examination Survey physical activity
102
+ data
103
+ package: NHANES
104
+ notes:
105
+ - wpp2015 package loads UN demographic data on first use
106
+ - NHANES physical activity intensity data loaded via RealDataFunc.R
107
+ - Both datasets are publicly available (UN World Population Prospects via wpp2015; NHANES via the NHANES R package)
108
+ credential_requirements:
109
+ mode: none
110
+ items: []
111
+ notes:
112
+ - No authentication required for R package data sources
113
+ - Internet connection needed for package installation and data download
114
+ resources:
115
+ minimum:
116
+ cpu_cores: 4
117
+ ram_gb: 8
118
+ disk_gb: 10
119
+ gpu_count: 0
120
+ gpu_vram_gb: 0
121
+ recommended:
122
+ cpu_cores: 8
123
+ ram_gb: 16
124
+ disk_gb: 20
125
+ gpu_count: 0
126
+ gpu_vram_gb: 0
127
+ environment:
128
+ python: null
129
+ cuda: null
130
+ pytorch: null
131
+ flash_attn: null
132
+ key_packages:
133
+ - name: wpp2015
134
+ description: UN World Population Prospects demographic data
135
+ - name: osqp
136
+ description: Quadratic programming solver for monotonicity projection
137
+ - name: Matrix
138
+ description: Sparse and dense matrix operations
139
+ - name: pracma
140
+ description: Practical numerical mathematics
141
+ - name: parallel
142
+ description: Parallel computation support
143
+ - name: NHANES
144
+ description: NHANES data retrieval
145
+ notes:
146
+ - CPU-only execution is sufficient for all routes
147
+ - GPU not required; workload is primarily statistical computation
148
+ - R-centric workflow; no Python or PyTorch dependencies
149
+ - OSQP solver used in Real Data route for quantile function monotonicity constraint
150
+ risk_flags:
151
+ - no_gpu_required
152
+ - cpu_bound
153
+ - r_only
154
+ risk_notes:
155
+ - Benchmark has no GPU requirement; resource costs are minimal
156
+ - Execution time scales with grid size M and sample sizes
157
+ - OSQP solver convergence may vary with data dimensionality
158
+ recommended_when: 'Use this benchmark when you need a statistics-heavy transfer-learning
159
+ task that operates on distributional data in the Wasserstein space. Suitable for
160
+ evaluating methods that predict probability distributions from covariates using
161
+ optimal transport geometry. Ideal when working with mortality curves, physical activity
162
+ distributions, or other distributional response data where source domain knowledge
163
+ can improve target predictions. R-based execution makes it accessible without GPU
164
+ infrastructure.
165
+
166
+ '
167
+ not_recommended_when: 'Do not use this benchmark if you need neural-network-based
168
+ benchmarks, deep learning workflows, or CUDA-heavy training. Not suitable for tasks
169
+ requiring GPU acceleration or PyTorch-based implementations. Avoid if your research
170
+ focuses on scalar/vector responses rather than distributional outputs in non-Euclidean
171
+ spaces.
172
+
173
+ '
174
+ paper:
175
+ title: Wasserstein Transfer Learning
176
+ authors:
177
+ - Kaicheng Zhang (Zhejiang University)
178
+ - Sinian Zhang (University of Minnesota)
179
+ - Doudou Zhou (National University of Singapore)
180
+ - Yidong Zhou (UC Davis)
181
+ venue: arXiv preprint
182
+ year: 2025
183
+ url: https://arxiv.org/abs/2505.17404
184
+ github: https://github.com/h7nian/WaTL
185
+ display:
186
+ palette_seed: teal-stone-wasserstein
187
+ art_style: statistical-transport
188
+ accent_priority: medium
189
+ image_path: ../image/097_aisb.t3.097_wassersteintl.jpg
190
+ capability_tags:
191
+ - transfer_learning
192
+ - wasserstein_geometry
193
+ - distributional_learning
194
+ - statistical_modeling
195
+ - optimal_transport
196
+ - frechet_regression
197
+ - non_euclidean_output
198
+ aisb_direction: T3
199
+ track_fit:
200
+ - paper_track
201
+ - benchmark_track
202
+ commercial:
203
+ annual_fee: null
204
+ download:
205
+ provider: github_release
206
+ repo: ResearAI/DeepScientist
207
+ tag: aisb-v0.0.1
208
+ asset_name: aisb.t3.097_wassersteintl.zip
209
+ url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.097_wassersteintl.zip
210
+ archive_type: zip
211
+ sha256: 7878e684e20e96ca4ea5aa2ea5f33a4772d22a14b5bf6ab275a68664de302887
212
+ size_bytes: 104086
@@ -0,0 +1,169 @@
1
+ id: aisb.t3.097_wassersteintl
2
+ name: Wasserstein 迁移学习
3
+ version: 0.1.0
4
+ one_line: 使用 Wasserstein 空间中的 Fréchet 回归优化基于 Wasserstein 的迁移估计器,以实现源群体和目标群体之间的分布数据学习。
5
+ task_description: 该打包基准涵盖 Wasserstein 迁移学习 (WaTL),这是一种用于回归模型的新型迁移学习框架,其输出是位于 Wasserstein 空间中的概率分布。该方法通过内在地结合 Wasserstein 度量,利用来自多个源域的知识来改进目标域中的预测。该三阶段算法包括:(1) 对已知信息源子集使用全局 Fréchet 回归的加权辅助估计器,(2) 通过交叉验证正则化的梯度下降进行偏差校正,以及 (3) 通过 OSQP 求解器投影到 Wasserstein 空间以强制单调性。评估目标是死亡率和身体活动数据集的 RMSPR(均方根预测风险),每个测试点的时间作为次要指标。
6
+ task_mode: evaluation_driven
7
+ requires_execution: true
8
+ requires_paper: true
9
+ integrity_level: cas_plus_canary
10
+ snapshot_status: runnable
11
+ support_level: turnkey
12
+ time_band: 2-6h
13
+ cost_band: low
14
+ difficulty: medium
15
+ data_access: public
16
+ primary_outputs:
17
+ - rmspr
18
+ - time_ms_per_test_point
19
+ - transfer_learning_report
20
+ launch_profiles:
21
+ - id: simulation
22
+ label: 模拟路线
23
+ description: 运行打包的模拟实验(论文第 5 节)以验证 WaTL 渐近属性。将全局 Fréchet 回归与合成分布数据结合使用。
24
+ command: Rscript Simulation/Simulation.R <M> <n_t> <seed> <setting> <tau>
25
+ arguments:
26
+ - name: M
27
+ description: 分位数函数的网格大小
28
+ example: '100'
29
+ - name: n_t
30
+ description: 目标样本量
31
+ example: 200-800
32
+ - name: seed
33
+ description: 用于再现性的随机种子
34
+ example: '42'
35
+ - name: setting
36
+ description: 数据生成设置(1或2)
37
+ example: '1'
38
+ - name: tau
39
+ description: 源样本乘数
40
+ example: 100 or 200
41
+ - id: real_data
42
+ label: 真实数据路线
43
+ description: 使用死亡率或身体活动数据运行真实数据应用。采用带有 OSQP 单调性投影的局部 Fréchet 回归。针对目标域进行分析,并利用多个源群体。
44
+ command: Rscript RealData/RealData.R <seed> <race> <M> <rate> <gender>
45
+ arguments:
46
+ - name: seed
47
+ description: 用于再现性的随机种子
48
+ example: '42'
49
+ - name: race
50
+ description: 目标人群的种族指数(1=黑人,2=白人)
51
+ example: '1'
52
+ - name: M
53
+ description: 分位数函数的网格大小
54
+ example: '100'
55
+ - name: rate
56
+ description: 源数据采样率(0-1)
57
+ example: '1.0'
58
+ - name: gender
59
+ description: 分层性别(0=女性,1=男性)
60
+ example: '0'
61
+ - id: mortality_experiment
62
+ label: 死亡率实验 (RMSPR)
63
+ description: 基于联合国《世界人口展望 2015》数据、针对 RMSPR 指标的主要端到端复现路径。目标域:发达国家(45 个)。源域:发展中国家(156 个)。计算每个测试点的耗时。
64
+ command: Rscript mortality_experiment2.R
65
+ notes: 使用 wpp2015 R 包获取人口统计数据。需要互联网来安装软件包。重现表 1(附录 A)。
66
+ dataset_download:
67
+ primary_method: r_package
68
+ sources:
69
+ - name: wpp2015
70
+ description: UN World Population Prospects 2015 mortality data
71
+ package: wpp2015
72
+ - name: NHANES
73
+ description: National Health and Nutrition Examination Survey physical activity data
74
+ package: NHANES
75
+ notes:
76
+ - wpp2015 软件包首次使用时加载联合国人口统计数据
77
+ - NHANES 身体活动强度数据通过 RealDataFunc.R 加载
78
+ - 这两个数据集均可公开获取(wpp2015 提供联合国《世界人口展望》数据;NHANES 数据通过 NHANES R 包获取)
79
+ credential_requirements:
80
+ mode: none
81
+ items: []
82
+ notes:
83
+ - R包数据源无需身份验证
84
+ - 软件包安装和数据下载需要互联网连接
85
+ resources:
86
+ minimum:
87
+ cpu_cores: 4
88
+ ram_gb: 8
89
+ disk_gb: 10
90
+ gpu_count: 0
91
+ gpu_vram_gb: 0
92
+ recommended:
93
+ cpu_cores: 8
94
+ ram_gb: 16
95
+ disk_gb: 20
96
+ gpu_count: 0
97
+ gpu_vram_gb: 0
98
+ environment:
99
+ python: null
100
+ cuda: null
101
+ pytorch: null
102
+ flash_attn: null
103
+ key_packages:
104
+ - name: wpp2015
105
+ description: UN World Population Prospects demographic data
106
+ - name: osqp
107
+ description: Quadratic programming solver for monotonicity projection
108
+ - name: Matrix
109
+ description: Sparse and dense matrix operations
110
+ - name: pracma
111
+ description: Practical numerical mathematics
112
+ - name: parallel
113
+ description: Parallel computation support
114
+ - name: NHANES
115
+ description: NHANES data retrieval
116
+ notes:
117
+ - 仅 CPU 执行即可满足所有路线的需要
118
+ - 不需要 GPU;工作量主要是统计计算
119
+ - 以 R 为中心的工作流程;没有 Python 或 PyTorch 依赖项
120
+ - OSQP 求解器在真实数据路径中用于分位数函数单调性约束
121
+ risk_flags:
122
+ - no_gpu_required
123
+ - cpu_bound
124
+ - r_only
125
+ risk_notes:
126
+ - Benchmark 没有 GPU 要求;资源成本极低
127
+ - 执行时间与网格大小 M 和样本大小相关
128
+ - OSQP 求解器收敛可能随数据维度而变化
129
+ recommended_when: 当您需要一个以统计计算为主、在 Wasserstein 空间中处理分布数据的迁移学习任务时,请使用此基准。适用于评估利用最优传输几何从协变量预测概率分布的方法。非常适合处理死亡率曲线、身体活动分布或其他分布型响应数据,其中源域知识可以改进目标预测。基于 R 的执行方式使其无需 GPU 基础设施即可使用。
130
+ not_recommended_when: 如果您需要基于神经网络的基准测试、深度学习工作流程或 CUDA 密集型训练,请勿使用此基准测试。不适合需要 GPU 加速或基于 PyTorch 的实现的任务。如果您的研究重点是标量/向量响应而不是非欧几里得空间中的分布输出,请避免使用。
131
+ paper:
132
+ title: Wasserstein Transfer Learning
133
+ authors:
134
+ - Kaicheng Zhang (Zhejiang University)
135
+ - Sinian Zhang (University of Minnesota)
136
+ - Doudou Zhou (National University of Singapore)
137
+ - Yidong Zhou (UC Davis)
138
+ venue: arXiv preprint
139
+ year: 2025
140
+ url: https://arxiv.org/abs/2505.17404
141
+ github: https://github.com/h7nian/WaTL
142
+ display:
143
+ palette_seed: teal-stone-wasserstein
144
+ art_style: statistical-transport
145
+ accent_priority: medium
146
+ image_path: ../image/097_aisb.t3.097_wassersteintl.jpg
147
+ capability_tags:
148
+ - transfer_learning
149
+ - wasserstein_geometry
150
+ - distributional_learning
151
+ - statistical_modeling
152
+ - optimal_transport
153
+ - frechet_regression
154
+ - non_euclidean_output
155
+ aisb_direction: T3
156
+ track_fit:
157
+ - paper_track
158
+ - benchmark_track
159
+ commercial:
160
+ annual_fee: null
161
+ download:
162
+ provider: github_release
163
+ repo: ResearAI/DeepScientist
164
+ tag: aisb-v0.0.1
165
+ asset_name: aisb.t3.097_wassersteintl.zip
166
+ url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.097_wassersteintl.zip
167
+ archive_type: zip
168
+ sha256: 7878e684e20e96ca4ea5aa2ea5f33a4772d22a14b5bf6ab275a68664de302887
169
+ size_bytes: 104086
@@ -0,0 +1,171 @@
1
+ id: aisb.t3.098_xmahalanobis
2
+ name: 'X-Mahalanobis: Transformer Feature Mixing for Reliable OOD Detection'
3
+ version: 0.1.0
4
+ one_line: Adaptive transformer layer fusion with Mahalanobis distance scoring for
5
+ state-of-the-art out-of-distribution detection.
6
+ task_description: 'This packaged benchmark covers transformer-based out-of-distribution
7
+ (OOD) detection through an adaptive fusion module that dynamically assigns importance
8
+ weights to representations learned by each Transformer layer. The method detects
9
+ OOD samples using Mahalanobis distance scoring across multiple intermediate layers,
10
+ moving beyond reliance on final-layer features alone. The benchmark supports parameter-efficient
11
+ fine-tuning (PEFT) strategies including AdaptFormer, LoRA, Adapter, Visual Prompt
12
+ Tuning (VPT), bias tuning, and full fine-tuning. Evaluation is conducted on class-balanced
13
+ (CIFAR100) and long-tailed (ImageNet-LT) in-distribution classification tasks against
14
+ nine diverse OOD datasets, reporting AUROC and FPR95 metrics.
15
+
16
+ '
17
+ task_mode: experiment_driven
18
+ requires_execution: true
19
+ requires_paper: true
20
+ integrity_level: cas_plus_canary
21
+ snapshot_status: external_eval_required
22
+ support_level: advanced
23
+ time_band: 6-24h
24
+ cost_band: medium
25
+ difficulty: medium
26
+ data_access: public
27
+ primary_outputs:
28
+ - auroc
29
+ - fpr95
30
+ - ood_detection_checkpoint
31
+ launch_profiles:
32
+ - id: quick_eval
33
+ label: Quick Eval
34
+ description: 'Run OOD detection evaluation on a prepared checkpoint using main_test.py.
35
+ Requires trained model weights and config alignment with training setup. Suitable
36
+ for evaluating baselines or comparing fine-tuned checkpoints.
37
+
38
+ '
39
+ estimated_time: 1-2h
40
+ compute_profile: quick_eval
41
+ - id: train_and_test
42
+ label: Train + Test
43
+ description: 'Full PEFT training workflow on CIFAR100 or ImageNet-LT followed by
44
+ OOD evaluation. Supports AdaptFormer (default), LoRA, Adapter, VPT, bias tuning,
45
+ and full fine-tuning. Trains ViT-B/16 (IN21K pretrained or CLIP pretrained) and
46
+ evaluates against multiple OOD datasets.
47
+
48
+ '
49
+ estimated_time: 6-18h
50
+ compute_profile: full_training
51
+ dataset_download:
52
+ primary_method: bundled
53
+ sources:
54
+ - cifar100: torchvision datasets (auto-download)
55
+ - imagenet_lt: requires manual download from ImageNet, LT split preconfigured in
56
+ configs
57
+ - ood_datasets: preconfigured in evaluation pipeline (e.g., SVHN, LSUN, iNaturalist)
58
+ notes:
59
+ - CIFAR100 downloads automatically via torchvision
60
+ - ImageNet-LT requires manual download from ImageNet official source
61
+ - OOD test datasets (TIN, SVHN, LSUN, etc.) handled by evaluation script
62
+ - Data configs located in configs/data/ (cifar100.yaml, imagenet_lt.yaml, imagenet.yaml)
63
+ credential_requirements:
64
+ mode: none
65
+ items: []
66
+ notes:
67
+ - ImageNet download may require academic registration
68
+ - All other datasets are publicly accessible or auto-downloaded
69
+ resources:
70
+ minimum:
71
+ cpu_cores: 8
72
+ ram_gb: 32
73
+ disk_gb: 80
74
+ gpu_count: 1
75
+ gpu_vram_gb: 16
76
+ notes: Supports single-GPU execution for quick_eval and small-scale training
77
+ recommended:
78
+ cpu_cores: 16
79
+ ram_gb: 64
80
+ disk_gb: 150
81
+ gpu_count: 1
82
+ gpu_vram_gb: 24
83
+ notes: '24GB VRAM recommended for batch_size 64 with full PEFT methods on ImageNet-LT.
84
+ AdaptFormer training at lr 0.1 for 20 epochs on ImageNet-LT with CLIP ViT-B/16
85
+ is the most demanding configuration.
86
+
87
+ '
88
+ environment:
89
+ python: '3.9'
90
+ cuda: '11.8'
91
+ pytorch: '2.0'
92
+ flash_attn: null
93
+ key_packages:
94
+ - torch>=2.0
95
+ - torchvision
96
+ - numpy
97
+ - scikit-learn
98
+ - scipy
99
+ - timm
100
+ - open_clip_torch
101
+ notes:
102
+ - See bundled requirements.txt or README for full dependency set
103
+ - open_clip_torch required for CLIP ViT-B/16 model support
104
+ - timm required for IN21K ViT-B/16 pretrained models
105
+ risk_flags:
106
+ - long_runtime
107
+ - gpu_memory_sensitive
108
+ - config_sensitivity
109
+ risk_notes:
110
+ - Full training on ImageNet-LT with 20 epochs may take 12-18 hours
111
+ - Batch size 64 on 24GB GPU requires AdaptFormer PEFT; full fine-tuning may OOM
112
+ - Config alignment between train and test is critical; mismatched configs produce
113
+ invalid results
114
+ - PEFT method flags (adaptformer, lora, adapter, etc.) must be explicitly set per
115
+ experiment
116
+ - Seed setting via --seed flag available but not enforced; reproducibility requires
117
+ manual seed setting
118
+ recommended_when: 'Use this benchmark when developing transformer-based reliability
119
+ and OOD detection methods. Particularly suited for research on: (1) adaptive layer
120
+ fusion strategies, (2) Mahalanobis-based OOD scoring, (3) parameter-efficient fine-tuning
121
+ for out-of-distribution generalization, (4) comparing shallow vs. deep transformer
122
+ representations, and (5) benchmarking OOD detection under class-imbalanced (long-tailed)
123
+ distributions.
124
+
125
+ '
126
+ not_recommended_when: 'Do not use this benchmark for: (1) text-only reliability tasks
127
+ (OOD detection here is vision-only), (2) non-transformer architectures (pure CNN-based
128
+ methods), (3) tasks requiring OOD detection without fine-tuning (zero-shot OOD evaluation),
129
+ or (4) resource-constrained environments without GPU access.
130
+
131
+ '
132
+ paper:
133
+ title: 'X-Mahalanobis: Transformer Feature Mixing for Reliable OOD Detection'
134
+ venue: NeurIPS 2025
135
+ year: 2025
136
+ url: https://arxiv.org/abs/2505.09128
137
+ notes: 'NeurIPS 2025 publication; benchmark packages official implementation from
138
+ the paper. Experiments demonstrate SOTA OOD detection across nine OOD datasets.
139
+
140
+ '
141
+ download:
142
+ url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.098_xmahalanobis.zip
143
+ archive_type: zip
144
+ local_dir_name: paper-98-XMahalanobis
145
+ notes: 'Bundled archive includes full training/test code, configs, utility modules,
146
+ and pretrained model loading support for CLIP and IN21K ViT variants.
147
+
148
+ '
149
+ provider: github_release
150
+ repo: ResearAI/DeepScientist
151
+ tag: aisb-v0.0.1
152
+ asset_name: aisb.t3.098_xmahalanobis.zip
153
+ sha256: c65b3f81a78754d84bff9a76b8a0c13e180f6b3b6d379801647ed189b1f4741e
154
+ size_bytes: 1420263
155
+ display:
156
+ palette_seed: cobalt-silver-mahalanobis
157
+ art_style: reliability-vision
158
+ accent_priority: high
159
+ image_path: ../image/098_aisb.t3.098_xmahalanobis.jpg
160
+ capability_tags:
161
+ - ood_detection
162
+ - transformers
163
+ - computer_vision
164
+ - reliable_ml
165
+ - parameter_efficient_finetuning
166
+ - layer_fusion
167
+ - mahalanobis_distance
168
+ aisb_direction: T3
169
+ track_fit:
170
+ - paper_track
171
+ - benchmark_track
@@ -0,0 +1,127 @@
1
+ id: aisb.t3.098_xmahalanobis
2
+ name: X-Mahalanobis:用于可靠 OOD 检测的 Transformer 特征混合
3
+ version: 0.1.0
4
+ one_line: 自适应 Transformer 层融合与马哈拉诺比斯距离评分,用于最先进的分布外检测。
5
+ task_description: 该打包基准测试通过自适应融合模块涵盖基于 Transformer 的分布外 (OOD) 检测,该模块动态地将重要性权重分配给每个 Transformer 层学习的表示。该方法使用跨多个中间层的马哈拉诺比斯距离评分来检测 OOD 样本,不再仅仅依赖最终层特征。该基准测试支持参数高效微调 (PEFT) 策略,包括 AdaptFormer、LoRA、Adapter、视觉提示调整 (VPT)、偏差调整和完全微调。针对九个不同的 OOD 数据集对类平衡 (CIFAR100) 和长尾 (ImageNet-LT) 分布内分类任务进行评估,报告 AUROC 和 FPR95 指标。
6
+ task_mode: experiment_driven
7
+ requires_execution: true
8
+ requires_paper: true
9
+ integrity_level: cas_plus_canary
10
+ snapshot_status: external_eval_required
11
+ support_level: advanced
12
+ time_band: 6-24h
13
+ cost_band: medium
14
+ difficulty: medium
15
+ data_access: public
16
+ primary_outputs:
17
+ - auroc
18
+ - fpr95
19
+ - ood_detection_checkpoint
20
+ launch_profiles:
21
+ - id: quick_eval
22
+ label: 快速评估
23
+ description: 使用 main_test.py 在准备好的检查点上运行 OOD 检测评估。需要经过训练的模型权重和配置与训练设置保持一致。适合评估基线或比较微调的检查点。
24
+ estimated_time: 1-2h
25
+ compute_profile: quick_eval
26
+ - id: train_and_test
27
+ label: 训练+测试
28
+ description: CIFAR100 或 ImageNet-LT 上的完整 PEFT 训练工作流程,然后进行 OOD 评估。支持AdaptFormer(默认)、LoRA、Adapter、VPT、偏置调整和全面微调。训练 ViT-B/16(IN21K 预训练或 CLIP 预训练)并针对多个 OOD 数据集进行评估。
29
+ estimated_time: 6-18h
30
+ compute_profile: full_training
31
+ dataset_download:
32
+ primary_method: bundled
33
+ sources:
34
+ - cifar100: torchvision datasets (auto-download)
35
+ - imagenet_lt: requires manual download from ImageNet, LT split preconfigured in configs
36
+ - ood_datasets: preconfigured in evaluation pipeline (e.g., SVHN, LSUN, iNaturalist)
37
+ notes:
38
+ - CIFAR100 通过 torchvision 自动下载
39
+ - ImageNet-LT需要从ImageNet官方源手动下载
40
+ - OOD 测试数据集(TIN、SVHN、LSUN 等)由评估脚本处理
41
+ - 数据配置位于 configs/data/ (cifar100.yaml, imagenet_lt.yaml, imagenet.yaml)
42
+ credential_requirements:
43
+ mode: none
44
+ items: []
45
+ notes:
46
+ - ImageNet 下载可能需要学术注册
47
+ - 所有其他数据集均可公开访问或自动下载
48
+ resources:
49
+ minimum:
50
+ cpu_cores: 8
51
+ ram_gb: 32
52
+ disk_gb: 80
53
+ gpu_count: 1
54
+ gpu_vram_gb: 16
55
+ notes: 支持单 GPU 执行 quick_eval 和小规模训练
56
+ recommended:
57
+ cpu_cores: 16
58
+ ram_gb: 64
59
+ disk_gb: 150
60
+ gpu_count: 1
61
+ gpu_vram_gb: 24
62
+ notes: 建议 batch_size 64 使用 24GB VRAM,在 ImageNet-LT 上使用完整的 PEFT 方法。 AdaptFormer 使用 CLIP ViT-B/16 在 ImageNet-LT 上以 lr 0.1 进行 20 个周期的训练是要求最高的配置。
63
+ environment:
64
+ python: '3.9'
65
+ cuda: '11.8'
66
+ pytorch: '2.0'
67
+ flash_attn: null
68
+ key_packages:
69
+ - torch>=2.0
70
+ - torchvision
71
+ - numpy
72
+ - scikit-learn
73
+ - scipy
74
+ - timm
75
+ - open_clip_torch
76
+ notes:
77
+ - 请参阅捆绑的 requirements.txt 或 README 以获取完整的依赖项集
78
+ - CLIP ViT-B/16 模型支持需要 open_clip_torch
79
+ - IN21K ViT-B/16 预训练模型需要 timm
80
+ risk_flags:
81
+ - long_runtime
82
+ - gpu_memory_sensitive
83
+ - config_sensitivity
84
+ risk_notes:
85
+ - 对 ImageNet-LT 进行 20 个 epoch 的完整训练可能需要 12-18 小时
86
+ - 24GB GPU 上的批量大小 64 需要 AdaptFormer PEFT;完全微调可能会OOM
87
+ - 训练和测试之间的配置对齐至关重要;不匹配的配置会产生无效结果
88
+ - 每个实验必须明确设置 PEFT 方法标志(adaptformer、lora、adapter 等)
89
+ - 通过 --seed 标志设置种子可用,但不强制执行;再现性需要手动播种
90
+ recommended_when: 开发基于 Transformer 的可靠性和 OOD 检测方法时使用此基准。特别适合研究:(1) 自适应层融合策略,(2) 基于 Mahalanobis 的 OOD 评分,(3) 针对分布外泛化的参数高效微调,(4) 比较浅层和深层 Transformer 表示,以及 (5) 在类不平衡(长尾)分布下对 OOD 检测进行基准测试。
91
+ not_recommended_when: 请勿将此基准用于:(1) 纯文本可靠性任务(此处的 OOD 检测仅针对视觉)、(2) 非 Transformer 架构(纯基于 CNN 的方法)、(3) 需要无需微调的 OOD 检测的任务(零样本 OOD 评估)或 (4) 无法访问 GPU 的资源受限环境。
92
+ paper:
93
+ title: 'X-Mahalanobis: Transformer Feature Mixing for Reliable OOD Detection'
94
+ venue: NeurIPS 2025
95
+ year: 2025
96
+ url: https://arxiv.org/abs/2505.09128
97
+ notes: NeurIPS 2025 论文;该基准打包了论文的官方实现。实验表明该方法在九个 OOD 数据集上达到 SOTA 的 OOD 检测性能。
98
+ download:
99
+ url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.098_xmahalanobis.zip
100
+ archive_type: zip
101
+ local_dir_name: paper-98-XMahalanobis
102
+ notes: 'Bundled archive includes full training/test code, configs, utility modules, and pretrained model loading support for CLIP and IN21K ViT variants.
103
+
104
+ '
105
+ provider: github_release
106
+ repo: ResearAI/DeepScientist
107
+ tag: aisb-v0.0.1
108
+ asset_name: aisb.t3.098_xmahalanobis.zip
109
+ sha256: c65b3f81a78754d84bff9a76b8a0c13e180f6b3b6d379801647ed189b1f4741e
110
+ size_bytes: 1420263
111
+ display:
112
+ palette_seed: cobalt-silver-mahalanobis
113
+ art_style: reliability-vision
114
+ accent_priority: high
115
+ image_path: ../image/098_aisb.t3.098_xmahalanobis.jpg
116
+ capability_tags:
117
+ - ood_detection
118
+ - transformers
119
+ - computer_vision
120
+ - reliable_ml
121
+ - parameter_efficient_finetuning
122
+ - layer_fusion
123
+ - mahalanobis_distance
124
+ aisb_direction: T3
125
+ track_fit:
126
+ - paper_track
127
+ - benchmark_track