@researai/deepscientist 1.5.16 → 1.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +309 -130
- package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
- package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
- package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
- package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
- package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
- package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
- package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
- package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
- package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
- package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
- package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
- package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
- package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
- package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
- package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
- package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
- package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
- package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
- package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
- package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
- package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
- package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
- package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
- package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
- package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
- package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
- package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
- package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
- package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
- package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
- package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
- package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
- package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
- package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
- package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
- package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
- package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
- package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
- package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
- package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
- package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
- package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
- package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
- package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
- package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
- package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
- package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
- package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
- package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
- package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
- package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
- package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
- package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
- package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
- package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
- package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
- package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
- package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
- package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
- package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
- package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
- package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
- package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
- package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
- package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
- package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
- package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
- package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
- package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
- package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
- package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
- package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
- package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
- package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
- package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
- package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
- package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
- package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
- package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
- package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
- package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
- package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
- package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
- package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
- package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
- package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
- package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
- package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
- package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
- package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
- package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
- package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
- package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
- package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
- package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
- package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
- package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
- package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
- package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
- package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
- package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
- package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
- package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
- package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
- package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
- package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
- package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
- package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
- package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
- package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
- package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
- package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
- package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
- package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
- package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
- package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
- package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
- package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
- package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
- package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
- package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
- package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
- package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
- package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
- package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
- package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
- package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
- package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
- package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
- package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
- package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
- package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
- package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
- package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
- package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
- package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
- package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
- package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
- package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
- package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
- package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
- package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
- package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
- package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
- package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
- package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
- package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
- package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
- package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
- package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
- package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
- package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
- package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
- package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
- package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
- package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
- package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
- package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
- package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
- package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
- package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
- package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
- package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
- package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
- package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
- package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
- package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
- package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
- package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
- package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
- package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
- package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
- package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
- package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
- package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
- package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
- package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
- package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
- package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
- package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
- package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
- package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
- package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
- package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
- package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
- package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
- package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
- package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
- package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
- package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
- package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
- package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
- package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
- package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
- package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
- package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
- package/AISB/image/aisb.b10.climate_earth.svg +16 -0
- package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
- package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
- package/AISB/image/aisb.b2.agent_systems.svg +16 -0
- package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
- package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
- package/AISB/image/aisb.b5.math_proof.svg +16 -0
- package/AISB/image/aisb.b6.research_process.svg +16 -0
- package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
- package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
- package/AISB/image/aisb.b9.material_science.svg +16 -0
- package/README.md +196 -32
- package/bin/ds.js +924 -66
- package/docs/en/00_QUICK_START.md +195 -18
- package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
- package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
- package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
- package/docs/en/05_TUI_GUIDE.md +171 -2
- package/docs/en/07_MEMORY_AND_MCP.md +38 -2
- package/docs/en/09_DOCTOR.md +78 -7
- package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
- package/docs/en/11_LICENSE_AND_RISK.md +4 -0
- package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/en/15_CODEX_PROVIDER_SETUP.md +624 -180
- package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +386 -0
- package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
- package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
- package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
- package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
- package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
- package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
- package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
- package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
- package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
- package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
- package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
- package/docs/en/91_DEVELOPMENT.md +266 -0
- package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
- package/docs/en/README.md +48 -7
- package/docs/images/admin/admin-connectors-health-en.png +0 -0
- package/docs/images/admin/admin-controllers-en.png +0 -0
- package/docs/images/admin/admin-diagnostics-en.png +0 -0
- package/docs/images/admin/admin-errors-en.png +0 -0
- package/docs/images/admin/admin-issues-en.png +0 -0
- package/docs/images/admin/admin-logs-en.png +0 -0
- package/docs/images/admin/admin-quest-detail-en.png +0 -0
- package/docs/images/admin/admin-quests-en.png +0 -0
- package/docs/images/admin/admin-repairs-en.png +0 -0
- package/docs/images/admin/admin-runtime-en.png +0 -0
- package/docs/images/admin/admin-search-en.png +0 -0
- package/docs/images/admin/admin-stats-en.png +0 -0
- package/docs/images/admin/admin-summary-en.png +0 -0
- package/docs/images/connectors/connector-discord-en.png +0 -0
- package/docs/images/connectors/connector-feishu-en.png +0 -0
- package/docs/images/connectors/connector-lingzhu-en.png +0 -0
- package/docs/images/connectors/connector-qq-en.png +0 -0
- package/docs/images/connectors/connector-slack-en.png +0 -0
- package/docs/images/connectors/connector-telegram-en.png +0 -0
- package/docs/images/connectors/connector-weixin-en.png +0 -0
- package/docs/images/connectors/connector-whatsapp-en.png +0 -0
- package/docs/images/settings/settings-baselines-en.png +0 -0
- package/docs/images/settings/settings-config-en.png +0 -0
- package/docs/images/settings/settings-connectors-overview-en.png +0 -0
- package/docs/images/settings/settings-deepxiv-en.png +0 -0
- package/docs/images/settings/settings-mcp-servers-en.png +0 -0
- package/docs/images/settings/settings-plugins-en.png +0 -0
- package/docs/images/settings/settings-runners-en.png +0 -0
- package/docs/zh/00_QUICK_START.md +142 -18
- package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
- package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/zh/05_TUI_GUIDE.md +171 -2
- package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
- package/docs/zh/09_DOCTOR.md +54 -8
- package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
- package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
- package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/zh/15_CODEX_PROVIDER_SETUP.md +552 -181
- package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +384 -0
- package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
- package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
- package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
- package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
- package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
- package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
- package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
- package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
- package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
- package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
- package/docs/zh/README.md +33 -7
- package/install.sh +168 -20
- package/package.json +5 -1
- package/pyproject.toml +2 -1
- package/src/deepscientist/__init__.py +1 -1
- package/src/deepscientist/acp/envelope.py +13 -0
- package/src/deepscientist/admin/__init__.py +3 -0
- package/src/deepscientist/admin/charts.py +681 -0
- package/src/deepscientist/admin/logs.py +119 -0
- package/src/deepscientist/admin/repairs.py +217 -0
- package/src/deepscientist/admin/service.py +1310 -0
- package/src/deepscientist/admin/system_info.py +700 -0
- package/src/deepscientist/admin/tasks.py +465 -0
- package/src/deepscientist/admin/tool_metrics.py +600 -0
- package/src/deepscientist/artifact/guidance.py +8 -4
- package/src/deepscientist/artifact/schemas.py +115 -0
- package/src/deepscientist/artifact/service.py +4268 -260
- package/src/deepscientist/bash_exec/monitor.py +30 -3
- package/src/deepscientist/bash_exec/service.py +134 -1
- package/src/deepscientist/benchstore/__init__.py +4 -0
- package/src/deepscientist/benchstore/prompt_builder.py +224 -0
- package/src/deepscientist/benchstore/service.py +1716 -0
- package/src/deepscientist/bridges/connectors.py +8 -2
- package/src/deepscientist/channels/weixin_ilink.py +8 -1
- package/src/deepscientist/cli.py +92 -17
- package/src/deepscientist/codex_cli_compat.py +187 -74
- package/src/deepscientist/config/models.py +82 -11
- package/src/deepscientist/config/service.py +1077 -93
- package/src/deepscientist/connector/weixin_support.py +48 -17
- package/src/deepscientist/daemon/api/handlers.py +827 -235
- package/src/deepscientist/daemon/api/router.py +81 -1
- package/src/deepscientist/daemon/app.py +1512 -85
- package/src/deepscientist/diagnostics/__init__.py +6 -0
- package/src/deepscientist/diagnostics/runner_failures.py +277 -0
- package/src/deepscientist/doctor.py +407 -56
- package/src/deepscientist/evidence_packets.py +590 -0
- package/src/deepscientist/home.py +52 -4
- package/src/deepscientist/kimi_cli_compat.py +50 -0
- package/src/deepscientist/latex_runtime.py +2 -2
- package/src/deepscientist/mcp/context.py +2 -0
- package/src/deepscientist/mcp/schemas.py +114 -0
- package/src/deepscientist/mcp/server.py +1566 -126
- package/src/deepscientist/memory/service.py +203 -16
- package/src/deepscientist/process_control.py +8 -1
- package/src/deepscientist/prompts/builder.py +850 -88
- package/src/deepscientist/quest/__init__.py +2 -2
- package/src/deepscientist/quest/layout.py +12 -1
- package/src/deepscientist/quest/node_traces.py +10 -0
- package/src/deepscientist/quest/service.py +1852 -161
- package/src/deepscientist/quest/stage_views.py +1 -1
- package/src/deepscientist/runners/__init__.py +18 -0
- package/src/deepscientist/runners/base.py +89 -1
- package/src/deepscientist/runners/builtins.py +13 -1
- package/src/deepscientist/runners/claude.py +391 -0
- package/src/deepscientist/runners/codex.py +480 -35
- package/src/deepscientist/runners/codex_telemetry.py +127 -0
- package/src/deepscientist/runners/kimi.py +334 -0
- package/src/deepscientist/runners/metadata.py +68 -0
- package/src/deepscientist/runners/opencode.py +414 -0
- package/src/deepscientist/runners/runtime_overrides.py +100 -0
- package/src/deepscientist/runners/simple_cli.py +538 -0
- package/src/deepscientist/runtime_storage.py +303 -0
- package/src/deepscientist/shared.py +80 -16
- package/src/deepscientist/skills/installer.py +37 -0
- package/src/deepscientist/skills/registry.py +2 -0
- package/src/deepscientist/tinytex.py +2 -2
- package/src/deepscientist/tui.py +10 -3
- package/src/prompts/benchstore/system.md +77 -0
- package/src/prompts/connectors/qq.md +33 -2
- package/src/prompts/connectors/weixin.md +208 -23
- package/src/prompts/contracts/admin_ops.md +74 -0
- package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
- package/src/prompts/contracts/shared_interaction.md +5 -10
- package/src/prompts/start_setup/system.md +422 -0
- package/src/prompts/system.md +411 -304
- package/src/prompts/system_copilot.md +89 -0
- package/src/skills/analysis-campaign/SKILL.md +239 -578
- package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
- package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
- package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
- package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
- package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
- package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
- package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
- package/src/skills/baseline/SKILL.md +183 -461
- package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
- package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
- package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
- package/src/skills/baseline/references/baseline-plan-template.md +37 -76
- package/src/skills/baseline/references/boundary-cases.md +86 -0
- package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
- package/src/skills/baseline/references/comparability-contract.md +7 -12
- package/src/skills/baseline/references/operational-guidance.md +56 -0
- package/src/skills/baseline/references/route-selection.md +5 -25
- package/src/skills/decision/SKILL.md +113 -306
- package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
- package/src/skills/decision/references/operational-guidance.md +94 -0
- package/src/skills/decision/references/research-route-criteria.md +7 -8
- package/src/skills/decision/references/strategic-decision-template.md +13 -26
- package/src/skills/experiment/SKILL.md +132 -670
- package/src/skills/experiment/references/execution-playbook.md +374 -0
- package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
- package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
- package/src/skills/experiment/references/operational-guidance.md +108 -0
- package/src/skills/finalize/SKILL.md +62 -0
- package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
- package/src/skills/finalize/references/resume-packet-template.md +7 -0
- package/src/skills/idea/SKILL.md +228 -15
- package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
- package/src/skills/idea/references/current-board-packet-template.md +61 -0
- package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
- package/src/skills/idea/references/idea-generation-playbook.md +21 -0
- package/src/skills/idea/references/idea-thinking-flow.md +6 -0
- package/src/skills/idea/references/literature-survey-template.md +3 -0
- package/src/skills/idea/references/objective-contract-template.md +54 -0
- package/src/skills/idea/references/outline-seeding-example.md +56 -0
- package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
- package/src/skills/idea/references/related-work-playbook.md +75 -2
- package/src/skills/idea/references/research-history-playbook.md +114 -0
- package/src/skills/idea/references/selection-gate.md +58 -6
- package/src/skills/intake-audit/SKILL.md +43 -2
- package/src/skills/intake-audit/references/state-audit-template.md +10 -0
- package/src/skills/nature-data/SKILL.md +128 -0
- package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-data/agents/openai.yaml +4 -0
- package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
- package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
- package/src/skills/nature-data/references/policy-principles.md +103 -0
- package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
- package/src/skills/nature-data/references/source-basis.md +54 -0
- package/src/skills/nature-data/references/statement-patterns.md +153 -0
- package/src/skills/nature-figure/SKILL.md +197 -0
- package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-figure/agents/openai.yaml +4 -0
- package/src/skills/nature-figure/evals/evals.json +37 -0
- package/src/skills/nature-figure/references/api.md +428 -0
- package/src/skills/nature-figure/references/backend-selection.md +100 -0
- package/src/skills/nature-figure/references/chart-types.md +281 -0
- package/src/skills/nature-figure/references/common-patterns.md +349 -0
- package/src/skills/nature-figure/references/design-theory.md +436 -0
- package/src/skills/nature-figure/references/figure-contract.md +93 -0
- package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
- package/src/skills/nature-figure/references/qa-contract.md +119 -0
- package/src/skills/nature-figure/references/r-template-index.md +66 -0
- package/src/skills/nature-figure/references/r-workflow.md +161 -0
- package/src/skills/nature-figure/references/tutorials.md +250 -0
- package/src/skills/nature-paper2ppt/SKILL.md +507 -0
- package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/SKILL.md +385 -0
- package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-polishing/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
- package/src/skills/nature-polishing/references/section-moves.md +240 -0
- package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
- package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
- package/src/skills/optimize/SKILL.md +177 -1568
- package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
- package/src/skills/optimize/references/candidate-board-template.md +13 -0
- package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
- package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
- package/src/skills/optimize/references/debug-response-template.md +29 -0
- package/src/skills/optimize/references/frontier-review-template.md +32 -0
- package/src/skills/optimize/references/fusion-playbook.md +36 -0
- package/src/skills/optimize/references/method-brief-template.md +73 -0
- package/src/skills/optimize/references/operational-guidance.md +621 -0
- package/src/skills/optimize/references/optimization-memory-template.md +30 -0
- package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
- package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
- package/src/skills/optimize/references/prompt-patterns.md +49 -0
- package/src/skills/paper-outline/SKILL.md +227 -0
- package/src/skills/paper-outline/references/outline-patterns.md +87 -0
- package/src/skills/paper-plot/SKILL.md +79 -0
- package/src/skills/paper-plot/agents/openai.yaml +4 -0
- package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
- package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
- package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
- package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
- package/src/skills/paper-plot/references/line_training_curve.md +44 -0
- package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
- package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
- package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
- package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
- package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
- package/src/skills/paper-plot/scripts/line_aime.py +94 -0
- package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
- package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
- package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
- package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
- package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
- package/src/skills/rebuttal/SKILL.md +9 -0
- package/src/skills/references/tool-usage-by-stage.md +438 -0
- package/src/skills/review/SKILL.md +105 -7
- package/src/skills/science/PROVENANCE.md +44 -0
- package/src/skills/science/SKILL.md +137 -0
- package/src/skills/science/references/artifact-science-tool.md +110 -0
- package/src/skills/science/references/claim-type-discipline.md +56 -0
- package/src/skills/science/references/domain-index.md +422 -0
- package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
- package/src/skills/science/references/package-check-playbook.md +64 -0
- package/src/skills/science/references/package-index.min.json +3616 -0
- package/src/skills/science/references/packages/abinit.md +80 -0
- package/src/skills/science/references/packages/acts.md +73 -0
- package/src/skills/science/references/packages/aiida-core.md +80 -0
- package/src/skills/science/references/packages/alamode.md +80 -0
- package/src/skills/science/references/packages/amuse.md +88 -0
- package/src/skills/science/references/packages/anndata.md +88 -0
- package/src/skills/science/references/packages/arbor.md +80 -0
- package/src/skills/science/references/packages/arc.md +73 -0
- package/src/skills/science/references/packages/astropy.md +88 -0
- package/src/skills/science/references/packages/astroquery.md +88 -0
- package/src/skills/science/references/packages/atomate2.md +80 -0
- package/src/skills/science/references/packages/atomsmltr.md +73 -0
- package/src/skills/science/references/packages/awkward.md +73 -0
- package/src/skills/science/references/packages/batman.md +88 -0
- package/src/skills/science/references/packages/biopython.md +88 -0
- package/src/skills/science/references/packages/bloqade.md +73 -0
- package/src/skills/science/references/packages/brian2.md +73 -0
- package/src/skills/science/references/packages/bullet3.md +73 -0
- package/src/skills/science/references/packages/calculix.md +80 -0
- package/src/skills/science/references/packages/cantera.md +73 -0
- package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
- package/src/skills/science/references/packages/ccdproc.md +88 -0
- package/src/skills/science/references/packages/celerite2.md +88 -0
- package/src/skills/science/references/packages/cellrank.md +73 -0
- package/src/skills/science/references/packages/cesm.md +80 -0
- package/src/skills/science/references/packages/chemicals.md +73 -0
- package/src/skills/science/references/packages/chempy.md +73 -0
- package/src/skills/science/references/packages/cirq.md +73 -0
- package/src/skills/science/references/packages/coffea.md +73 -0
- package/src/skills/science/references/packages/cp2k.md +88 -0
- package/src/skills/science/references/packages/custodian.md +80 -0
- package/src/skills/science/references/packages/dart.md +73 -0
- package/src/skills/science/references/packages/datamol.md +88 -0
- package/src/skills/science/references/packages/dd4hep.md +73 -0
- package/src/skills/science/references/packages/dealii.md +80 -0
- package/src/skills/science/references/packages/deepchem.md +88 -0
- package/src/skills/science/references/packages/delphes.md +73 -0
- package/src/skills/science/references/packages/devito.md +80 -0
- package/src/skills/science/references/packages/dftb.md +88 -0
- package/src/skills/science/references/packages/dftd4.md +88 -0
- package/src/skills/science/references/packages/dftk-jl.md +80 -0
- package/src/skills/science/references/packages/dolfinx.md +80 -0
- package/src/skills/science/references/packages/drake.md +73 -0
- package/src/skills/science/references/packages/dumux.md +73 -0
- package/src/skills/science/references/packages/elk.md +80 -0
- package/src/skills/science/references/packages/elmerfem.md +80 -0
- package/src/skills/science/references/packages/enzo-e.md +88 -0
- package/src/skills/science/references/packages/espresso.md +80 -0
- package/src/skills/science/references/packages/exoplanet.md +88 -0
- package/src/skills/science/references/packages/fairroot.md +73 -0
- package/src/skills/science/references/packages/fbpic.md +80 -0
- package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
- package/src/skills/science/references/packages/geant4.md +73 -0
- package/src/skills/science/references/packages/geosx.md +80 -0
- package/src/skills/science/references/packages/gprmax.md +80 -0
- package/src/skills/science/references/packages/gromacs.md +80 -0
- package/src/skills/science/references/packages/gwaslab.md +73 -0
- package/src/skills/science/references/packages/gz-sim.md +73 -0
- package/src/skills/science/references/packages/hail.md +88 -0
- package/src/skills/science/references/packages/hiphive.md +80 -0
- package/src/skills/science/references/packages/hoomd-blue.md +80 -0
- package/src/skills/science/references/packages/itensor.md +73 -0
- package/src/skills/science/references/packages/itensors-jl.md +73 -0
- package/src/skills/science/references/packages/jdftx.md +73 -0
- package/src/skills/science/references/packages/jobflow.md +80 -0
- package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
- package/src/skills/science/references/packages/kite.md +80 -0
- package/src/skills/science/references/packages/kratos.md +80 -0
- package/src/skills/science/references/packages/kwant.md +73 -0
- package/src/skills/science/references/packages/lammps.md +80 -0
- package/src/skills/science/references/packages/lightkurve.md +88 -0
- package/src/skills/science/references/packages/limix.md +73 -0
- package/src/skills/science/references/packages/maxwelllink.md +80 -0
- package/src/skills/science/references/packages/mcdc.md +73 -0
- package/src/skills/science/references/packages/meep.md +80 -0
- package/src/skills/science/references/packages/mfem.md +80 -0
- package/src/skills/science/references/packages/mitgcm.md +73 -0
- package/src/skills/science/references/packages/modflow6.md +73 -0
- package/src/skills/science/references/packages/molecool.md +73 -0
- package/src/skills/science/references/packages/mom6.md +73 -0
- package/src/skills/science/references/packages/moose.md +80 -0
- package/src/skills/science/references/packages/mpas-model.md +73 -0
- package/src/skills/science/references/packages/mujoco.md +73 -0
- package/src/skills/science/references/packages/mumax3.md +73 -0
- package/src/skills/science/references/packages/nekrs.md +80 -0
- package/src/skills/science/references/packages/nessi.md +73 -0
- package/src/skills/science/references/packages/nest-simulator.md +73 -0
- package/src/skills/science/references/packages/netket.md +73 -0
- package/src/skills/science/references/packages/neuron.md +73 -0
- package/src/skills/science/references/packages/nextflow.md +88 -0
- package/src/skills/science/references/packages/nwchem.md +88 -0
- package/src/skills/science/references/packages/openbabel.md +88 -0
- package/src/skills/science/references/packages/openems.md +80 -0
- package/src/skills/science/references/packages/openff-toolkit.md +88 -0
- package/src/skills/science/references/packages/openfoam-dev.md +80 -0
- package/src/skills/science/references/packages/openmc.md +73 -0
- package/src/skills/science/references/packages/openmm.md +80 -0
- package/src/skills/science/references/packages/openmoc.md +73 -0
- package/src/skills/science/references/packages/openmx.md +80 -0
- package/src/skills/science/references/packages/opensees.md +80 -0
- package/src/skills/science/references/packages/opensn.md +80 -0
- package/src/skills/science/references/packages/opm-simulators.md +73 -0
- package/src/skills/science/references/packages/oqupy.md +73 -0
- package/src/skills/science/references/packages/packmol.md +80 -0
- package/src/skills/science/references/packages/palabos.md +80 -0
- package/src/skills/science/references/packages/parflow.md +80 -0
- package/src/skills/science/references/packages/pennylane.md +88 -0
- package/src/skills/science/references/packages/perceval.md +73 -0
- package/src/skills/science/references/packages/phono3py.md +73 -0
- package/src/skills/science/references/packages/phonopy.md +73 -0
- package/src/skills/science/references/packages/photutils.md +88 -0
- package/src/skills/science/references/packages/picongpu.md +80 -0
- package/src/skills/science/references/packages/plink-ng.md +88 -0
- package/src/skills/science/references/packages/precice.md +73 -0
- package/src/skills/science/references/packages/psc.md +80 -0
- package/src/skills/science/references/packages/psi4.md +88 -0
- package/src/skills/science/references/packages/pybinding.md +73 -0
- package/src/skills/science/references/packages/pyfr.md +80 -0
- package/src/skills/science/references/packages/pyhf.md +73 -0
- package/src/skills/science/references/packages/pyiron_base.md +80 -0
- package/src/skills/science/references/packages/pylcp.md +73 -0
- package/src/skills/science/references/packages/pylith.md +80 -0
- package/src/skills/science/references/packages/pynbody.md +88 -0
- package/src/skills/science/references/packages/pysam.md +88 -0
- package/src/skills/science/references/packages/pyscf.md +88 -0
- package/src/skills/science/references/packages/q-e.md +73 -0
- package/src/skills/science/references/packages/qibo.md +73 -0
- package/src/skills/science/references/packages/qiskit.md +73 -0
- package/src/skills/science/references/packages/quantica-jl.md +73 -0
- package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
- package/src/skills/science/references/packages/quimb.md +73 -0
- package/src/skills/science/references/packages/qulacs.md +73 -0
- package/src/skills/science/references/packages/qutip.md +73 -0
- package/src/skills/science/references/packages/rdkit.md +88 -0
- package/src/skills/science/references/packages/rmg-py.md +73 -0
- package/src/skills/science/references/packages/root.md +73 -0
- package/src/skills/science/references/packages/scanpy.md +88 -0
- package/src/skills/science/references/packages/scikit-allel.md +88 -0
- package/src/skills/science/references/packages/scikit-bio.md +88 -0
- package/src/skills/science/references/packages/scqubits.md +73 -0
- package/src/skills/science/references/packages/scuff-em.md +80 -0
- package/src/skills/science/references/packages/scvi-tools.md +73 -0
- package/src/skills/science/references/packages/seissol.md +73 -0
- package/src/skills/science/references/packages/sfepy.md +80 -0
- package/src/skills/science/references/packages/sisl.md +73 -0
- package/src/skills/science/references/packages/smilei.md +80 -0
- package/src/skills/science/references/packages/snakemake.md +88 -0
- package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
- package/src/skills/science/references/packages/specutils.md +88 -0
- package/src/skills/science/references/packages/spglib.md +80 -0
- package/src/skills/science/references/packages/squidpy.md +88 -0
- package/src/skills/science/references/packages/starry.md +88 -0
- package/src/skills/science/references/packages/strawberryfields.md +73 -0
- package/src/skills/science/references/packages/su2.md +80 -0
- package/src/skills/science/references/packages/sunny-jl.md +73 -0
- package/src/skills/science/references/packages/sw4.md +73 -0
- package/src/skills/science/references/packages/swift.md +88 -0
- package/src/skills/science/references/packages/tdnegf.md +73 -0
- package/src/skills/science/references/packages/tenpy.md +73 -0
- package/src/skills/science/references/packages/thermo.md +73 -0
- package/src/skills/science/references/packages/tkwant.md +73 -0
- package/src/skills/science/references/packages/tvb-root.md +73 -0
- package/src/skills/science/references/packages/uproot5.md +73 -0
- package/src/skills/science/references/packages/vampire.md +80 -0
- package/src/skills/science/references/packages/wannier_tools.md +73 -0
- package/src/skills/science/references/packages/warpx.md +80 -0
- package/src/skills/science/references/packages/wrf.md +73 -0
- package/src/skills/science/references/packages/xtb.md +88 -0
- package/src/skills/science/references/packages/yt.md +73 -0
- package/src/skills/science/references/science-task-brief-template.md +71 -0
- package/src/skills/scout/SKILL.md +83 -425
- package/src/skills/scout/references/literature-scout-template.md +5 -24
- package/src/skills/scout/references/operational-guidance.md +191 -0
- package/src/skills/scout/references/paper-triage-playbook.md +11 -35
- package/src/skills/write/SKILL.md +744 -1246
- package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
- package/src/skills/write/references/oral_package_patterns.md +252 -0
- package/src/skills/write/references/oral_writing_principles.md +291 -0
- package/src/skills/write/references/section_rewrite_checklist.md +234 -0
- package/src/tui/dist/app/AppContainer.js +1314 -27
- package/src/tui/dist/components/Composer.js +26 -1
- package/src/tui/dist/components/ConfigScreen.js +2 -1
- package/src/tui/dist/components/InputPrompt.js +25 -9
- package/src/tui/dist/components/MainContent.js +18 -3
- package/src/tui/dist/components/QuestScreen.js +3 -2
- package/src/tui/dist/components/UtilityScreen.js +37 -0
- package/src/tui/dist/hooks/useSafeInput.js +10 -0
- package/src/tui/dist/index.js +13 -1
- package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
- package/src/tui/dist/lib/api.js +89 -1
- package/src/tui/package.json +1 -1
- package/src/ui/dist/assets/{AnalysisPlugin-DnSm0GZn.js → AnalysisPlugin-CA94NGmI.js} +1 -1
- package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
- package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
- package/src/ui/dist/assets/{CodeViewerPlugin-itb0tltR.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
- package/src/ui/dist/assets/{DocViewerPlugin-DqKkiCI6.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
- package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
- package/src/ui/dist/assets/{GitDiffViewerPlugin-DxL2ezFG.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
- package/src/ui/dist/assets/{GitSnapshotViewer-B_RQm1YZ.js → GitSnapshotViewer-CweA6VON.js} +2 -2
- package/src/ui/dist/assets/{ImageViewerPlugin-tHqlXY3n.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
- package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
- package/src/ui/dist/assets/{LatexPlugin-B495DTXC.js → LatexPlugin-BQjAaA5J.js} +4 -4
- package/src/ui/dist/assets/{MarkdownViewerPlugin-DG28-61B.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
- package/src/ui/dist/assets/{MarketplacePlugin-BiOGT-Kj.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
- package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
- package/src/ui/dist/assets/{NotebookEditor-CVsj8h_T.js → NotebookEditor-WFyd8Ybt.js} +23 -23
- package/src/ui/dist/assets/{PdfLoader-CASDQmxJ.js → PdfLoader-CLE5u5TS.js} +3 -3
- package/src/ui/dist/assets/{PdfMarkdownPlugin-BFhwoKsY.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
- package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
- package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
- package/src/ui/dist/assets/{TextViewerPlugin-CB4DYfWO.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
- package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
- package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
- package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
- package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
- package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
- package/src/ui/dist/assets/{code-DLC6G24T.js → code-DbsmSd3Y.js} +1 -1
- package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
- package/src/ui/dist/assets/{wrap-text-CwMn-iqb.js → file-jump-queue-DeQBikaw.js} +3 -3
- package/src/ui/dist/assets/{file-socket-Cu4Qln7Y.js → file-socket-DA5XIx88.js} +1 -1
- package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
- package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
- package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
- package/src/ui/dist/assets/{index-wQ7RIIRd.js → index-BsO46tJA.js} +1 -1
- package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
- package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
- package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
- package/src/ui/dist/assets/{project-sync-CsX08Qno.js → project-sync-DPmWKmKD.js} +1 -1
- package/src/ui/dist/assets/{zoom-out-R-GWEhzS.js → zoom-out-DAukFWen.js} +3 -3
- package/src/ui/dist/index.html +3 -3
- package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
- package/src/skills/baseline/references/memory-playbook.md +0 -40
- package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
- package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
- package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
- package/src/skills/write/references/paper-section-playbook.md +0 -64
- package/src/skills/write/references/reviewer-first-writing.md +0 -64
- package/src/skills/write/references/revision-checklist.md +0 -70
- package/src/skills/write/references/section-contracts.md +0 -82
- package/src/skills/write/references/sentence-level-proofing.md +0 -49
- package/src/ui/dist/assets/AiManusChatView-COFACy7V.js +0 -204
- package/src/ui/dist/assets/CliPlugin-CvwCmDQ5.js +0 -109
- package/src/ui/dist/assets/CodeEditorPlugin-cOqSa0xq.js +0 -2
- package/src/ui/dist/assets/GitCommitViewerPlugin-DVgNHBCS.js +0 -1
- package/src/ui/dist/assets/LabCopilotPanel-ClMbq5Yu.js +0 -14
- package/src/ui/dist/assets/LabPlugin-L_SuE8ow.js +0 -22
- package/src/ui/dist/assets/NotebookEditor-C-4Kt1p9.js +0 -81
- package/src/ui/dist/assets/PdfViewerPlugin-DcOzU9vd.js +0 -17
- package/src/ui/dist/assets/SearchPlugin-CHj7M58O.js +0 -16
- package/src/ui/dist/assets/VNCViewer-CjlbyCB3.js +0 -11
- package/src/ui/dist/assets/bot-CFkZY-JP.js +0 -6
- package/src/ui/dist/assets/chevron-up-Dq5ofbht.js +0 -6
- package/src/ui/dist/assets/file-content-Dv4LoZec.js +0 -1
- package/src/ui/dist/assets/file-diff-panel-Denq-lC3.js +0 -1
- package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
- package/src/ui/dist/assets/git-commit-horizontal-BUh6G52n.js +0 -6
- package/src/ui/dist/assets/image-B9HUUddG.js +0 -6
- package/src/ui/dist/assets/index-B2B1sg-M.js +0 -1
- package/src/ui/dist/assets/index-Cgla8biy.css +0 -33
- package/src/ui/dist/assets/index-DRyx7vAc.js +0 -1
- package/src/ui/dist/assets/index-Gbl53BNp.js +0 -2496
- package/src/ui/dist/assets/pdf-effect-queue-ZtnHFCAi.js +0 -6
- package/src/ui/dist/assets/popover-DL6h35vr.js +0 -1
- package/src/ui/dist/assets/select-DvmXt1yY.js +0 -11
- package/src/ui/dist/assets/sigma-7jpXazui.js +0 -6
- package/src/ui/dist/assets/trash-xA7kFt8i.js +0 -11
- package/src/ui/dist/assets/useCliAccess-DsMwDjOp.js +0 -1
- package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
|
@@ -0,0 +1,193 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.005_tsae
|
|
3
|
+
name: 'Temporal Sparse Autoencoders: Leveraging the Sequential Nature of Language
|
|
4
|
+
for Interpretability'
|
|
5
|
+
version: 0.1.0
|
|
6
|
+
one_line: Train temporal sparse autoencoders (T-SAEs) with a contrastive temporal-consistency
|
|
7
|
+
loss on LLM activations, then evaluate feature quality via SAEBench-style automated
|
|
8
|
+
interpretability scoring.
|
|
9
|
+
task_description: 'This benchmark requires training Temporal Sparse Autoencoders (T-SAEs)
|
|
10
|
+
that partition latent features into high-level (semantic, temporally consistent)
|
|
11
|
+
and low-level (syntactic, token-local) components using a contrastive loss over
|
|
12
|
+
adjacent-token activations from language models (Pythia-160m or Gemma-2-2b). The
|
|
13
|
+
T-SAE architecture extends Matryoshka BatchTopK SAEs with a temporal contrastive
|
|
14
|
+
term encouraging high-level features to remain stable across adjacent tokens in
|
|
15
|
+
a sequence. The primary execution route is: (1) train a T-SAE on model activations
|
|
16
|
+
extracted from the Pile dataset using dictionary_learning/dictionary_learning/train_temporal.py,
|
|
17
|
+
(2) evaluate reconstruction quality, sparsity, and temporal smoothness using dictionary_learning/dictionary_learning/eval_temporal.py,
|
|
18
|
+
and (3) compute automated interpretability scores by processing SAEBench-generated
|
|
19
|
+
explanation JSON files via src/process_sae_bench_autointerp.py. Downstream experiments
|
|
20
|
+
include probing for semantic/contextual/syntactic content, t-SNE visualization,
|
|
21
|
+
and an HH-RLHF alignment case study. Pretrained Gemma-2-2b T-SAE checkpoints with
|
|
22
|
+
16384 features and pre-labeled explanations are available on HuggingFace, enabling
|
|
23
|
+
evaluation without retraining. The autointerp evaluation requires SAEBench (external)
|
|
24
|
+
to generate feature explanations using a judge LLM (Llama-3.3-70b-Instruct in the
|
|
25
|
+
paper). Training data streams from the Pile via HuggingFace datasets; no manual
|
|
26
|
+
dataset download is needed for the core route.
|
|
27
|
+
|
|
28
|
+
'
|
|
29
|
+
capability_tags:
|
|
30
|
+
- research_code_optimization
|
|
31
|
+
- mechanistic_interpretability
|
|
32
|
+
- sparse_autoencoders
|
|
33
|
+
- large_language_models
|
|
34
|
+
- evaluation
|
|
35
|
+
- contrastive_learning
|
|
36
|
+
- dictionary_learning
|
|
37
|
+
aisb_direction: T3
|
|
38
|
+
track_fit:
|
|
39
|
+
- paper_track
|
|
40
|
+
- benchmark_track
|
|
41
|
+
task_mode: experiment_driven
|
|
42
|
+
requires_execution: true
|
|
43
|
+
requires_paper: true
|
|
44
|
+
integrity_level: cas_plus_canary
|
|
45
|
+
snapshot_status: runnable
|
|
46
|
+
support_level: advanced
|
|
47
|
+
cost_band: high
|
|
48
|
+
time_band: 1d+
|
|
49
|
+
difficulty: hard
|
|
50
|
+
data_access: public
|
|
51
|
+
primary_outputs:
|
|
52
|
+
- autointerp_score
|
|
53
|
+
- sae_checkpoint
|
|
54
|
+
- interpretability_report
|
|
55
|
+
- probing_accuracy
|
|
56
|
+
- temporal_smoothness_metrics
|
|
57
|
+
launch_profiles:
|
|
58
|
+
- id: quick_check
|
|
59
|
+
label: Quick Check
|
|
60
|
+
description: 'Run a small T-SAE training pass on Pythia-160m with reduced steps
|
|
61
|
+
and a short eval to verify the pipeline end-to-end. Uses NeelNanda/pile-10k for
|
|
62
|
+
fast iteration.
|
|
63
|
+
|
|
64
|
+
'
|
|
65
|
+
- id: autointerp_eval
|
|
66
|
+
label: Autointerp Eval
|
|
67
|
+
description: 'Train temporal sparse autoencoders on full Pile data, generate feature
|
|
68
|
+
explanations via SAEBench with a judge LLM, and compute autointerp scores. This
|
|
69
|
+
is the paper-faithful route requiring external SAEBench and a 70B judge model.
|
|
70
|
+
|
|
71
|
+
'
|
|
72
|
+
- id: pretrained_eval
|
|
73
|
+
label: Pretrained Eval
|
|
74
|
+
description: 'Download the pretrained Gemma-2-2b T-SAE and bundled explanations
|
|
75
|
+
from HuggingFace, then run eval_temporal.py and process_sae_bench_autointerp.py
|
|
76
|
+
without retraining.
|
|
77
|
+
|
|
78
|
+
'
|
|
79
|
+
dataset_download:
|
|
80
|
+
primary_method: streaming
|
|
81
|
+
sources:
|
|
82
|
+
- kind: huggingface
|
|
83
|
+
url: https://huggingface.co/datasets/monology/pile-uncopyrighted
|
|
84
|
+
access: public
|
|
85
|
+
note: Primary training/eval data; streamed via HuggingFace datasets. No manual
|
|
86
|
+
download required.
|
|
87
|
+
- kind: huggingface
|
|
88
|
+
url: https://huggingface.co/datasets/NeelNanda/pile-10k
|
|
89
|
+
access: public
|
|
90
|
+
note: Small subset used for quick evaluation passes.
|
|
91
|
+
- kind: huggingface
|
|
92
|
+
url: https://huggingface.co/alex-oesterling/temporal-saes
|
|
93
|
+
access: public
|
|
94
|
+
note: Pretrained Gemma-2-2b T-SAE checkpoint (16384 features) with labeled explanations.json.
|
|
95
|
+
notes:
|
|
96
|
+
- Training data is streamed; disk usage is dominated by model weights and SAE checkpoints.
|
|
97
|
+
- Gemma-2-2b weights require HuggingFace access agreement.
|
|
98
|
+
credential_requirements:
|
|
99
|
+
mode: optional
|
|
100
|
+
items:
|
|
101
|
+
- HuggingFace token (required for gated models like Gemma-2-2b; optional for Pythia-160m)
|
|
102
|
+
- SAEBench access (external tool for generating feature explanations; not bundled)
|
|
103
|
+
notes:
|
|
104
|
+
- Rename example.env to .env and add HF_TOKEN if using Gemma-2-2b or customizing
|
|
105
|
+
HuggingFace paths.
|
|
106
|
+
- Autointerp evaluation requires running SAEBench externally with a judge LLM (paper
|
|
107
|
+
uses Llama-3.3-70b-Instruct).
|
|
108
|
+
resources:
|
|
109
|
+
minimum:
|
|
110
|
+
cpu_cores: 16
|
|
111
|
+
ram_gb: 64
|
|
112
|
+
disk_gb: 100
|
|
113
|
+
gpu_count: 1
|
|
114
|
+
gpu_vram_gb: 24
|
|
115
|
+
recommended:
|
|
116
|
+
cpu_cores: 32
|
|
117
|
+
ram_gb: 128
|
|
118
|
+
disk_gb: 200
|
|
119
|
+
gpu_count: 1
|
|
120
|
+
gpu_vram_gb: 48
|
|
121
|
+
environment:
|
|
122
|
+
python: '3.11'
|
|
123
|
+
cuda: '12.8'
|
|
124
|
+
pytorch: null
|
|
125
|
+
flash_attn: null
|
|
126
|
+
key_packages:
|
|
127
|
+
- poetry
|
|
128
|
+
- nnsight
|
|
129
|
+
- datasets
|
|
130
|
+
- dictionary_learning (bundled fork)
|
|
131
|
+
notes:
|
|
132
|
+
- Poetry-managed environment; run 'poetry install' to set up. Torch wheels are pulled
|
|
133
|
+
from the cu128 index.
|
|
134
|
+
- The dictionary_learning directory is a bundled fork of github.com/saprmarks/dictionary_learning.
|
|
135
|
+
- See pyproject.toml and poetry.lock for the full pinned dependency set.
|
|
136
|
+
risk_flags:
|
|
137
|
+
- external_eval_dependency
|
|
138
|
+
- large_model_weights
|
|
139
|
+
- judge_model_required
|
|
140
|
+
- some_experiments_under_construction
|
|
141
|
+
risk_notes:
|
|
142
|
+
- SAEBench is not bundled; autointerp evaluation requires cloning and running it separately
|
|
143
|
+
with a large judge LLM (70B parameter Llama-3.3 in the paper).
|
|
144
|
+
- Gemma-2-2b weights (~5 GB) must be downloaded and may require HuggingFace access
|
|
145
|
+
agreement.
|
|
146
|
+
- The full autointerp route requires hosting or API access to a 70B judge model, which
|
|
147
|
+
significantly increases cost.
|
|
148
|
+
- README marks "Sequence Interpretability (Figures 1 and 4)" and "Steering" experiments
|
|
149
|
+
as under construction.
|
|
150
|
+
- No benchmark execution was performed during the packaging pass; metrics are code-backed
|
|
151
|
+
but unverified at runtime.
|
|
152
|
+
recommended_when: 'Use this benchmark when you want a mechanistic-interpretability
|
|
153
|
+
task that combines SAE training with temporal-contrastive learning and automated
|
|
154
|
+
interpretability evaluation. Good fit for research on disentangling semantic vs.
|
|
155
|
+
syntactic features in LLM representations, or for optimizing SAE training pipelines
|
|
156
|
+
under structured priors.
|
|
157
|
+
|
|
158
|
+
'
|
|
159
|
+
not_recommended_when: 'Do not use this if you need a lightweight CPU-only benchmark,
|
|
160
|
+
cannot host LLM checkpoints (Pythia-160m minimum, Gemma-2-2b recommended) locally,
|
|
161
|
+
or lack GPU access. Avoid if you cannot run or access a large judge model for the
|
|
162
|
+
autointerp evaluation route.
|
|
163
|
+
|
|
164
|
+
'
|
|
165
|
+
paper:
|
|
166
|
+
title: 'Temporal Sparse Autoencoders: Leveraging the Sequential Nature of Language
|
|
167
|
+
for Interpretability'
|
|
168
|
+
authors:
|
|
169
|
+
- Usha Bhalla
|
|
170
|
+
- Alex Oesterling
|
|
171
|
+
- Claudio Mayrink Verdun
|
|
172
|
+
- Himabindu Lakkaraju
|
|
173
|
+
- Flavio P. Calmon
|
|
174
|
+
venue: arXiv preprint
|
|
175
|
+
year: 2025
|
|
176
|
+
url: https://arxiv.org/abs/2511.05541
|
|
177
|
+
download:
|
|
178
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.005_tsae.zip
|
|
179
|
+
archive_type: zip
|
|
180
|
+
local_dir_name: paper-5-TSAE
|
|
181
|
+
provider: github_release
|
|
182
|
+
repo: ResearAI/DeepScientist
|
|
183
|
+
tag: aisb-v0.0.1
|
|
184
|
+
asset_name: aisb.t3.005_tsae.zip
|
|
185
|
+
sha256: f89d8100092417777d135fded098e3fb26a5f38ccdb300658138273924bf070e
|
|
186
|
+
size_bytes: 322370
|
|
187
|
+
commercial:
|
|
188
|
+
annual_fee: null
|
|
189
|
+
display:
|
|
190
|
+
palette_seed: amber-ink-latent
|
|
191
|
+
art_style: editorial-technical
|
|
192
|
+
accent_priority: high
|
|
193
|
+
image_path: ../image/005_aisb.t3.005_tsae.jpg
|
|
@@ -0,0 +1,139 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.005_tsae
|
|
3
|
+
name: 时间稀疏自编码器:利用语言的序列特性实现可解释性
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 在LLM激活上训练带有对比时间一致性损失的时间稀疏自编码器(T-SAE),然后通过SAEBench风格的自动化可解释性评分来评估特征质量。
|
|
6
|
+
task_description: 本基准测试需要训练时间稀疏自编码器(T-SAE),使用语言模型(Pythia-160m或Gemma-2-2b)相邻token激活上的对比损失,将潜在特征划分为高层级(语义、时间一致)和低层级(句法、token局部)组件。T-SAE架构通过时间对比项扩展了Matryoshka BatchTopK SAE,鼓励高层级特征在序列中的相邻token上保持稳定。主要执行流程为:(1)使用dictionary_learning/dictionary_learning/train_temporal.py从Pile数据集提取的模型激活上训练T-SAE,(2)使用dictionary_learning/dictionary_learning/eval_temporal.py评估重构质量、稀疏性和时间平滑性,(3)通过src/process_sae_bench_autointerp.py处理SAEBench生成的解释JSON文件来计算自动化可解释性评分。下游实验包括语义/上下文/句法内容的探测、t-SNE可视化和HH-RLHF对齐案例研究。预训练的Gemma-2-2b T-SAE检查点(16384特征)和带标签的解释可在HuggingFace上获取,无需重新训练即可评估。自动解释评估需要SAEBench(外部工具)使用评判LLM(论文中使用Llama-3.3-70B-Instruct)生成特征解释。训练数据通过HuggingFace datasets从Pile流式传输;核心流程无需手动下载数据集。
|
|
7
|
+
capability_tags:
|
|
8
|
+
- research_code_optimization
|
|
9
|
+
- mechanistic_interpretability
|
|
10
|
+
- sparse_autoencoders
|
|
11
|
+
- large_language_models
|
|
12
|
+
- evaluation
|
|
13
|
+
- contrastive_learning
|
|
14
|
+
- dictionary_learning
|
|
15
|
+
aisb_direction: T3
|
|
16
|
+
track_fit:
|
|
17
|
+
- paper_track
|
|
18
|
+
- benchmark_track
|
|
19
|
+
task_mode: experiment_driven
|
|
20
|
+
requires_execution: true
|
|
21
|
+
requires_paper: true
|
|
22
|
+
integrity_level: cas_plus_canary
|
|
23
|
+
snapshot_status: runnable
|
|
24
|
+
support_level: advanced
|
|
25
|
+
cost_band: high
|
|
26
|
+
time_band: 1d+
|
|
27
|
+
difficulty: hard
|
|
28
|
+
data_access: public
|
|
29
|
+
primary_outputs:
|
|
30
|
+
- autointerp_score
|
|
31
|
+
- sae_checkpoint
|
|
32
|
+
- interpretability_report
|
|
33
|
+
- probing_accuracy
|
|
34
|
+
- temporal_smoothness_metrics
|
|
35
|
+
launch_profiles:
|
|
36
|
+
- id: quick_check
|
|
37
|
+
label: 快速检查
|
|
38
|
+
description: 在Pythia-160m上运行小规模T-SAE训练,使用减少的步数和简短评估来验证端到端流程。使用NeelNanda/pile-10k进行快速迭代。
|
|
39
|
+
- id: autointerp_eval
|
|
40
|
+
label: 自动解释评估
|
|
41
|
+
description: 在完整Pile数据上训练时间稀疏自编码器,通过SAEBench和评判LLM生成特征解释,并计算自动解释分数。这是论文原始流程,需要外部SAEBench和70B评判模型。
|
|
42
|
+
- id: pretrained_eval
|
|
43
|
+
label: 预训练评估
|
|
44
|
+
description: 从HuggingFace下载预训练的Gemma-2-2b T-SAE和捆绑的解释,然后运行eval_temporal.py和process_sae_bench_autointerp.py,无需重新训练。
|
|
45
|
+
dataset_download:
|
|
46
|
+
primary_method: streaming
|
|
47
|
+
sources:
|
|
48
|
+
- kind: huggingface
|
|
49
|
+
url: https://huggingface.co/datasets/monology/pile-uncopyrighted
|
|
50
|
+
access: public
|
|
51
|
+
note: 主要训练/评估数据;通过HuggingFace datasets流式传输。无需手动下载。
|
|
52
|
+
- kind: huggingface
|
|
53
|
+
url: https://huggingface.co/datasets/NeelNanda/pile-10k
|
|
54
|
+
access: public
|
|
55
|
+
note: 用于快速评估的小规模子集。
|
|
56
|
+
- kind: huggingface
|
|
57
|
+
url: https://huggingface.co/alex-oesterling/temporal-saes
|
|
58
|
+
access: public
|
|
59
|
+
note: 预训练的Gemma-2-2b T-SAE检查点(16384特征)附带标签化的explanations.json。
|
|
60
|
+
notes:
|
|
61
|
+
- 训练数据以流式方式传输;磁盘使用主要由模型权重和SAE检查点占用。
|
|
62
|
+
- Gemma-2-2b权重需要HuggingFace访问协议。
|
|
63
|
+
credential_requirements:
|
|
64
|
+
mode: optional
|
|
65
|
+
items:
|
|
66
|
+
- HuggingFace令牌(用于Gemma-2-2b等门控模型必需;Pythia-160m可选)
|
|
67
|
+
- SAEBench访问权限(用于生成特征解释的外部工具;未捆绑)
|
|
68
|
+
notes:
|
|
69
|
+
- 如使用Gemma-2-2b或自定义HuggingFace路径,请将example.env重命名为.env并添加HF_TOKEN。
|
|
70
|
+
- 自动解释评估需要外部运行SAEBench并使用评判LLM(论文使用Llama-3.3-70B-Instruct)。
|
|
71
|
+
resources:
|
|
72
|
+
minimum:
|
|
73
|
+
cpu_cores: 16
|
|
74
|
+
ram_gb: 64
|
|
75
|
+
disk_gb: 100
|
|
76
|
+
gpu_count: 1
|
|
77
|
+
gpu_vram_gb: 24
|
|
78
|
+
recommended:
|
|
79
|
+
cpu_cores: 32
|
|
80
|
+
ram_gb: 128
|
|
81
|
+
disk_gb: 200
|
|
82
|
+
gpu_count: 1
|
|
83
|
+
gpu_vram_gb: 48
|
|
84
|
+
environment:
|
|
85
|
+
python: '3.11'
|
|
86
|
+
cuda: '12.8'
|
|
87
|
+
pytorch: null
|
|
88
|
+
flash_attn: null
|
|
89
|
+
key_packages:
|
|
90
|
+
- poetry
|
|
91
|
+
- nnsight
|
|
92
|
+
- datasets
|
|
93
|
+
- dictionary_learning (bundled fork)
|
|
94
|
+
notes:
|
|
95
|
+
- Poetry管理的环境;运行'poetry install'进行设置。Torch wheel包从cu128索引拉取。
|
|
96
|
+
- dictionary_learning目录是github.com/saprmarks/dictionary_learning的捆绑fork。
|
|
97
|
+
- 完整的固定依赖集请参见pyproject.toml和poetry.lock。
|
|
98
|
+
risk_flags:
|
|
99
|
+
- external_eval_dependency
|
|
100
|
+
- large_model_weights
|
|
101
|
+
- judge_model_required
|
|
102
|
+
- some_experiments_under_construction
|
|
103
|
+
risk_notes:
|
|
104
|
+
- SAEBench未捆绑;自动解释评估需要单独克隆和运行它,并使用大型评判LLM(论文中使用70B参数Llama-3.3)。
|
|
105
|
+
- Gemma-2-2b权重(约5 GB)必须下载,可能需要HuggingFace访问协议。
|
|
106
|
+
- 完整的自动解释路线需要托管或API访问70B评判模型,这会显著增加成本。
|
|
107
|
+
- README将"序列可解释性(图1和4)"和"转向"实验标记为建设中。
|
|
108
|
+
- 打包过程中未执行基准测试;指标有代码支持但运行时未验证。
|
|
109
|
+
recommended_when: 当您需要一个结合SAE训练与时间对比学习和自动化可解释性评估的机制可解释性任务时使用此基准测试。非常适合研究LLM表征中语义与句法特征的解纠缠,或在结构化先验下优化SAE训练流程。
|
|
110
|
+
not_recommended_when: 如果您需要轻量级仅CPU基准测试、无法在本地托管LLM检查点(最低Pythia-160m,推荐Gemma-2-2b)或缺乏GPU访问,请勿使用。如果无法运行或访问大型评判模型以完成自动解释评估路线,也应避免。
|
|
111
|
+
paper:
|
|
112
|
+
title: 'Temporal Sparse Autoencoders: Leveraging the Sequential Nature of Language
|
|
113
|
+
for Interpretability'
|
|
114
|
+
authors:
|
|
115
|
+
- Usha Bhalla
|
|
116
|
+
- Alex Oesterling
|
|
117
|
+
- Claudio Mayrink Verdun
|
|
118
|
+
- Himabindu Lakkaraju
|
|
119
|
+
- Flavio P. Calmon
|
|
120
|
+
venue: arXiv preprint
|
|
121
|
+
year: 2025
|
|
122
|
+
url: https://arxiv.org/abs/2511.05541
|
|
123
|
+
download:
|
|
124
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.005_tsae.zip
|
|
125
|
+
archive_type: zip
|
|
126
|
+
local_dir_name: paper-5-TSAE
|
|
127
|
+
provider: github_release
|
|
128
|
+
repo: ResearAI/DeepScientist
|
|
129
|
+
tag: aisb-v0.0.1
|
|
130
|
+
asset_name: aisb.t3.005_tsae.zip
|
|
131
|
+
sha256: f89d8100092417777d135fded098e3fb26a5f38ccdb300658138273924bf070e
|
|
132
|
+
size_bytes: 322370
|
|
133
|
+
commercial:
|
|
134
|
+
annual_fee: null
|
|
135
|
+
display:
|
|
136
|
+
palette_seed: amber-ink-latent
|
|
137
|
+
art_style: editorial-technical
|
|
138
|
+
accent_priority: high
|
|
139
|
+
image_path: ../image/005_aisb.t3.005_tsae.jpg
|
|
@@ -0,0 +1,194 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.006_physense
|
|
3
|
+
name: 'PhySense: Sensor Placement Optimization for Accurate Physics Sensing'
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 'Two-stage flow-based physics-field reconstruction and sensor placement
|
|
6
|
+
optimization across turbulent-flow, sea-temperature, and car-aerodynamics benchmarks.
|
|
7
|
+
|
|
8
|
+
'
|
|
9
|
+
task_description: 'This benchmark implements PhySense, a synergistic two-stage framework
|
|
10
|
+
for physics sensing. Stage 1 trains a flow-matching generative model (DiT for regular
|
|
11
|
+
grids, Transolver for irregular meshes) with cross-attention to reconstruct dense
|
|
12
|
+
physical fields from sparse sensor observations at arbitrary placements. Stage 2
|
|
13
|
+
optimizes sensor positions via projected gradient descent under spatial constraints,
|
|
14
|
+
using reconstruction feedback to discover informative placements. The agent must
|
|
15
|
+
run training and inference across three bundled scientific domains: (1) Turbulent-Flow
|
|
16
|
+
(pipe simulation on regular grid), (2) Sea-Temperature (global SST reanalysis on
|
|
17
|
+
regular grid with land mask), and (3) Car-Aerodynamics (3D surface pressure on irregular
|
|
18
|
+
mesh). For each domain the snapshot provides both a base-model inference script
|
|
19
|
+
(random placement) and a walk inference script (optimized placement). Primary metrics
|
|
20
|
+
are relative L2 error and MSE loss; secondary output is the optimized sensor layout.
|
|
21
|
+
Data paths in inference scripts point to external locations that must be populated.
|
|
22
|
+
Pretrained checkpoints are expected under per-domain ./checkpoints/ directories.
|
|
23
|
+
No external evaluation service is required; all metrics are computed locally in
|
|
24
|
+
the inference scripts.
|
|
25
|
+
|
|
26
|
+
'
|
|
27
|
+
capability_tags:
|
|
28
|
+
- research_code_optimization
|
|
29
|
+
- physics_ml
|
|
30
|
+
- sensor_placement
|
|
31
|
+
- scientific_ml
|
|
32
|
+
- field_reconstruction
|
|
33
|
+
- flow_matching
|
|
34
|
+
- generative_models
|
|
35
|
+
aisb_direction: T3
|
|
36
|
+
track_fit:
|
|
37
|
+
- paper_track
|
|
38
|
+
- benchmark_track
|
|
39
|
+
task_mode: experiment_driven
|
|
40
|
+
requires_execution: true
|
|
41
|
+
requires_paper: true
|
|
42
|
+
integrity_level: cas_plus_canary
|
|
43
|
+
snapshot_status: runnable
|
|
44
|
+
support_level: advanced
|
|
45
|
+
cost_band: medium
|
|
46
|
+
time_band: 6-24h
|
|
47
|
+
difficulty: hard
|
|
48
|
+
data_access: public
|
|
49
|
+
primary_outputs:
|
|
50
|
+
- relative_l2
|
|
51
|
+
- mse_loss
|
|
52
|
+
- sensor_layout
|
|
53
|
+
launch_profiles:
|
|
54
|
+
- id: quick_check
|
|
55
|
+
label: Quick Check
|
|
56
|
+
description: 'Run a single-domain inference route (e.g. pipe_infer.py or sea_infer.py)
|
|
57
|
+
with a pretrained checkpoint to verify the pipeline produces relative_l2 and mse_loss.
|
|
58
|
+
|
|
59
|
+
'
|
|
60
|
+
- id: full_benchmark
|
|
61
|
+
label: Full Benchmark
|
|
62
|
+
description: 'Train base reconstruction models and run sensor placement optimization
|
|
63
|
+
across all three domains (Turbulent-Flow, Sea-Temperature, Car-Aerodynamics),
|
|
64
|
+
then evaluate both random-placement and optimized-placement reconstruction quality.
|
|
65
|
+
|
|
66
|
+
'
|
|
67
|
+
- id: placement_only
|
|
68
|
+
label: Placement Optimization Only
|
|
69
|
+
description: 'Starting from pretrained base models, run only the Stage 2 sensor
|
|
70
|
+
placement optimization (walk scripts) and compare against random-placement baselines.
|
|
71
|
+
|
|
72
|
+
'
|
|
73
|
+
dataset_download:
|
|
74
|
+
primary_method: mixed
|
|
75
|
+
sources:
|
|
76
|
+
- kind: github
|
|
77
|
+
url: https://github.com/thuml/PhySense
|
|
78
|
+
access: public
|
|
79
|
+
note: 'Source code repository. Data for each benchmark must be obtained separately;
|
|
80
|
+
see per-domain README files for download links.
|
|
81
|
+
|
|
82
|
+
'
|
|
83
|
+
notes:
|
|
84
|
+
- 'Sea-Temperature data is loaded from a hardcoded path (/workspace/mayuezhou/ddim/sea_data_large/)
|
|
85
|
+
in inference scripts. The agent must download the sea temperature .npy files and
|
|
86
|
+
update paths accordingly.
|
|
87
|
+
|
|
88
|
+
'
|
|
89
|
+
- 'Turbulent-Flow data is loaded via datasets/senseiver_dataloader.py; the underlying
|
|
90
|
+
data source must be obtained and placed in the expected location.
|
|
91
|
+
|
|
92
|
+
'
|
|
93
|
+
- 'Car-Aerodynamics uses DDP training scripts; data paths are configured via command-line
|
|
94
|
+
arguments in shell scripts under Car-Aerodynamics/scripts/.
|
|
95
|
+
|
|
96
|
+
'
|
|
97
|
+
- 'Total dataset size across all three domains is estimated at 20-60 GB depending
|
|
98
|
+
on resolution choices; exact sizes are not stated in the README.
|
|
99
|
+
|
|
100
|
+
'
|
|
101
|
+
credential_requirements:
|
|
102
|
+
mode: none
|
|
103
|
+
items: []
|
|
104
|
+
notes: []
|
|
105
|
+
resources:
|
|
106
|
+
minimum:
|
|
107
|
+
cpu_cores: 8
|
|
108
|
+
ram_gb: 32
|
|
109
|
+
disk_gb: 80
|
|
110
|
+
gpu_count: 1
|
|
111
|
+
gpu_vram_gb: 16
|
|
112
|
+
recommended:
|
|
113
|
+
cpu_cores: 16
|
|
114
|
+
ram_gb: 64
|
|
115
|
+
disk_gb: 150
|
|
116
|
+
gpu_count: 1
|
|
117
|
+
gpu_vram_gb: 24
|
|
118
|
+
environment:
|
|
119
|
+
python: '3.10'
|
|
120
|
+
cuda: '11.8'
|
|
121
|
+
pytorch: 2.1.0
|
|
122
|
+
key_packages:
|
|
123
|
+
- dotwiz
|
|
124
|
+
- pyyaml
|
|
125
|
+
- numpy
|
|
126
|
+
- matplotlib
|
|
127
|
+
notes:
|
|
128
|
+
- See requirements.txt for the full dependency set.
|
|
129
|
+
- 'Inference scripts use torch.cuda.amp.autocast and hardcode GPU device indices
|
|
130
|
+
(e.g. cuda:5, cuda:0). Adjust device IDs to match your hardware.
|
|
131
|
+
|
|
132
|
+
'
|
|
133
|
+
- 'Car-Aerodynamics uses DDP (DistributedDataParallel); multi-GPU may be needed
|
|
134
|
+
for training but single-GPU suffices for inference.
|
|
135
|
+
|
|
136
|
+
'
|
|
137
|
+
risk_flags:
|
|
138
|
+
- hardcoded_paths
|
|
139
|
+
- hardcoded_device_ids
|
|
140
|
+
- dataset_not_bundled
|
|
141
|
+
- checkpoint_not_verified
|
|
142
|
+
risk_notes:
|
|
143
|
+
- 'Inference scripts contain hardcoded absolute data paths (e.g. /workspace/mayuezhou/ddim/sea_data_large/)
|
|
144
|
+
and hardcoded CUDA device indices (torch.cuda.set_device(5)). These must be edited
|
|
145
|
+
before running.
|
|
146
|
+
|
|
147
|
+
'
|
|
148
|
+
- 'Pretrained checkpoints (e.g. pipe_best_base_model.pth, sea_best_base_model.pth,
|
|
149
|
+
pipe_50sensor_opt.pth) are expected under per-domain ./checkpoints/ directories.
|
|
150
|
+
Availability depends on the snapshot packaging; if missing, training must be run
|
|
151
|
+
first.
|
|
152
|
+
|
|
153
|
+
'
|
|
154
|
+
- 'No benchmark execution was performed during the packaging pass; metric values have
|
|
155
|
+
not been verified at runtime.
|
|
156
|
+
|
|
157
|
+
'
|
|
158
|
+
- 'The walk inference scripts (sensor placement optimization evaluation) require optimized
|
|
159
|
+
checkpoints that are produced only after Stage 2 training.
|
|
160
|
+
|
|
161
|
+
'
|
|
162
|
+
recommended_when: 'Use this benchmark when you want a scientific-ML task that combines
|
|
163
|
+
physics-field reconstruction with constrained sensor placement optimization, testing
|
|
164
|
+
generative modeling (flow matching) across heterogeneous physical domains with both
|
|
165
|
+
regular and irregular geometries.
|
|
166
|
+
|
|
167
|
+
'
|
|
168
|
+
not_recommended_when: 'Do not use this if you need a lightweight benchmark with minimal
|
|
169
|
+
storage, no iterative optimization loop, or no GPU requirement. Also not suitable
|
|
170
|
+
if you cannot modify hardcoded paths and device indices in the source scripts.
|
|
171
|
+
|
|
172
|
+
'
|
|
173
|
+
paper:
|
|
174
|
+
title: 'PhySense: Sensor Placement Optimization for Accurate Physics Sensing'
|
|
175
|
+
venue: NeurIPS 2025 Oral
|
|
176
|
+
year: 2025
|
|
177
|
+
url: https://arxiv.org/abs/2505.18190
|
|
178
|
+
download:
|
|
179
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.006_physense.zip
|
|
180
|
+
archive_type: zip
|
|
181
|
+
local_dir_name: paper-6-PhySense
|
|
182
|
+
provider: github_release
|
|
183
|
+
repo: ResearAI/DeepScientist
|
|
184
|
+
tag: aisb-v0.0.1
|
|
185
|
+
asset_name: aisb.t3.006_physense.zip
|
|
186
|
+
sha256: b35419c897e1c56bad7037fc90249da8589f432ba58831550a257b99d19e8b6c
|
|
187
|
+
size_bytes: 94438
|
|
188
|
+
commercial:
|
|
189
|
+
annual_fee: null
|
|
190
|
+
display:
|
|
191
|
+
palette_seed: slate-cyan-fluid
|
|
192
|
+
art_style: scientific-visualization
|
|
193
|
+
accent_priority: high
|
|
194
|
+
image_path: ../image/006_aisb.t3.006_physense.jpg
|
|
@@ -0,0 +1,118 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.006_physense
|
|
3
|
+
name: 'PhySense:用于精确物理感知的传感器布局优化'
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: '基于双阶段流匹配方法的物理场重建与传感器布局优化,涵盖湍流、海温及汽车空气动力学基准。'
|
|
6
|
+
task_description: '本基准实现了PhySense,一个协同式双阶段物理感知框架。第一阶段训练基于流匹配的条件生成模型(规则网格使用DiT,不规则网格使用Transolver),通过交叉注意力机制从稀疏传感器观测中重建稠密物理场,传感器可放置在任意位置。第二阶段在空间约束下通过投影梯度下降优化传感器位置,利用重建反馈发现信息量最大的放置方案。智能体需在三个捆绑的科学领域运行训练和推理:(1)湍流(规则网格管道模拟),(2)海温(带陆地掩码的规则网格全球海表温度再分析),(3)汽车空气动力学(不规则网格上的3D表面压力)。每个领域提供了基础模型推理脚本(随机放置)和walk推理脚本(优化放置)。主要指标为相对L2误差和MSE损失;次要输出为优化后的传感器布局。推理脚本中的数据路径指向外部位置,需自行填充数据。预训练检查点应存放在各领域的./checkpoints/目录下。无需外部评估服务,所有指标在推理脚本中本地计算。'
|
|
7
|
+
capability_tags:
|
|
8
|
+
- research_code_optimization
|
|
9
|
+
- physics_ml
|
|
10
|
+
- sensor_placement
|
|
11
|
+
- scientific_ml
|
|
12
|
+
- field_reconstruction
|
|
13
|
+
- flow_matching
|
|
14
|
+
- generative_models
|
|
15
|
+
aisb_direction: T3
|
|
16
|
+
track_fit:
|
|
17
|
+
- paper_track
|
|
18
|
+
- benchmark_track
|
|
19
|
+
task_mode: experiment_driven
|
|
20
|
+
requires_execution: true
|
|
21
|
+
requires_paper: true
|
|
22
|
+
integrity_level: cas_plus_canary
|
|
23
|
+
snapshot_status: runnable
|
|
24
|
+
support_level: advanced
|
|
25
|
+
cost_band: medium
|
|
26
|
+
time_band: 6-24h
|
|
27
|
+
difficulty: hard
|
|
28
|
+
data_access: public
|
|
29
|
+
primary_outputs:
|
|
30
|
+
- relative_l2
|
|
31
|
+
- mse_loss
|
|
32
|
+
- sensor_layout
|
|
33
|
+
launch_profiles:
|
|
34
|
+
- id: quick_check
|
|
35
|
+
label: 快速检查
|
|
36
|
+
description: '使用预训练检查点运行单领域推理(如pipe_infer.py或sea_infer.py),验证流水线能否输出relative_l2和mse_loss指标。'
|
|
37
|
+
- id: full_benchmark
|
|
38
|
+
label: 完整基准测试
|
|
39
|
+
description: '在全部三个领域(湍流、海温、汽车空气动力学)上训练基础重建模型并运行传感器布局优化,然后评估随机放置和优化放置两种方案的重建质量。'
|
|
40
|
+
- id: placement_only
|
|
41
|
+
label: 仅布局优化
|
|
42
|
+
description: '基于预训练基础模型,仅运行第二阶段传感器布局优化(walk脚本),并与随机放置基线进行对比。'
|
|
43
|
+
dataset_download:
|
|
44
|
+
primary_method: mixed
|
|
45
|
+
sources:
|
|
46
|
+
- kind: github
|
|
47
|
+
url: https://github.com/thuml/PhySense
|
|
48
|
+
access: public
|
|
49
|
+
note: '源代码仓库。各基准数据需单独获取,详见各领域README文件中的下载链接。'
|
|
50
|
+
notes:
|
|
51
|
+
- '海温数据从推理脚本中的硬编码路径(/workspace/mayuezhou/ddim/sea_data_large/)加载。智能体需下载海温.npy文件并相应更新路径。'
|
|
52
|
+
- '湍流数据通过datasets/senseiver_dataloader.py加载;需获取底层数据源并放置到预期位置。'
|
|
53
|
+
- '汽车空气动力学使用DDP训练脚本;数据路径通过Car-Aerodynamics/scripts/下shell脚本的命令行参数配置。'
|
|
54
|
+
- '三个领域的数据集总大小估计为20-60GB,取决于分辨率选择;README中未注明确切大小。'
|
|
55
|
+
credential_requirements:
|
|
56
|
+
mode: none
|
|
57
|
+
items: []
|
|
58
|
+
notes: []
|
|
59
|
+
resources:
|
|
60
|
+
minimum:
|
|
61
|
+
cpu_cores: 8
|
|
62
|
+
ram_gb: 32
|
|
63
|
+
disk_gb: 80
|
|
64
|
+
gpu_count: 1
|
|
65
|
+
gpu_vram_gb: 16
|
|
66
|
+
recommended:
|
|
67
|
+
cpu_cores: 16
|
|
68
|
+
ram_gb: 64
|
|
69
|
+
disk_gb: 150
|
|
70
|
+
gpu_count: 1
|
|
71
|
+
gpu_vram_gb: 24
|
|
72
|
+
environment:
|
|
73
|
+
python: '3.10'
|
|
74
|
+
cuda: '11.8'
|
|
75
|
+
pytorch: 2.1.0
|
|
76
|
+
key_packages:
|
|
77
|
+
- dotwiz
|
|
78
|
+
- pyyaml
|
|
79
|
+
- numpy
|
|
80
|
+
- matplotlib
|
|
81
|
+
notes:
|
|
82
|
+
- 完整依赖列表见requirements.txt。
|
|
83
|
+
- '推理脚本使用torch.cuda.amp.autocast并硬编码GPU设备索引(如cuda:5、cuda:0)。请根据您的硬件调整设备ID。'
|
|
84
|
+
- '汽车空气动力学使用DDP(DistributedDataParallel);训练可能需要多GPU,但推理仅需单GPU即可。'
|
|
85
|
+
risk_flags:
|
|
86
|
+
- hardcoded_paths
|
|
87
|
+
- hardcoded_device_ids
|
|
88
|
+
- dataset_not_bundled
|
|
89
|
+
- checkpoint_not_verified
|
|
90
|
+
risk_notes:
|
|
91
|
+
- '推理脚本包含硬编码的绝对数据路径(如/workspace/mayuezhou/ddim/sea_data_large/)和硬编码的CUDA设备索引(torch.cuda.set_device(5))。运行前必须编辑修改。'
|
|
92
|
+
- '预训练检查点(如pipe_best_base_model.pth、sea_best_base_model.pth、pipe_50sensor_opt.pth)应存放在各领域./checkpoints/目录下。是否可用取决于快照打包情况;如缺失需先运行训练。'
|
|
93
|
+
- '打包过程中未执行基准测试;指标值未经运行时验证。'
|
|
94
|
+
- 'walk推理脚本(传感器布局优化评估)需要优化后的检查点,该检查点仅在第二阶段训练后产生。'
|
|
95
|
+
recommended_when: '当您需要一项结合物理场重建与约束传感器布局优化的科学机器学习任务,且该任务需测试跨异构物理领域的生成式建模(流匹配)能力,涉及规则和不规则几何构型时,请使用此基准。'
|
|
96
|
+
not_recommended_when: '如果需要轻量级基准(存储需求小、无迭代优化循环、无GPU要求),请勿使用。此外,如无法修改源代码脚本中的硬编码路径和设备索引,也不适用。'
|
|
97
|
+
paper:
|
|
98
|
+
title: 'PhySense: Sensor Placement Optimization for Accurate Physics Sensing'
|
|
99
|
+
venue: NeurIPS 2025 Oral
|
|
100
|
+
year: 2025
|
|
101
|
+
url: https://arxiv.org/abs/2505.18190
|
|
102
|
+
download:
|
|
103
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.006_physense.zip
|
|
104
|
+
archive_type: zip
|
|
105
|
+
local_dir_name: paper-6-PhySense
|
|
106
|
+
provider: github_release
|
|
107
|
+
repo: ResearAI/DeepScientist
|
|
108
|
+
tag: aisb-v0.0.1
|
|
109
|
+
asset_name: aisb.t3.006_physense.zip
|
|
110
|
+
sha256: b35419c897e1c56bad7037fc90249da8589f432ba58831550a257b99d19e8b6c
|
|
111
|
+
size_bytes: 94438
|
|
112
|
+
commercial:
|
|
113
|
+
annual_fee: null
|
|
114
|
+
display:
|
|
115
|
+
palette_seed: slate-cyan-fluid
|
|
116
|
+
art_style: scientific-visualization
|
|
117
|
+
accent_priority: high
|
|
118
|
+
image_path: ../image/006_aisb.t3.006_physense.jpg
|