@researai/deepscientist 1.5.16 → 1.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +309 -130
- package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
- package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
- package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
- package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
- package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
- package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
- package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
- package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
- package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
- package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
- package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
- package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
- package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
- package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
- package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
- package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
- package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
- package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
- package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
- package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
- package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
- package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
- package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
- package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
- package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
- package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
- package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
- package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
- package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
- package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
- package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
- package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
- package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
- package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
- package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
- package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
- package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
- package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
- package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
- package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
- package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
- package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
- package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
- package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
- package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
- package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
- package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
- package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
- package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
- package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
- package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
- package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
- package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
- package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
- package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
- package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
- package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
- package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
- package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
- package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
- package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
- package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
- package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
- package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
- package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
- package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
- package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
- package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
- package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
- package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
- package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
- package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
- package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
- package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
- package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
- package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
- package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
- package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
- package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
- package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
- package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
- package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
- package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
- package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
- package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
- package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
- package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
- package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
- package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
- package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
- package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
- package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
- package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
- package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
- package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
- package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
- package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
- package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
- package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
- package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
- package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
- package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
- package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
- package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
- package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
- package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
- package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
- package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
- package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
- package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
- package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
- package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
- package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
- package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
- package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
- package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
- package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
- package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
- package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
- package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
- package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
- package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
- package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
- package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
- package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
- package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
- package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
- package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
- package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
- package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
- package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
- package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
- package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
- package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
- package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
- package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
- package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
- package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
- package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
- package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
- package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
- package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
- package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
- package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
- package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
- package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
- package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
- package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
- package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
- package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
- package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
- package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
- package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
- package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
- package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
- package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
- package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
- package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
- package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
- package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
- package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
- package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
- package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
- package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
- package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
- package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
- package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
- package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
- package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
- package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
- package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
- package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
- package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
- package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
- package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
- package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
- package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
- package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
- package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
- package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
- package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
- package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
- package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
- package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
- package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
- package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
- package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
- package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
- package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
- package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
- package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
- package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
- package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
- package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
- package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
- package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
- package/AISB/image/aisb.b10.climate_earth.svg +16 -0
- package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
- package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
- package/AISB/image/aisb.b2.agent_systems.svg +16 -0
- package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
- package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
- package/AISB/image/aisb.b5.math_proof.svg +16 -0
- package/AISB/image/aisb.b6.research_process.svg +16 -0
- package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
- package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
- package/AISB/image/aisb.b9.material_science.svg +16 -0
- package/README.md +196 -32
- package/bin/ds.js +924 -66
- package/docs/en/00_QUICK_START.md +195 -18
- package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
- package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
- package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
- package/docs/en/05_TUI_GUIDE.md +171 -2
- package/docs/en/07_MEMORY_AND_MCP.md +38 -2
- package/docs/en/09_DOCTOR.md +78 -7
- package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
- package/docs/en/11_LICENSE_AND_RISK.md +4 -0
- package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/en/15_CODEX_PROVIDER_SETUP.md +624 -180
- package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +386 -0
- package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
- package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
- package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
- package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
- package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
- package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
- package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
- package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
- package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
- package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
- package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
- package/docs/en/91_DEVELOPMENT.md +266 -0
- package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
- package/docs/en/README.md +48 -7
- package/docs/images/admin/admin-connectors-health-en.png +0 -0
- package/docs/images/admin/admin-controllers-en.png +0 -0
- package/docs/images/admin/admin-diagnostics-en.png +0 -0
- package/docs/images/admin/admin-errors-en.png +0 -0
- package/docs/images/admin/admin-issues-en.png +0 -0
- package/docs/images/admin/admin-logs-en.png +0 -0
- package/docs/images/admin/admin-quest-detail-en.png +0 -0
- package/docs/images/admin/admin-quests-en.png +0 -0
- package/docs/images/admin/admin-repairs-en.png +0 -0
- package/docs/images/admin/admin-runtime-en.png +0 -0
- package/docs/images/admin/admin-search-en.png +0 -0
- package/docs/images/admin/admin-stats-en.png +0 -0
- package/docs/images/admin/admin-summary-en.png +0 -0
- package/docs/images/connectors/connector-discord-en.png +0 -0
- package/docs/images/connectors/connector-feishu-en.png +0 -0
- package/docs/images/connectors/connector-lingzhu-en.png +0 -0
- package/docs/images/connectors/connector-qq-en.png +0 -0
- package/docs/images/connectors/connector-slack-en.png +0 -0
- package/docs/images/connectors/connector-telegram-en.png +0 -0
- package/docs/images/connectors/connector-weixin-en.png +0 -0
- package/docs/images/connectors/connector-whatsapp-en.png +0 -0
- package/docs/images/settings/settings-baselines-en.png +0 -0
- package/docs/images/settings/settings-config-en.png +0 -0
- package/docs/images/settings/settings-connectors-overview-en.png +0 -0
- package/docs/images/settings/settings-deepxiv-en.png +0 -0
- package/docs/images/settings/settings-mcp-servers-en.png +0 -0
- package/docs/images/settings/settings-plugins-en.png +0 -0
- package/docs/images/settings/settings-runners-en.png +0 -0
- package/docs/zh/00_QUICK_START.md +142 -18
- package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
- package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/zh/05_TUI_GUIDE.md +171 -2
- package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
- package/docs/zh/09_DOCTOR.md +54 -8
- package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
- package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
- package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/zh/15_CODEX_PROVIDER_SETUP.md +552 -181
- package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +384 -0
- package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
- package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
- package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
- package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
- package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
- package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
- package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
- package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
- package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
- package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
- package/docs/zh/README.md +33 -7
- package/install.sh +168 -20
- package/package.json +5 -1
- package/pyproject.toml +2 -1
- package/src/deepscientist/__init__.py +1 -1
- package/src/deepscientist/acp/envelope.py +13 -0
- package/src/deepscientist/admin/__init__.py +3 -0
- package/src/deepscientist/admin/charts.py +681 -0
- package/src/deepscientist/admin/logs.py +119 -0
- package/src/deepscientist/admin/repairs.py +217 -0
- package/src/deepscientist/admin/service.py +1310 -0
- package/src/deepscientist/admin/system_info.py +700 -0
- package/src/deepscientist/admin/tasks.py +465 -0
- package/src/deepscientist/admin/tool_metrics.py +600 -0
- package/src/deepscientist/artifact/guidance.py +8 -4
- package/src/deepscientist/artifact/schemas.py +115 -0
- package/src/deepscientist/artifact/service.py +4268 -260
- package/src/deepscientist/bash_exec/monitor.py +30 -3
- package/src/deepscientist/bash_exec/service.py +134 -1
- package/src/deepscientist/benchstore/__init__.py +4 -0
- package/src/deepscientist/benchstore/prompt_builder.py +224 -0
- package/src/deepscientist/benchstore/service.py +1716 -0
- package/src/deepscientist/bridges/connectors.py +8 -2
- package/src/deepscientist/channels/weixin_ilink.py +8 -1
- package/src/deepscientist/cli.py +92 -17
- package/src/deepscientist/codex_cli_compat.py +187 -74
- package/src/deepscientist/config/models.py +82 -11
- package/src/deepscientist/config/service.py +1077 -93
- package/src/deepscientist/connector/weixin_support.py +48 -17
- package/src/deepscientist/daemon/api/handlers.py +827 -235
- package/src/deepscientist/daemon/api/router.py +81 -1
- package/src/deepscientist/daemon/app.py +1512 -85
- package/src/deepscientist/diagnostics/__init__.py +6 -0
- package/src/deepscientist/diagnostics/runner_failures.py +277 -0
- package/src/deepscientist/doctor.py +407 -56
- package/src/deepscientist/evidence_packets.py +590 -0
- package/src/deepscientist/home.py +52 -4
- package/src/deepscientist/kimi_cli_compat.py +50 -0
- package/src/deepscientist/latex_runtime.py +2 -2
- package/src/deepscientist/mcp/context.py +2 -0
- package/src/deepscientist/mcp/schemas.py +114 -0
- package/src/deepscientist/mcp/server.py +1566 -126
- package/src/deepscientist/memory/service.py +203 -16
- package/src/deepscientist/process_control.py +8 -1
- package/src/deepscientist/prompts/builder.py +850 -88
- package/src/deepscientist/quest/__init__.py +2 -2
- package/src/deepscientist/quest/layout.py +12 -1
- package/src/deepscientist/quest/node_traces.py +10 -0
- package/src/deepscientist/quest/service.py +1852 -161
- package/src/deepscientist/quest/stage_views.py +1 -1
- package/src/deepscientist/runners/__init__.py +18 -0
- package/src/deepscientist/runners/base.py +89 -1
- package/src/deepscientist/runners/builtins.py +13 -1
- package/src/deepscientist/runners/claude.py +391 -0
- package/src/deepscientist/runners/codex.py +480 -35
- package/src/deepscientist/runners/codex_telemetry.py +127 -0
- package/src/deepscientist/runners/kimi.py +334 -0
- package/src/deepscientist/runners/metadata.py +68 -0
- package/src/deepscientist/runners/opencode.py +414 -0
- package/src/deepscientist/runners/runtime_overrides.py +100 -0
- package/src/deepscientist/runners/simple_cli.py +538 -0
- package/src/deepscientist/runtime_storage.py +303 -0
- package/src/deepscientist/shared.py +80 -16
- package/src/deepscientist/skills/installer.py +37 -0
- package/src/deepscientist/skills/registry.py +2 -0
- package/src/deepscientist/tinytex.py +2 -2
- package/src/deepscientist/tui.py +10 -3
- package/src/prompts/benchstore/system.md +77 -0
- package/src/prompts/connectors/qq.md +33 -2
- package/src/prompts/connectors/weixin.md +208 -23
- package/src/prompts/contracts/admin_ops.md +74 -0
- package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
- package/src/prompts/contracts/shared_interaction.md +5 -10
- package/src/prompts/start_setup/system.md +422 -0
- package/src/prompts/system.md +411 -304
- package/src/prompts/system_copilot.md +89 -0
- package/src/skills/analysis-campaign/SKILL.md +239 -578
- package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
- package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
- package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
- package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
- package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
- package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
- package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
- package/src/skills/baseline/SKILL.md +183 -461
- package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
- package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
- package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
- package/src/skills/baseline/references/baseline-plan-template.md +37 -76
- package/src/skills/baseline/references/boundary-cases.md +86 -0
- package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
- package/src/skills/baseline/references/comparability-contract.md +7 -12
- package/src/skills/baseline/references/operational-guidance.md +56 -0
- package/src/skills/baseline/references/route-selection.md +5 -25
- package/src/skills/decision/SKILL.md +113 -306
- package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
- package/src/skills/decision/references/operational-guidance.md +94 -0
- package/src/skills/decision/references/research-route-criteria.md +7 -8
- package/src/skills/decision/references/strategic-decision-template.md +13 -26
- package/src/skills/experiment/SKILL.md +132 -670
- package/src/skills/experiment/references/execution-playbook.md +374 -0
- package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
- package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
- package/src/skills/experiment/references/operational-guidance.md +108 -0
- package/src/skills/finalize/SKILL.md +62 -0
- package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
- package/src/skills/finalize/references/resume-packet-template.md +7 -0
- package/src/skills/idea/SKILL.md +228 -15
- package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
- package/src/skills/idea/references/current-board-packet-template.md +61 -0
- package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
- package/src/skills/idea/references/idea-generation-playbook.md +21 -0
- package/src/skills/idea/references/idea-thinking-flow.md +6 -0
- package/src/skills/idea/references/literature-survey-template.md +3 -0
- package/src/skills/idea/references/objective-contract-template.md +54 -0
- package/src/skills/idea/references/outline-seeding-example.md +56 -0
- package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
- package/src/skills/idea/references/related-work-playbook.md +75 -2
- package/src/skills/idea/references/research-history-playbook.md +114 -0
- package/src/skills/idea/references/selection-gate.md +58 -6
- package/src/skills/intake-audit/SKILL.md +43 -2
- package/src/skills/intake-audit/references/state-audit-template.md +10 -0
- package/src/skills/nature-data/SKILL.md +128 -0
- package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-data/agents/openai.yaml +4 -0
- package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
- package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
- package/src/skills/nature-data/references/policy-principles.md +103 -0
- package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
- package/src/skills/nature-data/references/source-basis.md +54 -0
- package/src/skills/nature-data/references/statement-patterns.md +153 -0
- package/src/skills/nature-figure/SKILL.md +197 -0
- package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-figure/agents/openai.yaml +4 -0
- package/src/skills/nature-figure/evals/evals.json +37 -0
- package/src/skills/nature-figure/references/api.md +428 -0
- package/src/skills/nature-figure/references/backend-selection.md +100 -0
- package/src/skills/nature-figure/references/chart-types.md +281 -0
- package/src/skills/nature-figure/references/common-patterns.md +349 -0
- package/src/skills/nature-figure/references/design-theory.md +436 -0
- package/src/skills/nature-figure/references/figure-contract.md +93 -0
- package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
- package/src/skills/nature-figure/references/qa-contract.md +119 -0
- package/src/skills/nature-figure/references/r-template-index.md +66 -0
- package/src/skills/nature-figure/references/r-workflow.md +161 -0
- package/src/skills/nature-figure/references/tutorials.md +250 -0
- package/src/skills/nature-paper2ppt/SKILL.md +507 -0
- package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/SKILL.md +385 -0
- package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-polishing/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
- package/src/skills/nature-polishing/references/section-moves.md +240 -0
- package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
- package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
- package/src/skills/optimize/SKILL.md +177 -1568
- package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
- package/src/skills/optimize/references/candidate-board-template.md +13 -0
- package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
- package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
- package/src/skills/optimize/references/debug-response-template.md +29 -0
- package/src/skills/optimize/references/frontier-review-template.md +32 -0
- package/src/skills/optimize/references/fusion-playbook.md +36 -0
- package/src/skills/optimize/references/method-brief-template.md +73 -0
- package/src/skills/optimize/references/operational-guidance.md +621 -0
- package/src/skills/optimize/references/optimization-memory-template.md +30 -0
- package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
- package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
- package/src/skills/optimize/references/prompt-patterns.md +49 -0
- package/src/skills/paper-outline/SKILL.md +227 -0
- package/src/skills/paper-outline/references/outline-patterns.md +87 -0
- package/src/skills/paper-plot/SKILL.md +79 -0
- package/src/skills/paper-plot/agents/openai.yaml +4 -0
- package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
- package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
- package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
- package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
- package/src/skills/paper-plot/references/line_training_curve.md +44 -0
- package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
- package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
- package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
- package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
- package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
- package/src/skills/paper-plot/scripts/line_aime.py +94 -0
- package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
- package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
- package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
- package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
- package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
- package/src/skills/rebuttal/SKILL.md +9 -0
- package/src/skills/references/tool-usage-by-stage.md +438 -0
- package/src/skills/review/SKILL.md +105 -7
- package/src/skills/science/PROVENANCE.md +44 -0
- package/src/skills/science/SKILL.md +137 -0
- package/src/skills/science/references/artifact-science-tool.md +110 -0
- package/src/skills/science/references/claim-type-discipline.md +56 -0
- package/src/skills/science/references/domain-index.md +422 -0
- package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
- package/src/skills/science/references/package-check-playbook.md +64 -0
- package/src/skills/science/references/package-index.min.json +3616 -0
- package/src/skills/science/references/packages/abinit.md +80 -0
- package/src/skills/science/references/packages/acts.md +73 -0
- package/src/skills/science/references/packages/aiida-core.md +80 -0
- package/src/skills/science/references/packages/alamode.md +80 -0
- package/src/skills/science/references/packages/amuse.md +88 -0
- package/src/skills/science/references/packages/anndata.md +88 -0
- package/src/skills/science/references/packages/arbor.md +80 -0
- package/src/skills/science/references/packages/arc.md +73 -0
- package/src/skills/science/references/packages/astropy.md +88 -0
- package/src/skills/science/references/packages/astroquery.md +88 -0
- package/src/skills/science/references/packages/atomate2.md +80 -0
- package/src/skills/science/references/packages/atomsmltr.md +73 -0
- package/src/skills/science/references/packages/awkward.md +73 -0
- package/src/skills/science/references/packages/batman.md +88 -0
- package/src/skills/science/references/packages/biopython.md +88 -0
- package/src/skills/science/references/packages/bloqade.md +73 -0
- package/src/skills/science/references/packages/brian2.md +73 -0
- package/src/skills/science/references/packages/bullet3.md +73 -0
- package/src/skills/science/references/packages/calculix.md +80 -0
- package/src/skills/science/references/packages/cantera.md +73 -0
- package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
- package/src/skills/science/references/packages/ccdproc.md +88 -0
- package/src/skills/science/references/packages/celerite2.md +88 -0
- package/src/skills/science/references/packages/cellrank.md +73 -0
- package/src/skills/science/references/packages/cesm.md +80 -0
- package/src/skills/science/references/packages/chemicals.md +73 -0
- package/src/skills/science/references/packages/chempy.md +73 -0
- package/src/skills/science/references/packages/cirq.md +73 -0
- package/src/skills/science/references/packages/coffea.md +73 -0
- package/src/skills/science/references/packages/cp2k.md +88 -0
- package/src/skills/science/references/packages/custodian.md +80 -0
- package/src/skills/science/references/packages/dart.md +73 -0
- package/src/skills/science/references/packages/datamol.md +88 -0
- package/src/skills/science/references/packages/dd4hep.md +73 -0
- package/src/skills/science/references/packages/dealii.md +80 -0
- package/src/skills/science/references/packages/deepchem.md +88 -0
- package/src/skills/science/references/packages/delphes.md +73 -0
- package/src/skills/science/references/packages/devito.md +80 -0
- package/src/skills/science/references/packages/dftb.md +88 -0
- package/src/skills/science/references/packages/dftd4.md +88 -0
- package/src/skills/science/references/packages/dftk-jl.md +80 -0
- package/src/skills/science/references/packages/dolfinx.md +80 -0
- package/src/skills/science/references/packages/drake.md +73 -0
- package/src/skills/science/references/packages/dumux.md +73 -0
- package/src/skills/science/references/packages/elk.md +80 -0
- package/src/skills/science/references/packages/elmerfem.md +80 -0
- package/src/skills/science/references/packages/enzo-e.md +88 -0
- package/src/skills/science/references/packages/espresso.md +80 -0
- package/src/skills/science/references/packages/exoplanet.md +88 -0
- package/src/skills/science/references/packages/fairroot.md +73 -0
- package/src/skills/science/references/packages/fbpic.md +80 -0
- package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
- package/src/skills/science/references/packages/geant4.md +73 -0
- package/src/skills/science/references/packages/geosx.md +80 -0
- package/src/skills/science/references/packages/gprmax.md +80 -0
- package/src/skills/science/references/packages/gromacs.md +80 -0
- package/src/skills/science/references/packages/gwaslab.md +73 -0
- package/src/skills/science/references/packages/gz-sim.md +73 -0
- package/src/skills/science/references/packages/hail.md +88 -0
- package/src/skills/science/references/packages/hiphive.md +80 -0
- package/src/skills/science/references/packages/hoomd-blue.md +80 -0
- package/src/skills/science/references/packages/itensor.md +73 -0
- package/src/skills/science/references/packages/itensors-jl.md +73 -0
- package/src/skills/science/references/packages/jdftx.md +73 -0
- package/src/skills/science/references/packages/jobflow.md +80 -0
- package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
- package/src/skills/science/references/packages/kite.md +80 -0
- package/src/skills/science/references/packages/kratos.md +80 -0
- package/src/skills/science/references/packages/kwant.md +73 -0
- package/src/skills/science/references/packages/lammps.md +80 -0
- package/src/skills/science/references/packages/lightkurve.md +88 -0
- package/src/skills/science/references/packages/limix.md +73 -0
- package/src/skills/science/references/packages/maxwelllink.md +80 -0
- package/src/skills/science/references/packages/mcdc.md +73 -0
- package/src/skills/science/references/packages/meep.md +80 -0
- package/src/skills/science/references/packages/mfem.md +80 -0
- package/src/skills/science/references/packages/mitgcm.md +73 -0
- package/src/skills/science/references/packages/modflow6.md +73 -0
- package/src/skills/science/references/packages/molecool.md +73 -0
- package/src/skills/science/references/packages/mom6.md +73 -0
- package/src/skills/science/references/packages/moose.md +80 -0
- package/src/skills/science/references/packages/mpas-model.md +73 -0
- package/src/skills/science/references/packages/mujoco.md +73 -0
- package/src/skills/science/references/packages/mumax3.md +73 -0
- package/src/skills/science/references/packages/nekrs.md +80 -0
- package/src/skills/science/references/packages/nessi.md +73 -0
- package/src/skills/science/references/packages/nest-simulator.md +73 -0
- package/src/skills/science/references/packages/netket.md +73 -0
- package/src/skills/science/references/packages/neuron.md +73 -0
- package/src/skills/science/references/packages/nextflow.md +88 -0
- package/src/skills/science/references/packages/nwchem.md +88 -0
- package/src/skills/science/references/packages/openbabel.md +88 -0
- package/src/skills/science/references/packages/openems.md +80 -0
- package/src/skills/science/references/packages/openff-toolkit.md +88 -0
- package/src/skills/science/references/packages/openfoam-dev.md +80 -0
- package/src/skills/science/references/packages/openmc.md +73 -0
- package/src/skills/science/references/packages/openmm.md +80 -0
- package/src/skills/science/references/packages/openmoc.md +73 -0
- package/src/skills/science/references/packages/openmx.md +80 -0
- package/src/skills/science/references/packages/opensees.md +80 -0
- package/src/skills/science/references/packages/opensn.md +80 -0
- package/src/skills/science/references/packages/opm-simulators.md +73 -0
- package/src/skills/science/references/packages/oqupy.md +73 -0
- package/src/skills/science/references/packages/packmol.md +80 -0
- package/src/skills/science/references/packages/palabos.md +80 -0
- package/src/skills/science/references/packages/parflow.md +80 -0
- package/src/skills/science/references/packages/pennylane.md +88 -0
- package/src/skills/science/references/packages/perceval.md +73 -0
- package/src/skills/science/references/packages/phono3py.md +73 -0
- package/src/skills/science/references/packages/phonopy.md +73 -0
- package/src/skills/science/references/packages/photutils.md +88 -0
- package/src/skills/science/references/packages/picongpu.md +80 -0
- package/src/skills/science/references/packages/plink-ng.md +88 -0
- package/src/skills/science/references/packages/precice.md +73 -0
- package/src/skills/science/references/packages/psc.md +80 -0
- package/src/skills/science/references/packages/psi4.md +88 -0
- package/src/skills/science/references/packages/pybinding.md +73 -0
- package/src/skills/science/references/packages/pyfr.md +80 -0
- package/src/skills/science/references/packages/pyhf.md +73 -0
- package/src/skills/science/references/packages/pyiron_base.md +80 -0
- package/src/skills/science/references/packages/pylcp.md +73 -0
- package/src/skills/science/references/packages/pylith.md +80 -0
- package/src/skills/science/references/packages/pynbody.md +88 -0
- package/src/skills/science/references/packages/pysam.md +88 -0
- package/src/skills/science/references/packages/pyscf.md +88 -0
- package/src/skills/science/references/packages/q-e.md +73 -0
- package/src/skills/science/references/packages/qibo.md +73 -0
- package/src/skills/science/references/packages/qiskit.md +73 -0
- package/src/skills/science/references/packages/quantica-jl.md +73 -0
- package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
- package/src/skills/science/references/packages/quimb.md +73 -0
- package/src/skills/science/references/packages/qulacs.md +73 -0
- package/src/skills/science/references/packages/qutip.md +73 -0
- package/src/skills/science/references/packages/rdkit.md +88 -0
- package/src/skills/science/references/packages/rmg-py.md +73 -0
- package/src/skills/science/references/packages/root.md +73 -0
- package/src/skills/science/references/packages/scanpy.md +88 -0
- package/src/skills/science/references/packages/scikit-allel.md +88 -0
- package/src/skills/science/references/packages/scikit-bio.md +88 -0
- package/src/skills/science/references/packages/scqubits.md +73 -0
- package/src/skills/science/references/packages/scuff-em.md +80 -0
- package/src/skills/science/references/packages/scvi-tools.md +73 -0
- package/src/skills/science/references/packages/seissol.md +73 -0
- package/src/skills/science/references/packages/sfepy.md +80 -0
- package/src/skills/science/references/packages/sisl.md +73 -0
- package/src/skills/science/references/packages/smilei.md +80 -0
- package/src/skills/science/references/packages/snakemake.md +88 -0
- package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
- package/src/skills/science/references/packages/specutils.md +88 -0
- package/src/skills/science/references/packages/spglib.md +80 -0
- package/src/skills/science/references/packages/squidpy.md +88 -0
- package/src/skills/science/references/packages/starry.md +88 -0
- package/src/skills/science/references/packages/strawberryfields.md +73 -0
- package/src/skills/science/references/packages/su2.md +80 -0
- package/src/skills/science/references/packages/sunny-jl.md +73 -0
- package/src/skills/science/references/packages/sw4.md +73 -0
- package/src/skills/science/references/packages/swift.md +88 -0
- package/src/skills/science/references/packages/tdnegf.md +73 -0
- package/src/skills/science/references/packages/tenpy.md +73 -0
- package/src/skills/science/references/packages/thermo.md +73 -0
- package/src/skills/science/references/packages/tkwant.md +73 -0
- package/src/skills/science/references/packages/tvb-root.md +73 -0
- package/src/skills/science/references/packages/uproot5.md +73 -0
- package/src/skills/science/references/packages/vampire.md +80 -0
- package/src/skills/science/references/packages/wannier_tools.md +73 -0
- package/src/skills/science/references/packages/warpx.md +80 -0
- package/src/skills/science/references/packages/wrf.md +73 -0
- package/src/skills/science/references/packages/xtb.md +88 -0
- package/src/skills/science/references/packages/yt.md +73 -0
- package/src/skills/science/references/science-task-brief-template.md +71 -0
- package/src/skills/scout/SKILL.md +83 -425
- package/src/skills/scout/references/literature-scout-template.md +5 -24
- package/src/skills/scout/references/operational-guidance.md +191 -0
- package/src/skills/scout/references/paper-triage-playbook.md +11 -35
- package/src/skills/write/SKILL.md +744 -1246
- package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
- package/src/skills/write/references/oral_package_patterns.md +252 -0
- package/src/skills/write/references/oral_writing_principles.md +291 -0
- package/src/skills/write/references/section_rewrite_checklist.md +234 -0
- package/src/tui/dist/app/AppContainer.js +1314 -27
- package/src/tui/dist/components/Composer.js +26 -1
- package/src/tui/dist/components/ConfigScreen.js +2 -1
- package/src/tui/dist/components/InputPrompt.js +25 -9
- package/src/tui/dist/components/MainContent.js +18 -3
- package/src/tui/dist/components/QuestScreen.js +3 -2
- package/src/tui/dist/components/UtilityScreen.js +37 -0
- package/src/tui/dist/hooks/useSafeInput.js +10 -0
- package/src/tui/dist/index.js +13 -1
- package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
- package/src/tui/dist/lib/api.js +89 -1
- package/src/tui/package.json +1 -1
- package/src/ui/dist/assets/{AnalysisPlugin-DnSm0GZn.js → AnalysisPlugin-CA94NGmI.js} +1 -1
- package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
- package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
- package/src/ui/dist/assets/{CodeViewerPlugin-itb0tltR.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
- package/src/ui/dist/assets/{DocViewerPlugin-DqKkiCI6.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
- package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
- package/src/ui/dist/assets/{GitDiffViewerPlugin-DxL2ezFG.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
- package/src/ui/dist/assets/{GitSnapshotViewer-B_RQm1YZ.js → GitSnapshotViewer-CweA6VON.js} +2 -2
- package/src/ui/dist/assets/{ImageViewerPlugin-tHqlXY3n.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
- package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
- package/src/ui/dist/assets/{LatexPlugin-B495DTXC.js → LatexPlugin-BQjAaA5J.js} +4 -4
- package/src/ui/dist/assets/{MarkdownViewerPlugin-DG28-61B.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
- package/src/ui/dist/assets/{MarketplacePlugin-BiOGT-Kj.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
- package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
- package/src/ui/dist/assets/{NotebookEditor-CVsj8h_T.js → NotebookEditor-WFyd8Ybt.js} +23 -23
- package/src/ui/dist/assets/{PdfLoader-CASDQmxJ.js → PdfLoader-CLE5u5TS.js} +3 -3
- package/src/ui/dist/assets/{PdfMarkdownPlugin-BFhwoKsY.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
- package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
- package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
- package/src/ui/dist/assets/{TextViewerPlugin-CB4DYfWO.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
- package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
- package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
- package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
- package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
- package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
- package/src/ui/dist/assets/{code-DLC6G24T.js → code-DbsmSd3Y.js} +1 -1
- package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
- package/src/ui/dist/assets/{wrap-text-CwMn-iqb.js → file-jump-queue-DeQBikaw.js} +3 -3
- package/src/ui/dist/assets/{file-socket-Cu4Qln7Y.js → file-socket-DA5XIx88.js} +1 -1
- package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
- package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
- package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
- package/src/ui/dist/assets/{index-wQ7RIIRd.js → index-BsO46tJA.js} +1 -1
- package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
- package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
- package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
- package/src/ui/dist/assets/{project-sync-CsX08Qno.js → project-sync-DPmWKmKD.js} +1 -1
- package/src/ui/dist/assets/{zoom-out-R-GWEhzS.js → zoom-out-DAukFWen.js} +3 -3
- package/src/ui/dist/index.html +3 -3
- package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
- package/src/skills/baseline/references/memory-playbook.md +0 -40
- package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
- package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
- package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
- package/src/skills/write/references/paper-section-playbook.md +0 -64
- package/src/skills/write/references/reviewer-first-writing.md +0 -64
- package/src/skills/write/references/revision-checklist.md +0 -70
- package/src/skills/write/references/section-contracts.md +0 -82
- package/src/skills/write/references/sentence-level-proofing.md +0 -49
- package/src/ui/dist/assets/AiManusChatView-COFACy7V.js +0 -204
- package/src/ui/dist/assets/CliPlugin-CvwCmDQ5.js +0 -109
- package/src/ui/dist/assets/CodeEditorPlugin-cOqSa0xq.js +0 -2
- package/src/ui/dist/assets/GitCommitViewerPlugin-DVgNHBCS.js +0 -1
- package/src/ui/dist/assets/LabCopilotPanel-ClMbq5Yu.js +0 -14
- package/src/ui/dist/assets/LabPlugin-L_SuE8ow.js +0 -22
- package/src/ui/dist/assets/NotebookEditor-C-4Kt1p9.js +0 -81
- package/src/ui/dist/assets/PdfViewerPlugin-DcOzU9vd.js +0 -17
- package/src/ui/dist/assets/SearchPlugin-CHj7M58O.js +0 -16
- package/src/ui/dist/assets/VNCViewer-CjlbyCB3.js +0 -11
- package/src/ui/dist/assets/bot-CFkZY-JP.js +0 -6
- package/src/ui/dist/assets/chevron-up-Dq5ofbht.js +0 -6
- package/src/ui/dist/assets/file-content-Dv4LoZec.js +0 -1
- package/src/ui/dist/assets/file-diff-panel-Denq-lC3.js +0 -1
- package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
- package/src/ui/dist/assets/git-commit-horizontal-BUh6G52n.js +0 -6
- package/src/ui/dist/assets/image-B9HUUddG.js +0 -6
- package/src/ui/dist/assets/index-B2B1sg-M.js +0 -1
- package/src/ui/dist/assets/index-Cgla8biy.css +0 -33
- package/src/ui/dist/assets/index-DRyx7vAc.js +0 -1
- package/src/ui/dist/assets/index-Gbl53BNp.js +0 -2496
- package/src/ui/dist/assets/pdf-effect-queue-ZtnHFCAi.js +0 -6
- package/src/ui/dist/assets/popover-DL6h35vr.js +0 -1
- package/src/ui/dist/assets/select-DvmXt1yY.js +0 -11
- package/src/ui/dist/assets/sigma-7jpXazui.js +0 -6
- package/src/ui/dist/assets/trash-xA7kFt8i.js +0 -11
- package/src/ui/dist/assets/useCliAccess-DsMwDjOp.js +0 -1
- package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
|
@@ -0,0 +1,234 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.065_proteinbinding
|
|
3
|
+
name: StaB-ddG — Predicting Mutational Effects on Protein Binding from Folding Energy
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: Transfer-learning benchmark for protein-protein binding ΔΔG prediction via
|
|
6
|
+
stability-to-binding parameterization using ProteinMPNN and two-stage fine-tuning.
|
|
7
|
+
task_description: "This packaged benchmark covers the full StaB-ddG workflow for predicting\
|
|
8
|
+
\ mutational effects on protein-protein binding free energies (ΔΔG, kcal/mol). The\
|
|
9
|
+
\ core idea is the thermodynamic identity ΔG_bind(A:B) = ΔG_fold(A:B) − ΔG_fold(A)\
|
|
10
|
+
\ − ΔG_fold(B), which allows binding energy prediction to be reduced to folding\
|
|
11
|
+
\ energy prediction and enables transfer from copious stability data to scarce binding\
|
|
12
|
+
\ data.\nThe benchmark proceeds in two fine-tuning stages:\n\n Stage 1 — Stability\
|
|
13
|
+
\ fine-tuning: ProteinMPNN is fine-tuned on the Megascale high-throughput\n folding\
|
|
14
|
+
\ stability dataset (Tsuboyama 2023, ~350 k measurements, AlphaFold PDB structures,\n\
|
|
15
|
+
\ downloaded from Zenodo record 7992926).\n\n Stage 2 — Binding fine-tuning: The\
|
|
16
|
+
\ stability-fine-tuned model is further fine-tuned on a\n quality-filtered subset\
|
|
17
|
+
\ of the SKEMPI v2 database of protein-protein binding ΔΔG measurements,\n using\
|
|
18
|
+
\ interface-homology cluster splits to prevent data leakage.\n\nEvaluation reproduces\
|
|
19
|
+
\ the SKEMPI benchmark results reported in the ICML 2025 paper, computing per-interface\
|
|
20
|
+
\ Pearson and Spearman correlations, overall correlations, RMSE, and ROC-AUC. Baseline\
|
|
21
|
+
\ comparisons against FoldX and Flex ddG are included in the packaged baselines/\
|
|
22
|
+
\ directory. StaB-ddG is the first deep-learning predictor reported to match FoldX\
|
|
23
|
+
\ accuracy while offering a >1,000× speed-up.\nInputs: PDB structure files (wild-type\
|
|
24
|
+
\ complex), chain specifications, and mutation strings. Outputs: per-mutant ΔΔG\
|
|
25
|
+
\ predictions (kcal/mol), per-interface correlation metrics, and a full evaluation\
|
|
26
|
+
\ CSV.\n"
|
|
27
|
+
capability_tags:
|
|
28
|
+
- protein_modeling
|
|
29
|
+
- binding_energy_prediction
|
|
30
|
+
- structural_biology
|
|
31
|
+
- scientific_ml
|
|
32
|
+
- transfer_learning
|
|
33
|
+
- research_code_optimization
|
|
34
|
+
aisb_direction: T3
|
|
35
|
+
track_fit:
|
|
36
|
+
- paper_track
|
|
37
|
+
- benchmark_track
|
|
38
|
+
task_mode: experiment_driven
|
|
39
|
+
requires_execution: true
|
|
40
|
+
requires_paper: true
|
|
41
|
+
integrity_level: cas_plus_canary
|
|
42
|
+
snapshot_status: runnable
|
|
43
|
+
support_level: advanced
|
|
44
|
+
time_band: 6-24h
|
|
45
|
+
cost_band: medium
|
|
46
|
+
difficulty: hard
|
|
47
|
+
data_access: public
|
|
48
|
+
primary_outputs:
|
|
49
|
+
- per_interface_pearson
|
|
50
|
+
- per_interface_spearman
|
|
51
|
+
- overall_pearson
|
|
52
|
+
- overall_spearman
|
|
53
|
+
- roc_auc
|
|
54
|
+
- ddg_predictions
|
|
55
|
+
- binding_report
|
|
56
|
+
launch_profiles:
|
|
57
|
+
- id: single_prediction
|
|
58
|
+
label: Single Prediction
|
|
59
|
+
description: 'Run a single-mutation or multi-mutation ΔΔG prediction for one complex
|
|
60
|
+
using run_stabddg.py. Requires a PDB file, chain specification (e.g. ABC_DE),
|
|
61
|
+
and a mutation string (e.g. EA63Q,QD30V,KA66A). Uses the pre-trained stabddg.pt
|
|
62
|
+
checkpoint. Outputs output.csv with pred_1 column. No training data download required.
|
|
63
|
+
|
|
64
|
+
'
|
|
65
|
+
- id: eval_only
|
|
66
|
+
label: Evaluation Only
|
|
67
|
+
description: 'Reproduce SKEMPI benchmark numbers using the pre-trained stabddg.pt
|
|
68
|
+
checkpoint via skempi_eval.py. Requires downloading SKEMPI2_PDBs from life.bsc.es.
|
|
69
|
+
Produces cache/eval.csv and per-interface correlation metrics. Fastest path to
|
|
70
|
+
paper numbers.
|
|
71
|
+
|
|
72
|
+
'
|
|
73
|
+
- id: train_and_eval
|
|
74
|
+
label: Full Train + Eval
|
|
75
|
+
description: 'Run the complete two-stage fine-tuning and evaluation pipeline: (1)
|
|
76
|
+
stability fine-tuning on Megascale via stability_finetune.py, then (2) SKEMPI
|
|
77
|
+
binding fine-tuning via skempi_finetune.py, then (3) evaluation via skempi_eval.py.
|
|
78
|
+
Requires both Megascale and SKEMPI data downloads. Optional Wandb tracking via
|
|
79
|
+
--wandb flag.
|
|
80
|
+
|
|
81
|
+
'
|
|
82
|
+
dataset_download:
|
|
83
|
+
primary_method: mixed
|
|
84
|
+
sources:
|
|
85
|
+
- name: Megascale Folding Stability Dataset (Stage 1)
|
|
86
|
+
url: https://zenodo.org/records/7992926
|
|
87
|
+
files:
|
|
88
|
+
- Tsuboyama2023_Dataset2_Dataset3_20230416.csv
|
|
89
|
+
- AlphaFold_model_PDBs.zip
|
|
90
|
+
- Processed_K50_dG_datasets.zip
|
|
91
|
+
notes: 'Download via wget from Zenodo record 7992926. Unzip both archives before
|
|
92
|
+
running stability_finetune.py. Download takes several minutes. Required for
|
|
93
|
+
Stage 1 only.
|
|
94
|
+
|
|
95
|
+
'
|
|
96
|
+
- name: SKEMPI v2 Binding Energy Dataset (Stage 2 and Eval)
|
|
97
|
+
url: https://life.bsc.es/pid/skempi2/database/download/SKEMPI2_PDBs.tgz
|
|
98
|
+
files:
|
|
99
|
+
- SKEMPI2_PDBs.tgz
|
|
100
|
+
notes: 'Download via wget from life.bsc.es and extract with tar -xvzf. A quality-filtered
|
|
101
|
+
SKEMPI CSV and interface-homology cluster train/test splits are pre-packaged
|
|
102
|
+
in data/SKEMPI/. The raw PDB structures must be downloaded separately. Required
|
|
103
|
+
for Stage 2 fine-tuning and for eval_only profile.
|
|
104
|
+
|
|
105
|
+
'
|
|
106
|
+
- name: Benchmark Package Archive
|
|
107
|
+
url: https://deepscientist.cc/AISB/065_proteinbinding
|
|
108
|
+
archive_type: zip
|
|
109
|
+
local_dir_name: paper-65-ProteinBinding
|
|
110
|
+
notes: 'Contains pre-trained model checkpoints (model_ckpts/stabddg.pt, model_ckpts/stability_finetuned.pt,
|
|
111
|
+
model_ckpts/proteinmpnn.pt), packaged SKEMPI splits, baseline prediction CSVs,
|
|
112
|
+
and example inputs.
|
|
113
|
+
|
|
114
|
+
'
|
|
115
|
+
notes:
|
|
116
|
+
- Pre-trained checkpoints are included in the benchmark archive; full training requires
|
|
117
|
+
both external dataset downloads.
|
|
118
|
+
- SKEMPI PDB download is required even for eval_only; the filtered CSV is pre-packaged.
|
|
119
|
+
credential_requirements:
|
|
120
|
+
mode: none
|
|
121
|
+
items: []
|
|
122
|
+
notes:
|
|
123
|
+
- All data sources are publicly accessible without authentication.
|
|
124
|
+
- Optional Wandb account needed only if using the --wandb training flag.
|
|
125
|
+
resources:
|
|
126
|
+
minimum:
|
|
127
|
+
cpu_cores: 8
|
|
128
|
+
ram_gb: 32
|
|
129
|
+
disk_gb: 100
|
|
130
|
+
gpu_count: 1
|
|
131
|
+
gpu_vram_gb: 16
|
|
132
|
+
notes: 'Sufficient for single-prediction and eval_only profiles using the pre-trained
|
|
133
|
+
checkpoint. Stability fine-tuning requires torch.device=''cuda'' and will OOM
|
|
134
|
+
below 16 GB VRAM.
|
|
135
|
+
|
|
136
|
+
'
|
|
137
|
+
recommended:
|
|
138
|
+
cpu_cores: 16
|
|
139
|
+
ram_gb: 64
|
|
140
|
+
disk_gb: 200
|
|
141
|
+
gpu_count: 1
|
|
142
|
+
gpu_vram_gb: 24
|
|
143
|
+
notes: 'Recommended for full train+eval profile. Extra disk headroom accommodates
|
|
144
|
+
Megascale AlphaFold PDBs (~50 GB unzipped) and SKEMPI PDB structures alongside
|
|
145
|
+
checkpoints.
|
|
146
|
+
|
|
147
|
+
'
|
|
148
|
+
environment:
|
|
149
|
+
python: '3.10'
|
|
150
|
+
cuda: null
|
|
151
|
+
pytorch: 2.6.0
|
|
152
|
+
flash_attn: null
|
|
153
|
+
key_packages:
|
|
154
|
+
- biopython==1.85
|
|
155
|
+
- scipy
|
|
156
|
+
- tqdm
|
|
157
|
+
- wandb
|
|
158
|
+
- pandas
|
|
159
|
+
setup_method: conda
|
|
160
|
+
setup_file: environment.yaml
|
|
161
|
+
notes:
|
|
162
|
+
- Create environment with: conda env create -f environment.yaml && conda activate
|
|
163
|
+
stabddg
|
|
164
|
+
- Alternatively, install into an existing PyTorch environment with: pip install
|
|
165
|
+
tqdm scipy wandb pandas biopython
|
|
166
|
+
- Optional editable install: pip install -e .
|
|
167
|
+
- See environment.yaml for the full pinned dependency set.
|
|
168
|
+
- CUDA is required for training stages (torch.device='cuda'); inference can run
|
|
169
|
+
on CPU but is significantly slower.
|
|
170
|
+
paper:
|
|
171
|
+
title: Predicting mutational effects on protein binding from folding energy
|
|
172
|
+
authors:
|
|
173
|
+
- Arthur Deng
|
|
174
|
+
- Karsten Householder
|
|
175
|
+
- Fang Wu
|
|
176
|
+
- Sebastian Thrun
|
|
177
|
+
- K. Christopher Garcia
|
|
178
|
+
- Brian Trippe
|
|
179
|
+
affiliation: Stanford University
|
|
180
|
+
venue: Proceedings of the 42nd International Conference on Machine Learning (ICML
|
|
181
|
+
2025)
|
|
182
|
+
year: 2025
|
|
183
|
+
url: https://arxiv.org/abs/2507.05502
|
|
184
|
+
code: https://github.com/LDeng0205/StaB-ddG
|
|
185
|
+
notes: 'Originally posted as an arXiv preprint (2507.05502) and accepted at ICML
|
|
186
|
+
2025 (PMLR 267). Introduces StaB-ddG as the first DL predictor to match FoldX
|
|
187
|
+
accuracy on SKEMPI while offering >1,000× speed-up over Rosetta-based Flex ddG.
|
|
188
|
+
|
|
189
|
+
'
|
|
190
|
+
download:
|
|
191
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.065_proteinbinding.zip
|
|
192
|
+
archive_type: zip
|
|
193
|
+
local_dir_name: paper-65-ProteinBinding
|
|
194
|
+
provider: github_release
|
|
195
|
+
repo: ResearAI/DeepScientist
|
|
196
|
+
tag: aisb-v0.0.1
|
|
197
|
+
asset_name: aisb.t3.065_proteinbinding.zip
|
|
198
|
+
sha256: 07ea82db652e56e0bd609f637362cd91f74d76f1356d3b7cd3d9c14d82fda319
|
|
199
|
+
size_bytes: 2277469
|
|
200
|
+
commercial:
|
|
201
|
+
annual_fee: null
|
|
202
|
+
display:
|
|
203
|
+
palette_seed: sage-bone-protein
|
|
204
|
+
art_style: molecular-atlas
|
|
205
|
+
accent_priority: high
|
|
206
|
+
image_path: ../image/065_aisb.t3.065_proteinbinding.jpg
|
|
207
|
+
recommended_when: 'Use this benchmark when evaluating models on structural-biology
|
|
208
|
+
tasks involving PDB inputs, mutation lists, and ΔΔG regression or ranking metrics.
|
|
209
|
+
Ideal when the goal is to assess transfer learning from stability to binding, compare
|
|
210
|
+
against FoldX or Flex ddG baselines, or reproduce ICML 2025 SKEMPI benchmark results.
|
|
211
|
+
Also suitable for single-complex inference workflows where only the pre-trained
|
|
212
|
+
checkpoint is needed.
|
|
213
|
+
|
|
214
|
+
'
|
|
215
|
+
not_recommended_when: 'Do not use this benchmark if you need a text-only or sequence-only
|
|
216
|
+
task with no structural inputs. Avoid if your environment cannot provide PDB structure
|
|
217
|
+
files for the wild-type interface or cannot satisfy the GPU memory requirement for
|
|
218
|
+
training. Not appropriate for benchmarks requiring fast iteration cycles, as the
|
|
219
|
+
full train+eval profile takes up to 24 h and requires large external dataset downloads.
|
|
220
|
+
|
|
221
|
+
'
|
|
222
|
+
risk_flags:
|
|
223
|
+
- external_data_download_required
|
|
224
|
+
- gpu_required_for_training
|
|
225
|
+
- no_execution_verified_in_packaging_pass
|
|
226
|
+
risk_notes:
|
|
227
|
+
- Metric values in metric_contract.json are code-backed but not yet verified by live
|
|
228
|
+
execution; trust only after a successful benchmark run produces cache/eval.csv.
|
|
229
|
+
- Megascale AlphaFold PDB download (~50 GB unzipped) may be slow or interrupted on
|
|
230
|
+
low-bandwidth connections; resume support via wget -c.
|
|
231
|
+
- SKEMPI PDB structures must be downloaded separately from life.bsc.es; the filtered
|
|
232
|
+
CSV and splits are pre-packaged but the raw PDBs are not.
|
|
233
|
+
- Monte Carlo variance reduction uses ensemble=20 samples by default at inference;
|
|
234
|
+
reducing this speeds up inference but increases prediction variance.
|
|
@@ -0,0 +1,167 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.065_proteinbinding
|
|
3
|
+
name: StaB-ddG — 通过折叠能量预测蛋白质结合的突变效应
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 基于稳定性到结合参数化的蛋白质-蛋白质结合 ΔΔG 预测迁移学习基准,使用 ProteinMPNN 和两阶段微调。
|
|
6
|
+
task_description: |
|
|
7
|
+
本基准包涵盖完整的 StaB-ddG 工作流程,用于预测突变对蛋白质-蛋白质结合自由能的影响(ΔΔG,kcal/mol)。其核心思想是热力学恒等式 ΔG_bind(A:B) = ΔG_fold(A:B) − ΔG_fold(A) − ΔG_fold(B),它将结合能预测简化为折叠能预测,并实现了从大量稳定性数据到稀缺结合数据的迁移。
|
|
8
|
+
|
|
9
|
+
基准测试分为两个微调阶段:
|
|
10
|
+
|
|
11
|
+
第一阶段 — 稳定性微调:ProteinMPNN 在 Megascale 高通量折叠稳定性数据集上进行微调(Tsuboyama 2023,约 35 万个测量值,AlphaFold PDB 结构,从 Zenodo 记录 7992926 下载)。
|
|
12
|
+
|
|
13
|
+
第二阶段 — 结合微调:将在第一阶段微调后的模型在 SKEMPI v2 数据库中蛋白质-蛋白质结合 ΔΔG 测量的质量过滤子集上进一步微调,使用界面同源聚类划分来防止数据泄露。
|
|
14
|
+
|
|
15
|
+
评估复现了 ICML 2025 论文中报告的 SKEMPI 基准结果,计算每个界面的 Pearson 和 Spearman 相关系数、总体相关系数、RMSE 和 ROC-AUC。基准比较包含 FoldX 和 Flex ddG,在打包的 baselines/ 目录中提供。StaB-ddG 是首个被报道能够匹配 FoldX 精度的深度学习预测器,同时提供超过 1000 倍的加速。
|
|
16
|
+
|
|
17
|
+
输入:PDB 结构文件(野生型复合物)、链规格和突变字符串。输出:每个突变的 ΔΔG 预测值(kcal/mol)、每个界面的相关性指标以及完整的评估 CSV。
|
|
18
|
+
capability_tags:
|
|
19
|
+
- protein_modeling
|
|
20
|
+
- binding_energy_prediction
|
|
21
|
+
- structural_biology
|
|
22
|
+
- scientific_ml
|
|
23
|
+
- transfer_learning
|
|
24
|
+
- research_code_optimization
|
|
25
|
+
aisb_direction: T3
|
|
26
|
+
track_fit:
|
|
27
|
+
- paper_track
|
|
28
|
+
- benchmark_track
|
|
29
|
+
task_mode: experiment_driven
|
|
30
|
+
requires_execution: true
|
|
31
|
+
requires_paper: true
|
|
32
|
+
integrity_level: cas_plus_canary
|
|
33
|
+
snapshot_status: runnable
|
|
34
|
+
support_level: advanced
|
|
35
|
+
time_band: 6-24h
|
|
36
|
+
cost_band: medium
|
|
37
|
+
difficulty: hard
|
|
38
|
+
data_access: public
|
|
39
|
+
primary_outputs:
|
|
40
|
+
- per_interface_pearson
|
|
41
|
+
- per_interface_spearman
|
|
42
|
+
- overall_pearson
|
|
43
|
+
- overall_spearman
|
|
44
|
+
- roc_auc
|
|
45
|
+
- ddg_predictions
|
|
46
|
+
- binding_report
|
|
47
|
+
launch_profiles:
|
|
48
|
+
- id: single_prediction
|
|
49
|
+
label: 单次预测
|
|
50
|
+
description: |
|
|
51
|
+
使用 run_stabddg.py 对单个复合物进行单点突变或多点突变 ΔΔG 预测。需要提供 PDB 文件、链规格(如 ABC_DE)和突变字符串(如 EA63Q,QD30V,KA66A)。使用预训练的 stabddg.pt 检查点。输出包含 pred_1 列的 output.csv。无需下载训练数据。
|
|
52
|
+
- id: eval_only
|
|
53
|
+
label: 仅评估
|
|
54
|
+
description: |
|
|
55
|
+
通过 skempi_eval.py 使用预训练的 stabddg.pt 检查点复现 SKEMPI 基准数值。需要从 life.bsc.es 下载 SKEMPI2_PDBs。生成 cache/eval.csv 和每个界面的相关性指标。是获得论文数值的最快途径。
|
|
56
|
+
- id: train_and_eval
|
|
57
|
+
label: 完整训练 + 评估
|
|
58
|
+
description: |
|
|
59
|
+
运行完整的两阶段微调和评估流程:(1)通过 stability_finetune.py 在 Megascale 上进行稳定性微调,然后(2)通过 skempi_finetune.py 进行 SKEMPI 结合微调,然后(3)通过 skempi_eval.py 进行评估。需要同时下载 Megascale 和 SKEMPI 数据。可通过 --wandb 标志启用可选的 Wandb 跟踪。
|
|
60
|
+
dataset_download:
|
|
61
|
+
primary_method: mixed
|
|
62
|
+
sources:
|
|
63
|
+
- name: Megascale Folding Stability Dataset (Stage 1)
|
|
64
|
+
url: https://zenodo.org/records/7992926
|
|
65
|
+
files:
|
|
66
|
+
- Tsuboyama2023_Dataset2_Dataset3_20230416.csv
|
|
67
|
+
- AlphaFold_model_PDBs.zip
|
|
68
|
+
- Processed_K50_dG_datasets.zip
|
|
69
|
+
notes: |
|
|
70
|
+
通过 wget 从 Zenodo 记录 7992926 下载。运行 stability_finetune.py 前请解压两个压缩包。下载需要几分钟。仅第一阶段需要。
|
|
71
|
+
- name: SKEMPI v2 Binding Energy Dataset (Stage 2 and Eval)
|
|
72
|
+
url: https://life.bsc.es/pid/skempi2/database/download/SKEMPI2_PDBs.tgz
|
|
73
|
+
files:
|
|
74
|
+
- SKEMPI2_PDBs.tgz
|
|
75
|
+
notes: |
|
|
76
|
+
通过 wget 从 life.bsc.es 下载并使用 tar -xvzf 解压。质量过滤后的 SKEMPI CSV 和界面同源聚类训练/测试划分已预装在 data/SKEMPI/ 中。原始 PDB 结构需要单独下载。第二阶段微调和仅评估模式需要此数据。
|
|
77
|
+
- name: Benchmark Package Archive
|
|
78
|
+
url: https://deepscientist.cc/AISB/065_proteinbinding
|
|
79
|
+
archive_type: zip
|
|
80
|
+
local_dir_name: paper-65-ProteinBinding
|
|
81
|
+
notes: |
|
|
82
|
+
包含预训练模型检查点(model_ckpts/stabddg.pt、model_ckpts/stability_finetuned.pt、model_ckpts/proteinmpnn.pt)、打包的 SKEMPI 划分、基线预测 CSV 和示例输入。
|
|
83
|
+
notes:
|
|
84
|
+
- 基准包中包含预训练检查点;完整训练需要下载两个外部数据集。
|
|
85
|
+
- 即使是仅评估模式也需要下载 SKEMPI PDB;过滤后的 CSV 已预装。
|
|
86
|
+
credential_requirements:
|
|
87
|
+
mode: none
|
|
88
|
+
items: []
|
|
89
|
+
notes:
|
|
90
|
+
- 所有数据源均可公开访问,无需认证。
|
|
91
|
+
- 仅在使用 --wandb 训练标志时才需要可选的 Wandb 账户。
|
|
92
|
+
resources:
|
|
93
|
+
minimum:
|
|
94
|
+
cpu_cores: 8
|
|
95
|
+
ram_gb: 32
|
|
96
|
+
disk_gb: 100
|
|
97
|
+
gpu_count: 1
|
|
98
|
+
gpu_vram_gb: 16
|
|
99
|
+
notes: |
|
|
100
|
+
使用预训练检查点进行单次预测和仅评估模式时足够。稳定性微调需要 torch.device='cuda',在 16 GB 以下显存会 OOM。
|
|
101
|
+
recommended:
|
|
102
|
+
cpu_cores: 16
|
|
103
|
+
ram_gb: 64
|
|
104
|
+
disk_gb: 200
|
|
105
|
+
gpu_count: 1
|
|
106
|
+
gpu_vram_gb: 24
|
|
107
|
+
notes: |
|
|
108
|
+
推荐用于完整训练+评估模式。额外的磁盘空间用于容纳 Megascale AlphaFold PDB(解压后约 50 GB)和 SKEMPI PDB 结构以及检查点。
|
|
109
|
+
environment:
|
|
110
|
+
python: '3.10'
|
|
111
|
+
cuda: null
|
|
112
|
+
pytorch: 2.6.0
|
|
113
|
+
flash_attn: null
|
|
114
|
+
key_packages:
|
|
115
|
+
- biopython==1.85
|
|
116
|
+
- scipy
|
|
117
|
+
- tqdm
|
|
118
|
+
- wandb
|
|
119
|
+
- pandas
|
|
120
|
+
setup_method: conda
|
|
121
|
+
setup_file: environment.yaml
|
|
122
|
+
notes: |
|
|
123
|
+
使用 conda env create -f environment.yaml && conda activate stabddg 创建环境。或者,使用 pip install tqdm scipy wandb pandas biopython 安装到现有 PyTorch 环境中。可选的 editable 安装:pip install -e . 有关完整的固定依赖集,请参阅 environment.yaml。训练阶段需要 CUDA(torch.device='cuda');推理可以在 CPU 上运行,但速度会显著变慢。
|
|
124
|
+
paper:
|
|
125
|
+
title: Predicting mutational effects on protein binding from folding energy
|
|
126
|
+
authors:
|
|
127
|
+
- Arthur Deng
|
|
128
|
+
- Karsten Householder
|
|
129
|
+
- Fang Wu
|
|
130
|
+
- Sebastian Thrun
|
|
131
|
+
- K. Christopher Garcia
|
|
132
|
+
- Brian Trippe
|
|
133
|
+
affiliation: Stanford University
|
|
134
|
+
venue: Proceedings of the 42nd International Conference on Machine Learning (ICML
|
|
135
|
+
2025)
|
|
136
|
+
year: 2025
|
|
137
|
+
url: https://arxiv.org/abs/2507.05502
|
|
138
|
+
code: https://github.com/LDeng0205/StaB-ddG
|
|
139
|
+
notes: |
|
|
140
|
+
最初作为 arXiv 预印本(2507.05502)发布,并被 ICML 2025(PMLR 267)接收。介绍了 StaB-ddG 作为首个在 SKEMPI 上匹配 FoldX 精度的深度学习预测器,同时比基于 Rosetta 的 Flex ddG 提供超过 1000 倍的加速。
|
|
141
|
+
download:
|
|
142
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.065_proteinbinding.zip
|
|
143
|
+
archive_type: zip
|
|
144
|
+
local_dir_name: paper-65-ProteinBinding
|
|
145
|
+
provider: github_release
|
|
146
|
+
repo: ResearAI/DeepScientist
|
|
147
|
+
tag: aisb-v0.0.1
|
|
148
|
+
asset_name: aisb.t3.065_proteinbinding.zip
|
|
149
|
+
sha256: 07ea82db652e56e0bd609f637362cd91f74d76f1356d3b7cd3d9c14d82fda319
|
|
150
|
+
size_bytes: 2277469
|
|
151
|
+
commercial:
|
|
152
|
+
annual_fee: null
|
|
153
|
+
display:
|
|
154
|
+
palette_seed: sage-bone-protein
|
|
155
|
+
art_style: molecular-atlas
|
|
156
|
+
accent_priority: high
|
|
157
|
+
image_path: ../image/065_aisb.t3.065_proteinbinding.jpg
|
|
158
|
+
recommended_when: |
|
|
159
|
+
在评估涉及 PDB 输入、突变列表和 ΔΔG 回归或排序指标的结构生物学任务模型时使用此基准。当目标是评估从稳定性到结合的迁移学习、与 FoldX 或 Flex ddG 基线进行比较、或复现 ICML 2025 SKEMPI 基准结果时尤为理想。也适用于只需预训练检查点的单复合物推理工作流。
|
|
160
|
+
not_recommended_when: |
|
|
161
|
+
如果需要纯文本或纯序列任务且没有结构输入,请勿使用此基准。如果您的环境无法提供野生型界面的 PDB 结构文件或无法满足训练的 GPU 内存要求,请避免使用。不适合需要快速迭代周期的基准测试,因为完整的训练+评估流程最多需要 24 小时,且需要下载大型外部数据集。
|
|
162
|
+
risk_flags:
|
|
163
|
+
- external_data_download_required
|
|
164
|
+
- gpu_required_for_training
|
|
165
|
+
- no_execution_verified_in_packaging_pass
|
|
166
|
+
risk_notes: |
|
|
167
|
+
metric_contract.json 中的指标值有代码支持,但尚未通过实际执行验证;仅在基准测试成功运行生成 cache/eval.csv 后才可信。Megascale AlphaFold PDB 下载(解压后约 50 GB)在低带宽连接上可能较慢或中断;通过 wget -c 支持断点续传。SKEMPI PDB 结构必须从 life.bsc.es 单独下载;过滤后的 CSV 和划分已预装,但原始 PDB 除外。蒙特卡洛方差缩减在推理时默认使用 ensemble=20 个样本;减少此值会加快推理但会增加预测方差。
|
|
@@ -0,0 +1,267 @@
|
|
|
1
|
+
id: aisb.t3.066_tropicalattention
|
|
2
|
+
name: 'Tropical Attention: Neural Algorithmic Reasoning for Combinatorial Algorithms'
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: Tropical-geometry-based attention mechanism for neural algorithmic reasoning
|
|
5
|
+
on combinatorial tasks, achieving sharp OOD generalization beyond PTIME to NP-hard
|
|
6
|
+
problems.
|
|
7
|
+
task_description: 'This packaged benchmark covers Tropical Attention, an attention
|
|
8
|
+
mechanism grounded in tropical geometry that lifts the attention kernel into tropical
|
|
9
|
+
projective space where reasoning is piecewise-linear and 1-Lipschitz. The benchmark
|
|
10
|
+
evaluates whether replacing or augmenting conventional softmax attention with tropical-geometry
|
|
11
|
+
structure improves algorithmic generalization on 11 combinatorial tasks spanning
|
|
12
|
+
polynomial-time algorithms (Floyd-Warshall, Quickselect, Convex Hull, SCC), NP-complete
|
|
13
|
+
problems (3SUM, Balanced Partition, Subset Sum), and NP-hard problems (0/1 Knapsack,
|
|
14
|
+
Bin Packing, Min Coin Change). Tasks are evaluated under out-of-distribution (OOD)
|
|
15
|
+
conditions including length extrapolation and value-range generalization. Primary
|
|
16
|
+
metric is quickselect_length_ood_f1 measuring length-OOD F1 score on the Quickselect
|
|
17
|
+
task.
|
|
18
|
+
|
|
19
|
+
'
|
|
20
|
+
task_mode: experiment_driven
|
|
21
|
+
requires_execution: true
|
|
22
|
+
requires_paper: true
|
|
23
|
+
integrity_level: cas_plus_canary
|
|
24
|
+
snapshot_status: runnable
|
|
25
|
+
support_level: advanced
|
|
26
|
+
time_band: 6-24h
|
|
27
|
+
cost_band: medium
|
|
28
|
+
difficulty: hard
|
|
29
|
+
data_access: public
|
|
30
|
+
primary_outputs:
|
|
31
|
+
- quickselect_length_ood_f1
|
|
32
|
+
- algorithmic_reasoning_report
|
|
33
|
+
- trained_checkpoint
|
|
34
|
+
launch_profiles:
|
|
35
|
+
- id: quick_eval
|
|
36
|
+
label: Quick Eval
|
|
37
|
+
description: 'Run one packaged neural algorithmic reasoning evaluation route. Loads
|
|
38
|
+
a pre-trained checkpoint and evaluates on OOD test splits for all 11 combinatorial
|
|
39
|
+
tasks. Use --job_file pointing to jobs_to_do_evaluate.csv with --job_id selecting
|
|
40
|
+
the target task. Outputs length-OOD and value-OOD F1 scores per task.
|
|
41
|
+
|
|
42
|
+
'
|
|
43
|
+
- id: full_train_eval
|
|
44
|
+
label: Full Train + Eval
|
|
45
|
+
description: 'Run the complete tropical-attention training and OOD reasoning benchmark
|
|
46
|
+
workflow. Trains models from scratch on 100k samples per task using schedulefree
|
|
47
|
+
optimizer, then evaluates on OOD test sets. Training logs saved to outputs/<timestamp>/.
|
|
48
|
+
Uses --job_file pointing to jobs_to_do_train.csv with --job_id selecting the task
|
|
49
|
+
row.
|
|
50
|
+
|
|
51
|
+
'
|
|
52
|
+
dataset_download:
|
|
53
|
+
primary_method: mixed
|
|
54
|
+
sources:
|
|
55
|
+
- url: https://deepscientist.cc/AISB/066_tropicalattention
|
|
56
|
+
type: benchmark_archive
|
|
57
|
+
archive_type: zip
|
|
58
|
+
local_dir_name: paper-66-TropicalAttention
|
|
59
|
+
- url: https://github.com/Baran-phys/Tropical-Attention
|
|
60
|
+
type: upstream_repository
|
|
61
|
+
notes:
|
|
62
|
+
- Archive contains full code, dataloaders, models, and evaluation scripts
|
|
63
|
+
- Datasets are procedurally generated at runtime via dataloaders.py
|
|
64
|
+
credential_requirements:
|
|
65
|
+
mode: none
|
|
66
|
+
items: []
|
|
67
|
+
notes: []
|
|
68
|
+
resources:
|
|
69
|
+
minimum:
|
|
70
|
+
cpu_cores: 8
|
|
71
|
+
ram_gb: 32
|
|
72
|
+
disk_gb: 50
|
|
73
|
+
gpu_count: 1
|
|
74
|
+
gpu_vram_gb: 16
|
|
75
|
+
notes: Capable of running single-task training; evaluation-only requires less
|
|
76
|
+
recommended:
|
|
77
|
+
cpu_cores: 16
|
|
78
|
+
ram_gb: 64
|
|
79
|
+
disk_gb: 100
|
|
80
|
+
gpu_count: 1
|
|
81
|
+
gpu_vram_gb: 24
|
|
82
|
+
notes: 'Recommended for full multi-task training runs. Single GPU suffices due
|
|
83
|
+
to ~20% fewer parameters than Universal Transformer baselines.
|
|
84
|
+
|
|
85
|
+
'
|
|
86
|
+
environment:
|
|
87
|
+
python: '3.10'
|
|
88
|
+
cuda: '11.8'
|
|
89
|
+
pytorch: 2.1.0
|
|
90
|
+
flash_attn: null
|
|
91
|
+
key_packages:
|
|
92
|
+
- torch
|
|
93
|
+
- schedulefree
|
|
94
|
+
- pandas
|
|
95
|
+
- matplotlib
|
|
96
|
+
- scikit-learn
|
|
97
|
+
notes:
|
|
98
|
+
- See bundled requirements.txt for full dependency set
|
|
99
|
+
- TropicalAttention.py is a drop-in module for standard Transformer blocks
|
|
100
|
+
- CUDA required for training; CPU fallback supported for inference
|
|
101
|
+
risk_flags:
|
|
102
|
+
- ood_metric_variance
|
|
103
|
+
- multi_seed_required
|
|
104
|
+
risk_notes:
|
|
105
|
+
- OOD F1 scores show variance across seeds (e.g., SubsetSum 87.50±6.45); multi-seed
|
|
106
|
+
evaluation recommended
|
|
107
|
+
- Floyd-Warshall and Fractional Knapsack show lower OOD scores than classification
|
|
108
|
+
tasks
|
|
109
|
+
- Training uses 100k samples per task; disk space needed for outputs/<timestamp>/
|
|
110
|
+
artifacts
|
|
111
|
+
recommended_when: 'Use this benchmark when you need to evaluate neural reasoning over
|
|
112
|
+
graph and combinatorial problems with clear OOD behavior. Specifically suited for:
|
|
113
|
+
(1) evaluating attention mechanisms on length-extrapolation tasks, (2) benchmarking
|
|
114
|
+
NP-hard/complete problem solving beyond PTIME, (3) comparing tropical-geometry inductive
|
|
115
|
+
bias against softmax-based transformers, (4) studying polyhedral decision boundaries
|
|
116
|
+
in neural algorithmic reasoning.
|
|
117
|
+
|
|
118
|
+
'
|
|
119
|
+
not_recommended_when: 'Do not use this if you need a plug-and-play application benchmark
|
|
120
|
+
without specialized reasoning datasets. Not suitable when only in-distribution accuracy
|
|
121
|
+
matters, or when PTIME-only algorithmic reasoning is sufficient. Avoid if the research
|
|
122
|
+
question does not involve combinatorial optimization, attention mechanism design,
|
|
123
|
+
or OOD generalization.
|
|
124
|
+
|
|
125
|
+
'
|
|
126
|
+
paper:
|
|
127
|
+
title: 'Tropical Attention: Neural Algorithmic Reasoning for Combinatorial Algorithms'
|
|
128
|
+
venue: NeurIPS 2025
|
|
129
|
+
year: 2025
|
|
130
|
+
url: https://arxiv.org/abs/2505.17190
|
|
131
|
+
authors:
|
|
132
|
+
- Hashemi, Baran (Origins Data Science Lab, Technical University of Munich)
|
|
133
|
+
- Pasque, Kurt (Naval Postgraduate School)
|
|
134
|
+
- Teska, Chris (Naval Postgraduate School)
|
|
135
|
+
- Yoshida, Ruriko (Naval Postgraduate School)
|
|
136
|
+
download:
|
|
137
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.066_tropicalattention.zip
|
|
138
|
+
archive_type: zip
|
|
139
|
+
local_dir_name: paper-66-TropicalAttention
|
|
140
|
+
upstream_url: https://github.com/Baran-phys/Tropical-Attention
|
|
141
|
+
provider: github_release
|
|
142
|
+
repo: ResearAI/DeepScientist
|
|
143
|
+
tag: aisb-v0.0.1
|
|
144
|
+
asset_name: aisb.t3.066_tropicalattention.zip
|
|
145
|
+
sha256: 59c566c1c49e1649bad3e39f2100133d7cb97cea8df9665ae1dea27bcd4a80db
|
|
146
|
+
size_bytes: 1618773
|
|
147
|
+
display:
|
|
148
|
+
palette_seed: lime-violet-tropical
|
|
149
|
+
art_style: geometric-reasoning
|
|
150
|
+
accent_priority: high
|
|
151
|
+
image_path: ../image/066_aisb.t3.066_tropicalattention.jpg
|
|
152
|
+
capability_tags:
|
|
153
|
+
- research_code_optimization
|
|
154
|
+
- neural_algorithmic_reasoning
|
|
155
|
+
- combinatorial_optimization
|
|
156
|
+
- transformers
|
|
157
|
+
- mathematical_reasoning
|
|
158
|
+
- tropical_geometry
|
|
159
|
+
- out_of_distribution_generalization
|
|
160
|
+
- attention_mechanisms
|
|
161
|
+
- np_complete_problems
|
|
162
|
+
- np_hard_problems
|
|
163
|
+
aisb_direction: T3
|
|
164
|
+
track_fit:
|
|
165
|
+
- paper_track
|
|
166
|
+
- benchmark_track
|
|
167
|
+
commercial:
|
|
168
|
+
annual_fee: null
|
|
169
|
+
experiment_anchors:
|
|
170
|
+
train_script: experiment.py
|
|
171
|
+
train_job_csv: jobs_to_do_train.csv
|
|
172
|
+
eval_job_csv: jobs_to_do_evaluate.csv
|
|
173
|
+
attention_module: TropicalAttention.py
|
|
174
|
+
eval_script: eval.py
|
|
175
|
+
metric_contract: json/metric_contract.json
|
|
176
|
+
task_specifications:
|
|
177
|
+
- task_name: Quickselect
|
|
178
|
+
type: classification
|
|
179
|
+
ood_metric: length_ood_f1
|
|
180
|
+
training_length_range: (10,30)
|
|
181
|
+
evaluation_length_range: (10,1024)
|
|
182
|
+
epochs: 100
|
|
183
|
+
notes: Primary OOD benchmark; sharp attention maps preserve k-th element selection
|
|
184
|
+
- task_name: SubsetSumDecision
|
|
185
|
+
type: classification
|
|
186
|
+
complexity: NP-complete
|
|
187
|
+
training_length_range: (8,8)
|
|
188
|
+
value_range: (-5,5)
|
|
189
|
+
epochs: 100
|
|
190
|
+
- task_name: Knapsack
|
|
191
|
+
type: classification
|
|
192
|
+
complexity: NP-hard
|
|
193
|
+
training_length_range: (10,20)
|
|
194
|
+
epochs: 100
|
|
195
|
+
- task_name: BalancedPartition
|
|
196
|
+
type: classification
|
|
197
|
+
complexity: NP-complete
|
|
198
|
+
training_length_range: (10,30)
|
|
199
|
+
epochs: 1000
|
|
200
|
+
- task_name: BinPacking
|
|
201
|
+
type: classification
|
|
202
|
+
complexity: NP-hard
|
|
203
|
+
training_length_range: (10,30)
|
|
204
|
+
epochs: 1000
|
|
205
|
+
- task_name: MinCoinChange
|
|
206
|
+
type: classification
|
|
207
|
+
training_length_range: (10,20)
|
|
208
|
+
epochs: 100
|
|
209
|
+
- task_name: ConvexHull
|
|
210
|
+
type: classification
|
|
211
|
+
training_length_range: (10,30)
|
|
212
|
+
epochs: 100
|
|
213
|
+
- task_name: FractionalKnapsack
|
|
214
|
+
type: regression
|
|
215
|
+
training_length_range: (10,20)
|
|
216
|
+
epochs: 100
|
|
217
|
+
notes: Lower OOD performance expected for regression tasks
|
|
218
|
+
- task_name: FloydWarshall
|
|
219
|
+
type: regression
|
|
220
|
+
training_length_range: (10,30)
|
|
221
|
+
epochs: 100
|
|
222
|
+
notes: All-pairs shortest paths; lower OOD scores than classification tasks
|
|
223
|
+
- task_name: SCC
|
|
224
|
+
type: classification
|
|
225
|
+
training_length_range: (10,30)
|
|
226
|
+
epochs: 100
|
|
227
|
+
- task_name: 3SUM
|
|
228
|
+
type: classification
|
|
229
|
+
complexity: NP-complete
|
|
230
|
+
training_length_range: (10,30)
|
|
231
|
+
epochs: 100
|
|
232
|
+
execution_notes:
|
|
233
|
+
training_invocation: 'python experiment.py --job_file jobs_to_do_train.csv --job_id
|
|
234
|
+
<row_index>
|
|
235
|
+
|
|
236
|
+
'
|
|
237
|
+
evaluation_invocation: 'python experiment.py --job_file jobs_to_do_evaluate.csv
|
|
238
|
+
--job_id <row_index>
|
|
239
|
+
|
|
240
|
+
'
|
|
241
|
+
job_csv_fields:
|
|
242
|
+
- task
|
|
243
|
+
- model_type
|
|
244
|
+
- dataset_name
|
|
245
|
+
- input_dim
|
|
246
|
+
- d_model
|
|
247
|
+
- n_heads
|
|
248
|
+
- num_layers
|
|
249
|
+
- num_epochs
|
|
250
|
+
- dropout
|
|
251
|
+
- lr
|
|
252
|
+
- seed
|
|
253
|
+
- n_samples
|
|
254
|
+
- batch_size
|
|
255
|
+
- length_range
|
|
256
|
+
- value_range
|
|
257
|
+
- noise_prob
|
|
258
|
+
output_directory: outputs/<timestamp>/
|
|
259
|
+
default_hyperparameters:
|
|
260
|
+
d_model: 64
|
|
261
|
+
n_heads: 2
|
|
262
|
+
num_layers: 1
|
|
263
|
+
dropout: 0
|
|
264
|
+
learning_rate: 0.0001
|
|
265
|
+
batch_size: 500
|
|
266
|
+
n_samples: 100000
|
|
267
|
+
seed: 999
|