@researai/deepscientist 1.5.17 → 1.6.0
This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +309 -130
- package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
- package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
- package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
- package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
- package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
- package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
- package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
- package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
- package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
- package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
- package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
- package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
- package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
- package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
- package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
- package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
- package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
- package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
- package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
- package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
- package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
- package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
- package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
- package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
- package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
- package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
- package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
- package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
- package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
- package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
- package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
- package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
- package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
- package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
- package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
- package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
- package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
- package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
- package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
- package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
- package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
- package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
- package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
- package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
- package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
- package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
- package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
- package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
- package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
- package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
- package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
- package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
- package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
- package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
- package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
- package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
- package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
- package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
- package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
- package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
- package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
- package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
- package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
- package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
- package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
- package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
- package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
- package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
- package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
- package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
- package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
- package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
- package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
- package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
- package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
- package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
- package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
- package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
- package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
- package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
- package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
- package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
- package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
- package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
- package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
- package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
- package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
- package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
- package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
- package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
- package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
- package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
- package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
- package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
- package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
- package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
- package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
- package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
- package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
- package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
- package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
- package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
- package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
- package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
- package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
- package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
- package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
- package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
- package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
- package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
- package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
- package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
- package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
- package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
- package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
- package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
- package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
- package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
- package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
- package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
- package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
- package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
- package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
- package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
- package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
- package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
- package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
- package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
- package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
- package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
- package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
- package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
- package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
- package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
- package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
- package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
- package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
- package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
- package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
- package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
- package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
- package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
- package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
- package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
- package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
- package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
- package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
- package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
- package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
- package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
- package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
- package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
- package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
- package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
- package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
- package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
- package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
- package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
- package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
- package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
- package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
- package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
- package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
- package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
- package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
- package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
- package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
- package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
- package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
- package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
- package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
- package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
- package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
- package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
- package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
- package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
- package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
- package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
- package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
- package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
- package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
- package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
- package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
- package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
- package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
- package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
- package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
- package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
- package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
- package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
- package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
- package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
- package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
- package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
- package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
- package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
- package/AISB/image/aisb.b10.climate_earth.svg +16 -0
- package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
- package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
- package/AISB/image/aisb.b2.agent_systems.svg +16 -0
- package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
- package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
- package/AISB/image/aisb.b5.math_proof.svg +16 -0
- package/AISB/image/aisb.b6.research_process.svg +16 -0
- package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
- package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
- package/AISB/image/aisb.b9.material_science.svg +16 -0
- package/README.md +132 -11
- package/bin/ds.js +376 -49
- package/docs/en/00_QUICK_START.md +135 -18
- package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
- package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
- package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
- package/docs/en/05_TUI_GUIDE.md +171 -2
- package/docs/en/07_MEMORY_AND_MCP.md +38 -2
- package/docs/en/09_DOCTOR.md +64 -4
- package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
- package/docs/en/11_LICENSE_AND_RISK.md +4 -0
- package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/en/15_CODEX_PROVIDER_SETUP.md +622 -187
- package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
- package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
- package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
- package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
- package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
- package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
- package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
- package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
- package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
- package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
- package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
- package/docs/en/91_DEVELOPMENT.md +29 -0
- package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
- package/docs/en/README.md +44 -7
- package/docs/images/admin/admin-connectors-health-en.png +0 -0
- package/docs/images/admin/admin-controllers-en.png +0 -0
- package/docs/images/admin/admin-diagnostics-en.png +0 -0
- package/docs/images/admin/admin-errors-en.png +0 -0
- package/docs/images/admin/admin-issues-en.png +0 -0
- package/docs/images/admin/admin-logs-en.png +0 -0
- package/docs/images/admin/admin-quest-detail-en.png +0 -0
- package/docs/images/admin/admin-quests-en.png +0 -0
- package/docs/images/admin/admin-repairs-en.png +0 -0
- package/docs/images/admin/admin-runtime-en.png +0 -0
- package/docs/images/admin/admin-search-en.png +0 -0
- package/docs/images/admin/admin-stats-en.png +0 -0
- package/docs/images/admin/admin-summary-en.png +0 -0
- package/docs/images/connectors/connector-discord-en.png +0 -0
- package/docs/images/connectors/connector-feishu-en.png +0 -0
- package/docs/images/connectors/connector-lingzhu-en.png +0 -0
- package/docs/images/connectors/connector-qq-en.png +0 -0
- package/docs/images/connectors/connector-slack-en.png +0 -0
- package/docs/images/connectors/connector-telegram-en.png +0 -0
- package/docs/images/connectors/connector-weixin-en.png +0 -0
- package/docs/images/connectors/connector-whatsapp-en.png +0 -0
- package/docs/images/settings/settings-baselines-en.png +0 -0
- package/docs/images/settings/settings-config-en.png +0 -0
- package/docs/images/settings/settings-connectors-overview-en.png +0 -0
- package/docs/images/settings/settings-deepxiv-en.png +0 -0
- package/docs/images/settings/settings-mcp-servers-en.png +0 -0
- package/docs/images/settings/settings-plugins-en.png +0 -0
- package/docs/images/settings/settings-runners-en.png +0 -0
- package/docs/zh/00_QUICK_START.md +92 -17
- package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
- package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/zh/05_TUI_GUIDE.md +171 -2
- package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
- package/docs/zh/09_DOCTOR.md +39 -4
- package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
- package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
- package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/zh/15_CODEX_PROVIDER_SETUP.md +550 -188
- package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
- package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
- package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
- package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
- package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
- package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
- package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
- package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
- package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
- package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
- package/docs/zh/README.md +29 -7
- package/install.sh +122 -16
- package/package.json +4 -1
- package/pyproject.toml +2 -1
- package/src/deepscientist/__init__.py +1 -1
- package/src/deepscientist/acp/envelope.py +13 -0
- package/src/deepscientist/admin/__init__.py +3 -0
- package/src/deepscientist/admin/charts.py +681 -0
- package/src/deepscientist/admin/logs.py +119 -0
- package/src/deepscientist/admin/repairs.py +217 -0
- package/src/deepscientist/admin/service.py +1310 -0
- package/src/deepscientist/admin/system_info.py +700 -0
- package/src/deepscientist/admin/tasks.py +465 -0
- package/src/deepscientist/admin/tool_metrics.py +600 -0
- package/src/deepscientist/artifact/guidance.py +8 -4
- package/src/deepscientist/artifact/schemas.py +115 -0
- package/src/deepscientist/artifact/service.py +4268 -260
- package/src/deepscientist/bash_exec/monitor.py +30 -3
- package/src/deepscientist/bash_exec/service.py +134 -1
- package/src/deepscientist/benchstore/__init__.py +4 -0
- package/src/deepscientist/benchstore/prompt_builder.py +224 -0
- package/src/deepscientist/benchstore/service.py +1716 -0
- package/src/deepscientist/channels/weixin_ilink.py +8 -1
- package/src/deepscientist/cli.py +92 -17
- package/src/deepscientist/codex_cli_compat.py +2 -2
- package/src/deepscientist/config/models.py +82 -11
- package/src/deepscientist/config/service.py +927 -91
- package/src/deepscientist/connector/weixin_support.py +48 -17
- package/src/deepscientist/daemon/api/handlers.py +697 -210
- package/src/deepscientist/daemon/api/router.py +76 -1
- package/src/deepscientist/daemon/app.py +1054 -51
- package/src/deepscientist/diagnostics/runner_failures.py +147 -0
- package/src/deepscientist/doctor.py +212 -65
- package/src/deepscientist/evidence_packets.py +590 -0
- package/src/deepscientist/home.py +52 -4
- package/src/deepscientist/kimi_cli_compat.py +50 -0
- package/src/deepscientist/latex_runtime.py +2 -2
- package/src/deepscientist/mcp/context.py +2 -0
- package/src/deepscientist/mcp/schemas.py +114 -0
- package/src/deepscientist/mcp/server.py +1566 -126
- package/src/deepscientist/memory/service.py +203 -16
- package/src/deepscientist/process_control.py +8 -1
- package/src/deepscientist/prompts/builder.py +836 -92
- package/src/deepscientist/quest/__init__.py +2 -2
- package/src/deepscientist/quest/layout.py +12 -1
- package/src/deepscientist/quest/node_traces.py +10 -0
- package/src/deepscientist/quest/service.py +1430 -139
- package/src/deepscientist/quest/stage_views.py +1 -1
- package/src/deepscientist/runners/__init__.py +18 -0
- package/src/deepscientist/runners/base.py +89 -1
- package/src/deepscientist/runners/builtins.py +13 -1
- package/src/deepscientist/runners/claude.py +391 -0
- package/src/deepscientist/runners/codex.py +421 -21
- package/src/deepscientist/runners/codex_telemetry.py +127 -0
- package/src/deepscientist/runners/kimi.py +334 -0
- package/src/deepscientist/runners/metadata.py +68 -0
- package/src/deepscientist/runners/opencode.py +414 -0
- package/src/deepscientist/runners/runtime_overrides.py +100 -0
- package/src/deepscientist/runners/simple_cli.py +538 -0
- package/src/deepscientist/runtime_storage.py +303 -0
- package/src/deepscientist/shared.py +61 -16
- package/src/deepscientist/skills/installer.py +37 -0
- package/src/deepscientist/skills/registry.py +2 -0
- package/src/deepscientist/tinytex.py +2 -2
- package/src/deepscientist/tui.py +10 -3
- package/src/prompts/benchstore/system.md +77 -0
- package/src/prompts/connectors/qq.md +33 -2
- package/src/prompts/connectors/weixin.md +208 -23
- package/src/prompts/contracts/admin_ops.md +74 -0
- package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
- package/src/prompts/contracts/shared_interaction.md +5 -11
- package/src/prompts/start_setup/system.md +422 -0
- package/src/prompts/system.md +409 -315
- package/src/prompts/system_copilot.md +88 -12
- package/src/skills/analysis-campaign/SKILL.md +239 -578
- package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
- package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
- package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
- package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
- package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
- package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
- package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
- package/src/skills/baseline/SKILL.md +183 -461
- package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
- package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
- package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
- package/src/skills/baseline/references/baseline-plan-template.md +37 -76
- package/src/skills/baseline/references/boundary-cases.md +86 -0
- package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
- package/src/skills/baseline/references/comparability-contract.md +7 -12
- package/src/skills/baseline/references/operational-guidance.md +56 -0
- package/src/skills/baseline/references/route-selection.md +5 -25
- package/src/skills/decision/SKILL.md +113 -306
- package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
- package/src/skills/decision/references/operational-guidance.md +94 -0
- package/src/skills/decision/references/research-route-criteria.md +7 -8
- package/src/skills/decision/references/strategic-decision-template.md +13 -26
- package/src/skills/experiment/SKILL.md +132 -670
- package/src/skills/experiment/references/execution-playbook.md +374 -0
- package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
- package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
- package/src/skills/experiment/references/operational-guidance.md +108 -0
- package/src/skills/finalize/SKILL.md +62 -0
- package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
- package/src/skills/finalize/references/resume-packet-template.md +7 -0
- package/src/skills/idea/SKILL.md +228 -15
- package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
- package/src/skills/idea/references/current-board-packet-template.md +61 -0
- package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
- package/src/skills/idea/references/idea-generation-playbook.md +21 -0
- package/src/skills/idea/references/idea-thinking-flow.md +6 -0
- package/src/skills/idea/references/literature-survey-template.md +3 -0
- package/src/skills/idea/references/objective-contract-template.md +54 -0
- package/src/skills/idea/references/outline-seeding-example.md +56 -0
- package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
- package/src/skills/idea/references/related-work-playbook.md +75 -2
- package/src/skills/idea/references/research-history-playbook.md +114 -0
- package/src/skills/idea/references/selection-gate.md +58 -6
- package/src/skills/intake-audit/SKILL.md +43 -2
- package/src/skills/intake-audit/references/state-audit-template.md +10 -0
- package/src/skills/nature-data/SKILL.md +128 -0
- package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-data/agents/openai.yaml +4 -0
- package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
- package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
- package/src/skills/nature-data/references/policy-principles.md +103 -0
- package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
- package/src/skills/nature-data/references/source-basis.md +54 -0
- package/src/skills/nature-data/references/statement-patterns.md +153 -0
- package/src/skills/nature-figure/SKILL.md +197 -0
- package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-figure/agents/openai.yaml +4 -0
- package/src/skills/nature-figure/evals/evals.json +37 -0
- package/src/skills/nature-figure/references/api.md +428 -0
- package/src/skills/nature-figure/references/backend-selection.md +100 -0
- package/src/skills/nature-figure/references/chart-types.md +281 -0
- package/src/skills/nature-figure/references/common-patterns.md +349 -0
- package/src/skills/nature-figure/references/design-theory.md +436 -0
- package/src/skills/nature-figure/references/figure-contract.md +93 -0
- package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
- package/src/skills/nature-figure/references/qa-contract.md +119 -0
- package/src/skills/nature-figure/references/r-template-index.md +66 -0
- package/src/skills/nature-figure/references/r-workflow.md +161 -0
- package/src/skills/nature-figure/references/tutorials.md +250 -0
- package/src/skills/nature-paper2ppt/SKILL.md +507 -0
- package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/SKILL.md +385 -0
- package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-polishing/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
- package/src/skills/nature-polishing/references/section-moves.md +240 -0
- package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
- package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
- package/src/skills/optimize/SKILL.md +177 -1568
- package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
- package/src/skills/optimize/references/candidate-board-template.md +13 -0
- package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
- package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
- package/src/skills/optimize/references/debug-response-template.md +29 -0
- package/src/skills/optimize/references/frontier-review-template.md +32 -0
- package/src/skills/optimize/references/fusion-playbook.md +36 -0
- package/src/skills/optimize/references/method-brief-template.md +73 -0
- package/src/skills/optimize/references/operational-guidance.md +621 -0
- package/src/skills/optimize/references/optimization-memory-template.md +30 -0
- package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
- package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
- package/src/skills/optimize/references/prompt-patterns.md +49 -0
- package/src/skills/paper-outline/SKILL.md +227 -0
- package/src/skills/paper-outline/references/outline-patterns.md +87 -0
- package/src/skills/paper-plot/SKILL.md +79 -0
- package/src/skills/paper-plot/agents/openai.yaml +4 -0
- package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
- package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
- package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
- package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
- package/src/skills/paper-plot/references/line_training_curve.md +44 -0
- package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
- package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
- package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
- package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
- package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
- package/src/skills/paper-plot/scripts/line_aime.py +94 -0
- package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
- package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
- package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
- package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
- package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
- package/src/skills/rebuttal/SKILL.md +9 -0
- package/src/skills/references/tool-usage-by-stage.md +438 -0
- package/src/skills/review/SKILL.md +105 -7
- package/src/skills/science/PROVENANCE.md +44 -0
- package/src/skills/science/SKILL.md +137 -0
- package/src/skills/science/references/artifact-science-tool.md +110 -0
- package/src/skills/science/references/claim-type-discipline.md +56 -0
- package/src/skills/science/references/domain-index.md +422 -0
- package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
- package/src/skills/science/references/package-check-playbook.md +64 -0
- package/src/skills/science/references/package-index.min.json +3616 -0
- package/src/skills/science/references/packages/abinit.md +80 -0
- package/src/skills/science/references/packages/acts.md +73 -0
- package/src/skills/science/references/packages/aiida-core.md +80 -0
- package/src/skills/science/references/packages/alamode.md +80 -0
- package/src/skills/science/references/packages/amuse.md +88 -0
- package/src/skills/science/references/packages/anndata.md +88 -0
- package/src/skills/science/references/packages/arbor.md +80 -0
- package/src/skills/science/references/packages/arc.md +73 -0
- package/src/skills/science/references/packages/astropy.md +88 -0
- package/src/skills/science/references/packages/astroquery.md +88 -0
- package/src/skills/science/references/packages/atomate2.md +80 -0
- package/src/skills/science/references/packages/atomsmltr.md +73 -0
- package/src/skills/science/references/packages/awkward.md +73 -0
- package/src/skills/science/references/packages/batman.md +88 -0
- package/src/skills/science/references/packages/biopython.md +88 -0
- package/src/skills/science/references/packages/bloqade.md +73 -0
- package/src/skills/science/references/packages/brian2.md +73 -0
- package/src/skills/science/references/packages/bullet3.md +73 -0
- package/src/skills/science/references/packages/calculix.md +80 -0
- package/src/skills/science/references/packages/cantera.md +73 -0
- package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
- package/src/skills/science/references/packages/ccdproc.md +88 -0
- package/src/skills/science/references/packages/celerite2.md +88 -0
- package/src/skills/science/references/packages/cellrank.md +73 -0
- package/src/skills/science/references/packages/cesm.md +80 -0
- package/src/skills/science/references/packages/chemicals.md +73 -0
- package/src/skills/science/references/packages/chempy.md +73 -0
- package/src/skills/science/references/packages/cirq.md +73 -0
- package/src/skills/science/references/packages/coffea.md +73 -0
- package/src/skills/science/references/packages/cp2k.md +88 -0
- package/src/skills/science/references/packages/custodian.md +80 -0
- package/src/skills/science/references/packages/dart.md +73 -0
- package/src/skills/science/references/packages/datamol.md +88 -0
- package/src/skills/science/references/packages/dd4hep.md +73 -0
- package/src/skills/science/references/packages/dealii.md +80 -0
- package/src/skills/science/references/packages/deepchem.md +88 -0
- package/src/skills/science/references/packages/delphes.md +73 -0
- package/src/skills/science/references/packages/devito.md +80 -0
- package/src/skills/science/references/packages/dftb.md +88 -0
- package/src/skills/science/references/packages/dftd4.md +88 -0
- package/src/skills/science/references/packages/dftk-jl.md +80 -0
- package/src/skills/science/references/packages/dolfinx.md +80 -0
- package/src/skills/science/references/packages/drake.md +73 -0
- package/src/skills/science/references/packages/dumux.md +73 -0
- package/src/skills/science/references/packages/elk.md +80 -0
- package/src/skills/science/references/packages/elmerfem.md +80 -0
- package/src/skills/science/references/packages/enzo-e.md +88 -0
- package/src/skills/science/references/packages/espresso.md +80 -0
- package/src/skills/science/references/packages/exoplanet.md +88 -0
- package/src/skills/science/references/packages/fairroot.md +73 -0
- package/src/skills/science/references/packages/fbpic.md +80 -0
- package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
- package/src/skills/science/references/packages/geant4.md +73 -0
- package/src/skills/science/references/packages/geosx.md +80 -0
- package/src/skills/science/references/packages/gprmax.md +80 -0
- package/src/skills/science/references/packages/gromacs.md +80 -0
- package/src/skills/science/references/packages/gwaslab.md +73 -0
- package/src/skills/science/references/packages/gz-sim.md +73 -0
- package/src/skills/science/references/packages/hail.md +88 -0
- package/src/skills/science/references/packages/hiphive.md +80 -0
- package/src/skills/science/references/packages/hoomd-blue.md +80 -0
- package/src/skills/science/references/packages/itensor.md +73 -0
- package/src/skills/science/references/packages/itensors-jl.md +73 -0
- package/src/skills/science/references/packages/jdftx.md +73 -0
- package/src/skills/science/references/packages/jobflow.md +80 -0
- package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
- package/src/skills/science/references/packages/kite.md +80 -0
- package/src/skills/science/references/packages/kratos.md +80 -0
- package/src/skills/science/references/packages/kwant.md +73 -0
- package/src/skills/science/references/packages/lammps.md +80 -0
- package/src/skills/science/references/packages/lightkurve.md +88 -0
- package/src/skills/science/references/packages/limix.md +73 -0
- package/src/skills/science/references/packages/maxwelllink.md +80 -0
- package/src/skills/science/references/packages/mcdc.md +73 -0
- package/src/skills/science/references/packages/meep.md +80 -0
- package/src/skills/science/references/packages/mfem.md +80 -0
- package/src/skills/science/references/packages/mitgcm.md +73 -0
- package/src/skills/science/references/packages/modflow6.md +73 -0
- package/src/skills/science/references/packages/molecool.md +73 -0
- package/src/skills/science/references/packages/mom6.md +73 -0
- package/src/skills/science/references/packages/moose.md +80 -0
- package/src/skills/science/references/packages/mpas-model.md +73 -0
- package/src/skills/science/references/packages/mujoco.md +73 -0
- package/src/skills/science/references/packages/mumax3.md +73 -0
- package/src/skills/science/references/packages/nekrs.md +80 -0
- package/src/skills/science/references/packages/nessi.md +73 -0
- package/src/skills/science/references/packages/nest-simulator.md +73 -0
- package/src/skills/science/references/packages/netket.md +73 -0
- package/src/skills/science/references/packages/neuron.md +73 -0
- package/src/skills/science/references/packages/nextflow.md +88 -0
- package/src/skills/science/references/packages/nwchem.md +88 -0
- package/src/skills/science/references/packages/openbabel.md +88 -0
- package/src/skills/science/references/packages/openems.md +80 -0
- package/src/skills/science/references/packages/openff-toolkit.md +88 -0
- package/src/skills/science/references/packages/openfoam-dev.md +80 -0
- package/src/skills/science/references/packages/openmc.md +73 -0
- package/src/skills/science/references/packages/openmm.md +80 -0
- package/src/skills/science/references/packages/openmoc.md +73 -0
- package/src/skills/science/references/packages/openmx.md +80 -0
- package/src/skills/science/references/packages/opensees.md +80 -0
- package/src/skills/science/references/packages/opensn.md +80 -0
- package/src/skills/science/references/packages/opm-simulators.md +73 -0
- package/src/skills/science/references/packages/oqupy.md +73 -0
- package/src/skills/science/references/packages/packmol.md +80 -0
- package/src/skills/science/references/packages/palabos.md +80 -0
- package/src/skills/science/references/packages/parflow.md +80 -0
- package/src/skills/science/references/packages/pennylane.md +88 -0
- package/src/skills/science/references/packages/perceval.md +73 -0
- package/src/skills/science/references/packages/phono3py.md +73 -0
- package/src/skills/science/references/packages/phonopy.md +73 -0
- package/src/skills/science/references/packages/photutils.md +88 -0
- package/src/skills/science/references/packages/picongpu.md +80 -0
- package/src/skills/science/references/packages/plink-ng.md +88 -0
- package/src/skills/science/references/packages/precice.md +73 -0
- package/src/skills/science/references/packages/psc.md +80 -0
- package/src/skills/science/references/packages/psi4.md +88 -0
- package/src/skills/science/references/packages/pybinding.md +73 -0
- package/src/skills/science/references/packages/pyfr.md +80 -0
- package/src/skills/science/references/packages/pyhf.md +73 -0
- package/src/skills/science/references/packages/pyiron_base.md +80 -0
- package/src/skills/science/references/packages/pylcp.md +73 -0
- package/src/skills/science/references/packages/pylith.md +80 -0
- package/src/skills/science/references/packages/pynbody.md +88 -0
- package/src/skills/science/references/packages/pysam.md +88 -0
- package/src/skills/science/references/packages/pyscf.md +88 -0
- package/src/skills/science/references/packages/q-e.md +73 -0
- package/src/skills/science/references/packages/qibo.md +73 -0
- package/src/skills/science/references/packages/qiskit.md +73 -0
- package/src/skills/science/references/packages/quantica-jl.md +73 -0
- package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
- package/src/skills/science/references/packages/quimb.md +73 -0
- package/src/skills/science/references/packages/qulacs.md +73 -0
- package/src/skills/science/references/packages/qutip.md +73 -0
- package/src/skills/science/references/packages/rdkit.md +88 -0
- package/src/skills/science/references/packages/rmg-py.md +73 -0
- package/src/skills/science/references/packages/root.md +73 -0
- package/src/skills/science/references/packages/scanpy.md +88 -0
- package/src/skills/science/references/packages/scikit-allel.md +88 -0
- package/src/skills/science/references/packages/scikit-bio.md +88 -0
- package/src/skills/science/references/packages/scqubits.md +73 -0
- package/src/skills/science/references/packages/scuff-em.md +80 -0
- package/src/skills/science/references/packages/scvi-tools.md +73 -0
- package/src/skills/science/references/packages/seissol.md +73 -0
- package/src/skills/science/references/packages/sfepy.md +80 -0
- package/src/skills/science/references/packages/sisl.md +73 -0
- package/src/skills/science/references/packages/smilei.md +80 -0
- package/src/skills/science/references/packages/snakemake.md +88 -0
- package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
- package/src/skills/science/references/packages/specutils.md +88 -0
- package/src/skills/science/references/packages/spglib.md +80 -0
- package/src/skills/science/references/packages/squidpy.md +88 -0
- package/src/skills/science/references/packages/starry.md +88 -0
- package/src/skills/science/references/packages/strawberryfields.md +73 -0
- package/src/skills/science/references/packages/su2.md +80 -0
- package/src/skills/science/references/packages/sunny-jl.md +73 -0
- package/src/skills/science/references/packages/sw4.md +73 -0
- package/src/skills/science/references/packages/swift.md +88 -0
- package/src/skills/science/references/packages/tdnegf.md +73 -0
- package/src/skills/science/references/packages/tenpy.md +73 -0
- package/src/skills/science/references/packages/thermo.md +73 -0
- package/src/skills/science/references/packages/tkwant.md +73 -0
- package/src/skills/science/references/packages/tvb-root.md +73 -0
- package/src/skills/science/references/packages/uproot5.md +73 -0
- package/src/skills/science/references/packages/vampire.md +80 -0
- package/src/skills/science/references/packages/wannier_tools.md +73 -0
- package/src/skills/science/references/packages/warpx.md +80 -0
- package/src/skills/science/references/packages/wrf.md +73 -0
- package/src/skills/science/references/packages/xtb.md +88 -0
- package/src/skills/science/references/packages/yt.md +73 -0
- package/src/skills/science/references/science-task-brief-template.md +71 -0
- package/src/skills/scout/SKILL.md +83 -425
- package/src/skills/scout/references/literature-scout-template.md +5 -24
- package/src/skills/scout/references/operational-guidance.md +191 -0
- package/src/skills/scout/references/paper-triage-playbook.md +11 -35
- package/src/skills/write/SKILL.md +744 -1246
- package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
- package/src/skills/write/references/oral_package_patterns.md +252 -0
- package/src/skills/write/references/oral_writing_principles.md +291 -0
- package/src/skills/write/references/section_rewrite_checklist.md +234 -0
- package/src/tui/dist/app/AppContainer.js +1314 -27
- package/src/tui/dist/components/Composer.js +26 -1
- package/src/tui/dist/components/ConfigScreen.js +2 -1
- package/src/tui/dist/components/InputPrompt.js +25 -9
- package/src/tui/dist/components/MainContent.js +18 -3
- package/src/tui/dist/components/QuestScreen.js +3 -2
- package/src/tui/dist/components/UtilityScreen.js +37 -0
- package/src/tui/dist/hooks/useSafeInput.js +10 -0
- package/src/tui/dist/index.js +13 -1
- package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
- package/src/tui/dist/lib/api.js +89 -1
- package/src/tui/package.json +1 -1
- package/src/ui/dist/assets/{AnalysisPlugin-BCKAfjba.js → AnalysisPlugin-CA94NGmI.js} +1 -1
- package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
- package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
- package/src/ui/dist/assets/{CodeViewerPlugin-CbaFRrUU.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
- package/src/ui/dist/assets/{DocViewerPlugin-DAjLVeQD.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
- package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
- package/src/ui/dist/assets/{GitDiffViewerPlugin-CQACjoAA.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
- package/src/ui/dist/assets/{GitSnapshotViewer-0r4nLPke.js → GitSnapshotViewer-CweA6VON.js} +2 -2
- package/src/ui/dist/assets/{ImageViewerPlugin-nBOmI2v_.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
- package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
- package/src/ui/dist/assets/{LatexPlugin-ZwtV8pIp.js → LatexPlugin-BQjAaA5J.js} +4 -4
- package/src/ui/dist/assets/{MarkdownViewerPlugin-DKqVfKyW.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
- package/src/ui/dist/assets/{MarketplacePlugin-BwxStZ9D.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
- package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
- package/src/ui/dist/assets/{NotebookEditor-DB9N_T9q.js → NotebookEditor-WFyd8Ybt.js} +3 -3
- package/src/ui/dist/assets/{PdfLoader-eWBONbQP.js → PdfLoader-CLE5u5TS.js} +3 -3
- package/src/ui/dist/assets/{PdfMarkdownPlugin-D22YOZL3.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
- package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
- package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
- package/src/ui/dist/assets/{TextViewerPlugin-C5xqeeUH.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
- package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
- package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
- package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
- package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
- package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
- package/src/ui/dist/assets/{code-WlFHE7z_.js → code-DbsmSd3Y.js} +1 -1
- package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
- package/src/ui/dist/assets/{wrap-text-BC-Hltpd.js → file-jump-queue-DeQBikaw.js} +3 -3
- package/src/ui/dist/assets/{file-socket-CfQPKQKj.js → file-socket-DA5XIx88.js} +1 -1
- package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
- package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
- package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
- package/src/ui/dist/assets/{index-CwNu1aH4.js → index-BsO46tJA.js} +1 -1
- package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
- package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
- package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
- package/src/ui/dist/assets/{project-sync-C9IdzdZW.js → project-sync-DPmWKmKD.js} +1 -1
- package/src/ui/dist/assets/{zoom-out-E_gaeAxL.js → zoom-out-DAukFWen.js} +3 -3
- package/src/ui/dist/index.html +3 -3
- package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
- package/src/skills/baseline/references/memory-playbook.md +0 -40
- package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
- package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
- package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
- package/src/skills/write/references/paper-section-playbook.md +0 -64
- package/src/skills/write/references/reviewer-first-writing.md +0 -64
- package/src/skills/write/references/revision-checklist.md +0 -70
- package/src/skills/write/references/section-contracts.md +0 -82
- package/src/skills/write/references/sentence-level-proofing.md +0 -49
- package/src/ui/dist/assets/AiManusChatView-Bv-Z8YpU.js +0 -204
- package/src/ui/dist/assets/CliPlugin-BCKcpc35.js +0 -109
- package/src/ui/dist/assets/CodeEditorPlugin-DbOfSJ8K.js +0 -2
- package/src/ui/dist/assets/GitCommitViewerPlugin-CIUqbUDO.js +0 -1
- package/src/ui/dist/assets/LabCopilotPanel-BHxOxF4z.js +0 -14
- package/src/ui/dist/assets/LabPlugin-BKoZGs95.js +0 -22
- package/src/ui/dist/assets/NotebookEditor-BEQhaQbt.js +0 -81
- package/src/ui/dist/assets/PdfViewerPlugin-c-RK9DLM.js +0 -17
- package/src/ui/dist/assets/SearchPlugin-CxF9ytAx.js +0 -16
- package/src/ui/dist/assets/VNCViewer-BoLGLnHz.js +0 -11
- package/src/ui/dist/assets/bot-DREQOxzP.js +0 -6
- package/src/ui/dist/assets/chevron-up-C9Qpx4DE.js +0 -6
- package/src/ui/dist/assets/file-content-BZMz3RYp.js +0 -1
- package/src/ui/dist/assets/file-diff-panel-CQhw0jS2.js +0 -1
- package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
- package/src/ui/dist/assets/git-commit-horizontal-DxZ8DCZh.js +0 -6
- package/src/ui/dist/assets/image-Bgl4VIyx.js +0 -6
- package/src/ui/dist/assets/index-BpV6lusQ.css +0 -33
- package/src/ui/dist/assets/index-CBNVuWcP.js +0 -2496
- package/src/ui/dist/assets/index-DrUnlf6K.js +0 -1
- package/src/ui/dist/assets/index-NW-h8VzN.js +0 -1
- package/src/ui/dist/assets/pdf-effect-queue-J8OnM0jE.js +0 -6
- package/src/ui/dist/assets/popover-CLc0pPP8.js +0 -1
- package/src/ui/dist/assets/select-Cs2PmzwL.js +0 -11
- package/src/ui/dist/assets/sigma-ClKcHAXm.js +0 -6
- package/src/ui/dist/assets/trash-DwpbFr3w.js +0 -11
- package/src/ui/dist/assets/useCliAccess-NQ8m0Let.js +0 -1
- package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
|
@@ -0,0 +1,123 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.080_latentscorereweight
|
|
3
|
+
name: Latent Score-Based Reweighting for Robust Classification on Imbalanced Tabular Data
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 在分布偏移下用于稳健表格分类的基于分数的密度重加权方法,无需群组标签。
|
|
6
|
+
task_description: 该基准面向稳健表格分类:利用 score-based(扩散)模型的潜在分数信号识别并上调联合分布 P(X, Y) 中代表性不足区域。不同于 JTT 等只在决策边界 P(Y|X) 附近上调误分类样本的方法,本方法通过与邻近样本的分数向量相似性估计局部密度,并重加权低密度区域,从而得到更全局平衡的训练分布,且不需要群组标签先验。评测目标为分布偏移下的 worst-group accuracy 与 mean accuracy。当前本地快照不含可执行训练/评估代码,两项主指标均为 blocked-no-code,执行前必须先恢复源码。
|
|
7
|
+
task_mode: analysis_driven
|
|
8
|
+
requires_execution: true
|
|
9
|
+
requires_paper: true
|
|
10
|
+
integrity_level: cas_plus_canary
|
|
11
|
+
snapshot_status: restore_needed
|
|
12
|
+
support_level: recovery
|
|
13
|
+
time_band: 6-24h
|
|
14
|
+
cost_band: medium
|
|
15
|
+
difficulty: medium
|
|
16
|
+
data_access: public
|
|
17
|
+
capability_tags:
|
|
18
|
+
- robust_classification
|
|
19
|
+
- tabular_ml
|
|
20
|
+
- score_based_models
|
|
21
|
+
- distribution_shift
|
|
22
|
+
- data_reweighting
|
|
23
|
+
- imbalanced_data
|
|
24
|
+
aisb_direction: T3
|
|
25
|
+
track_fit:
|
|
26
|
+
- paper_track
|
|
27
|
+
- benchmark_track
|
|
28
|
+
primary_outputs:
|
|
29
|
+
- worst_group_accuracy
|
|
30
|
+
- mean_accuracy
|
|
31
|
+
launch_profiles:
|
|
32
|
+
- id: analysis_only
|
|
33
|
+
label: Analysis Only
|
|
34
|
+
description: 'Review preserved benchmark metadata, metric contracts, and paper artefacts. No executable code is present in the current snapshot; this profile supports planning and paper-backed analysis only.
|
|
35
|
+
|
|
36
|
+
'
|
|
37
|
+
- id: restore_first
|
|
38
|
+
label: Restore First
|
|
39
|
+
description: 'Restore the missing latent-score reweighting implementation from the upstream repository (https://github.com/YunzeTong/latent-score-based-reweighting) before treating this entry as runnable. Both metrics remain blocked until restoration.
|
|
40
|
+
|
|
41
|
+
'
|
|
42
|
+
dataset_download:
|
|
43
|
+
primary_method: mixed
|
|
44
|
+
sources: []
|
|
45
|
+
notes:
|
|
46
|
+
- 'The current local snapshot does not preserve an executable benchmark route. Dataset setup should be treated as part of upstream restoration rather than a bundled run path. Refer to the paper and upstream GitHub repository for dataset identities and loading instructions.
|
|
47
|
+
|
|
48
|
+
'
|
|
49
|
+
credential_requirements:
|
|
50
|
+
mode: none
|
|
51
|
+
items: []
|
|
52
|
+
notes: []
|
|
53
|
+
resources:
|
|
54
|
+
minimum:
|
|
55
|
+
cpu_cores: 8
|
|
56
|
+
ram_gb: 32
|
|
57
|
+
disk_gb: 80
|
|
58
|
+
gpu_count: 1
|
|
59
|
+
gpu_vram_gb: 16
|
|
60
|
+
recommended:
|
|
61
|
+
cpu_cores: 16
|
|
62
|
+
ram_gb: 64
|
|
63
|
+
disk_gb: 150
|
|
64
|
+
gpu_count: 1
|
|
65
|
+
gpu_vram_gb: 24
|
|
66
|
+
environment:
|
|
67
|
+
python: null
|
|
68
|
+
cuda: null
|
|
69
|
+
pytorch: null
|
|
70
|
+
flash_attn: null
|
|
71
|
+
key_packages: []
|
|
72
|
+
notes:
|
|
73
|
+
- 'The current local snapshot does not preserve executable setup files or runnable source code. Environment requirements should be treated as provisional until upstream restoration from https://github.com/YunzeTong/latent-score-based-reweighting is complete.
|
|
74
|
+
|
|
75
|
+
'
|
|
76
|
+
- 'Expected dependencies include a score-based or diffusion model library, standard tabular ML packages (e.g. scikit-learn, XGBoost), and a PyTorch backend for the generative density estimation stage. Confirm exact versions from the upstream repository''s requirements file after restoration.
|
|
77
|
+
|
|
78
|
+
'
|
|
79
|
+
risk_flags:
|
|
80
|
+
- source_snapshot_incomplete
|
|
81
|
+
- route_caveat
|
|
82
|
+
- metrics_blocked_no_code
|
|
83
|
+
risk_notes:
|
|
84
|
+
- 'Both primary metrics (worst_group_accuracy, mean_accuracy) are marked blocked-no-code in the metric contract. No executable code anchor was detected in the staged snapshot. Do not report metric values until trusted execution outputs exist from a restored environment.
|
|
85
|
+
|
|
86
|
+
'
|
|
87
|
+
- 'The top-level README is absent from the current snapshot. Do not rely on README-only interpretation; prefer the paper (latex.md) and metric contract (json/metric_contract.json) as authoritative references.
|
|
88
|
+
|
|
89
|
+
'
|
|
90
|
+
recommended_when: 当你需要基于论文进行方案规划、方法分析,或为 latent score-based reweighting 做上游恢复范围界定时可使用本条目。也适合在设计/综述阶段比较密度重加权与边界重加权(如 JTT)。
|
|
91
|
+
not_recommended_when: 不要将当前本地包作为可直接运行的稳健性基准。当前分阶段快照缺少可执行生成式重加权流程,且两项指标均被阻塞。任何结果都应来自完整恢复并验证后的执行环境。
|
|
92
|
+
paper:
|
|
93
|
+
title: Latent Score-Based Reweighting for Robust Classification on Imbalanced Tabular Data
|
|
94
|
+
authors:
|
|
95
|
+
- Yunze Tong
|
|
96
|
+
- Fengda Zhang
|
|
97
|
+
- Zihao Tang
|
|
98
|
+
- Kaifeng Gao
|
|
99
|
+
- Kai Huang
|
|
100
|
+
- Pengfei Lyu
|
|
101
|
+
- Jun Xiao
|
|
102
|
+
- Kun Kuang
|
|
103
|
+
venue: ICML 2025
|
|
104
|
+
year: 2025
|
|
105
|
+
url: https://proceedings.mlr.press/v267/tong25c.html
|
|
106
|
+
code_url: https://github.com/YunzeTong/latent-score-based-reweighting
|
|
107
|
+
download:
|
|
108
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.080_latentscorereweight.zip
|
|
109
|
+
archive_type: zip
|
|
110
|
+
local_dir_name: paper-80-LatentScoreReweight
|
|
111
|
+
provider: github_release
|
|
112
|
+
repo: ResearAI/DeepScientist
|
|
113
|
+
tag: aisb-v0.0.1
|
|
114
|
+
asset_name: aisb.t3.080_latentscorereweight.zip
|
|
115
|
+
sha256: 9c70bcc4a57a17ffc712a81763731ba5c5f46c987ca83e9b5cd0d730a18e0d03
|
|
116
|
+
size_bytes: 36629
|
|
117
|
+
commercial:
|
|
118
|
+
annual_fee: null
|
|
119
|
+
display:
|
|
120
|
+
palette_seed: copper-teal-reweight
|
|
121
|
+
art_style: robust-tabular
|
|
122
|
+
accent_priority: high
|
|
123
|
+
image_path: ../image/080_aisb.t3.080_latentscorereweight.jpg
|
|
@@ -0,0 +1,150 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.081_qmamba
|
|
3
|
+
name: Meta-Black-Box-Optimization through Offline Q-function Learning
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: Offline meta-learning framework for black-box optimization that uses Q-function
|
|
6
|
+
decomposition and Mamba architecture over long configuration trajectories.
|
|
7
|
+
task_description: 'This benchmark entry covers Q-Mamba, an offline meta-black-box
|
|
8
|
+
optimization framework that addresses the effectiveness-efficiency dilemma in MetaBBO.
|
|
9
|
+
The approach transforms dynamic algorithm configuration (DAC) into a long-sequence
|
|
10
|
+
decision process with decomposed Q-functions for each hyper-parameter dimension.
|
|
11
|
+
Key components include: (1) offline data collection from strong baselines and random
|
|
12
|
+
policies for balanced exploration/exploitation, (2) conservative Q-learning with
|
|
13
|
+
compositional Q-loss to handle distribution shift, and (3) a Mamba-based RL agent
|
|
14
|
+
leveraging selective state modeling and hardware-aware parallel scan for efficient
|
|
15
|
+
long-sequence training. The current local snapshot preserves metadata and paper
|
|
16
|
+
references but lacks runnable implementation code, requiring upstream restoration
|
|
17
|
+
before execution.
|
|
18
|
+
|
|
19
|
+
'
|
|
20
|
+
task_mode: analysis_driven
|
|
21
|
+
requires_execution: true
|
|
22
|
+
requires_paper: true
|
|
23
|
+
integrity_level: cas_plus_canary
|
|
24
|
+
snapshot_status: restore_needed
|
|
25
|
+
support_level: recovery
|
|
26
|
+
time_band: 6-24h
|
|
27
|
+
cost_band: medium
|
|
28
|
+
difficulty: hard
|
|
29
|
+
data_access: public
|
|
30
|
+
primary_outputs:
|
|
31
|
+
- mean_reward
|
|
32
|
+
launch_profiles:
|
|
33
|
+
- id: analysis_only
|
|
34
|
+
label: Analysis Only
|
|
35
|
+
description: 'Review the preserved benchmark metadata, paper assets, and offline
|
|
36
|
+
Q-learning route documentation without attempting execution.
|
|
37
|
+
|
|
38
|
+
'
|
|
39
|
+
- id: restore_first
|
|
40
|
+
label: Restore First
|
|
41
|
+
description: 'Restore the missing Q-Mamba implementation from upstream sources before
|
|
42
|
+
treating this benchmark as runnable. Requires fetching executable code from the
|
|
43
|
+
published repository.
|
|
44
|
+
|
|
45
|
+
'
|
|
46
|
+
dataset_download:
|
|
47
|
+
primary_method: pending_restoration
|
|
48
|
+
sources: []
|
|
49
|
+
notes:
|
|
50
|
+
- The current local package does not bundle executable benchmark code or runnable
|
|
51
|
+
evaluation data.
|
|
52
|
+
- Dataset and implementation must be restored from upstream sources referenced in
|
|
53
|
+
the paper.
|
|
54
|
+
- The benchmark route is not available in the current snapshot state.
|
|
55
|
+
credential_requirements:
|
|
56
|
+
mode: none
|
|
57
|
+
items: []
|
|
58
|
+
notes: []
|
|
59
|
+
resources:
|
|
60
|
+
minimum:
|
|
61
|
+
cpu_cores: 8
|
|
62
|
+
ram_gb: 32
|
|
63
|
+
disk_gb: 80
|
|
64
|
+
gpu_count: 1
|
|
65
|
+
gpu_vram_gb: 16
|
|
66
|
+
recommended:
|
|
67
|
+
cpu_cores: 16
|
|
68
|
+
ram_gb: 64
|
|
69
|
+
disk_gb: 150
|
|
70
|
+
gpu_count: 1
|
|
71
|
+
gpu_vram_gb: 24
|
|
72
|
+
environment:
|
|
73
|
+
python: '3.10'
|
|
74
|
+
cuda: '12.1'
|
|
75
|
+
pytorch: 2.1.1
|
|
76
|
+
flash_attn: null
|
|
77
|
+
key_packages:
|
|
78
|
+
- mamba-ssm>=1.2.0
|
|
79
|
+
notes:
|
|
80
|
+
- Environment specifications are provisional based on the paper and upstream restoration
|
|
81
|
+
requirements.
|
|
82
|
+
- The current staged snapshot does not preserve executable setup files or runnable
|
|
83
|
+
source code.
|
|
84
|
+
- Full dependency set should be obtained from the published Q-Mamba source repository.
|
|
85
|
+
- mamba-ssm is the core architectural dependency for the Mamba-based RL agent.
|
|
86
|
+
risk_flags:
|
|
87
|
+
- source_snapshot_incomplete
|
|
88
|
+
- route_caveat
|
|
89
|
+
- no_executable_anchor
|
|
90
|
+
risk_notes:
|
|
91
|
+
- No executable code files detected in the current snapshot that can anchor staged
|
|
92
|
+
metrics.
|
|
93
|
+
- No benchmark execution was performed during this packaging pass.
|
|
94
|
+
- The primary metric mean_reward is blocked pending source restoration.
|
|
95
|
+
- Treat this entry as blocked until upstream restoration provides a runnable implementation.
|
|
96
|
+
recommended_when: 'Use this entry when you need paper-backed analysis of the Q-Mamba
|
|
97
|
+
offline meta-optimization approach, or when planning upstream restoration of the
|
|
98
|
+
Mamba-based meta-learning route for black-box optimization. Suitable for understanding
|
|
99
|
+
Q-function decomposition in long-horizon configuration tasks.
|
|
100
|
+
|
|
101
|
+
'
|
|
102
|
+
not_recommended_when: 'Do not treat this local package as a ready-to-run benchmark
|
|
103
|
+
for offline meta-black-box optimization. The executable code, evaluation protocols,
|
|
104
|
+
and benchmark data are absent from the staged snapshot. Do not attempt sequential
|
|
105
|
+
optimization runs without first restoring the missing implementation.
|
|
106
|
+
|
|
107
|
+
'
|
|
108
|
+
paper:
|
|
109
|
+
title: Meta-Black-Box-Optimization through Offline Q-function Learning
|
|
110
|
+
authors: Zeyuan Ma, Zhiguang Cao, Zhou Jiang, Hongshu Guo, Yue-Jiao Gong
|
|
111
|
+
venue: ICML 2025
|
|
112
|
+
year: 2025
|
|
113
|
+
url: https://proceedings.mlr.press/v267/ma25b.html
|
|
114
|
+
notes:
|
|
115
|
+
- Proposes Q-Mamba framework for offline MetaBBO with Q-function decomposition.
|
|
116
|
+
- Addresses effectiveness-efficiency trade-off in meta-learning for dynamic algorithm
|
|
117
|
+
configuration.
|
|
118
|
+
- Uses Mamba architecture for long-sequence learning with parallel scan efficiency.
|
|
119
|
+
- Source code is available online per the paper.
|
|
120
|
+
download:
|
|
121
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.081_qmamba.zip
|
|
122
|
+
archive_type: zip
|
|
123
|
+
local_dir_name: paper-81-QMamba
|
|
124
|
+
notes:
|
|
125
|
+
- Archive contains metadata and documentation; executable code requires restoration
|
|
126
|
+
from upstream.
|
|
127
|
+
provider: github_release
|
|
128
|
+
repo: ResearAI/DeepScientist
|
|
129
|
+
tag: aisb-v0.0.1
|
|
130
|
+
asset_name: aisb.t3.081_qmamba.zip
|
|
131
|
+
sha256: f565acdff164658ee030066f9a6c81cb7685ad3616de081df7c56a837b33cfd4
|
|
132
|
+
size_bytes: 31451
|
|
133
|
+
display:
|
|
134
|
+
palette_seed: slate-gold-offline
|
|
135
|
+
art_style: trajectory-systems
|
|
136
|
+
accent_priority: high
|
|
137
|
+
image_path: ../image/081_aisb.t3.081_qmamba.jpg
|
|
138
|
+
capability_tags:
|
|
139
|
+
- research_code_optimization
|
|
140
|
+
- black_box_optimization
|
|
141
|
+
- offline_rl
|
|
142
|
+
- mamba_models
|
|
143
|
+
- meta_learning
|
|
144
|
+
- q_function_decomposition
|
|
145
|
+
- dynamic_algorithm_configuration
|
|
146
|
+
- long_sequence_decision
|
|
147
|
+
aisb_direction: T3
|
|
148
|
+
track_fit:
|
|
149
|
+
- paper_track
|
|
150
|
+
- benchmark_track
|
|
@@ -0,0 +1,117 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.081_qmamba
|
|
3
|
+
name: Meta-Black-Box-Optimization through Offline Q-function Learning
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 面向黑盒优化的离线元学习框架,使用 Q 函数分解与 Mamba 架构处理长配置轨迹。
|
|
6
|
+
task_description: 该条目覆盖 Q-Mamba:一种离线元黑盒优化框架,用于缓解 MetaBBO 的效果-效率矛盾。方法把动态算法配置(DAC)转化为长序列决策过程,并为每个超参数维度分解 Q 函数。核心包括:(1) 结合强基线与随机策略的离线数据采集以平衡探索与利用;(2) 通过组合式 Q-loss 的保守 Q-learning 处理分布偏移;(3) 使用具备选择性状态建模与硬件友好并行扫描的 Mamba RL 代理进行高效长序列训练。当前本地快照保留元数据与论文引用,但缺少可运行代码,需上游恢复后执行。
|
|
7
|
+
task_mode: analysis_driven
|
|
8
|
+
requires_execution: true
|
|
9
|
+
requires_paper: true
|
|
10
|
+
integrity_level: cas_plus_canary
|
|
11
|
+
snapshot_status: restore_needed
|
|
12
|
+
support_level: recovery
|
|
13
|
+
time_band: 6-24h
|
|
14
|
+
cost_band: medium
|
|
15
|
+
difficulty: hard
|
|
16
|
+
data_access: public
|
|
17
|
+
primary_outputs:
|
|
18
|
+
- mean_reward
|
|
19
|
+
launch_profiles:
|
|
20
|
+
- id: analysis_only
|
|
21
|
+
label: Analysis Only
|
|
22
|
+
description: 'Review the preserved benchmark metadata, paper assets, and offline Q-learning route documentation without attempting execution.
|
|
23
|
+
|
|
24
|
+
'
|
|
25
|
+
- id: restore_first
|
|
26
|
+
label: Restore First
|
|
27
|
+
description: 'Restore the missing Q-Mamba implementation from upstream sources before treating this benchmark as runnable. Requires fetching executable code from the published repository.
|
|
28
|
+
|
|
29
|
+
'
|
|
30
|
+
dataset_download:
|
|
31
|
+
primary_method: pending_restoration
|
|
32
|
+
sources: []
|
|
33
|
+
notes:
|
|
34
|
+
- The current local package does not bundle executable benchmark code or runnable evaluation data.
|
|
35
|
+
- Dataset and implementation must be restored from upstream sources referenced in the paper.
|
|
36
|
+
- The benchmark route is not available in the current snapshot state.
|
|
37
|
+
credential_requirements:
|
|
38
|
+
mode: none
|
|
39
|
+
items: []
|
|
40
|
+
notes: []
|
|
41
|
+
resources:
|
|
42
|
+
minimum:
|
|
43
|
+
cpu_cores: 8
|
|
44
|
+
ram_gb: 32
|
|
45
|
+
disk_gb: 80
|
|
46
|
+
gpu_count: 1
|
|
47
|
+
gpu_vram_gb: 16
|
|
48
|
+
recommended:
|
|
49
|
+
cpu_cores: 16
|
|
50
|
+
ram_gb: 64
|
|
51
|
+
disk_gb: 150
|
|
52
|
+
gpu_count: 1
|
|
53
|
+
gpu_vram_gb: 24
|
|
54
|
+
environment:
|
|
55
|
+
python: '3.10'
|
|
56
|
+
cuda: '12.1'
|
|
57
|
+
pytorch: 2.1.1
|
|
58
|
+
flash_attn: null
|
|
59
|
+
key_packages:
|
|
60
|
+
- mamba-ssm>=1.2.0
|
|
61
|
+
notes:
|
|
62
|
+
- Environment specifications are provisional based on the paper and upstream restoration requirements.
|
|
63
|
+
- The current staged snapshot does not preserve executable setup files or runnable source code.
|
|
64
|
+
- Full dependency set should be obtained from the published Q-Mamba source repository.
|
|
65
|
+
- mamba-ssm is the core architectural dependency for the Mamba-based RL agent.
|
|
66
|
+
risk_flags:
|
|
67
|
+
- source_snapshot_incomplete
|
|
68
|
+
- route_caveat
|
|
69
|
+
- no_executable_anchor
|
|
70
|
+
risk_notes:
|
|
71
|
+
- No executable code files detected in the current snapshot that can anchor staged metrics.
|
|
72
|
+
- No benchmark execution was performed during this packaging pass.
|
|
73
|
+
- The primary metric mean_reward is blocked pending source restoration.
|
|
74
|
+
- Treat this entry as blocked until upstream restoration provides a runnable implementation.
|
|
75
|
+
recommended_when: 当你需要对 Q-Mamba 离线元优化方法进行基于论文的分析,或规划恢复 Mamba 元学习黑盒优化路线时可用本条目。也适合理解长时程配置任务中的 Q 函数分解。
|
|
76
|
+
not_recommended_when: 不要把当前本地包视为可直接运行的离线元黑盒优化基准。分阶段快照缺少可执行代码、评估协议和基准数据,恢复实现前不应尝试顺序优化运行。
|
|
77
|
+
paper:
|
|
78
|
+
title: Meta-Black-Box-Optimization through Offline Q-function Learning
|
|
79
|
+
authors: Zeyuan Ma, Zhiguang Cao, Zhou Jiang, Hongshu Guo, Yue-Jiao Gong
|
|
80
|
+
venue: ICML 2025
|
|
81
|
+
year: 2025
|
|
82
|
+
url: https://proceedings.mlr.press/v267/ma25b.html
|
|
83
|
+
notes:
|
|
84
|
+
- Proposes Q-Mamba framework for offline MetaBBO with Q-function decomposition.
|
|
85
|
+
- Addresses effectiveness-efficiency trade-off in meta-learning for dynamic algorithm configuration.
|
|
86
|
+
- Uses Mamba architecture for long-sequence learning with parallel scan efficiency.
|
|
87
|
+
- Source code is available online per the paper.
|
|
88
|
+
download:
|
|
89
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.081_qmamba.zip
|
|
90
|
+
archive_type: zip
|
|
91
|
+
local_dir_name: paper-81-QMamba
|
|
92
|
+
notes:
|
|
93
|
+
- Archive contains metadata and documentation; executable code requires restoration from upstream.
|
|
94
|
+
provider: github_release
|
|
95
|
+
repo: ResearAI/DeepScientist
|
|
96
|
+
tag: aisb-v0.0.1
|
|
97
|
+
asset_name: aisb.t3.081_qmamba.zip
|
|
98
|
+
sha256: f565acdff164658ee030066f9a6c81cb7685ad3616de081df7c56a837b33cfd4
|
|
99
|
+
size_bytes: 31451
|
|
100
|
+
display:
|
|
101
|
+
palette_seed: slate-gold-offline
|
|
102
|
+
art_style: trajectory-systems
|
|
103
|
+
accent_priority: high
|
|
104
|
+
image_path: ../image/081_aisb.t3.081_qmamba.jpg
|
|
105
|
+
capability_tags:
|
|
106
|
+
- research_code_optimization
|
|
107
|
+
- black_box_optimization
|
|
108
|
+
- offline_rl
|
|
109
|
+
- mamba_models
|
|
110
|
+
- meta_learning
|
|
111
|
+
- q_function_decomposition
|
|
112
|
+
- dynamic_algorithm_configuration
|
|
113
|
+
- long_sequence_decision
|
|
114
|
+
aisb_direction: T3
|
|
115
|
+
track_fit:
|
|
116
|
+
- paper_track
|
|
117
|
+
- benchmark_track
|
|
@@ -0,0 +1,160 @@
|
|
|
1
|
+
id: aisb.t3.082_onlinellmrouting
|
|
2
|
+
name: Online LLM Routing
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: Training-free online router allocating prompts across multiple LLMs under
|
|
5
|
+
token budget constraints using ANNS and one-time optimization.
|
|
6
|
+
task_description: 'This benchmark implements a training-free online routing algorithm
|
|
7
|
+
for high-volume multi-LLM serving under constrained token budgets. The system uses
|
|
8
|
+
Approximate Nearest Neighbor Search (ANNS) to efficiently estimate query features
|
|
9
|
+
for each deployed LLM from a historical auxiliary dataset, then performs a one-time
|
|
10
|
+
Mixed-Integer Linear Programming (MILP) optimization over a small sample set of
|
|
11
|
+
observed queries (typically ~250) to learn routing weights. These weights guide
|
|
12
|
+
routing decisions for subsequent queries arriving sequentially. The approach requires
|
|
13
|
+
no model training and introduces negligible deployment overhead, making it adaptable
|
|
14
|
+
to dynamic LLM deployment configurations. Theoretical analysis guarantees a competitive
|
|
15
|
+
ratio of 1 - o(1) under mild assumptions.
|
|
16
|
+
|
|
17
|
+
'
|
|
18
|
+
task_mode: evaluation_driven
|
|
19
|
+
requires_execution: true
|
|
20
|
+
requires_paper: true
|
|
21
|
+
integrity_level: cas_plus_canary
|
|
22
|
+
snapshot_status: restore_needed
|
|
23
|
+
support_level: recovery
|
|
24
|
+
time_band: 1-2h
|
|
25
|
+
cost_band: low
|
|
26
|
+
difficulty: medium
|
|
27
|
+
data_access: public
|
|
28
|
+
primary_outputs:
|
|
29
|
+
- quality_score
|
|
30
|
+
- routing_decisions
|
|
31
|
+
- cost_efficiency_metrics
|
|
32
|
+
- throughput_metrics
|
|
33
|
+
launch_profiles:
|
|
34
|
+
- id: analysis_only
|
|
35
|
+
label: Analysis Only
|
|
36
|
+
description: Review preserved routing benchmark metadata, target objective function,
|
|
37
|
+
and MILP formulation. No execution performed.
|
|
38
|
+
- id: restore_first
|
|
39
|
+
label: Restore First
|
|
40
|
+
description: Restore missing online routing implementation and ANNS components before
|
|
41
|
+
treating this benchmark as runnable. Current snapshot lacks executable code anchors.
|
|
42
|
+
dataset_download:
|
|
43
|
+
primary_method: mixed
|
|
44
|
+
sources:
|
|
45
|
+
- type: external_archive
|
|
46
|
+
url: https://deepscientist.cc/AISB/082_onlinellmrouting
|
|
47
|
+
archive_type: zip
|
|
48
|
+
local_dir_name: paper-82-OnlineLLMRouting
|
|
49
|
+
- type: github_repository
|
|
50
|
+
url: https://github.com/fzwark/PORT
|
|
51
|
+
note: Original implementation source referenced in paper
|
|
52
|
+
notes:
|
|
53
|
+
- Archive contains bundled README and requirements for full dependency set
|
|
54
|
+
- Benchmark datasets referenced in paper not included in snapshot
|
|
55
|
+
credential_requirements:
|
|
56
|
+
mode: none
|
|
57
|
+
items: []
|
|
58
|
+
notes:
|
|
59
|
+
- No API credentials required for CPU-only routing evaluation
|
|
60
|
+
- LLM inference APIs not required for the core routing algorithm evaluation
|
|
61
|
+
resources:
|
|
62
|
+
minimum:
|
|
63
|
+
cpu_cores: 8
|
|
64
|
+
ram_gb: 16
|
|
65
|
+
disk_gb: 30
|
|
66
|
+
gpu_count: 0
|
|
67
|
+
gpu_vram_gb: 0
|
|
68
|
+
recommended:
|
|
69
|
+
cpu_cores: 16
|
|
70
|
+
ram_gb: 32
|
|
71
|
+
disk_gb: 80
|
|
72
|
+
gpu_count: 0
|
|
73
|
+
gpu_vram_gb: 0
|
|
74
|
+
notes:
|
|
75
|
+
- CPU-only execution is fully viable for the minimum routing implementation
|
|
76
|
+
- ANNS operations (FAISS) are CPU-optimized with faiss_cpu package
|
|
77
|
+
- No GPU required for MILP solver or routing weight optimization
|
|
78
|
+
- Memory requirements scale with auxiliary dataset size for ANNS indexing
|
|
79
|
+
environment:
|
|
80
|
+
python: '3.10'
|
|
81
|
+
cuda: null
|
|
82
|
+
pytorch: 2.6.0
|
|
83
|
+
flash_attn: null
|
|
84
|
+
key_packages:
|
|
85
|
+
- faiss_cpu==1.10.0
|
|
86
|
+
- transformers==4.51.0
|
|
87
|
+
notes:
|
|
88
|
+
- faiss_cpu provides ANNS index for query feature estimation
|
|
89
|
+
- transformers is used for embedding generation if the auxiliary dataset requires it
|
|
90
|
+
- Full dependency list provided in bundled requirements.txt
|
|
91
|
+
risk_flags:
|
|
92
|
+
- snapshot_incomplete
|
|
93
|
+
- blocked_no_code
|
|
94
|
+
risk_notes:
|
|
95
|
+
- Current snapshot does not expose executable code files anchoring staged metrics
|
|
96
|
+
- No benchmark execution was performed in this packaging pass
|
|
97
|
+
- Treat as blocked until source restoration or richer local snapshot is recovered
|
|
98
|
+
- Top-level README absent in current snapshot
|
|
99
|
+
recommended_when: 'Use this benchmark for systems-routing research focused on retrieval,
|
|
100
|
+
optimization, and budget allocation under token constraints. Ideal for evaluating
|
|
101
|
+
training-free approaches to multi-LLM serving that require rapid routing decisions
|
|
102
|
+
without model retraining.
|
|
103
|
+
|
|
104
|
+
'
|
|
105
|
+
not_recommended_when: 'Do not use this benchmark if you require local GPU finetuning
|
|
106
|
+
of language models, offline ensemble methods with multiple model calls per query,
|
|
107
|
+
or tasks requiring model-based predictors that need training overhead.
|
|
108
|
+
|
|
109
|
+
'
|
|
110
|
+
paper:
|
|
111
|
+
title: Efficient Training-Free Online Routing for High-Volume Multi-LLM Serving
|
|
112
|
+
venue: NeurIPS 2025
|
|
113
|
+
year: 2025
|
|
114
|
+
url: https://openreview.net/forum?id=d4mZyZB5I9
|
|
115
|
+
authors:
|
|
116
|
+
- Fangzhou Wu
|
|
117
|
+
- Sandeep Silwal
|
|
118
|
+
institution: University of Wisconsin-Madison
|
|
119
|
+
display:
|
|
120
|
+
palette_seed: silver-blue-router
|
|
121
|
+
art_style: serving-console
|
|
122
|
+
accent_priority: high
|
|
123
|
+
image_path: ../image/082_aisb.t3.082_onlinellmrouting.jpg
|
|
124
|
+
capability_tags:
|
|
125
|
+
- research_code_optimization
|
|
126
|
+
- llm_routing
|
|
127
|
+
- approximate_nearest_neighbors
|
|
128
|
+
- serving_systems
|
|
129
|
+
- online_optimization
|
|
130
|
+
- milp
|
|
131
|
+
- budget_allocation
|
|
132
|
+
track_fit:
|
|
133
|
+
- paper_track
|
|
134
|
+
- benchmark_track
|
|
135
|
+
aisb_direction: T3
|
|
136
|
+
metric_contract:
|
|
137
|
+
primary_metric: quality_score
|
|
138
|
+
status: blocked_no_code
|
|
139
|
+
notes:
|
|
140
|
+
- No executable code anchor in current snapshot
|
|
141
|
+
- Metric surface blocked until routing implementation is restored
|
|
142
|
+
- Original paper reports 3.55x overall performance improvement and 1.85x cost efficiency
|
|
143
|
+
against 8 baselines
|
|
144
|
+
commercial:
|
|
145
|
+
annual_fee: null
|
|
146
|
+
recovery_rule: 'Prefer existing code files over README-only claims when choosing origin_path,
|
|
147
|
+
source_ref, and evaluation_protocol.code_paths. Keep metrics_summary empty until
|
|
148
|
+
trusted execution outputs exist. If the current snapshot has no executable anchor
|
|
149
|
+
for a metric, mark that metric as provisional or blocked instead of inventing support.
|
|
150
|
+
|
|
151
|
+
'
|
|
152
|
+
download:
|
|
153
|
+
provider: github_release
|
|
154
|
+
repo: ResearAI/DeepScientist
|
|
155
|
+
tag: aisb-v0.0.1
|
|
156
|
+
asset_name: aisb.t3.082_onlinellmrouting.zip
|
|
157
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.082_onlinellmrouting.zip
|
|
158
|
+
archive_type: zip
|
|
159
|
+
sha256: 60d8ccca2c47273b6fa1cd022d1625bd395bd8358d3ef7f79234036d9b1d8a04
|
|
160
|
+
size_bytes: 54262
|
|
@@ -0,0 +1,133 @@
|
|
|
1
|
+
id: aisb.t3.082_onlinellmrouting
|
|
2
|
+
name: Online LLM Routing
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: 无需训练的在线路由器:在 token 预算约束下,结合 ANNS 与一次性优化在多个 LLM 间分配请求。
|
|
5
|
+
task_description: 该基准实现了面向高吞吐多 LLM 服务的无训练在线路由算法。系统先用近似最近邻搜索(ANNS)从历史辅助数据中高效估计每个已部署 LLM 的查询特征,再在少量已观测查询样本(通常约 250)上进行一次混合整数线性规划(MILP)以学习路由权重,随后用于后续顺序到达查询的路由决策。该方法无需模型训练,部署额外开销极低,适配动态 LLM 部署配置。理论上在温和假设下可保证 1 - o(1) 的竞争比。
|
|
6
|
+
task_mode: evaluation_driven
|
|
7
|
+
requires_execution: true
|
|
8
|
+
requires_paper: true
|
|
9
|
+
integrity_level: cas_plus_canary
|
|
10
|
+
snapshot_status: restore_needed
|
|
11
|
+
support_level: recovery
|
|
12
|
+
time_band: 1-2h
|
|
13
|
+
cost_band: low
|
|
14
|
+
difficulty: medium
|
|
15
|
+
data_access: public
|
|
16
|
+
primary_outputs:
|
|
17
|
+
- quality_score
|
|
18
|
+
- routing_decisions
|
|
19
|
+
- cost_efficiency_metrics
|
|
20
|
+
- throughput_metrics
|
|
21
|
+
launch_profiles:
|
|
22
|
+
- id: analysis_only
|
|
23
|
+
label: Analysis Only
|
|
24
|
+
description: Review preserved routing benchmark metadata, target objective function, and MILP formulation. No execution performed.
|
|
25
|
+
- id: restore_first
|
|
26
|
+
label: Restore First
|
|
27
|
+
description: Restore missing online routing implementation and ANNS components before treating this benchmark as runnable. Current snapshot lacks executable code anchors.
|
|
28
|
+
dataset_download:
|
|
29
|
+
primary_method: mixed
|
|
30
|
+
sources:
|
|
31
|
+
- type: external_archive
|
|
32
|
+
url: https://deepscientist.cc/AISB/082_onlinellmrouting
|
|
33
|
+
archive_type: zip
|
|
34
|
+
local_dir_name: paper-82-OnlineLLMRouting
|
|
35
|
+
- type: github_repository
|
|
36
|
+
url: https://github.com/fzwark/PORT
|
|
37
|
+
note: Original implementation source referenced in paper
|
|
38
|
+
notes:
|
|
39
|
+
- Archive contains bundled README and requirements for full dependency set
|
|
40
|
+
- Benchmark datasets referenced in paper not included in snapshot
|
|
41
|
+
credential_requirements:
|
|
42
|
+
mode: none
|
|
43
|
+
items: []
|
|
44
|
+
notes:
|
|
45
|
+
- No API credentials required for CPU-only routing evaluation
|
|
46
|
+
- LLM inference APIs not required for the core routing algorithm evaluation
|
|
47
|
+
resources:
|
|
48
|
+
minimum:
|
|
49
|
+
cpu_cores: 8
|
|
50
|
+
ram_gb: 16
|
|
51
|
+
disk_gb: 30
|
|
52
|
+
gpu_count: 0
|
|
53
|
+
gpu_vram_gb: 0
|
|
54
|
+
recommended:
|
|
55
|
+
cpu_cores: 16
|
|
56
|
+
ram_gb: 32
|
|
57
|
+
disk_gb: 80
|
|
58
|
+
gpu_count: 0
|
|
59
|
+
gpu_vram_gb: 0
|
|
60
|
+
notes:
|
|
61
|
+
- CPU-only execution is fully viable for the minimum routing implementation
|
|
62
|
+
- ANNS operations (FAISS) are CPU-optimized with faiss_cpu package
|
|
63
|
+
- No GPU required for MILP solver or routing weight optimization
|
|
64
|
+
- Memory requirements scale with auxiliary dataset size for ANNS indexing
|
|
65
|
+
environment:
|
|
66
|
+
python: '3.10'
|
|
67
|
+
cuda: null
|
|
68
|
+
pytorch: 2.6.0
|
|
69
|
+
flash_attn: null
|
|
70
|
+
key_packages:
|
|
71
|
+
- faiss_cpu==1.10.0
|
|
72
|
+
- transformers==4.51.0
|
|
73
|
+
notes:
|
|
74
|
+
- faiss_cpu provides ANNS index for query feature estimation
|
|
75
|
+
- transformers is used for embedding generation if the auxiliary dataset requires it
|
|
76
|
+
- Full dependency list provided in bundled requirements.txt
|
|
77
|
+
risk_flags:
|
|
78
|
+
- snapshot_incomplete
|
|
79
|
+
- blocked_no_code
|
|
80
|
+
risk_notes:
|
|
81
|
+
- Current snapshot does not expose executable code files anchoring staged metrics
|
|
82
|
+
- No benchmark execution was performed in this packaging pass
|
|
83
|
+
- Treat as blocked until source restoration or richer local snapshot is recovered
|
|
84
|
+
- Top-level README absent in current snapshot
|
|
85
|
+
recommended_when: 当你研究在 token 预算约束下的检索、优化与预算分配型路由系统时使用本基准。适合评估无需重训练即可快速决策的多 LLM 服务路由方案。
|
|
86
|
+
not_recommended_when: 如果你需要本地 GPU 微调语言模型、每查询多模型离线集成,或依赖需训练预测器的任务,不建议使用。
|
|
87
|
+
paper:
|
|
88
|
+
title: Efficient Training-Free Online Routing for High-Volume Multi-LLM Serving
|
|
89
|
+
venue: NeurIPS 2025
|
|
90
|
+
year: 2025
|
|
91
|
+
url: https://openreview.net/forum?id=d4mZyZB5I9
|
|
92
|
+
authors:
|
|
93
|
+
- Fangzhou Wu
|
|
94
|
+
- Sandeep Silwal
|
|
95
|
+
institution: University of Wisconsin-Madison
|
|
96
|
+
display:
|
|
97
|
+
palette_seed: silver-blue-router
|
|
98
|
+
art_style: serving-console
|
|
99
|
+
accent_priority: high
|
|
100
|
+
image_path: ../image/082_aisb.t3.082_onlinellmrouting.jpg
|
|
101
|
+
capability_tags:
|
|
102
|
+
- research_code_optimization
|
|
103
|
+
- llm_routing
|
|
104
|
+
- approximate_nearest_neighbors
|
|
105
|
+
- serving_systems
|
|
106
|
+
- online_optimization
|
|
107
|
+
- milp
|
|
108
|
+
- budget_allocation
|
|
109
|
+
track_fit:
|
|
110
|
+
- paper_track
|
|
111
|
+
- benchmark_track
|
|
112
|
+
aisb_direction: T3
|
|
113
|
+
metric_contract:
|
|
114
|
+
primary_metric: quality_score
|
|
115
|
+
status: blocked_no_code
|
|
116
|
+
notes:
|
|
117
|
+
- No executable code anchor in current snapshot
|
|
118
|
+
- Metric surface blocked until routing implementation is restored
|
|
119
|
+
- Original paper reports 3.55x overall performance improvement and 1.85x cost efficiency against 8 baselines
|
|
120
|
+
commercial:
|
|
121
|
+
annual_fee: null
|
|
122
|
+
recovery_rule: 'Prefer existing code files over README-only claims when choosing origin_path, source_ref, and evaluation_protocol.code_paths. Keep metrics_summary empty until trusted execution outputs exist. If the current snapshot has no executable anchor for a metric, mark that metric as provisional or blocked instead of inventing support.
|
|
123
|
+
|
|
124
|
+
'
|
|
125
|
+
download:
|
|
126
|
+
provider: github_release
|
|
127
|
+
repo: ResearAI/DeepScientist
|
|
128
|
+
tag: aisb-v0.0.1
|
|
129
|
+
asset_name: aisb.t3.082_onlinellmrouting.zip
|
|
130
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.082_onlinellmrouting.zip
|
|
131
|
+
archive_type: zip
|
|
132
|
+
sha256: 60d8ccca2c47273b6fa1cd022d1625bd395bd8358d3ef7f79234036d9b1d8a04
|
|
133
|
+
size_bytes: 54262
|