@researai/deepscientist 1.5.17 → 1.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +309 -130
- package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
- package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
- package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
- package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
- package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
- package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
- package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
- package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
- package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
- package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
- package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
- package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
- package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
- package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
- package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
- package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
- package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
- package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
- package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
- package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
- package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
- package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
- package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
- package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
- package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
- package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
- package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
- package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
- package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
- package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
- package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
- package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
- package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
- package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
- package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
- package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
- package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
- package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
- package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
- package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
- package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
- package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
- package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
- package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
- package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
- package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
- package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
- package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
- package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
- package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
- package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
- package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
- package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
- package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
- package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
- package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
- package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
- package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
- package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
- package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
- package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
- package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
- package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
- package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
- package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
- package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
- package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
- package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
- package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
- package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
- package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
- package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
- package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
- package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
- package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
- package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
- package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
- package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
- package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
- package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
- package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
- package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
- package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
- package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
- package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
- package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
- package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
- package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
- package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
- package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
- package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
- package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
- package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
- package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
- package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
- package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
- package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
- package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
- package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
- package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
- package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
- package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
- package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
- package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
- package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
- package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
- package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
- package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
- package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
- package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
- package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
- package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
- package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
- package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
- package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
- package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
- package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
- package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
- package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
- package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
- package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
- package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
- package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
- package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
- package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
- package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
- package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
- package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
- package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
- package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
- package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
- package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
- package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
- package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
- package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
- package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
- package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
- package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
- package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
- package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
- package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
- package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
- package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
- package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
- package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
- package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
- package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
- package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
- package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
- package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
- package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
- package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
- package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
- package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
- package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
- package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
- package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
- package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
- package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
- package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
- package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
- package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
- package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
- package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
- package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
- package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
- package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
- package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
- package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
- package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
- package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
- package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
- package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
- package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
- package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
- package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
- package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
- package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
- package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
- package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
- package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
- package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
- package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
- package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
- package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
- package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
- package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
- package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
- package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
- package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
- package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
- package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
- package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
- package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
- package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
- package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
- package/AISB/image/aisb.b10.climate_earth.svg +16 -0
- package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
- package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
- package/AISB/image/aisb.b2.agent_systems.svg +16 -0
- package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
- package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
- package/AISB/image/aisb.b5.math_proof.svg +16 -0
- package/AISB/image/aisb.b6.research_process.svg +16 -0
- package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
- package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
- package/AISB/image/aisb.b9.material_science.svg +16 -0
- package/README.md +132 -11
- package/bin/ds.js +376 -49
- package/docs/en/00_QUICK_START.md +135 -18
- package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
- package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
- package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
- package/docs/en/05_TUI_GUIDE.md +171 -2
- package/docs/en/07_MEMORY_AND_MCP.md +38 -2
- package/docs/en/09_DOCTOR.md +64 -4
- package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
- package/docs/en/11_LICENSE_AND_RISK.md +4 -0
- package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/en/15_CODEX_PROVIDER_SETUP.md +622 -187
- package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
- package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
- package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
- package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
- package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
- package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
- package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
- package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
- package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
- package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
- package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
- package/docs/en/91_DEVELOPMENT.md +29 -0
- package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
- package/docs/en/README.md +44 -7
- package/docs/images/admin/admin-connectors-health-en.png +0 -0
- package/docs/images/admin/admin-controllers-en.png +0 -0
- package/docs/images/admin/admin-diagnostics-en.png +0 -0
- package/docs/images/admin/admin-errors-en.png +0 -0
- package/docs/images/admin/admin-issues-en.png +0 -0
- package/docs/images/admin/admin-logs-en.png +0 -0
- package/docs/images/admin/admin-quest-detail-en.png +0 -0
- package/docs/images/admin/admin-quests-en.png +0 -0
- package/docs/images/admin/admin-repairs-en.png +0 -0
- package/docs/images/admin/admin-runtime-en.png +0 -0
- package/docs/images/admin/admin-search-en.png +0 -0
- package/docs/images/admin/admin-stats-en.png +0 -0
- package/docs/images/admin/admin-summary-en.png +0 -0
- package/docs/images/connectors/connector-discord-en.png +0 -0
- package/docs/images/connectors/connector-feishu-en.png +0 -0
- package/docs/images/connectors/connector-lingzhu-en.png +0 -0
- package/docs/images/connectors/connector-qq-en.png +0 -0
- package/docs/images/connectors/connector-slack-en.png +0 -0
- package/docs/images/connectors/connector-telegram-en.png +0 -0
- package/docs/images/connectors/connector-weixin-en.png +0 -0
- package/docs/images/connectors/connector-whatsapp-en.png +0 -0
- package/docs/images/settings/settings-baselines-en.png +0 -0
- package/docs/images/settings/settings-config-en.png +0 -0
- package/docs/images/settings/settings-connectors-overview-en.png +0 -0
- package/docs/images/settings/settings-deepxiv-en.png +0 -0
- package/docs/images/settings/settings-mcp-servers-en.png +0 -0
- package/docs/images/settings/settings-plugins-en.png +0 -0
- package/docs/images/settings/settings-runners-en.png +0 -0
- package/docs/zh/00_QUICK_START.md +92 -17
- package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
- package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/zh/05_TUI_GUIDE.md +171 -2
- package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
- package/docs/zh/09_DOCTOR.md +39 -4
- package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
- package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
- package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/zh/15_CODEX_PROVIDER_SETUP.md +550 -188
- package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
- package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
- package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
- package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
- package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
- package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
- package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
- package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
- package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
- package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
- package/docs/zh/README.md +29 -7
- package/install.sh +122 -16
- package/package.json +4 -1
- package/pyproject.toml +2 -1
- package/src/deepscientist/__init__.py +1 -1
- package/src/deepscientist/acp/envelope.py +13 -0
- package/src/deepscientist/admin/__init__.py +3 -0
- package/src/deepscientist/admin/charts.py +681 -0
- package/src/deepscientist/admin/logs.py +119 -0
- package/src/deepscientist/admin/repairs.py +217 -0
- package/src/deepscientist/admin/service.py +1310 -0
- package/src/deepscientist/admin/system_info.py +700 -0
- package/src/deepscientist/admin/tasks.py +465 -0
- package/src/deepscientist/admin/tool_metrics.py +600 -0
- package/src/deepscientist/artifact/guidance.py +8 -4
- package/src/deepscientist/artifact/schemas.py +115 -0
- package/src/deepscientist/artifact/service.py +4268 -260
- package/src/deepscientist/bash_exec/monitor.py +30 -3
- package/src/deepscientist/bash_exec/service.py +134 -1
- package/src/deepscientist/benchstore/__init__.py +4 -0
- package/src/deepscientist/benchstore/prompt_builder.py +224 -0
- package/src/deepscientist/benchstore/service.py +1716 -0
- package/src/deepscientist/channels/weixin_ilink.py +8 -1
- package/src/deepscientist/cli.py +92 -17
- package/src/deepscientist/codex_cli_compat.py +2 -2
- package/src/deepscientist/config/models.py +82 -11
- package/src/deepscientist/config/service.py +927 -91
- package/src/deepscientist/connector/weixin_support.py +48 -17
- package/src/deepscientist/daemon/api/handlers.py +697 -210
- package/src/deepscientist/daemon/api/router.py +76 -1
- package/src/deepscientist/daemon/app.py +1054 -51
- package/src/deepscientist/diagnostics/runner_failures.py +147 -0
- package/src/deepscientist/doctor.py +212 -65
- package/src/deepscientist/evidence_packets.py +590 -0
- package/src/deepscientist/home.py +52 -4
- package/src/deepscientist/kimi_cli_compat.py +50 -0
- package/src/deepscientist/latex_runtime.py +2 -2
- package/src/deepscientist/mcp/context.py +2 -0
- package/src/deepscientist/mcp/schemas.py +114 -0
- package/src/deepscientist/mcp/server.py +1566 -126
- package/src/deepscientist/memory/service.py +203 -16
- package/src/deepscientist/process_control.py +8 -1
- package/src/deepscientist/prompts/builder.py +836 -92
- package/src/deepscientist/quest/__init__.py +2 -2
- package/src/deepscientist/quest/layout.py +12 -1
- package/src/deepscientist/quest/node_traces.py +10 -0
- package/src/deepscientist/quest/service.py +1430 -139
- package/src/deepscientist/quest/stage_views.py +1 -1
- package/src/deepscientist/runners/__init__.py +18 -0
- package/src/deepscientist/runners/base.py +89 -1
- package/src/deepscientist/runners/builtins.py +13 -1
- package/src/deepscientist/runners/claude.py +391 -0
- package/src/deepscientist/runners/codex.py +421 -21
- package/src/deepscientist/runners/codex_telemetry.py +127 -0
- package/src/deepscientist/runners/kimi.py +334 -0
- package/src/deepscientist/runners/metadata.py +68 -0
- package/src/deepscientist/runners/opencode.py +414 -0
- package/src/deepscientist/runners/runtime_overrides.py +100 -0
- package/src/deepscientist/runners/simple_cli.py +538 -0
- package/src/deepscientist/runtime_storage.py +303 -0
- package/src/deepscientist/shared.py +61 -16
- package/src/deepscientist/skills/installer.py +37 -0
- package/src/deepscientist/skills/registry.py +2 -0
- package/src/deepscientist/tinytex.py +2 -2
- package/src/deepscientist/tui.py +10 -3
- package/src/prompts/benchstore/system.md +77 -0
- package/src/prompts/connectors/qq.md +33 -2
- package/src/prompts/connectors/weixin.md +208 -23
- package/src/prompts/contracts/admin_ops.md +74 -0
- package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
- package/src/prompts/contracts/shared_interaction.md +5 -11
- package/src/prompts/start_setup/system.md +422 -0
- package/src/prompts/system.md +409 -315
- package/src/prompts/system_copilot.md +88 -12
- package/src/skills/analysis-campaign/SKILL.md +239 -578
- package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
- package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
- package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
- package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
- package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
- package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
- package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
- package/src/skills/baseline/SKILL.md +183 -461
- package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
- package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
- package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
- package/src/skills/baseline/references/baseline-plan-template.md +37 -76
- package/src/skills/baseline/references/boundary-cases.md +86 -0
- package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
- package/src/skills/baseline/references/comparability-contract.md +7 -12
- package/src/skills/baseline/references/operational-guidance.md +56 -0
- package/src/skills/baseline/references/route-selection.md +5 -25
- package/src/skills/decision/SKILL.md +113 -306
- package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
- package/src/skills/decision/references/operational-guidance.md +94 -0
- package/src/skills/decision/references/research-route-criteria.md +7 -8
- package/src/skills/decision/references/strategic-decision-template.md +13 -26
- package/src/skills/experiment/SKILL.md +132 -670
- package/src/skills/experiment/references/execution-playbook.md +374 -0
- package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
- package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
- package/src/skills/experiment/references/operational-guidance.md +108 -0
- package/src/skills/finalize/SKILL.md +62 -0
- package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
- package/src/skills/finalize/references/resume-packet-template.md +7 -0
- package/src/skills/idea/SKILL.md +228 -15
- package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
- package/src/skills/idea/references/current-board-packet-template.md +61 -0
- package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
- package/src/skills/idea/references/idea-generation-playbook.md +21 -0
- package/src/skills/idea/references/idea-thinking-flow.md +6 -0
- package/src/skills/idea/references/literature-survey-template.md +3 -0
- package/src/skills/idea/references/objective-contract-template.md +54 -0
- package/src/skills/idea/references/outline-seeding-example.md +56 -0
- package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
- package/src/skills/idea/references/related-work-playbook.md +75 -2
- package/src/skills/idea/references/research-history-playbook.md +114 -0
- package/src/skills/idea/references/selection-gate.md +58 -6
- package/src/skills/intake-audit/SKILL.md +43 -2
- package/src/skills/intake-audit/references/state-audit-template.md +10 -0
- package/src/skills/nature-data/SKILL.md +128 -0
- package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-data/agents/openai.yaml +4 -0
- package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
- package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
- package/src/skills/nature-data/references/policy-principles.md +103 -0
- package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
- package/src/skills/nature-data/references/source-basis.md +54 -0
- package/src/skills/nature-data/references/statement-patterns.md +153 -0
- package/src/skills/nature-figure/SKILL.md +197 -0
- package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-figure/agents/openai.yaml +4 -0
- package/src/skills/nature-figure/evals/evals.json +37 -0
- package/src/skills/nature-figure/references/api.md +428 -0
- package/src/skills/nature-figure/references/backend-selection.md +100 -0
- package/src/skills/nature-figure/references/chart-types.md +281 -0
- package/src/skills/nature-figure/references/common-patterns.md +349 -0
- package/src/skills/nature-figure/references/design-theory.md +436 -0
- package/src/skills/nature-figure/references/figure-contract.md +93 -0
- package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
- package/src/skills/nature-figure/references/qa-contract.md +119 -0
- package/src/skills/nature-figure/references/r-template-index.md +66 -0
- package/src/skills/nature-figure/references/r-workflow.md +161 -0
- package/src/skills/nature-figure/references/tutorials.md +250 -0
- package/src/skills/nature-paper2ppt/SKILL.md +507 -0
- package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/SKILL.md +385 -0
- package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-polishing/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
- package/src/skills/nature-polishing/references/section-moves.md +240 -0
- package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
- package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
- package/src/skills/optimize/SKILL.md +177 -1568
- package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
- package/src/skills/optimize/references/candidate-board-template.md +13 -0
- package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
- package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
- package/src/skills/optimize/references/debug-response-template.md +29 -0
- package/src/skills/optimize/references/frontier-review-template.md +32 -0
- package/src/skills/optimize/references/fusion-playbook.md +36 -0
- package/src/skills/optimize/references/method-brief-template.md +73 -0
- package/src/skills/optimize/references/operational-guidance.md +621 -0
- package/src/skills/optimize/references/optimization-memory-template.md +30 -0
- package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
- package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
- package/src/skills/optimize/references/prompt-patterns.md +49 -0
- package/src/skills/paper-outline/SKILL.md +227 -0
- package/src/skills/paper-outline/references/outline-patterns.md +87 -0
- package/src/skills/paper-plot/SKILL.md +79 -0
- package/src/skills/paper-plot/agents/openai.yaml +4 -0
- package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
- package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
- package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
- package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
- package/src/skills/paper-plot/references/line_training_curve.md +44 -0
- package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
- package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
- package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
- package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
- package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
- package/src/skills/paper-plot/scripts/line_aime.py +94 -0
- package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
- package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
- package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
- package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
- package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
- package/src/skills/rebuttal/SKILL.md +9 -0
- package/src/skills/references/tool-usage-by-stage.md +438 -0
- package/src/skills/review/SKILL.md +105 -7
- package/src/skills/science/PROVENANCE.md +44 -0
- package/src/skills/science/SKILL.md +137 -0
- package/src/skills/science/references/artifact-science-tool.md +110 -0
- package/src/skills/science/references/claim-type-discipline.md +56 -0
- package/src/skills/science/references/domain-index.md +422 -0
- package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
- package/src/skills/science/references/package-check-playbook.md +64 -0
- package/src/skills/science/references/package-index.min.json +3616 -0
- package/src/skills/science/references/packages/abinit.md +80 -0
- package/src/skills/science/references/packages/acts.md +73 -0
- package/src/skills/science/references/packages/aiida-core.md +80 -0
- package/src/skills/science/references/packages/alamode.md +80 -0
- package/src/skills/science/references/packages/amuse.md +88 -0
- package/src/skills/science/references/packages/anndata.md +88 -0
- package/src/skills/science/references/packages/arbor.md +80 -0
- package/src/skills/science/references/packages/arc.md +73 -0
- package/src/skills/science/references/packages/astropy.md +88 -0
- package/src/skills/science/references/packages/astroquery.md +88 -0
- package/src/skills/science/references/packages/atomate2.md +80 -0
- package/src/skills/science/references/packages/atomsmltr.md +73 -0
- package/src/skills/science/references/packages/awkward.md +73 -0
- package/src/skills/science/references/packages/batman.md +88 -0
- package/src/skills/science/references/packages/biopython.md +88 -0
- package/src/skills/science/references/packages/bloqade.md +73 -0
- package/src/skills/science/references/packages/brian2.md +73 -0
- package/src/skills/science/references/packages/bullet3.md +73 -0
- package/src/skills/science/references/packages/calculix.md +80 -0
- package/src/skills/science/references/packages/cantera.md +73 -0
- package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
- package/src/skills/science/references/packages/ccdproc.md +88 -0
- package/src/skills/science/references/packages/celerite2.md +88 -0
- package/src/skills/science/references/packages/cellrank.md +73 -0
- package/src/skills/science/references/packages/cesm.md +80 -0
- package/src/skills/science/references/packages/chemicals.md +73 -0
- package/src/skills/science/references/packages/chempy.md +73 -0
- package/src/skills/science/references/packages/cirq.md +73 -0
- package/src/skills/science/references/packages/coffea.md +73 -0
- package/src/skills/science/references/packages/cp2k.md +88 -0
- package/src/skills/science/references/packages/custodian.md +80 -0
- package/src/skills/science/references/packages/dart.md +73 -0
- package/src/skills/science/references/packages/datamol.md +88 -0
- package/src/skills/science/references/packages/dd4hep.md +73 -0
- package/src/skills/science/references/packages/dealii.md +80 -0
- package/src/skills/science/references/packages/deepchem.md +88 -0
- package/src/skills/science/references/packages/delphes.md +73 -0
- package/src/skills/science/references/packages/devito.md +80 -0
- package/src/skills/science/references/packages/dftb.md +88 -0
- package/src/skills/science/references/packages/dftd4.md +88 -0
- package/src/skills/science/references/packages/dftk-jl.md +80 -0
- package/src/skills/science/references/packages/dolfinx.md +80 -0
- package/src/skills/science/references/packages/drake.md +73 -0
- package/src/skills/science/references/packages/dumux.md +73 -0
- package/src/skills/science/references/packages/elk.md +80 -0
- package/src/skills/science/references/packages/elmerfem.md +80 -0
- package/src/skills/science/references/packages/enzo-e.md +88 -0
- package/src/skills/science/references/packages/espresso.md +80 -0
- package/src/skills/science/references/packages/exoplanet.md +88 -0
- package/src/skills/science/references/packages/fairroot.md +73 -0
- package/src/skills/science/references/packages/fbpic.md +80 -0
- package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
- package/src/skills/science/references/packages/geant4.md +73 -0
- package/src/skills/science/references/packages/geosx.md +80 -0
- package/src/skills/science/references/packages/gprmax.md +80 -0
- package/src/skills/science/references/packages/gromacs.md +80 -0
- package/src/skills/science/references/packages/gwaslab.md +73 -0
- package/src/skills/science/references/packages/gz-sim.md +73 -0
- package/src/skills/science/references/packages/hail.md +88 -0
- package/src/skills/science/references/packages/hiphive.md +80 -0
- package/src/skills/science/references/packages/hoomd-blue.md +80 -0
- package/src/skills/science/references/packages/itensor.md +73 -0
- package/src/skills/science/references/packages/itensors-jl.md +73 -0
- package/src/skills/science/references/packages/jdftx.md +73 -0
- package/src/skills/science/references/packages/jobflow.md +80 -0
- package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
- package/src/skills/science/references/packages/kite.md +80 -0
- package/src/skills/science/references/packages/kratos.md +80 -0
- package/src/skills/science/references/packages/kwant.md +73 -0
- package/src/skills/science/references/packages/lammps.md +80 -0
- package/src/skills/science/references/packages/lightkurve.md +88 -0
- package/src/skills/science/references/packages/limix.md +73 -0
- package/src/skills/science/references/packages/maxwelllink.md +80 -0
- package/src/skills/science/references/packages/mcdc.md +73 -0
- package/src/skills/science/references/packages/meep.md +80 -0
- package/src/skills/science/references/packages/mfem.md +80 -0
- package/src/skills/science/references/packages/mitgcm.md +73 -0
- package/src/skills/science/references/packages/modflow6.md +73 -0
- package/src/skills/science/references/packages/molecool.md +73 -0
- package/src/skills/science/references/packages/mom6.md +73 -0
- package/src/skills/science/references/packages/moose.md +80 -0
- package/src/skills/science/references/packages/mpas-model.md +73 -0
- package/src/skills/science/references/packages/mujoco.md +73 -0
- package/src/skills/science/references/packages/mumax3.md +73 -0
- package/src/skills/science/references/packages/nekrs.md +80 -0
- package/src/skills/science/references/packages/nessi.md +73 -0
- package/src/skills/science/references/packages/nest-simulator.md +73 -0
- package/src/skills/science/references/packages/netket.md +73 -0
- package/src/skills/science/references/packages/neuron.md +73 -0
- package/src/skills/science/references/packages/nextflow.md +88 -0
- package/src/skills/science/references/packages/nwchem.md +88 -0
- package/src/skills/science/references/packages/openbabel.md +88 -0
- package/src/skills/science/references/packages/openems.md +80 -0
- package/src/skills/science/references/packages/openff-toolkit.md +88 -0
- package/src/skills/science/references/packages/openfoam-dev.md +80 -0
- package/src/skills/science/references/packages/openmc.md +73 -0
- package/src/skills/science/references/packages/openmm.md +80 -0
- package/src/skills/science/references/packages/openmoc.md +73 -0
- package/src/skills/science/references/packages/openmx.md +80 -0
- package/src/skills/science/references/packages/opensees.md +80 -0
- package/src/skills/science/references/packages/opensn.md +80 -0
- package/src/skills/science/references/packages/opm-simulators.md +73 -0
- package/src/skills/science/references/packages/oqupy.md +73 -0
- package/src/skills/science/references/packages/packmol.md +80 -0
- package/src/skills/science/references/packages/palabos.md +80 -0
- package/src/skills/science/references/packages/parflow.md +80 -0
- package/src/skills/science/references/packages/pennylane.md +88 -0
- package/src/skills/science/references/packages/perceval.md +73 -0
- package/src/skills/science/references/packages/phono3py.md +73 -0
- package/src/skills/science/references/packages/phonopy.md +73 -0
- package/src/skills/science/references/packages/photutils.md +88 -0
- package/src/skills/science/references/packages/picongpu.md +80 -0
- package/src/skills/science/references/packages/plink-ng.md +88 -0
- package/src/skills/science/references/packages/precice.md +73 -0
- package/src/skills/science/references/packages/psc.md +80 -0
- package/src/skills/science/references/packages/psi4.md +88 -0
- package/src/skills/science/references/packages/pybinding.md +73 -0
- package/src/skills/science/references/packages/pyfr.md +80 -0
- package/src/skills/science/references/packages/pyhf.md +73 -0
- package/src/skills/science/references/packages/pyiron_base.md +80 -0
- package/src/skills/science/references/packages/pylcp.md +73 -0
- package/src/skills/science/references/packages/pylith.md +80 -0
- package/src/skills/science/references/packages/pynbody.md +88 -0
- package/src/skills/science/references/packages/pysam.md +88 -0
- package/src/skills/science/references/packages/pyscf.md +88 -0
- package/src/skills/science/references/packages/q-e.md +73 -0
- package/src/skills/science/references/packages/qibo.md +73 -0
- package/src/skills/science/references/packages/qiskit.md +73 -0
- package/src/skills/science/references/packages/quantica-jl.md +73 -0
- package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
- package/src/skills/science/references/packages/quimb.md +73 -0
- package/src/skills/science/references/packages/qulacs.md +73 -0
- package/src/skills/science/references/packages/qutip.md +73 -0
- package/src/skills/science/references/packages/rdkit.md +88 -0
- package/src/skills/science/references/packages/rmg-py.md +73 -0
- package/src/skills/science/references/packages/root.md +73 -0
- package/src/skills/science/references/packages/scanpy.md +88 -0
- package/src/skills/science/references/packages/scikit-allel.md +88 -0
- package/src/skills/science/references/packages/scikit-bio.md +88 -0
- package/src/skills/science/references/packages/scqubits.md +73 -0
- package/src/skills/science/references/packages/scuff-em.md +80 -0
- package/src/skills/science/references/packages/scvi-tools.md +73 -0
- package/src/skills/science/references/packages/seissol.md +73 -0
- package/src/skills/science/references/packages/sfepy.md +80 -0
- package/src/skills/science/references/packages/sisl.md +73 -0
- package/src/skills/science/references/packages/smilei.md +80 -0
- package/src/skills/science/references/packages/snakemake.md +88 -0
- package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
- package/src/skills/science/references/packages/specutils.md +88 -0
- package/src/skills/science/references/packages/spglib.md +80 -0
- package/src/skills/science/references/packages/squidpy.md +88 -0
- package/src/skills/science/references/packages/starry.md +88 -0
- package/src/skills/science/references/packages/strawberryfields.md +73 -0
- package/src/skills/science/references/packages/su2.md +80 -0
- package/src/skills/science/references/packages/sunny-jl.md +73 -0
- package/src/skills/science/references/packages/sw4.md +73 -0
- package/src/skills/science/references/packages/swift.md +88 -0
- package/src/skills/science/references/packages/tdnegf.md +73 -0
- package/src/skills/science/references/packages/tenpy.md +73 -0
- package/src/skills/science/references/packages/thermo.md +73 -0
- package/src/skills/science/references/packages/tkwant.md +73 -0
- package/src/skills/science/references/packages/tvb-root.md +73 -0
- package/src/skills/science/references/packages/uproot5.md +73 -0
- package/src/skills/science/references/packages/vampire.md +80 -0
- package/src/skills/science/references/packages/wannier_tools.md +73 -0
- package/src/skills/science/references/packages/warpx.md +80 -0
- package/src/skills/science/references/packages/wrf.md +73 -0
- package/src/skills/science/references/packages/xtb.md +88 -0
- package/src/skills/science/references/packages/yt.md +73 -0
- package/src/skills/science/references/science-task-brief-template.md +71 -0
- package/src/skills/scout/SKILL.md +83 -425
- package/src/skills/scout/references/literature-scout-template.md +5 -24
- package/src/skills/scout/references/operational-guidance.md +191 -0
- package/src/skills/scout/references/paper-triage-playbook.md +11 -35
- package/src/skills/write/SKILL.md +744 -1246
- package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
- package/src/skills/write/references/oral_package_patterns.md +252 -0
- package/src/skills/write/references/oral_writing_principles.md +291 -0
- package/src/skills/write/references/section_rewrite_checklist.md +234 -0
- package/src/tui/dist/app/AppContainer.js +1314 -27
- package/src/tui/dist/components/Composer.js +26 -1
- package/src/tui/dist/components/ConfigScreen.js +2 -1
- package/src/tui/dist/components/InputPrompt.js +25 -9
- package/src/tui/dist/components/MainContent.js +18 -3
- package/src/tui/dist/components/QuestScreen.js +3 -2
- package/src/tui/dist/components/UtilityScreen.js +37 -0
- package/src/tui/dist/hooks/useSafeInput.js +10 -0
- package/src/tui/dist/index.js +13 -1
- package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
- package/src/tui/dist/lib/api.js +89 -1
- package/src/tui/package.json +1 -1
- package/src/ui/dist/assets/{AnalysisPlugin-BCKAfjba.js → AnalysisPlugin-CA94NGmI.js} +1 -1
- package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
- package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
- package/src/ui/dist/assets/{CodeViewerPlugin-CbaFRrUU.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
- package/src/ui/dist/assets/{DocViewerPlugin-DAjLVeQD.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
- package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
- package/src/ui/dist/assets/{GitDiffViewerPlugin-CQACjoAA.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
- package/src/ui/dist/assets/{GitSnapshotViewer-0r4nLPke.js → GitSnapshotViewer-CweA6VON.js} +2 -2
- package/src/ui/dist/assets/{ImageViewerPlugin-nBOmI2v_.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
- package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
- package/src/ui/dist/assets/{LatexPlugin-ZwtV8pIp.js → LatexPlugin-BQjAaA5J.js} +4 -4
- package/src/ui/dist/assets/{MarkdownViewerPlugin-DKqVfKyW.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
- package/src/ui/dist/assets/{MarketplacePlugin-BwxStZ9D.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
- package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
- package/src/ui/dist/assets/{NotebookEditor-DB9N_T9q.js → NotebookEditor-WFyd8Ybt.js} +3 -3
- package/src/ui/dist/assets/{PdfLoader-eWBONbQP.js → PdfLoader-CLE5u5TS.js} +3 -3
- package/src/ui/dist/assets/{PdfMarkdownPlugin-D22YOZL3.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
- package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
- package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
- package/src/ui/dist/assets/{TextViewerPlugin-C5xqeeUH.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
- package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
- package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
- package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
- package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
- package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
- package/src/ui/dist/assets/{code-WlFHE7z_.js → code-DbsmSd3Y.js} +1 -1
- package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
- package/src/ui/dist/assets/{wrap-text-BC-Hltpd.js → file-jump-queue-DeQBikaw.js} +3 -3
- package/src/ui/dist/assets/{file-socket-CfQPKQKj.js → file-socket-DA5XIx88.js} +1 -1
- package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
- package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
- package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
- package/src/ui/dist/assets/{index-CwNu1aH4.js → index-BsO46tJA.js} +1 -1
- package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
- package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
- package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
- package/src/ui/dist/assets/{project-sync-C9IdzdZW.js → project-sync-DPmWKmKD.js} +1 -1
- package/src/ui/dist/assets/{zoom-out-E_gaeAxL.js → zoom-out-DAukFWen.js} +3 -3
- package/src/ui/dist/index.html +3 -3
- package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
- package/src/skills/baseline/references/memory-playbook.md +0 -40
- package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
- package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
- package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
- package/src/skills/write/references/paper-section-playbook.md +0 -64
- package/src/skills/write/references/reviewer-first-writing.md +0 -64
- package/src/skills/write/references/revision-checklist.md +0 -70
- package/src/skills/write/references/section-contracts.md +0 -82
- package/src/skills/write/references/sentence-level-proofing.md +0 -49
- package/src/ui/dist/assets/AiManusChatView-Bv-Z8YpU.js +0 -204
- package/src/ui/dist/assets/CliPlugin-BCKcpc35.js +0 -109
- package/src/ui/dist/assets/CodeEditorPlugin-DbOfSJ8K.js +0 -2
- package/src/ui/dist/assets/GitCommitViewerPlugin-CIUqbUDO.js +0 -1
- package/src/ui/dist/assets/LabCopilotPanel-BHxOxF4z.js +0 -14
- package/src/ui/dist/assets/LabPlugin-BKoZGs95.js +0 -22
- package/src/ui/dist/assets/NotebookEditor-BEQhaQbt.js +0 -81
- package/src/ui/dist/assets/PdfViewerPlugin-c-RK9DLM.js +0 -17
- package/src/ui/dist/assets/SearchPlugin-CxF9ytAx.js +0 -16
- package/src/ui/dist/assets/VNCViewer-BoLGLnHz.js +0 -11
- package/src/ui/dist/assets/bot-DREQOxzP.js +0 -6
- package/src/ui/dist/assets/chevron-up-C9Qpx4DE.js +0 -6
- package/src/ui/dist/assets/file-content-BZMz3RYp.js +0 -1
- package/src/ui/dist/assets/file-diff-panel-CQhw0jS2.js +0 -1
- package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
- package/src/ui/dist/assets/git-commit-horizontal-DxZ8DCZh.js +0 -6
- package/src/ui/dist/assets/image-Bgl4VIyx.js +0 -6
- package/src/ui/dist/assets/index-BpV6lusQ.css +0 -33
- package/src/ui/dist/assets/index-CBNVuWcP.js +0 -2496
- package/src/ui/dist/assets/index-DrUnlf6K.js +0 -1
- package/src/ui/dist/assets/index-NW-h8VzN.js +0 -1
- package/src/ui/dist/assets/pdf-effect-queue-J8OnM0jE.js +0 -6
- package/src/ui/dist/assets/popover-CLc0pPP8.js +0 -1
- package/src/ui/dist/assets/select-Cs2PmzwL.js +0 -11
- package/src/ui/dist/assets/sigma-ClKcHAXm.js +0 -6
- package/src/ui/dist/assets/trash-DwpbFr3w.js +0 -11
- package/src/ui/dist/assets/useCliAccess-NQ8m0Let.js +0 -1
- package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
|
@@ -0,0 +1,181 @@
|
|
|
1
|
+
id: aisb.t3.072_fedgmt
|
|
2
|
+
name: 'One Arrow, Two Hawks: Sharpness-aware Minimization for Federated Learning via
|
|
3
|
+
Global Model Trajectory'
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: Two-stage federated learning benchmark combining trajectory-aware sharpness
|
|
6
|
+
control via EMA gradients and late-stage SWA stabilization for improved convergence
|
|
7
|
+
under non-IID data heterogeneity.
|
|
8
|
+
task_description: 'This packaged benchmark covers federated optimization with trajectory-aware
|
|
9
|
+
sharpness control and late-stage SWA stabilization. The task is to improve federated
|
|
10
|
+
generalization and convergence under non-IID data distributions while maintaining
|
|
11
|
+
client optimization stability. FedGMT combines an EMA-based trajectory tracking
|
|
12
|
+
mechanism with Stochastic Weight Averaging in the final rounds to smooth the loss
|
|
13
|
+
landscape. The implementation extends PFLlib and supports cross-device FL scenarios
|
|
14
|
+
with configurable numbers of heterogeneous clients, participation ratios, and data
|
|
15
|
+
partitioning strategies.
|
|
16
|
+
|
|
17
|
+
'
|
|
18
|
+
task_mode: experiment_driven
|
|
19
|
+
requires_execution: true
|
|
20
|
+
requires_paper: true
|
|
21
|
+
integrity_level: cas_plus_canary
|
|
22
|
+
snapshot_status: runnable
|
|
23
|
+
support_level: advanced
|
|
24
|
+
time_band: 6-24h
|
|
25
|
+
cost_band: medium
|
|
26
|
+
difficulty: medium
|
|
27
|
+
data_access: public
|
|
28
|
+
primary_outputs:
|
|
29
|
+
- test_accuracy
|
|
30
|
+
- federated_checkpoint
|
|
31
|
+
- round_metrics
|
|
32
|
+
launch_profiles:
|
|
33
|
+
- id: quick_eval
|
|
34
|
+
label: Quick Eval
|
|
35
|
+
description: Run one packaged federated-learning evaluation route on CIFAR-10 with
|
|
36
|
+
default hyperparameters and reduced rounds for smoke testing.
|
|
37
|
+
- id: full_federated_run
|
|
38
|
+
label: Full Federated Run
|
|
39
|
+
description: Run the full packaged FedGMT federated optimization workflow across
|
|
40
|
+
500 rounds with full evaluation suite.
|
|
41
|
+
dataset_download:
|
|
42
|
+
primary_method: bundled
|
|
43
|
+
sources:
|
|
44
|
+
- type: cifar10
|
|
45
|
+
partition: dirichlet
|
|
46
|
+
params:
|
|
47
|
+
concentration:
|
|
48
|
+
- 1.0
|
|
49
|
+
- 0.1
|
|
50
|
+
- 0.01
|
|
51
|
+
num_clients: 100
|
|
52
|
+
join_ratio: 0.1
|
|
53
|
+
- type: cifar100
|
|
54
|
+
partition: dirichlet
|
|
55
|
+
- type: cinic10
|
|
56
|
+
partition: dirichlet
|
|
57
|
+
notes:
|
|
58
|
+
- Dataset partitions generated via dataset/generate_dataset.py
|
|
59
|
+
- Dirichlet non-IID partitioning implemented in dataset/utils/
|
|
60
|
+
- 10% active clients per round across 100 total clients in standard config
|
|
61
|
+
credential_requirements:
|
|
62
|
+
mode: none
|
|
63
|
+
items: []
|
|
64
|
+
notes: []
|
|
65
|
+
resources:
|
|
66
|
+
minimum:
|
|
67
|
+
cpu_cores: 8
|
|
68
|
+
ram_gb: 32
|
|
69
|
+
disk_gb: 50
|
|
70
|
+
gpu_count: 1
|
|
71
|
+
gpu_vram_gb: 12
|
|
72
|
+
notes: CNN model; ~2.72s per round on RTX 4090; ~0.93GB VRAM per round
|
|
73
|
+
recommended:
|
|
74
|
+
cpu_cores: 16
|
|
75
|
+
ram_gb: 64
|
|
76
|
+
disk_gb: 100
|
|
77
|
+
gpu_count: 1
|
|
78
|
+
gpu_vram_gb: 24
|
|
79
|
+
notes: ResNet18 model; ~20s per round on RTX 4090; ~1.86GB VRAM per round
|
|
80
|
+
environment:
|
|
81
|
+
python: '3.7'
|
|
82
|
+
cuda: '11.8'
|
|
83
|
+
pytorch: null
|
|
84
|
+
flash_attn: null
|
|
85
|
+
key_packages:
|
|
86
|
+
- torch
|
|
87
|
+
- torchvision
|
|
88
|
+
- tqdm
|
|
89
|
+
- numpy
|
|
90
|
+
notes:
|
|
91
|
+
- Install via pip install -r requirements.txt
|
|
92
|
+
- Python 3.7 tested; see bundled requirements for full dependency set
|
|
93
|
+
risk_flags:
|
|
94
|
+
- extended_training_time
|
|
95
|
+
- multi_round_convergence
|
|
96
|
+
- non_iid_data_heterogeneity
|
|
97
|
+
risk_notes:
|
|
98
|
+
- Full benchmark requires 500 rounds; estimated 4.5h (CNN) to 33h (ResNet18) on single
|
|
99
|
+
GPU
|
|
100
|
+
- SWA stabilization begins at round 400; late-stage convergence may vary with data
|
|
101
|
+
heterogeneity
|
|
102
|
+
- Client drift under extreme non-IID conditions (Dir-0.01) requires careful hyperparameter
|
|
103
|
+
tuning
|
|
104
|
+
recommended_when: 'Use this benchmark when evaluating federated learning algorithms
|
|
105
|
+
under realistic data heterogeneity, studying round-level stability and client drift
|
|
106
|
+
tradeoffs, or benchmarking sharpness-aware minimization techniques in distributed
|
|
107
|
+
settings with privacy-preserving constraints.
|
|
108
|
+
|
|
109
|
+
'
|
|
110
|
+
not_recommended_when: 'Do not use this if you need single-node non-federated training,
|
|
111
|
+
require personalized per-client models, or need rapid prototyping without multi-round
|
|
112
|
+
communication overhead.
|
|
113
|
+
|
|
114
|
+
'
|
|
115
|
+
paper:
|
|
116
|
+
title: 'One Arrow, Two Hawks: Sharpness-aware Minimization for Federated Learning
|
|
117
|
+
via Global Model Trajectory'
|
|
118
|
+
venue: ICML 2025
|
|
119
|
+
year: 2025
|
|
120
|
+
url: https://proceedings.mlr.press/v267/li25bd.html
|
|
121
|
+
download:
|
|
122
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.072_fedgmt.zip
|
|
123
|
+
archive_type: zip
|
|
124
|
+
local_dir_name: paper-72-FedGMT
|
|
125
|
+
provider: github_release
|
|
126
|
+
repo: ResearAI/DeepScientist
|
|
127
|
+
tag: aisb-v0.0.1
|
|
128
|
+
asset_name: aisb.t3.072_fedgmt.zip
|
|
129
|
+
sha256: 469c3e18a45ac8e776a73ab672c969a944e795cf11e24c6385c37bc755a7fdcb
|
|
130
|
+
size_bytes: 84064
|
|
131
|
+
display:
|
|
132
|
+
palette_seed: teal-crimson-federated
|
|
133
|
+
art_style: distributed-dashboard
|
|
134
|
+
accent_priority: high
|
|
135
|
+
image_path: ../image/072_aisb.t3.072_fedgmt.jpg
|
|
136
|
+
capability_tags:
|
|
137
|
+
- research_code_optimization
|
|
138
|
+
- federated_learning
|
|
139
|
+
- sharpness_aware_minimization
|
|
140
|
+
- distributed_training
|
|
141
|
+
- image_classification
|
|
142
|
+
- non_iid_learning
|
|
143
|
+
- swa_stabilization
|
|
144
|
+
aisb_direction: T3
|
|
145
|
+
track_fit:
|
|
146
|
+
- paper_track
|
|
147
|
+
- benchmark_track
|
|
148
|
+
hyperparameters:
|
|
149
|
+
common:
|
|
150
|
+
optimizer: SGD
|
|
151
|
+
learning_rate: 0.01
|
|
152
|
+
momentum: 0.9
|
|
153
|
+
weight_decay: 1.0e-05
|
|
154
|
+
batch_size: 50
|
|
155
|
+
local_epochs: 5
|
|
156
|
+
total_rounds: 500
|
|
157
|
+
fedgmt_specific:
|
|
158
|
+
ema_coefficient_alpha:
|
|
159
|
+
- 0.95
|
|
160
|
+
- 0.995
|
|
161
|
+
- 0.998
|
|
162
|
+
sharpness_strength_gamma:
|
|
163
|
+
- 0.5
|
|
164
|
+
- 1.0
|
|
165
|
+
- 2.0
|
|
166
|
+
penalty_coefficient: 10
|
|
167
|
+
swa_start_round: 400
|
|
168
|
+
swa_window: 100
|
|
169
|
+
algorithm_family:
|
|
170
|
+
- FedAvg
|
|
171
|
+
- FedDyn
|
|
172
|
+
- FedSAM
|
|
173
|
+
- FedSpeed
|
|
174
|
+
- FedSMOO
|
|
175
|
+
- FedLESAM
|
|
176
|
+
- FedGMT
|
|
177
|
+
code_anchors:
|
|
178
|
+
main_entry: system/main.py
|
|
179
|
+
server_base: system/flcore/servers/serverbase.py
|
|
180
|
+
fedgmt_server: system/flcore/servers/servergmt.py
|
|
181
|
+
data_partition: dataset/generate_dataset.py
|
|
@@ -0,0 +1,158 @@
|
|
|
1
|
+
id: aisb.t3.072_fedgmt
|
|
2
|
+
name: '一箭双雕:基于全局模型轨迹的联邦学习锐度感知最小化'
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: 两阶段联邦学习基准,结合EMA梯度的轨迹感知锐度控制与后期SWA稳定化,在非独立同分布数据异质性条件下改善收敛性能。
|
|
5
|
+
task_description: |
|
|
6
|
+
本基准套件涵盖基于轨迹感知锐度控制和后期SWA稳定化的联邦优化任务。任务目标是在非独立同分布数据分布下提升联邦泛化能力和收敛性,同时保持客户端优化稳定性。FedGMT结合基于EMA的轨迹跟踪机制与最终轮次的随机权重平均,以平滑损失曲面。实现基于PFLlib扩展,支持跨设备联邦学习场景,可配置异质性客户端数量、参与比例和数据分区策略。
|
|
7
|
+
task_mode: experiment_driven
|
|
8
|
+
requires_execution: true
|
|
9
|
+
requires_paper: true
|
|
10
|
+
integrity_level: cas_plus_canary
|
|
11
|
+
snapshot_status: runnable
|
|
12
|
+
support_level: advanced
|
|
13
|
+
time_band: 6-24h
|
|
14
|
+
cost_band: medium
|
|
15
|
+
difficulty: medium
|
|
16
|
+
data_access: public
|
|
17
|
+
primary_outputs:
|
|
18
|
+
- test_accuracy
|
|
19
|
+
- federated_checkpoint
|
|
20
|
+
- round_metrics
|
|
21
|
+
launch_profiles:
|
|
22
|
+
- id: quick_eval
|
|
23
|
+
label: 快速评估
|
|
24
|
+
description: 使用默认超参数和减少轮次在CIFAR-10上运行一条封装的联邦学习评估路径,用于冒烟测试。
|
|
25
|
+
- id: full_federated_run
|
|
26
|
+
label: 完整联邦运行
|
|
27
|
+
description: 跨500轮运行完整的封装FedGMT联邦优化工作流,包含完整评估套件。
|
|
28
|
+
dataset_download:
|
|
29
|
+
primary_method: bundled
|
|
30
|
+
sources:
|
|
31
|
+
- type: cifar10
|
|
32
|
+
partition: dirichlet
|
|
33
|
+
params:
|
|
34
|
+
concentration:
|
|
35
|
+
- 1.0
|
|
36
|
+
- 0.1
|
|
37
|
+
- 0.01
|
|
38
|
+
num_clients: 100
|
|
39
|
+
join_ratio: 0.1
|
|
40
|
+
- type: cifar100
|
|
41
|
+
partition: dirichlet
|
|
42
|
+
- type: cinic10
|
|
43
|
+
partition: dirichlet
|
|
44
|
+
notes:
|
|
45
|
+
- 数据集分区通过 dataset/generate_dataset.py 生成
|
|
46
|
+
- Dirichlet非独立同分布分区实现于 dataset/utils/
|
|
47
|
+
- 标准配置中每轮10%的活跃客户端,共100个客户端
|
|
48
|
+
credential_requirements:
|
|
49
|
+
mode: none
|
|
50
|
+
items: []
|
|
51
|
+
notes: []
|
|
52
|
+
resources:
|
|
53
|
+
minimum:
|
|
54
|
+
cpu_cores: 8
|
|
55
|
+
ram_gb: 32
|
|
56
|
+
disk_gb: 50
|
|
57
|
+
gpu_count: 1
|
|
58
|
+
gpu_vram_gb: 12
|
|
59
|
+
notes: CNN模型;在RTX 4090上每轮约2.72秒;每轮约0.93GB显存
|
|
60
|
+
recommended:
|
|
61
|
+
cpu_cores: 16
|
|
62
|
+
ram_gb: 64
|
|
63
|
+
disk_gb: 100
|
|
64
|
+
gpu_count: 1
|
|
65
|
+
gpu_vram_gb: 24
|
|
66
|
+
notes: ResNet18模型;在RTX 4090上每轮约20秒;每轮约1.86GB显存
|
|
67
|
+
environment:
|
|
68
|
+
python: '3.7'
|
|
69
|
+
cuda: '11.8'
|
|
70
|
+
pytorch: null
|
|
71
|
+
flash_attn: null
|
|
72
|
+
key_packages:
|
|
73
|
+
- torch
|
|
74
|
+
- torchvision
|
|
75
|
+
- tqdm
|
|
76
|
+
- numpy
|
|
77
|
+
notes:
|
|
78
|
+
- 通过 pip install -r requirements.txt 安装
|
|
79
|
+
- 已测试Python 3.7;完整依赖集见捆绑的requirements文件
|
|
80
|
+
risk_flags:
|
|
81
|
+
- extended_training_time
|
|
82
|
+
- multi_round_convergence
|
|
83
|
+
- non_iid_data_heterogeneity
|
|
84
|
+
risk_notes:
|
|
85
|
+
- 完整基准需要500轮;在单GPU上估计耗时CNN约4.5小时,ResNet18约33小时
|
|
86
|
+
- SWA稳定化从第400轮开始;后期收敛可能因数据异质性而有所差异
|
|
87
|
+
- 在极端非独立同分布条件下(Dir-0.01)的客户端漂移需要仔细调整超参数
|
|
88
|
+
recommended_when: |
|
|
89
|
+
在评估真实数据异质性下的联邦学习算法、研究轮级稳定性和客户端漂移权衡,或在具有隐私保护约束的分布式设置中对锐度感知最小化技术进行基准测试时使用本基准。
|
|
90
|
+
not_recommended_when: |
|
|
91
|
+
如需单节点非联邦训练、需要个性化每客户端模型,或需要在多轮通信开销下进行快速原型开发时,不建议使用本基准。
|
|
92
|
+
paper:
|
|
93
|
+
title: 'One Arrow, Two Hawks: Sharpness-aware Minimization for Federated Learning
|
|
94
|
+
via Global Model Trajectory'
|
|
95
|
+
venue: ICML 2025
|
|
96
|
+
year: 2025
|
|
97
|
+
url: https://proceedings.mlr.press/v267/li25bd.html
|
|
98
|
+
download:
|
|
99
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.072_fedgmt.zip
|
|
100
|
+
archive_type: zip
|
|
101
|
+
local_dir_name: paper-72-FedGMT
|
|
102
|
+
provider: github_release
|
|
103
|
+
repo: ResearAI/DeepScientist
|
|
104
|
+
tag: aisb-v0.0.1
|
|
105
|
+
asset_name: aisb.t3.072_fedgmt.zip
|
|
106
|
+
sha256: 469c3e18a45ac8e776a73ab672c969a944e795cf11e24c6385c37bc755a7fdcb
|
|
107
|
+
size_bytes: 84064
|
|
108
|
+
display:
|
|
109
|
+
palette_seed: teal-crimson-federated
|
|
110
|
+
art_style: distributed-dashboard
|
|
111
|
+
accent_priority: high
|
|
112
|
+
image_path: ../image/072_aisb.t3.072_fedgmt.jpg
|
|
113
|
+
capability_tags:
|
|
114
|
+
- research_code_optimization
|
|
115
|
+
- federated_learning
|
|
116
|
+
- sharpness_aware_minimization
|
|
117
|
+
- distributed_training
|
|
118
|
+
- image_classification
|
|
119
|
+
- non_iid_learning
|
|
120
|
+
- swa_stabilization
|
|
121
|
+
aisb_direction: T3
|
|
122
|
+
track_fit:
|
|
123
|
+
- paper_track
|
|
124
|
+
- benchmark_track
|
|
125
|
+
hyperparameters:
|
|
126
|
+
common:
|
|
127
|
+
optimizer: SGD
|
|
128
|
+
learning_rate: 0.01
|
|
129
|
+
momentum: 0.9
|
|
130
|
+
weight_decay: 1.0e-05
|
|
131
|
+
batch_size: 50
|
|
132
|
+
local_epochs: 5
|
|
133
|
+
total_rounds: 500
|
|
134
|
+
fedgmt_specific:
|
|
135
|
+
ema_coefficient_alpha:
|
|
136
|
+
- 0.95
|
|
137
|
+
- 0.995
|
|
138
|
+
- 0.998
|
|
139
|
+
sharpness_strength_gamma:
|
|
140
|
+
- 0.5
|
|
141
|
+
- 1.0
|
|
142
|
+
- 2.0
|
|
143
|
+
penalty_coefficient: 10
|
|
144
|
+
swa_start_round: 400
|
|
145
|
+
swa_window: 100
|
|
146
|
+
algorithm_family:
|
|
147
|
+
- FedAvg
|
|
148
|
+
- FedDyn
|
|
149
|
+
- FedSAM
|
|
150
|
+
- FedSpeed
|
|
151
|
+
- FedSMOO
|
|
152
|
+
- FedLESAM
|
|
153
|
+
- FedGMT
|
|
154
|
+
code_anchors:
|
|
155
|
+
main_entry: system/main.py
|
|
156
|
+
server_base: system/flcore/servers/serverbase.py
|
|
157
|
+
fedgmt_server: system/flcore/servers/servergmt.py
|
|
158
|
+
data_partition: dataset/generate_dataset.py
|
|
@@ -0,0 +1,161 @@
|
|
|
1
|
+
id: aisb.t3.073_rld
|
|
2
|
+
name: Regularized Langevin Dynamics for Combinatorial Optimization
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: Solve combinatorial optimization problems via regularized Langevin dynamics with
|
|
5
|
+
Hamming-distance regularization for simulated annealing and neural solvers.
|
|
6
|
+
task_description: 'This packaged benchmark covers combinatorial optimization via Regularized
|
|
7
|
+
Langevin Dynamics (RLD), which enforces an expected Hamming distance between sampled
|
|
8
|
+
and current solutions to escape local optima in discrete domains. The benchmark
|
|
9
|
+
includes two solvers: RLSA (Regularized Langevin Simulated Annealing) based on gradient-guided
|
|
10
|
+
MCMC sampling, and RLNN (Regularized Langevin Neural Network) supporting both differentiable
|
|
11
|
+
(erdoes) and fully black-box (reinforce) training losses. Problems include Maximum
|
|
12
|
+
Independent Set (MIS), Maximum Clique (MCL), and Maximum Cut (MCut) on Erdős–Rényi,
|
|
13
|
+
Revised Model B, and Barabási–Albert random graphs. RLSA achieves comparable or
|
|
14
|
+
superior performance to SOTA SA baselines at 20% of their runtime. RLNN trains efficiently
|
|
15
|
+
via local objectives without requiring labeled data or long-horizon return estimation.
|
|
16
|
+
|
|
17
|
+
'
|
|
18
|
+
task_mode: experiment_driven
|
|
19
|
+
requires_execution: true
|
|
20
|
+
requires_paper: true
|
|
21
|
+
integrity_level: cas_plus_canary
|
|
22
|
+
snapshot_status: runnable
|
|
23
|
+
support_level: advanced
|
|
24
|
+
time_band: 6-24h
|
|
25
|
+
cost_band: medium
|
|
26
|
+
difficulty: hard
|
|
27
|
+
data_access: public
|
|
28
|
+
primary_outputs:
|
|
29
|
+
- rlsa_size
|
|
30
|
+
- rlsa_time
|
|
31
|
+
- optimization_trace
|
|
32
|
+
launch_profiles:
|
|
33
|
+
- id: quick_eval
|
|
34
|
+
label: Quick Eval
|
|
35
|
+
description: 'Run one packaged RLSA evaluation script on a supported combinatorial
|
|
36
|
+
problem. Uses accelerate with configurable precision (fp16/no). Set num_processes=1
|
|
37
|
+
for accurate timing. Tests on small graph instances (RB-[200-300], ER-[700-800],
|
|
38
|
+
BA-[200-300]) with 500-1000 test samples.
|
|
39
|
+
|
|
40
|
+
'
|
|
41
|
+
- id: full_train_eval
|
|
42
|
+
label: Full Train + Eval
|
|
43
|
+
description: 'Run the full packaged regularized Langevin dynamics and neural baseline
|
|
44
|
+
workflow. Includes RLNN training with erdoes loss (differentiable) or reinforce
|
|
45
|
+
loss (black-box), followed by evaluation across small and large graph problem
|
|
46
|
+
instances.
|
|
47
|
+
|
|
48
|
+
'
|
|
49
|
+
dataset_download:
|
|
50
|
+
primary_method: mixed
|
|
51
|
+
sources:
|
|
52
|
+
- type: huggingface
|
|
53
|
+
url: https://huggingface.co/datasets/shengyuf/RLD4CO
|
|
54
|
+
description: Pre-generated test graphs including ER-[9000-11000] for scale evaluation
|
|
55
|
+
- type: generator
|
|
56
|
+
description: Random graph generators included in data/ folder (er_generator.py,
|
|
57
|
+
rb_generator.py, ba_generator.py)
|
|
58
|
+
notes:
|
|
59
|
+
- ER test graphs are from DIMES repository
|
|
60
|
+
- RB and BA graphs generated using DIffUCO code
|
|
61
|
+
- ER-[9000-11000] has no training data; evaluate solvers trained on ER-[700-800]
|
|
62
|
+
directly
|
|
63
|
+
- 1000 instances per problem (two test sets of 500 instances each)
|
|
64
|
+
credential_requirements:
|
|
65
|
+
mode: none
|
|
66
|
+
items: []
|
|
67
|
+
notes: []
|
|
68
|
+
resources:
|
|
69
|
+
minimum:
|
|
70
|
+
cpu_cores: 8
|
|
71
|
+
ram_gb: 32
|
|
72
|
+
disk_gb: 80
|
|
73
|
+
gpu_count: 1
|
|
74
|
+
gpu_vram_gb: 16
|
|
75
|
+
recommended:
|
|
76
|
+
cpu_cores: 16
|
|
77
|
+
ram_gb: 64
|
|
78
|
+
disk_gb: 150
|
|
79
|
+
gpu_count: 1
|
|
80
|
+
gpu_vram_gb: 24
|
|
81
|
+
environment:
|
|
82
|
+
python: '3.8'
|
|
83
|
+
cuda: '12.4'
|
|
84
|
+
pytorch: 2.4.1
|
|
85
|
+
flash_attn: null
|
|
86
|
+
key_packages:
|
|
87
|
+
- accelerate
|
|
88
|
+
- torch
|
|
89
|
+
- torch_geometric
|
|
90
|
+
- torch_scatter
|
|
91
|
+
- scipy
|
|
92
|
+
- numpy
|
|
93
|
+
- tqdm
|
|
94
|
+
notes:
|
|
95
|
+
- 'Install dependencies via conda environment.yml: conda env create -f environment.yml
|
|
96
|
+
&& conda activate RLD4CO'
|
|
97
|
+
- Framework built on accelerate for distributed evaluation
|
|
98
|
+
- Use --mixed_precision fp16 for faster inference
|
|
99
|
+
risk_flags:
|
|
100
|
+
- gpu_memory_bound
|
|
101
|
+
- disk_io_bound
|
|
102
|
+
- reproducibility_requires_seed
|
|
103
|
+
risk_notes:
|
|
104
|
+
- RLSA timing requires num_processes=1; multi-GPU parallelization affects wall-clock
|
|
105
|
+
measurements
|
|
106
|
+
- Large graph evaluation (ER-[9000-11000]) requires significant GPU memory; use mixed
|
|
107
|
+
precision
|
|
108
|
+
- RLNN training with reinforce loss is computationally intensive due to full black-box
|
|
109
|
+
gradient estimation
|
|
110
|
+
- Random graph generation with multiprocessing (num_processes parameter) affects reproducibility
|
|
111
|
+
recommended_when: 'Use this benchmark when you want a stochastic combinatorial-optimization
|
|
112
|
+
task with controllable sampling and neural baselines, need to evaluate simulated
|
|
113
|
+
annealing variants on random graphs, require unsupervised or black-box optimization
|
|
114
|
+
capability, or want to benchmark against ICML 2025 SOTA SA and NN-based CO solvers.
|
|
115
|
+
|
|
116
|
+
'
|
|
117
|
+
not_recommended_when: 'Do not use this if you need a pure supervised-learning benchmark,
|
|
118
|
+
require exact/optimal solutions as ground truth, work with structured real-world
|
|
119
|
+
graph datasets rather than random generators, or need a deterministic reproducible
|
|
120
|
+
baseline without seed control.
|
|
121
|
+
|
|
122
|
+
'
|
|
123
|
+
paper:
|
|
124
|
+
title: Regularized Langevin Dynamics for Combinatorial Optimization
|
|
125
|
+
venue: ICML 2025
|
|
126
|
+
year: 2025
|
|
127
|
+
url: https://arxiv.org/abs/2502.00277
|
|
128
|
+
authors:
|
|
129
|
+
- Shengyu Feng
|
|
130
|
+
- Yiming Yang
|
|
131
|
+
affiliation: Carnegie Mellon University
|
|
132
|
+
contact: shengyuf@cs.cmu.edu
|
|
133
|
+
download:
|
|
134
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.073_rld.zip
|
|
135
|
+
archive_type: zip
|
|
136
|
+
local_dir_name: paper-73-RLD
|
|
137
|
+
provider: github_release
|
|
138
|
+
repo: ResearAI/DeepScientist
|
|
139
|
+
tag: aisb-v0.0.1
|
|
140
|
+
asset_name: aisb.t3.073_rld.zip
|
|
141
|
+
sha256: 0cbaa2a2ca423ac065c17e38dc60fed2d00bf4a92a39cd1eab7c0a6decb7a2b9
|
|
142
|
+
size_bytes: 53784
|
|
143
|
+
display:
|
|
144
|
+
palette_seed: brass-midnight-langevin
|
|
145
|
+
art_style: optimization-physics
|
|
146
|
+
accent_priority: high
|
|
147
|
+
image_path: ../image/073_aisb.t3.073_rld.jpg
|
|
148
|
+
capability_tags:
|
|
149
|
+
- research_code_optimization
|
|
150
|
+
- combinatorial_optimization
|
|
151
|
+
- langevin_dynamics
|
|
152
|
+
- graph_optimization
|
|
153
|
+
- sampling
|
|
154
|
+
- simulated_annealing
|
|
155
|
+
- neural_heuristics
|
|
156
|
+
- unsupervised_learning
|
|
157
|
+
- black_box_optimization
|
|
158
|
+
aisb_direction: T3
|
|
159
|
+
track_fit:
|
|
160
|
+
- paper_track
|
|
161
|
+
- benchmark_track
|
|
@@ -0,0 +1,129 @@
|
|
|
1
|
+
id: aisb.t3.073_rld
|
|
2
|
+
name: 组合优化的正则化朗之万动力学
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: 通过Hamming距离正则化的正则化朗之万动力学优化组合问题,用于模拟退火和神经求解器。
|
|
5
|
+
task_description: >-
|
|
6
|
+
本基准测试包涵盖基于正则化朗之万动力学(RLD)的组合优化问题。RLD通过在采样解和当前解之间施加期望Hamming距离约束来逃离离散域中的局部最优。该基准测试包含两个求解器:基于梯度引导MCMC采样的RLSA(正则化朗之万模拟退火),以及支持可微分损失(erdoes)和完全黑盒损失(reinforce)的RLNN(正则化朗之万神经网络)。问题涵盖Erdős–Rényi、修订模型B和Barabási–Albert随机图上的最大独立集(MIS)、最大团(MCL)和最大割(MCut)。RLSA在仅需SOTA SA基线20%运行时间的情况下达到相当或更优的性能。RLNN通过局部目标高效训练,无需标注数据或长时域回报估计。
|
|
7
|
+
task_mode: experiment_driven
|
|
8
|
+
requires_execution: true
|
|
9
|
+
requires_paper: true
|
|
10
|
+
integrity_level: cas_plus_canary
|
|
11
|
+
snapshot_status: runnable
|
|
12
|
+
support_level: advanced
|
|
13
|
+
time_band: 6-24h
|
|
14
|
+
cost_band: medium
|
|
15
|
+
difficulty: hard
|
|
16
|
+
data_access: public
|
|
17
|
+
primary_outputs:
|
|
18
|
+
- rlsa_size
|
|
19
|
+
- rlsa_time
|
|
20
|
+
- optimization_trace
|
|
21
|
+
launch_profiles:
|
|
22
|
+
- id: quick_eval
|
|
23
|
+
label: 快速评估
|
|
24
|
+
description: >-
|
|
25
|
+
在支持的组合问题上运行一个封装的RLSA评估脚本。使用accelerate,支持可配置精度(fp16/no)。设置num_processes=1以获得精确计时。在小型图实例(RB-[200-300]、ER-[700-800]、BA-[200-300])上测试,包含500-1000个测试样本。
|
|
26
|
+
- id: full_train_eval
|
|
27
|
+
label: 完整训练+评估
|
|
28
|
+
description: >-
|
|
29
|
+
运行完整的封装正则化朗之万动力学和神经基线工作流程。包括使用erdoes损失(可微分)或reinforce损失(黑盒)训练RLNN,然后在小型和大型图问题实例上进行评估。
|
|
30
|
+
dataset_download:
|
|
31
|
+
primary_method: mixed
|
|
32
|
+
sources:
|
|
33
|
+
- type: huggingface
|
|
34
|
+
url: https://huggingface.co/datasets/shengyuf/RLD4CO
|
|
35
|
+
description: 预生成的测试图,包括ER-[9000-11000]用于规模化评估
|
|
36
|
+
- type: generator
|
|
37
|
+
description: data/文件夹中包含的随机图生成器(er_generator.py、rb_generator.py、ba_generator.py)
|
|
38
|
+
notes:
|
|
39
|
+
- ER测试图来自DIMES仓库
|
|
40
|
+
- RB和BA图使用DIffUCO代码生成
|
|
41
|
+
- ER-[9000-11000]无训练数据;直接使用在ER-[700-800]上训练的求解器进行评估
|
|
42
|
+
- 每个问题1000个实例(2组测试集,每组500个实例)
|
|
43
|
+
credential_requirements:
|
|
44
|
+
mode: none
|
|
45
|
+
items: []
|
|
46
|
+
notes: []
|
|
47
|
+
resources:
|
|
48
|
+
minimum:
|
|
49
|
+
cpu_cores: 8
|
|
50
|
+
ram_gb: 32
|
|
51
|
+
disk_gb: 80
|
|
52
|
+
gpu_count: 1
|
|
53
|
+
gpu_vram_gb: 16
|
|
54
|
+
recommended:
|
|
55
|
+
cpu_cores: 16
|
|
56
|
+
ram_gb: 64
|
|
57
|
+
disk_gb: 150
|
|
58
|
+
gpu_count: 1
|
|
59
|
+
gpu_vram_gb: 24
|
|
60
|
+
environment:
|
|
61
|
+
python: '3.8'
|
|
62
|
+
cuda: '12.4'
|
|
63
|
+
pytorch: 2.4.1
|
|
64
|
+
flash_attn: null
|
|
65
|
+
key_packages:
|
|
66
|
+
- accelerate
|
|
67
|
+
- torch
|
|
68
|
+
- torch_geometric
|
|
69
|
+
- torch_scatter
|
|
70
|
+
- scipy
|
|
71
|
+
- numpy
|
|
72
|
+
- tqdm
|
|
73
|
+
notes:
|
|
74
|
+
- 通过conda environment.yml安装依赖:conda env create -f environment.yml && conda activate
|
|
75
|
+
RLD4CO
|
|
76
|
+
- 基于accelerate构建的分布式评估框架
|
|
77
|
+
- 使用--mixed_precision fp16加速推理
|
|
78
|
+
risk_flags:
|
|
79
|
+
- gpu_memory_bound
|
|
80
|
+
- disk_io_bound
|
|
81
|
+
- reproducibility_requires_seed
|
|
82
|
+
risk_notes:
|
|
83
|
+
- RLSA计时需要num_processes=1;多GPU并行化会影响实际运行时间测量
|
|
84
|
+
- 大型图评估(ER-[9000-11000])需要大量GPU内存;使用混合精度
|
|
85
|
+
- 使用reinforce损失的RLNN训练由于完全黑盒梯度估计而计算密集
|
|
86
|
+
- 使用多进程(num_processes参数)进行随机图生成会影响可重复性
|
|
87
|
+
recommended_when: >-
|
|
88
|
+
当您需要一个具有可控采样和神经基线的随机组合优化任务时使用本基准测试;需要评估随机图上的模拟退火变体时;需要无监督或黑盒优化能力时;或者想要与ICML 2025 SOTA SA和基于NN的CO求解器进行基准对比时。
|
|
89
|
+
not_recommended_when: >-
|
|
90
|
+
如果您需要一个纯监督学习基准测试时不要使用;需要精确/最优解作为真值时不要使用;处理结构化真实世界图数据集而非随机生成器时不要使用;或者需要一个没有种子控制的确定性可重复基线时不要使用。
|
|
91
|
+
paper:
|
|
92
|
+
title: Regularized Langevin Dynamics for Combinatorial Optimization
|
|
93
|
+
venue: ICML 2025
|
|
94
|
+
year: 2025
|
|
95
|
+
url: https://arxiv.org/abs/2502.00277
|
|
96
|
+
authors:
|
|
97
|
+
- Shengyu Feng
|
|
98
|
+
- Yiming Yang
|
|
99
|
+
affiliation: Carnegie Mellon University
|
|
100
|
+
contact: shengyuf@cs.cmu.edu
|
|
101
|
+
download:
|
|
102
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.073_rld.zip
|
|
103
|
+
archive_type: zip
|
|
104
|
+
local_dir_name: paper-73-RLD
|
|
105
|
+
provider: github_release
|
|
106
|
+
repo: ResearAI/DeepScientist
|
|
107
|
+
tag: aisb-v0.0.1
|
|
108
|
+
asset_name: aisb.t3.073_rld.zip
|
|
109
|
+
sha256: 0cbaa2a2ca423ac065c17e38dc60fed2d00bf4a92a39cd1eab7c0a6decb7a2b9
|
|
110
|
+
size_bytes: 53784
|
|
111
|
+
display:
|
|
112
|
+
palette_seed: brass-midnight-langevin
|
|
113
|
+
art_style: optimization-physics
|
|
114
|
+
accent_priority: high
|
|
115
|
+
image_path: ../image/073_aisb.t3.073_rld.jpg
|
|
116
|
+
capability_tags:
|
|
117
|
+
- research_code_optimization
|
|
118
|
+
- combinatorial_optimization
|
|
119
|
+
- langevin_dynamics
|
|
120
|
+
- graph_optimization
|
|
121
|
+
- sampling
|
|
122
|
+
- simulated_annealing
|
|
123
|
+
- neural_heuristics
|
|
124
|
+
- unsupervised_learning
|
|
125
|
+
- black_box_optimization
|
|
126
|
+
aisb_direction: T3
|
|
127
|
+
track_fit:
|
|
128
|
+
- paper_track
|
|
129
|
+
- benchmark_track
|