@researai/deepscientist 1.5.17 → 1.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +309 -130
- package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
- package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
- package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
- package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
- package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
- package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
- package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
- package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
- package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
- package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
- package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
- package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
- package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
- package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
- package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
- package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
- package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
- package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
- package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
- package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
- package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
- package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
- package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
- package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
- package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
- package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
- package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
- package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
- package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
- package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
- package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
- package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
- package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
- package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
- package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
- package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
- package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
- package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
- package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
- package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
- package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
- package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
- package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
- package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
- package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
- package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
- package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
- package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
- package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
- package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
- package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
- package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
- package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
- package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
- package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
- package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
- package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
- package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
- package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
- package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
- package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
- package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
- package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
- package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
- package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
- package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
- package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
- package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
- package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
- package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
- package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
- package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
- package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
- package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
- package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
- package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
- package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
- package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
- package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
- package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
- package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
- package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
- package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
- package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
- package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
- package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
- package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
- package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
- package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
- package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
- package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
- package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
- package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
- package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
- package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
- package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
- package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
- package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
- package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
- package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
- package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
- package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
- package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
- package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
- package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
- package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
- package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
- package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
- package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
- package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
- package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
- package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
- package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
- package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
- package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
- package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
- package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
- package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
- package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
- package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
- package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
- package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
- package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
- package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
- package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
- package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
- package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
- package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
- package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
- package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
- package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
- package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
- package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
- package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
- package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
- package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
- package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
- package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
- package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
- package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
- package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
- package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
- package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
- package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
- package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
- package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
- package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
- package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
- package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
- package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
- package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
- package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
- package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
- package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
- package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
- package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
- package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
- package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
- package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
- package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
- package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
- package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
- package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
- package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
- package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
- package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
- package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
- package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
- package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
- package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
- package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
- package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
- package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
- package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
- package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
- package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
- package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
- package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
- package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
- package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
- package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
- package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
- package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
- package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
- package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
- package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
- package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
- package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
- package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
- package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
- package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
- package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
- package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
- package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
- package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
- package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
- package/AISB/image/aisb.b10.climate_earth.svg +16 -0
- package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
- package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
- package/AISB/image/aisb.b2.agent_systems.svg +16 -0
- package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
- package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
- package/AISB/image/aisb.b5.math_proof.svg +16 -0
- package/AISB/image/aisb.b6.research_process.svg +16 -0
- package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
- package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
- package/AISB/image/aisb.b9.material_science.svg +16 -0
- package/README.md +132 -11
- package/bin/ds.js +376 -49
- package/docs/en/00_QUICK_START.md +135 -18
- package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
- package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
- package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
- package/docs/en/05_TUI_GUIDE.md +171 -2
- package/docs/en/07_MEMORY_AND_MCP.md +38 -2
- package/docs/en/09_DOCTOR.md +64 -4
- package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
- package/docs/en/11_LICENSE_AND_RISK.md +4 -0
- package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/en/15_CODEX_PROVIDER_SETUP.md +622 -187
- package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
- package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
- package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
- package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
- package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
- package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
- package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
- package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
- package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
- package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
- package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
- package/docs/en/91_DEVELOPMENT.md +29 -0
- package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
- package/docs/en/README.md +44 -7
- package/docs/images/admin/admin-connectors-health-en.png +0 -0
- package/docs/images/admin/admin-controllers-en.png +0 -0
- package/docs/images/admin/admin-diagnostics-en.png +0 -0
- package/docs/images/admin/admin-errors-en.png +0 -0
- package/docs/images/admin/admin-issues-en.png +0 -0
- package/docs/images/admin/admin-logs-en.png +0 -0
- package/docs/images/admin/admin-quest-detail-en.png +0 -0
- package/docs/images/admin/admin-quests-en.png +0 -0
- package/docs/images/admin/admin-repairs-en.png +0 -0
- package/docs/images/admin/admin-runtime-en.png +0 -0
- package/docs/images/admin/admin-search-en.png +0 -0
- package/docs/images/admin/admin-stats-en.png +0 -0
- package/docs/images/admin/admin-summary-en.png +0 -0
- package/docs/images/connectors/connector-discord-en.png +0 -0
- package/docs/images/connectors/connector-feishu-en.png +0 -0
- package/docs/images/connectors/connector-lingzhu-en.png +0 -0
- package/docs/images/connectors/connector-qq-en.png +0 -0
- package/docs/images/connectors/connector-slack-en.png +0 -0
- package/docs/images/connectors/connector-telegram-en.png +0 -0
- package/docs/images/connectors/connector-weixin-en.png +0 -0
- package/docs/images/connectors/connector-whatsapp-en.png +0 -0
- package/docs/images/settings/settings-baselines-en.png +0 -0
- package/docs/images/settings/settings-config-en.png +0 -0
- package/docs/images/settings/settings-connectors-overview-en.png +0 -0
- package/docs/images/settings/settings-deepxiv-en.png +0 -0
- package/docs/images/settings/settings-mcp-servers-en.png +0 -0
- package/docs/images/settings/settings-plugins-en.png +0 -0
- package/docs/images/settings/settings-runners-en.png +0 -0
- package/docs/zh/00_QUICK_START.md +92 -17
- package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
- package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/zh/05_TUI_GUIDE.md +171 -2
- package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
- package/docs/zh/09_DOCTOR.md +39 -4
- package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
- package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
- package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/zh/15_CODEX_PROVIDER_SETUP.md +550 -188
- package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
- package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
- package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
- package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
- package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
- package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
- package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
- package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
- package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
- package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
- package/docs/zh/README.md +29 -7
- package/install.sh +122 -16
- package/package.json +4 -1
- package/pyproject.toml +2 -1
- package/src/deepscientist/__init__.py +1 -1
- package/src/deepscientist/acp/envelope.py +13 -0
- package/src/deepscientist/admin/__init__.py +3 -0
- package/src/deepscientist/admin/charts.py +681 -0
- package/src/deepscientist/admin/logs.py +119 -0
- package/src/deepscientist/admin/repairs.py +217 -0
- package/src/deepscientist/admin/service.py +1310 -0
- package/src/deepscientist/admin/system_info.py +700 -0
- package/src/deepscientist/admin/tasks.py +465 -0
- package/src/deepscientist/admin/tool_metrics.py +600 -0
- package/src/deepscientist/artifact/guidance.py +8 -4
- package/src/deepscientist/artifact/schemas.py +115 -0
- package/src/deepscientist/artifact/service.py +4268 -260
- package/src/deepscientist/bash_exec/monitor.py +30 -3
- package/src/deepscientist/bash_exec/service.py +134 -1
- package/src/deepscientist/benchstore/__init__.py +4 -0
- package/src/deepscientist/benchstore/prompt_builder.py +224 -0
- package/src/deepscientist/benchstore/service.py +1716 -0
- package/src/deepscientist/channels/weixin_ilink.py +8 -1
- package/src/deepscientist/cli.py +92 -17
- package/src/deepscientist/codex_cli_compat.py +2 -2
- package/src/deepscientist/config/models.py +82 -11
- package/src/deepscientist/config/service.py +927 -91
- package/src/deepscientist/connector/weixin_support.py +48 -17
- package/src/deepscientist/daemon/api/handlers.py +697 -210
- package/src/deepscientist/daemon/api/router.py +76 -1
- package/src/deepscientist/daemon/app.py +1054 -51
- package/src/deepscientist/diagnostics/runner_failures.py +147 -0
- package/src/deepscientist/doctor.py +212 -65
- package/src/deepscientist/evidence_packets.py +590 -0
- package/src/deepscientist/home.py +52 -4
- package/src/deepscientist/kimi_cli_compat.py +50 -0
- package/src/deepscientist/latex_runtime.py +2 -2
- package/src/deepscientist/mcp/context.py +2 -0
- package/src/deepscientist/mcp/schemas.py +114 -0
- package/src/deepscientist/mcp/server.py +1566 -126
- package/src/deepscientist/memory/service.py +203 -16
- package/src/deepscientist/process_control.py +8 -1
- package/src/deepscientist/prompts/builder.py +836 -92
- package/src/deepscientist/quest/__init__.py +2 -2
- package/src/deepscientist/quest/layout.py +12 -1
- package/src/deepscientist/quest/node_traces.py +10 -0
- package/src/deepscientist/quest/service.py +1430 -139
- package/src/deepscientist/quest/stage_views.py +1 -1
- package/src/deepscientist/runners/__init__.py +18 -0
- package/src/deepscientist/runners/base.py +89 -1
- package/src/deepscientist/runners/builtins.py +13 -1
- package/src/deepscientist/runners/claude.py +391 -0
- package/src/deepscientist/runners/codex.py +421 -21
- package/src/deepscientist/runners/codex_telemetry.py +127 -0
- package/src/deepscientist/runners/kimi.py +334 -0
- package/src/deepscientist/runners/metadata.py +68 -0
- package/src/deepscientist/runners/opencode.py +414 -0
- package/src/deepscientist/runners/runtime_overrides.py +100 -0
- package/src/deepscientist/runners/simple_cli.py +538 -0
- package/src/deepscientist/runtime_storage.py +303 -0
- package/src/deepscientist/shared.py +61 -16
- package/src/deepscientist/skills/installer.py +37 -0
- package/src/deepscientist/skills/registry.py +2 -0
- package/src/deepscientist/tinytex.py +2 -2
- package/src/deepscientist/tui.py +10 -3
- package/src/prompts/benchstore/system.md +77 -0
- package/src/prompts/connectors/qq.md +33 -2
- package/src/prompts/connectors/weixin.md +208 -23
- package/src/prompts/contracts/admin_ops.md +74 -0
- package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
- package/src/prompts/contracts/shared_interaction.md +5 -11
- package/src/prompts/start_setup/system.md +422 -0
- package/src/prompts/system.md +409 -315
- package/src/prompts/system_copilot.md +88 -12
- package/src/skills/analysis-campaign/SKILL.md +239 -578
- package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
- package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
- package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
- package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
- package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
- package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
- package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
- package/src/skills/baseline/SKILL.md +183 -461
- package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
- package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
- package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
- package/src/skills/baseline/references/baseline-plan-template.md +37 -76
- package/src/skills/baseline/references/boundary-cases.md +86 -0
- package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
- package/src/skills/baseline/references/comparability-contract.md +7 -12
- package/src/skills/baseline/references/operational-guidance.md +56 -0
- package/src/skills/baseline/references/route-selection.md +5 -25
- package/src/skills/decision/SKILL.md +113 -306
- package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
- package/src/skills/decision/references/operational-guidance.md +94 -0
- package/src/skills/decision/references/research-route-criteria.md +7 -8
- package/src/skills/decision/references/strategic-decision-template.md +13 -26
- package/src/skills/experiment/SKILL.md +132 -670
- package/src/skills/experiment/references/execution-playbook.md +374 -0
- package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
- package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
- package/src/skills/experiment/references/operational-guidance.md +108 -0
- package/src/skills/finalize/SKILL.md +62 -0
- package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
- package/src/skills/finalize/references/resume-packet-template.md +7 -0
- package/src/skills/idea/SKILL.md +228 -15
- package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
- package/src/skills/idea/references/current-board-packet-template.md +61 -0
- package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
- package/src/skills/idea/references/idea-generation-playbook.md +21 -0
- package/src/skills/idea/references/idea-thinking-flow.md +6 -0
- package/src/skills/idea/references/literature-survey-template.md +3 -0
- package/src/skills/idea/references/objective-contract-template.md +54 -0
- package/src/skills/idea/references/outline-seeding-example.md +56 -0
- package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
- package/src/skills/idea/references/related-work-playbook.md +75 -2
- package/src/skills/idea/references/research-history-playbook.md +114 -0
- package/src/skills/idea/references/selection-gate.md +58 -6
- package/src/skills/intake-audit/SKILL.md +43 -2
- package/src/skills/intake-audit/references/state-audit-template.md +10 -0
- package/src/skills/nature-data/SKILL.md +128 -0
- package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-data/agents/openai.yaml +4 -0
- package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
- package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
- package/src/skills/nature-data/references/policy-principles.md +103 -0
- package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
- package/src/skills/nature-data/references/source-basis.md +54 -0
- package/src/skills/nature-data/references/statement-patterns.md +153 -0
- package/src/skills/nature-figure/SKILL.md +197 -0
- package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-figure/agents/openai.yaml +4 -0
- package/src/skills/nature-figure/evals/evals.json +37 -0
- package/src/skills/nature-figure/references/api.md +428 -0
- package/src/skills/nature-figure/references/backend-selection.md +100 -0
- package/src/skills/nature-figure/references/chart-types.md +281 -0
- package/src/skills/nature-figure/references/common-patterns.md +349 -0
- package/src/skills/nature-figure/references/design-theory.md +436 -0
- package/src/skills/nature-figure/references/figure-contract.md +93 -0
- package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
- package/src/skills/nature-figure/references/qa-contract.md +119 -0
- package/src/skills/nature-figure/references/r-template-index.md +66 -0
- package/src/skills/nature-figure/references/r-workflow.md +161 -0
- package/src/skills/nature-figure/references/tutorials.md +250 -0
- package/src/skills/nature-paper2ppt/SKILL.md +507 -0
- package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/SKILL.md +385 -0
- package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-polishing/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
- package/src/skills/nature-polishing/references/section-moves.md +240 -0
- package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
- package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
- package/src/skills/optimize/SKILL.md +177 -1568
- package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
- package/src/skills/optimize/references/candidate-board-template.md +13 -0
- package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
- package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
- package/src/skills/optimize/references/debug-response-template.md +29 -0
- package/src/skills/optimize/references/frontier-review-template.md +32 -0
- package/src/skills/optimize/references/fusion-playbook.md +36 -0
- package/src/skills/optimize/references/method-brief-template.md +73 -0
- package/src/skills/optimize/references/operational-guidance.md +621 -0
- package/src/skills/optimize/references/optimization-memory-template.md +30 -0
- package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
- package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
- package/src/skills/optimize/references/prompt-patterns.md +49 -0
- package/src/skills/paper-outline/SKILL.md +227 -0
- package/src/skills/paper-outline/references/outline-patterns.md +87 -0
- package/src/skills/paper-plot/SKILL.md +79 -0
- package/src/skills/paper-plot/agents/openai.yaml +4 -0
- package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
- package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
- package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
- package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
- package/src/skills/paper-plot/references/line_training_curve.md +44 -0
- package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
- package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
- package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
- package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
- package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
- package/src/skills/paper-plot/scripts/line_aime.py +94 -0
- package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
- package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
- package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
- package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
- package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
- package/src/skills/rebuttal/SKILL.md +9 -0
- package/src/skills/references/tool-usage-by-stage.md +438 -0
- package/src/skills/review/SKILL.md +105 -7
- package/src/skills/science/PROVENANCE.md +44 -0
- package/src/skills/science/SKILL.md +137 -0
- package/src/skills/science/references/artifact-science-tool.md +110 -0
- package/src/skills/science/references/claim-type-discipline.md +56 -0
- package/src/skills/science/references/domain-index.md +422 -0
- package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
- package/src/skills/science/references/package-check-playbook.md +64 -0
- package/src/skills/science/references/package-index.min.json +3616 -0
- package/src/skills/science/references/packages/abinit.md +80 -0
- package/src/skills/science/references/packages/acts.md +73 -0
- package/src/skills/science/references/packages/aiida-core.md +80 -0
- package/src/skills/science/references/packages/alamode.md +80 -0
- package/src/skills/science/references/packages/amuse.md +88 -0
- package/src/skills/science/references/packages/anndata.md +88 -0
- package/src/skills/science/references/packages/arbor.md +80 -0
- package/src/skills/science/references/packages/arc.md +73 -0
- package/src/skills/science/references/packages/astropy.md +88 -0
- package/src/skills/science/references/packages/astroquery.md +88 -0
- package/src/skills/science/references/packages/atomate2.md +80 -0
- package/src/skills/science/references/packages/atomsmltr.md +73 -0
- package/src/skills/science/references/packages/awkward.md +73 -0
- package/src/skills/science/references/packages/batman.md +88 -0
- package/src/skills/science/references/packages/biopython.md +88 -0
- package/src/skills/science/references/packages/bloqade.md +73 -0
- package/src/skills/science/references/packages/brian2.md +73 -0
- package/src/skills/science/references/packages/bullet3.md +73 -0
- package/src/skills/science/references/packages/calculix.md +80 -0
- package/src/skills/science/references/packages/cantera.md +73 -0
- package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
- package/src/skills/science/references/packages/ccdproc.md +88 -0
- package/src/skills/science/references/packages/celerite2.md +88 -0
- package/src/skills/science/references/packages/cellrank.md +73 -0
- package/src/skills/science/references/packages/cesm.md +80 -0
- package/src/skills/science/references/packages/chemicals.md +73 -0
- package/src/skills/science/references/packages/chempy.md +73 -0
- package/src/skills/science/references/packages/cirq.md +73 -0
- package/src/skills/science/references/packages/coffea.md +73 -0
- package/src/skills/science/references/packages/cp2k.md +88 -0
- package/src/skills/science/references/packages/custodian.md +80 -0
- package/src/skills/science/references/packages/dart.md +73 -0
- package/src/skills/science/references/packages/datamol.md +88 -0
- package/src/skills/science/references/packages/dd4hep.md +73 -0
- package/src/skills/science/references/packages/dealii.md +80 -0
- package/src/skills/science/references/packages/deepchem.md +88 -0
- package/src/skills/science/references/packages/delphes.md +73 -0
- package/src/skills/science/references/packages/devito.md +80 -0
- package/src/skills/science/references/packages/dftb.md +88 -0
- package/src/skills/science/references/packages/dftd4.md +88 -0
- package/src/skills/science/references/packages/dftk-jl.md +80 -0
- package/src/skills/science/references/packages/dolfinx.md +80 -0
- package/src/skills/science/references/packages/drake.md +73 -0
- package/src/skills/science/references/packages/dumux.md +73 -0
- package/src/skills/science/references/packages/elk.md +80 -0
- package/src/skills/science/references/packages/elmerfem.md +80 -0
- package/src/skills/science/references/packages/enzo-e.md +88 -0
- package/src/skills/science/references/packages/espresso.md +80 -0
- package/src/skills/science/references/packages/exoplanet.md +88 -0
- package/src/skills/science/references/packages/fairroot.md +73 -0
- package/src/skills/science/references/packages/fbpic.md +80 -0
- package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
- package/src/skills/science/references/packages/geant4.md +73 -0
- package/src/skills/science/references/packages/geosx.md +80 -0
- package/src/skills/science/references/packages/gprmax.md +80 -0
- package/src/skills/science/references/packages/gromacs.md +80 -0
- package/src/skills/science/references/packages/gwaslab.md +73 -0
- package/src/skills/science/references/packages/gz-sim.md +73 -0
- package/src/skills/science/references/packages/hail.md +88 -0
- package/src/skills/science/references/packages/hiphive.md +80 -0
- package/src/skills/science/references/packages/hoomd-blue.md +80 -0
- package/src/skills/science/references/packages/itensor.md +73 -0
- package/src/skills/science/references/packages/itensors-jl.md +73 -0
- package/src/skills/science/references/packages/jdftx.md +73 -0
- package/src/skills/science/references/packages/jobflow.md +80 -0
- package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
- package/src/skills/science/references/packages/kite.md +80 -0
- package/src/skills/science/references/packages/kratos.md +80 -0
- package/src/skills/science/references/packages/kwant.md +73 -0
- package/src/skills/science/references/packages/lammps.md +80 -0
- package/src/skills/science/references/packages/lightkurve.md +88 -0
- package/src/skills/science/references/packages/limix.md +73 -0
- package/src/skills/science/references/packages/maxwelllink.md +80 -0
- package/src/skills/science/references/packages/mcdc.md +73 -0
- package/src/skills/science/references/packages/meep.md +80 -0
- package/src/skills/science/references/packages/mfem.md +80 -0
- package/src/skills/science/references/packages/mitgcm.md +73 -0
- package/src/skills/science/references/packages/modflow6.md +73 -0
- package/src/skills/science/references/packages/molecool.md +73 -0
- package/src/skills/science/references/packages/mom6.md +73 -0
- package/src/skills/science/references/packages/moose.md +80 -0
- package/src/skills/science/references/packages/mpas-model.md +73 -0
- package/src/skills/science/references/packages/mujoco.md +73 -0
- package/src/skills/science/references/packages/mumax3.md +73 -0
- package/src/skills/science/references/packages/nekrs.md +80 -0
- package/src/skills/science/references/packages/nessi.md +73 -0
- package/src/skills/science/references/packages/nest-simulator.md +73 -0
- package/src/skills/science/references/packages/netket.md +73 -0
- package/src/skills/science/references/packages/neuron.md +73 -0
- package/src/skills/science/references/packages/nextflow.md +88 -0
- package/src/skills/science/references/packages/nwchem.md +88 -0
- package/src/skills/science/references/packages/openbabel.md +88 -0
- package/src/skills/science/references/packages/openems.md +80 -0
- package/src/skills/science/references/packages/openff-toolkit.md +88 -0
- package/src/skills/science/references/packages/openfoam-dev.md +80 -0
- package/src/skills/science/references/packages/openmc.md +73 -0
- package/src/skills/science/references/packages/openmm.md +80 -0
- package/src/skills/science/references/packages/openmoc.md +73 -0
- package/src/skills/science/references/packages/openmx.md +80 -0
- package/src/skills/science/references/packages/opensees.md +80 -0
- package/src/skills/science/references/packages/opensn.md +80 -0
- package/src/skills/science/references/packages/opm-simulators.md +73 -0
- package/src/skills/science/references/packages/oqupy.md +73 -0
- package/src/skills/science/references/packages/packmol.md +80 -0
- package/src/skills/science/references/packages/palabos.md +80 -0
- package/src/skills/science/references/packages/parflow.md +80 -0
- package/src/skills/science/references/packages/pennylane.md +88 -0
- package/src/skills/science/references/packages/perceval.md +73 -0
- package/src/skills/science/references/packages/phono3py.md +73 -0
- package/src/skills/science/references/packages/phonopy.md +73 -0
- package/src/skills/science/references/packages/photutils.md +88 -0
- package/src/skills/science/references/packages/picongpu.md +80 -0
- package/src/skills/science/references/packages/plink-ng.md +88 -0
- package/src/skills/science/references/packages/precice.md +73 -0
- package/src/skills/science/references/packages/psc.md +80 -0
- package/src/skills/science/references/packages/psi4.md +88 -0
- package/src/skills/science/references/packages/pybinding.md +73 -0
- package/src/skills/science/references/packages/pyfr.md +80 -0
- package/src/skills/science/references/packages/pyhf.md +73 -0
- package/src/skills/science/references/packages/pyiron_base.md +80 -0
- package/src/skills/science/references/packages/pylcp.md +73 -0
- package/src/skills/science/references/packages/pylith.md +80 -0
- package/src/skills/science/references/packages/pynbody.md +88 -0
- package/src/skills/science/references/packages/pysam.md +88 -0
- package/src/skills/science/references/packages/pyscf.md +88 -0
- package/src/skills/science/references/packages/q-e.md +73 -0
- package/src/skills/science/references/packages/qibo.md +73 -0
- package/src/skills/science/references/packages/qiskit.md +73 -0
- package/src/skills/science/references/packages/quantica-jl.md +73 -0
- package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
- package/src/skills/science/references/packages/quimb.md +73 -0
- package/src/skills/science/references/packages/qulacs.md +73 -0
- package/src/skills/science/references/packages/qutip.md +73 -0
- package/src/skills/science/references/packages/rdkit.md +88 -0
- package/src/skills/science/references/packages/rmg-py.md +73 -0
- package/src/skills/science/references/packages/root.md +73 -0
- package/src/skills/science/references/packages/scanpy.md +88 -0
- package/src/skills/science/references/packages/scikit-allel.md +88 -0
- package/src/skills/science/references/packages/scikit-bio.md +88 -0
- package/src/skills/science/references/packages/scqubits.md +73 -0
- package/src/skills/science/references/packages/scuff-em.md +80 -0
- package/src/skills/science/references/packages/scvi-tools.md +73 -0
- package/src/skills/science/references/packages/seissol.md +73 -0
- package/src/skills/science/references/packages/sfepy.md +80 -0
- package/src/skills/science/references/packages/sisl.md +73 -0
- package/src/skills/science/references/packages/smilei.md +80 -0
- package/src/skills/science/references/packages/snakemake.md +88 -0
- package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
- package/src/skills/science/references/packages/specutils.md +88 -0
- package/src/skills/science/references/packages/spglib.md +80 -0
- package/src/skills/science/references/packages/squidpy.md +88 -0
- package/src/skills/science/references/packages/starry.md +88 -0
- package/src/skills/science/references/packages/strawberryfields.md +73 -0
- package/src/skills/science/references/packages/su2.md +80 -0
- package/src/skills/science/references/packages/sunny-jl.md +73 -0
- package/src/skills/science/references/packages/sw4.md +73 -0
- package/src/skills/science/references/packages/swift.md +88 -0
- package/src/skills/science/references/packages/tdnegf.md +73 -0
- package/src/skills/science/references/packages/tenpy.md +73 -0
- package/src/skills/science/references/packages/thermo.md +73 -0
- package/src/skills/science/references/packages/tkwant.md +73 -0
- package/src/skills/science/references/packages/tvb-root.md +73 -0
- package/src/skills/science/references/packages/uproot5.md +73 -0
- package/src/skills/science/references/packages/vampire.md +80 -0
- package/src/skills/science/references/packages/wannier_tools.md +73 -0
- package/src/skills/science/references/packages/warpx.md +80 -0
- package/src/skills/science/references/packages/wrf.md +73 -0
- package/src/skills/science/references/packages/xtb.md +88 -0
- package/src/skills/science/references/packages/yt.md +73 -0
- package/src/skills/science/references/science-task-brief-template.md +71 -0
- package/src/skills/scout/SKILL.md +83 -425
- package/src/skills/scout/references/literature-scout-template.md +5 -24
- package/src/skills/scout/references/operational-guidance.md +191 -0
- package/src/skills/scout/references/paper-triage-playbook.md +11 -35
- package/src/skills/write/SKILL.md +744 -1246
- package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
- package/src/skills/write/references/oral_package_patterns.md +252 -0
- package/src/skills/write/references/oral_writing_principles.md +291 -0
- package/src/skills/write/references/section_rewrite_checklist.md +234 -0
- package/src/tui/dist/app/AppContainer.js +1314 -27
- package/src/tui/dist/components/Composer.js +26 -1
- package/src/tui/dist/components/ConfigScreen.js +2 -1
- package/src/tui/dist/components/InputPrompt.js +25 -9
- package/src/tui/dist/components/MainContent.js +18 -3
- package/src/tui/dist/components/QuestScreen.js +3 -2
- package/src/tui/dist/components/UtilityScreen.js +37 -0
- package/src/tui/dist/hooks/useSafeInput.js +10 -0
- package/src/tui/dist/index.js +13 -1
- package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
- package/src/tui/dist/lib/api.js +89 -1
- package/src/tui/package.json +1 -1
- package/src/ui/dist/assets/{AnalysisPlugin-BCKAfjba.js → AnalysisPlugin-CA94NGmI.js} +1 -1
- package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
- package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
- package/src/ui/dist/assets/{CodeViewerPlugin-CbaFRrUU.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
- package/src/ui/dist/assets/{DocViewerPlugin-DAjLVeQD.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
- package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
- package/src/ui/dist/assets/{GitDiffViewerPlugin-CQACjoAA.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
- package/src/ui/dist/assets/{GitSnapshotViewer-0r4nLPke.js → GitSnapshotViewer-CweA6VON.js} +2 -2
- package/src/ui/dist/assets/{ImageViewerPlugin-nBOmI2v_.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
- package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
- package/src/ui/dist/assets/{LatexPlugin-ZwtV8pIp.js → LatexPlugin-BQjAaA5J.js} +4 -4
- package/src/ui/dist/assets/{MarkdownViewerPlugin-DKqVfKyW.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
- package/src/ui/dist/assets/{MarketplacePlugin-BwxStZ9D.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
- package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
- package/src/ui/dist/assets/{NotebookEditor-DB9N_T9q.js → NotebookEditor-WFyd8Ybt.js} +3 -3
- package/src/ui/dist/assets/{PdfLoader-eWBONbQP.js → PdfLoader-CLE5u5TS.js} +3 -3
- package/src/ui/dist/assets/{PdfMarkdownPlugin-D22YOZL3.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
- package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
- package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
- package/src/ui/dist/assets/{TextViewerPlugin-C5xqeeUH.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
- package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
- package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
- package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
- package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
- package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
- package/src/ui/dist/assets/{code-WlFHE7z_.js → code-DbsmSd3Y.js} +1 -1
- package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
- package/src/ui/dist/assets/{wrap-text-BC-Hltpd.js → file-jump-queue-DeQBikaw.js} +3 -3
- package/src/ui/dist/assets/{file-socket-CfQPKQKj.js → file-socket-DA5XIx88.js} +1 -1
- package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
- package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
- package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
- package/src/ui/dist/assets/{index-CwNu1aH4.js → index-BsO46tJA.js} +1 -1
- package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
- package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
- package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
- package/src/ui/dist/assets/{project-sync-C9IdzdZW.js → project-sync-DPmWKmKD.js} +1 -1
- package/src/ui/dist/assets/{zoom-out-E_gaeAxL.js → zoom-out-DAukFWen.js} +3 -3
- package/src/ui/dist/index.html +3 -3
- package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
- package/src/skills/baseline/references/memory-playbook.md +0 -40
- package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
- package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
- package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
- package/src/skills/write/references/paper-section-playbook.md +0 -64
- package/src/skills/write/references/reviewer-first-writing.md +0 -64
- package/src/skills/write/references/revision-checklist.md +0 -70
- package/src/skills/write/references/section-contracts.md +0 -82
- package/src/skills/write/references/sentence-level-proofing.md +0 -49
- package/src/ui/dist/assets/AiManusChatView-Bv-Z8YpU.js +0 -204
- package/src/ui/dist/assets/CliPlugin-BCKcpc35.js +0 -109
- package/src/ui/dist/assets/CodeEditorPlugin-DbOfSJ8K.js +0 -2
- package/src/ui/dist/assets/GitCommitViewerPlugin-CIUqbUDO.js +0 -1
- package/src/ui/dist/assets/LabCopilotPanel-BHxOxF4z.js +0 -14
- package/src/ui/dist/assets/LabPlugin-BKoZGs95.js +0 -22
- package/src/ui/dist/assets/NotebookEditor-BEQhaQbt.js +0 -81
- package/src/ui/dist/assets/PdfViewerPlugin-c-RK9DLM.js +0 -17
- package/src/ui/dist/assets/SearchPlugin-CxF9ytAx.js +0 -16
- package/src/ui/dist/assets/VNCViewer-BoLGLnHz.js +0 -11
- package/src/ui/dist/assets/bot-DREQOxzP.js +0 -6
- package/src/ui/dist/assets/chevron-up-C9Qpx4DE.js +0 -6
- package/src/ui/dist/assets/file-content-BZMz3RYp.js +0 -1
- package/src/ui/dist/assets/file-diff-panel-CQhw0jS2.js +0 -1
- package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
- package/src/ui/dist/assets/git-commit-horizontal-DxZ8DCZh.js +0 -6
- package/src/ui/dist/assets/image-Bgl4VIyx.js +0 -6
- package/src/ui/dist/assets/index-BpV6lusQ.css +0 -33
- package/src/ui/dist/assets/index-CBNVuWcP.js +0 -2496
- package/src/ui/dist/assets/index-DrUnlf6K.js +0 -1
- package/src/ui/dist/assets/index-NW-h8VzN.js +0 -1
- package/src/ui/dist/assets/pdf-effect-queue-J8OnM0jE.js +0 -6
- package/src/ui/dist/assets/popover-CLc0pPP8.js +0 -1
- package/src/ui/dist/assets/select-Cs2PmzwL.js +0 -11
- package/src/ui/dist/assets/sigma-ClKcHAXm.js +0 -6
- package/src/ui/dist/assets/trash-DwpbFr3w.js +0 -11
- package/src/ui/dist/assets/useCliAccess-NQ8m0Let.js +0 -1
- package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
|
@@ -0,0 +1,182 @@
|
|
|
1
|
+
id: aisb.t3.042_xpatch
|
|
2
|
+
name: 'xPatch:基于指数季节-趋势分解的双流时间序列预测'
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: 采用基于EMA的季节-趋势分解和长上下文补丁的CNN-MLP双流长期时间序列预测。
|
|
5
|
+
task_description: '本封装基准测试包含xPatch,这是一个双流长期时间序列预测(LTSF)架构,使用指数移动平均(EMA)而非简单移动平均将输入序列分解为季节分量和趋势分量。线性流采用MLP层进行趋势预测,非线性流使用深度可分离CNN捕捉季节模式。该模型在非Transformer骨干网络中研究补丁化和通道独立技术,对标Transformer基线(PatchTST、Autoformer、FEDformer、CARD)和线性基线(DLinear、RLinear)在标准LTSF基准数据集上的表现。
|
|
6
|
+
|
|
7
|
+
'
|
|
8
|
+
task_mode: experiment_driven
|
|
9
|
+
requires_execution: true
|
|
10
|
+
requires_paper: true
|
|
11
|
+
integrity_level: cas_plus_canary
|
|
12
|
+
snapshot_status: runnable
|
|
13
|
+
support_level: advanced
|
|
14
|
+
time_band: 6-24h
|
|
15
|
+
cost_band: medium
|
|
16
|
+
difficulty: hard
|
|
17
|
+
data_access: public
|
|
18
|
+
primary_outputs:
|
|
19
|
+
- mse
|
|
20
|
+
- mae
|
|
21
|
+
- forecast_checkpoints
|
|
22
|
+
- ablation_outputs
|
|
23
|
+
launch_profiles:
|
|
24
|
+
- id: quick_eval
|
|
25
|
+
label: 快速评估
|
|
26
|
+
description: '使用统一实验设置在单个准备好的预测数据集上运行xPatch。执行xPatch_unified脚本,使用默认超参数。适用于快速验证模型在单个基准数据集上的行为。
|
|
27
|
+
|
|
28
|
+
'
|
|
29
|
+
- id: hyper_search
|
|
30
|
+
label: 超参数搜索
|
|
31
|
+
description: '在补丁长度、回溯窗口、预测长度和EMA alpha参数上运行全面的超参数搜索。使用xPatch_search脚本。生成的结果可与在报告结果时使用了drop-last技巧的基线论文进行公平比较。
|
|
32
|
+
|
|
33
|
+
'
|
|
34
|
+
- id: fair_benchmark
|
|
35
|
+
label: 公平基准测试(TFB/OpenTS)
|
|
36
|
+
description: '遵循TFB基准测试协议,在不使用drop-last技巧的情况下执行公平实验。使用xPatch_fair脚本。结果可与OpenTS排行榜条目进行比较。
|
|
37
|
+
|
|
38
|
+
'
|
|
39
|
+
- id: ablation_suite
|
|
40
|
+
label: 消融实验套件
|
|
41
|
+
description: '运行论文附录中的消融研究,包括EMA分解影响、arctangent损失函数效应、sigmoid学习率调整方案,以及与./ablation目录中基线模型的推理时间比较。
|
|
42
|
+
|
|
43
|
+
'
|
|
44
|
+
dataset_download:
|
|
45
|
+
primary_method: mixed
|
|
46
|
+
sources:
|
|
47
|
+
- name: Google Drive
|
|
48
|
+
url: https://drive.google.com/u/0/uc?id=1NF7VEefXCmXuWNbnNe858WvQAkJ_7wuP&export=download
|
|
49
|
+
format: csv
|
|
50
|
+
- name: Baidu Pan
|
|
51
|
+
url: https://pan.baidu.com/share/init?surl=r3KhGd0Q9PJIUZdfEYoymg&pwd=i9iy
|
|
52
|
+
format: csv
|
|
53
|
+
- name: Kaggle Datasets
|
|
54
|
+
url: https://www.kaggle.com/datasets/wentixxiaogege/time-series-dataset
|
|
55
|
+
format: csv
|
|
56
|
+
notes:
|
|
57
|
+
- 将所有预处理数据集下载到./dataset目录
|
|
58
|
+
- 基准数据集包括:ETTh1、ETTh2、ETTm1、ETTm2、Weather、Traffic、Electricity
|
|
59
|
+
- 数据集已预处理完毕,可直接使用,无需额外标准化步骤
|
|
60
|
+
credential_requirements:
|
|
61
|
+
mode: optional
|
|
62
|
+
items:
|
|
63
|
+
- kaggle_api_token
|
|
64
|
+
notes:
|
|
65
|
+
- Kaggle下载需要kaggle凭据或API令牌
|
|
66
|
+
- Google Drive和百度链接无需认证即可访问
|
|
67
|
+
resources:
|
|
68
|
+
minimum:
|
|
69
|
+
cpu_cores: 8
|
|
70
|
+
ram_gb: 32
|
|
71
|
+
disk_gb: 80
|
|
72
|
+
gpu_count: 1
|
|
73
|
+
gpu_vram_gb: 24
|
|
74
|
+
notes: 单GPU足够;建议使用RTX 6000级或同等配置
|
|
75
|
+
recommended:
|
|
76
|
+
cpu_cores: 16
|
|
77
|
+
ram_gb: 64
|
|
78
|
+
disk_gb: 150
|
|
79
|
+
gpu_count: 1
|
|
80
|
+
gpu_vram_gb: 24
|
|
81
|
+
notes: '原始实验使用单张Quadro RTX 6000(24GB)。超参数搜索和消融研究受益于更大的内存,以便处理更大的批次。
|
|
82
|
+
|
|
83
|
+
'
|
|
84
|
+
environment:
|
|
85
|
+
python: '3.9'
|
|
86
|
+
cuda: '11.8'
|
|
87
|
+
pytorch: 2.5.1
|
|
88
|
+
flash_attn: null
|
|
89
|
+
key_packages:
|
|
90
|
+
- pytorch>=2.0.0
|
|
91
|
+
- numpy
|
|
92
|
+
- pandas
|
|
93
|
+
- scikit-learn
|
|
94
|
+
- matplotlib
|
|
95
|
+
notes:
|
|
96
|
+
- 环境配置文件(environment.yml)指定了conda CUDA 11.8工具包,并使用pip安装PyTorch 2.5.1
|
|
97
|
+
- 混合conda/pip环境栈需要仔细的环境管理
|
|
98
|
+
- 使用以下命令创建conda环境:conda env create -f environment.yml
|
|
99
|
+
- 参见附带的README了解完整的依赖项集合
|
|
100
|
+
- ./scripts目录中的实验脚本处理运行时配置
|
|
101
|
+
risk_flags:
|
|
102
|
+
- mixed_environment_stack
|
|
103
|
+
- data_download_external
|
|
104
|
+
- hyperparameter_sensitivity
|
|
105
|
+
risk_notes:
|
|
106
|
+
- 混合conda CUDA 11.8与pip PyTorch 2.5.1可能导致版本冲突;请验证CUDA运行时与PyTorch内置CUDA版本匹配
|
|
107
|
+
- 从Google Drive/百度网盘下载外部数据集可能需要VPN或特定地区的网络访问条件
|
|
108
|
+
- 性能对补丁长度、回溯窗口、预测长度和EMA alpha参数敏感
|
|
109
|
+
- 公平基准测试结果按照TFB协议排除了drop-last技巧;请验证哪种实验设置符合您的评估目标
|
|
110
|
+
recommended_when: '当评估双流非Transformer预测架构、研究基于EMA的季节-趋势分解效果、探索Transformer之外的补丁化和通道独立技术,或在长期预测任务中将CNN/MLP方法与已建立的Transformer和线性基线进行比较时,使用此基准测试。
|
|
111
|
+
|
|
112
|
+
'
|
|
113
|
+
not_recommended_when: '对于非时间序列任务、实时/在线预测场景、无法访问配备24GB显存的工作站级GPU的环境,或需要内置不确定性量化的模型时,不建议使用此基准测试。
|
|
114
|
+
|
|
115
|
+
'
|
|
116
|
+
paper:
|
|
117
|
+
title: 'xPatch: Dual-Stream Time Series Forecasting with Exponential Seasonal-Trend
|
|
118
|
+
Decomposition'
|
|
119
|
+
authors:
|
|
120
|
+
- Artyom Stitsyuk
|
|
121
|
+
- Jaesik Choi
|
|
122
|
+
venue: AAAI 2025
|
|
123
|
+
year: 2025
|
|
124
|
+
volume: '39'
|
|
125
|
+
number: '19'
|
|
126
|
+
pages: 20601-20609
|
|
127
|
+
url: https://ojs.aaai.org/index.php/AAAI/article/view/34270
|
|
128
|
+
arxiv_url: https://arxiv.org/pdf/2412.17323
|
|
129
|
+
bibtex: "@inproceedings{stitsyuk2025xpatch,\n title={xPatch: Dual-Stream Time Series\
|
|
130
|
+
\ Forecasting with Exponential Seasonal-Trend Decomposition},\n author={Stitsyuk,\
|
|
131
|
+
\ Artyom and Choi, Jaesik},\n booktitle={Proceedings of the AAAI Conference on\
|
|
132
|
+
\ Artificial Intelligence},\n volume={39}, number={19}, pages={20601--20609},\
|
|
133
|
+
\ year={2025}\n}\n"
|
|
134
|
+
download:
|
|
135
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.042_xpatch.zip
|
|
136
|
+
archive_type: zip
|
|
137
|
+
local_dir_name: paper-42-xPatch
|
|
138
|
+
provider: github_release
|
|
139
|
+
repo: ResearAI/DeepScientist
|
|
140
|
+
tag: aisb-v0.0.1
|
|
141
|
+
asset_name: aisb.t3.042_xpatch.zip
|
|
142
|
+
sha256: 72c8e6fd7e1a8b2eb184077ce9a37fb36514ef7bb148d8d0ff4ed79d4aa9de25
|
|
143
|
+
size_bytes: 3621184
|
|
144
|
+
display:
|
|
145
|
+
palette_seed: teal-sunrise-trend
|
|
146
|
+
art_style: signal-geometry
|
|
147
|
+
accent_priority: high
|
|
148
|
+
image_path: ../image/042_aisb.t3.042_xpatch.jpg
|
|
149
|
+
metric_contract:
|
|
150
|
+
mse:
|
|
151
|
+
origin_path: utils/metrics.py
|
|
152
|
+
source_ref: MSE function
|
|
153
|
+
evaluation_protocol:
|
|
154
|
+
code_paths:
|
|
155
|
+
- run.py
|
|
156
|
+
- utils/metrics.py
|
|
157
|
+
status: code_backed
|
|
158
|
+
mae:
|
|
159
|
+
origin_path: utils/metrics.py
|
|
160
|
+
source_ref: MAE function
|
|
161
|
+
evaluation_protocol:
|
|
162
|
+
code_paths:
|
|
163
|
+
- run.py
|
|
164
|
+
- utils/metrics.py
|
|
165
|
+
status: code_backed
|
|
166
|
+
forecast_checkpoints:
|
|
167
|
+
origin_path: exp/exp_main.py
|
|
168
|
+
source_ref: model state saving
|
|
169
|
+
status: provisional
|
|
170
|
+
code_anchors:
|
|
171
|
+
- environment.yml
|
|
172
|
+
- run.py
|
|
173
|
+
- utils/metrics.py
|
|
174
|
+
- exp/exp_main.py
|
|
175
|
+
- layers/decomp.py
|
|
176
|
+
- layers/network.py
|
|
177
|
+
- layers/network_cnn.py
|
|
178
|
+
- layers/network_mlp.py
|
|
179
|
+
- models/xPatch.py
|
|
180
|
+
caveat_snapshot: '静态代码审计发现utils/metrics.py和run.py中存在MSE和MAE指标的可执行锚点。本封装过程中未执行基准测试。运行时执行是信任指标值之前的必要步骤。公平基准测试需要TFB/OpenTS协议合规;请确认drop-last技巧处理与评估目标匹配。
|
|
181
|
+
|
|
182
|
+
'
|
|
@@ -0,0 +1,268 @@
|
|
|
1
|
+
id: aisb.t3.043_vhm
|
|
2
|
+
name: VHM
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: Two-stage remote-sensing VLM training (VersaD pretrain + instruction SFT)
|
|
5
|
+
with external RSEvalKit evaluation of a 7B model built on Vicuna-7B and CLIP-ViT-L-336px.
|
|
6
|
+
task_description: 'This benchmark covers reproducing the full VHM (Versatile and Honest
|
|
7
|
+
Vision Language Model) pipeline for remote sensing image analysis. The model architecture
|
|
8
|
+
combines Vicuna-7B, CLIP-ViT-L/14-336px vision encoder, and a 2-layer MLP projector.
|
|
9
|
+
Training proceeds in two stages: (1) Pretrain on the VersaD dataset (1.4 million
|
|
10
|
+
RS image-text pairs with rich captions generated by Gemini-Vision), where layers
|
|
11
|
+
8+ of the vision encoder, the projector, and the full LLM are fine-tuned for one
|
|
12
|
+
epoch using DeepSpeed ZeRO-3 across multiple nodes; (2) Supervised fine-tuning (SFT)
|
|
13
|
+
on the VHM_SFT instruction dataset (covering VersaD-Instruct, HnstD honesty data,
|
|
14
|
+
and VariousRS-Instruct tasks including VQA, visual grounding, scene classification,
|
|
15
|
+
object counting, building vectorizing, and multi-label classification), where only
|
|
16
|
+
the projector and LLM are updated. Downstream evaluation requires cloning and installing
|
|
17
|
+
the external RSEvalKit repository in a separate conda environment, along with downloading
|
|
18
|
+
the VHM_Eval dataset (~7.35 GB). The packaged snapshot contains training code, DeepSpeed
|
|
19
|
+
configs, and SLURM launch scripts. Evaluation code, datasets, and model weights
|
|
20
|
+
are NOT bundled. No benchmark execution was performed during packaging; the primary
|
|
21
|
+
metric aid_accuracy is blocked pending RSEvalKit setup.
|
|
22
|
+
|
|
23
|
+
'
|
|
24
|
+
task_mode: experiment_driven
|
|
25
|
+
requires_execution: true
|
|
26
|
+
requires_paper: true
|
|
27
|
+
integrity_level: cas_plus_canary
|
|
28
|
+
snapshot_status: external_eval_required
|
|
29
|
+
support_level: recovery
|
|
30
|
+
time_band: 2-4d
|
|
31
|
+
cost_band: very_high
|
|
32
|
+
difficulty: hard
|
|
33
|
+
data_access: public
|
|
34
|
+
primary_outputs:
|
|
35
|
+
- aid_accuracy
|
|
36
|
+
- vhm_sft_checkpoint
|
|
37
|
+
- rseval_report
|
|
38
|
+
launch_profiles:
|
|
39
|
+
- id: train_only
|
|
40
|
+
label: Train Only
|
|
41
|
+
description: 'Execute pretrain (slurm_pretrain.sh) and SFT (slurm_finetune.sh) stages
|
|
42
|
+
sequentially. Pretrain requires VersaD (~140 GB extracted), LLaVA-1.5 MLP projector
|
|
43
|
+
weights, Vicuna-7B, and CLIP-ViT-L-336px. SFT requires VHM_SFT (~124 GB extracted).
|
|
44
|
+
Produces pretrained and SFT checkpoints. Skips evaluation. Minimum viable on 2×48GB
|
|
45
|
+
GPUs via gradient accumulation; paper-reported timing assumes 16× A100-80GB pretrain
|
|
46
|
+
(~10h) and 8× A100-80GB SFT (~4h).
|
|
47
|
+
|
|
48
|
+
'
|
|
49
|
+
- id: paper_faithful
|
|
50
|
+
label: Paper-Faithful
|
|
51
|
+
description: 'Run full pipeline: pretrain, SFT, then RSEvalKit evaluation. Requires
|
|
52
|
+
cloning RSEvalKit into a separate conda environment (rseval) and downloading VHM_Eval
|
|
53
|
+
(~7.35 GB). Produces all downstream metrics from the paper: AID scene classification
|
|
54
|
+
accuracy, RSVQA, DIOR-RSVG visual grounding, honest QA, building vectorizing,
|
|
55
|
+
and multi-label classification. Minimum 2×48GB GPUs for training; paper-reported
|
|
56
|
+
timing assumes 16× A100-80GB pretrain and 8× A100-80GB SFT. Honest QA evaluation
|
|
57
|
+
calls the ChatGPT-3.5 API.
|
|
58
|
+
|
|
59
|
+
'
|
|
60
|
+
dataset_download:
|
|
61
|
+
primary_method: mixed
|
|
62
|
+
sources:
|
|
63
|
+
- kind: huggingface
|
|
64
|
+
url: https://huggingface.co/datasets/FitzPC/VHM_VersaD
|
|
65
|
+
access: public
|
|
66
|
+
note: 'VersaD pretraining corpus: 1.4M RS image-text pairs with Gemini-Vision-generated
|
|
67
|
+
rich captions covering image properties, object attributes, and scene context.
|
|
68
|
+
Approximately 140 GB extracted. Sources include Million-AID (920K), CrowdAI/SpaceNet
|
|
69
|
+
(276K), fMoW (81K), CVUSA (44K), CVACT (44K), and LoveDA (24K). Resolution range
|
|
70
|
+
0.08–153 m/pixel.
|
|
71
|
+
|
|
72
|
+
'
|
|
73
|
+
- kind: huggingface
|
|
74
|
+
url: https://huggingface.co/datasets/FitzPC/VHM_dataset_sft
|
|
75
|
+
access: public
|
|
76
|
+
note: 'VHM_SFT instruction dataset for supervised fine-tuning. Covers VersaD-Instruct,
|
|
77
|
+
HnstD factual and deceptive question pairs, and VariousRS-Instruct tasks. Approximately
|
|
78
|
+
124 GB extracted.
|
|
79
|
+
|
|
80
|
+
'
|
|
81
|
+
- kind: huggingface
|
|
82
|
+
url: https://huggingface.co/FitzPC/vhm_7B
|
|
83
|
+
access: public
|
|
84
|
+
note: 'Released VHM-7B SFT model weights. Allows skipping both training stages
|
|
85
|
+
and proceeding directly to RSEvalKit evaluation.
|
|
86
|
+
|
|
87
|
+
'
|
|
88
|
+
- kind: huggingface
|
|
89
|
+
url: https://huggingface.co/FitzPC/vhm_7b_pretrain_mlp_llm/tree/main
|
|
90
|
+
access: public
|
|
91
|
+
note: 'VHM pretrain-stage LLM and MLP projector weights. For resuming or initializing
|
|
92
|
+
from the pretrain checkpoint rather than training from scratch.
|
|
93
|
+
|
|
94
|
+
'
|
|
95
|
+
- kind: huggingface
|
|
96
|
+
url: https://huggingface.co/FitzPC/vhm_7b_pretrain_vit
|
|
97
|
+
access: public
|
|
98
|
+
note: 'CLIP ViT vision encoder weights after pretraining stage. Fine-tuned from
|
|
99
|
+
layer 8 onward during pretrain.
|
|
100
|
+
|
|
101
|
+
'
|
|
102
|
+
- kind: huggingface
|
|
103
|
+
url: https://huggingface.co/liuhaotian/llava-v1.5-mlp2x-336px-pretrain-vicuna-7b-v1.5/tree/main
|
|
104
|
+
access: public
|
|
105
|
+
note: 'LLaVA-1.5 pretrained MLP projector (mm_projector.bin). Required initialization
|
|
106
|
+
for pretrain stage.
|
|
107
|
+
|
|
108
|
+
'
|
|
109
|
+
- kind: github_repo
|
|
110
|
+
url: https://github.com/fitzpchao/RSEvalKit
|
|
111
|
+
access: public
|
|
112
|
+
note: 'External evaluation toolkit for remote-sensing VLMs. Must be cloned and
|
|
113
|
+
installed in a dedicated conda environment (conda create -n rseval). All downstream
|
|
114
|
+
evaluation metrics are implemented here. VHM_Eval dataset download instructions
|
|
115
|
+
are in RSEvalKit docs/Data.md.
|
|
116
|
+
|
|
117
|
+
'
|
|
118
|
+
notes:
|
|
119
|
+
- 'Paper-faithful reproduction requires VersaD (~140 GB), VHM_SFT (~124 GB), VHM_Eval
|
|
120
|
+
(~7.35 GB), base model weights (Vicuna-7B, CLIP-ViT-L-336px), and LLaVA MLP projector.
|
|
121
|
+
Combined download and extracted footprint exceeds 400 GB before training checkpoints
|
|
122
|
+
and caches.
|
|
123
|
+
|
|
124
|
+
'
|
|
125
|
+
- 'VHM_Eval data is hosted externally; follow RSEvalKit docs/Data.md instructions
|
|
126
|
+
for download.
|
|
127
|
+
|
|
128
|
+
'
|
|
129
|
+
- 'All data and model weights are licensed for research use only (CC BY-NC 4.0).
|
|
130
|
+
Commercial use is prohibited. Model weights are further subject to LLaMA, Vicuna,
|
|
131
|
+
and Gemini license terms.
|
|
132
|
+
|
|
133
|
+
'
|
|
134
|
+
credential_requirements:
|
|
135
|
+
mode: none
|
|
136
|
+
items: []
|
|
137
|
+
notes:
|
|
138
|
+
- 'No API keys or gated-access credentials are required for downloading any of the listed
|
|
139
|
+
datasets or model weights.
|
|
140
|
+
|
|
141
|
+
'
|
|
142
|
+
- 'Honest QA evaluation in the paper calls the ChatGPT-3.5 API; reproducing this
|
|
143
|
+
exactly requires an OpenAI API key, but this call occurs inside RSEvalKit, not
|
|
144
|
+
in the training snapshot.
|
|
145
|
+
|
|
146
|
+
'
|
|
147
|
+
resources:
|
|
148
|
+
minimum:
|
|
149
|
+
cpu_cores: 32
|
|
150
|
+
ram_gb: 128
|
|
151
|
+
disk_gb: 400
|
|
152
|
+
gpu_count: 2
|
|
153
|
+
gpu_vram_gb: 48
|
|
154
|
+
gpu_arch: Ampere or newer
|
|
155
|
+
recommended:
|
|
156
|
+
cpu_cores: 64
|
|
157
|
+
ram_gb: 256
|
|
158
|
+
disk_gb: 1200
|
|
159
|
+
gpu_count: 16
|
|
160
|
+
gpu_vram_gb: 80
|
|
161
|
+
gpu_arch: A100
|
|
162
|
+
multi_node: true
|
|
163
|
+
environment:
|
|
164
|
+
python: '3.10'
|
|
165
|
+
cuda: '11.8'
|
|
166
|
+
pytorch: 2.0.1
|
|
167
|
+
flash_attn: 2.3.1.post1
|
|
168
|
+
key_packages:
|
|
169
|
+
- flash-attn==2.3.1.post1
|
|
170
|
+
- deepspeed==0.9.5
|
|
171
|
+
- transformers==4.31.0
|
|
172
|
+
- xformers
|
|
173
|
+
notes:
|
|
174
|
+
- 'requirements.txt pins torch 2.0.1+cu118, flash-attn 2.3.1.post1, and deepspeed
|
|
175
|
+
0.9.5. Create environment with: conda create -n vhm python=3.10 && conda activate vhm && pip
|
|
176
|
+
install -r requirements.txt.
|
|
177
|
+
|
|
178
|
+
'
|
|
179
|
+
- 'Training uses DeepSpeed ZeRO-3 (scripts/zero3.json) with bf16 mixed precision
|
|
180
|
+
and gradient checkpointing. Multi-node launch via torchrun with SLURM (scripts/rs/slurm_pretrain.sh).
|
|
181
|
+
|
|
182
|
+
'
|
|
183
|
+
- 'Three training entry points: vhm/train/train.py (base), vhm/train/train_mem.py
|
|
184
|
+
(FlashAttention, default), vhm/train/train_xformers.py (xformers attention, alternative).
|
|
185
|
+
|
|
186
|
+
'
|
|
187
|
+
- 'Evaluation requires a separate conda environment (rseval) with RSEvalKit requirements.txt.
|
|
188
|
+
A single environment is NOT sufficient for the paper-faithful route.
|
|
189
|
+
|
|
190
|
+
'
|
|
191
|
+
- 'Pretrain fine-tunes vision encoder from layer 8 onward, the MLP projector, and
|
|
192
|
+
the full LLM for one epoch. SFT fine-tunes only the projector and LLM.
|
|
193
|
+
|
|
194
|
+
'
|
|
195
|
+
risk_flags:
|
|
196
|
+
- route_caveat
|
|
197
|
+
- external_eval_dependency
|
|
198
|
+
- large_dataset_route
|
|
199
|
+
- noncommercial_license
|
|
200
|
+
- api_dependency
|
|
201
|
+
risk_notes:
|
|
202
|
+
- 'The paper-faithful route spans three disconnected steps: pretrain (slurm_pretrain.sh),
|
|
203
|
+
SFT (slurm_finetune.sh), and separate RSEvalKit evaluation in a different conda
|
|
204
|
+
environment—not one self-contained local command.
|
|
205
|
+
|
|
206
|
+
'
|
|
207
|
+
- 'Paper-reported training times are 16× A100-80GB for pretrain (~10h) and 8× A100-80GB
|
|
208
|
+
for SFT (~4h). Slower runs on fewer or smaller GPUs should be budgeted in days.
|
|
209
|
+
Gradient accumulation steps can be adjusted to trade wall-clock time for reduced
|
|
210
|
+
GPU count.
|
|
211
|
+
|
|
212
|
+
'
|
|
213
|
+
- 'Dataset preparation is substantial: VersaD ~140 GB, VHM_SFT ~124 GB, VHM_Eval ~7.35
|
|
214
|
+
GB, plus base model weights and generated checkpoints. Total disk footprint can
|
|
215
|
+
exceed 1 TB.
|
|
216
|
+
|
|
217
|
+
'
|
|
218
|
+
- 'The primary evaluation metric (AID scene classification accuracy) depends on external
|
|
219
|
+
RSEvalKit, not a bundled evaluator. No executable evaluation anchor exists in the
|
|
220
|
+
current snapshot. The metric contract marks aid_accuracy as blocked.
|
|
221
|
+
|
|
222
|
+
'
|
|
223
|
+
- 'Honest QA evaluation in the paper calls the ChatGPT-3.5 API, introducing an external
|
|
224
|
+
API dependency and potential cost if reproduced exactly.
|
|
225
|
+
|
|
226
|
+
'
|
|
227
|
+
- 'All data is CC BY-NC 4.0 (non-commercial only). Model use is further restricted
|
|
228
|
+
by LLaMA, Vicuna, and Gemini license terms. Research use only.
|
|
229
|
+
|
|
230
|
+
'
|
|
231
|
+
recommended_when: 'Use this benchmark when you want to study remote-sensing VLM pretraining
|
|
232
|
+
on large-scale rich-caption datasets, investigate honesty in VLMs using factual/deceptive
|
|
233
|
+
question pairs, or reproduce the full two-stage training and evaluation pipeline.
|
|
234
|
+
Suitable for teams with multi-node GPU infrastructure (≥2 GPUs with ≥48GB VRAM each;
|
|
235
|
+
8–16× A100-80GB recommended), >400 GB free disk space, and willingness to set up
|
|
236
|
+
the external RSEvalKit evaluation environment.
|
|
237
|
+
|
|
238
|
+
'
|
|
239
|
+
not_recommended_when: 'Do not use this for single-GPU smoke tests, quick evaluation-only
|
|
240
|
+
runs without training, or when you need a fully self-contained evaluator bundled
|
|
241
|
+
in the snapshot. Not suitable if you cannot tolerate multi-day training times, require
|
|
242
|
+
commercial-use licensing, lack multi-node GPU infrastructure, or need an executable
|
|
243
|
+
metric anchor without external dependencies.
|
|
244
|
+
|
|
245
|
+
'
|
|
246
|
+
paper:
|
|
247
|
+
title: 'VHM: Versatile and Honest Vision Language Model for Remote Sensing Image
|
|
248
|
+
Analysis'
|
|
249
|
+
venue: AAAI 2025
|
|
250
|
+
year: 2025
|
|
251
|
+
url: https://arxiv.org/abs/2403.20213
|
|
252
|
+
download:
|
|
253
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.043_vhm.zip
|
|
254
|
+
archive_type: zip
|
|
255
|
+
local_dir_name: paper-43-VHM
|
|
256
|
+
provider: github_release
|
|
257
|
+
repo: ResearAI/DeepScientist
|
|
258
|
+
tag: aisb-v0.0.1
|
|
259
|
+
asset_name: aisb.t3.043_vhm.zip
|
|
260
|
+
sha256: 73136beddf7624545dad64ba3818d9c7f5b78915ee52dfa157396f960ddd630f
|
|
261
|
+
size_bytes: 1902143
|
|
262
|
+
commercial:
|
|
263
|
+
annual_fee: null
|
|
264
|
+
display:
|
|
265
|
+
palette_seed: cobalt-emerald-orbit
|
|
266
|
+
art_style: satellite-atlas
|
|
267
|
+
accent_priority: high
|
|
268
|
+
image_path: ../../../AISB/image/043_aisb.t3.043_vhm.jpg
|
|
@@ -0,0 +1,193 @@
|
|
|
1
|
+
id: aisb.t3.043_vhm
|
|
2
|
+
name: VHM
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: 两阶段遥感视觉语言模型训练(VersaD预训练 + 指令SFT),使用外部RSEvalKit对基于Vicuna-7B和CLIP-ViT-L-336px构建的7B模型进行评估。
|
|
5
|
+
task_description: '该基准测试涵盖复现完整的VHM(通用且诚实的视觉语言模型)遥感图像分析流程。模型架构结合了Vicuna-7B、CLIP-ViT-L/14-336px视觉编码器和2层MLP投影器。训练分两个阶段进行:(1)在VersaD数据集上进行预训练(140万对遥感图像-文本对,由Gemini-Vision生成丰富caption),其中对视觉编码器第8层及之后层、投影器和完整LLM进行一个epoch的微调,使用DeepSpeed ZeRO-3在多个节点上运行;(2)在VHM_SFT指令数据集上进行监督微调(SFT)(涵盖VersaD-Instruct、HnstD诚实数据和VariousRS-Instruct任务,包括VQA、视觉定位、场景分类、目标计数、建筑矢量化及多标签分类),仅更新投影器和LLM。下游评估需要在独立的conda环境中克隆并安装外部RSEvalKit仓库,同时下载VHM_Eval数据集(约7.35 GB)。打包的快照包含训练代码、DeepSpeed配置和SLURM启动脚本。评估代码、数据集和模型权重未包含在打包内。打包过程中未执行基准测试;主要指标aid_accuracy因待RSEvalKit设置而处于阻塞状态。
|
|
6
|
+
|
|
7
|
+
'
|
|
8
|
+
task_mode: experiment_driven
|
|
9
|
+
requires_execution: true
|
|
10
|
+
requires_paper: true
|
|
11
|
+
integrity_level: cas_plus_canary
|
|
12
|
+
snapshot_status: external_eval_required
|
|
13
|
+
support_level: recovery
|
|
14
|
+
time_band: 2-4d
|
|
15
|
+
cost_band: very_high
|
|
16
|
+
difficulty: hard
|
|
17
|
+
data_access: public
|
|
18
|
+
primary_outputs:
|
|
19
|
+
- aid_accuracy
|
|
20
|
+
- vhm_sft_checkpoint
|
|
21
|
+
- rseval_report
|
|
22
|
+
launch_profiles:
|
|
23
|
+
- id: train_only
|
|
24
|
+
label: 仅训练
|
|
25
|
+
description: '顺序执行预训练(slurm_pretrain.sh)和SFT(slurm_finetune.sh)阶段。预训练需要VersaD(约140 GB解压后)、LLaVA-1.5 MLP投影器权重、Vicuna-7B和CLIP-ViT-L-336px。SFT需要VHM_SFT(约124 GB解压后)。生成预训练和SFT检查点。跳过评估。最低可在2×48GB GPU上运行(通过梯度累积);论文报告的时间基于16× A100-80GB预训练(约10小时)和8× A100-80GB SFT(约4小时)。
|
|
26
|
+
|
|
27
|
+
'
|
|
28
|
+
- id: paper_faithful
|
|
29
|
+
label: 论文忠实复现
|
|
30
|
+
description: '运行完整流程:预训练、SFT,然后进行RSEvalKit评估。需要将RSEvalKit克隆到独立的conda环境中(rseval)并下载VHM_Eval(约7.35 GB)。生成论文中的所有下游指标:AID场景分类准确率、RSVQA、DIOR-RSVG视觉定位、诚实QA、建筑矢量化及多标签分类。训练最低需要2×48GB GPU;论文报告的时间基于16× A100-80GB预训练和8× A100-80GB SFT。诚实QA评估调用ChatGPT-3.5 API。
|
|
31
|
+
|
|
32
|
+
'
|
|
33
|
+
dataset_download:
|
|
34
|
+
primary_method: mixed
|
|
35
|
+
sources:
|
|
36
|
+
- kind: huggingface
|
|
37
|
+
url: https://huggingface.co/datasets/FitzPC/VHM_VersaD
|
|
38
|
+
access: public
|
|
39
|
+
note: 'VersaD预训练语料库:140万对遥感图像-文本对,包含Gemini-Vision生成的丰富caption,涵盖图像属性、目标特征和场景上下文。解压后约140 GB。来源包括Million-AID(92万)、CrowdAI/SpaceNet(27.6万)、fMoW(8.1万)、CVUSA(4.4万)、CVACT(4.4万)和LoveDA(2.4万)。分辨率范围0.08–153米/像素。
|
|
40
|
+
|
|
41
|
+
'
|
|
42
|
+
- kind: huggingface
|
|
43
|
+
url: https://huggingface.co/datasets/FitzPC/VHM_dataset_sft
|
|
44
|
+
access: public
|
|
45
|
+
note: 'VHM_SFT监督微调指令数据集。涵盖VersaD-Instruct、HnstD事实性和欺骗性问答对以及VariousRS-Instruct任务。解压后约124 GB。
|
|
46
|
+
|
|
47
|
+
'
|
|
48
|
+
- kind: huggingface
|
|
49
|
+
url: https://huggingface.co/FitzPC/vhm_7B
|
|
50
|
+
access: public
|
|
51
|
+
note: '发布的VHM-7B SFT模型权重。可跳过两个训练阶段,直接进行RSEvalKit评估。
|
|
52
|
+
|
|
53
|
+
'
|
|
54
|
+
- kind: huggingface
|
|
55
|
+
url: https://huggingface.co/FitzPC/vhm_7b_pretrain_mlp_llm/tree/main
|
|
56
|
+
access: public
|
|
57
|
+
note: 'VHM预训练阶段的LLM和MLP投影器权重。用于从预训练检查点恢复或初始化,而非从头训练。
|
|
58
|
+
|
|
59
|
+
'
|
|
60
|
+
- kind: huggingface
|
|
61
|
+
url: https://huggingface.co/FitzPC/vhm_7b_pretrain_vit
|
|
62
|
+
access: public
|
|
63
|
+
note: '预训练阶段后的CLIP ViT视觉编码器权重。预训练期间从第8层开始微调。
|
|
64
|
+
|
|
65
|
+
'
|
|
66
|
+
- kind: huggingface
|
|
67
|
+
url: https://huggingface.co/liuhaotian/llava-v1.5-mlp2x-336px-pretrain-vicuna-7b-v1.5/tree/main
|
|
68
|
+
access: public
|
|
69
|
+
note: 'LLaVA-1.5预训练MLP投影器(mm_projector.bin)。预训练阶段必需初始化。
|
|
70
|
+
|
|
71
|
+
'
|
|
72
|
+
- kind: github_repo
|
|
73
|
+
url: https://github.com/fitzpchao/RSEvalKit
|
|
74
|
+
access: public
|
|
75
|
+
note: '遥感视觉语言模型外部评估工具包。必须克隆并在专用conda环境中安装(conda create -n rseval)。所有下游评估指标均在此实现。VHM_Eval数据集下载说明在RSEvalKit docs/Data.md中。
|
|
76
|
+
|
|
77
|
+
'
|
|
78
|
+
notes:
|
|
79
|
+
- '论文忠实复现需要VersaD(约140 GB)、VHM_SFT(约124 GB)、VHM_Eval(约7.35 GB)、基础模型权重(Vicuna-7B、CLIP-ViT-L-336px)和LLaVA MLP投影器。训练检查点和缓存前的综合下载和解压占用空间超过400 GB。
|
|
80
|
+
|
|
81
|
+
'
|
|
82
|
+
- 'VHM_Eval数据托管在外部;请按照RSEvalKit docs/Data.md中的说明进行下载。
|
|
83
|
+
|
|
84
|
+
'
|
|
85
|
+
- '所有数据和模型权重仅限研究使用(CC BY-NC 4.0)。禁止商业使用。模型权重还须遵守LLaMA、Vicuna和Gemini许可条款。
|
|
86
|
+
|
|
87
|
+
'
|
|
88
|
+
credential_requirements:
|
|
89
|
+
mode: none
|
|
90
|
+
items: []
|
|
91
|
+
notes:
|
|
92
|
+
- '下载所列的任何数据集或模型权重均无需API密钥或受限访问凭证。
|
|
93
|
+
|
|
94
|
+
'
|
|
95
|
+
- '论文中的诚实QA评估调用ChatGPT-3.5 API;完全复现需要OpenAI API密钥,但该调用发生在RSEvalKit中,而非训练快照中。
|
|
96
|
+
|
|
97
|
+
'
|
|
98
|
+
resources:
|
|
99
|
+
minimum:
|
|
100
|
+
cpu_cores: 32
|
|
101
|
+
ram_gb: 128
|
|
102
|
+
disk_gb: 400
|
|
103
|
+
gpu_count: 2
|
|
104
|
+
gpu_vram_gb: 48
|
|
105
|
+
gpu_arch: Ampere or newer
|
|
106
|
+
recommended:
|
|
107
|
+
cpu_cores: 64
|
|
108
|
+
ram_gb: 256
|
|
109
|
+
disk_gb: 1200
|
|
110
|
+
gpu_count: 16
|
|
111
|
+
gpu_vram_gb: 80
|
|
112
|
+
gpu_arch: A100
|
|
113
|
+
multi_node: true
|
|
114
|
+
environment:
|
|
115
|
+
python: '3.10'
|
|
116
|
+
cuda: '11.8'
|
|
117
|
+
pytorch: 2.0.1
|
|
118
|
+
flash_attn: 2.3.1.post1
|
|
119
|
+
key_packages:
|
|
120
|
+
- flash-attn==2.3.1.post1
|
|
121
|
+
- deepspeed==0.9.5
|
|
122
|
+
- transformers==4.31.0
|
|
123
|
+
- xformers
|
|
124
|
+
notes:
|
|
125
|
+
- 'requirements.txt固定torch 2.0.1+cu118、flash-attn 2.3.1.post1和deepspeed 0.9.5。使用以下命令创建环境:conda create -n vhm python=3.10 && conda activate vhm && pip install -r requirements.txt。
|
|
126
|
+
|
|
127
|
+
'
|
|
128
|
+
- '训练使用DeepSpeed ZeRO-3(scripts/zero3.json),配合bf16混合精度和梯度检查点。通过torchrun和SLURM进行多节点启动(scripts/rs/slurm_pretrain.sh)。
|
|
129
|
+
|
|
130
|
+
'
|
|
131
|
+
- '三个训练入口点:vhm/train/train.py(基础)、vhm/train/train_mem.py(FlashAttention,默认)、vhm/train/train_xformers.py(xformers注意力,可选)。
|
|
132
|
+
|
|
133
|
+
'
|
|
134
|
+
- '评估需要独立的conda环境(rseval)和RSEvalKit requirements.txt。一个环境不足以支持论文忠实复现路线。
|
|
135
|
+
|
|
136
|
+
'
|
|
137
|
+
- '预训练对视觉编码器第8层及之后层、MLP投影器和完整LLM进行一个epoch的微调。SFT仅微调投影器和LLM。
|
|
138
|
+
|
|
139
|
+
'
|
|
140
|
+
risk_flags:
|
|
141
|
+
- route_caveat
|
|
142
|
+
- external_eval_dependency
|
|
143
|
+
- large_dataset_route
|
|
144
|
+
- noncommercial_license
|
|
145
|
+
- api_dependency
|
|
146
|
+
risk_notes:
|
|
147
|
+
- '论文忠实复现路线跨越三个独立步骤:预训练(slurm_pretrain.sh)、SFT(slurm_finetune.sh)和独立conda环境中的RSEvalKit评估——不是一个自包含的本地命令。
|
|
148
|
+
|
|
149
|
+
'
|
|
150
|
+
- '论文报告的训练时间为16× A100-80GB预训练(约10小时)和8× A100-80GB SFT(约4小时)。在更少或更小的GPU上运行较慢,需要预留数天时间。可通过调整梯度累积步数来权衡时钟时间和减少的GPU数量。
|
|
151
|
+
|
|
152
|
+
'
|
|
153
|
+
- '数据集准备量大:VersaD约140 GB、VHM_SFT约124 GB、VHM_Eval约7.35 GB,加上基础模型权重和生成的检查点。总磁盘占用可能超过1 TB。
|
|
154
|
+
|
|
155
|
+
'
|
|
156
|
+
- '主要评估指标(AID场景分类准确率)依赖于外部RSEvalKit,而非打包的评估器。当前快照中不存在可执行的评估锚点。指标契约将aid_accuracy标记为阻塞状态。
|
|
157
|
+
|
|
158
|
+
'
|
|
159
|
+
- '论文中的诚实QA评估调用ChatGPT-3.5 API,引入外部API依赖性和潜在成本(如需完全复现)。
|
|
160
|
+
|
|
161
|
+
'
|
|
162
|
+
- '所有数据均为CC BY-NC 4.0(仅限非商业使用)。模型使用还受LLaMA、Vicuna和Gemini许可条款限制。仅限研究使用。
|
|
163
|
+
|
|
164
|
+
'
|
|
165
|
+
recommended_when: '当您希望研究基于大规模丰富caption数据集的遥感视觉语言模型预训练、使用事实/欺骗性问答对研究视觉语言模型中的诚实性、或复现完整的两阶段训练和评估流程时使用此基准。适用于拥有多节点GPU基础设施(≥2块GPU,每块≥48GB VRAM;推荐8–16× A100-80GB)、超过400 GB可用磁盘空间且愿意设置外部RSEvalKit评估环境的团队。
|
|
166
|
+
|
|
167
|
+
'
|
|
168
|
+
not_recommended_when: '不要将其用于单GPU冒烟测试、无训练的快速仅评估运行,或需要快照中完全自包含评估器的场景。不适用于无法容忍多日训练时间、需要商业使用许可、缺乏多节点GPU基础设施、或需要无外部依赖的可执行指标锚点的场景。
|
|
169
|
+
|
|
170
|
+
'
|
|
171
|
+
paper:
|
|
172
|
+
title: 'VHM: Versatile and Honest Vision Language Model for Remote Sensing Image
|
|
173
|
+
Analysis'
|
|
174
|
+
venue: AAAI 2025
|
|
175
|
+
year: 2025
|
|
176
|
+
url: https://arxiv.org/abs/2403.20213
|
|
177
|
+
download:
|
|
178
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.043_vhm.zip
|
|
179
|
+
archive_type: zip
|
|
180
|
+
local_dir_name: paper-43-VHM
|
|
181
|
+
provider: github_release
|
|
182
|
+
repo: ResearAI/DeepScientist
|
|
183
|
+
tag: aisb-v0.0.1
|
|
184
|
+
asset_name: aisb.t3.043_vhm.zip
|
|
185
|
+
sha256: 73136beddf7624545dad64ba3818d9c7f5b78915ee52dfa157396f960ddd630f
|
|
186
|
+
size_bytes: 1902143
|
|
187
|
+
commercial:
|
|
188
|
+
annual_fee: null
|
|
189
|
+
display:
|
|
190
|
+
palette_seed: cobalt-emerald-orbit
|
|
191
|
+
art_style: satellite-atlas
|
|
192
|
+
accent_priority: high
|
|
193
|
+
image_path: ../../../AISB/image/043_aisb.t3.043_vhm.jpg
|