@researai/deepscientist 1.5.16 → 1.6.0
This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between those package versions as they appear in their respective public registries.
- package/AGENTS.md +309 -130
- package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
- package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
- package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
- package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
- package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
- package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
- package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
- package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
- package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
- package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
- package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
- package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
- package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
- package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
- package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
- package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
- package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
- package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
- package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
- package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
- package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
- package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
- package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
- package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
- package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
- package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
- package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
- package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
- package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
- package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
- package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
- package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
- package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
- package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
- package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
- package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
- package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
- package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
- package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
- package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
- package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
- package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
- package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
- package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
- package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
- package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
- package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
- package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
- package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
- package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
- package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
- package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
- package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
- package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
- package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
- package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
- package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
- package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
- package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
- package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
- package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
- package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
- package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
- package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
- package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
- package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
- package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
- package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
- package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
- package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
- package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
- package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
- package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
- package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
- package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
- package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
- package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
- package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
- package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
- package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
- package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
- package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
- package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
- package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
- package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
- package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
- package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
- package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
- package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
- package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
- package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
- package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
- package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
- package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
- package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
- package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
- package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
- package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
- package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
- package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
- package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
- package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
- package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
- package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
- package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
- package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
- package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
- package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
- package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
- package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
- package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
- package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
- package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
- package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
- package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
- package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
- package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
- package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
- package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
- package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
- package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
- package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
- package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
- package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
- package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
- package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
- package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
- package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
- package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
- package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
- package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
- package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
- package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
- package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
- package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
- package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
- package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
- package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
- package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
- package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
- package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
- package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
- package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
- package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
- package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
- package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
- package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
- package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
- package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
- package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
- package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
- package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
- package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
- package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
- package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
- package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
- package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
- package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
- package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
- package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
- package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
- package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
- package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
- package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
- package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
- package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
- package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
- package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
- package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
- package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
- package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
- package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
- package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
- package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
- package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
- package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
- package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
- package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
- package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
- package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
- package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
- package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
- package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
- package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
- package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
- package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
- package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
- package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
- package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
- package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
- package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
- package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
- package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
- package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
- package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
- package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
- package/AISB/image/aisb.b10.climate_earth.svg +16 -0
- package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
- package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
- package/AISB/image/aisb.b2.agent_systems.svg +16 -0
- package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
- package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
- package/AISB/image/aisb.b5.math_proof.svg +16 -0
- package/AISB/image/aisb.b6.research_process.svg +16 -0
- package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
- package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
- package/AISB/image/aisb.b9.material_science.svg +16 -0
- package/README.md +196 -32
- package/bin/ds.js +924 -66
- package/docs/en/00_QUICK_START.md +195 -18
- package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
- package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
- package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
- package/docs/en/05_TUI_GUIDE.md +171 -2
- package/docs/en/07_MEMORY_AND_MCP.md +38 -2
- package/docs/en/09_DOCTOR.md +78 -7
- package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
- package/docs/en/11_LICENSE_AND_RISK.md +4 -0
- package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/en/15_CODEX_PROVIDER_SETUP.md +624 -180
- package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +386 -0
- package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
- package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
- package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
- package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
- package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
- package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
- package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
- package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
- package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
- package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
- package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
- package/docs/en/91_DEVELOPMENT.md +266 -0
- package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
- package/docs/en/README.md +48 -7
- package/docs/images/admin/admin-connectors-health-en.png +0 -0
- package/docs/images/admin/admin-controllers-en.png +0 -0
- package/docs/images/admin/admin-diagnostics-en.png +0 -0
- package/docs/images/admin/admin-errors-en.png +0 -0
- package/docs/images/admin/admin-issues-en.png +0 -0
- package/docs/images/admin/admin-logs-en.png +0 -0
- package/docs/images/admin/admin-quest-detail-en.png +0 -0
- package/docs/images/admin/admin-quests-en.png +0 -0
- package/docs/images/admin/admin-repairs-en.png +0 -0
- package/docs/images/admin/admin-runtime-en.png +0 -0
- package/docs/images/admin/admin-search-en.png +0 -0
- package/docs/images/admin/admin-stats-en.png +0 -0
- package/docs/images/admin/admin-summary-en.png +0 -0
- package/docs/images/connectors/connector-discord-en.png +0 -0
- package/docs/images/connectors/connector-feishu-en.png +0 -0
- package/docs/images/connectors/connector-lingzhu-en.png +0 -0
- package/docs/images/connectors/connector-qq-en.png +0 -0
- package/docs/images/connectors/connector-slack-en.png +0 -0
- package/docs/images/connectors/connector-telegram-en.png +0 -0
- package/docs/images/connectors/connector-weixin-en.png +0 -0
- package/docs/images/connectors/connector-whatsapp-en.png +0 -0
- package/docs/images/settings/settings-baselines-en.png +0 -0
- package/docs/images/settings/settings-config-en.png +0 -0
- package/docs/images/settings/settings-connectors-overview-en.png +0 -0
- package/docs/images/settings/settings-deepxiv-en.png +0 -0
- package/docs/images/settings/settings-mcp-servers-en.png +0 -0
- package/docs/images/settings/settings-plugins-en.png +0 -0
- package/docs/images/settings/settings-runners-en.png +0 -0
- package/docs/zh/00_QUICK_START.md +142 -18
- package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
- package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/zh/05_TUI_GUIDE.md +171 -2
- package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
- package/docs/zh/09_DOCTOR.md +54 -8
- package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
- package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
- package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/zh/15_CODEX_PROVIDER_SETUP.md +552 -181
- package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +384 -0
- package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
- package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
- package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
- package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
- package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
- package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
- package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
- package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
- package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
- package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
- package/docs/zh/README.md +33 -7
- package/install.sh +168 -20
- package/package.json +5 -1
- package/pyproject.toml +2 -1
- package/src/deepscientist/__init__.py +1 -1
- package/src/deepscientist/acp/envelope.py +13 -0
- package/src/deepscientist/admin/__init__.py +3 -0
- package/src/deepscientist/admin/charts.py +681 -0
- package/src/deepscientist/admin/logs.py +119 -0
- package/src/deepscientist/admin/repairs.py +217 -0
- package/src/deepscientist/admin/service.py +1310 -0
- package/src/deepscientist/admin/system_info.py +700 -0
- package/src/deepscientist/admin/tasks.py +465 -0
- package/src/deepscientist/admin/tool_metrics.py +600 -0
- package/src/deepscientist/artifact/guidance.py +8 -4
- package/src/deepscientist/artifact/schemas.py +115 -0
- package/src/deepscientist/artifact/service.py +4268 -260
- package/src/deepscientist/bash_exec/monitor.py +30 -3
- package/src/deepscientist/bash_exec/service.py +134 -1
- package/src/deepscientist/benchstore/__init__.py +4 -0
- package/src/deepscientist/benchstore/prompt_builder.py +224 -0
- package/src/deepscientist/benchstore/service.py +1716 -0
- package/src/deepscientist/bridges/connectors.py +8 -2
- package/src/deepscientist/channels/weixin_ilink.py +8 -1
- package/src/deepscientist/cli.py +92 -17
- package/src/deepscientist/codex_cli_compat.py +187 -74
- package/src/deepscientist/config/models.py +82 -11
- package/src/deepscientist/config/service.py +1077 -93
- package/src/deepscientist/connector/weixin_support.py +48 -17
- package/src/deepscientist/daemon/api/handlers.py +827 -235
- package/src/deepscientist/daemon/api/router.py +81 -1
- package/src/deepscientist/daemon/app.py +1512 -85
- package/src/deepscientist/diagnostics/__init__.py +6 -0
- package/src/deepscientist/diagnostics/runner_failures.py +277 -0
- package/src/deepscientist/doctor.py +407 -56
- package/src/deepscientist/evidence_packets.py +590 -0
- package/src/deepscientist/home.py +52 -4
- package/src/deepscientist/kimi_cli_compat.py +50 -0
- package/src/deepscientist/latex_runtime.py +2 -2
- package/src/deepscientist/mcp/context.py +2 -0
- package/src/deepscientist/mcp/schemas.py +114 -0
- package/src/deepscientist/mcp/server.py +1566 -126
- package/src/deepscientist/memory/service.py +203 -16
- package/src/deepscientist/process_control.py +8 -1
- package/src/deepscientist/prompts/builder.py +850 -88
- package/src/deepscientist/quest/__init__.py +2 -2
- package/src/deepscientist/quest/layout.py +12 -1
- package/src/deepscientist/quest/node_traces.py +10 -0
- package/src/deepscientist/quest/service.py +1852 -161
- package/src/deepscientist/quest/stage_views.py +1 -1
- package/src/deepscientist/runners/__init__.py +18 -0
- package/src/deepscientist/runners/base.py +89 -1
- package/src/deepscientist/runners/builtins.py +13 -1
- package/src/deepscientist/runners/claude.py +391 -0
- package/src/deepscientist/runners/codex.py +480 -35
- package/src/deepscientist/runners/codex_telemetry.py +127 -0
- package/src/deepscientist/runners/kimi.py +334 -0
- package/src/deepscientist/runners/metadata.py +68 -0
- package/src/deepscientist/runners/opencode.py +414 -0
- package/src/deepscientist/runners/runtime_overrides.py +100 -0
- package/src/deepscientist/runners/simple_cli.py +538 -0
- package/src/deepscientist/runtime_storage.py +303 -0
- package/src/deepscientist/shared.py +80 -16
- package/src/deepscientist/skills/installer.py +37 -0
- package/src/deepscientist/skills/registry.py +2 -0
- package/src/deepscientist/tinytex.py +2 -2
- package/src/deepscientist/tui.py +10 -3
- package/src/prompts/benchstore/system.md +77 -0
- package/src/prompts/connectors/qq.md +33 -2
- package/src/prompts/connectors/weixin.md +208 -23
- package/src/prompts/contracts/admin_ops.md +74 -0
- package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
- package/src/prompts/contracts/shared_interaction.md +5 -10
- package/src/prompts/start_setup/system.md +422 -0
- package/src/prompts/system.md +411 -304
- package/src/prompts/system_copilot.md +89 -0
- package/src/skills/analysis-campaign/SKILL.md +239 -578
- package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
- package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
- package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
- package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
- package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
- package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
- package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
- package/src/skills/baseline/SKILL.md +183 -461
- package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
- package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
- package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
- package/src/skills/baseline/references/baseline-plan-template.md +37 -76
- package/src/skills/baseline/references/boundary-cases.md +86 -0
- package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
- package/src/skills/baseline/references/comparability-contract.md +7 -12
- package/src/skills/baseline/references/operational-guidance.md +56 -0
- package/src/skills/baseline/references/route-selection.md +5 -25
- package/src/skills/decision/SKILL.md +113 -306
- package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
- package/src/skills/decision/references/operational-guidance.md +94 -0
- package/src/skills/decision/references/research-route-criteria.md +7 -8
- package/src/skills/decision/references/strategic-decision-template.md +13 -26
- package/src/skills/experiment/SKILL.md +132 -670
- package/src/skills/experiment/references/execution-playbook.md +374 -0
- package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
- package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
- package/src/skills/experiment/references/operational-guidance.md +108 -0
- package/src/skills/finalize/SKILL.md +62 -0
- package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
- package/src/skills/finalize/references/resume-packet-template.md +7 -0
- package/src/skills/idea/SKILL.md +228 -15
- package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
- package/src/skills/idea/references/current-board-packet-template.md +61 -0
- package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
- package/src/skills/idea/references/idea-generation-playbook.md +21 -0
- package/src/skills/idea/references/idea-thinking-flow.md +6 -0
- package/src/skills/idea/references/literature-survey-template.md +3 -0
- package/src/skills/idea/references/objective-contract-template.md +54 -0
- package/src/skills/idea/references/outline-seeding-example.md +56 -0
- package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
- package/src/skills/idea/references/related-work-playbook.md +75 -2
- package/src/skills/idea/references/research-history-playbook.md +114 -0
- package/src/skills/idea/references/selection-gate.md +58 -6
- package/src/skills/intake-audit/SKILL.md +43 -2
- package/src/skills/intake-audit/references/state-audit-template.md +10 -0
- package/src/skills/nature-data/SKILL.md +128 -0
- package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-data/agents/openai.yaml +4 -0
- package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
- package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
- package/src/skills/nature-data/references/policy-principles.md +103 -0
- package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
- package/src/skills/nature-data/references/source-basis.md +54 -0
- package/src/skills/nature-data/references/statement-patterns.md +153 -0
- package/src/skills/nature-figure/SKILL.md +197 -0
- package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-figure/agents/openai.yaml +4 -0
- package/src/skills/nature-figure/evals/evals.json +37 -0
- package/src/skills/nature-figure/references/api.md +428 -0
- package/src/skills/nature-figure/references/backend-selection.md +100 -0
- package/src/skills/nature-figure/references/chart-types.md +281 -0
- package/src/skills/nature-figure/references/common-patterns.md +349 -0
- package/src/skills/nature-figure/references/design-theory.md +436 -0
- package/src/skills/nature-figure/references/figure-contract.md +93 -0
- package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
- package/src/skills/nature-figure/references/qa-contract.md +119 -0
- package/src/skills/nature-figure/references/r-template-index.md +66 -0
- package/src/skills/nature-figure/references/r-workflow.md +161 -0
- package/src/skills/nature-figure/references/tutorials.md +250 -0
- package/src/skills/nature-paper2ppt/SKILL.md +507 -0
- package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/SKILL.md +385 -0
- package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-polishing/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
- package/src/skills/nature-polishing/references/section-moves.md +240 -0
- package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
- package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
- package/src/skills/optimize/SKILL.md +177 -1568
- package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
- package/src/skills/optimize/references/candidate-board-template.md +13 -0
- package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
- package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
- package/src/skills/optimize/references/debug-response-template.md +29 -0
- package/src/skills/optimize/references/frontier-review-template.md +32 -0
- package/src/skills/optimize/references/fusion-playbook.md +36 -0
- package/src/skills/optimize/references/method-brief-template.md +73 -0
- package/src/skills/optimize/references/operational-guidance.md +621 -0
- package/src/skills/optimize/references/optimization-memory-template.md +30 -0
- package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
- package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
- package/src/skills/optimize/references/prompt-patterns.md +49 -0
- package/src/skills/paper-outline/SKILL.md +227 -0
- package/src/skills/paper-outline/references/outline-patterns.md +87 -0
- package/src/skills/paper-plot/SKILL.md +79 -0
- package/src/skills/paper-plot/agents/openai.yaml +4 -0
- package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
- package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
- package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
- package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
- package/src/skills/paper-plot/references/line_training_curve.md +44 -0
- package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
- package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
- package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
- package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
- package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
- package/src/skills/paper-plot/scripts/line_aime.py +94 -0
- package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
- package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
- package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
- package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
- package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
- package/src/skills/rebuttal/SKILL.md +9 -0
- package/src/skills/references/tool-usage-by-stage.md +438 -0
- package/src/skills/review/SKILL.md +105 -7
- package/src/skills/science/PROVENANCE.md +44 -0
- package/src/skills/science/SKILL.md +137 -0
- package/src/skills/science/references/artifact-science-tool.md +110 -0
- package/src/skills/science/references/claim-type-discipline.md +56 -0
- package/src/skills/science/references/domain-index.md +422 -0
- package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
- package/src/skills/science/references/package-check-playbook.md +64 -0
- package/src/skills/science/references/package-index.min.json +3616 -0
- package/src/skills/science/references/packages/abinit.md +80 -0
- package/src/skills/science/references/packages/acts.md +73 -0
- package/src/skills/science/references/packages/aiida-core.md +80 -0
- package/src/skills/science/references/packages/alamode.md +80 -0
- package/src/skills/science/references/packages/amuse.md +88 -0
- package/src/skills/science/references/packages/anndata.md +88 -0
- package/src/skills/science/references/packages/arbor.md +80 -0
- package/src/skills/science/references/packages/arc.md +73 -0
- package/src/skills/science/references/packages/astropy.md +88 -0
- package/src/skills/science/references/packages/astroquery.md +88 -0
- package/src/skills/science/references/packages/atomate2.md +80 -0
- package/src/skills/science/references/packages/atomsmltr.md +73 -0
- package/src/skills/science/references/packages/awkward.md +73 -0
- package/src/skills/science/references/packages/batman.md +88 -0
- package/src/skills/science/references/packages/biopython.md +88 -0
- package/src/skills/science/references/packages/bloqade.md +73 -0
- package/src/skills/science/references/packages/brian2.md +73 -0
- package/src/skills/science/references/packages/bullet3.md +73 -0
- package/src/skills/science/references/packages/calculix.md +80 -0
- package/src/skills/science/references/packages/cantera.md +73 -0
- package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
- package/src/skills/science/references/packages/ccdproc.md +88 -0
- package/src/skills/science/references/packages/celerite2.md +88 -0
- package/src/skills/science/references/packages/cellrank.md +73 -0
- package/src/skills/science/references/packages/cesm.md +80 -0
- package/src/skills/science/references/packages/chemicals.md +73 -0
- package/src/skills/science/references/packages/chempy.md +73 -0
- package/src/skills/science/references/packages/cirq.md +73 -0
- package/src/skills/science/references/packages/coffea.md +73 -0
- package/src/skills/science/references/packages/cp2k.md +88 -0
- package/src/skills/science/references/packages/custodian.md +80 -0
- package/src/skills/science/references/packages/dart.md +73 -0
- package/src/skills/science/references/packages/datamol.md +88 -0
- package/src/skills/science/references/packages/dd4hep.md +73 -0
- package/src/skills/science/references/packages/dealii.md +80 -0
- package/src/skills/science/references/packages/deepchem.md +88 -0
- package/src/skills/science/references/packages/delphes.md +73 -0
- package/src/skills/science/references/packages/devito.md +80 -0
- package/src/skills/science/references/packages/dftb.md +88 -0
- package/src/skills/science/references/packages/dftd4.md +88 -0
- package/src/skills/science/references/packages/dftk-jl.md +80 -0
- package/src/skills/science/references/packages/dolfinx.md +80 -0
- package/src/skills/science/references/packages/drake.md +73 -0
- package/src/skills/science/references/packages/dumux.md +73 -0
- package/src/skills/science/references/packages/elk.md +80 -0
- package/src/skills/science/references/packages/elmerfem.md +80 -0
- package/src/skills/science/references/packages/enzo-e.md +88 -0
- package/src/skills/science/references/packages/espresso.md +80 -0
- package/src/skills/science/references/packages/exoplanet.md +88 -0
- package/src/skills/science/references/packages/fairroot.md +73 -0
- package/src/skills/science/references/packages/fbpic.md +80 -0
- package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
- package/src/skills/science/references/packages/geant4.md +73 -0
- package/src/skills/science/references/packages/geosx.md +80 -0
- package/src/skills/science/references/packages/gprmax.md +80 -0
- package/src/skills/science/references/packages/gromacs.md +80 -0
- package/src/skills/science/references/packages/gwaslab.md +73 -0
- package/src/skills/science/references/packages/gz-sim.md +73 -0
- package/src/skills/science/references/packages/hail.md +88 -0
- package/src/skills/science/references/packages/hiphive.md +80 -0
- package/src/skills/science/references/packages/hoomd-blue.md +80 -0
- package/src/skills/science/references/packages/itensor.md +73 -0
- package/src/skills/science/references/packages/itensors-jl.md +73 -0
- package/src/skills/science/references/packages/jdftx.md +73 -0
- package/src/skills/science/references/packages/jobflow.md +80 -0
- package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
- package/src/skills/science/references/packages/kite.md +80 -0
- package/src/skills/science/references/packages/kratos.md +80 -0
- package/src/skills/science/references/packages/kwant.md +73 -0
- package/src/skills/science/references/packages/lammps.md +80 -0
- package/src/skills/science/references/packages/lightkurve.md +88 -0
- package/src/skills/science/references/packages/limix.md +73 -0
- package/src/skills/science/references/packages/maxwelllink.md +80 -0
- package/src/skills/science/references/packages/mcdc.md +73 -0
- package/src/skills/science/references/packages/meep.md +80 -0
- package/src/skills/science/references/packages/mfem.md +80 -0
- package/src/skills/science/references/packages/mitgcm.md +73 -0
- package/src/skills/science/references/packages/modflow6.md +73 -0
- package/src/skills/science/references/packages/molecool.md +73 -0
- package/src/skills/science/references/packages/mom6.md +73 -0
- package/src/skills/science/references/packages/moose.md +80 -0
- package/src/skills/science/references/packages/mpas-model.md +73 -0
- package/src/skills/science/references/packages/mujoco.md +73 -0
- package/src/skills/science/references/packages/mumax3.md +73 -0
- package/src/skills/science/references/packages/nekrs.md +80 -0
- package/src/skills/science/references/packages/nessi.md +73 -0
- package/src/skills/science/references/packages/nest-simulator.md +73 -0
- package/src/skills/science/references/packages/netket.md +73 -0
- package/src/skills/science/references/packages/neuron.md +73 -0
- package/src/skills/science/references/packages/nextflow.md +88 -0
- package/src/skills/science/references/packages/nwchem.md +88 -0
- package/src/skills/science/references/packages/openbabel.md +88 -0
- package/src/skills/science/references/packages/openems.md +80 -0
- package/src/skills/science/references/packages/openff-toolkit.md +88 -0
- package/src/skills/science/references/packages/openfoam-dev.md +80 -0
- package/src/skills/science/references/packages/openmc.md +73 -0
- package/src/skills/science/references/packages/openmm.md +80 -0
- package/src/skills/science/references/packages/openmoc.md +73 -0
- package/src/skills/science/references/packages/openmx.md +80 -0
- package/src/skills/science/references/packages/opensees.md +80 -0
- package/src/skills/science/references/packages/opensn.md +80 -0
- package/src/skills/science/references/packages/opm-simulators.md +73 -0
- package/src/skills/science/references/packages/oqupy.md +73 -0
- package/src/skills/science/references/packages/packmol.md +80 -0
- package/src/skills/science/references/packages/palabos.md +80 -0
- package/src/skills/science/references/packages/parflow.md +80 -0
- package/src/skills/science/references/packages/pennylane.md +88 -0
- package/src/skills/science/references/packages/perceval.md +73 -0
- package/src/skills/science/references/packages/phono3py.md +73 -0
- package/src/skills/science/references/packages/phonopy.md +73 -0
- package/src/skills/science/references/packages/photutils.md +88 -0
- package/src/skills/science/references/packages/picongpu.md +80 -0
- package/src/skills/science/references/packages/plink-ng.md +88 -0
- package/src/skills/science/references/packages/precice.md +73 -0
- package/src/skills/science/references/packages/psc.md +80 -0
- package/src/skills/science/references/packages/psi4.md +88 -0
- package/src/skills/science/references/packages/pybinding.md +73 -0
- package/src/skills/science/references/packages/pyfr.md +80 -0
- package/src/skills/science/references/packages/pyhf.md +73 -0
- package/src/skills/science/references/packages/pyiron_base.md +80 -0
- package/src/skills/science/references/packages/pylcp.md +73 -0
- package/src/skills/science/references/packages/pylith.md +80 -0
- package/src/skills/science/references/packages/pynbody.md +88 -0
- package/src/skills/science/references/packages/pysam.md +88 -0
- package/src/skills/science/references/packages/pyscf.md +88 -0
- package/src/skills/science/references/packages/q-e.md +73 -0
- package/src/skills/science/references/packages/qibo.md +73 -0
- package/src/skills/science/references/packages/qiskit.md +73 -0
- package/src/skills/science/references/packages/quantica-jl.md +73 -0
- package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
- package/src/skills/science/references/packages/quimb.md +73 -0
- package/src/skills/science/references/packages/qulacs.md +73 -0
- package/src/skills/science/references/packages/qutip.md +73 -0
- package/src/skills/science/references/packages/rdkit.md +88 -0
- package/src/skills/science/references/packages/rmg-py.md +73 -0
- package/src/skills/science/references/packages/root.md +73 -0
- package/src/skills/science/references/packages/scanpy.md +88 -0
- package/src/skills/science/references/packages/scikit-allel.md +88 -0
- package/src/skills/science/references/packages/scikit-bio.md +88 -0
- package/src/skills/science/references/packages/scqubits.md +73 -0
- package/src/skills/science/references/packages/scuff-em.md +80 -0
- package/src/skills/science/references/packages/scvi-tools.md +73 -0
- package/src/skills/science/references/packages/seissol.md +73 -0
- package/src/skills/science/references/packages/sfepy.md +80 -0
- package/src/skills/science/references/packages/sisl.md +73 -0
- package/src/skills/science/references/packages/smilei.md +80 -0
- package/src/skills/science/references/packages/snakemake.md +88 -0
- package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
- package/src/skills/science/references/packages/specutils.md +88 -0
- package/src/skills/science/references/packages/spglib.md +80 -0
- package/src/skills/science/references/packages/squidpy.md +88 -0
- package/src/skills/science/references/packages/starry.md +88 -0
- package/src/skills/science/references/packages/strawberryfields.md +73 -0
- package/src/skills/science/references/packages/su2.md +80 -0
- package/src/skills/science/references/packages/sunny-jl.md +73 -0
- package/src/skills/science/references/packages/sw4.md +73 -0
- package/src/skills/science/references/packages/swift.md +88 -0
- package/src/skills/science/references/packages/tdnegf.md +73 -0
- package/src/skills/science/references/packages/tenpy.md +73 -0
- package/src/skills/science/references/packages/thermo.md +73 -0
- package/src/skills/science/references/packages/tkwant.md +73 -0
- package/src/skills/science/references/packages/tvb-root.md +73 -0
- package/src/skills/science/references/packages/uproot5.md +73 -0
- package/src/skills/science/references/packages/vampire.md +80 -0
- package/src/skills/science/references/packages/wannier_tools.md +73 -0
- package/src/skills/science/references/packages/warpx.md +80 -0
- package/src/skills/science/references/packages/wrf.md +73 -0
- package/src/skills/science/references/packages/xtb.md +88 -0
- package/src/skills/science/references/packages/yt.md +73 -0
- package/src/skills/science/references/science-task-brief-template.md +71 -0
- package/src/skills/scout/SKILL.md +83 -425
- package/src/skills/scout/references/literature-scout-template.md +5 -24
- package/src/skills/scout/references/operational-guidance.md +191 -0
- package/src/skills/scout/references/paper-triage-playbook.md +11 -35
- package/src/skills/write/SKILL.md +744 -1246
- package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
- package/src/skills/write/references/oral_package_patterns.md +252 -0
- package/src/skills/write/references/oral_writing_principles.md +291 -0
- package/src/skills/write/references/section_rewrite_checklist.md +234 -0
- package/src/tui/dist/app/AppContainer.js +1314 -27
- package/src/tui/dist/components/Composer.js +26 -1
- package/src/tui/dist/components/ConfigScreen.js +2 -1
- package/src/tui/dist/components/InputPrompt.js +25 -9
- package/src/tui/dist/components/MainContent.js +18 -3
- package/src/tui/dist/components/QuestScreen.js +3 -2
- package/src/tui/dist/components/UtilityScreen.js +37 -0
- package/src/tui/dist/hooks/useSafeInput.js +10 -0
- package/src/tui/dist/index.js +13 -1
- package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
- package/src/tui/dist/lib/api.js +89 -1
- package/src/tui/package.json +1 -1
- package/src/ui/dist/assets/{AnalysisPlugin-DnSm0GZn.js → AnalysisPlugin-CA94NGmI.js} +1 -1
- package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
- package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
- package/src/ui/dist/assets/{CodeViewerPlugin-itb0tltR.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
- package/src/ui/dist/assets/{DocViewerPlugin-DqKkiCI6.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
- package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
- package/src/ui/dist/assets/{GitDiffViewerPlugin-DxL2ezFG.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
- package/src/ui/dist/assets/{GitSnapshotViewer-B_RQm1YZ.js → GitSnapshotViewer-CweA6VON.js} +2 -2
- package/src/ui/dist/assets/{ImageViewerPlugin-tHqlXY3n.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
- package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
- package/src/ui/dist/assets/{LatexPlugin-B495DTXC.js → LatexPlugin-BQjAaA5J.js} +4 -4
- package/src/ui/dist/assets/{MarkdownViewerPlugin-DG28-61B.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
- package/src/ui/dist/assets/{MarketplacePlugin-BiOGT-Kj.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
- package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
- package/src/ui/dist/assets/{NotebookEditor-CVsj8h_T.js → NotebookEditor-WFyd8Ybt.js} +23 -23
- package/src/ui/dist/assets/{PdfLoader-CASDQmxJ.js → PdfLoader-CLE5u5TS.js} +3 -3
- package/src/ui/dist/assets/{PdfMarkdownPlugin-BFhwoKsY.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
- package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
- package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
- package/src/ui/dist/assets/{TextViewerPlugin-CB4DYfWO.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
- package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
- package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
- package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
- package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
- package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
- package/src/ui/dist/assets/{code-DLC6G24T.js → code-DbsmSd3Y.js} +1 -1
- package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
- package/src/ui/dist/assets/{wrap-text-CwMn-iqb.js → file-jump-queue-DeQBikaw.js} +3 -3
- package/src/ui/dist/assets/{file-socket-Cu4Qln7Y.js → file-socket-DA5XIx88.js} +1 -1
- package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
- package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
- package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
- package/src/ui/dist/assets/{index-wQ7RIIRd.js → index-BsO46tJA.js} +1 -1
- package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
- package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
- package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
- package/src/ui/dist/assets/{project-sync-CsX08Qno.js → project-sync-DPmWKmKD.js} +1 -1
- package/src/ui/dist/assets/{zoom-out-R-GWEhzS.js → zoom-out-DAukFWen.js} +3 -3
- package/src/ui/dist/index.html +3 -3
- package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
- package/src/skills/baseline/references/memory-playbook.md +0 -40
- package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
- package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
- package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
- package/src/skills/write/references/paper-section-playbook.md +0 -64
- package/src/skills/write/references/reviewer-first-writing.md +0 -64
- package/src/skills/write/references/revision-checklist.md +0 -70
- package/src/skills/write/references/section-contracts.md +0 -82
- package/src/skills/write/references/sentence-level-proofing.md +0 -49
- package/src/ui/dist/assets/AiManusChatView-COFACy7V.js +0 -204
- package/src/ui/dist/assets/CliPlugin-CvwCmDQ5.js +0 -109
- package/src/ui/dist/assets/CodeEditorPlugin-cOqSa0xq.js +0 -2
- package/src/ui/dist/assets/GitCommitViewerPlugin-DVgNHBCS.js +0 -1
- package/src/ui/dist/assets/LabCopilotPanel-ClMbq5Yu.js +0 -14
- package/src/ui/dist/assets/LabPlugin-L_SuE8ow.js +0 -22
- package/src/ui/dist/assets/NotebookEditor-C-4Kt1p9.js +0 -81
- package/src/ui/dist/assets/PdfViewerPlugin-DcOzU9vd.js +0 -17
- package/src/ui/dist/assets/SearchPlugin-CHj7M58O.js +0 -16
- package/src/ui/dist/assets/VNCViewer-CjlbyCB3.js +0 -11
- package/src/ui/dist/assets/bot-CFkZY-JP.js +0 -6
- package/src/ui/dist/assets/chevron-up-Dq5ofbht.js +0 -6
- package/src/ui/dist/assets/file-content-Dv4LoZec.js +0 -1
- package/src/ui/dist/assets/file-diff-panel-Denq-lC3.js +0 -1
- package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
- package/src/ui/dist/assets/git-commit-horizontal-BUh6G52n.js +0 -6
- package/src/ui/dist/assets/image-B9HUUddG.js +0 -6
- package/src/ui/dist/assets/index-B2B1sg-M.js +0 -1
- package/src/ui/dist/assets/index-Cgla8biy.css +0 -33
- package/src/ui/dist/assets/index-DRyx7vAc.js +0 -1
- package/src/ui/dist/assets/index-Gbl53BNp.js +0 -2496
- package/src/ui/dist/assets/pdf-effect-queue-ZtnHFCAi.js +0 -6
- package/src/ui/dist/assets/popover-DL6h35vr.js +0 -1
- package/src/ui/dist/assets/select-DvmXt1yY.js +0 -11
- package/src/ui/dist/assets/sigma-7jpXazui.js +0 -6
- package/src/ui/dist/assets/trash-xA7kFt8i.js +0 -11
- package/src/ui/dist/assets/useCliAccess-DsMwDjOp.js +0 -1
- package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
|
@@ -0,0 +1,224 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.070_certifiedunlearning
|
|
3
|
+
name: Certified Unlearning for Neural Networks
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: Certified machine unlearning via privacy amplification by noisy fine-tuning,
|
|
6
|
+
with provable (ε,δ)-guarantees and no loss-function assumptions.
|
|
7
|
+
task_description: 'This packaged benchmark implements and evaluates certified machine
|
|
8
|
+
unlearning for neural networks (ICML 2025). The core task is to remove the influence
|
|
9
|
+
of a specified forget set from a trained model while preserving utility on the retain
|
|
10
|
+
set, subject to formal (ε,δ)-unlearning guarantees. The method—Privacy Amplification
|
|
11
|
+
by Iteration (PABI)—treats each noisy fine-tuning step on the retain data as a stochastic
|
|
12
|
+
post-processing operation, progressively amplifying privacy without accessing the
|
|
13
|
+
forget data. It imposes no smoothness or convexity assumptions on the loss function,
|
|
14
|
+
making it applicable to arbitrary deep networks. Four methods are benchmarked: PABI
|
|
15
|
+
(gradient clipping), DP-SGD with group privacy, Contractive Coefficients (model
|
|
16
|
+
clipping), and DP-Baseline (output perturbation), alongside full Retrain. Experiments
|
|
17
|
+
cover CIFAR-10, CIFAR-100, and MNIST across four figure-level ablations: privacy
|
|
18
|
+
budget curves, convergence curves, DP-SGD comparisons, and ε-sweep analysis. The
|
|
19
|
+
primary efficiency metric is epochs_to_50pct_val_acc measured during the unlearning
|
|
20
|
+
phase. The framework uses JAX/Flax for all training and unlearning logic; feature
|
|
21
|
+
extraction uses a ResNet-18 backbone. Multi-GPU execution is supported via run_exp.py.
|
|
22
|
+
No benchmark execution was performed during this packaging pass—runtime validation
|
|
23
|
+
is required before trusting metric values.
|
|
24
|
+
|
|
25
|
+
'
|
|
26
|
+
capability_tags:
|
|
27
|
+
- machine_unlearning
|
|
28
|
+
- certified_privacy
|
|
29
|
+
- differential_privacy
|
|
30
|
+
- privacy_amplification
|
|
31
|
+
- neural_networks
|
|
32
|
+
- research_code_optimization
|
|
33
|
+
aisb_direction: T3
|
|
34
|
+
track_fit:
|
|
35
|
+
- paper_track
|
|
36
|
+
- benchmark_track
|
|
37
|
+
task_mode: experiment_driven
|
|
38
|
+
requires_execution: true
|
|
39
|
+
requires_paper: true
|
|
40
|
+
integrity_level: cas_plus_canary
|
|
41
|
+
snapshot_status: runnable
|
|
42
|
+
support_level: advanced
|
|
43
|
+
time_band: 6-24h
|
|
44
|
+
cost_band: medium
|
|
45
|
+
difficulty: hard
|
|
46
|
+
data_access: public
|
|
47
|
+
primary_outputs:
|
|
48
|
+
- epochs_to_50pct_val_acc
|
|
49
|
+
- epochs_to_45pct_val_acc
|
|
50
|
+
- epochs_to_40pct_val_acc
|
|
51
|
+
- epochs_to_35pct_val_acc
|
|
52
|
+
- epochs_to_30pct_val_acc
|
|
53
|
+
- unlearning_checkpoint
|
|
54
|
+
- certification_report
|
|
55
|
+
launch_profiles:
|
|
56
|
+
- id: quick_eval
|
|
57
|
+
label: Quick Eval
|
|
58
|
+
description: 'Run one packaged certified unlearning evaluation route using a single
|
|
59
|
+
pre-configured experiment YAML (e.g., from dp_sgd_runs/). Produces a single certification
|
|
60
|
+
report and efficiency metrics. Fastest path to verifying the environment and metric
|
|
61
|
+
surface.
|
|
62
|
+
|
|
63
|
+
'
|
|
64
|
+
- id: full_unlearning
|
|
65
|
+
label: Full Unlearning
|
|
66
|
+
description: 'Run the complete privacy-aware unlearning training and certification
|
|
67
|
+
workflow across all four experiment suites (budget_curve_runs, convergence_curve_runs,
|
|
68
|
+
dp_sgd_runs, eps_sweep_runs). Reproduces all paper figures. Requires multi-GPU
|
|
69
|
+
execution via run_exp.py.
|
|
70
|
+
|
|
71
|
+
'
|
|
72
|
+
dataset_download:
|
|
73
|
+
primary_method: mixed
|
|
74
|
+
sources:
|
|
75
|
+
- name: CIFAR-10
|
|
76
|
+
notes: Auto-downloaded by JAX/datasets pipeline at runtime.
|
|
77
|
+
- name: CIFAR-100
|
|
78
|
+
notes: Auto-downloaded by JAX/datasets pipeline at runtime.
|
|
79
|
+
- name: MNIST
|
|
80
|
+
notes: Auto-downloaded by JAX/datasets pipeline at runtime.
|
|
81
|
+
- name: ResNet-18 feature cache
|
|
82
|
+
notes: 'Generated locally by running feature_extractor.py before experiments that
|
|
83
|
+
use cifar10_feature or cifar100_feature dataset configs.
|
|
84
|
+
|
|
85
|
+
'
|
|
86
|
+
notes:
|
|
87
|
+
- All datasets are standard public benchmarks; no manual download required unless
|
|
88
|
+
offline execution is needed.
|
|
89
|
+
- feature_extractor.py must be run once before transfer-learning experiment configs
|
|
90
|
+
are used.
|
|
91
|
+
credential_requirements:
|
|
92
|
+
mode: optional
|
|
93
|
+
items:
|
|
94
|
+
- name: Weights & Biases (wandb)
|
|
95
|
+
notes: 'experiment.py calls wandb.init() at startup. Set WANDB_API_KEY or run
|
|
96
|
+
`wandb login` before execution. Offline mode can be enabled by setting WANDB_MODE=offline.
|
|
97
|
+
|
|
98
|
+
'
|
|
99
|
+
notes:
|
|
100
|
+
- No paid data credentials required. wandb is the only external service.
|
|
101
|
+
resources:
|
|
102
|
+
minimum:
|
|
103
|
+
cpu_cores: 8
|
|
104
|
+
ram_gb: 32
|
|
105
|
+
disk_gb: 80
|
|
106
|
+
gpu_count: 1
|
|
107
|
+
gpu_vram_gb: 12
|
|
108
|
+
notes: Sufficient for single-experiment quick_eval runs on MNIST or CIFAR-10.
|
|
109
|
+
recommended:
|
|
110
|
+
cpu_cores: 16
|
|
111
|
+
ram_gb: 64
|
|
112
|
+
disk_gb: 150
|
|
113
|
+
gpu_count: 2
|
|
114
|
+
gpu_vram_gb: 24
|
|
115
|
+
notes: 'Two GPUs allow run_exp.py to parallelize across experiment suites. Required
|
|
116
|
+
for full reproduction of all four figure-level ablations within the 6–24 h time
|
|
117
|
+
band.
|
|
118
|
+
|
|
119
|
+
'
|
|
120
|
+
environment:
|
|
121
|
+
python: '3.8'
|
|
122
|
+
cuda: null
|
|
123
|
+
pytorch: null
|
|
124
|
+
flash_attn: null
|
|
125
|
+
framework: jax
|
|
126
|
+
key_packages:
|
|
127
|
+
- jax==0.5.2
|
|
128
|
+
- jaxlib==0.5.1
|
|
129
|
+
- jax-cuda12-pjrt==0.5.1
|
|
130
|
+
- jax-cuda12-plugin==0.5.1
|
|
131
|
+
- flax==0.10.4
|
|
132
|
+
- optax
|
|
133
|
+
- dp-accounting==0.4.4
|
|
134
|
+
- transformers==4.49.0
|
|
135
|
+
- datasets==2.21.0
|
|
136
|
+
- ml_collections==1.0.0
|
|
137
|
+
- wandb
|
|
138
|
+
- chex==0.1.89
|
|
139
|
+
- torch
|
|
140
|
+
- matplotlib==3.10.1
|
|
141
|
+
- jaxpruner @ git+https://github.com/google-research/jaxpruner@e7af4e4e4748782d6bc433249e359f74ffb845ba
|
|
142
|
+
notes:
|
|
143
|
+
- This benchmark uses JAX/Flax as its primary framework, not PyTorch. PyTorch is
|
|
144
|
+
present in requirements.txt only for DataLoader utilities.
|
|
145
|
+
- CUDA version is determined by jax-cuda12-* wheel; install JAX CUDA packages before
|
|
146
|
+
other dependencies.
|
|
147
|
+
- See requirements.txt for the full pinned dependency set.
|
|
148
|
+
- Python 3.8 is declared above, but the pinned jax==0.5.2, flax==0.10.4, and matplotlib==3.10.1 require Python 3.10 or newer; confirm the interpreter version before installing.
|
|
149
|
+
risk_flags:
|
|
150
|
+
- jax_cuda_wheel_version_sensitivity
|
|
151
|
+
- wandb_required_at_runtime
|
|
152
|
+
- feature_extractor_prereq
|
|
153
|
+
- no_runtime_execution_in_packaging_pass
|
|
154
|
+
risk_notes:
|
|
155
|
+
- 'JAX CUDA wheels are highly version-sensitive. Install jax-cuda12-pjrt and jax-cuda12-plugin
|
|
156
|
+
before jaxlib to avoid ABI mismatches.
|
|
157
|
+
|
|
158
|
+
'
|
|
159
|
+
- 'experiment.py calls wandb.init() unconditionally; set WANDB_MODE=offline to prevent
|
|
160
|
+
a hard failure when no API key is present.
|
|
161
|
+
|
|
162
|
+
'
|
|
163
|
+
- 'Experiments using cifar10_feature or cifar100_feature dataset configs will fail
|
|
164
|
+
if feature_extractor.py has not been run first.
|
|
165
|
+
|
|
166
|
+
'
|
|
167
|
+
- 'No benchmark execution was performed during this packaging pass. All metric values
|
|
168
|
+
in metric_contract.json are provisional until runtime validation confirms them.
|
|
169
|
+
Do not trust the metric surface described in the README alone.
|
|
170
|
+
|
|
171
|
+
'
|
|
172
|
+
recommended_when: 'Use this benchmark when evaluating certified machine unlearning
|
|
173
|
+
methods on image-classification tasks (CIFAR-10, CIFAR-100, MNIST) with formal (ε,δ)
|
|
174
|
+
privacy guarantees. Ideal for comparing unlearning efficiency (epochs to reach a
|
|
175
|
+
validation accuracy threshold) across PABI, DP-SGD, contractive coefficient, and
|
|
176
|
+
output-perturbation baselines. Best suited for researchers who need assumption-free
|
|
177
|
+
certified unlearning applicable to non-convex deep networks.
|
|
178
|
+
|
|
179
|
+
'
|
|
180
|
+
not_recommended_when: 'Do not use if you only need standard image-classification training
|
|
181
|
+
without privacy or unlearning constraints. Not suitable if your pipeline requires
|
|
182
|
+
PyTorch-native training loops—the core implementation is JAX/Flax only. Avoid if
|
|
183
|
+
GPU VRAM is below 12 GB or if a JAX CUDA environment cannot be established. Not
|
|
184
|
+
appropriate for large-scale language-model unlearning or concept unlearning tasks,
|
|
185
|
+
which require a different method family.
|
|
186
|
+
|
|
187
|
+
'
|
|
188
|
+
paper:
|
|
189
|
+
title: Certified Unlearning for Neural Networks
|
|
190
|
+
authors:
|
|
191
|
+
- Anastasia Koloskova
|
|
192
|
+
- Youssef Allouah
|
|
193
|
+
- Animesh Jha
|
|
194
|
+
- Rachid Guerraoui
|
|
195
|
+
- Sanmi Koyejo
|
|
196
|
+
affiliations:
|
|
197
|
+
- Stanford University
|
|
198
|
+
- EPFL
|
|
199
|
+
venue: ICML 2025
|
|
200
|
+
year: 2025
|
|
201
|
+
url: https://arxiv.org/abs/2506.06985
|
|
202
|
+
bibtex_key: koloskova2025certified
|
|
203
|
+
notes: 'Equal contribution from Koloskova and Allouah. Proceedings of the 42nd International
|
|
204
|
+
Conference on Machine Learning, Vancouver, Canada. PMLR 267.
|
|
205
|
+
|
|
206
|
+
'
|
|
207
|
+
download:
|
|
208
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.070_certifiedunlearning.zip
|
|
209
|
+
archive_type: zip
|
|
210
|
+
local_dir_name: paper-70-CertifiedUnlearning
|
|
211
|
+
upstream_repo: https://github.com/stair-lab/certified-unlearning-neural-networks-icml-2025
|
|
212
|
+
provider: github_release
|
|
213
|
+
repo: ResearAI/DeepScientist
|
|
214
|
+
tag: aisb-v0.0.1
|
|
215
|
+
asset_name: aisb.t3.070_certifiedunlearning.zip
|
|
216
|
+
sha256: 124e11876363b6ccc532c5d235697f96975e0e2883506083a5f9391b63cf1ab7
|
|
217
|
+
size_bytes: 13612960
|
|
218
|
+
commercial:
|
|
219
|
+
annual_fee: null
|
|
220
|
+
display:
|
|
221
|
+
palette_seed: silver-plum-unlearn
|
|
222
|
+
art_style: privacy-lab
|
|
223
|
+
accent_priority: high
|
|
224
|
+
image_path: ../image/070_aisb.t3.070_certifiedunlearning.jpg
|
|
@@ -0,0 +1,171 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.070_certifiedunlearning
|
|
3
|
+
name: 神经网络认证遗忘
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 通过噪声微调实现隐私放大进行认证机器遗忘,提供可证明的(ε,δ)保证且无需损失函数假设。
|
|
6
|
+
task_description: >
|
|
7
|
+
本基准测试包实现并评估了神经网络认证机器遗忘方法(ICML 2025)。核心任务是从已训练模型中移除指定遗忘集的影响,同时在保留集上保持效用,并满足正式的(ε,δ)遗忘保证。该方法——迭代隐私放大(PABI)——将保留数据上每个带噪声的微调步骤视为随机后处理操作,逐步放大隐私性而不访问遗忘数据。该方法对损失函数不做平滑性或凸性假设,适用于任意深度网络。基准测试涵盖四种方法:PABI(梯度裁剪)、基于组隐私的DP-SGD、收缩系数(模型裁剪)和DP基线(输出扰动),以及完整重训练作为对照。实验覆盖CIFAR-10、CIFAR-100和MNIST数据集,包含四组消融实验:隐私预算曲线、收敛曲线、DP-SGD对比和ε扫描分析。主要效率指标为遗忘阶段中epochs_to_50pct_val_acc。框架使用JAX/Flax实现所有训练和遗忘逻辑;特征提取使用ResNet-18骨干网络。支持通过run_exp.py进行多GPU执行。
|
|
8
|
+
|
|
9
|
+
本打包过程未执行任何基准测试运行——在使用指标数值前需进行运行时验证。
|
|
10
|
+
|
|
11
|
+
capability_tags:
|
|
12
|
+
- machine_unlearning
|
|
13
|
+
- certified_privacy
|
|
14
|
+
- differential_privacy
|
|
15
|
+
- privacy_amplification
|
|
16
|
+
- neural_networks
|
|
17
|
+
- research_code_optimization
|
|
18
|
+
aisb_direction: T3
|
|
19
|
+
track_fit:
|
|
20
|
+
- paper_track
|
|
21
|
+
- benchmark_track
|
|
22
|
+
task_mode: experiment_driven
|
|
23
|
+
requires_execution: true
|
|
24
|
+
requires_paper: true
|
|
25
|
+
integrity_level: cas_plus_canary
|
|
26
|
+
snapshot_status: runnable
|
|
27
|
+
support_level: advanced
|
|
28
|
+
time_band: 6-24h
|
|
29
|
+
cost_band: medium
|
|
30
|
+
difficulty: hard
|
|
31
|
+
data_access: public
|
|
32
|
+
primary_outputs:
|
|
33
|
+
- epochs_to_50pct_val_acc
|
|
34
|
+
- epochs_to_45pct_val_acc
|
|
35
|
+
- epochs_to_40pct_val_acc
|
|
36
|
+
- epochs_to_35pct_val_acc
|
|
37
|
+
- epochs_to_30pct_val_acc
|
|
38
|
+
- unlearning_checkpoint
|
|
39
|
+
- certification_report
|
|
40
|
+
launch_profiles:
|
|
41
|
+
- id: quick_eval
|
|
42
|
+
label: 快速评估
|
|
43
|
+
description: >
|
|
44
|
+
使用单个预配置实验YAML(例如来自dp_sgd_runs/)运行一条封装的认证遗忘评估路线。生成一份认证报告和效率指标。是验证环境和指标表面的最快路径。
|
|
45
|
+
|
|
46
|
+
- id: full_unlearning
|
|
47
|
+
label: 完整遗忘
|
|
48
|
+
description: >
|
|
49
|
+
跨所有四组实验套件(budget_curve_runs、convergence_curve_runs、dp_sgd_runs、eps_sweep_runs)运行完整的隐私感知遗忘训练和认证工作流。复现论文所有图表。需要通过run_exp.py进行多GPU执行。
|
|
50
|
+
|
|
51
|
+
dataset_download:
|
|
52
|
+
primary_method: mixed
|
|
53
|
+
sources:
|
|
54
|
+
- name: CIFAR-10
|
|
55
|
+
notes: 由JAX/datasets管道在运行时自动下载。
|
|
56
|
+
- name: CIFAR-100
|
|
57
|
+
notes: 由JAX/datasets管道在运行时自动下载。
|
|
58
|
+
- name: MNIST
|
|
59
|
+
notes: 由JAX/datasets管道在运行时自动下载。
|
|
60
|
+
- name: ResNet-18特征缓存
|
|
61
|
+
notes: 通过在实验前运行feature_extractor.py在本地生成,用于cifar10_feature或cifar100_feature数据集配置。
|
|
62
|
+
|
|
63
|
+
notes:
|
|
64
|
+
- 所有数据集均为标准公开基准测试;除非需要离线执行,无需手动下载。
|
|
65
|
+
- 在使用迁移学习实验配置前,必须运行一次feature_extractor.py。
|
|
66
|
+
credential_requirements:
|
|
67
|
+
mode: optional
|
|
68
|
+
items:
|
|
69
|
+
- name: Weights & Biases (wandb)
|
|
70
|
+
notes: experiment.py在启动时调用wandb.init()。执行前设置WANDB_API_KEY或运行`wandb login`。可通过设置WANDB_MODE=offline启用离线模式。
|
|
71
|
+
|
|
72
|
+
notes:
|
|
73
|
+
- 无需付费数据凭证。wandb是唯一的外部服务。
|
|
74
|
+
resources:
|
|
75
|
+
minimum:
|
|
76
|
+
cpu_cores: 8
|
|
77
|
+
ram_gb: 32
|
|
78
|
+
disk_gb: 80
|
|
79
|
+
gpu_count: 1
|
|
80
|
+
gpu_vram_gb: 12
|
|
81
|
+
notes: 足以在MNIST或CIFAR-10上运行单实验quick_eval。
|
|
82
|
+
recommended:
|
|
83
|
+
cpu_cores: 16
|
|
84
|
+
ram_gb: 64
|
|
85
|
+
disk_gb: 150
|
|
86
|
+
gpu_count: 2
|
|
87
|
+
gpu_vram_gb: 24
|
|
88
|
+
notes: 两块GPU允许run_exp.py并行化执行实验套件。若要在6–24小时时间范围内完整复现全部四组消融图表,则需要该配置。
|
|
89
|
+
|
|
90
|
+
environment:
|
|
91
|
+
python: '3.8'
|
|
92
|
+
cuda: null
|
|
93
|
+
pytorch: null
|
|
94
|
+
flash_attn: null
|
|
95
|
+
framework: jax
|
|
96
|
+
key_packages:
|
|
97
|
+
- jax==0.5.2
|
|
98
|
+
- jaxlib==0.5.1
|
|
99
|
+
- jax-cuda12-pjrt==0.5.1
|
|
100
|
+
- jax-cuda12-plugin==0.5.1
|
|
101
|
+
- flax==0.10.4
|
|
102
|
+
- optax
|
|
103
|
+
- dp-accounting==0.4.4
|
|
104
|
+
- transformers==4.49.0
|
|
105
|
+
- datasets==2.21.0
|
|
106
|
+
- ml_collections==1.0.0
|
|
107
|
+
- wandb
|
|
108
|
+
- chex==0.1.89
|
|
109
|
+
- torch
|
|
110
|
+
- matplotlib==3.10.1
|
|
111
|
+
- jaxpruner @ git+https://github.com/google-research/jaxpruner@e7af4e4e4748782d6bc433249e359f74ffb845ba
|
|
112
|
+
notes:
|
|
113
|
+
- 本基准测试使用JAX/Flax作为主要框架,而非PyTorch。PyTorch仅在requirements.txt中用于DataLoader工具类。
|
|
114
|
+
- CUDA版本由jax-cuda12-* wheel决定;应先安装JAX CUDA包,再安装其他依赖项。
|
|
115
|
+
- 完整固定依赖集请参见requirements.txt。
|
|
116
|
+
- 需要Python 3.8;使用的JAX版本(0.5.2)不支持3.12+。
|
|
117
|
+
risk_flags:
|
|
118
|
+
- jax_cuda_wheel_version_sensitivity
|
|
119
|
+
- wandb_required_at_runtime
|
|
120
|
+
- feature_extractor_prereq
|
|
121
|
+
- no_runtime_execution_in_packaging_pass
|
|
122
|
+
risk_notes:
|
|
123
|
+
- JAX CUDA wheel对版本高度敏感。先安装jax-cuda12-pjrt和jax-cuda12-plugin再安装jaxlib,以避免ABI不匹配。
|
|
124
|
+
|
|
125
|
+
- experiment.py无条件调用wandb.init();无API key时设置WANDB_MODE=offline以防止硬性失败。
|
|
126
|
+
|
|
127
|
+
- 使用cifar10_feature或cifar100_feature数据集配置的实验若未先运行feature_extractor.py将失败。
|
|
128
|
+
|
|
129
|
+
- 本打包过程未执行任何基准测试运行。metric_contract.json中的所有指标值均为临时值,需运行时验证后方可信赖。请勿仅凭README信赖指标表面。
|
|
130
|
+
|
|
131
|
+
recommended_when: >
|
|
132
|
+
在需要形式化(ε,δ)隐私保证的图像分类任务(CIFAR-10、CIFAR-100、MNIST)上评估认证机器遗忘方法时使用本基准测试。适合比较PABI、DP-SGD、收缩系数和输出扰动基线之间的遗忘效率(达到验证准确率阈值所需轮数)。最适合需要适用于非凸深度网络的无假设认证遗忘的研究人员。
|
|
133
|
+
|
|
134
|
+
not_recommended_when: >
|
|
135
|
+
若仅需标准图像分类训练而无需隐私或遗忘约束,请勿使用。本基准测试不适用于需要PyTorch原生训练循环的场景——核心实现仅支持JAX/Flax。若GPU显存低于12GB或无法建立JAX CUDA环境,请勿使用。不适用于大规模语言模型遗忘或概念遗忘任务,这些任务需要不同的方法体系。
|
|
136
|
+
|
|
137
|
+
paper:
|
|
138
|
+
title: Certified Unlearning for Neural Networks
|
|
139
|
+
authors:
|
|
140
|
+
- Anastasia Koloskova
|
|
141
|
+
- Youssef Allouah
|
|
142
|
+
- Animesh Jha
|
|
143
|
+
- Rachid Guerraoui
|
|
144
|
+
- Sanmi Koyejo
|
|
145
|
+
affiliations:
|
|
146
|
+
- Stanford University
|
|
147
|
+
- EPFL
|
|
148
|
+
venue: ICML 2025
|
|
149
|
+
year: 2025
|
|
150
|
+
url: https://arxiv.org/abs/2506.06985
|
|
151
|
+
bibtex_key: koloskova2025certified
|
|
152
|
+
notes: Koloskova和Allouah同等贡献。加拿大温哥华第42届国际机器学习会议论文集。PMLR 267。
|
|
153
|
+
|
|
154
|
+
download:
|
|
155
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.070_certifiedunlearning.zip
|
|
156
|
+
archive_type: zip
|
|
157
|
+
local_dir_name: paper-70-CertifiedUnlearning
|
|
158
|
+
upstream_repo: https://github.com/stair-lab/certified-unlearning-neural-networks-icml-2025
|
|
159
|
+
provider: github_release
|
|
160
|
+
repo: ResearAI/DeepScientist
|
|
161
|
+
tag: aisb-v0.0.1
|
|
162
|
+
asset_name: aisb.t3.070_certifiedunlearning.zip
|
|
163
|
+
sha256: 124e11876363b6ccc532c5d235697f96975e0e2883506083a5f9391b63cf1ab7
|
|
164
|
+
size_bytes: 13612960
|
|
165
|
+
commercial:
|
|
166
|
+
annual_fee: null
|
|
167
|
+
display:
|
|
168
|
+
palette_seed: silver-plum-unlearn
|
|
169
|
+
art_style: privacy-lab
|
|
170
|
+
accent_priority: high
|
|
171
|
+
image_path: ../image/070_aisb.t3.070_certifiedunlearning.jpg
|
|
@@ -0,0 +1,142 @@
|
|
|
1
|
+
id: aisb.t3.071_neuralmjd
|
|
2
|
+
name: Neural Non-Stationary Merton Jump Diffusion
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: Neural network parameterization of non-stationary Merton jump diffusion
|
|
5
|
+
for time series prediction with explicit stochastic dynamics and abrupt jump modeling.
|
|
6
|
+
task_description: 'This packaged benchmark covers jump-diffusion time-series prediction
|
|
7
|
+
using a neural parameterization of the non-stationary Merton jump diffusion (MJD)
|
|
8
|
+
model. The approach combines a time-inhomogeneous Itô diffusion to capture continuous
|
|
9
|
+
non-stationary stochastic dynamics with a time-inhomogeneous compound Poisson process
|
|
10
|
+
to model abrupt jumps. Parameters of the corresponding stochastic differential equations
|
|
11
|
+
(SDEs) are predicted by a neural network conditioned on historical data and contextual
|
|
12
|
+
information. The task evaluates forecasting fidelity on non-stationary data containing
|
|
13
|
+
discontinuous changes, using MAE for deterministic accuracy and NLL for probabilistic
|
|
14
|
+
calibration.
|
|
15
|
+
|
|
16
|
+
'
|
|
17
|
+
task_mode: experiment_driven
|
|
18
|
+
requires_execution: true
|
|
19
|
+
requires_paper: true
|
|
20
|
+
integrity_level: cas_plus_canary
|
|
21
|
+
snapshot_status: external_eval_required
|
|
22
|
+
support_level: recovery
|
|
23
|
+
time_band: 6-24h
|
|
24
|
+
cost_band: medium
|
|
25
|
+
difficulty: hard
|
|
26
|
+
data_access: public
|
|
27
|
+
primary_outputs:
|
|
28
|
+
- mae
|
|
29
|
+
- nll
|
|
30
|
+
- jump_diffusion_checkpoint
|
|
31
|
+
launch_profiles:
|
|
32
|
+
- id: quick_eval
|
|
33
|
+
label: Quick Eval
|
|
34
|
+
description: Run a single packaged jump-diffusion forecasting evaluation route on
|
|
35
|
+
a pre-trained checkpoint with SP500 data.
|
|
36
|
+
estimated_time: 1-2h
|
|
37
|
+
- id: full_train_eval
|
|
38
|
+
label: Full Train + Eval
|
|
39
|
+
description: Run the complete Monte Carlo jump-diffusion training workflow including
|
|
40
|
+
model initialization, training loop with periodic evaluation, checkpointing, and
|
|
41
|
+
final test set evaluation.
|
|
42
|
+
estimated_time: 6-18h
|
|
43
|
+
dataset_download:
|
|
44
|
+
primary_method: curl
|
|
45
|
+
sources:
|
|
46
|
+
- name: SP500 Historical Stock Data
|
|
47
|
+
url: https://www.kaggle.com/api/v1/datasets/download/camnugent/sandp500
|
|
48
|
+
type: kaggle
|
|
49
|
+
format: zip
|
|
50
|
+
local_path: ./data/sandp500
|
|
51
|
+
notes:
|
|
52
|
+
- SP500 dataset requires Kaggle API credentials for download
|
|
53
|
+
- Demo notebook supports synthetic data generation without external downloads
|
|
54
|
+
- Configuration files located in config/sp500/mjd/
|
|
55
|
+
credential_requirements:
|
|
56
|
+
mode: kaggle_api
|
|
57
|
+
items:
|
|
58
|
+
- name: Kaggle API Token
|
|
59
|
+
description: Required for SP500 dataset download from Kaggle
|
|
60
|
+
optional: true
|
|
61
|
+
notes:
|
|
62
|
+
- Kaggle credentials only needed for real-world SP500 data; synthetic data available
|
|
63
|
+
via demo notebook without credentials
|
|
64
|
+
resources:
|
|
65
|
+
minimum:
|
|
66
|
+
cpu_cores: 8
|
|
67
|
+
ram_gb: 32
|
|
68
|
+
disk_gb: 80
|
|
69
|
+
gpu_count: 1
|
|
70
|
+
gpu_vram_gb: 16
|
|
71
|
+
network: false
|
|
72
|
+
recommended:
|
|
73
|
+
cpu_cores: 16
|
|
74
|
+
ram_gb: 64
|
|
75
|
+
disk_gb: 150
|
|
76
|
+
gpu_count: 1
|
|
77
|
+
gpu_vram_gb: 24
|
|
78
|
+
network: true
|
|
79
|
+
environment:
|
|
80
|
+
python: '3.10'
|
|
81
|
+
cuda: '11.8'
|
|
82
|
+
pytorch: 2.1.2
|
|
83
|
+
flash_attn: null
|
|
84
|
+
key_packages:
|
|
85
|
+
- torch>=2.0.0
|
|
86
|
+
- pytorch-geometric
|
|
87
|
+
- pyyaml
|
|
88
|
+
- numpy
|
|
89
|
+
- scipy
|
|
90
|
+
notes:
|
|
91
|
+
- Environment provisioned via setup/conda.yaml or setup/requirements.txt
|
|
92
|
+
- PyG (pytorch-geometric) required for data loaders
|
|
93
|
+
- Full dependency set in bundled requirements; see README for conda setup instructions
|
|
94
|
+
risk_flags:
|
|
95
|
+
- long_training_time
|
|
96
|
+
- stochastic_variance
|
|
97
|
+
risk_notes:
|
|
98
|
+
- Monte Carlo sampling introduces stochastic variance; multiple seeds recommended
|
|
99
|
+
for robust evaluation
|
|
100
|
+
- Training on SP500 with default hyperparameters may take 6-12 hours on a single GPU
|
|
101
|
+
- Metric values are provisional pending first trusted execution; stochastic nature
|
|
102
|
+
means results may vary across runs
|
|
103
|
+
recommended_when: 'Use this benchmark when you need probabilistic time-series forecasting
|
|
104
|
+
that explicitly models abrupt discontinuous jumps and non-stationary dynamics. Ideal
|
|
105
|
+
for financial time series with sudden price movements, supply chain data with promotional
|
|
106
|
+
spikes, or any domain requiring interpretable stochastic process modeling alongside
|
|
107
|
+
neural network flexibility.
|
|
108
|
+
|
|
109
|
+
'
|
|
110
|
+
not_recommended_when: 'Do not use this benchmark if you only need simple deterministic
|
|
111
|
+
point forecasting without uncertainty quantification. Not recommended when jump
|
|
112
|
+
events are annotated and event-based temporal point process models would be more
|
|
113
|
+
appropriate. Avoid when GPU memory < 16GB and training throughput is a primary constraint.
|
|
114
|
+
|
|
115
|
+
'
|
|
116
|
+
paper:
|
|
117
|
+
title: Neural Non-Stationary Merton Jump Diffusion for Time Series Prediction
|
|
118
|
+
authors:
|
|
119
|
+
- Yuanpei Gao (University of British Columbia, Vector Institute)
|
|
120
|
+
- Qi Yan (University of British Columbia, Vector Institute)
|
|
121
|
+
- Yan Leng (University of Texas at Austin)
|
|
122
|
+
- Renjie Liao (University of British Columbia, Vector Institute, Canada CIFAR AI
|
|
123
|
+
Chair)
|
|
124
|
+
venue: arXiv preprint arXiv:2506.04542
|
|
125
|
+
year: 2025
|
|
126
|
+
url: https://arxiv.org/abs/2506.04542
|
|
127
|
+
github: https://github.com/DSL-Lab/neural-MJD
|
|
128
|
+
download:
|
|
129
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.071_neuralmjd.zip
|
|
130
|
+
archive_type: zip
|
|
131
|
+
local_dir_name: paper-71-NeuralMJD
|
|
132
|
+
provider: github_release
|
|
133
|
+
repo: ResearAI/DeepScientist
|
|
134
|
+
tag: aisb-v0.0.1
|
|
135
|
+
asset_name: aisb.t3.071_neuralmjd.zip
|
|
136
|
+
sha256: 0ea7d70c8c22946e148ccfdf01295d7608888a1423b5ae6391ad927a6224f2e0
|
|
137
|
+
size_bytes: 101203
|
|
138
|
+
display:
|
|
139
|
+
palette_seed: indigo-copper-jump
|
|
140
|
+
art_style: stochastic-signal
|
|
141
|
+
accent_priority: high
|
|
142
|
+
image_path: ../image/071_aisb.t3.071_neuralmjd.jpg
|
|
@@ -0,0 +1,120 @@
|
|
|
1
|
+
id: aisb.t3.071_neuralmjd
|
|
2
|
+
name: 神经非平稳Merton跳跃扩散
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: 用于时间序列预测的非平稳Merton跳跃扩散神经网络参数化方法,具备显式随机动力学建模和突变跳跃捕捉能力。
|
|
5
|
+
task_description: '该打包基准测试涵盖了基于神经参数化非平稳Merton跳跃扩散(MJD)模型的跳跃扩散时间序列预测任务。该方法结合了时变Itô扩散以捕捉连续非平稳随机动力学,以及时变复合泊松过程以建模突变跳跃。相应随机微分方程(SDEs)的参数由神经网络根据历史数据和上下文信息预测。该任务评估在包含不连续变化的非平稳数据上的预测保真度,使用MAE衡量确定性精度,使用NLL评估概率校准。
|
|
6
|
+
|
|
7
|
+
'
|
|
8
|
+
task_mode: experiment_driven
|
|
9
|
+
requires_execution: true
|
|
10
|
+
requires_paper: true
|
|
11
|
+
integrity_level: cas_plus_canary
|
|
12
|
+
snapshot_status: external_eval_required
|
|
13
|
+
support_level: recovery
|
|
14
|
+
time_band: 6-24h
|
|
15
|
+
cost_band: medium
|
|
16
|
+
difficulty: hard
|
|
17
|
+
data_access: public
|
|
18
|
+
primary_outputs:
|
|
19
|
+
- mae
|
|
20
|
+
- nll
|
|
21
|
+
- jump_diffusion_checkpoint
|
|
22
|
+
launch_profiles:
|
|
23
|
+
- id: quick_eval
|
|
24
|
+
label: 快速评估
|
|
25
|
+
description: 在预训练检查点上使用SP500数据运行单个打包的跳跃扩散预测评估流程。
|
|
26
|
+
estimated_time: 1-2h
|
|
27
|
+
- id: full_train_eval
|
|
28
|
+
label: 完整训练+评估
|
|
29
|
+
description: 运行完整的蒙特卡洛跳跃扩散训练工作流程,包括模型初始化、周期性评估的训练循环、检查点保存以及最终测试集评估。
|
|
30
|
+
estimated_time: 6-18h
|
|
31
|
+
dataset_download:
|
|
32
|
+
primary_method: curl
|
|
33
|
+
sources:
|
|
34
|
+
- name: SP500历史股票数据
|
|
35
|
+
url: https://www.kaggle.com/api/v1/datasets/download/camnugent/sandp500
|
|
36
|
+
type: kaggle
|
|
37
|
+
format: zip
|
|
38
|
+
local_path: ./data/sandp500
|
|
39
|
+
notes:
|
|
40
|
+
- SP500数据集需要Kaggle API凭证才能下载
|
|
41
|
+
- 演示笔记本支持合成数据生成,无需外部下载
|
|
42
|
+
- 配置文件位于config/sp500/mjd/目录
|
|
43
|
+
credential_requirements:
|
|
44
|
+
mode: kaggle_api
|
|
45
|
+
items:
|
|
46
|
+
- name: Kaggle API令牌
|
|
47
|
+
description: 从Kaggle下载SP500数据集所需
|
|
48
|
+
optional: true
|
|
49
|
+
notes:
|
|
50
|
+
- Kaggle凭证仅在使用真实SP500数据时才需要;演示笔记本可通过合成数据使用,无需凭证
|
|
51
|
+
resources:
|
|
52
|
+
minimum:
|
|
53
|
+
cpu_cores: 8
|
|
54
|
+
ram_gb: 32
|
|
55
|
+
disk_gb: 80
|
|
56
|
+
gpu_count: 1
|
|
57
|
+
gpu_vram_gb: 16
|
|
58
|
+
network: false
|
|
59
|
+
recommended:
|
|
60
|
+
cpu_cores: 16
|
|
61
|
+
ram_gb: 64
|
|
62
|
+
disk_gb: 150
|
|
63
|
+
gpu_count: 1
|
|
64
|
+
gpu_vram_gb: 24
|
|
65
|
+
network: true
|
|
66
|
+
environment:
|
|
67
|
+
python: '3.10'
|
|
68
|
+
cuda: '11.8'
|
|
69
|
+
pytorch: 2.1.2
|
|
70
|
+
flash_attn: null
|
|
71
|
+
key_packages:
|
|
72
|
+
- torch>=2.0.0
|
|
73
|
+
- pytorch-geometric
|
|
74
|
+
- pyyaml
|
|
75
|
+
- numpy
|
|
76
|
+
- scipy
|
|
77
|
+
notes:
|
|
78
|
+
- 环境通过setup/conda.yaml或setup/requirements.txt配置
|
|
79
|
+
- 数据加载器需要PyG(pytorch-geometric)
|
|
80
|
+
- 完整依赖集在打包的requirements文件中;conda环境设置说明请参阅README
|
|
81
|
+
risk_flags:
|
|
82
|
+
- long_training_time
|
|
83
|
+
- stochastic_variance
|
|
84
|
+
risk_notes:
|
|
85
|
+
- 蒙特卡洛采样引入随机方差;建议使用多个随机种子以获得稳健的评估结果
|
|
86
|
+
- 使用默认超参数在SP500上训练在单个GPU上可能需要6-12小时
|
|
87
|
+
- 指标值为临时值,待首次可信执行后确定;随机特性意味着不同运行之间结果可能有所差异
|
|
88
|
+
recommended_when: '当需要显式建模突变的不连续跳跃和非平稳动力学的概率时间序列预测时使用此基准。适用于具有突然价格波动的金融时间序列、具有促销尖峰的供应链数据,或任何需要将可解释的随机过程建模与神经网络灵活性相结合的场景。
|
|
89
|
+
|
|
90
|
+
'
|
|
91
|
+
not_recommended_when: '如果仅需简单的确定性点预测而不需要不确定性量化,请勿使用此基准。当跳跃事件已标注且基于事件的时序点过程模型更合适时不推荐使用。当GPU内存小于16GB且训练吞吐量是主要约束时应避免。
|
|
92
|
+
|
|
93
|
+
'
|
|
94
|
+
paper:
|
|
95
|
+
title: Neural Non-Stationary Merton Jump Diffusion for Time Series Prediction
|
|
96
|
+
authors:
|
|
97
|
+
- Yuanpei Gao (University of British Columbia, Vector Institute)
|
|
98
|
+
- Qi Yan (University of British Columbia, Vector Institute)
|
|
99
|
+
- Yan Leng (University of Texas at Austin)
|
|
100
|
+
- Renjie Liao (University of British Columbia, Vector Institute, Canada CIFAR AI
|
|
101
|
+
Chair)
|
|
102
|
+
venue: arXiv preprint arXiv:2506.04542
|
|
103
|
+
year: 2025
|
|
104
|
+
url: https://arxiv.org/abs/2506.04542
|
|
105
|
+
github: https://github.com/DSL-Lab/neural-MJD
|
|
106
|
+
download:
|
|
107
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.071_neuralmjd.zip
|
|
108
|
+
archive_type: zip
|
|
109
|
+
local_dir_name: paper-71-NeuralMJD
|
|
110
|
+
provider: github_release
|
|
111
|
+
repo: ResearAI/DeepScientist
|
|
112
|
+
tag: aisb-v0.0.1
|
|
113
|
+
asset_name: aisb.t3.071_neuralmjd.zip
|
|
114
|
+
sha256: 0ea7d70c8c22946e148ccfdf01295d7608888a1423b5ae6391ad927a6224f2e0
|
|
115
|
+
size_bytes: 101203
|
|
116
|
+
display:
|
|
117
|
+
palette_seed: indigo-copper-jump
|
|
118
|
+
art_style: stochastic-signal
|
|
119
|
+
accent_priority: high
|
|
120
|
+
image_path: ../image/071_aisb.t3.071_neuralmjd.jpg
|