@researai/deepscientist 1.5.17 → 1.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +309 -130
- package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
- package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
- package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
- package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
- package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
- package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
- package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
- package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
- package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
- package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
- package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
- package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
- package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
- package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
- package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
- package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
- package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
- package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
- package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
- package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
- package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
- package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
- package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
- package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
- package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
- package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
- package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
- package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
- package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
- package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
- package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
- package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
- package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
- package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
- package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
- package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
- package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
- package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
- package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
- package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
- package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
- package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
- package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
- package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
- package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
- package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
- package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
- package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
- package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
- package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
- package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
- package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
- package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
- package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
- package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
- package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
- package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
- package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
- package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
- package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
- package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
- package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
- package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
- package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
- package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
- package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
- package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
- package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
- package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
- package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
- package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
- package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
- package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
- package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
- package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
- package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
- package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
- package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
- package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
- package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
- package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
- package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
- package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
- package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
- package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
- package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
- package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
- package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
- package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
- package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
- package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
- package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
- package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
- package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
- package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
- package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
- package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
- package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
- package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
- package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
- package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
- package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
- package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
- package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
- package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
- package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
- package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
- package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
- package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
- package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
- package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
- package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
- package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
- package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
- package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
- package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
- package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
- package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
- package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
- package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
- package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
- package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
- package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
- package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
- package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
- package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
- package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
- package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
- package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
- package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
- package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
- package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
- package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
- package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
- package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
- package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
- package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
- package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
- package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
- package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
- package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
- package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
- package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
- package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
- package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
- package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
- package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
- package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
- package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
- package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
- package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
- package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
- package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
- package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
- package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
- package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
- package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
- package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
- package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
- package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
- package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
- package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
- package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
- package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
- package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
- package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
- package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
- package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
- package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
- package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
- package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
- package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
- package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
- package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
- package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
- package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
- package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
- package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
- package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
- package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
- package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
- package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
- package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
- package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
- package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
- package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
- package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
- package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
- package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
- package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
- package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
- package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
- package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
- package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
- package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
- package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
- package/AISB/image/aisb.b10.climate_earth.svg +16 -0
- package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
- package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
- package/AISB/image/aisb.b2.agent_systems.svg +16 -0
- package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
- package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
- package/AISB/image/aisb.b5.math_proof.svg +16 -0
- package/AISB/image/aisb.b6.research_process.svg +16 -0
- package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
- package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
- package/AISB/image/aisb.b9.material_science.svg +16 -0
- package/README.md +132 -11
- package/bin/ds.js +376 -49
- package/docs/en/00_QUICK_START.md +135 -18
- package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
- package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
- package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
- package/docs/en/05_TUI_GUIDE.md +171 -2
- package/docs/en/07_MEMORY_AND_MCP.md +38 -2
- package/docs/en/09_DOCTOR.md +64 -4
- package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
- package/docs/en/11_LICENSE_AND_RISK.md +4 -0
- package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/en/15_CODEX_PROVIDER_SETUP.md +622 -187
- package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
- package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
- package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
- package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
- package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
- package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
- package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
- package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
- package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
- package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
- package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
- package/docs/en/91_DEVELOPMENT.md +29 -0
- package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
- package/docs/en/README.md +44 -7
- package/docs/images/admin/admin-connectors-health-en.png +0 -0
- package/docs/images/admin/admin-controllers-en.png +0 -0
- package/docs/images/admin/admin-diagnostics-en.png +0 -0
- package/docs/images/admin/admin-errors-en.png +0 -0
- package/docs/images/admin/admin-issues-en.png +0 -0
- package/docs/images/admin/admin-logs-en.png +0 -0
- package/docs/images/admin/admin-quest-detail-en.png +0 -0
- package/docs/images/admin/admin-quests-en.png +0 -0
- package/docs/images/admin/admin-repairs-en.png +0 -0
- package/docs/images/admin/admin-runtime-en.png +0 -0
- package/docs/images/admin/admin-search-en.png +0 -0
- package/docs/images/admin/admin-stats-en.png +0 -0
- package/docs/images/admin/admin-summary-en.png +0 -0
- package/docs/images/connectors/connector-discord-en.png +0 -0
- package/docs/images/connectors/connector-feishu-en.png +0 -0
- package/docs/images/connectors/connector-lingzhu-en.png +0 -0
- package/docs/images/connectors/connector-qq-en.png +0 -0
- package/docs/images/connectors/connector-slack-en.png +0 -0
- package/docs/images/connectors/connector-telegram-en.png +0 -0
- package/docs/images/connectors/connector-weixin-en.png +0 -0
- package/docs/images/connectors/connector-whatsapp-en.png +0 -0
- package/docs/images/settings/settings-baselines-en.png +0 -0
- package/docs/images/settings/settings-config-en.png +0 -0
- package/docs/images/settings/settings-connectors-overview-en.png +0 -0
- package/docs/images/settings/settings-deepxiv-en.png +0 -0
- package/docs/images/settings/settings-mcp-servers-en.png +0 -0
- package/docs/images/settings/settings-plugins-en.png +0 -0
- package/docs/images/settings/settings-runners-en.png +0 -0
- package/docs/zh/00_QUICK_START.md +92 -17
- package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
- package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/zh/05_TUI_GUIDE.md +171 -2
- package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
- package/docs/zh/09_DOCTOR.md +39 -4
- package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
- package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
- package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/zh/15_CODEX_PROVIDER_SETUP.md +550 -188
- package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
- package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
- package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
- package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
- package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
- package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
- package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
- package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
- package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
- package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
- package/docs/zh/README.md +29 -7
- package/install.sh +122 -16
- package/package.json +4 -1
- package/pyproject.toml +2 -1
- package/src/deepscientist/__init__.py +1 -1
- package/src/deepscientist/acp/envelope.py +13 -0
- package/src/deepscientist/admin/__init__.py +3 -0
- package/src/deepscientist/admin/charts.py +681 -0
- package/src/deepscientist/admin/logs.py +119 -0
- package/src/deepscientist/admin/repairs.py +217 -0
- package/src/deepscientist/admin/service.py +1310 -0
- package/src/deepscientist/admin/system_info.py +700 -0
- package/src/deepscientist/admin/tasks.py +465 -0
- package/src/deepscientist/admin/tool_metrics.py +600 -0
- package/src/deepscientist/artifact/guidance.py +8 -4
- package/src/deepscientist/artifact/schemas.py +115 -0
- package/src/deepscientist/artifact/service.py +4268 -260
- package/src/deepscientist/bash_exec/monitor.py +30 -3
- package/src/deepscientist/bash_exec/service.py +134 -1
- package/src/deepscientist/benchstore/__init__.py +4 -0
- package/src/deepscientist/benchstore/prompt_builder.py +224 -0
- package/src/deepscientist/benchstore/service.py +1716 -0
- package/src/deepscientist/channels/weixin_ilink.py +8 -1
- package/src/deepscientist/cli.py +92 -17
- package/src/deepscientist/codex_cli_compat.py +2 -2
- package/src/deepscientist/config/models.py +82 -11
- package/src/deepscientist/config/service.py +927 -91
- package/src/deepscientist/connector/weixin_support.py +48 -17
- package/src/deepscientist/daemon/api/handlers.py +697 -210
- package/src/deepscientist/daemon/api/router.py +76 -1
- package/src/deepscientist/daemon/app.py +1054 -51
- package/src/deepscientist/diagnostics/runner_failures.py +147 -0
- package/src/deepscientist/doctor.py +212 -65
- package/src/deepscientist/evidence_packets.py +590 -0
- package/src/deepscientist/home.py +52 -4
- package/src/deepscientist/kimi_cli_compat.py +50 -0
- package/src/deepscientist/latex_runtime.py +2 -2
- package/src/deepscientist/mcp/context.py +2 -0
- package/src/deepscientist/mcp/schemas.py +114 -0
- package/src/deepscientist/mcp/server.py +1566 -126
- package/src/deepscientist/memory/service.py +203 -16
- package/src/deepscientist/process_control.py +8 -1
- package/src/deepscientist/prompts/builder.py +836 -92
- package/src/deepscientist/quest/__init__.py +2 -2
- package/src/deepscientist/quest/layout.py +12 -1
- package/src/deepscientist/quest/node_traces.py +10 -0
- package/src/deepscientist/quest/service.py +1430 -139
- package/src/deepscientist/quest/stage_views.py +1 -1
- package/src/deepscientist/runners/__init__.py +18 -0
- package/src/deepscientist/runners/base.py +89 -1
- package/src/deepscientist/runners/builtins.py +13 -1
- package/src/deepscientist/runners/claude.py +391 -0
- package/src/deepscientist/runners/codex.py +421 -21
- package/src/deepscientist/runners/codex_telemetry.py +127 -0
- package/src/deepscientist/runners/kimi.py +334 -0
- package/src/deepscientist/runners/metadata.py +68 -0
- package/src/deepscientist/runners/opencode.py +414 -0
- package/src/deepscientist/runners/runtime_overrides.py +100 -0
- package/src/deepscientist/runners/simple_cli.py +538 -0
- package/src/deepscientist/runtime_storage.py +303 -0
- package/src/deepscientist/shared.py +61 -16
- package/src/deepscientist/skills/installer.py +37 -0
- package/src/deepscientist/skills/registry.py +2 -0
- package/src/deepscientist/tinytex.py +2 -2
- package/src/deepscientist/tui.py +10 -3
- package/src/prompts/benchstore/system.md +77 -0
- package/src/prompts/connectors/qq.md +33 -2
- package/src/prompts/connectors/weixin.md +208 -23
- package/src/prompts/contracts/admin_ops.md +74 -0
- package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
- package/src/prompts/contracts/shared_interaction.md +5 -11
- package/src/prompts/start_setup/system.md +422 -0
- package/src/prompts/system.md +409 -315
- package/src/prompts/system_copilot.md +88 -12
- package/src/skills/analysis-campaign/SKILL.md +239 -578
- package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
- package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
- package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
- package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
- package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
- package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
- package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
- package/src/skills/baseline/SKILL.md +183 -461
- package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
- package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
- package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
- package/src/skills/baseline/references/baseline-plan-template.md +37 -76
- package/src/skills/baseline/references/boundary-cases.md +86 -0
- package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
- package/src/skills/baseline/references/comparability-contract.md +7 -12
- package/src/skills/baseline/references/operational-guidance.md +56 -0
- package/src/skills/baseline/references/route-selection.md +5 -25
- package/src/skills/decision/SKILL.md +113 -306
- package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
- package/src/skills/decision/references/operational-guidance.md +94 -0
- package/src/skills/decision/references/research-route-criteria.md +7 -8
- package/src/skills/decision/references/strategic-decision-template.md +13 -26
- package/src/skills/experiment/SKILL.md +132 -670
- package/src/skills/experiment/references/execution-playbook.md +374 -0
- package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
- package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
- package/src/skills/experiment/references/operational-guidance.md +108 -0
- package/src/skills/finalize/SKILL.md +62 -0
- package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
- package/src/skills/finalize/references/resume-packet-template.md +7 -0
- package/src/skills/idea/SKILL.md +228 -15
- package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
- package/src/skills/idea/references/current-board-packet-template.md +61 -0
- package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
- package/src/skills/idea/references/idea-generation-playbook.md +21 -0
- package/src/skills/idea/references/idea-thinking-flow.md +6 -0
- package/src/skills/idea/references/literature-survey-template.md +3 -0
- package/src/skills/idea/references/objective-contract-template.md +54 -0
- package/src/skills/idea/references/outline-seeding-example.md +56 -0
- package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
- package/src/skills/idea/references/related-work-playbook.md +75 -2
- package/src/skills/idea/references/research-history-playbook.md +114 -0
- package/src/skills/idea/references/selection-gate.md +58 -6
- package/src/skills/intake-audit/SKILL.md +43 -2
- package/src/skills/intake-audit/references/state-audit-template.md +10 -0
- package/src/skills/nature-data/SKILL.md +128 -0
- package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-data/agents/openai.yaml +4 -0
- package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
- package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
- package/src/skills/nature-data/references/policy-principles.md +103 -0
- package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
- package/src/skills/nature-data/references/source-basis.md +54 -0
- package/src/skills/nature-data/references/statement-patterns.md +153 -0
- package/src/skills/nature-figure/SKILL.md +197 -0
- package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-figure/agents/openai.yaml +4 -0
- package/src/skills/nature-figure/evals/evals.json +37 -0
- package/src/skills/nature-figure/references/api.md +428 -0
- package/src/skills/nature-figure/references/backend-selection.md +100 -0
- package/src/skills/nature-figure/references/chart-types.md +281 -0
- package/src/skills/nature-figure/references/common-patterns.md +349 -0
- package/src/skills/nature-figure/references/design-theory.md +436 -0
- package/src/skills/nature-figure/references/figure-contract.md +93 -0
- package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
- package/src/skills/nature-figure/references/qa-contract.md +119 -0
- package/src/skills/nature-figure/references/r-template-index.md +66 -0
- package/src/skills/nature-figure/references/r-workflow.md +161 -0
- package/src/skills/nature-figure/references/tutorials.md +250 -0
- package/src/skills/nature-paper2ppt/SKILL.md +507 -0
- package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/SKILL.md +385 -0
- package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-polishing/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
- package/src/skills/nature-polishing/references/section-moves.md +240 -0
- package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
- package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
- package/src/skills/optimize/SKILL.md +177 -1568
- package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
- package/src/skills/optimize/references/candidate-board-template.md +13 -0
- package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
- package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
- package/src/skills/optimize/references/debug-response-template.md +29 -0
- package/src/skills/optimize/references/frontier-review-template.md +32 -0
- package/src/skills/optimize/references/fusion-playbook.md +36 -0
- package/src/skills/optimize/references/method-brief-template.md +73 -0
- package/src/skills/optimize/references/operational-guidance.md +621 -0
- package/src/skills/optimize/references/optimization-memory-template.md +30 -0
- package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
- package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
- package/src/skills/optimize/references/prompt-patterns.md +49 -0
- package/src/skills/paper-outline/SKILL.md +227 -0
- package/src/skills/paper-outline/references/outline-patterns.md +87 -0
- package/src/skills/paper-plot/SKILL.md +79 -0
- package/src/skills/paper-plot/agents/openai.yaml +4 -0
- package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
- package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
- package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
- package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
- package/src/skills/paper-plot/references/line_training_curve.md +44 -0
- package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
- package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
- package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
- package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
- package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
- package/src/skills/paper-plot/scripts/line_aime.py +94 -0
- package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
- package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
- package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
- package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
- package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
- package/src/skills/rebuttal/SKILL.md +9 -0
- package/src/skills/references/tool-usage-by-stage.md +438 -0
- package/src/skills/review/SKILL.md +105 -7
- package/src/skills/science/PROVENANCE.md +44 -0
- package/src/skills/science/SKILL.md +137 -0
- package/src/skills/science/references/artifact-science-tool.md +110 -0
- package/src/skills/science/references/claim-type-discipline.md +56 -0
- package/src/skills/science/references/domain-index.md +422 -0
- package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
- package/src/skills/science/references/package-check-playbook.md +64 -0
- package/src/skills/science/references/package-index.min.json +3616 -0
- package/src/skills/science/references/packages/abinit.md +80 -0
- package/src/skills/science/references/packages/acts.md +73 -0
- package/src/skills/science/references/packages/aiida-core.md +80 -0
- package/src/skills/science/references/packages/alamode.md +80 -0
- package/src/skills/science/references/packages/amuse.md +88 -0
- package/src/skills/science/references/packages/anndata.md +88 -0
- package/src/skills/science/references/packages/arbor.md +80 -0
- package/src/skills/science/references/packages/arc.md +73 -0
- package/src/skills/science/references/packages/astropy.md +88 -0
- package/src/skills/science/references/packages/astroquery.md +88 -0
- package/src/skills/science/references/packages/atomate2.md +80 -0
- package/src/skills/science/references/packages/atomsmltr.md +73 -0
- package/src/skills/science/references/packages/awkward.md +73 -0
- package/src/skills/science/references/packages/batman.md +88 -0
- package/src/skills/science/references/packages/biopython.md +88 -0
- package/src/skills/science/references/packages/bloqade.md +73 -0
- package/src/skills/science/references/packages/brian2.md +73 -0
- package/src/skills/science/references/packages/bullet3.md +73 -0
- package/src/skills/science/references/packages/calculix.md +80 -0
- package/src/skills/science/references/packages/cantera.md +73 -0
- package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
- package/src/skills/science/references/packages/ccdproc.md +88 -0
- package/src/skills/science/references/packages/celerite2.md +88 -0
- package/src/skills/science/references/packages/cellrank.md +73 -0
- package/src/skills/science/references/packages/cesm.md +80 -0
- package/src/skills/science/references/packages/chemicals.md +73 -0
- package/src/skills/science/references/packages/chempy.md +73 -0
- package/src/skills/science/references/packages/cirq.md +73 -0
- package/src/skills/science/references/packages/coffea.md +73 -0
- package/src/skills/science/references/packages/cp2k.md +88 -0
- package/src/skills/science/references/packages/custodian.md +80 -0
- package/src/skills/science/references/packages/dart.md +73 -0
- package/src/skills/science/references/packages/datamol.md +88 -0
- package/src/skills/science/references/packages/dd4hep.md +73 -0
- package/src/skills/science/references/packages/dealii.md +80 -0
- package/src/skills/science/references/packages/deepchem.md +88 -0
- package/src/skills/science/references/packages/delphes.md +73 -0
- package/src/skills/science/references/packages/devito.md +80 -0
- package/src/skills/science/references/packages/dftb.md +88 -0
- package/src/skills/science/references/packages/dftd4.md +88 -0
- package/src/skills/science/references/packages/dftk-jl.md +80 -0
- package/src/skills/science/references/packages/dolfinx.md +80 -0
- package/src/skills/science/references/packages/drake.md +73 -0
- package/src/skills/science/references/packages/dumux.md +73 -0
- package/src/skills/science/references/packages/elk.md +80 -0
- package/src/skills/science/references/packages/elmerfem.md +80 -0
- package/src/skills/science/references/packages/enzo-e.md +88 -0
- package/src/skills/science/references/packages/espresso.md +80 -0
- package/src/skills/science/references/packages/exoplanet.md +88 -0
- package/src/skills/science/references/packages/fairroot.md +73 -0
- package/src/skills/science/references/packages/fbpic.md +80 -0
- package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
- package/src/skills/science/references/packages/geant4.md +73 -0
- package/src/skills/science/references/packages/geosx.md +80 -0
- package/src/skills/science/references/packages/gprmax.md +80 -0
- package/src/skills/science/references/packages/gromacs.md +80 -0
- package/src/skills/science/references/packages/gwaslab.md +73 -0
- package/src/skills/science/references/packages/gz-sim.md +73 -0
- package/src/skills/science/references/packages/hail.md +88 -0
- package/src/skills/science/references/packages/hiphive.md +80 -0
- package/src/skills/science/references/packages/hoomd-blue.md +80 -0
- package/src/skills/science/references/packages/itensor.md +73 -0
- package/src/skills/science/references/packages/itensors-jl.md +73 -0
- package/src/skills/science/references/packages/jdftx.md +73 -0
- package/src/skills/science/references/packages/jobflow.md +80 -0
- package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
- package/src/skills/science/references/packages/kite.md +80 -0
- package/src/skills/science/references/packages/kratos.md +80 -0
- package/src/skills/science/references/packages/kwant.md +73 -0
- package/src/skills/science/references/packages/lammps.md +80 -0
- package/src/skills/science/references/packages/lightkurve.md +88 -0
- package/src/skills/science/references/packages/limix.md +73 -0
- package/src/skills/science/references/packages/maxwelllink.md +80 -0
- package/src/skills/science/references/packages/mcdc.md +73 -0
- package/src/skills/science/references/packages/meep.md +80 -0
- package/src/skills/science/references/packages/mfem.md +80 -0
- package/src/skills/science/references/packages/mitgcm.md +73 -0
- package/src/skills/science/references/packages/modflow6.md +73 -0
- package/src/skills/science/references/packages/molecool.md +73 -0
- package/src/skills/science/references/packages/mom6.md +73 -0
- package/src/skills/science/references/packages/moose.md +80 -0
- package/src/skills/science/references/packages/mpas-model.md +73 -0
- package/src/skills/science/references/packages/mujoco.md +73 -0
- package/src/skills/science/references/packages/mumax3.md +73 -0
- package/src/skills/science/references/packages/nekrs.md +80 -0
- package/src/skills/science/references/packages/nessi.md +73 -0
- package/src/skills/science/references/packages/nest-simulator.md +73 -0
- package/src/skills/science/references/packages/netket.md +73 -0
- package/src/skills/science/references/packages/neuron.md +73 -0
- package/src/skills/science/references/packages/nextflow.md +88 -0
- package/src/skills/science/references/packages/nwchem.md +88 -0
- package/src/skills/science/references/packages/openbabel.md +88 -0
- package/src/skills/science/references/packages/openems.md +80 -0
- package/src/skills/science/references/packages/openff-toolkit.md +88 -0
- package/src/skills/science/references/packages/openfoam-dev.md +80 -0
- package/src/skills/science/references/packages/openmc.md +73 -0
- package/src/skills/science/references/packages/openmm.md +80 -0
- package/src/skills/science/references/packages/openmoc.md +73 -0
- package/src/skills/science/references/packages/openmx.md +80 -0
- package/src/skills/science/references/packages/opensees.md +80 -0
- package/src/skills/science/references/packages/opensn.md +80 -0
- package/src/skills/science/references/packages/opm-simulators.md +73 -0
- package/src/skills/science/references/packages/oqupy.md +73 -0
- package/src/skills/science/references/packages/packmol.md +80 -0
- package/src/skills/science/references/packages/palabos.md +80 -0
- package/src/skills/science/references/packages/parflow.md +80 -0
- package/src/skills/science/references/packages/pennylane.md +88 -0
- package/src/skills/science/references/packages/perceval.md +73 -0
- package/src/skills/science/references/packages/phono3py.md +73 -0
- package/src/skills/science/references/packages/phonopy.md +73 -0
- package/src/skills/science/references/packages/photutils.md +88 -0
- package/src/skills/science/references/packages/picongpu.md +80 -0
- package/src/skills/science/references/packages/plink-ng.md +88 -0
- package/src/skills/science/references/packages/precice.md +73 -0
- package/src/skills/science/references/packages/psc.md +80 -0
- package/src/skills/science/references/packages/psi4.md +88 -0
- package/src/skills/science/references/packages/pybinding.md +73 -0
- package/src/skills/science/references/packages/pyfr.md +80 -0
- package/src/skills/science/references/packages/pyhf.md +73 -0
- package/src/skills/science/references/packages/pyiron_base.md +80 -0
- package/src/skills/science/references/packages/pylcp.md +73 -0
- package/src/skills/science/references/packages/pylith.md +80 -0
- package/src/skills/science/references/packages/pynbody.md +88 -0
- package/src/skills/science/references/packages/pysam.md +88 -0
- package/src/skills/science/references/packages/pyscf.md +88 -0
- package/src/skills/science/references/packages/q-e.md +73 -0
- package/src/skills/science/references/packages/qibo.md +73 -0
- package/src/skills/science/references/packages/qiskit.md +73 -0
- package/src/skills/science/references/packages/quantica-jl.md +73 -0
- package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
- package/src/skills/science/references/packages/quimb.md +73 -0
- package/src/skills/science/references/packages/qulacs.md +73 -0
- package/src/skills/science/references/packages/qutip.md +73 -0
- package/src/skills/science/references/packages/rdkit.md +88 -0
- package/src/skills/science/references/packages/rmg-py.md +73 -0
- package/src/skills/science/references/packages/root.md +73 -0
- package/src/skills/science/references/packages/scanpy.md +88 -0
- package/src/skills/science/references/packages/scikit-allel.md +88 -0
- package/src/skills/science/references/packages/scikit-bio.md +88 -0
- package/src/skills/science/references/packages/scqubits.md +73 -0
- package/src/skills/science/references/packages/scuff-em.md +80 -0
- package/src/skills/science/references/packages/scvi-tools.md +73 -0
- package/src/skills/science/references/packages/seissol.md +73 -0
- package/src/skills/science/references/packages/sfepy.md +80 -0
- package/src/skills/science/references/packages/sisl.md +73 -0
- package/src/skills/science/references/packages/smilei.md +80 -0
- package/src/skills/science/references/packages/snakemake.md +88 -0
- package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
- package/src/skills/science/references/packages/specutils.md +88 -0
- package/src/skills/science/references/packages/spglib.md +80 -0
- package/src/skills/science/references/packages/squidpy.md +88 -0
- package/src/skills/science/references/packages/starry.md +88 -0
- package/src/skills/science/references/packages/strawberryfields.md +73 -0
- package/src/skills/science/references/packages/su2.md +80 -0
- package/src/skills/science/references/packages/sunny-jl.md +73 -0
- package/src/skills/science/references/packages/sw4.md +73 -0
- package/src/skills/science/references/packages/swift.md +88 -0
- package/src/skills/science/references/packages/tdnegf.md +73 -0
- package/src/skills/science/references/packages/tenpy.md +73 -0
- package/src/skills/science/references/packages/thermo.md +73 -0
- package/src/skills/science/references/packages/tkwant.md +73 -0
- package/src/skills/science/references/packages/tvb-root.md +73 -0
- package/src/skills/science/references/packages/uproot5.md +73 -0
- package/src/skills/science/references/packages/vampire.md +80 -0
- package/src/skills/science/references/packages/wannier_tools.md +73 -0
- package/src/skills/science/references/packages/warpx.md +80 -0
- package/src/skills/science/references/packages/wrf.md +73 -0
- package/src/skills/science/references/packages/xtb.md +88 -0
- package/src/skills/science/references/packages/yt.md +73 -0
- package/src/skills/science/references/science-task-brief-template.md +71 -0
- package/src/skills/scout/SKILL.md +83 -425
- package/src/skills/scout/references/literature-scout-template.md +5 -24
- package/src/skills/scout/references/operational-guidance.md +191 -0
- package/src/skills/scout/references/paper-triage-playbook.md +11 -35
- package/src/skills/write/SKILL.md +744 -1246
- package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
- package/src/skills/write/references/oral_package_patterns.md +252 -0
- package/src/skills/write/references/oral_writing_principles.md +291 -0
- package/src/skills/write/references/section_rewrite_checklist.md +234 -0
- package/src/tui/dist/app/AppContainer.js +1314 -27
- package/src/tui/dist/components/Composer.js +26 -1
- package/src/tui/dist/components/ConfigScreen.js +2 -1
- package/src/tui/dist/components/InputPrompt.js +25 -9
- package/src/tui/dist/components/MainContent.js +18 -3
- package/src/tui/dist/components/QuestScreen.js +3 -2
- package/src/tui/dist/components/UtilityScreen.js +37 -0
- package/src/tui/dist/hooks/useSafeInput.js +10 -0
- package/src/tui/dist/index.js +13 -1
- package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
- package/src/tui/dist/lib/api.js +89 -1
- package/src/tui/package.json +1 -1
- package/src/ui/dist/assets/{AnalysisPlugin-BCKAfjba.js → AnalysisPlugin-CA94NGmI.js} +1 -1
- package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
- package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
- package/src/ui/dist/assets/{CodeViewerPlugin-CbaFRrUU.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
- package/src/ui/dist/assets/{DocViewerPlugin-DAjLVeQD.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
- package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
- package/src/ui/dist/assets/{GitDiffViewerPlugin-CQACjoAA.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
- package/src/ui/dist/assets/{GitSnapshotViewer-0r4nLPke.js → GitSnapshotViewer-CweA6VON.js} +2 -2
- package/src/ui/dist/assets/{ImageViewerPlugin-nBOmI2v_.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
- package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
- package/src/ui/dist/assets/{LatexPlugin-ZwtV8pIp.js → LatexPlugin-BQjAaA5J.js} +4 -4
- package/src/ui/dist/assets/{MarkdownViewerPlugin-DKqVfKyW.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
- package/src/ui/dist/assets/{MarketplacePlugin-BwxStZ9D.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
- package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
- package/src/ui/dist/assets/{NotebookEditor-DB9N_T9q.js → NotebookEditor-WFyd8Ybt.js} +3 -3
- package/src/ui/dist/assets/{PdfLoader-eWBONbQP.js → PdfLoader-CLE5u5TS.js} +3 -3
- package/src/ui/dist/assets/{PdfMarkdownPlugin-D22YOZL3.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
- package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
- package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
- package/src/ui/dist/assets/{TextViewerPlugin-C5xqeeUH.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
- package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
- package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
- package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
- package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
- package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
- package/src/ui/dist/assets/{code-WlFHE7z_.js → code-DbsmSd3Y.js} +1 -1
- package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
- package/src/ui/dist/assets/{wrap-text-BC-Hltpd.js → file-jump-queue-DeQBikaw.js} +3 -3
- package/src/ui/dist/assets/{file-socket-CfQPKQKj.js → file-socket-DA5XIx88.js} +1 -1
- package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
- package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
- package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
- package/src/ui/dist/assets/{index-CwNu1aH4.js → index-BsO46tJA.js} +1 -1
- package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
- package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
- package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
- package/src/ui/dist/assets/{project-sync-C9IdzdZW.js → project-sync-DPmWKmKD.js} +1 -1
- package/src/ui/dist/assets/{zoom-out-E_gaeAxL.js → zoom-out-DAukFWen.js} +3 -3
- package/src/ui/dist/index.html +3 -3
- package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
- package/src/skills/baseline/references/memory-playbook.md +0 -40
- package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
- package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
- package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
- package/src/skills/write/references/paper-section-playbook.md +0 -64
- package/src/skills/write/references/reviewer-first-writing.md +0 -64
- package/src/skills/write/references/revision-checklist.md +0 -70
- package/src/skills/write/references/section-contracts.md +0 -82
- package/src/skills/write/references/sentence-level-proofing.md +0 -49
- package/src/ui/dist/assets/AiManusChatView-Bv-Z8YpU.js +0 -204
- package/src/ui/dist/assets/CliPlugin-BCKcpc35.js +0 -109
- package/src/ui/dist/assets/CodeEditorPlugin-DbOfSJ8K.js +0 -2
- package/src/ui/dist/assets/GitCommitViewerPlugin-CIUqbUDO.js +0 -1
- package/src/ui/dist/assets/LabCopilotPanel-BHxOxF4z.js +0 -14
- package/src/ui/dist/assets/LabPlugin-BKoZGs95.js +0 -22
- package/src/ui/dist/assets/NotebookEditor-BEQhaQbt.js +0 -81
- package/src/ui/dist/assets/PdfViewerPlugin-c-RK9DLM.js +0 -17
- package/src/ui/dist/assets/SearchPlugin-CxF9ytAx.js +0 -16
- package/src/ui/dist/assets/VNCViewer-BoLGLnHz.js +0 -11
- package/src/ui/dist/assets/bot-DREQOxzP.js +0 -6
- package/src/ui/dist/assets/chevron-up-C9Qpx4DE.js +0 -6
- package/src/ui/dist/assets/file-content-BZMz3RYp.js +0 -1
- package/src/ui/dist/assets/file-diff-panel-CQhw0jS2.js +0 -1
- package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
- package/src/ui/dist/assets/git-commit-horizontal-DxZ8DCZh.js +0 -6
- package/src/ui/dist/assets/image-Bgl4VIyx.js +0 -6
- package/src/ui/dist/assets/index-BpV6lusQ.css +0 -33
- package/src/ui/dist/assets/index-CBNVuWcP.js +0 -2496
- package/src/ui/dist/assets/index-DrUnlf6K.js +0 -1
- package/src/ui/dist/assets/index-NW-h8VzN.js +0 -1
- package/src/ui/dist/assets/pdf-effect-queue-J8OnM0jE.js +0 -6
- package/src/ui/dist/assets/popover-CLc0pPP8.js +0 -1
- package/src/ui/dist/assets/select-Cs2PmzwL.js +0 -11
- package/src/ui/dist/assets/sigma-ClKcHAXm.js +0 -6
- package/src/ui/dist/assets/trash-DwpbFr3w.js +0 -11
- package/src/ui/dist/assets/useCliAccess-NQ8m0Let.js +0 -1
- package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
|
@@ -0,0 +1,156 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.047_timepfn
|
|
3
|
+
name: TimePFN
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: PFN-style multivariate time-series forecasting benchmark with synthetic
|
|
6
|
+
pretraining and schedule-sensitive fine-tuning.
|
|
7
|
+
task_description: 'This packaged benchmark covers the full TimePFN workflow: synthetic
|
|
8
|
+
multivariate time-series data generation via Gaussian process kernel composition
|
|
9
|
+
and the linear coregionalization method (LMC-Synth), transformer pretraining on
|
|
10
|
+
those synthetic datasets, and fine-tuning plus evaluation on standard downstream
|
|
11
|
+
forecasting benchmarks (e.g. ETT, Weather, Exchange). The task is to transfer PFN-style
|
|
12
|
+
in-context Bayesian generalisation into practical zero-shot and few-shot forecasting
|
|
13
|
+
quality on public benchmark datasets. Primary metrics are MSE and MAE, both code-backed
|
|
14
|
+
through run.py and utils/metrics.py. No trusted execution output exists yet; runtime
|
|
15
|
+
execution is required before metric values can be considered verified.
|
|
16
|
+
|
|
17
|
+
'
|
|
18
|
+
task_mode: experiment_driven
|
|
19
|
+
requires_execution: true
|
|
20
|
+
requires_paper: true
|
|
21
|
+
integrity_level: cas_plus_canary
|
|
22
|
+
snapshot_status: runnable
|
|
23
|
+
support_level: advanced
|
|
24
|
+
time_band: 6-24h
|
|
25
|
+
cost_band: medium
|
|
26
|
+
difficulty: hard
|
|
27
|
+
data_access: public
|
|
28
|
+
primary_outputs:
|
|
29
|
+
- mse
|
|
30
|
+
- mae
|
|
31
|
+
- pfn_checkpoint
|
|
32
|
+
launch_profiles:
|
|
33
|
+
- id: quick_eval
|
|
34
|
+
label: Quick Eval
|
|
35
|
+
description: 'Run one downstream TimePFN forecasting evaluation route using the
|
|
36
|
+
provided model checkpoint and test scripts under pfn_scripts/test/. No pretraining
|
|
37
|
+
required.
|
|
38
|
+
|
|
39
|
+
'
|
|
40
|
+
- id: pretrain_and_eval
|
|
41
|
+
label: Pretrain + Eval
|
|
42
|
+
description: 'Run the full packaged workflow: generate synthetic MTS data via LMC-Synth,
|
|
43
|
+
pretrain the TimePFN transformer on synthetic data, fine-tune on a downstream
|
|
44
|
+
benchmark dataset, then evaluate MSE and MAE.
|
|
45
|
+
|
|
46
|
+
'
|
|
47
|
+
dataset_download:
|
|
48
|
+
primary_method: mixed
|
|
49
|
+
sources:
|
|
50
|
+
- label: Downstream benchmark datasets (ETT, Weather, Exchange, etc.)
|
|
51
|
+
url: https://drive.google.com/file/d/1l51QsKvQPcqILT3DwfjCgx8Dsg2rpjot/view?usp=sharing
|
|
52
|
+
format: zip
|
|
53
|
+
local_path: ./datasets
|
|
54
|
+
notes: Provided via iTransformer's datasets.zip Google Drive link. Download and
|
|
55
|
+
unzip into ./datasets before running evaluation scripts.
|
|
56
|
+
- label: Synthetic pretraining data
|
|
57
|
+
url: null
|
|
58
|
+
format: generated
|
|
59
|
+
local_path: ./synthetic_data_generation
|
|
60
|
+
notes: Generated locally via LMC-Synth.py and kernel-synth.py. Read bash script
|
|
61
|
+
comments and directives before running.
|
|
62
|
+
- label: Pretrained model checkpoint
|
|
63
|
+
url: https://deepscientist.cc/AISB/047_timepfn
|
|
64
|
+
format: zip
|
|
65
|
+
local_path: paper-47-TimePFN
|
|
66
|
+
notes: Official AISB archive download. Contains checkpoint, training, fine-tuning,
|
|
67
|
+
and testing scripts under pfn_scripts/.
|
|
68
|
+
notes:
|
|
69
|
+
- Downstream benchmark datasets must be placed under ./datasets before any evaluation
|
|
70
|
+
script is invoked.
|
|
71
|
+
- Synthetic data generation is optional if using the provided pretrained checkpoint
|
|
72
|
+
for quick_eval.
|
|
73
|
+
credential_requirements:
|
|
74
|
+
mode: none
|
|
75
|
+
items: []
|
|
76
|
+
notes:
|
|
77
|
+
- Google Drive download for datasets.zip does not require authentication but may
|
|
78
|
+
require manual download if automated fetch is rate-limited.
|
|
79
|
+
resources:
|
|
80
|
+
minimum:
|
|
81
|
+
cpu_cores: 8
|
|
82
|
+
ram_gb: 32
|
|
83
|
+
disk_gb: 100
|
|
84
|
+
gpu_count: 1
|
|
85
|
+
gpu_vram_gb: 16
|
|
86
|
+
recommended:
|
|
87
|
+
cpu_cores: 16
|
|
88
|
+
ram_gb: 64
|
|
89
|
+
disk_gb: 200
|
|
90
|
+
gpu_count: 1
|
|
91
|
+
gpu_vram_gb: 24
|
|
92
|
+
environment:
|
|
93
|
+
python: '3.10'
|
|
94
|
+
cuda: null
|
|
95
|
+
pytorch: 2.2.1
|
|
96
|
+
flash_attn: null
|
|
97
|
+
key_packages:
|
|
98
|
+
- transformers==4.41.1
|
|
99
|
+
- pynvml
|
|
100
|
+
- numpy
|
|
101
|
+
notes:
|
|
102
|
+
- Full dependency list is in requirements.txt. Use a conda virtual environment as
|
|
103
|
+
recommended by the README.
|
|
104
|
+
- run.py uses pynvml for GPU memory polling; pynvml must be installed and NVML must
|
|
105
|
+
be accessible.
|
|
106
|
+
- CUDA version not pinned in source; verify compatibility with PyTorch 2.2.1 and
|
|
107
|
+
your driver.
|
|
108
|
+
risk_flags:
|
|
109
|
+
- dataset_manual_download
|
|
110
|
+
- no_trusted_execution_output
|
|
111
|
+
risk_notes:
|
|
112
|
+
- Downstream benchmark datasets require a manual Google Drive download step; automated
|
|
113
|
+
pipelines may need a workaround.
|
|
114
|
+
- No benchmark execution was performed during the packaging pass. Metric values in
|
|
115
|
+
metric_contract.json are provisional until runtime execution confirms them.
|
|
116
|
+
- Synthetic data generation volume (millions of samples) can be time- and disk-intensive;
|
|
117
|
+
read bash script directives carefully before launching.
|
|
118
|
+
recommended_when: 'Use this benchmark when evaluating foundation-model-style multivariate
|
|
119
|
+
time-series forecasting with synthetic pretraining, or when studying zero-shot and
|
|
120
|
+
few-shot generalisation on standard public forecasting benchmarks (ETT, Weather,
|
|
121
|
+
Exchange). Also appropriate when comparing against PFN-based or Chronos-style forecasting
|
|
122
|
+
baselines.
|
|
123
|
+
|
|
124
|
+
'
|
|
125
|
+
not_recommended_when: 'Do not use this benchmark if you need a simple or trivial forecasting
|
|
126
|
+
baseline, if GPU training is unavailable, if automated dataset download is a hard
|
|
127
|
+
requirement, or if you need verified execution outputs before trusting metric values
|
|
128
|
+
(runtime execution must be completed first).
|
|
129
|
+
|
|
130
|
+
'
|
|
131
|
+
paper:
|
|
132
|
+
title: 'TimePFN: Effective Multivariate Time Series Forecasting with Synthetic Data'
|
|
133
|
+
venue: AAAI 2025
|
|
134
|
+
year: 2025
|
|
135
|
+
url: https://arxiv.org/abs/2502.16294
|
|
136
|
+
authors:
|
|
137
|
+
- Ege Onur Taga
|
|
138
|
+
- M. Emrullah Ildiz
|
|
139
|
+
- Samet Oymak
|
|
140
|
+
affiliation: University of Michigan, Ann Arbor
|
|
141
|
+
citation_key: taga2025timepfn
|
|
142
|
+
download:
|
|
143
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.047_timepfn.zip
|
|
144
|
+
archive_type: zip
|
|
145
|
+
local_dir_name: paper-47-TimePFN
|
|
146
|
+
provider: github_release
|
|
147
|
+
repo: ResearAI/DeepScientist
|
|
148
|
+
tag: aisb-v0.0.1
|
|
149
|
+
asset_name: aisb.t3.047_timepfn.zip
|
|
150
|
+
sha256: b295b1371d836aeeec199601aa42427fcd6cbbf1f73349b5ebdbfd3a5977ab18
|
|
151
|
+
size_bytes: 73341
|
|
152
|
+
display:
|
|
153
|
+
palette_seed: jade-navy-pfn
|
|
154
|
+
art_style: foundation-signal
|
|
155
|
+
accent_priority: high
|
|
156
|
+
image_path: ../image/047_aisb.t3.047_timepfn.jpg
|
|
@@ -0,0 +1,124 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.047_timepfn
|
|
3
|
+
name: TimePFN
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 基于PFN风格的多变量时间序列预测基准,采用合成数据预训练和调度敏感的微调策略。
|
|
6
|
+
task_description: '该打包基准测试涵盖完整的TimePFN工作流程:通过高斯过程核组合和线性协同区域化方法(LMC-Synth)生成合成多变量时间序列数据,在合成数据集上进行Transformer预训练,并在标准下游预测基准(如ETT、Weather、Exchange)上进行微调和评估。任务是将PFN风格的上下文贝叶斯泛化能力迁移到公共基准数据集上的实际零样本和少样本预测质量。主要指标为MSE和MAE,均通过run.py和utils/metrics.py提供代码支持。目前尚无可信执行输出;需要运行时执行后才能将指标值视为已验证。
|
|
7
|
+
|
|
8
|
+
'
|
|
9
|
+
task_mode: experiment_driven
|
|
10
|
+
requires_execution: true
|
|
11
|
+
requires_paper: true
|
|
12
|
+
integrity_level: cas_plus_canary
|
|
13
|
+
snapshot_status: runnable
|
|
14
|
+
support_level: advanced
|
|
15
|
+
time_band: 6-24h
|
|
16
|
+
cost_band: medium
|
|
17
|
+
difficulty: hard
|
|
18
|
+
data_access: public
|
|
19
|
+
primary_outputs:
|
|
20
|
+
- mse
|
|
21
|
+
- mae
|
|
22
|
+
- pfn_checkpoint
|
|
23
|
+
launch_profiles:
|
|
24
|
+
- id: quick_eval
|
|
25
|
+
label: 快速评估
|
|
26
|
+
description: '使用提供的模型检查点和pfn_scripts/test/下的测试脚本运行一个下游TimePFN预测评估流程。无需预训练。
|
|
27
|
+
|
|
28
|
+
'
|
|
29
|
+
- id: pretrain_and_eval
|
|
30
|
+
label: 预训练 + 评估
|
|
31
|
+
description: '运行完整的打包工作流程:通过LMC-Synth生成合成MTS数据,在合成数据上预训练TimePFN transformer,在下游基准数据集上微调,然后评估MSE和MAE。
|
|
32
|
+
|
|
33
|
+
'
|
|
34
|
+
dataset_download:
|
|
35
|
+
primary_method: mixed
|
|
36
|
+
sources:
|
|
37
|
+
- label: 下游基准数据集(ETT、Weather、Exchange等)
|
|
38
|
+
url: https://drive.google.com/file/d/1l51QsKvQPcqILT3DwfjCgx8Dsg2rpjot/view?usp=sharing
|
|
39
|
+
format: zip
|
|
40
|
+
local_path: ./datasets
|
|
41
|
+
notes: 通过iTransformer的datasets.zip Google Drive链接提供。在运行评估脚本前下载并解压到./datasets目录。
|
|
42
|
+
- label: 合成预训练数据
|
|
43
|
+
url: null
|
|
44
|
+
format: generated
|
|
45
|
+
local_path: ./synthetic_data_generation
|
|
46
|
+
notes: 通过LMC-Synth.py和kernel-synth.py本地生成。运行前请阅读bash脚本中的注释和指令。
|
|
47
|
+
- label: 预训练模型检查点
|
|
48
|
+
url: https://deepscientist.cc/AISB/047_timepfn
|
|
49
|
+
format: zip
|
|
50
|
+
local_path: paper-47-TimePFN
|
|
51
|
+
notes: 官方AISB归档下载。包含检查点、训练、微调和pfn_scripts/下的测试脚本。
|
|
52
|
+
notes:
|
|
53
|
+
- 在调用任何评估脚本前,必须将下游基准数据集放置在./datasets目录下。
|
|
54
|
+
- 如果使用提供的预训练检查点进行快速评估,合成数据生成是可选的。
|
|
55
|
+
credential_requirements:
|
|
56
|
+
mode: none
|
|
57
|
+
items: []
|
|
58
|
+
notes:
|
|
59
|
+
- 用于datasets.zip的Google Drive下载不需要身份验证,但如果自动获取受限,可能需要手动下载。
|
|
60
|
+
resources:
|
|
61
|
+
minimum:
|
|
62
|
+
cpu_cores: 8
|
|
63
|
+
ram_gb: 32
|
|
64
|
+
disk_gb: 100
|
|
65
|
+
gpu_count: 1
|
|
66
|
+
gpu_vram_gb: 16
|
|
67
|
+
recommended:
|
|
68
|
+
cpu_cores: 16
|
|
69
|
+
ram_gb: 64
|
|
70
|
+
disk_gb: 200
|
|
71
|
+
gpu_count: 1
|
|
72
|
+
gpu_vram_gb: 24
|
|
73
|
+
environment:
|
|
74
|
+
python: '3.10'
|
|
75
|
+
cuda: null
|
|
76
|
+
pytorch: 2.2.1
|
|
77
|
+
flash_attn: null
|
|
78
|
+
key_packages:
|
|
79
|
+
- transformers==4.41.1
|
|
80
|
+
- pynvml
|
|
81
|
+
- numpy
|
|
82
|
+
notes:
|
|
83
|
+
- 完整的依赖列表在requirements.txt中。建议按照README中的建议使用conda虚拟环境。
|
|
84
|
+
- run.py使用pynvml进行GPU内存轮询;必须安装pynvml且NVML必须可访问。
|
|
85
|
+
- 源代码中未固定CUDA版本;请验证其与PyTorch 2.2.1及您的驱动的兼容性。
|
|
86
|
+
risk_flags:
|
|
87
|
+
- dataset_manual_download
|
|
88
|
+
- no_trusted_execution_output
|
|
89
|
+
risk_notes:
|
|
90
|
+
- 下游基准数据集需要手动从Google Drive下载;自动化流程可能需要变通方案。
|
|
91
|
+
- 打包过程中未执行基准测试。metric_contract.json中的指标值为临时值,需待运行时执行确认。
|
|
92
|
+
- 合成数据生成量(百万级样本)可能耗时且占用大量磁盘空间;启动前请仔细阅读bash脚本指令。
|
|
93
|
+
recommended_when: '在评估基于合成数据预训练的基础模型风格多变量时间序列预测时使用此基准,或在标准公共预测基准(ETT、Weather、Exchange)上研究零样本和少样本泛化时使用此基准。在与基于PFN或Chronos风格的预测基线进行比较时也适用。
|
|
94
|
+
|
|
95
|
+
'
|
|
96
|
+
not_recommended_when: '如果需要简单或基础的时间序列预测基线、如果GPU训练不可用、如果自动化数据集下载是硬性要求、或者在信任指标值之前需要已验证的执行输出(必须先完成运行时执行),请勿使用此基准。
|
|
97
|
+
|
|
98
|
+
'
|
|
99
|
+
paper:
|
|
100
|
+
title: 'TimePFN: Effective Multivariate Time Series Forecasting with Synthetic Data'
|
|
101
|
+
venue: AAAI 2025
|
|
102
|
+
year: 2025
|
|
103
|
+
url: https://arxiv.org/abs/2502.16294
|
|
104
|
+
authors:
|
|
105
|
+
- Ege Onur Taga
|
|
106
|
+
- M. Emrullah Ildiz
|
|
107
|
+
- Samet Oymak
|
|
108
|
+
affiliation: University of Michigan, Ann Arbor
|
|
109
|
+
citation_key: taga2025timepfn
|
|
110
|
+
download:
|
|
111
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.047_timepfn.zip
|
|
112
|
+
archive_type: zip
|
|
113
|
+
local_dir_name: paper-47-TimePFN
|
|
114
|
+
provider: github_release
|
|
115
|
+
repo: ResearAI/DeepScientist
|
|
116
|
+
tag: aisb-v0.0.1
|
|
117
|
+
asset_name: aisb.t3.047_timepfn.zip
|
|
118
|
+
sha256: b295b1371d836aeeec199601aa42427fcd6cbbf1f73349b5ebdbfd3a5977ab18
|
|
119
|
+
size_bytes: 73341
|
|
120
|
+
display:
|
|
121
|
+
palette_seed: jade-navy-pfn
|
|
122
|
+
art_style: foundation-signal
|
|
123
|
+
accent_priority: high
|
|
124
|
+
image_path: ../image/047_aisb.t3.047_timepfn.jpg
|
|
@@ -0,0 +1,148 @@
|
|
|
1
|
+
id: aisb.t3.048_proxyspex
|
|
2
|
+
name: 'Proxy-SPEX: Sample-Efficient Interpretability via Sparse Feature Interactions
|
|
3
|
+
in LLMs'
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: Shapley-style sparse feature-interaction approximations for identifying
|
|
6
|
+
compact, meaningful interaction structure in LLM predictions.
|
|
7
|
+
task_description: 'This packaged benchmark covers sparse feature-interaction explanations
|
|
8
|
+
for language models using Shapley-style approximation via the ProxySPEX (Proxy SParse
|
|
9
|
+
EXplainer) method exposed within the shapiq Python package. The task evaluates the
|
|
10
|
+
quality of interaction discovery using budget-limited game evaluations to identify
|
|
11
|
+
compact, meaningful interaction structure behind model behavior. The shapiq package
|
|
12
|
+
extends Shapley value methodology beyond feature attributions to any-order Shapley
|
|
13
|
+
interactions, providing state-of-the-art approximation algorithms and a benchmarking
|
|
14
|
+
suite with pre-computed games and ground-truth values across 10+ application domains.
|
|
15
|
+
|
|
16
|
+
'
|
|
17
|
+
task_mode: evaluation_driven
|
|
18
|
+
requires_execution: true
|
|
19
|
+
requires_paper: true
|
|
20
|
+
integrity_level: cas_plus_canary
|
|
21
|
+
snapshot_status: runnable
|
|
22
|
+
support_level: turnkey
|
|
23
|
+
time_band: 2-6h
|
|
24
|
+
cost_band: medium
|
|
25
|
+
difficulty: medium
|
|
26
|
+
data_access: public
|
|
27
|
+
primary_outputs:
|
|
28
|
+
- precision_at_10
|
|
29
|
+
- precision_at_5
|
|
30
|
+
- feature_interaction_rankings
|
|
31
|
+
- mse
|
|
32
|
+
- mae
|
|
33
|
+
- explanation_report
|
|
34
|
+
launch_profiles:
|
|
35
|
+
- id: quick_eval
|
|
36
|
+
label: Quick Eval
|
|
37
|
+
description: 'Run the packaged sparse interaction explanation route on a single
|
|
38
|
+
target setup using the ProxySPEX approximator with StratifiedBySize sampling on
|
|
39
|
+
the SOUM (Sum Of Unanimity Models) synthetic game. Executes an ensemble of 10
|
|
40
|
+
runs per seed with budget=200 and k-SII index for primary evaluation.
|
|
41
|
+
|
|
42
|
+
'
|
|
43
|
+
- id: full_benchmark
|
|
44
|
+
label: Full Benchmark Suite
|
|
45
|
+
description: 'Run the complete shapiq benchmarking suite via eval_benchmark_results.py,
|
|
46
|
+
evaluating all approximator configurations across pre-computed games including
|
|
47
|
+
LocalExplanation, GlobalExplanation, FeatureSelection, DataValuation, DatasetValuation,
|
|
48
|
+
and EnsembleSelection domains.
|
|
49
|
+
|
|
50
|
+
'
|
|
51
|
+
dataset_download:
|
|
52
|
+
primary_method: archive
|
|
53
|
+
sources:
|
|
54
|
+
- url: https://deepscientist.cc/AISB/048_proxyspex
|
|
55
|
+
type: primary_archive
|
|
56
|
+
notes:
|
|
57
|
+
- 'Archive contains the broader shapiq package (local_dir_name: paper-48-Shapiq)'
|
|
58
|
+
- ProxySPEX is one method exposed within the shapiq package API
|
|
59
|
+
- Pre-computed game data and benchmark results included in data/precomputed_games/
|
|
60
|
+
- 'Additional datasets included: adult_census.csv, bike.csv, california_housing.csv'
|
|
61
|
+
credential_requirements:
|
|
62
|
+
mode: none
|
|
63
|
+
items: []
|
|
64
|
+
notes: []
|
|
65
|
+
resources:
|
|
66
|
+
minimum:
|
|
67
|
+
cpu_cores: 8
|
|
68
|
+
ram_gb: 32
|
|
69
|
+
disk_gb: 50
|
|
70
|
+
gpu_count: 0
|
|
71
|
+
gpu_vram_gb: 0
|
|
72
|
+
recommended:
|
|
73
|
+
cpu_cores: 16
|
|
74
|
+
ram_gb: 64
|
|
75
|
+
disk_gb: 100
|
|
76
|
+
gpu_count: 1
|
|
77
|
+
gpu_vram_gb: 24
|
|
78
|
+
environment:
|
|
79
|
+
python: '3.12'
|
|
80
|
+
cuda: null
|
|
81
|
+
pytorch: null
|
|
82
|
+
flash_attn: null
|
|
83
|
+
key_packages:
|
|
84
|
+
- shapiq
|
|
85
|
+
- numpy
|
|
86
|
+
- scipy
|
|
87
|
+
- pandas
|
|
88
|
+
- scikit-learn
|
|
89
|
+
- joblib
|
|
90
|
+
- tqdm
|
|
91
|
+
- sparse-transform
|
|
92
|
+
- galois
|
|
93
|
+
- matplotlib
|
|
94
|
+
- networkx
|
|
95
|
+
notes:
|
|
96
|
+
- CPU-only execution is fully supported for the minimum route
|
|
97
|
+
- GPU acceleration optional but not required; recommended for large-scale LLM explanations
|
|
98
|
+
- The shapiq package is the containing module; ProxySPEX is accessed via shapiq.ProxySPEX
|
|
99
|
+
or shapiq.explainer with approximator="proxyspex"
|
|
100
|
+
- See pyproject.toml and bundled requirements for full dependency specification
|
|
101
|
+
risk_flags: []
|
|
102
|
+
risk_notes:
|
|
103
|
+
- Metric values are code-backed but no benchmark execution was performed in this packaging
|
|
104
|
+
pass
|
|
105
|
+
- Runtime validation required before trusting quantitative outputs
|
|
106
|
+
recommended_when: 'Use this benchmark when you need interpretability tasks focused
|
|
107
|
+
on sparse interaction discovery in language models, want to evaluate approximation
|
|
108
|
+
quality against ground-truth Shapley interactions, or need a CPU-friendly explainability
|
|
109
|
+
evaluation framework with support for any-order interaction quantification.
|
|
110
|
+
|
|
111
|
+
'
|
|
112
|
+
not_recommended_when: 'Do not use this benchmark for pure text generation evaluation,
|
|
113
|
+
full model fine-tuning workflows, or when you require GPU-accelerated training.
|
|
114
|
+
Not suitable when you cannot support repeated explanation runs with varying budget
|
|
115
|
+
constraints.
|
|
116
|
+
|
|
117
|
+
'
|
|
118
|
+
paper:
|
|
119
|
+
title: 'Proxy-SPEX: Sample-Efficient Interpretability via Sparse Feature Interactions
|
|
120
|
+
in LLMs'
|
|
121
|
+
venue: NeurIPS 2025
|
|
122
|
+
year: 2025
|
|
123
|
+
url: https://openreview.net/forum?id=KI8qan2EA7
|
|
124
|
+
download:
|
|
125
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.048_proxyspex.zip
|
|
126
|
+
archive_type: zip
|
|
127
|
+
local_dir_name: paper-48-Shapiq
|
|
128
|
+
provider: github_release
|
|
129
|
+
repo: ResearAI/DeepScientist
|
|
130
|
+
tag: aisb-v0.0.1
|
|
131
|
+
asset_name: aisb.t3.048_proxyspex.zip
|
|
132
|
+
sha256: 3fea6e582a4001554d86ebcb7b95b55a4d537689f6279c561be43ba0e8302778
|
|
133
|
+
size_bytes: 135005330
|
|
134
|
+
display:
|
|
135
|
+
palette_seed: umber-cyan-interact
|
|
136
|
+
art_style: interaction-map
|
|
137
|
+
accent_priority: high
|
|
138
|
+
image_path: ../image/048_aisb.t3.048_proxyspex.jpg
|
|
139
|
+
capability_tags:
|
|
140
|
+
- research_code_optimization
|
|
141
|
+
- mechanistic_interpretability
|
|
142
|
+
- shapley_interactions
|
|
143
|
+
- large_language_models
|
|
144
|
+
- explanation_methods
|
|
145
|
+
aisb_direction: T3
|
|
146
|
+
track_fit:
|
|
147
|
+
- paper_track
|
|
148
|
+
- benchmark_track
|
|
@@ -0,0 +1,125 @@
|
|
|
1
|
+
id: aisb.t3.048_proxyspex
|
|
2
|
+
name: 'Proxy-SPEX: Sample-Efficient Interpretability via Sparse Feature Interactions
|
|
3
|
+
in LLMs'
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: >-
|
|
6
|
+
基于Shapley风格的稀疏特征交互近似方法,用于识别LLM预测中紧凑且有意义的交互结构。
|
|
7
|
+
task_description: >-
|
|
8
|
+
该打包基准测试涵盖使用ProxySPEX(Proxy SParse EXplainer)方法通过Shapley风格近似进行语言模型的稀疏特征交互解释。该任务通过预算限制的博弈评估来评估交互发现的质量,以识别模型行为背后紧凑且有意义的交互结构。shapiq包将Shapley值方法从特征归因扩展到任意阶Shapley交互,提供最先进的近似算法以及包含预计算博弈和真值的基准测试套件,涵盖10多个应用领域。
|
|
9
|
+
task_mode: evaluation_driven
|
|
10
|
+
requires_execution: true
|
|
11
|
+
requires_paper: true
|
|
12
|
+
integrity_level: cas_plus_canary
|
|
13
|
+
snapshot_status: runnable
|
|
14
|
+
support_level: turnkey
|
|
15
|
+
time_band: 2-6h
|
|
16
|
+
cost_band: medium
|
|
17
|
+
difficulty: medium
|
|
18
|
+
data_access: public
|
|
19
|
+
primary_outputs:
|
|
20
|
+
- precision_at_10
|
|
21
|
+
- precision_at_5
|
|
22
|
+
- feature_interaction_rankings
|
|
23
|
+
- mse
|
|
24
|
+
- mae
|
|
25
|
+
- explanation_report
|
|
26
|
+
launch_profiles:
|
|
27
|
+
- id: quick_eval
|
|
28
|
+
label: Quick Eval
|
|
29
|
+
label_zh: 快速评估
|
|
30
|
+
description: >-
|
|
31
|
+
使用ProxySPEX近似器在SOUM(Sum Of Unanimity Models,一致博弈模型之和)合成博弈上运行打包的稀疏交互解释流程,采用StratifiedBySize采样。针对主要评估使用budget=200和k-SII指数执行每个种子10次运行的集成。
|
|
32
|
+
- id: full_benchmark
|
|
33
|
+
label: Full Benchmark Suite
|
|
34
|
+
label_zh: 完整基准测试套件
|
|
35
|
+
description: >-
|
|
36
|
+
通过eval_benchmark_results.py运行完整的shapiq基准测试套件,评估所有近似器配置在预计算博弈上的表现,包括LocalExplanation、GlobalExplanation、FeatureSelection、DataValuation、DatasetValuation和EnsembleSelection领域。
|
|
37
|
+
dataset_download:
|
|
38
|
+
primary_method: archive
|
|
39
|
+
sources:
|
|
40
|
+
- url: https://deepscientist.cc/AISB/048_proxyspex
|
|
41
|
+
type: primary_archive
|
|
42
|
+
notes:
|
|
43
|
+
- '压缩包包含更广泛的shapiq包(local_dir_name: paper-48-Shapiq)'
|
|
44
|
+
- ProxySPEX是shapiq包API中暴露的一种方法
|
|
45
|
+
- 预计算的博弈数据和基准测试结果包含在data/precomputed_games/中
|
|
46
|
+
- 附加数据集包括:adult_census.csv、bike.csv、california_housing.csv
|
|
47
|
+
credential_requirements:
|
|
48
|
+
mode: none
|
|
49
|
+
items: []
|
|
50
|
+
notes: []
|
|
51
|
+
resources:
|
|
52
|
+
minimum:
|
|
53
|
+
cpu_cores: 8
|
|
54
|
+
ram_gb: 32
|
|
55
|
+
disk_gb: 50
|
|
56
|
+
gpu_count: 0
|
|
57
|
+
gpu_vram_gb: 0
|
|
58
|
+
recommended:
|
|
59
|
+
cpu_cores: 16
|
|
60
|
+
ram_gb: 64
|
|
61
|
+
disk_gb: 100
|
|
62
|
+
gpu_count: 1
|
|
63
|
+
gpu_vram_gb: 24
|
|
64
|
+
environment:
|
|
65
|
+
python: '3.12'
|
|
66
|
+
cuda: null
|
|
67
|
+
pytorch: null
|
|
68
|
+
flash_attn: null
|
|
69
|
+
key_packages:
|
|
70
|
+
- shapiq
|
|
71
|
+
- numpy
|
|
72
|
+
- scipy
|
|
73
|
+
- pandas
|
|
74
|
+
- scikit-learn
|
|
75
|
+
- joblib
|
|
76
|
+
- tqdm
|
|
77
|
+
- sparse-transform
|
|
78
|
+
- galois
|
|
79
|
+
- matplotlib
|
|
80
|
+
- networkx
|
|
81
|
+
notes:
|
|
82
|
+
- 最小化路线完全支持CPU执行
|
|
83
|
+
- GPU加速可选但非必需;大规模LLM解释推荐使用GPU
|
|
84
|
+
- shapiq包是包含模块;ProxySPEX通过shapiq.ProxySPEX或shapiq.explainer
|
|
85
|
+
并指定approximator="proxyspex"来访问
|
|
86
|
+
- 参见pyproject.toml和捆绑的requirements以获取完整的依赖规范
|
|
87
|
+
risk_flags: []
|
|
88
|
+
risk_notes:
|
|
89
|
+
- 指标值有代码支持,但本次打包过程中未执行基准测试
|
|
90
|
+
- 在信任定量输出之前需要运行时验证
|
|
91
|
+
recommended_when: >-
|
|
92
|
+
当您需要专注于语言模型中稀疏交互发现的可解释性任务时使用此基准测试;想要根据真值Shapley交互评估近似质量时使用;或者需要一个支持任意阶交互量化的CPU友好的可解释性评估框架时使用。
|
|
93
|
+
not_recommended_when: >-
|
|
94
|
+
不要将此基准测试用于纯文本生成评估、完整模型微调工作流程,或当您需要GPU加速训练时。如果无法支持具有不同预算约束的重复解释运行,则不适合使用。
|
|
95
|
+
paper:
|
|
96
|
+
title: 'Proxy-SPEX: Sample-Efficient Interpretability via Sparse Feature Interactions
|
|
97
|
+
in LLMs'
|
|
98
|
+
venue: NeurIPS 2025
|
|
99
|
+
year: 2025
|
|
100
|
+
url: https://openreview.net/forum?id=KI8qan2EA7
|
|
101
|
+
download:
|
|
102
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.048_proxyspex.zip
|
|
103
|
+
archive_type: zip
|
|
104
|
+
local_dir_name: paper-48-Shapiq
|
|
105
|
+
provider: github_release
|
|
106
|
+
repo: ResearAI/DeepScientist
|
|
107
|
+
tag: aisb-v0.0.1
|
|
108
|
+
asset_name: aisb.t3.048_proxyspex.zip
|
|
109
|
+
sha256: 3fea6e582a4001554d86ebcb7b95b55a4d537689f6279c561be43ba0e8302778
|
|
110
|
+
size_bytes: 135005330
|
|
111
|
+
display:
|
|
112
|
+
palette_seed: umber-cyan-interact
|
|
113
|
+
art_style: interaction-map
|
|
114
|
+
accent_priority: high
|
|
115
|
+
image_path: ../image/048_aisb.t3.048_proxyspex.jpg
|
|
116
|
+
capability_tags:
|
|
117
|
+
- research_code_optimization
|
|
118
|
+
- mechanistic_interpretability
|
|
119
|
+
- shapley_interactions
|
|
120
|
+
- large_language_models
|
|
121
|
+
- explanation_methods
|
|
122
|
+
aisb_direction: T3
|
|
123
|
+
track_fit:
|
|
124
|
+
- paper_track
|
|
125
|
+
- benchmark_track
|