@researai/deepscientist 1.5.17 → 1.6.0
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +309 -130
- package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
- package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
- package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
- package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
- package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
- package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
- package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
- package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
- package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
- package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
- package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
- package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
- package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
- package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
- package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
- package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
- package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
- package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
- package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
- package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
- package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
- package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
- package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
- package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
- package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
- package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
- package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
- package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
- package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
- package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
- package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
- package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
- package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
- package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
- package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
- package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
- package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
- package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
- package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
- package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
- package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
- package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
- package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
- package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
- package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
- package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
- package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
- package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
- package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
- package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
- package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
- package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
- package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
- package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
- package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
- package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
- package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
- package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
- package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
- package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
- package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
- package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
- package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
- package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
- package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
- package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
- package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
- package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
- package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
- package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
- package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
- package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
- package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
- package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
- package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
- package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
- package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
- package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
- package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
- package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
- package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
- package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
- package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
- package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
- package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
- package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
- package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
- package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
- package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
- package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
- package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
- package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
- package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
- package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
- package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
- package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
- package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
- package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
- package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
- package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
- package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
- package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
- package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
- package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
- package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
- package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
- package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
- package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
- package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
- package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
- package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
- package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
- package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
- package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
- package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
- package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
- package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
- package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
- package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
- package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
- package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
- package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
- package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
- package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
- package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
- package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
- package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
- package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
- package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
- package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
- package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
- package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
- package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
- package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
- package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
- package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
- package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
- package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
- package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
- package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
- package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
- package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
- package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
- package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
- package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
- package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
- package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
- package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
- package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
- package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
- package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
- package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
- package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
- package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
- package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
- package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
- package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
- package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
- package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
- package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
- package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
- package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
- package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
- package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
- package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
- package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
- package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
- package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
- package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
- package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
- package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
- package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
- package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
- package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
- package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
- package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
- package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
- package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
- package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
- package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
- package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
- package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
- package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
- package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
- package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
- package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
- package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
- package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
- package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
- package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
- package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
- package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
- package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
- package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
- package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
- package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
- package/AISB/image/aisb.b10.climate_earth.svg +16 -0
- package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
- package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
- package/AISB/image/aisb.b2.agent_systems.svg +16 -0
- package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
- package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
- package/AISB/image/aisb.b5.math_proof.svg +16 -0
- package/AISB/image/aisb.b6.research_process.svg +16 -0
- package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
- package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
- package/AISB/image/aisb.b9.material_science.svg +16 -0
- package/README.md +132 -11
- package/bin/ds.js +376 -49
- package/docs/en/00_QUICK_START.md +135 -18
- package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
- package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
- package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
- package/docs/en/05_TUI_GUIDE.md +171 -2
- package/docs/en/07_MEMORY_AND_MCP.md +38 -2
- package/docs/en/09_DOCTOR.md +64 -4
- package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
- package/docs/en/11_LICENSE_AND_RISK.md +4 -0
- package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/en/15_CODEX_PROVIDER_SETUP.md +622 -187
- package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
- package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
- package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
- package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
- package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
- package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
- package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
- package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
- package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
- package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
- package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
- package/docs/en/91_DEVELOPMENT.md +29 -0
- package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
- package/docs/en/README.md +44 -7
- package/docs/images/admin/admin-connectors-health-en.png +0 -0
- package/docs/images/admin/admin-controllers-en.png +0 -0
- package/docs/images/admin/admin-diagnostics-en.png +0 -0
- package/docs/images/admin/admin-errors-en.png +0 -0
- package/docs/images/admin/admin-issues-en.png +0 -0
- package/docs/images/admin/admin-logs-en.png +0 -0
- package/docs/images/admin/admin-quest-detail-en.png +0 -0
- package/docs/images/admin/admin-quests-en.png +0 -0
- package/docs/images/admin/admin-repairs-en.png +0 -0
- package/docs/images/admin/admin-runtime-en.png +0 -0
- package/docs/images/admin/admin-search-en.png +0 -0
- package/docs/images/admin/admin-stats-en.png +0 -0
- package/docs/images/admin/admin-summary-en.png +0 -0
- package/docs/images/connectors/connector-discord-en.png +0 -0
- package/docs/images/connectors/connector-feishu-en.png +0 -0
- package/docs/images/connectors/connector-lingzhu-en.png +0 -0
- package/docs/images/connectors/connector-qq-en.png +0 -0
- package/docs/images/connectors/connector-slack-en.png +0 -0
- package/docs/images/connectors/connector-telegram-en.png +0 -0
- package/docs/images/connectors/connector-weixin-en.png +0 -0
- package/docs/images/connectors/connector-whatsapp-en.png +0 -0
- package/docs/images/settings/settings-baselines-en.png +0 -0
- package/docs/images/settings/settings-config-en.png +0 -0
- package/docs/images/settings/settings-connectors-overview-en.png +0 -0
- package/docs/images/settings/settings-deepxiv-en.png +0 -0
- package/docs/images/settings/settings-mcp-servers-en.png +0 -0
- package/docs/images/settings/settings-plugins-en.png +0 -0
- package/docs/images/settings/settings-runners-en.png +0 -0
- package/docs/zh/00_QUICK_START.md +92 -17
- package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
- package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/zh/05_TUI_GUIDE.md +171 -2
- package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
- package/docs/zh/09_DOCTOR.md +39 -4
- package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
- package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
- package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/zh/15_CODEX_PROVIDER_SETUP.md +550 -188
- package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
- package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
- package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
- package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
- package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
- package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
- package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
- package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
- package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
- package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
- package/docs/zh/README.md +29 -7
- package/install.sh +122 -16
- package/package.json +4 -1
- package/pyproject.toml +2 -1
- package/src/deepscientist/__init__.py +1 -1
- package/src/deepscientist/acp/envelope.py +13 -0
- package/src/deepscientist/admin/__init__.py +3 -0
- package/src/deepscientist/admin/charts.py +681 -0
- package/src/deepscientist/admin/logs.py +119 -0
- package/src/deepscientist/admin/repairs.py +217 -0
- package/src/deepscientist/admin/service.py +1310 -0
- package/src/deepscientist/admin/system_info.py +700 -0
- package/src/deepscientist/admin/tasks.py +465 -0
- package/src/deepscientist/admin/tool_metrics.py +600 -0
- package/src/deepscientist/artifact/guidance.py +8 -4
- package/src/deepscientist/artifact/schemas.py +115 -0
- package/src/deepscientist/artifact/service.py +4268 -260
- package/src/deepscientist/bash_exec/monitor.py +30 -3
- package/src/deepscientist/bash_exec/service.py +134 -1
- package/src/deepscientist/benchstore/__init__.py +4 -0
- package/src/deepscientist/benchstore/prompt_builder.py +224 -0
- package/src/deepscientist/benchstore/service.py +1716 -0
- package/src/deepscientist/channels/weixin_ilink.py +8 -1
- package/src/deepscientist/cli.py +92 -17
- package/src/deepscientist/codex_cli_compat.py +2 -2
- package/src/deepscientist/config/models.py +82 -11
- package/src/deepscientist/config/service.py +927 -91
- package/src/deepscientist/connector/weixin_support.py +48 -17
- package/src/deepscientist/daemon/api/handlers.py +697 -210
- package/src/deepscientist/daemon/api/router.py +76 -1
- package/src/deepscientist/daemon/app.py +1054 -51
- package/src/deepscientist/diagnostics/runner_failures.py +147 -0
- package/src/deepscientist/doctor.py +212 -65
- package/src/deepscientist/evidence_packets.py +590 -0
- package/src/deepscientist/home.py +52 -4
- package/src/deepscientist/kimi_cli_compat.py +50 -0
- package/src/deepscientist/latex_runtime.py +2 -2
- package/src/deepscientist/mcp/context.py +2 -0
- package/src/deepscientist/mcp/schemas.py +114 -0
- package/src/deepscientist/mcp/server.py +1566 -126
- package/src/deepscientist/memory/service.py +203 -16
- package/src/deepscientist/process_control.py +8 -1
- package/src/deepscientist/prompts/builder.py +836 -92
- package/src/deepscientist/quest/__init__.py +2 -2
- package/src/deepscientist/quest/layout.py +12 -1
- package/src/deepscientist/quest/node_traces.py +10 -0
- package/src/deepscientist/quest/service.py +1430 -139
- package/src/deepscientist/quest/stage_views.py +1 -1
- package/src/deepscientist/runners/__init__.py +18 -0
- package/src/deepscientist/runners/base.py +89 -1
- package/src/deepscientist/runners/builtins.py +13 -1
- package/src/deepscientist/runners/claude.py +391 -0
- package/src/deepscientist/runners/codex.py +421 -21
- package/src/deepscientist/runners/codex_telemetry.py +127 -0
- package/src/deepscientist/runners/kimi.py +334 -0
- package/src/deepscientist/runners/metadata.py +68 -0
- package/src/deepscientist/runners/opencode.py +414 -0
- package/src/deepscientist/runners/runtime_overrides.py +100 -0
- package/src/deepscientist/runners/simple_cli.py +538 -0
- package/src/deepscientist/runtime_storage.py +303 -0
- package/src/deepscientist/shared.py +61 -16
- package/src/deepscientist/skills/installer.py +37 -0
- package/src/deepscientist/skills/registry.py +2 -0
- package/src/deepscientist/tinytex.py +2 -2
- package/src/deepscientist/tui.py +10 -3
- package/src/prompts/benchstore/system.md +77 -0
- package/src/prompts/connectors/qq.md +33 -2
- package/src/prompts/connectors/weixin.md +208 -23
- package/src/prompts/contracts/admin_ops.md +74 -0
- package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
- package/src/prompts/contracts/shared_interaction.md +5 -11
- package/src/prompts/start_setup/system.md +422 -0
- package/src/prompts/system.md +409 -315
- package/src/prompts/system_copilot.md +88 -12
- package/src/skills/analysis-campaign/SKILL.md +239 -578
- package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
- package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
- package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
- package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
- package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
- package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
- package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
- package/src/skills/baseline/SKILL.md +183 -461
- package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
- package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
- package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
- package/src/skills/baseline/references/baseline-plan-template.md +37 -76
- package/src/skills/baseline/references/boundary-cases.md +86 -0
- package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
- package/src/skills/baseline/references/comparability-contract.md +7 -12
- package/src/skills/baseline/references/operational-guidance.md +56 -0
- package/src/skills/baseline/references/route-selection.md +5 -25
- package/src/skills/decision/SKILL.md +113 -306
- package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
- package/src/skills/decision/references/operational-guidance.md +94 -0
- package/src/skills/decision/references/research-route-criteria.md +7 -8
- package/src/skills/decision/references/strategic-decision-template.md +13 -26
- package/src/skills/experiment/SKILL.md +132 -670
- package/src/skills/experiment/references/execution-playbook.md +374 -0
- package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
- package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
- package/src/skills/experiment/references/operational-guidance.md +108 -0
- package/src/skills/finalize/SKILL.md +62 -0
- package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
- package/src/skills/finalize/references/resume-packet-template.md +7 -0
- package/src/skills/idea/SKILL.md +228 -15
- package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
- package/src/skills/idea/references/current-board-packet-template.md +61 -0
- package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
- package/src/skills/idea/references/idea-generation-playbook.md +21 -0
- package/src/skills/idea/references/idea-thinking-flow.md +6 -0
- package/src/skills/idea/references/literature-survey-template.md +3 -0
- package/src/skills/idea/references/objective-contract-template.md +54 -0
- package/src/skills/idea/references/outline-seeding-example.md +56 -0
- package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
- package/src/skills/idea/references/related-work-playbook.md +75 -2
- package/src/skills/idea/references/research-history-playbook.md +114 -0
- package/src/skills/idea/references/selection-gate.md +58 -6
- package/src/skills/intake-audit/SKILL.md +43 -2
- package/src/skills/intake-audit/references/state-audit-template.md +10 -0
- package/src/skills/nature-data/SKILL.md +128 -0
- package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-data/agents/openai.yaml +4 -0
- package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
- package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
- package/src/skills/nature-data/references/policy-principles.md +103 -0
- package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
- package/src/skills/nature-data/references/source-basis.md +54 -0
- package/src/skills/nature-data/references/statement-patterns.md +153 -0
- package/src/skills/nature-figure/SKILL.md +197 -0
- package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-figure/agents/openai.yaml +4 -0
- package/src/skills/nature-figure/evals/evals.json +37 -0
- package/src/skills/nature-figure/references/api.md +428 -0
- package/src/skills/nature-figure/references/backend-selection.md +100 -0
- package/src/skills/nature-figure/references/chart-types.md +281 -0
- package/src/skills/nature-figure/references/common-patterns.md +349 -0
- package/src/skills/nature-figure/references/design-theory.md +436 -0
- package/src/skills/nature-figure/references/figure-contract.md +93 -0
- package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
- package/src/skills/nature-figure/references/qa-contract.md +119 -0
- package/src/skills/nature-figure/references/r-template-index.md +66 -0
- package/src/skills/nature-figure/references/r-workflow.md +161 -0
- package/src/skills/nature-figure/references/tutorials.md +250 -0
- package/src/skills/nature-paper2ppt/SKILL.md +507 -0
- package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/SKILL.md +385 -0
- package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-polishing/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
- package/src/skills/nature-polishing/references/section-moves.md +240 -0
- package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
- package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
- package/src/skills/optimize/SKILL.md +177 -1568
- package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
- package/src/skills/optimize/references/candidate-board-template.md +13 -0
- package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
- package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
- package/src/skills/optimize/references/debug-response-template.md +29 -0
- package/src/skills/optimize/references/frontier-review-template.md +32 -0
- package/src/skills/optimize/references/fusion-playbook.md +36 -0
- package/src/skills/optimize/references/method-brief-template.md +73 -0
- package/src/skills/optimize/references/operational-guidance.md +621 -0
- package/src/skills/optimize/references/optimization-memory-template.md +30 -0
- package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
- package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
- package/src/skills/optimize/references/prompt-patterns.md +49 -0
- package/src/skills/paper-outline/SKILL.md +227 -0
- package/src/skills/paper-outline/references/outline-patterns.md +87 -0
- package/src/skills/paper-plot/SKILL.md +79 -0
- package/src/skills/paper-plot/agents/openai.yaml +4 -0
- package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
- package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
- package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
- package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
- package/src/skills/paper-plot/references/line_training_curve.md +44 -0
- package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
- package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
- package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
- package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
- package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
- package/src/skills/paper-plot/scripts/line_aime.py +94 -0
- package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
- package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
- package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
- package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
- package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
- package/src/skills/rebuttal/SKILL.md +9 -0
- package/src/skills/references/tool-usage-by-stage.md +438 -0
- package/src/skills/review/SKILL.md +105 -7
- package/src/skills/science/PROVENANCE.md +44 -0
- package/src/skills/science/SKILL.md +137 -0
- package/src/skills/science/references/artifact-science-tool.md +110 -0
- package/src/skills/science/references/claim-type-discipline.md +56 -0
- package/src/skills/science/references/domain-index.md +422 -0
- package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
- package/src/skills/science/references/package-check-playbook.md +64 -0
- package/src/skills/science/references/package-index.min.json +3616 -0
- package/src/skills/science/references/packages/abinit.md +80 -0
- package/src/skills/science/references/packages/acts.md +73 -0
- package/src/skills/science/references/packages/aiida-core.md +80 -0
- package/src/skills/science/references/packages/alamode.md +80 -0
- package/src/skills/science/references/packages/amuse.md +88 -0
- package/src/skills/science/references/packages/anndata.md +88 -0
- package/src/skills/science/references/packages/arbor.md +80 -0
- package/src/skills/science/references/packages/arc.md +73 -0
- package/src/skills/science/references/packages/astropy.md +88 -0
- package/src/skills/science/references/packages/astroquery.md +88 -0
- package/src/skills/science/references/packages/atomate2.md +80 -0
- package/src/skills/science/references/packages/atomsmltr.md +73 -0
- package/src/skills/science/references/packages/awkward.md +73 -0
- package/src/skills/science/references/packages/batman.md +88 -0
- package/src/skills/science/references/packages/biopython.md +88 -0
- package/src/skills/science/references/packages/bloqade.md +73 -0
- package/src/skills/science/references/packages/brian2.md +73 -0
- package/src/skills/science/references/packages/bullet3.md +73 -0
- package/src/skills/science/references/packages/calculix.md +80 -0
- package/src/skills/science/references/packages/cantera.md +73 -0
- package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
- package/src/skills/science/references/packages/ccdproc.md +88 -0
- package/src/skills/science/references/packages/celerite2.md +88 -0
- package/src/skills/science/references/packages/cellrank.md +73 -0
- package/src/skills/science/references/packages/cesm.md +80 -0
- package/src/skills/science/references/packages/chemicals.md +73 -0
- package/src/skills/science/references/packages/chempy.md +73 -0
- package/src/skills/science/references/packages/cirq.md +73 -0
- package/src/skills/science/references/packages/coffea.md +73 -0
- package/src/skills/science/references/packages/cp2k.md +88 -0
- package/src/skills/science/references/packages/custodian.md +80 -0
- package/src/skills/science/references/packages/dart.md +73 -0
- package/src/skills/science/references/packages/datamol.md +88 -0
- package/src/skills/science/references/packages/dd4hep.md +73 -0
- package/src/skills/science/references/packages/dealii.md +80 -0
- package/src/skills/science/references/packages/deepchem.md +88 -0
- package/src/skills/science/references/packages/delphes.md +73 -0
- package/src/skills/science/references/packages/devito.md +80 -0
- package/src/skills/science/references/packages/dftb.md +88 -0
- package/src/skills/science/references/packages/dftd4.md +88 -0
- package/src/skills/science/references/packages/dftk-jl.md +80 -0
- package/src/skills/science/references/packages/dolfinx.md +80 -0
- package/src/skills/science/references/packages/drake.md +73 -0
- package/src/skills/science/references/packages/dumux.md +73 -0
- package/src/skills/science/references/packages/elk.md +80 -0
- package/src/skills/science/references/packages/elmerfem.md +80 -0
- package/src/skills/science/references/packages/enzo-e.md +88 -0
- package/src/skills/science/references/packages/espresso.md +80 -0
- package/src/skills/science/references/packages/exoplanet.md +88 -0
- package/src/skills/science/references/packages/fairroot.md +73 -0
- package/src/skills/science/references/packages/fbpic.md +80 -0
- package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
- package/src/skills/science/references/packages/geant4.md +73 -0
- package/src/skills/science/references/packages/geosx.md +80 -0
- package/src/skills/science/references/packages/gprmax.md +80 -0
- package/src/skills/science/references/packages/gromacs.md +80 -0
- package/src/skills/science/references/packages/gwaslab.md +73 -0
- package/src/skills/science/references/packages/gz-sim.md +73 -0
- package/src/skills/science/references/packages/hail.md +88 -0
- package/src/skills/science/references/packages/hiphive.md +80 -0
- package/src/skills/science/references/packages/hoomd-blue.md +80 -0
- package/src/skills/science/references/packages/itensor.md +73 -0
- package/src/skills/science/references/packages/itensors-jl.md +73 -0
- package/src/skills/science/references/packages/jdftx.md +73 -0
- package/src/skills/science/references/packages/jobflow.md +80 -0
- package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
- package/src/skills/science/references/packages/kite.md +80 -0
- package/src/skills/science/references/packages/kratos.md +80 -0
- package/src/skills/science/references/packages/kwant.md +73 -0
- package/src/skills/science/references/packages/lammps.md +80 -0
- package/src/skills/science/references/packages/lightkurve.md +88 -0
- package/src/skills/science/references/packages/limix.md +73 -0
- package/src/skills/science/references/packages/maxwelllink.md +80 -0
- package/src/skills/science/references/packages/mcdc.md +73 -0
- package/src/skills/science/references/packages/meep.md +80 -0
- package/src/skills/science/references/packages/mfem.md +80 -0
- package/src/skills/science/references/packages/mitgcm.md +73 -0
- package/src/skills/science/references/packages/modflow6.md +73 -0
- package/src/skills/science/references/packages/molecool.md +73 -0
- package/src/skills/science/references/packages/mom6.md +73 -0
- package/src/skills/science/references/packages/moose.md +80 -0
- package/src/skills/science/references/packages/mpas-model.md +73 -0
- package/src/skills/science/references/packages/mujoco.md +73 -0
- package/src/skills/science/references/packages/mumax3.md +73 -0
- package/src/skills/science/references/packages/nekrs.md +80 -0
- package/src/skills/science/references/packages/nessi.md +73 -0
- package/src/skills/science/references/packages/nest-simulator.md +73 -0
- package/src/skills/science/references/packages/netket.md +73 -0
- package/src/skills/science/references/packages/neuron.md +73 -0
- package/src/skills/science/references/packages/nextflow.md +88 -0
- package/src/skills/science/references/packages/nwchem.md +88 -0
- package/src/skills/science/references/packages/openbabel.md +88 -0
- package/src/skills/science/references/packages/openems.md +80 -0
- package/src/skills/science/references/packages/openff-toolkit.md +88 -0
- package/src/skills/science/references/packages/openfoam-dev.md +80 -0
- package/src/skills/science/references/packages/openmc.md +73 -0
- package/src/skills/science/references/packages/openmm.md +80 -0
- package/src/skills/science/references/packages/openmoc.md +73 -0
- package/src/skills/science/references/packages/openmx.md +80 -0
- package/src/skills/science/references/packages/opensees.md +80 -0
- package/src/skills/science/references/packages/opensn.md +80 -0
- package/src/skills/science/references/packages/opm-simulators.md +73 -0
- package/src/skills/science/references/packages/oqupy.md +73 -0
- package/src/skills/science/references/packages/packmol.md +80 -0
- package/src/skills/science/references/packages/palabos.md +80 -0
- package/src/skills/science/references/packages/parflow.md +80 -0
- package/src/skills/science/references/packages/pennylane.md +88 -0
- package/src/skills/science/references/packages/perceval.md +73 -0
- package/src/skills/science/references/packages/phono3py.md +73 -0
- package/src/skills/science/references/packages/phonopy.md +73 -0
- package/src/skills/science/references/packages/photutils.md +88 -0
- package/src/skills/science/references/packages/picongpu.md +80 -0
- package/src/skills/science/references/packages/plink-ng.md +88 -0
- package/src/skills/science/references/packages/precice.md +73 -0
- package/src/skills/science/references/packages/psc.md +80 -0
- package/src/skills/science/references/packages/psi4.md +88 -0
- package/src/skills/science/references/packages/pybinding.md +73 -0
- package/src/skills/science/references/packages/pyfr.md +80 -0
- package/src/skills/science/references/packages/pyhf.md +73 -0
- package/src/skills/science/references/packages/pyiron_base.md +80 -0
- package/src/skills/science/references/packages/pylcp.md +73 -0
- package/src/skills/science/references/packages/pylith.md +80 -0
- package/src/skills/science/references/packages/pynbody.md +88 -0
- package/src/skills/science/references/packages/pysam.md +88 -0
- package/src/skills/science/references/packages/pyscf.md +88 -0
- package/src/skills/science/references/packages/q-e.md +73 -0
- package/src/skills/science/references/packages/qibo.md +73 -0
- package/src/skills/science/references/packages/qiskit.md +73 -0
- package/src/skills/science/references/packages/quantica-jl.md +73 -0
- package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
- package/src/skills/science/references/packages/quimb.md +73 -0
- package/src/skills/science/references/packages/qulacs.md +73 -0
- package/src/skills/science/references/packages/qutip.md +73 -0
- package/src/skills/science/references/packages/rdkit.md +88 -0
- package/src/skills/science/references/packages/rmg-py.md +73 -0
- package/src/skills/science/references/packages/root.md +73 -0
- package/src/skills/science/references/packages/scanpy.md +88 -0
- package/src/skills/science/references/packages/scikit-allel.md +88 -0
- package/src/skills/science/references/packages/scikit-bio.md +88 -0
- package/src/skills/science/references/packages/scqubits.md +73 -0
- package/src/skills/science/references/packages/scuff-em.md +80 -0
- package/src/skills/science/references/packages/scvi-tools.md +73 -0
- package/src/skills/science/references/packages/seissol.md +73 -0
- package/src/skills/science/references/packages/sfepy.md +80 -0
- package/src/skills/science/references/packages/sisl.md +73 -0
- package/src/skills/science/references/packages/smilei.md +80 -0
- package/src/skills/science/references/packages/snakemake.md +88 -0
- package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
- package/src/skills/science/references/packages/specutils.md +88 -0
- package/src/skills/science/references/packages/spglib.md +80 -0
- package/src/skills/science/references/packages/squidpy.md +88 -0
- package/src/skills/science/references/packages/starry.md +88 -0
- package/src/skills/science/references/packages/strawberryfields.md +73 -0
- package/src/skills/science/references/packages/su2.md +80 -0
- package/src/skills/science/references/packages/sunny-jl.md +73 -0
- package/src/skills/science/references/packages/sw4.md +73 -0
- package/src/skills/science/references/packages/swift.md +88 -0
- package/src/skills/science/references/packages/tdnegf.md +73 -0
- package/src/skills/science/references/packages/tenpy.md +73 -0
- package/src/skills/science/references/packages/thermo.md +73 -0
- package/src/skills/science/references/packages/tkwant.md +73 -0
- package/src/skills/science/references/packages/tvb-root.md +73 -0
- package/src/skills/science/references/packages/uproot5.md +73 -0
- package/src/skills/science/references/packages/vampire.md +80 -0
- package/src/skills/science/references/packages/wannier_tools.md +73 -0
- package/src/skills/science/references/packages/warpx.md +80 -0
- package/src/skills/science/references/packages/wrf.md +73 -0
- package/src/skills/science/references/packages/xtb.md +88 -0
- package/src/skills/science/references/packages/yt.md +73 -0
- package/src/skills/science/references/science-task-brief-template.md +71 -0
- package/src/skills/scout/SKILL.md +83 -425
- package/src/skills/scout/references/literature-scout-template.md +5 -24
- package/src/skills/scout/references/operational-guidance.md +191 -0
- package/src/skills/scout/references/paper-triage-playbook.md +11 -35
- package/src/skills/write/SKILL.md +744 -1246
- package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
- package/src/skills/write/references/oral_package_patterns.md +252 -0
- package/src/skills/write/references/oral_writing_principles.md +291 -0
- package/src/skills/write/references/section_rewrite_checklist.md +234 -0
- package/src/tui/dist/app/AppContainer.js +1314 -27
- package/src/tui/dist/components/Composer.js +26 -1
- package/src/tui/dist/components/ConfigScreen.js +2 -1
- package/src/tui/dist/components/InputPrompt.js +25 -9
- package/src/tui/dist/components/MainContent.js +18 -3
- package/src/tui/dist/components/QuestScreen.js +3 -2
- package/src/tui/dist/components/UtilityScreen.js +37 -0
- package/src/tui/dist/hooks/useSafeInput.js +10 -0
- package/src/tui/dist/index.js +13 -1
- package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
- package/src/tui/dist/lib/api.js +89 -1
- package/src/tui/package.json +1 -1
- package/src/ui/dist/assets/{AnalysisPlugin-BCKAfjba.js → AnalysisPlugin-CA94NGmI.js} +1 -1
- package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
- package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
- package/src/ui/dist/assets/{CodeViewerPlugin-CbaFRrUU.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
- package/src/ui/dist/assets/{DocViewerPlugin-DAjLVeQD.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
- package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
- package/src/ui/dist/assets/{GitDiffViewerPlugin-CQACjoAA.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
- package/src/ui/dist/assets/{GitSnapshotViewer-0r4nLPke.js → GitSnapshotViewer-CweA6VON.js} +2 -2
- package/src/ui/dist/assets/{ImageViewerPlugin-nBOmI2v_.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
- package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
- package/src/ui/dist/assets/{LatexPlugin-ZwtV8pIp.js → LatexPlugin-BQjAaA5J.js} +4 -4
- package/src/ui/dist/assets/{MarkdownViewerPlugin-DKqVfKyW.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
- package/src/ui/dist/assets/{MarketplacePlugin-BwxStZ9D.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
- package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
- package/src/ui/dist/assets/{NotebookEditor-DB9N_T9q.js → NotebookEditor-WFyd8Ybt.js} +3 -3
- package/src/ui/dist/assets/{PdfLoader-eWBONbQP.js → PdfLoader-CLE5u5TS.js} +3 -3
- package/src/ui/dist/assets/{PdfMarkdownPlugin-D22YOZL3.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
- package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
- package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
- package/src/ui/dist/assets/{TextViewerPlugin-C5xqeeUH.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
- package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
- package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
- package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
- package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
- package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
- package/src/ui/dist/assets/{code-WlFHE7z_.js → code-DbsmSd3Y.js} +1 -1
- package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
- package/src/ui/dist/assets/{wrap-text-BC-Hltpd.js → file-jump-queue-DeQBikaw.js} +3 -3
- package/src/ui/dist/assets/{file-socket-CfQPKQKj.js → file-socket-DA5XIx88.js} +1 -1
- package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
- package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
- package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
- package/src/ui/dist/assets/{index-CwNu1aH4.js → index-BsO46tJA.js} +1 -1
- package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
- package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
- package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
- package/src/ui/dist/assets/{project-sync-C9IdzdZW.js → project-sync-DPmWKmKD.js} +1 -1
- package/src/ui/dist/assets/{zoom-out-E_gaeAxL.js → zoom-out-DAukFWen.js} +3 -3
- package/src/ui/dist/index.html +3 -3
- package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
- package/src/skills/baseline/references/memory-playbook.md +0 -40
- package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
- package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
- package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
- package/src/skills/write/references/paper-section-playbook.md +0 -64
- package/src/skills/write/references/reviewer-first-writing.md +0 -64
- package/src/skills/write/references/revision-checklist.md +0 -70
- package/src/skills/write/references/section-contracts.md +0 -82
- package/src/skills/write/references/sentence-level-proofing.md +0 -49
- package/src/ui/dist/assets/AiManusChatView-Bv-Z8YpU.js +0 -204
- package/src/ui/dist/assets/CliPlugin-BCKcpc35.js +0 -109
- package/src/ui/dist/assets/CodeEditorPlugin-DbOfSJ8K.js +0 -2
- package/src/ui/dist/assets/GitCommitViewerPlugin-CIUqbUDO.js +0 -1
- package/src/ui/dist/assets/LabCopilotPanel-BHxOxF4z.js +0 -14
- package/src/ui/dist/assets/LabPlugin-BKoZGs95.js +0 -22
- package/src/ui/dist/assets/NotebookEditor-BEQhaQbt.js +0 -81
- package/src/ui/dist/assets/PdfViewerPlugin-c-RK9DLM.js +0 -17
- package/src/ui/dist/assets/SearchPlugin-CxF9ytAx.js +0 -16
- package/src/ui/dist/assets/VNCViewer-BoLGLnHz.js +0 -11
- package/src/ui/dist/assets/bot-DREQOxzP.js +0 -6
- package/src/ui/dist/assets/chevron-up-C9Qpx4DE.js +0 -6
- package/src/ui/dist/assets/file-content-BZMz3RYp.js +0 -1
- package/src/ui/dist/assets/file-diff-panel-CQhw0jS2.js +0 -1
- package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
- package/src/ui/dist/assets/git-commit-horizontal-DxZ8DCZh.js +0 -6
- package/src/ui/dist/assets/image-Bgl4VIyx.js +0 -6
- package/src/ui/dist/assets/index-BpV6lusQ.css +0 -33
- package/src/ui/dist/assets/index-CBNVuWcP.js +0 -2496
- package/src/ui/dist/assets/index-DrUnlf6K.js +0 -1
- package/src/ui/dist/assets/index-NW-h8VzN.js +0 -1
- package/src/ui/dist/assets/pdf-effect-queue-J8OnM0jE.js +0 -6
- package/src/ui/dist/assets/popover-CLc0pPP8.js +0 -1
- package/src/ui/dist/assets/select-Cs2PmzwL.js +0 -11
- package/src/ui/dist/assets/sigma-ClKcHAXm.js +0 -6
- package/src/ui/dist/assets/trash-DwpbFr3w.js +0 -11
- package/src/ui/dist/assets/useCliAccess-NQ8m0Let.js +0 -1
- package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
|
@@ -0,0 +1,212 @@
|
|
|
1
|
+
id: aisb.t3.097_wassersteintl
|
|
2
|
+
name: Wasserstein Transfer Learning
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: Optimize Wasserstein-based transfer estimators for distributional learning
|
|
5
|
+
across source and target populations using Fréchet regression in the Wasserstein
|
|
6
|
+
space.
|
|
7
|
+
task_description: 'This packaged benchmark covers Wasserstein Transfer Learning (WaTL),
|
|
8
|
+
a novel transfer learning framework for regression models whose outputs are probability
|
|
9
|
+
distributions residing in the Wasserstein space. The method leverages knowledge
|
|
10
|
+
from multiple source domains to improve predictions in a target domain by intrinsically
|
|
11
|
+
incorporating the Wasserstein metric. The three-stage algorithm consists of: (1)
|
|
12
|
+
a weighted auxiliary estimator using global Fréchet regression for known informative
|
|
13
|
+
source subsets, (2) bias correction via gradient descent with cross-validated regularization,
|
|
14
|
+
and (3) projection to Wasserstein space enforcing monotonicity via OSQP solver.
|
|
15
|
+
Evaluation targets RMSPR (Root Mean Squared Prediction Risk) on mortality and physical
|
|
16
|
+
activity datasets, with per-test-point timing as a secondary metric.
|
|
17
|
+
|
|
18
|
+
'
|
|
19
|
+
task_mode: evaluation_driven
|
|
20
|
+
requires_execution: true
|
|
21
|
+
requires_paper: true
|
|
22
|
+
integrity_level: cas_plus_canary
|
|
23
|
+
snapshot_status: runnable
|
|
24
|
+
support_level: turnkey
|
|
25
|
+
time_band: 2-6h
|
|
26
|
+
cost_band: low
|
|
27
|
+
difficulty: medium
|
|
28
|
+
data_access: public
|
|
29
|
+
primary_outputs:
|
|
30
|
+
- rmspr
|
|
31
|
+
- time_ms_per_test_point
|
|
32
|
+
- transfer_learning_report
|
|
33
|
+
launch_profiles:
|
|
34
|
+
- id: simulation
|
|
35
|
+
label: Simulation Route
|
|
36
|
+
description: 'Run the packaged simulation experiment (Section 5 of paper) to validate
|
|
37
|
+
WaTL asymptotic properties. Uses global Fréchet regression with synthetic distributional
|
|
38
|
+
data.
|
|
39
|
+
|
|
40
|
+
'
|
|
41
|
+
command: Rscript Simulation/Simulation.R <M> <n_t> <seed> <setting> <tau>
|
|
42
|
+
arguments:
|
|
43
|
+
- name: M
|
|
44
|
+
description: Grid size for quantile functions
|
|
45
|
+
example: '100'
|
|
46
|
+
- name: n_t
|
|
47
|
+
description: Target sample size
|
|
48
|
+
example: 200-800
|
|
49
|
+
- name: seed
|
|
50
|
+
description: Random seed for reproducibility
|
|
51
|
+
example: '42'
|
|
52
|
+
- name: setting
|
|
53
|
+
description: Data generation setting (1 or 2)
|
|
54
|
+
example: '1'
|
|
55
|
+
- name: tau
|
|
56
|
+
description: Source sample multiplier
|
|
57
|
+
example: 100 or 200
|
|
58
|
+
- id: real_data
|
|
59
|
+
label: Real Data Route
|
|
60
|
+
description: 'Execute the real-world application with mortality or physical activity
|
|
61
|
+
data. Uses local Fréchet regression with OSQP monotonicity projection. Target
|
|
62
|
+
domain analysis with multiple source populations.
|
|
63
|
+
|
|
64
|
+
'
|
|
65
|
+
command: Rscript RealData/RealData.R <seed> <race> <M> <rate> <gender>
|
|
66
|
+
arguments:
|
|
67
|
+
- name: seed
|
|
68
|
+
description: Random seed for reproducibility
|
|
69
|
+
example: '42'
|
|
70
|
+
- name: race
|
|
71
|
+
description: Race index for target population (1=Black, 2=White)
|
|
72
|
+
example: '1'
|
|
73
|
+
- name: M
|
|
74
|
+
description: Grid size for quantile functions
|
|
75
|
+
example: '100'
|
|
76
|
+
- name: rate
|
|
77
|
+
description: Source data sampling rate (0-1)
|
|
78
|
+
example: '1.0'
|
|
79
|
+
- name: gender
|
|
80
|
+
description: Gender for stratification (0=Female, 1=Male)
|
|
81
|
+
example: '0'
|
|
82
|
+
- id: mortality_experiment
|
|
83
|
+
label: Mortality Experiment (RMSPR)
|
|
84
|
+
description: 'Primary end-to-end reproduction path for RMSPR metric using UN World
|
|
85
|
+
Population Prospects 2015 data. Target: Developed countries (45). Sources: Developing
|
|
86
|
+
countries (156). Computes per-test-point timing.
|
|
87
|
+
|
|
88
|
+
'
|
|
89
|
+
command: Rscript mortality_experiment2.R
|
|
90
|
+
notes: 'Uses wpp2015 R package for demographic data. Requires internet for package
|
|
91
|
+
installation. Reproduces Table 1 (Appendix A).
|
|
92
|
+
|
|
93
|
+
'
|
|
94
|
+
dataset_download:
|
|
95
|
+
primary_method: r_package
|
|
96
|
+
sources:
|
|
97
|
+
- name: wpp2015
|
|
98
|
+
description: UN World Population Prospects 2015 mortality data
|
|
99
|
+
package: wpp2015
|
|
100
|
+
- name: NHANES
|
|
101
|
+
description: National Health and Nutrition Examination Survey physical activity
|
|
102
|
+
data
|
|
103
|
+
package: NHANES
|
|
104
|
+
notes:
|
|
105
|
+
- wpp2015 package loads UN demographic data on first use
|
|
106
|
+
- NHANES physical activity intensity data loaded via RealDataFunc.R
|
|
107
|
+
- Both datasets are publicly available (wpp2015 from the United Nations via CRAN; NHANES from CDC/NCHS)
|
|
108
|
+
credential_requirements:
|
|
109
|
+
mode: none
|
|
110
|
+
items: []
|
|
111
|
+
notes:
|
|
112
|
+
- No authentication required for R package data sources
|
|
113
|
+
- Internet connection needed for package installation and data download
|
|
114
|
+
resources:
|
|
115
|
+
minimum:
|
|
116
|
+
cpu_cores: 4
|
|
117
|
+
ram_gb: 8
|
|
118
|
+
disk_gb: 10
|
|
119
|
+
gpu_count: 0
|
|
120
|
+
gpu_vram_gb: 0
|
|
121
|
+
recommended:
|
|
122
|
+
cpu_cores: 8
|
|
123
|
+
ram_gb: 16
|
|
124
|
+
disk_gb: 20
|
|
125
|
+
gpu_count: 0
|
|
126
|
+
gpu_vram_gb: 0
|
|
127
|
+
environment:
|
|
128
|
+
python: null
|
|
129
|
+
cuda: null
|
|
130
|
+
pytorch: null
|
|
131
|
+
flash_attn: null
|
|
132
|
+
key_packages:
|
|
133
|
+
- name: wpp2015
|
|
134
|
+
description: UN World Population Prospects demographic data
|
|
135
|
+
- name: osqp
|
|
136
|
+
description: Quadratic programming solver for monotonicity projection
|
|
137
|
+
- name: Matrix
|
|
138
|
+
description: Sparse and dense matrix operations
|
|
139
|
+
- name: pracma
|
|
140
|
+
description: Practical numerical mathematics
|
|
141
|
+
- name: parallel
|
|
142
|
+
description: Parallel computation support
|
|
143
|
+
- name: NHANES
|
|
144
|
+
description: NHANES data retrieval
|
|
145
|
+
notes:
|
|
146
|
+
- CPU-only execution is sufficient for all routes
|
|
147
|
+
- GPU not required; workload is primarily statistical computation
|
|
148
|
+
- R-centric workflow; no Python or PyTorch dependencies
|
|
149
|
+
- OSQP solver used in Real Data route for quantile function monotonicity constraint
|
|
150
|
+
risk_flags:
|
|
151
|
+
- no_gpu_required
|
|
152
|
+
- cpu_bound
|
|
153
|
+
- r_only
|
|
154
|
+
risk_notes:
|
|
155
|
+
- Benchmark has no GPU requirement; resource costs are minimal
|
|
156
|
+
- Execution time scales with grid size M and sample sizes
|
|
157
|
+
- OSQP solver convergence may vary with data dimensionality
|
|
158
|
+
recommended_when: 'Use this benchmark when you need a statistics-heavy transfer-learning
|
|
159
|
+
task that operates on distributional data in the Wasserstein space. Suitable for
|
|
160
|
+
evaluating methods that predict probability distributions from covariates using
|
|
161
|
+
optimal transport geometry. Ideal when working with mortality curves, physical activity
|
|
162
|
+
distributions, or other distributional response data where source domain knowledge
|
|
163
|
+
can improve target predictions. R-based execution makes it accessible without GPU
|
|
164
|
+
infrastructure.
|
|
165
|
+
|
|
166
|
+
'
|
|
167
|
+
not_recommended_when: 'Do not use this benchmark if you need neural-network-based
|
|
168
|
+
benchmarks, deep learning workflows, or CUDA-heavy training. Not suitable for tasks
|
|
169
|
+
requiring GPU acceleration or PyTorch-based implementations. Avoid if your research
|
|
170
|
+
focuses on scalar/vector responses rather than distributional outputs in non-Euclidean
|
|
171
|
+
spaces.
|
|
172
|
+
|
|
173
|
+
'
|
|
174
|
+
paper:
|
|
175
|
+
title: Wasserstein Transfer Learning
|
|
176
|
+
authors:
|
|
177
|
+
- Kaicheng Zhang (Zhejiang University)
|
|
178
|
+
- Sinian Zhang (University of Minnesota)
|
|
179
|
+
- Doudou Zhou (National University of Singapore)
|
|
180
|
+
- Yidong Zhou (UC Davis)
|
|
181
|
+
venue: arXiv preprint
|
|
182
|
+
year: 2025
|
|
183
|
+
url: https://arxiv.org/abs/2505.17404
|
|
184
|
+
github: https://github.com/h7nian/WaTL
|
|
185
|
+
display:
|
|
186
|
+
palette_seed: teal-stone-wasserstein
|
|
187
|
+
art_style: statistical-transport
|
|
188
|
+
accent_priority: medium
|
|
189
|
+
image_path: ../image/097_aisb.t3.097_wassersteintl.jpg
|
|
190
|
+
capability_tags:
|
|
191
|
+
- transfer_learning
|
|
192
|
+
- wasserstein_geometry
|
|
193
|
+
- distributional_learning
|
|
194
|
+
- statistical_modeling
|
|
195
|
+
- optimal_transport
|
|
196
|
+
- frechet_regression
|
|
197
|
+
- non_euclidean_output
|
|
198
|
+
aisb_direction: T3
|
|
199
|
+
track_fit:
|
|
200
|
+
- paper_track
|
|
201
|
+
- benchmark_track
|
|
202
|
+
commercial:
|
|
203
|
+
annual_fee: null
|
|
204
|
+
download:
|
|
205
|
+
provider: github_release
|
|
206
|
+
repo: ResearAI/DeepScientist
|
|
207
|
+
tag: aisb-v0.0.1
|
|
208
|
+
asset_name: aisb.t3.097_wassersteintl.zip
|
|
209
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.097_wassersteintl.zip
|
|
210
|
+
archive_type: zip
|
|
211
|
+
sha256: 7878e684e20e96ca4ea5aa2ea5f33a4772d22a14b5bf6ab275a68664de302887
|
|
212
|
+
size_bytes: 104086
|
|
@@ -0,0 +1,169 @@
|
|
|
1
|
+
id: aisb.t3.097_wassersteintl
|
|
2
|
+
name: Wasserstein 迁移学习
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: 使用 Wasserstein 空间中的 Fréchet 回归优化基于 Wasserstein 的迁移估计器,以实现源群体和目标群体之间的分布学习。
|
|
5
|
+
task_description: 该打包基准涵盖 Wasserstein 迁移学习 (WaTL),这是一种用于回归模型的新型迁移学习框架,其输出是位于 Wasserstein 空间中的概率分布。该方法通过内在地结合 Wasserstein 度量,利用来自多个源域的知识来改进目标域中的预测。该三阶段算法包括:(1) 对已知信息源子集使用全局 Fréchet 回归的加权辅助估计器,(2) 通过交叉验证正则化的梯度下降进行偏差校正,以及 (3) 通过 OSQP 求解器投影到 Wasserstein 空间以强制单调性。评估目标是死亡率和身体活动数据集的 RMSPR(均方根预测风险),每个测试点的时间作为次要指标。
|
|
6
|
+
task_mode: evaluation_driven
|
|
7
|
+
requires_execution: true
|
|
8
|
+
requires_paper: true
|
|
9
|
+
integrity_level: cas_plus_canary
|
|
10
|
+
snapshot_status: runnable
|
|
11
|
+
support_level: turnkey
|
|
12
|
+
time_band: 2-6h
|
|
13
|
+
cost_band: low
|
|
14
|
+
difficulty: medium
|
|
15
|
+
data_access: public
|
|
16
|
+
primary_outputs:
|
|
17
|
+
- rmspr
|
|
18
|
+
- time_ms_per_test_point
|
|
19
|
+
- transfer_learning_report
|
|
20
|
+
launch_profiles:
|
|
21
|
+
- id: simulation
|
|
22
|
+
label: 模拟路线
|
|
23
|
+
description: 运行打包的模拟实验(论文第 5 节)以验证 WaTL 渐近属性。将全局 Fréchet 回归与合成分布数据结合使用。
|
|
24
|
+
command: Rscript Simulation/Simulation.R <M> <n_t> <seed> <setting> <tau>
|
|
25
|
+
arguments:
|
|
26
|
+
- name: M
|
|
27
|
+
description: 分位数函数的网格大小
|
|
28
|
+
example: '100'
|
|
29
|
+
- name: n_t
|
|
30
|
+
description: 目标样本量
|
|
31
|
+
example: 200-800
|
|
32
|
+
- name: seed
|
|
33
|
+
description: 用于再现性的随机种子
|
|
34
|
+
example: '42'
|
|
35
|
+
- name: setting
|
|
36
|
+
description: 数据生成设置(1或2)
|
|
37
|
+
example: '1'
|
|
38
|
+
- name: tau
|
|
39
|
+
description: 源样本乘数
|
|
40
|
+
example: 100 or 200
|
|
41
|
+
- id: real_data
|
|
42
|
+
label: 真实数据路线
|
|
43
|
+
description: 使用死亡率或体力活动数据执行现实世界的应用程序。使用带有 OSQP 单调性投影的局部 Fréchet 回归。具有多个源群体的目标域分析。
|
|
44
|
+
command: Rscript RealData/RealData.R <seed> <race> <M> <rate> <gender>
|
|
45
|
+
arguments:
|
|
46
|
+
- name: seed
|
|
47
|
+
description: 用于再现性的随机种子
|
|
48
|
+
example: '42'
|
|
49
|
+
- name: race
|
|
50
|
+
description: 目标人群的种族指数(1=黑人,2=白人)
|
|
51
|
+
example: '1'
|
|
52
|
+
- name: M
|
|
53
|
+
description: 分位数函数的网格大小
|
|
54
|
+
example: '100'
|
|
55
|
+
- name: rate
|
|
56
|
+
description: 源数据采样率(0-1)
|
|
57
|
+
example: '1.0'
|
|
58
|
+
- name: gender
|
|
59
|
+
description: 分层性别(0=女性,1=男性)
|
|
60
|
+
example: '0'
|
|
61
|
+
- id: mortality_experiment
|
|
62
|
+
label: 死亡率实验 (RMSPR)
|
|
63
|
+
description: 使用联合国 2015 年世界人口展望数据、以 RMSPR 为指标的主要端到端复现路径。目标域:发达国家(45)。源域:发展中国家(156)。计算每个测试点的耗时。
|
|
64
|
+
command: Rscript mortality_experiment2.R
|
|
65
|
+
notes: 使用 wpp2015 R 包获取人口统计数据。需要互联网来安装软件包。重现表 1(附录 A)。
|
|
66
|
+
dataset_download:
|
|
67
|
+
primary_method: r_package
|
|
68
|
+
sources:
|
|
69
|
+
- name: wpp2015
|
|
70
|
+
description: UN World Population Prospects 2015 mortality data
|
|
71
|
+
package: wpp2015
|
|
72
|
+
- name: NHANES
|
|
73
|
+
description: National Health and Nutrition Examination Survey physical activity data
|
|
74
|
+
package: NHANES
|
|
75
|
+
notes:
|
|
76
|
+
- wpp2015 软件包首次使用时加载联合国人口统计数据
|
|
77
|
+
- NHANES 身体活动强度数据通过 RealDataFunc.R 加载
|
|
78
|
+
- 这两个数据集均可从 NIH 公开获得
|
|
79
|
+
credential_requirements:
|
|
80
|
+
mode: none
|
|
81
|
+
items: []
|
|
82
|
+
notes:
|
|
83
|
+
- R包数据源无需身份验证
|
|
84
|
+
- 软件包安装和数据下载需要互联网连接
|
|
85
|
+
resources:
|
|
86
|
+
minimum:
|
|
87
|
+
cpu_cores: 4
|
|
88
|
+
ram_gb: 8
|
|
89
|
+
disk_gb: 10
|
|
90
|
+
gpu_count: 0
|
|
91
|
+
gpu_vram_gb: 0
|
|
92
|
+
recommended:
|
|
93
|
+
cpu_cores: 8
|
|
94
|
+
ram_gb: 16
|
|
95
|
+
disk_gb: 20
|
|
96
|
+
gpu_count: 0
|
|
97
|
+
gpu_vram_gb: 0
|
|
98
|
+
environment:
|
|
99
|
+
python: null
|
|
100
|
+
cuda: null
|
|
101
|
+
pytorch: null
|
|
102
|
+
flash_attn: null
|
|
103
|
+
key_packages:
|
|
104
|
+
- name: wpp2015
|
|
105
|
+
description: UN World Population Prospects demographic data
|
|
106
|
+
- name: osqp
|
|
107
|
+
description: Quadratic programming solver for monotonicity projection
|
|
108
|
+
- name: Matrix
|
|
109
|
+
description: Sparse and dense matrix operations
|
|
110
|
+
- name: pracma
|
|
111
|
+
description: Practical numerical mathematics
|
|
112
|
+
- name: parallel
|
|
113
|
+
description: Parallel computation support
|
|
114
|
+
- name: NHANES
|
|
115
|
+
description: NHANES data retrieval
|
|
116
|
+
notes:
|
|
117
|
+
- 仅 CPU 执行足以满足所有路线的需要
|
|
118
|
+
- 不需要 GPU;工作量主要是统计计算
|
|
119
|
+
- 以 R 为中心的工作流程;没有 Python 或 PyTorch 依赖项
|
|
120
|
+
- OSQP 求解器在真实数据路径中用于分位数函数单调性约束
|
|
121
|
+
risk_flags:
|
|
122
|
+
- no_gpu_required
|
|
123
|
+
- cpu_bound
|
|
124
|
+
- r_only
|
|
125
|
+
risk_notes:
|
|
126
|
+
- Benchmark 没有 GPU 要求;资源成本极低
|
|
127
|
+
- 执行时间与网格大小 M 和样本大小相关
|
|
128
|
+
- OSQP 求解器收敛可能随数据维度而变化
|
|
129
|
+
recommended_when: 当您需要对 Wasserstein 空间中的分布数据进行操作的、统计计算量大的迁移学习任务时,请使用此基准。适用于评估使用最优传输几何从协变量预测概率分布的方法。非常适合处理死亡率曲线、体力活动分布或其他分布响应数据,其中源领域知识可以改进目标预测。基于 R 的执行使其无需 GPU 基础设施即可使用。
|
|
130
|
+
not_recommended_when: 如果您需要基于神经网络的基准测试、深度学习工作流程或 CUDA 密集型训练,请勿使用此基准测试。不适合需要 GPU 加速或基于 PyTorch 的实现的任务。如果您的研究重点是标量/向量响应而不是非欧几里得空间中的分布输出,请避免使用。
|
|
131
|
+
paper:
|
|
132
|
+
title: Wasserstein Transfer Learning
|
|
133
|
+
authors:
|
|
134
|
+
- Kaicheng Zhang (Zhejiang University)
|
|
135
|
+
- Sinian Zhang (University of Minnesota)
|
|
136
|
+
- Doudou Zhou (National University of Singapore)
|
|
137
|
+
- Yidong Zhou (UC Davis)
|
|
138
|
+
venue: arXiv preprint
|
|
139
|
+
year: 2025
|
|
140
|
+
url: https://arxiv.org/abs/2505.17404
|
|
141
|
+
github: https://github.com/h7nian/WaTL
|
|
142
|
+
display:
|
|
143
|
+
palette_seed: teal-stone-wasserstein
|
|
144
|
+
art_style: statistical-transport
|
|
145
|
+
accent_priority: medium
|
|
146
|
+
image_path: ../image/097_aisb.t3.097_wassersteintl.jpg
|
|
147
|
+
capability_tags:
|
|
148
|
+
- transfer_learning
|
|
149
|
+
- wasserstein_geometry
|
|
150
|
+
- distributional_learning
|
|
151
|
+
- statistical_modeling
|
|
152
|
+
- optimal_transport
|
|
153
|
+
- frechet_regression
|
|
154
|
+
- non_euclidean_output
|
|
155
|
+
aisb_direction: T3
|
|
156
|
+
track_fit:
|
|
157
|
+
- paper_track
|
|
158
|
+
- benchmark_track
|
|
159
|
+
commercial:
|
|
160
|
+
annual_fee: null
|
|
161
|
+
download:
|
|
162
|
+
provider: github_release
|
|
163
|
+
repo: ResearAI/DeepScientist
|
|
164
|
+
tag: aisb-v0.0.1
|
|
165
|
+
asset_name: aisb.t3.097_wassersteintl.zip
|
|
166
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.097_wassersteintl.zip
|
|
167
|
+
archive_type: zip
|
|
168
|
+
sha256: 7878e684e20e96ca4ea5aa2ea5f33a4772d22a14b5bf6ab275a68664de302887
|
|
169
|
+
size_bytes: 104086
|
|
@@ -0,0 +1,171 @@
|
|
|
1
|
+
id: aisb.t3.098_xmahalanobis
|
|
2
|
+
name: 'X-Mahalanobis: Transformer Feature Mixing for Reliable OOD Detection'
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: Adaptive transformer layer fusion with Mahalanobis distance scoring for
|
|
5
|
+
state-of-the-art out-of-distribution detection.
|
|
6
|
+
task_description: 'This packaged benchmark covers transformer-based out-of-distribution
|
|
7
|
+
(OOD) detection through an adaptive fusion module that dynamically assigns importance
|
|
8
|
+
weights to representations learned by each Transformer layer. The method detects
|
|
9
|
+
OOD samples using Mahalanobis distance scoring across multiple intermediate layers,
|
|
10
|
+
moving beyond reliance on final-layer features alone. The benchmark supports parameter-efficient
|
|
11
|
+
fine-tuning (PEFT) strategies including AdaptFormer, LoRA, Adapter, Visual Prompt
|
|
12
|
+
Tuning (VPT), bias tuning, and full fine-tuning. Evaluation is conducted on class-balanced
|
|
13
|
+
(CIFAR100) and long-tailed (ImageNet-LT) in-distribution classification tasks against
|
|
14
|
+
nine diverse OOD datasets, reporting AUROC and FPR95 metrics.
|
|
15
|
+
|
|
16
|
+
'
|
|
17
|
+
task_mode: experiment_driven
|
|
18
|
+
requires_execution: true
|
|
19
|
+
requires_paper: true
|
|
20
|
+
integrity_level: cas_plus_canary
|
|
21
|
+
snapshot_status: external_eval_required
|
|
22
|
+
support_level: advanced
|
|
23
|
+
time_band: 6-24h
|
|
24
|
+
cost_band: medium
|
|
25
|
+
difficulty: medium
|
|
26
|
+
data_access: public
|
|
27
|
+
primary_outputs:
|
|
28
|
+
- auroc
|
|
29
|
+
- fpr95
|
|
30
|
+
- ood_detection_checkpoint
|
|
31
|
+
launch_profiles:
|
|
32
|
+
- id: quick_eval
|
|
33
|
+
label: Quick Eval
|
|
34
|
+
description: 'Run OOD detection evaluation on a prepared checkpoint using main_test.py.
|
|
35
|
+
Requires trained model weights and config alignment with training setup. Suitable
|
|
36
|
+
for evaluating baselines or comparing fine-tuned checkpoints.
|
|
37
|
+
|
|
38
|
+
'
|
|
39
|
+
estimated_time: 1-2h
|
|
40
|
+
compute_profile: quick_eval
|
|
41
|
+
- id: train_and_test
|
|
42
|
+
label: Train + Test
|
|
43
|
+
description: 'Full PEFT training workflow on CIFAR100 or ImageNet-LT followed by
|
|
44
|
+
OOD evaluation. Supports AdaptFormer (default), LoRA, Adapter, VPT, bias tuning,
|
|
45
|
+
and full fine-tuning. Trains ViT-B/16 (IN21K pretrained or CLIP pretrained) and
|
|
46
|
+
evaluates against multiple OOD datasets.
|
|
47
|
+
|
|
48
|
+
'
|
|
49
|
+
estimated_time: 6-18h
|
|
50
|
+
compute_profile: full_training
|
|
51
|
+
dataset_download:
|
|
52
|
+
primary_method: bundled
|
|
53
|
+
sources:
|
|
54
|
+
- cifar100: torchvision datasets (auto-download)
|
|
55
|
+
- imagenet_lt: requires manual download from ImageNet, LT split preconfigured in
|
|
56
|
+
configs
|
|
57
|
+
- ood_datasets: preconfigured in evaluation pipeline (e.g., SVHN, LSUN, iNaturalist)
|
|
58
|
+
notes:
|
|
59
|
+
- CIFAR100 downloads automatically via torchvision
|
|
60
|
+
- ImageNet-LT requires manual download from ImageNet official source
|
|
61
|
+
- OOD test datasets (TIN, SVHN, LSUN, etc.) handled by evaluation script
|
|
62
|
+
- Data configs located in configs/data/ (cifar100.yaml, imagenet_lt.yaml, imagenet.yaml)
|
|
63
|
+
credential_requirements:
|
|
64
|
+
mode: none
|
|
65
|
+
items: []
|
|
66
|
+
notes:
|
|
67
|
+
- ImageNet download may require academic registration
|
|
68
|
+
- All other datasets are publicly accessible or auto-downloaded
|
|
69
|
+
resources:
|
|
70
|
+
minimum:
|
|
71
|
+
cpu_cores: 8
|
|
72
|
+
ram_gb: 32
|
|
73
|
+
disk_gb: 80
|
|
74
|
+
gpu_count: 1
|
|
75
|
+
gpu_vram_gb: 16
|
|
76
|
+
notes: Supports single-GPU execution for quick_eval and small-scale training
|
|
77
|
+
recommended:
|
|
78
|
+
cpu_cores: 16
|
|
79
|
+
ram_gb: 64
|
|
80
|
+
disk_gb: 150
|
|
81
|
+
gpu_count: 1
|
|
82
|
+
gpu_vram_gb: 24
|
|
83
|
+
notes: '24GB VRAM recommended for batch_size 64 with full PEFT methods on ImageNet-LT.
|
|
84
|
+
AdaptFormer training at lr 0.1 for 20 epochs on ImageNet-LT with CLIP ViT-B/16
|
|
85
|
+
is the most demanding configuration.
|
|
86
|
+
|
|
87
|
+
'
|
|
88
|
+
environment:
|
|
89
|
+
python: '3.9'
|
|
90
|
+
cuda: '11.8'
|
|
91
|
+
pytorch: '2.0'
|
|
92
|
+
flash_attn: null
|
|
93
|
+
key_packages:
|
|
94
|
+
- torch>=2.0
|
|
95
|
+
- torchvision
|
|
96
|
+
- numpy
|
|
97
|
+
- scikit-learn
|
|
98
|
+
- scipy
|
|
99
|
+
- timm
|
|
100
|
+
- open_clip_torch
|
|
101
|
+
notes:
|
|
102
|
+
- See bundled requirements.txt or README for full dependency set
|
|
103
|
+
- open_clip_torch required for CLIP ViT-B/16 model support
|
|
104
|
+
- timm required for IN21K ViT-B/16 pretrained models
|
|
105
|
+
risk_flags:
|
|
106
|
+
- long_runtime
|
|
107
|
+
- gpu_memory_sensitive
|
|
108
|
+
- config_sensitivity
|
|
109
|
+
risk_notes:
|
|
110
|
+
- Full training on ImageNet-LT with 20 epochs may take 12-18 hours
|
|
111
|
+
- Batch size 64 on 24GB GPU requires AdaptFormer PEFT; full fine-tuning may OOM
|
|
112
|
+
- Config alignment between train and test is critical; mismatched configs produce
|
|
113
|
+
invalid results
|
|
114
|
+
- PEFT method flags (adaptformer, lora, adapter, etc.) must be explicitly set per
|
|
115
|
+
experiment
|
|
116
|
+
- Seed setting via --seed flag available but not enforced; reproducibility requires
|
|
117
|
+
manual seed setting
|
|
118
|
+
recommended_when: 'Use this benchmark when developing transformer-based reliability
|
|
119
|
+
and OOD detection methods. Particularly suited for research on: (1) adaptive layer
|
|
120
|
+
fusion strategies, (2) Mahalanobis-based OOD scoring, (3) parameter-efficient fine-tuning
|
|
121
|
+
for out-of-distribution generalization, (4) comparing shallow vs. deep transformer
|
|
122
|
+
representations, and (5) benchmarking OOD detection under class-imbalanced (long-tailed)
|
|
123
|
+
distributions.
|
|
124
|
+
|
|
125
|
+
'
|
|
126
|
+
not_recommended_when: 'Do not use this benchmark for: (1) text-only reliability tasks
|
|
127
|
+
(OOD detection here is vision-only), (2) non-transformer architectures (pure CNN-based
|
|
128
|
+
methods), (3) tasks requiring OOD detection without fine-tuning (zero-shot OOD evaluation),
|
|
129
|
+
or (4) resource-constrained environments without GPU access.
|
|
130
|
+
|
|
131
|
+
'
|
|
132
|
+
paper:
|
|
133
|
+
title: 'X-Mahalanobis: Transformer Feature Mixing for Reliable OOD Detection'
|
|
134
|
+
venue: NeurIPS 2025
|
|
135
|
+
year: 2025
|
|
136
|
+
url: https://arxiv.org/abs/2505.09128
|
|
137
|
+
notes: 'NeurIPS 2025 publication; benchmark packages official implementation from
|
|
138
|
+
the paper. Experiments demonstrate SOTA OOD detection across nine OOD datasets.
|
|
139
|
+
|
|
140
|
+
'
|
|
141
|
+
download:
|
|
142
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.098_xmahalanobis.zip
|
|
143
|
+
archive_type: zip
|
|
144
|
+
local_dir_name: paper-98-XMahalanobis
|
|
145
|
+
notes: 'Bundled archive includes full training/test code, configs, utility modules,
|
|
146
|
+
and pretrained model loading support for CLIP and IN21K ViT variants.
|
|
147
|
+
|
|
148
|
+
'
|
|
149
|
+
provider: github_release
|
|
150
|
+
repo: ResearAI/DeepScientist
|
|
151
|
+
tag: aisb-v0.0.1
|
|
152
|
+
asset_name: aisb.t3.098_xmahalanobis.zip
|
|
153
|
+
sha256: c65b3f81a78754d84bff9a76b8a0c13e180f6b3b6d379801647ed189b1f4741e
|
|
154
|
+
size_bytes: 1420263
|
|
155
|
+
display:
|
|
156
|
+
palette_seed: cobalt-silver-mahalanobis
|
|
157
|
+
art_style: reliability-vision
|
|
158
|
+
accent_priority: high
|
|
159
|
+
image_path: ../image/098_aisb.t3.098_xmahalanobis.jpg
|
|
160
|
+
capability_tags:
|
|
161
|
+
- ood_detection
|
|
162
|
+
- transformers
|
|
163
|
+
- computer_vision
|
|
164
|
+
- reliable_ml
|
|
165
|
+
- parameter_efficient_finetuning
|
|
166
|
+
- layer_fusion
|
|
167
|
+
- mahalanobis_distance
|
|
168
|
+
aisb_direction: T3
|
|
169
|
+
track_fit:
|
|
170
|
+
- paper_track
|
|
171
|
+
- benchmark_track
|
|
@@ -0,0 +1,127 @@
|
|
|
1
|
+
id: aisb.t3.098_xmahalanobis
|
|
2
|
+
name: X-Mahalanobis:用于可靠 OOD 检测的 Transformer 特征混合
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: 自适应 Transformer 层融合与马哈拉诺比斯距离评分,用于最先进的分布外检测。
|
|
5
|
+
task_description: 该打包基准测试通过自适应融合模块涵盖基于 Transformer 的分布外 (OOD) 检测,该模块动态地将重要性权重分配给每个 Transformer 层学习的表示。该方法使用跨多个中间层的马哈拉诺比斯距离评分来检测 OOD 样本,不再仅仅依赖最终层特征。该基准测试支持参数高效微调 (PEFT) 策略,包括 AdaptFormer、LoRA、Adapter、视觉提示调整 (VPT)、偏置调整和完全微调。针对九个不同的 OOD 数据集对类平衡 (CIFAR100) 和长尾 (ImageNet-LT) 分布内分类任务进行评估,报告 AUROC 和 FPR95 指标。
|
|
6
|
+
task_mode: experiment_driven
|
|
7
|
+
requires_execution: true
|
|
8
|
+
requires_paper: true
|
|
9
|
+
integrity_level: cas_plus_canary
|
|
10
|
+
snapshot_status: external_eval_required
|
|
11
|
+
support_level: advanced
|
|
12
|
+
time_band: 6-24h
|
|
13
|
+
cost_band: medium
|
|
14
|
+
difficulty: medium
|
|
15
|
+
data_access: public
|
|
16
|
+
primary_outputs:
|
|
17
|
+
- auroc
|
|
18
|
+
- fpr95
|
|
19
|
+
- ood_detection_checkpoint
|
|
20
|
+
launch_profiles:
|
|
21
|
+
- id: quick_eval
|
|
22
|
+
label: 快速评估
|
|
23
|
+
description: 使用 main_test.py 在准备好的检查点上运行 OOD 检测评估。需要经过训练的模型权重和配置与训练设置保持一致。适合评估基线或比较微调的检查点。
|
|
24
|
+
estimated_time: 1-2h
|
|
25
|
+
compute_profile: quick_eval
|
|
26
|
+
- id: train_and_test
|
|
27
|
+
label: 训练+测试
|
|
28
|
+
description: CIFAR100 或 ImageNet-LT 上的完整 PEFT 训练工作流程,然后进行 OOD 评估。支持AdaptFormer(默认)、LoRA、Adapter、VPT、偏置调整和全面微调。训练 ViT-B/16(IN21K 预训练或 CLIP 预训练)并针对多个 OOD 数据集进行评估。
|
|
29
|
+
estimated_time: 6-18h
|
|
30
|
+
compute_profile: full_training
|
|
31
|
+
dataset_download:
|
|
32
|
+
primary_method: bundled
|
|
33
|
+
sources:
|
|
34
|
+
- cifar100: torchvision datasets (auto-download)
|
|
35
|
+
- imagenet_lt: requires manual download from ImageNet, LT split preconfigured in configs
|
|
36
|
+
- ood_datasets: preconfigured in evaluation pipeline (e.g., SVHN, LSUN, iNaturalist)
|
|
37
|
+
notes:
|
|
38
|
+
- CIFAR100 通过 torchvision 自动下载
|
|
39
|
+
- ImageNet-LT需要从ImageNet官方源手动下载
|
|
40
|
+
- OOD 测试数据集(TIN、SVHN、LSUN 等)由评估脚本处理
|
|
41
|
+
- 数据配置位于 configs/data/ (cifar100.yaml, imagenet_lt.yaml, imagenet.yaml)
|
|
42
|
+
credential_requirements:
|
|
43
|
+
mode: none
|
|
44
|
+
items: []
|
|
45
|
+
notes:
|
|
46
|
+
- ImageNet 下载可能需要学术注册
|
|
47
|
+
- 所有其他数据集均可公开访问或自动下载
|
|
48
|
+
resources:
|
|
49
|
+
minimum:
|
|
50
|
+
cpu_cores: 8
|
|
51
|
+
ram_gb: 32
|
|
52
|
+
disk_gb: 80
|
|
53
|
+
gpu_count: 1
|
|
54
|
+
gpu_vram_gb: 16
|
|
55
|
+
notes: 支持单 GPU 执行 quick_eval 和小规模训练
|
|
56
|
+
recommended:
|
|
57
|
+
cpu_cores: 16
|
|
58
|
+
ram_gb: 64
|
|
59
|
+
disk_gb: 150
|
|
60
|
+
gpu_count: 1
|
|
61
|
+
gpu_vram_gb: 24
|
|
62
|
+
notes: 建议 batch_size 64 使用 24GB VRAM,在 ImageNet-LT 上使用完整的 PEFT 方法。 AdaptFormer 使用 CLIP ViT-B/16 在 ImageNet-LT 上以 lr 0.1 进行 20 个周期的训练是要求最高的配置。
|
|
63
|
+
environment:
|
|
64
|
+
python: '3.9'
|
|
65
|
+
cuda: '11.8'
|
|
66
|
+
pytorch: '2.0'
|
|
67
|
+
flash_attn: null
|
|
68
|
+
key_packages:
|
|
69
|
+
- torch>=2.0
|
|
70
|
+
- torchvision
|
|
71
|
+
- numpy
|
|
72
|
+
- scikit-learn
|
|
73
|
+
- scipy
|
|
74
|
+
- timm
|
|
75
|
+
- open_clip_torch
|
|
76
|
+
notes:
|
|
77
|
+
- 请参阅捆绑的 requirements.txt 或 README 以获取完整的依赖项集
|
|
78
|
+
- CLIP ViT-B/16 模型支持需要 open_clip_torch
|
|
79
|
+
- IN21K ViT-B/16 预训练模型需要 timm
|
|
80
|
+
risk_flags:
|
|
81
|
+
- long_runtime
|
|
82
|
+
- gpu_memory_sensitive
|
|
83
|
+
- config_sensitivity
|
|
84
|
+
risk_notes:
|
|
85
|
+
- 对 ImageNet-LT 进行 20 个 epoch 的完整训练可能需要 12-18 小时
|
|
86
|
+
- 24GB GPU 上的批量大小 64 需要 AdaptFormer PEFT;完全微调可能会OOM
|
|
87
|
+
- 训练和测试之间的配置对齐至关重要;不匹配的配置会产生无效结果
|
|
88
|
+
- 每个实验必须明确设置 PEFT 方法标志(adaptformer、lora、adapter 等)
|
|
89
|
+
- 可通过 --seed 标志设置种子,但不强制执行;可复现性需要手动设置随机种子
|
|
90
|
+
recommended_when: 开发基于 Transformer 的可靠性和 OOD 检测方法时使用此基准。特别适合研究:(1) 自适应层融合策略,(2) 基于 Mahalanobis 的 OOD 评分,(3) 针对分布外泛化的参数高效微调,(4) 比较浅层和深层 Transformer 表示,以及 (5) 类不平衡(长尾)分布下的 OOD 检测基准测试。
|
|
91
|
+
not_recommended_when: 请勿将此基准用于:(1) 纯文本可靠性任务(此处的 OOD 检测仅针对视觉)、(2) 非 Transformer 架构(纯基于 CNN 的方法)、(3) 需要无需微调的 OOD 检测的任务(零样本 OOD 评估)或 (4) 无法访问 GPU 的资源受限环境。
|
|
92
|
+
paper:
|
|
93
|
+
title: 'X-Mahalanobis: Transformer Feature Mixing for Reliable OOD Detection'
|
|
94
|
+
venue: NeurIPS 2025
|
|
95
|
+
year: 2025
|
|
96
|
+
url: https://arxiv.org/abs/2505.09128
|
|
97
|
+
notes: NeurIPS 2025 论文;该基准打包了论文的官方实现。实验表明其在九个 OOD 数据集上取得了 SOTA 的 OOD 检测效果。
|
|
98
|
+
download:
|
|
99
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.098_xmahalanobis.zip
|
|
100
|
+
archive_type: zip
|
|
101
|
+
local_dir_name: paper-98-XMahalanobis
|
|
102
|
+
notes: 'Bundled archive includes full training/test code, configs, utility modules, and pretrained model loading support for CLIP and IN21K ViT variants.
|
|
103
|
+
|
|
104
|
+
'
|
|
105
|
+
provider: github_release
|
|
106
|
+
repo: ResearAI/DeepScientist
|
|
107
|
+
tag: aisb-v0.0.1
|
|
108
|
+
asset_name: aisb.t3.098_xmahalanobis.zip
|
|
109
|
+
sha256: c65b3f81a78754d84bff9a76b8a0c13e180f6b3b6d379801647ed189b1f4741e
|
|
110
|
+
size_bytes: 1420263
|
|
111
|
+
display:
|
|
112
|
+
palette_seed: cobalt-silver-mahalanobis
|
|
113
|
+
art_style: reliability-vision
|
|
114
|
+
accent_priority: high
|
|
115
|
+
image_path: ../image/098_aisb.t3.098_xmahalanobis.jpg
|
|
116
|
+
capability_tags:
|
|
117
|
+
- ood_detection
|
|
118
|
+
- transformers
|
|
119
|
+
- computer_vision
|
|
120
|
+
- reliable_ml
|
|
121
|
+
- parameter_efficient_finetuning
|
|
122
|
+
- layer_fusion
|
|
123
|
+
- mahalanobis_distance
|
|
124
|
+
aisb_direction: T3
|
|
125
|
+
track_fit:
|
|
126
|
+
- paper_track
|
|
127
|
+
- benchmark_track
|