@researai/deepscientist 1.5.17 → 1.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +309 -130
- package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
- package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
- package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
- package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
- package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
- package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
- package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
- package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
- package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
- package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
- package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
- package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
- package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
- package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
- package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
- package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
- package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
- package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
- package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
- package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
- package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
- package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
- package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
- package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
- package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
- package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
- package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
- package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
- package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
- package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
- package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
- package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
- package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
- package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
- package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
- package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
- package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
- package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
- package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
- package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
- package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
- package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
- package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
- package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
- package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
- package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
- package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
- package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
- package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
- package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
- package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
- package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
- package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
- package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
- package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
- package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
- package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
- package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
- package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
- package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
- package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
- package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
- package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
- package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
- package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
- package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
- package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
- package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
- package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
- package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
- package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
- package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
- package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
- package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
- package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
- package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
- package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
- package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
- package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
- package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
- package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
- package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
- package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
- package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
- package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
- package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
- package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
- package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
- package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
- package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
- package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
- package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
- package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
- package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
- package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
- package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
- package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
- package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
- package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
- package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
- package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
- package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
- package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
- package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
- package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
- package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
- package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
- package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
- package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
- package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
- package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
- package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
- package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
- package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
- package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
- package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
- package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
- package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
- package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
- package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
- package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
- package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
- package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
- package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
- package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
- package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
- package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
- package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
- package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
- package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
- package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
- package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
- package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
- package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
- package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
- package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
- package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
- package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
- package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
- package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
- package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
- package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
- package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
- package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
- package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
- package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
- package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
- package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
- package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
- package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
- package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
- package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
- package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
- package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
- package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
- package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
- package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
- package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
- package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
- package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
- package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
- package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
- package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
- package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
- package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
- package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
- package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
- package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
- package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
- package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
- package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
- package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
- package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
- package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
- package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
- package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
- package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
- package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
- package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
- package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
- package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
- package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
- package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
- package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
- package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
- package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
- package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
- package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
- package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
- package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
- package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
- package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
- package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
- package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
- package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
- package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
- package/AISB/image/aisb.b10.climate_earth.svg +16 -0
- package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
- package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
- package/AISB/image/aisb.b2.agent_systems.svg +16 -0
- package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
- package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
- package/AISB/image/aisb.b5.math_proof.svg +16 -0
- package/AISB/image/aisb.b6.research_process.svg +16 -0
- package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
- package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
- package/AISB/image/aisb.b9.material_science.svg +16 -0
- package/README.md +132 -11
- package/bin/ds.js +376 -49
- package/docs/en/00_QUICK_START.md +135 -18
- package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
- package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
- package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
- package/docs/en/05_TUI_GUIDE.md +171 -2
- package/docs/en/07_MEMORY_AND_MCP.md +38 -2
- package/docs/en/09_DOCTOR.md +64 -4
- package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
- package/docs/en/11_LICENSE_AND_RISK.md +4 -0
- package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/en/15_CODEX_PROVIDER_SETUP.md +622 -187
- package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
- package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
- package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
- package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
- package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
- package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
- package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
- package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
- package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
- package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
- package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
- package/docs/en/91_DEVELOPMENT.md +29 -0
- package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
- package/docs/en/README.md +44 -7
- package/docs/images/admin/admin-connectors-health-en.png +0 -0
- package/docs/images/admin/admin-controllers-en.png +0 -0
- package/docs/images/admin/admin-diagnostics-en.png +0 -0
- package/docs/images/admin/admin-errors-en.png +0 -0
- package/docs/images/admin/admin-issues-en.png +0 -0
- package/docs/images/admin/admin-logs-en.png +0 -0
- package/docs/images/admin/admin-quest-detail-en.png +0 -0
- package/docs/images/admin/admin-quests-en.png +0 -0
- package/docs/images/admin/admin-repairs-en.png +0 -0
- package/docs/images/admin/admin-runtime-en.png +0 -0
- package/docs/images/admin/admin-search-en.png +0 -0
- package/docs/images/admin/admin-stats-en.png +0 -0
- package/docs/images/admin/admin-summary-en.png +0 -0
- package/docs/images/connectors/connector-discord-en.png +0 -0
- package/docs/images/connectors/connector-feishu-en.png +0 -0
- package/docs/images/connectors/connector-lingzhu-en.png +0 -0
- package/docs/images/connectors/connector-qq-en.png +0 -0
- package/docs/images/connectors/connector-slack-en.png +0 -0
- package/docs/images/connectors/connector-telegram-en.png +0 -0
- package/docs/images/connectors/connector-weixin-en.png +0 -0
- package/docs/images/connectors/connector-whatsapp-en.png +0 -0
- package/docs/images/settings/settings-baselines-en.png +0 -0
- package/docs/images/settings/settings-config-en.png +0 -0
- package/docs/images/settings/settings-connectors-overview-en.png +0 -0
- package/docs/images/settings/settings-deepxiv-en.png +0 -0
- package/docs/images/settings/settings-mcp-servers-en.png +0 -0
- package/docs/images/settings/settings-plugins-en.png +0 -0
- package/docs/images/settings/settings-runners-en.png +0 -0
- package/docs/zh/00_QUICK_START.md +92 -17
- package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
- package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/zh/05_TUI_GUIDE.md +171 -2
- package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
- package/docs/zh/09_DOCTOR.md +39 -4
- package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
- package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
- package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/zh/15_CODEX_PROVIDER_SETUP.md +550 -188
- package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
- package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
- package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
- package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
- package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
- package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
- package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
- package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
- package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
- package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
- package/docs/zh/README.md +29 -7
- package/install.sh +122 -16
- package/package.json +4 -1
- package/pyproject.toml +2 -1
- package/src/deepscientist/__init__.py +1 -1
- package/src/deepscientist/acp/envelope.py +13 -0
- package/src/deepscientist/admin/__init__.py +3 -0
- package/src/deepscientist/admin/charts.py +681 -0
- package/src/deepscientist/admin/logs.py +119 -0
- package/src/deepscientist/admin/repairs.py +217 -0
- package/src/deepscientist/admin/service.py +1310 -0
- package/src/deepscientist/admin/system_info.py +700 -0
- package/src/deepscientist/admin/tasks.py +465 -0
- package/src/deepscientist/admin/tool_metrics.py +600 -0
- package/src/deepscientist/artifact/guidance.py +8 -4
- package/src/deepscientist/artifact/schemas.py +115 -0
- package/src/deepscientist/artifact/service.py +4268 -260
- package/src/deepscientist/bash_exec/monitor.py +30 -3
- package/src/deepscientist/bash_exec/service.py +134 -1
- package/src/deepscientist/benchstore/__init__.py +4 -0
- package/src/deepscientist/benchstore/prompt_builder.py +224 -0
- package/src/deepscientist/benchstore/service.py +1716 -0
- package/src/deepscientist/channels/weixin_ilink.py +8 -1
- package/src/deepscientist/cli.py +92 -17
- package/src/deepscientist/codex_cli_compat.py +2 -2
- package/src/deepscientist/config/models.py +82 -11
- package/src/deepscientist/config/service.py +927 -91
- package/src/deepscientist/connector/weixin_support.py +48 -17
- package/src/deepscientist/daemon/api/handlers.py +697 -210
- package/src/deepscientist/daemon/api/router.py +76 -1
- package/src/deepscientist/daemon/app.py +1054 -51
- package/src/deepscientist/diagnostics/runner_failures.py +147 -0
- package/src/deepscientist/doctor.py +212 -65
- package/src/deepscientist/evidence_packets.py +590 -0
- package/src/deepscientist/home.py +52 -4
- package/src/deepscientist/kimi_cli_compat.py +50 -0
- package/src/deepscientist/latex_runtime.py +2 -2
- package/src/deepscientist/mcp/context.py +2 -0
- package/src/deepscientist/mcp/schemas.py +114 -0
- package/src/deepscientist/mcp/server.py +1566 -126
- package/src/deepscientist/memory/service.py +203 -16
- package/src/deepscientist/process_control.py +8 -1
- package/src/deepscientist/prompts/builder.py +836 -92
- package/src/deepscientist/quest/__init__.py +2 -2
- package/src/deepscientist/quest/layout.py +12 -1
- package/src/deepscientist/quest/node_traces.py +10 -0
- package/src/deepscientist/quest/service.py +1430 -139
- package/src/deepscientist/quest/stage_views.py +1 -1
- package/src/deepscientist/runners/__init__.py +18 -0
- package/src/deepscientist/runners/base.py +89 -1
- package/src/deepscientist/runners/builtins.py +13 -1
- package/src/deepscientist/runners/claude.py +391 -0
- package/src/deepscientist/runners/codex.py +421 -21
- package/src/deepscientist/runners/codex_telemetry.py +127 -0
- package/src/deepscientist/runners/kimi.py +334 -0
- package/src/deepscientist/runners/metadata.py +68 -0
- package/src/deepscientist/runners/opencode.py +414 -0
- package/src/deepscientist/runners/runtime_overrides.py +100 -0
- package/src/deepscientist/runners/simple_cli.py +538 -0
- package/src/deepscientist/runtime_storage.py +303 -0
- package/src/deepscientist/shared.py +61 -16
- package/src/deepscientist/skills/installer.py +37 -0
- package/src/deepscientist/skills/registry.py +2 -0
- package/src/deepscientist/tinytex.py +2 -2
- package/src/deepscientist/tui.py +10 -3
- package/src/prompts/benchstore/system.md +77 -0
- package/src/prompts/connectors/qq.md +33 -2
- package/src/prompts/connectors/weixin.md +208 -23
- package/src/prompts/contracts/admin_ops.md +74 -0
- package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
- package/src/prompts/contracts/shared_interaction.md +5 -11
- package/src/prompts/start_setup/system.md +422 -0
- package/src/prompts/system.md +409 -315
- package/src/prompts/system_copilot.md +88 -12
- package/src/skills/analysis-campaign/SKILL.md +239 -578
- package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
- package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
- package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
- package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
- package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
- package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
- package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
- package/src/skills/baseline/SKILL.md +183 -461
- package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
- package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
- package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
- package/src/skills/baseline/references/baseline-plan-template.md +37 -76
- package/src/skills/baseline/references/boundary-cases.md +86 -0
- package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
- package/src/skills/baseline/references/comparability-contract.md +7 -12
- package/src/skills/baseline/references/operational-guidance.md +56 -0
- package/src/skills/baseline/references/route-selection.md +5 -25
- package/src/skills/decision/SKILL.md +113 -306
- package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
- package/src/skills/decision/references/operational-guidance.md +94 -0
- package/src/skills/decision/references/research-route-criteria.md +7 -8
- package/src/skills/decision/references/strategic-decision-template.md +13 -26
- package/src/skills/experiment/SKILL.md +132 -670
- package/src/skills/experiment/references/execution-playbook.md +374 -0
- package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
- package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
- package/src/skills/experiment/references/operational-guidance.md +108 -0
- package/src/skills/finalize/SKILL.md +62 -0
- package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
- package/src/skills/finalize/references/resume-packet-template.md +7 -0
- package/src/skills/idea/SKILL.md +228 -15
- package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
- package/src/skills/idea/references/current-board-packet-template.md +61 -0
- package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
- package/src/skills/idea/references/idea-generation-playbook.md +21 -0
- package/src/skills/idea/references/idea-thinking-flow.md +6 -0
- package/src/skills/idea/references/literature-survey-template.md +3 -0
- package/src/skills/idea/references/objective-contract-template.md +54 -0
- package/src/skills/idea/references/outline-seeding-example.md +56 -0
- package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
- package/src/skills/idea/references/related-work-playbook.md +75 -2
- package/src/skills/idea/references/research-history-playbook.md +114 -0
- package/src/skills/idea/references/selection-gate.md +58 -6
- package/src/skills/intake-audit/SKILL.md +43 -2
- package/src/skills/intake-audit/references/state-audit-template.md +10 -0
- package/src/skills/nature-data/SKILL.md +128 -0
- package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-data/agents/openai.yaml +4 -0
- package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
- package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
- package/src/skills/nature-data/references/policy-principles.md +103 -0
- package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
- package/src/skills/nature-data/references/source-basis.md +54 -0
- package/src/skills/nature-data/references/statement-patterns.md +153 -0
- package/src/skills/nature-figure/SKILL.md +197 -0
- package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-figure/agents/openai.yaml +4 -0
- package/src/skills/nature-figure/evals/evals.json +37 -0
- package/src/skills/nature-figure/references/api.md +428 -0
- package/src/skills/nature-figure/references/backend-selection.md +100 -0
- package/src/skills/nature-figure/references/chart-types.md +281 -0
- package/src/skills/nature-figure/references/common-patterns.md +349 -0
- package/src/skills/nature-figure/references/design-theory.md +436 -0
- package/src/skills/nature-figure/references/figure-contract.md +93 -0
- package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
- package/src/skills/nature-figure/references/qa-contract.md +119 -0
- package/src/skills/nature-figure/references/r-template-index.md +66 -0
- package/src/skills/nature-figure/references/r-workflow.md +161 -0
- package/src/skills/nature-figure/references/tutorials.md +250 -0
- package/src/skills/nature-paper2ppt/SKILL.md +507 -0
- package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/SKILL.md +385 -0
- package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-polishing/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
- package/src/skills/nature-polishing/references/section-moves.md +240 -0
- package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
- package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
- package/src/skills/optimize/SKILL.md +177 -1568
- package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
- package/src/skills/optimize/references/candidate-board-template.md +13 -0
- package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
- package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
- package/src/skills/optimize/references/debug-response-template.md +29 -0
- package/src/skills/optimize/references/frontier-review-template.md +32 -0
- package/src/skills/optimize/references/fusion-playbook.md +36 -0
- package/src/skills/optimize/references/method-brief-template.md +73 -0
- package/src/skills/optimize/references/operational-guidance.md +621 -0
- package/src/skills/optimize/references/optimization-memory-template.md +30 -0
- package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
- package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
- package/src/skills/optimize/references/prompt-patterns.md +49 -0
- package/src/skills/paper-outline/SKILL.md +227 -0
- package/src/skills/paper-outline/references/outline-patterns.md +87 -0
- package/src/skills/paper-plot/SKILL.md +79 -0
- package/src/skills/paper-plot/agents/openai.yaml +4 -0
- package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
- package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
- package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
- package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
- package/src/skills/paper-plot/references/line_training_curve.md +44 -0
- package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
- package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
- package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
- package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
- package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
- package/src/skills/paper-plot/scripts/line_aime.py +94 -0
- package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
- package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
- package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
- package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
- package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
- package/src/skills/rebuttal/SKILL.md +9 -0
- package/src/skills/references/tool-usage-by-stage.md +438 -0
- package/src/skills/review/SKILL.md +105 -7
- package/src/skills/science/PROVENANCE.md +44 -0
- package/src/skills/science/SKILL.md +137 -0
- package/src/skills/science/references/artifact-science-tool.md +110 -0
- package/src/skills/science/references/claim-type-discipline.md +56 -0
- package/src/skills/science/references/domain-index.md +422 -0
- package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
- package/src/skills/science/references/package-check-playbook.md +64 -0
- package/src/skills/science/references/package-index.min.json +3616 -0
- package/src/skills/science/references/packages/abinit.md +80 -0
- package/src/skills/science/references/packages/acts.md +73 -0
- package/src/skills/science/references/packages/aiida-core.md +80 -0
- package/src/skills/science/references/packages/alamode.md +80 -0
- package/src/skills/science/references/packages/amuse.md +88 -0
- package/src/skills/science/references/packages/anndata.md +88 -0
- package/src/skills/science/references/packages/arbor.md +80 -0
- package/src/skills/science/references/packages/arc.md +73 -0
- package/src/skills/science/references/packages/astropy.md +88 -0
- package/src/skills/science/references/packages/astroquery.md +88 -0
- package/src/skills/science/references/packages/atomate2.md +80 -0
- package/src/skills/science/references/packages/atomsmltr.md +73 -0
- package/src/skills/science/references/packages/awkward.md +73 -0
- package/src/skills/science/references/packages/batman.md +88 -0
- package/src/skills/science/references/packages/biopython.md +88 -0
- package/src/skills/science/references/packages/bloqade.md +73 -0
- package/src/skills/science/references/packages/brian2.md +73 -0
- package/src/skills/science/references/packages/bullet3.md +73 -0
- package/src/skills/science/references/packages/calculix.md +80 -0
- package/src/skills/science/references/packages/cantera.md +73 -0
- package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
- package/src/skills/science/references/packages/ccdproc.md +88 -0
- package/src/skills/science/references/packages/celerite2.md +88 -0
- package/src/skills/science/references/packages/cellrank.md +73 -0
- package/src/skills/science/references/packages/cesm.md +80 -0
- package/src/skills/science/references/packages/chemicals.md +73 -0
- package/src/skills/science/references/packages/chempy.md +73 -0
- package/src/skills/science/references/packages/cirq.md +73 -0
- package/src/skills/science/references/packages/coffea.md +73 -0
- package/src/skills/science/references/packages/cp2k.md +88 -0
- package/src/skills/science/references/packages/custodian.md +80 -0
- package/src/skills/science/references/packages/dart.md +73 -0
- package/src/skills/science/references/packages/datamol.md +88 -0
- package/src/skills/science/references/packages/dd4hep.md +73 -0
- package/src/skills/science/references/packages/dealii.md +80 -0
- package/src/skills/science/references/packages/deepchem.md +88 -0
- package/src/skills/science/references/packages/delphes.md +73 -0
- package/src/skills/science/references/packages/devito.md +80 -0
- package/src/skills/science/references/packages/dftb.md +88 -0
- package/src/skills/science/references/packages/dftd4.md +88 -0
- package/src/skills/science/references/packages/dftk-jl.md +80 -0
- package/src/skills/science/references/packages/dolfinx.md +80 -0
- package/src/skills/science/references/packages/drake.md +73 -0
- package/src/skills/science/references/packages/dumux.md +73 -0
- package/src/skills/science/references/packages/elk.md +80 -0
- package/src/skills/science/references/packages/elmerfem.md +80 -0
- package/src/skills/science/references/packages/enzo-e.md +88 -0
- package/src/skills/science/references/packages/espresso.md +80 -0
- package/src/skills/science/references/packages/exoplanet.md +88 -0
- package/src/skills/science/references/packages/fairroot.md +73 -0
- package/src/skills/science/references/packages/fbpic.md +80 -0
- package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
- package/src/skills/science/references/packages/geant4.md +73 -0
- package/src/skills/science/references/packages/geosx.md +80 -0
- package/src/skills/science/references/packages/gprmax.md +80 -0
- package/src/skills/science/references/packages/gromacs.md +80 -0
- package/src/skills/science/references/packages/gwaslab.md +73 -0
- package/src/skills/science/references/packages/gz-sim.md +73 -0
- package/src/skills/science/references/packages/hail.md +88 -0
- package/src/skills/science/references/packages/hiphive.md +80 -0
- package/src/skills/science/references/packages/hoomd-blue.md +80 -0
- package/src/skills/science/references/packages/itensor.md +73 -0
- package/src/skills/science/references/packages/itensors-jl.md +73 -0
- package/src/skills/science/references/packages/jdftx.md +73 -0
- package/src/skills/science/references/packages/jobflow.md +80 -0
- package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
- package/src/skills/science/references/packages/kite.md +80 -0
- package/src/skills/science/references/packages/kratos.md +80 -0
- package/src/skills/science/references/packages/kwant.md +73 -0
- package/src/skills/science/references/packages/lammps.md +80 -0
- package/src/skills/science/references/packages/lightkurve.md +88 -0
- package/src/skills/science/references/packages/limix.md +73 -0
- package/src/skills/science/references/packages/maxwelllink.md +80 -0
- package/src/skills/science/references/packages/mcdc.md +73 -0
- package/src/skills/science/references/packages/meep.md +80 -0
- package/src/skills/science/references/packages/mfem.md +80 -0
- package/src/skills/science/references/packages/mitgcm.md +73 -0
- package/src/skills/science/references/packages/modflow6.md +73 -0
- package/src/skills/science/references/packages/molecool.md +73 -0
- package/src/skills/science/references/packages/mom6.md +73 -0
- package/src/skills/science/references/packages/moose.md +80 -0
- package/src/skills/science/references/packages/mpas-model.md +73 -0
- package/src/skills/science/references/packages/mujoco.md +73 -0
- package/src/skills/science/references/packages/mumax3.md +73 -0
- package/src/skills/science/references/packages/nekrs.md +80 -0
- package/src/skills/science/references/packages/nessi.md +73 -0
- package/src/skills/science/references/packages/nest-simulator.md +73 -0
- package/src/skills/science/references/packages/netket.md +73 -0
- package/src/skills/science/references/packages/neuron.md +73 -0
- package/src/skills/science/references/packages/nextflow.md +88 -0
- package/src/skills/science/references/packages/nwchem.md +88 -0
- package/src/skills/science/references/packages/openbabel.md +88 -0
- package/src/skills/science/references/packages/openems.md +80 -0
- package/src/skills/science/references/packages/openff-toolkit.md +88 -0
- package/src/skills/science/references/packages/openfoam-dev.md +80 -0
- package/src/skills/science/references/packages/openmc.md +73 -0
- package/src/skills/science/references/packages/openmm.md +80 -0
- package/src/skills/science/references/packages/openmoc.md +73 -0
- package/src/skills/science/references/packages/openmx.md +80 -0
- package/src/skills/science/references/packages/opensees.md +80 -0
- package/src/skills/science/references/packages/opensn.md +80 -0
- package/src/skills/science/references/packages/opm-simulators.md +73 -0
- package/src/skills/science/references/packages/oqupy.md +73 -0
- package/src/skills/science/references/packages/packmol.md +80 -0
- package/src/skills/science/references/packages/palabos.md +80 -0
- package/src/skills/science/references/packages/parflow.md +80 -0
- package/src/skills/science/references/packages/pennylane.md +88 -0
- package/src/skills/science/references/packages/perceval.md +73 -0
- package/src/skills/science/references/packages/phono3py.md +73 -0
- package/src/skills/science/references/packages/phonopy.md +73 -0
- package/src/skills/science/references/packages/photutils.md +88 -0
- package/src/skills/science/references/packages/picongpu.md +80 -0
- package/src/skills/science/references/packages/plink-ng.md +88 -0
- package/src/skills/science/references/packages/precice.md +73 -0
- package/src/skills/science/references/packages/psc.md +80 -0
- package/src/skills/science/references/packages/psi4.md +88 -0
- package/src/skills/science/references/packages/pybinding.md +73 -0
- package/src/skills/science/references/packages/pyfr.md +80 -0
- package/src/skills/science/references/packages/pyhf.md +73 -0
- package/src/skills/science/references/packages/pyiron_base.md +80 -0
- package/src/skills/science/references/packages/pylcp.md +73 -0
- package/src/skills/science/references/packages/pylith.md +80 -0
- package/src/skills/science/references/packages/pynbody.md +88 -0
- package/src/skills/science/references/packages/pysam.md +88 -0
- package/src/skills/science/references/packages/pyscf.md +88 -0
- package/src/skills/science/references/packages/q-e.md +73 -0
- package/src/skills/science/references/packages/qibo.md +73 -0
- package/src/skills/science/references/packages/qiskit.md +73 -0
- package/src/skills/science/references/packages/quantica-jl.md +73 -0
- package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
- package/src/skills/science/references/packages/quimb.md +73 -0
- package/src/skills/science/references/packages/qulacs.md +73 -0
- package/src/skills/science/references/packages/qutip.md +73 -0
- package/src/skills/science/references/packages/rdkit.md +88 -0
- package/src/skills/science/references/packages/rmg-py.md +73 -0
- package/src/skills/science/references/packages/root.md +73 -0
- package/src/skills/science/references/packages/scanpy.md +88 -0
- package/src/skills/science/references/packages/scikit-allel.md +88 -0
- package/src/skills/science/references/packages/scikit-bio.md +88 -0
- package/src/skills/science/references/packages/scqubits.md +73 -0
- package/src/skills/science/references/packages/scuff-em.md +80 -0
- package/src/skills/science/references/packages/scvi-tools.md +73 -0
- package/src/skills/science/references/packages/seissol.md +73 -0
- package/src/skills/science/references/packages/sfepy.md +80 -0
- package/src/skills/science/references/packages/sisl.md +73 -0
- package/src/skills/science/references/packages/smilei.md +80 -0
- package/src/skills/science/references/packages/snakemake.md +88 -0
- package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
- package/src/skills/science/references/packages/specutils.md +88 -0
- package/src/skills/science/references/packages/spglib.md +80 -0
- package/src/skills/science/references/packages/squidpy.md +88 -0
- package/src/skills/science/references/packages/starry.md +88 -0
- package/src/skills/science/references/packages/strawberryfields.md +73 -0
- package/src/skills/science/references/packages/su2.md +80 -0
- package/src/skills/science/references/packages/sunny-jl.md +73 -0
- package/src/skills/science/references/packages/sw4.md +73 -0
- package/src/skills/science/references/packages/swift.md +88 -0
- package/src/skills/science/references/packages/tdnegf.md +73 -0
- package/src/skills/science/references/packages/tenpy.md +73 -0
- package/src/skills/science/references/packages/thermo.md +73 -0
- package/src/skills/science/references/packages/tkwant.md +73 -0
- package/src/skills/science/references/packages/tvb-root.md +73 -0
- package/src/skills/science/references/packages/uproot5.md +73 -0
- package/src/skills/science/references/packages/vampire.md +80 -0
- package/src/skills/science/references/packages/wannier_tools.md +73 -0
- package/src/skills/science/references/packages/warpx.md +80 -0
- package/src/skills/science/references/packages/wrf.md +73 -0
- package/src/skills/science/references/packages/xtb.md +88 -0
- package/src/skills/science/references/packages/yt.md +73 -0
- package/src/skills/science/references/science-task-brief-template.md +71 -0
- package/src/skills/scout/SKILL.md +83 -425
- package/src/skills/scout/references/literature-scout-template.md +5 -24
- package/src/skills/scout/references/operational-guidance.md +191 -0
- package/src/skills/scout/references/paper-triage-playbook.md +11 -35
- package/src/skills/write/SKILL.md +744 -1246
- package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
- package/src/skills/write/references/oral_package_patterns.md +252 -0
- package/src/skills/write/references/oral_writing_principles.md +291 -0
- package/src/skills/write/references/section_rewrite_checklist.md +234 -0
- package/src/tui/dist/app/AppContainer.js +1314 -27
- package/src/tui/dist/components/Composer.js +26 -1
- package/src/tui/dist/components/ConfigScreen.js +2 -1
- package/src/tui/dist/components/InputPrompt.js +25 -9
- package/src/tui/dist/components/MainContent.js +18 -3
- package/src/tui/dist/components/QuestScreen.js +3 -2
- package/src/tui/dist/components/UtilityScreen.js +37 -0
- package/src/tui/dist/hooks/useSafeInput.js +10 -0
- package/src/tui/dist/index.js +13 -1
- package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
- package/src/tui/dist/lib/api.js +89 -1
- package/src/tui/package.json +1 -1
- package/src/ui/dist/assets/{AnalysisPlugin-BCKAfjba.js → AnalysisPlugin-CA94NGmI.js} +1 -1
- package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
- package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
- package/src/ui/dist/assets/{CodeViewerPlugin-CbaFRrUU.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
- package/src/ui/dist/assets/{DocViewerPlugin-DAjLVeQD.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
- package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
- package/src/ui/dist/assets/{GitDiffViewerPlugin-CQACjoAA.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
- package/src/ui/dist/assets/{GitSnapshotViewer-0r4nLPke.js → GitSnapshotViewer-CweA6VON.js} +2 -2
- package/src/ui/dist/assets/{ImageViewerPlugin-nBOmI2v_.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
- package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
- package/src/ui/dist/assets/{LatexPlugin-ZwtV8pIp.js → LatexPlugin-BQjAaA5J.js} +4 -4
- package/src/ui/dist/assets/{MarkdownViewerPlugin-DKqVfKyW.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
- package/src/ui/dist/assets/{MarketplacePlugin-BwxStZ9D.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
- package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
- package/src/ui/dist/assets/{NotebookEditor-DB9N_T9q.js → NotebookEditor-WFyd8Ybt.js} +3 -3
- package/src/ui/dist/assets/{PdfLoader-eWBONbQP.js → PdfLoader-CLE5u5TS.js} +3 -3
- package/src/ui/dist/assets/{PdfMarkdownPlugin-D22YOZL3.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
- package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
- package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
- package/src/ui/dist/assets/{TextViewerPlugin-C5xqeeUH.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
- package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
- package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
- package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
- package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
- package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
- package/src/ui/dist/assets/{code-WlFHE7z_.js → code-DbsmSd3Y.js} +1 -1
- package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
- package/src/ui/dist/assets/{wrap-text-BC-Hltpd.js → file-jump-queue-DeQBikaw.js} +3 -3
- package/src/ui/dist/assets/{file-socket-CfQPKQKj.js → file-socket-DA5XIx88.js} +1 -1
- package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
- package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
- package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
- package/src/ui/dist/assets/{index-CwNu1aH4.js → index-BsO46tJA.js} +1 -1
- package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
- package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
- package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
- package/src/ui/dist/assets/{project-sync-C9IdzdZW.js → project-sync-DPmWKmKD.js} +1 -1
- package/src/ui/dist/assets/{zoom-out-E_gaeAxL.js → zoom-out-DAukFWen.js} +3 -3
- package/src/ui/dist/index.html +3 -3
- package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
- package/src/skills/baseline/references/memory-playbook.md +0 -40
- package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
- package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
- package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
- package/src/skills/write/references/paper-section-playbook.md +0 -64
- package/src/skills/write/references/reviewer-first-writing.md +0 -64
- package/src/skills/write/references/revision-checklist.md +0 -70
- package/src/skills/write/references/section-contracts.md +0 -82
- package/src/skills/write/references/sentence-level-proofing.md +0 -49
- package/src/ui/dist/assets/AiManusChatView-Bv-Z8YpU.js +0 -204
- package/src/ui/dist/assets/CliPlugin-BCKcpc35.js +0 -109
- package/src/ui/dist/assets/CodeEditorPlugin-DbOfSJ8K.js +0 -2
- package/src/ui/dist/assets/GitCommitViewerPlugin-CIUqbUDO.js +0 -1
- package/src/ui/dist/assets/LabCopilotPanel-BHxOxF4z.js +0 -14
- package/src/ui/dist/assets/LabPlugin-BKoZGs95.js +0 -22
- package/src/ui/dist/assets/NotebookEditor-BEQhaQbt.js +0 -81
- package/src/ui/dist/assets/PdfViewerPlugin-c-RK9DLM.js +0 -17
- package/src/ui/dist/assets/SearchPlugin-CxF9ytAx.js +0 -16
- package/src/ui/dist/assets/VNCViewer-BoLGLnHz.js +0 -11
- package/src/ui/dist/assets/bot-DREQOxzP.js +0 -6
- package/src/ui/dist/assets/chevron-up-C9Qpx4DE.js +0 -6
- package/src/ui/dist/assets/file-content-BZMz3RYp.js +0 -1
- package/src/ui/dist/assets/file-diff-panel-CQhw0jS2.js +0 -1
- package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
- package/src/ui/dist/assets/git-commit-horizontal-DxZ8DCZh.js +0 -6
- package/src/ui/dist/assets/image-Bgl4VIyx.js +0 -6
- package/src/ui/dist/assets/index-BpV6lusQ.css +0 -33
- package/src/ui/dist/assets/index-CBNVuWcP.js +0 -2496
- package/src/ui/dist/assets/index-DrUnlf6K.js +0 -1
- package/src/ui/dist/assets/index-NW-h8VzN.js +0 -1
- package/src/ui/dist/assets/pdf-effect-queue-J8OnM0jE.js +0 -6
- package/src/ui/dist/assets/popover-CLc0pPP8.js +0 -1
- package/src/ui/dist/assets/select-Cs2PmzwL.js +0 -11
- package/src/ui/dist/assets/sigma-ClKcHAXm.js +0 -6
- package/src/ui/dist/assets/trash-DwpbFr3w.js +0 -11
- package/src/ui/dist/assets/useCliAccess-NQ8m0Let.js +0 -1
- package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
|
@@ -0,0 +1,174 @@
|
|
|
1
|
+
id: aisb.t3.040_graniteguardian
|
|
2
|
+
name: 'Granite Guardian:全面的LLM安全防护'
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: 多头LLM安全防护,可在配置的标准下检测越狱、幻觉及其他跨提示和响应的风险。
|
|
5
|
+
task_description: '本封装基准测试涵盖Granite Guardian风格的LLM安全防护,涉及风险维度包括越狱、社会偏见、粗口、暴力、色情内容、不道德行为以及RAG特定的幻觉风险(上下文相关性、扎根性、答案相关性)。任务涉及评估或校准风险检测头,以提升安全检测指标。当前快照捆绑了cookbook风格的使用路径和Jupyter笔记本,演示使用vLLM进行模型推理,但用于忠实复现指标的XSTEST风格评估器尚未包含在归档中。在将此作为完整基准测试路径之前,需要针对完整指标契约进行外部评估。
|
|
6
|
+
|
|
7
|
+
'
|
|
8
|
+
capability_tags:
|
|
9
|
+
- llm_safety
|
|
10
|
+
- guardrails
|
|
11
|
+
- risk_detection
|
|
12
|
+
- classification
|
|
13
|
+
- evaluation
|
|
14
|
+
- rag_quality
|
|
15
|
+
- content_moderation
|
|
16
|
+
- research_code_optimization
|
|
17
|
+
aisb_direction: T3
|
|
18
|
+
track_fit:
|
|
19
|
+
- paper_track
|
|
20
|
+
- benchmark_track
|
|
21
|
+
task_mode: evaluation_driven
|
|
22
|
+
requires_execution: true
|
|
23
|
+
requires_paper: true
|
|
24
|
+
integrity_level: cas_plus_canary
|
|
25
|
+
snapshot_status: external_eval_required
|
|
26
|
+
support_level: recovery
|
|
27
|
+
time_band: 2-6h
|
|
28
|
+
cost_band: medium
|
|
29
|
+
difficulty: medium
|
|
30
|
+
data_access: public
|
|
31
|
+
primary_outputs:
|
|
32
|
+
- xstest_rh_auc
|
|
33
|
+
- xstest_rh_f1
|
|
34
|
+
- xstest_rr_auc
|
|
35
|
+
- xstest_rr_f1
|
|
36
|
+
- risk_scoring_examples
|
|
37
|
+
- guardrail_auc
|
|
38
|
+
- rag_hallucination_auc
|
|
39
|
+
launch_profiles:
|
|
40
|
+
- id: cookbook_demo
|
|
41
|
+
label: Cookbook演示
|
|
42
|
+
description: '运行封装的Granite Guardian cookbook(基于vLLM的笔记本),以验证配置标准下的模型使用和风险评分行为。涵盖越狱检测、RAG扎根性检查和自定义标准工作流。
|
|
43
|
+
|
|
44
|
+
'
|
|
45
|
+
- id: restore_eval
|
|
46
|
+
label: 恢复评估路径
|
|
47
|
+
description: '在将此基准测试作为忠实指标复现路径之前,请附加或恢复缺失的XSTEST风格评估器。当前快照缺少XSTEST指标的可执行锚点。
|
|
48
|
+
|
|
49
|
+
'
|
|
50
|
+
- id: external_benchmark_eval
|
|
51
|
+
label: 外部基准测试评估
|
|
52
|
+
description: '在外部基准测试上评估Granite Guardian模型,包括XSTEST、LLM-AggreFact和REVEAL,以获取可复现的AUC和F1分数。
|
|
53
|
+
|
|
54
|
+
'
|
|
55
|
+
dataset_download:
|
|
56
|
+
primary_method: huggingface
|
|
57
|
+
sources:
|
|
58
|
+
- name: Granite Guardian模型
|
|
59
|
+
url: https://huggingface.co/ibm-granite
|
|
60
|
+
notes:
|
|
61
|
+
- granite-guardian-3.3-8b
|
|
62
|
+
- granite-guardian-3.2-5b
|
|
63
|
+
- granite-guardian-3.2-3b-a800m
|
|
64
|
+
- granite-guardian-3.1-8b
|
|
65
|
+
- granite-guardian-3.1-2b
|
|
66
|
+
- name: 评估数据集
|
|
67
|
+
url: https://huggingface.co/ibm
|
|
68
|
+
notes:
|
|
69
|
+
- SocialStigmaQA
|
|
70
|
+
- AttaQ
|
|
71
|
+
- ProvoQ
|
|
72
|
+
- WikiContradict
|
|
73
|
+
credential_requirements:
|
|
74
|
+
mode: none
|
|
75
|
+
items: []
|
|
76
|
+
notes:
|
|
77
|
+
- 所有模型权重和数据集均可公开访问
|
|
78
|
+
- HF Spaces演示地址:https://huggingface.co/spaces/ibm-granite/granite-guardian
|
|
79
|
+
resources:
|
|
80
|
+
minimum:
|
|
81
|
+
cpu_cores: 8
|
|
82
|
+
ram_gb: 32
|
|
83
|
+
disk_gb: 80
|
|
84
|
+
gpu_count: 1
|
|
85
|
+
gpu_vram_gb: 24
|
|
86
|
+
recommended:
|
|
87
|
+
cpu_cores: 16
|
|
88
|
+
ram_gb: 64
|
|
89
|
+
disk_gb: 150
|
|
90
|
+
gpu_count: 1
|
|
91
|
+
gpu_vram_gb: 48
|
|
92
|
+
environment:
|
|
93
|
+
python: '3.10'
|
|
94
|
+
cuda: '11.8'
|
|
95
|
+
pytorch: 2.1.0
|
|
96
|
+
flash_attn: null
|
|
97
|
+
key_packages:
|
|
98
|
+
- torch
|
|
99
|
+
- transformers
|
|
100
|
+
- vllm
|
|
101
|
+
notes:
|
|
102
|
+
- 参见捆绑的README/requirements获取完整依赖集
|
|
103
|
+
- 推荐使用vLLM进行高效推理
|
|
104
|
+
- 内容警告:示例可能包含冒犯性语言、刻板印象或歧视性内容
|
|
105
|
+
risk_flags:
|
|
106
|
+
- blocked_metrics
|
|
107
|
+
- partial_snapshot
|
|
108
|
+
risk_notes:
|
|
109
|
+
- xstest_rh_auc指标在当前快照中没有可执行代码锚点
|
|
110
|
+
- xstest_rh_f1指标在当前快照中没有可执行代码锚点
|
|
111
|
+
- xstest_rr_auc指标在当前快照中没有可执行代码锚点
|
|
112
|
+
- xstest_rr_f1指标在当前快照中没有可执行代码锚点
|
|
113
|
+
- 本次打包未执行基准测试
|
|
114
|
+
- 在恢复源文件或获取更完整的本地快照之前,请勿使用
|
|
115
|
+
- 恢复规则:选择origin_path、source_ref和evaluation_protocol.code_paths时,优先使用现有代码文件而非仅README声明
|
|
116
|
+
recommended_when: '当您需要带有可配置标准的实用LLM安全防护评估任务、生产级监控用例或RAG管道安全验证时使用此基准测试。特别适合评估检索增强生成场景中的风险检测(扎根性、上下文相关性、答案相关性)以及越狱抵抗测试。
|
|
117
|
+
|
|
118
|
+
'
|
|
119
|
+
not_recommended_when: '如果您需要当前快照中具有XSTEST指标锚点的完全可执行基准测试,或者您的重点是生成质量而非安全和验证,请勿使用。当需要可复现指标而无需外部评估设置时也不适用。
|
|
120
|
+
|
|
121
|
+
'
|
|
122
|
+
paper:
|
|
123
|
+
title: 'Granite Guardian: Comprehensive LLM Safeguarding'
|
|
124
|
+
authors: 'Inkit Padhi, Manish Nagireddy, Giandomenico Cornacchia, Subhajit Chaudhury,
|
|
125
|
+
Tejaswini Pedapati, Pierre Dognin, Keerthiram Murugesan, Erik Miehling, Martin
|
|
126
|
+
Santillan, Cooper Kieran Fraser, Giulio Zizzo, Muhammad Zaid Hameed, Mark Purcell,
|
|
127
|
+
Michael Desmond, Qian Pan, Zahra Ashktorab, Inge Vejsbjerg, Elizabeth Daly, Michael
|
|
128
|
+
Hind, Werner Geyer, Ambrish Rawat, Kush R. Varshney, Prasanna Sattigeri
|
|
129
|
+
|
|
130
|
+
'
|
|
131
|
+
venue: NAACL 2025 Industry Track
|
|
132
|
+
year: 2025
|
|
133
|
+
url: https://arxiv.org/abs/2412.07724
|
|
134
|
+
github: https://github.com/ibm-granite/granite-guardian
|
|
135
|
+
license: Apache 2.0
|
|
136
|
+
key_findings:
|
|
137
|
+
- 在有害内容基准测试上达到0.871的AUC分数
|
|
138
|
+
- 在RAG幻觉相关基准测试上达到0.854的AUC分数
|
|
139
|
+
- 在部署导向指标上优于其他开源和闭源模型
|
|
140
|
+
- 在结合人工标注和合成数据的独特数据集上训练
|
|
141
|
+
- 支持通过自定义标准进行定制化风险检测
|
|
142
|
+
download:
|
|
143
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.040_graniteguardian.zip
|
|
144
|
+
archive_type: zip
|
|
145
|
+
local_dir_name: paper-40-GraniteGuardian
|
|
146
|
+
provider: github_release
|
|
147
|
+
repo: ResearAI/DeepScientist
|
|
148
|
+
tag: aisb-v0.0.1
|
|
149
|
+
asset_name: aisb.t3.040_graniteguardian.zip
|
|
150
|
+
sha256: c98d57a175b4dc64b7f4bb81e3c4c16adb38a98775335f077f780d491e92b4e2
|
|
151
|
+
size_bytes: 2545921
|
|
152
|
+
display:
|
|
153
|
+
palette_seed: indigo-sand-shield
|
|
154
|
+
art_style: safety-console
|
|
155
|
+
accent_priority: high
|
|
156
|
+
image_path: ../image/040_aisb.t3.040_graniteguardian.jpg
|
|
157
|
+
code_anchors:
|
|
158
|
+
executable:
|
|
159
|
+
- cookbooks/granite-guardian-3.3/quickstart.ipynb
|
|
160
|
+
- cookbooks/granite-guardian-3.2/detailed_guide_vllm.ipynb
|
|
161
|
+
- cookbooks/granite-guardian-3.1/quick_start_vllm.ipynb
|
|
162
|
+
code_roots:
|
|
163
|
+
- cookbooks/
|
|
164
|
+
blocked_metrics:
|
|
165
|
+
- xstest_rh_auc
|
|
166
|
+
- xstest_rh_f1
|
|
167
|
+
- xstest_rr_auc
|
|
168
|
+
- xstest_rr_f1
|
|
169
|
+
recovery_rule: '选择origin_path、source_ref和evaluation_protocol.code_paths时,优先使用现有代码文件而非仅README声明。在获得可信执行输出之前,保持metrics_summary为空。如果当前快照中不存在可执行锚点,则将指标标记为临时/阻止状态。
|
|
170
|
+
|
|
171
|
+
'
|
|
172
|
+
commercial:
|
|
173
|
+
annual_fee: null
|
|
174
|
+
notes: 模型以Apache 2.0许可证开源发布
|
|
@@ -0,0 +1,149 @@
|
|
|
1
|
+
id: aisb.t3.041_amdm
|
|
2
|
+
name: Auto-Regressive Moving Diffusion Models for Time Series Forecasting
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: Diffusion-based time-series forecasting with auto-regressive moving structure
|
|
5
|
+
and continuous sequential diffusion for improved probabilistic forecasting.
|
|
6
|
+
task_description: 'This benchmark implements the Auto-Regressive Moving Diffusion
|
|
7
|
+
(ARMD) model for time series forecasting. Unlike traditional diffusion models that
|
|
8
|
+
start from white Gaussian noise, ARMD employs chain-based diffusion with priors,
|
|
9
|
+
modeling the evolution of time series as a continuous sequential diffusion process.
|
|
10
|
+
The forward diffusion diffuses the future series into the historical series, while
|
|
11
|
+
the reverse denoising/devolution process transforms historical series into future
|
|
12
|
+
forecasts. This aligns the diffusion sampling procedure with the forecasting objective,
|
|
13
|
+
removing the need for conditional generation. The task is to tune diffusion schedules
|
|
14
|
+
and moving dynamics to improve probabilistic forecasting metrics on standard public
|
|
15
|
+
benchmark suites.
|
|
16
|
+
|
|
17
|
+
'
|
|
18
|
+
task_mode: experiment_driven
|
|
19
|
+
requires_execution: true
|
|
20
|
+
requires_paper: true
|
|
21
|
+
integrity_level: cas_plus_canary
|
|
22
|
+
snapshot_status: partial
|
|
23
|
+
support_level: recovery
|
|
24
|
+
time_band: 6-24h
|
|
25
|
+
cost_band: medium
|
|
26
|
+
difficulty: hard
|
|
27
|
+
data_access: public
|
|
28
|
+
primary_outputs:
|
|
29
|
+
- mse
|
|
30
|
+
- mae
|
|
31
|
+
- forecast_samples
|
|
32
|
+
launch_profiles:
|
|
33
|
+
- id: analysis_only
|
|
34
|
+
label: Analysis Only
|
|
35
|
+
description: Inspect the preserved diffusion forecasting code and configs before
|
|
36
|
+
a full run.
|
|
37
|
+
- id: restore_first
|
|
38
|
+
label: Restore First
|
|
39
|
+
description: Restore the missing main entry files referenced by the README before
|
|
40
|
+
treating this package as runnable.
|
|
41
|
+
- id: full_train_eval
|
|
42
|
+
label: Full Train and Evaluate
|
|
43
|
+
description: Run training with scheduler-aware training and evaluate on all metrics.
|
|
44
|
+
Use config files in Config/ directory (etth1.yaml, ettm1.yaml, exchange.yaml,
|
|
45
|
+
stock.yaml).
|
|
46
|
+
dataset_download:
|
|
47
|
+
primary_method: mixed
|
|
48
|
+
sources:
|
|
49
|
+
- name: ETT dataset
|
|
50
|
+
url: https://github.com/thuml/iTransformer
|
|
51
|
+
license: MIT
|
|
52
|
+
- name: Solar Energy and Exchange datasets
|
|
53
|
+
url: https://github.com/thuml/iTransformer
|
|
54
|
+
license: MIT
|
|
55
|
+
- name: Stock dataset
|
|
56
|
+
url: https://github.com/Y-debug-sys/Diffusion-TS
|
|
57
|
+
license: MIT
|
|
58
|
+
notes:
|
|
59
|
+
- Download datasets and place in ./Data/datasets directory
|
|
60
|
+
- Datasets must be obtained from external repositories as they are not bundled
|
|
61
|
+
credential_requirements:
|
|
62
|
+
mode: none
|
|
63
|
+
items: []
|
|
64
|
+
notes: []
|
|
65
|
+
resources:
|
|
66
|
+
minimum:
|
|
67
|
+
cpu_cores: 8
|
|
68
|
+
ram_gb: 32
|
|
69
|
+
disk_gb: 80
|
|
70
|
+
gpu_count: 1
|
|
71
|
+
gpu_vram_gb: 16
|
|
72
|
+
recommended:
|
|
73
|
+
cpu_cores: 16
|
|
74
|
+
ram_gb: 64
|
|
75
|
+
disk_gb: 150
|
|
76
|
+
gpu_count: 1
|
|
77
|
+
gpu_vram_gb: 24
|
|
78
|
+
environment:
|
|
79
|
+
python: '3.10'
|
|
80
|
+
cuda: '11.8'
|
|
81
|
+
pytorch: 2.1.0
|
|
82
|
+
flash_attn: null
|
|
83
|
+
key_packages:
|
|
84
|
+
- ema_pytorch
|
|
85
|
+
- tqdm
|
|
86
|
+
- torch
|
|
87
|
+
- numpy
|
|
88
|
+
- scipy
|
|
89
|
+
- scikit-learn
|
|
90
|
+
- matplotlib
|
|
91
|
+
- seaborn
|
|
92
|
+
notes:
|
|
93
|
+
- 'Install dependencies via: pip install -r requirements.txt'
|
|
94
|
+
- Full dependency set documented in bundled README
|
|
95
|
+
risk_flags:
|
|
96
|
+
- partial_snapshot
|
|
97
|
+
- no_runtime_verification
|
|
98
|
+
risk_notes:
|
|
99
|
+
- Static code audit found executable anchors for all staged metrics
|
|
100
|
+
- No benchmark execution was performed in this packaging pass
|
|
101
|
+
- Runtime execution required before trusting metric values
|
|
102
|
+
- Recovery mode recommended to restore any missing main entry files
|
|
103
|
+
recommended_when: 'Use this benchmark when you need a diffusion-style probabilistic
|
|
104
|
+
forecasting task with standard public time-series datasets, require state-of-the-art
|
|
105
|
+
performance on multivariate forecasting, or want to explore continuous sequential
|
|
106
|
+
diffusion methods that align diffusion sampling with forecasting objectives.
|
|
107
|
+
|
|
108
|
+
'
|
|
109
|
+
not_recommended_when: 'Do not use this if you need a tiny CPU-only benchmark, require
|
|
110
|
+
a non-generative point-estimate forecasting setup, or need pre-executed and verified
|
|
111
|
+
metric values without runtime overhead.
|
|
112
|
+
|
|
113
|
+
'
|
|
114
|
+
paper:
|
|
115
|
+
title: Auto-Regressive Moving Diffusion Models for Time Series Forecasting
|
|
116
|
+
authors:
|
|
117
|
+
- Jiaxin Gao
|
|
118
|
+
- Qinglong Cao
|
|
119
|
+
- Yuntian Chen
|
|
120
|
+
venue: arXiv preprint
|
|
121
|
+
year: 2024
|
|
122
|
+
url: https://arxiv.org/abs/2412.09328
|
|
123
|
+
code_url: https://github.com/daxin007/ARMD
|
|
124
|
+
display:
|
|
125
|
+
palette_seed: midnight-amber-diffusion
|
|
126
|
+
art_style: sequential-lab
|
|
127
|
+
accent_priority: high
|
|
128
|
+
image_path: ../image/041_aisb.t3.041_amdm.jpg
|
|
129
|
+
capability_tags:
|
|
130
|
+
- research_code_optimization
|
|
131
|
+
- time_series_forecasting
|
|
132
|
+
- diffusion_models
|
|
133
|
+
- forecasting
|
|
134
|
+
- scientific_ml
|
|
135
|
+
- probabilistic_forecasting
|
|
136
|
+
- autoregressive_moving
|
|
137
|
+
aisb_direction: T3
|
|
138
|
+
track_fit:
|
|
139
|
+
- paper_track
|
|
140
|
+
- benchmark_track
|
|
141
|
+
download:
|
|
142
|
+
provider: github_release
|
|
143
|
+
repo: ResearAI/DeepScientist
|
|
144
|
+
tag: aisb-v0.0.1
|
|
145
|
+
asset_name: aisb.t3.041_amdm.zip
|
|
146
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.041_amdm.zip
|
|
147
|
+
archive_type: zip
|
|
148
|
+
sha256: 9fc41b0433a71fc79ca141b9d6451c7323ab4286cead7d38e77d5ed793283244
|
|
149
|
+
size_bytes: 2172119
|
|
@@ -0,0 +1,137 @@
|
|
|
1
|
+
id: aisb.t3.041_amdm
|
|
2
|
+
name: 时间序列预测的自回归移动扩散模型
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: 基于扩散的时间序列预测,采用自回归移动结构和连续顺序扩散,提升概率预测能力。
|
|
5
|
+
task_description: >
|
|
6
|
+
本基准实现了用于时间序列预测的自回归移动扩散(ARMD)模型。与从白高斯噪声开始
|
|
7
|
+
的传统扩散模型不同,ARMD采用基于链的扩散与先验,将时间序列的演化建模为连续顺序扩
|
|
8
|
+
散过程。前向扩散将未来序列扩散到历史序列,而反向去噪/演化过程则将历史序列转换为
|
|
9
|
+
未来预测。这使扩散采样过程与预测目标对齐,无需条件生成。任务是通过调整扩散调度
|
|
10
|
+
和移动动态来提升标准公开基准套件上的概率预测指标。
|
|
11
|
+
|
|
12
|
+
task_mode: experiment_driven
|
|
13
|
+
requires_execution: true
|
|
14
|
+
requires_paper: true
|
|
15
|
+
integrity_level: cas_plus_canary
|
|
16
|
+
snapshot_status: partial
|
|
17
|
+
support_level: recovery
|
|
18
|
+
time_band: 6-24h
|
|
19
|
+
cost_band: medium
|
|
20
|
+
difficulty: hard
|
|
21
|
+
data_access: public
|
|
22
|
+
primary_outputs:
|
|
23
|
+
- mse
|
|
24
|
+
- mae
|
|
25
|
+
- forecast_samples
|
|
26
|
+
launch_profiles:
|
|
27
|
+
- id: analysis_only
|
|
28
|
+
label: 仅分析
|
|
29
|
+
description: 在完整运行前,检查保存的扩散预测代码和配置。
|
|
30
|
+
- id: restore_first
|
|
31
|
+
label: 优先恢复
|
|
32
|
+
description: 在将此包视为可运行之前,恢复README中引用的缺失主入口文件。
|
|
33
|
+
- id: full_train_eval
|
|
34
|
+
label: 完整训练和评估
|
|
35
|
+
description: 使用调度器感知训练进行训练,并在所有指标上评估。使用Config/目录下的
|
|
36
|
+
配置文件(etth1.yaml、ettm1.yaml、exchange.yaml、stock.yaml)。
|
|
37
|
+
dataset_download:
|
|
38
|
+
primary_method: mixed
|
|
39
|
+
sources:
|
|
40
|
+
- name: ETT数据集
|
|
41
|
+
url: https://github.com/thuml/iTransformer
|
|
42
|
+
license: MIT
|
|
43
|
+
- name: 太阳能和汇率数据集
|
|
44
|
+
url: https://github.com/thuml/iTransformer
|
|
45
|
+
license: MIT
|
|
46
|
+
- name: 股票数据集
|
|
47
|
+
url: https://github.com/Y-debug-sys/Diffusion-TS
|
|
48
|
+
license: MIT
|
|
49
|
+
notes:
|
|
50
|
+
- 下载数据集并放置在 ./Data/datasets 目录
|
|
51
|
+
- 数据集必须从外部仓库获取,因未捆绑
|
|
52
|
+
credential_requirements:
|
|
53
|
+
mode: none
|
|
54
|
+
items: []
|
|
55
|
+
notes: []
|
|
56
|
+
resources:
|
|
57
|
+
minimum:
|
|
58
|
+
cpu_cores: 8
|
|
59
|
+
ram_gb: 32
|
|
60
|
+
disk_gb: 80
|
|
61
|
+
gpu_count: 1
|
|
62
|
+
gpu_vram_gb: 16
|
|
63
|
+
recommended:
|
|
64
|
+
cpu_cores: 16
|
|
65
|
+
ram_gb: 64
|
|
66
|
+
disk_gb: 150
|
|
67
|
+
gpu_count: 1
|
|
68
|
+
gpu_vram_gb: 24
|
|
69
|
+
environment:
|
|
70
|
+
python: '3.10'
|
|
71
|
+
cuda: '11.8'
|
|
72
|
+
pytorch: 2.1.0
|
|
73
|
+
flash_attn: null
|
|
74
|
+
key_packages:
|
|
75
|
+
- ema_pytorch
|
|
76
|
+
- tqdm
|
|
77
|
+
- torch
|
|
78
|
+
- numpy
|
|
79
|
+
- scipy
|
|
80
|
+
- scikit-learn
|
|
81
|
+
- matplotlib
|
|
82
|
+
- seaborn
|
|
83
|
+
notes:
|
|
84
|
+
- 通过以下命令安装依赖:pip install -r requirements.txt
|
|
85
|
+
- 完整依赖集记录在捆绑的README中
|
|
86
|
+
risk_flags:
|
|
87
|
+
- partial_snapshot
|
|
88
|
+
- no_runtime_verification
|
|
89
|
+
risk_notes:
|
|
90
|
+
- 静态代码审计发现所有分阶段指标都有可执行锚点
|
|
91
|
+
- 本次打包未执行基准测试
|
|
92
|
+
- 在信任指标值之前,必须先完成运行时执行
|
|
93
|
+
- 建议使用恢复模式以恢复任何缺失的主入口文件
|
|
94
|
+
recommended_when: >
|
|
95
|
+
当您需要使用标准公开时间序列数据集进行扩散式概率预测任务、需要在多元预测上达
|
|
96
|
+
到最优性能,或想要探索将扩散采样与预测目标对齐的连续顺序扩散方法时,请使用此基准。
|
|
97
|
+
|
|
98
|
+
not_recommended_when: >
|
|
99
|
+
如果您需要仅CPU运行的小型基准测试、需要非生成式的点估计预测设置,或需要在无运行
|
|
100
|
+
时开销的情况下获得预先执行并验证的指标值,请勿使用此基准。
|
|
101
|
+
|
|
102
|
+
paper:
|
|
103
|
+
title: Auto-Regressive Moving Diffusion Models for Time Series Forecasting
|
|
104
|
+
authors:
|
|
105
|
+
- Jiaxin Gao
|
|
106
|
+
- Qinglong Cao
|
|
107
|
+
- Yuntian Chen
|
|
108
|
+
venue: arXiv preprint
|
|
109
|
+
year: 2024
|
|
110
|
+
url: https://arxiv.org/abs/2412.09328
|
|
111
|
+
code_url: https://github.com/daxin007/ARMD
|
|
112
|
+
display:
|
|
113
|
+
palette_seed: midnight-amber-diffusion
|
|
114
|
+
art_style: sequential-lab
|
|
115
|
+
accent_priority: high
|
|
116
|
+
image_path: ../image/041_aisb.t3.041_amdm.jpg
|
|
117
|
+
capability_tags:
|
|
118
|
+
- research_code_optimization
|
|
119
|
+
- time_series_forecasting
|
|
120
|
+
- diffusion_models
|
|
121
|
+
- forecasting
|
|
122
|
+
- scientific_ml
|
|
123
|
+
- probabilistic_forecasting
|
|
124
|
+
- autoregressive_moving
|
|
125
|
+
aisb_direction: T3
|
|
126
|
+
track_fit:
|
|
127
|
+
- paper_track
|
|
128
|
+
- benchmark_track
|
|
129
|
+
download:
|
|
130
|
+
provider: github_release
|
|
131
|
+
repo: ResearAI/DeepScientist
|
|
132
|
+
tag: aisb-v0.0.1
|
|
133
|
+
asset_name: aisb.t3.041_amdm.zip
|
|
134
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.041_amdm.zip
|
|
135
|
+
archive_type: zip
|
|
136
|
+
sha256: 9fc41b0433a71fc79ca141b9d6451c7323ab4286cead7d38e77d5ed793283244
|
|
137
|
+
size_bytes: 2172119
|
|
@@ -0,0 +1,216 @@
|
|
|
1
|
+
id: aisb.t3.042_xpatch
|
|
2
|
+
name: 'xPatch: Dual-Stream Time Series Forecasting with Exponential Seasonal-Trend
|
|
3
|
+
Decomposition'
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: CNN-MLP dual-stream long-term time-series forecasting with EMA-based seasonal-trend
|
|
6
|
+
decomposition and long-context patching.
|
|
7
|
+
task_description: 'This packaged benchmark covers xPatch, a dual-stream long-term
|
|
8
|
+
time series forecasting (LTSF) architecture that decomposes input series into seasonal
|
|
9
|
+
and trend components using Exponential Moving Average (EMA) rather than simple moving
|
|
10
|
+
average. The linear stream employs MLP layers for trend prediction while the nonlinear
|
|
11
|
+
stream uses depthwise separable CNN for seasonal patterns. The model investigates
|
|
12
|
+
patching and channel-independence techniques within a non-transformer backbone,
|
|
13
|
+
evaluating against transformer baselines (PatchTST, Autoformer, FEDformer, CARD)
|
|
14
|
+
and linear baselines (DLinear, RLinear) on standard LTSF benchmark datasets.
|
|
15
|
+
|
|
16
|
+
'
|
|
17
|
+
task_mode: experiment_driven
|
|
18
|
+
requires_execution: true
|
|
19
|
+
requires_paper: true
|
|
20
|
+
integrity_level: cas_plus_canary
|
|
21
|
+
snapshot_status: runnable
|
|
22
|
+
support_level: advanced
|
|
23
|
+
time_band: 6-24h
|
|
24
|
+
cost_band: medium
|
|
25
|
+
difficulty: hard
|
|
26
|
+
data_access: public
|
|
27
|
+
primary_outputs:
|
|
28
|
+
- mse
|
|
29
|
+
- mae
|
|
30
|
+
- forecast_checkpoints
|
|
31
|
+
- ablation_outputs
|
|
32
|
+
launch_profiles:
|
|
33
|
+
- id: quick_eval
|
|
34
|
+
label: Quick Eval
|
|
35
|
+
description: 'Run xPatch on a single prepared forecasting dataset using unified
|
|
36
|
+
experimental settings. Executes xPatch_unified script with default hyperparameters.
|
|
37
|
+
Suitable for rapid validation of model behavior on one benchmark dataset.
|
|
38
|
+
|
|
39
|
+
'
|
|
40
|
+
- id: hyper_search
|
|
41
|
+
label: Hyperparameter Search
|
|
42
|
+
description: 'Run comprehensive hyperparameter search across patch length, lookback
|
|
43
|
+
windows, prediction lengths, and EMA alpha parameter. Uses xPatch_search script.
|
|
44
|
+
Produces results for fair comparison against baseline papers that report with
|
|
45
|
+
drop-last trick.
|
|
46
|
+
|
|
47
|
+
'
|
|
48
|
+
- id: fair_benchmark
|
|
49
|
+
label: Fair Benchmark (TFB/OpenTS)
|
|
50
|
+
description: 'Execute fair experiments without the drop-last trick following the
|
|
51
|
+
TFB benchmark protocol. Uses xPatch_fair script. Results are comparable to OpenTS
|
|
52
|
+
leaderboard entries.
|
|
53
|
+
|
|
54
|
+
'
|
|
55
|
+
- id: ablation_suite
|
|
56
|
+
label: Ablation Suite
|
|
57
|
+
description: 'Run ablation studies from the paper appendix including EMA decomposition
|
|
58
|
+
impact, arctangent loss effect, sigmoid learning rate adjustment scheme, and inference
|
|
59
|
+
time comparisons against baseline models in ./ablation directory.
|
|
60
|
+
|
|
61
|
+
'
|
|
62
|
+
dataset_download:
|
|
63
|
+
primary_method: mixed
|
|
64
|
+
sources:
|
|
65
|
+
- name: Google Drive
|
|
66
|
+
url: https://drive.google.com/u/0/uc?id=1NF7VEefXCmXuWNbnNe858WvQAkJ_7wuP&export=download
|
|
67
|
+
format: csv
|
|
68
|
+
- name: Baidu Pan
|
|
69
|
+
url: https://pan.baidu.com/share/init?surl=r3KhGd0Q9PJIUZdfEYoymg&pwd=i9iy
|
|
70
|
+
format: csv
|
|
71
|
+
- name: Kaggle Datasets
|
|
72
|
+
url: https://www.kaggle.com/datasets/wentixxiaogege/time-series-dataset
|
|
73
|
+
format: csv
|
|
74
|
+
notes:
|
|
75
|
+
- Download all preprocessed datasets into ./dataset directory
|
|
76
|
+
- 'Benchmark datasets include: ETTh1, ETTh2, ETTm1, ETTm2, Weather, Traffic, Electricity'
|
|
77
|
+
- Datasets are pre-processed and ready for direct use without additional normalization
|
|
78
|
+
steps
|
|
79
|
+
credential_requirements:
|
|
80
|
+
mode: optional
|
|
81
|
+
items:
|
|
82
|
+
- kaggle_api_token
|
|
83
|
+
notes:
|
|
84
|
+
- Kaggle download requires kaggle credentials or API token
|
|
85
|
+
- Google Drive and Baidu links available without authentication
|
|
86
|
+
resources:
|
|
87
|
+
minimum:
|
|
88
|
+
cpu_cores: 8
|
|
89
|
+
ram_gb: 32
|
|
90
|
+
disk_gb: 80
|
|
91
|
+
gpu_count: 1
|
|
92
|
+
gpu_vram_gb: 24
|
|
93
|
+
notes: Single GPU sufficient; RTX 6000-class or equivalent recommended
|
|
94
|
+
recommended:
|
|
95
|
+
cpu_cores: 16
|
|
96
|
+
ram_gb: 64
|
|
97
|
+
disk_gb: 150
|
|
98
|
+
gpu_count: 1
|
|
99
|
+
gpu_vram_gb: 24
|
|
100
|
+
notes: 'Original experiments used single Quadro RTX 6000 (24GB). Hyperparameter
|
|
101
|
+
search and ablation studies benefit from additional RAM for larger batch sizes.
|
|
102
|
+
|
|
103
|
+
'
|
|
104
|
+
environment:
|
|
105
|
+
python: '3.9'
|
|
106
|
+
cuda: '11.8'
|
|
107
|
+
pytorch: 2.5.1
|
|
108
|
+
flash_attn: null
|
|
109
|
+
key_packages:
|
|
110
|
+
- pytorch>=2.0.0
|
|
111
|
+
- numpy
|
|
112
|
+
- pandas
|
|
113
|
+
- scikit-learn
|
|
114
|
+
- matplotlib
|
|
115
|
+
notes:
|
|
116
|
+
- Environment file (environment.yml) specifies conda CUDA 11.8 toolkit with pip-installed
|
|
117
|
+
PyTorch 2.5.1
|
|
118
|
+
- Mixed conda/pip stack requires careful environment management
|
|
119
|
+
- 'Create conda environment with: conda env create -f environment.yml'
|
|
120
|
+
- See bundled README for full dependency set
|
|
121
|
+
- Experiment scripts in ./scripts directory handle runtime configuration
|
|
122
|
+
risk_flags:
|
|
123
|
+
- mixed_environment_stack
|
|
124
|
+
- data_download_external
|
|
125
|
+
- hyperparameter_sensitivity
|
|
126
|
+
risk_notes:
|
|
127
|
+
- Mixed conda CUDA 11.8 with pip PyTorch 2.5.1 may cause version conflicts; verify
|
|
128
|
+
CUDA runtime matches PyTorch built-in CUDA
|
|
129
|
+
- External dataset downloads from Google Drive/Baidu may require VPN or regional access
|
|
130
|
+
- Performance is sensitive to patch length, lookback window, prediction length, and
|
|
131
|
+
EMA alpha parameter
|
|
132
|
+
- Fair benchmark results exclude drop-last trick per TFB protocol; verify which experimental
|
|
133
|
+
setting matches your evaluation goals
|
|
134
|
+
recommended_when: 'Use this benchmark when evaluating dual-stream non-transformer
|
|
135
|
+
forecasting architectures, studying EMA-based seasonal-trend decomposition effects,
|
|
136
|
+
investigating patching and channel-independence outside transformer backbones, or
|
|
137
|
+
comparing CNN/MLP approaches against established transformer and linear baselines
|
|
138
|
+
on long-term forecasting tasks.
|
|
139
|
+
|
|
140
|
+
'
|
|
141
|
+
not_recommended_when: 'Do not use this benchmark for non-time-series tasks, real-time/online
|
|
142
|
+
forecasting scenarios, scenarios without access to workstation-class GPU with 24GB
|
|
143
|
+
VRAM, or when requiring models with built-in uncertainty quantification.
|
|
144
|
+
|
|
145
|
+
'
|
|
146
|
+
paper:
|
|
147
|
+
title: 'xPatch: Dual-Stream Time Series Forecasting with Exponential Seasonal-Trend
|
|
148
|
+
Decomposition'
|
|
149
|
+
authors:
|
|
150
|
+
- Artyom Stitsyuk
|
|
151
|
+
- Jaesik Choi
|
|
152
|
+
venue: AAAI 2025
|
|
153
|
+
year: 2025
|
|
154
|
+
volume: '39'
|
|
155
|
+
number: '19'
|
|
156
|
+
pages: 20601-20609
|
|
157
|
+
url: https://ojs.aaai.org/index.php/AAAI/article/view/34270
|
|
158
|
+
arxiv_url: https://arxiv.org/pdf/2412.17323
|
|
159
|
+
bibtex: "@inproceedings{stitsyuk2025xpatch,\n title={xPatch: Dual-Stream Time Series\
|
|
160
|
+
\ Forecasting with Exponential Seasonal-Trend Decomposition},\n author={Stitsyuk,\
|
|
161
|
+
\ Artyom and Choi, Jaesik},\n booktitle={Proceedings of the AAAI Conference on\
|
|
162
|
+
\ Artificial Intelligence},\n volume={39}, number={19}, pages={20601--20609},\
|
|
163
|
+
\ year={2025}\n}\n"
|
|
164
|
+
download:
|
|
165
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.042_xpatch.zip
|
|
166
|
+
archive_type: zip
|
|
167
|
+
local_dir_name: paper-42-xPatch
|
|
168
|
+
provider: github_release
|
|
169
|
+
repo: ResearAI/DeepScientist
|
|
170
|
+
tag: aisb-v0.0.1
|
|
171
|
+
asset_name: aisb.t3.042_xpatch.zip
|
|
172
|
+
sha256: 72c8e6fd7e1a8b2eb184077ce9a37fb36514ef7bb148d8d0ff4ed79d4aa9de25
|
|
173
|
+
size_bytes: 3621184
|
|
174
|
+
display:
|
|
175
|
+
palette_seed: teal-sunrise-trend
|
|
176
|
+
art_style: signal-geometry
|
|
177
|
+
accent_priority: high
|
|
178
|
+
image_path: ../image/042_aisb.t3.042_xpatch.jpg
|
|
179
|
+
metric_contract:
|
|
180
|
+
mse:
|
|
181
|
+
origin_path: utils/metrics.py
|
|
182
|
+
source_ref: MSE function
|
|
183
|
+
evaluation_protocol:
|
|
184
|
+
code_paths:
|
|
185
|
+
- run.py
|
|
186
|
+
- utils/metrics.py
|
|
187
|
+
status: code_backed
|
|
188
|
+
mae:
|
|
189
|
+
origin_path: utils/metrics.py
|
|
190
|
+
source_ref: MAE function
|
|
191
|
+
evaluation_protocol:
|
|
192
|
+
code_paths:
|
|
193
|
+
- run.py
|
|
194
|
+
- utils/metrics.py
|
|
195
|
+
status: code_backed
|
|
196
|
+
forecast_checkpoints:
|
|
197
|
+
origin_path: exp/exp_main.py
|
|
198
|
+
source_ref: model state saving
|
|
199
|
+
status: provisional
|
|
200
|
+
code_anchors:
|
|
201
|
+
- environment.yml
|
|
202
|
+
- run.py
|
|
203
|
+
- utils/metrics.py
|
|
204
|
+
- exp/exp_main.py
|
|
205
|
+
- layers/decomp.py
|
|
206
|
+
- layers/network.py
|
|
207
|
+
- layers/network_cnn.py
|
|
208
|
+
- layers/network_mlp.py
|
|
209
|
+
- models/xPatch.py
|
|
210
|
+
caveat_snapshot: 'Static code audit found executable anchors for MSE and MAE metrics
|
|
211
|
+
in utils/metrics.py and run.py. No benchmark execution was performed in this packaging
|
|
212
|
+
pass. Runtime execution is required before trusting metric values. Fair benchmark
|
|
213
|
+
requires TFB/OpenTS protocol compliance; confirm drop-last trick handling matches
|
|
214
|
+
evaluation goals.
|
|
215
|
+
|
|
216
|
+
'
|