@researai/deepscientist 1.5.17 → 1.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +309 -130
- package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
- package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
- package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
- package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
- package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
- package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
- package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
- package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
- package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
- package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
- package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
- package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
- package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
- package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
- package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
- package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
- package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
- package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
- package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
- package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
- package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
- package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
- package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
- package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
- package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
- package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
- package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
- package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
- package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
- package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
- package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
- package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
- package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
- package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
- package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
- package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
- package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
- package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
- package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
- package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
- package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
- package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
- package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
- package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
- package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
- package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
- package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
- package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
- package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
- package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
- package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
- package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
- package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
- package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
- package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
- package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
- package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
- package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
- package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
- package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
- package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
- package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
- package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
- package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
- package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
- package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
- package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
- package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
- package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
- package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
- package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
- package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
- package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
- package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
- package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
- package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
- package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
- package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
- package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
- package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
- package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
- package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
- package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
- package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
- package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
- package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
- package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
- package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
- package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
- package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
- package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
- package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
- package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
- package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
- package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
- package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
- package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
- package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
- package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
- package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
- package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
- package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
- package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
- package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
- package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
- package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
- package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
- package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
- package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
- package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
- package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
- package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
- package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
- package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
- package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
- package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
- package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
- package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
- package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
- package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
- package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
- package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
- package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
- package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
- package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
- package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
- package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
- package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
- package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
- package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
- package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
- package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
- package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
- package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
- package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
- package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
- package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
- package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
- package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
- package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
- package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
- package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
- package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
- package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
- package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
- package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
- package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
- package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
- package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
- package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
- package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
- package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
- package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
- package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
- package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
- package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
- package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
- package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
- package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
- package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
- package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
- package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
- package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
- package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
- package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
- package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
- package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
- package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
- package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
- package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
- package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
- package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
- package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
- package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
- package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
- package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
- package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
- package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
- package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
- package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
- package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
- package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
- package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
- package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
- package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
- package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
- package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
- package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
- package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
- package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
- package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
- package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
- package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
- package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
- package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
- package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
- package/AISB/image/aisb.b10.climate_earth.svg +16 -0
- package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
- package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
- package/AISB/image/aisb.b2.agent_systems.svg +16 -0
- package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
- package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
- package/AISB/image/aisb.b5.math_proof.svg +16 -0
- package/AISB/image/aisb.b6.research_process.svg +16 -0
- package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
- package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
- package/AISB/image/aisb.b9.material_science.svg +16 -0
- package/README.md +132 -11
- package/bin/ds.js +376 -49
- package/docs/en/00_QUICK_START.md +135 -18
- package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
- package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
- package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
- package/docs/en/05_TUI_GUIDE.md +171 -2
- package/docs/en/07_MEMORY_AND_MCP.md +38 -2
- package/docs/en/09_DOCTOR.md +64 -4
- package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
- package/docs/en/11_LICENSE_AND_RISK.md +4 -0
- package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/en/15_CODEX_PROVIDER_SETUP.md +622 -187
- package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
- package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
- package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
- package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
- package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
- package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
- package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
- package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
- package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
- package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
- package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
- package/docs/en/91_DEVELOPMENT.md +29 -0
- package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
- package/docs/en/README.md +44 -7
- package/docs/images/admin/admin-connectors-health-en.png +0 -0
- package/docs/images/admin/admin-controllers-en.png +0 -0
- package/docs/images/admin/admin-diagnostics-en.png +0 -0
- package/docs/images/admin/admin-errors-en.png +0 -0
- package/docs/images/admin/admin-issues-en.png +0 -0
- package/docs/images/admin/admin-logs-en.png +0 -0
- package/docs/images/admin/admin-quest-detail-en.png +0 -0
- package/docs/images/admin/admin-quests-en.png +0 -0
- package/docs/images/admin/admin-repairs-en.png +0 -0
- package/docs/images/admin/admin-runtime-en.png +0 -0
- package/docs/images/admin/admin-search-en.png +0 -0
- package/docs/images/admin/admin-stats-en.png +0 -0
- package/docs/images/admin/admin-summary-en.png +0 -0
- package/docs/images/connectors/connector-discord-en.png +0 -0
- package/docs/images/connectors/connector-feishu-en.png +0 -0
- package/docs/images/connectors/connector-lingzhu-en.png +0 -0
- package/docs/images/connectors/connector-qq-en.png +0 -0
- package/docs/images/connectors/connector-slack-en.png +0 -0
- package/docs/images/connectors/connector-telegram-en.png +0 -0
- package/docs/images/connectors/connector-weixin-en.png +0 -0
- package/docs/images/connectors/connector-whatsapp-en.png +0 -0
- package/docs/images/settings/settings-baselines-en.png +0 -0
- package/docs/images/settings/settings-config-en.png +0 -0
- package/docs/images/settings/settings-connectors-overview-en.png +0 -0
- package/docs/images/settings/settings-deepxiv-en.png +0 -0
- package/docs/images/settings/settings-mcp-servers-en.png +0 -0
- package/docs/images/settings/settings-plugins-en.png +0 -0
- package/docs/images/settings/settings-runners-en.png +0 -0
- package/docs/zh/00_QUICK_START.md +92 -17
- package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
- package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/zh/05_TUI_GUIDE.md +171 -2
- package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
- package/docs/zh/09_DOCTOR.md +39 -4
- package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
- package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
- package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/zh/15_CODEX_PROVIDER_SETUP.md +550 -188
- package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +105 -2
- package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
- package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
- package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
- package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
- package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
- package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
- package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
- package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
- package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
- package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
- package/docs/zh/README.md +29 -7
- package/install.sh +122 -16
- package/package.json +4 -1
- package/pyproject.toml +2 -1
- package/src/deepscientist/__init__.py +1 -1
- package/src/deepscientist/acp/envelope.py +13 -0
- package/src/deepscientist/admin/__init__.py +3 -0
- package/src/deepscientist/admin/charts.py +681 -0
- package/src/deepscientist/admin/logs.py +119 -0
- package/src/deepscientist/admin/repairs.py +217 -0
- package/src/deepscientist/admin/service.py +1310 -0
- package/src/deepscientist/admin/system_info.py +700 -0
- package/src/deepscientist/admin/tasks.py +465 -0
- package/src/deepscientist/admin/tool_metrics.py +600 -0
- package/src/deepscientist/artifact/guidance.py +8 -4
- package/src/deepscientist/artifact/schemas.py +115 -0
- package/src/deepscientist/artifact/service.py +4268 -260
- package/src/deepscientist/bash_exec/monitor.py +30 -3
- package/src/deepscientist/bash_exec/service.py +134 -1
- package/src/deepscientist/benchstore/__init__.py +4 -0
- package/src/deepscientist/benchstore/prompt_builder.py +224 -0
- package/src/deepscientist/benchstore/service.py +1716 -0
- package/src/deepscientist/channels/weixin_ilink.py +8 -1
- package/src/deepscientist/cli.py +92 -17
- package/src/deepscientist/codex_cli_compat.py +2 -2
- package/src/deepscientist/config/models.py +82 -11
- package/src/deepscientist/config/service.py +927 -91
- package/src/deepscientist/connector/weixin_support.py +48 -17
- package/src/deepscientist/daemon/api/handlers.py +697 -210
- package/src/deepscientist/daemon/api/router.py +76 -1
- package/src/deepscientist/daemon/app.py +1054 -51
- package/src/deepscientist/diagnostics/runner_failures.py +147 -0
- package/src/deepscientist/doctor.py +212 -65
- package/src/deepscientist/evidence_packets.py +590 -0
- package/src/deepscientist/home.py +52 -4
- package/src/deepscientist/kimi_cli_compat.py +50 -0
- package/src/deepscientist/latex_runtime.py +2 -2
- package/src/deepscientist/mcp/context.py +2 -0
- package/src/deepscientist/mcp/schemas.py +114 -0
- package/src/deepscientist/mcp/server.py +1566 -126
- package/src/deepscientist/memory/service.py +203 -16
- package/src/deepscientist/process_control.py +8 -1
- package/src/deepscientist/prompts/builder.py +836 -92
- package/src/deepscientist/quest/__init__.py +2 -2
- package/src/deepscientist/quest/layout.py +12 -1
- package/src/deepscientist/quest/node_traces.py +10 -0
- package/src/deepscientist/quest/service.py +1430 -139
- package/src/deepscientist/quest/stage_views.py +1 -1
- package/src/deepscientist/runners/__init__.py +18 -0
- package/src/deepscientist/runners/base.py +89 -1
- package/src/deepscientist/runners/builtins.py +13 -1
- package/src/deepscientist/runners/claude.py +391 -0
- package/src/deepscientist/runners/codex.py +421 -21
- package/src/deepscientist/runners/codex_telemetry.py +127 -0
- package/src/deepscientist/runners/kimi.py +334 -0
- package/src/deepscientist/runners/metadata.py +68 -0
- package/src/deepscientist/runners/opencode.py +414 -0
- package/src/deepscientist/runners/runtime_overrides.py +100 -0
- package/src/deepscientist/runners/simple_cli.py +538 -0
- package/src/deepscientist/runtime_storage.py +303 -0
- package/src/deepscientist/shared.py +61 -16
- package/src/deepscientist/skills/installer.py +37 -0
- package/src/deepscientist/skills/registry.py +2 -0
- package/src/deepscientist/tinytex.py +2 -2
- package/src/deepscientist/tui.py +10 -3
- package/src/prompts/benchstore/system.md +77 -0
- package/src/prompts/connectors/qq.md +33 -2
- package/src/prompts/connectors/weixin.md +208 -23
- package/src/prompts/contracts/admin_ops.md +74 -0
- package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
- package/src/prompts/contracts/shared_interaction.md +5 -11
- package/src/prompts/start_setup/system.md +422 -0
- package/src/prompts/system.md +409 -315
- package/src/prompts/system_copilot.md +88 -12
- package/src/skills/analysis-campaign/SKILL.md +239 -578
- package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
- package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
- package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
- package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
- package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
- package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
- package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
- package/src/skills/baseline/SKILL.md +183 -461
- package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
- package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
- package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
- package/src/skills/baseline/references/baseline-plan-template.md +37 -76
- package/src/skills/baseline/references/boundary-cases.md +86 -0
- package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
- package/src/skills/baseline/references/comparability-contract.md +7 -12
- package/src/skills/baseline/references/operational-guidance.md +56 -0
- package/src/skills/baseline/references/route-selection.md +5 -25
- package/src/skills/decision/SKILL.md +113 -306
- package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
- package/src/skills/decision/references/operational-guidance.md +94 -0
- package/src/skills/decision/references/research-route-criteria.md +7 -8
- package/src/skills/decision/references/strategic-decision-template.md +13 -26
- package/src/skills/experiment/SKILL.md +132 -670
- package/src/skills/experiment/references/execution-playbook.md +374 -0
- package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
- package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
- package/src/skills/experiment/references/operational-guidance.md +108 -0
- package/src/skills/finalize/SKILL.md +62 -0
- package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
- package/src/skills/finalize/references/resume-packet-template.md +7 -0
- package/src/skills/idea/SKILL.md +228 -15
- package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
- package/src/skills/idea/references/current-board-packet-template.md +61 -0
- package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
- package/src/skills/idea/references/idea-generation-playbook.md +21 -0
- package/src/skills/idea/references/idea-thinking-flow.md +6 -0
- package/src/skills/idea/references/literature-survey-template.md +3 -0
- package/src/skills/idea/references/objective-contract-template.md +54 -0
- package/src/skills/idea/references/outline-seeding-example.md +56 -0
- package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
- package/src/skills/idea/references/related-work-playbook.md +75 -2
- package/src/skills/idea/references/research-history-playbook.md +114 -0
- package/src/skills/idea/references/selection-gate.md +58 -6
- package/src/skills/intake-audit/SKILL.md +43 -2
- package/src/skills/intake-audit/references/state-audit-template.md +10 -0
- package/src/skills/nature-data/SKILL.md +128 -0
- package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-data/agents/openai.yaml +4 -0
- package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
- package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
- package/src/skills/nature-data/references/policy-principles.md +103 -0
- package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
- package/src/skills/nature-data/references/source-basis.md +54 -0
- package/src/skills/nature-data/references/statement-patterns.md +153 -0
- package/src/skills/nature-figure/SKILL.md +197 -0
- package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-figure/agents/openai.yaml +4 -0
- package/src/skills/nature-figure/evals/evals.json +37 -0
- package/src/skills/nature-figure/references/api.md +428 -0
- package/src/skills/nature-figure/references/backend-selection.md +100 -0
- package/src/skills/nature-figure/references/chart-types.md +281 -0
- package/src/skills/nature-figure/references/common-patterns.md +349 -0
- package/src/skills/nature-figure/references/design-theory.md +436 -0
- package/src/skills/nature-figure/references/figure-contract.md +93 -0
- package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
- package/src/skills/nature-figure/references/qa-contract.md +119 -0
- package/src/skills/nature-figure/references/r-template-index.md +66 -0
- package/src/skills/nature-figure/references/r-workflow.md +161 -0
- package/src/skills/nature-figure/references/tutorials.md +250 -0
- package/src/skills/nature-paper2ppt/SKILL.md +507 -0
- package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/SKILL.md +385 -0
- package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-polishing/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
- package/src/skills/nature-polishing/references/section-moves.md +240 -0
- package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
- package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
- package/src/skills/optimize/SKILL.md +177 -1568
- package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
- package/src/skills/optimize/references/candidate-board-template.md +13 -0
- package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
- package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
- package/src/skills/optimize/references/debug-response-template.md +29 -0
- package/src/skills/optimize/references/frontier-review-template.md +32 -0
- package/src/skills/optimize/references/fusion-playbook.md +36 -0
- package/src/skills/optimize/references/method-brief-template.md +73 -0
- package/src/skills/optimize/references/operational-guidance.md +621 -0
- package/src/skills/optimize/references/optimization-memory-template.md +30 -0
- package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
- package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
- package/src/skills/optimize/references/prompt-patterns.md +49 -0
- package/src/skills/paper-outline/SKILL.md +227 -0
- package/src/skills/paper-outline/references/outline-patterns.md +87 -0
- package/src/skills/paper-plot/SKILL.md +79 -0
- package/src/skills/paper-plot/agents/openai.yaml +4 -0
- package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
- package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
- package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
- package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
- package/src/skills/paper-plot/references/line_training_curve.md +44 -0
- package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
- package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
- package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
- package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
- package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
- package/src/skills/paper-plot/scripts/line_aime.py +94 -0
- package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
- package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
- package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
- package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
- package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
- package/src/skills/rebuttal/SKILL.md +9 -0
- package/src/skills/references/tool-usage-by-stage.md +438 -0
- package/src/skills/review/SKILL.md +105 -7
- package/src/skills/science/PROVENANCE.md +44 -0
- package/src/skills/science/SKILL.md +137 -0
- package/src/skills/science/references/artifact-science-tool.md +110 -0
- package/src/skills/science/references/claim-type-discipline.md +56 -0
- package/src/skills/science/references/domain-index.md +422 -0
- package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
- package/src/skills/science/references/package-check-playbook.md +64 -0
- package/src/skills/science/references/package-index.min.json +3616 -0
- package/src/skills/science/references/packages/abinit.md +80 -0
- package/src/skills/science/references/packages/acts.md +73 -0
- package/src/skills/science/references/packages/aiida-core.md +80 -0
- package/src/skills/science/references/packages/alamode.md +80 -0
- package/src/skills/science/references/packages/amuse.md +88 -0
- package/src/skills/science/references/packages/anndata.md +88 -0
- package/src/skills/science/references/packages/arbor.md +80 -0
- package/src/skills/science/references/packages/arc.md +73 -0
- package/src/skills/science/references/packages/astropy.md +88 -0
- package/src/skills/science/references/packages/astroquery.md +88 -0
- package/src/skills/science/references/packages/atomate2.md +80 -0
- package/src/skills/science/references/packages/atomsmltr.md +73 -0
- package/src/skills/science/references/packages/awkward.md +73 -0
- package/src/skills/science/references/packages/batman.md +88 -0
- package/src/skills/science/references/packages/biopython.md +88 -0
- package/src/skills/science/references/packages/bloqade.md +73 -0
- package/src/skills/science/references/packages/brian2.md +73 -0
- package/src/skills/science/references/packages/bullet3.md +73 -0
- package/src/skills/science/references/packages/calculix.md +80 -0
- package/src/skills/science/references/packages/cantera.md +73 -0
- package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
- package/src/skills/science/references/packages/ccdproc.md +88 -0
- package/src/skills/science/references/packages/celerite2.md +88 -0
- package/src/skills/science/references/packages/cellrank.md +73 -0
- package/src/skills/science/references/packages/cesm.md +80 -0
- package/src/skills/science/references/packages/chemicals.md +73 -0
- package/src/skills/science/references/packages/chempy.md +73 -0
- package/src/skills/science/references/packages/cirq.md +73 -0
- package/src/skills/science/references/packages/coffea.md +73 -0
- package/src/skills/science/references/packages/cp2k.md +88 -0
- package/src/skills/science/references/packages/custodian.md +80 -0
- package/src/skills/science/references/packages/dart.md +73 -0
- package/src/skills/science/references/packages/datamol.md +88 -0
- package/src/skills/science/references/packages/dd4hep.md +73 -0
- package/src/skills/science/references/packages/dealii.md +80 -0
- package/src/skills/science/references/packages/deepchem.md +88 -0
- package/src/skills/science/references/packages/delphes.md +73 -0
- package/src/skills/science/references/packages/devito.md +80 -0
- package/src/skills/science/references/packages/dftb.md +88 -0
- package/src/skills/science/references/packages/dftd4.md +88 -0
- package/src/skills/science/references/packages/dftk-jl.md +80 -0
- package/src/skills/science/references/packages/dolfinx.md +80 -0
- package/src/skills/science/references/packages/drake.md +73 -0
- package/src/skills/science/references/packages/dumux.md +73 -0
- package/src/skills/science/references/packages/elk.md +80 -0
- package/src/skills/science/references/packages/elmerfem.md +80 -0
- package/src/skills/science/references/packages/enzo-e.md +88 -0
- package/src/skills/science/references/packages/espresso.md +80 -0
- package/src/skills/science/references/packages/exoplanet.md +88 -0
- package/src/skills/science/references/packages/fairroot.md +73 -0
- package/src/skills/science/references/packages/fbpic.md +80 -0
- package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
- package/src/skills/science/references/packages/geant4.md +73 -0
- package/src/skills/science/references/packages/geosx.md +80 -0
- package/src/skills/science/references/packages/gprmax.md +80 -0
- package/src/skills/science/references/packages/gromacs.md +80 -0
- package/src/skills/science/references/packages/gwaslab.md +73 -0
- package/src/skills/science/references/packages/gz-sim.md +73 -0
- package/src/skills/science/references/packages/hail.md +88 -0
- package/src/skills/science/references/packages/hiphive.md +80 -0
- package/src/skills/science/references/packages/hoomd-blue.md +80 -0
- package/src/skills/science/references/packages/itensor.md +73 -0
- package/src/skills/science/references/packages/itensors-jl.md +73 -0
- package/src/skills/science/references/packages/jdftx.md +73 -0
- package/src/skills/science/references/packages/jobflow.md +80 -0
- package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
- package/src/skills/science/references/packages/kite.md +80 -0
- package/src/skills/science/references/packages/kratos.md +80 -0
- package/src/skills/science/references/packages/kwant.md +73 -0
- package/src/skills/science/references/packages/lammps.md +80 -0
- package/src/skills/science/references/packages/lightkurve.md +88 -0
- package/src/skills/science/references/packages/limix.md +73 -0
- package/src/skills/science/references/packages/maxwelllink.md +80 -0
- package/src/skills/science/references/packages/mcdc.md +73 -0
- package/src/skills/science/references/packages/meep.md +80 -0
- package/src/skills/science/references/packages/mfem.md +80 -0
- package/src/skills/science/references/packages/mitgcm.md +73 -0
- package/src/skills/science/references/packages/modflow6.md +73 -0
- package/src/skills/science/references/packages/molecool.md +73 -0
- package/src/skills/science/references/packages/mom6.md +73 -0
- package/src/skills/science/references/packages/moose.md +80 -0
- package/src/skills/science/references/packages/mpas-model.md +73 -0
- package/src/skills/science/references/packages/mujoco.md +73 -0
- package/src/skills/science/references/packages/mumax3.md +73 -0
- package/src/skills/science/references/packages/nekrs.md +80 -0
- package/src/skills/science/references/packages/nessi.md +73 -0
- package/src/skills/science/references/packages/nest-simulator.md +73 -0
- package/src/skills/science/references/packages/netket.md +73 -0
- package/src/skills/science/references/packages/neuron.md +73 -0
- package/src/skills/science/references/packages/nextflow.md +88 -0
- package/src/skills/science/references/packages/nwchem.md +88 -0
- package/src/skills/science/references/packages/openbabel.md +88 -0
- package/src/skills/science/references/packages/openems.md +80 -0
- package/src/skills/science/references/packages/openff-toolkit.md +88 -0
- package/src/skills/science/references/packages/openfoam-dev.md +80 -0
- package/src/skills/science/references/packages/openmc.md +73 -0
- package/src/skills/science/references/packages/openmm.md +80 -0
- package/src/skills/science/references/packages/openmoc.md +73 -0
- package/src/skills/science/references/packages/openmx.md +80 -0
- package/src/skills/science/references/packages/opensees.md +80 -0
- package/src/skills/science/references/packages/opensn.md +80 -0
- package/src/skills/science/references/packages/opm-simulators.md +73 -0
- package/src/skills/science/references/packages/oqupy.md +73 -0
- package/src/skills/science/references/packages/packmol.md +80 -0
- package/src/skills/science/references/packages/palabos.md +80 -0
- package/src/skills/science/references/packages/parflow.md +80 -0
- package/src/skills/science/references/packages/pennylane.md +88 -0
- package/src/skills/science/references/packages/perceval.md +73 -0
- package/src/skills/science/references/packages/phono3py.md +73 -0
- package/src/skills/science/references/packages/phonopy.md +73 -0
- package/src/skills/science/references/packages/photutils.md +88 -0
- package/src/skills/science/references/packages/picongpu.md +80 -0
- package/src/skills/science/references/packages/plink-ng.md +88 -0
- package/src/skills/science/references/packages/precice.md +73 -0
- package/src/skills/science/references/packages/psc.md +80 -0
- package/src/skills/science/references/packages/psi4.md +88 -0
- package/src/skills/science/references/packages/pybinding.md +73 -0
- package/src/skills/science/references/packages/pyfr.md +80 -0
- package/src/skills/science/references/packages/pyhf.md +73 -0
- package/src/skills/science/references/packages/pyiron_base.md +80 -0
- package/src/skills/science/references/packages/pylcp.md +73 -0
- package/src/skills/science/references/packages/pylith.md +80 -0
- package/src/skills/science/references/packages/pynbody.md +88 -0
- package/src/skills/science/references/packages/pysam.md +88 -0
- package/src/skills/science/references/packages/pyscf.md +88 -0
- package/src/skills/science/references/packages/q-e.md +73 -0
- package/src/skills/science/references/packages/qibo.md +73 -0
- package/src/skills/science/references/packages/qiskit.md +73 -0
- package/src/skills/science/references/packages/quantica-jl.md +73 -0
- package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
- package/src/skills/science/references/packages/quimb.md +73 -0
- package/src/skills/science/references/packages/qulacs.md +73 -0
- package/src/skills/science/references/packages/qutip.md +73 -0
- package/src/skills/science/references/packages/rdkit.md +88 -0
- package/src/skills/science/references/packages/rmg-py.md +73 -0
- package/src/skills/science/references/packages/root.md +73 -0
- package/src/skills/science/references/packages/scanpy.md +88 -0
- package/src/skills/science/references/packages/scikit-allel.md +88 -0
- package/src/skills/science/references/packages/scikit-bio.md +88 -0
- package/src/skills/science/references/packages/scqubits.md +73 -0
- package/src/skills/science/references/packages/scuff-em.md +80 -0
- package/src/skills/science/references/packages/scvi-tools.md +73 -0
- package/src/skills/science/references/packages/seissol.md +73 -0
- package/src/skills/science/references/packages/sfepy.md +80 -0
- package/src/skills/science/references/packages/sisl.md +73 -0
- package/src/skills/science/references/packages/smilei.md +80 -0
- package/src/skills/science/references/packages/snakemake.md +88 -0
- package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
- package/src/skills/science/references/packages/specutils.md +88 -0
- package/src/skills/science/references/packages/spglib.md +80 -0
- package/src/skills/science/references/packages/squidpy.md +88 -0
- package/src/skills/science/references/packages/starry.md +88 -0
- package/src/skills/science/references/packages/strawberryfields.md +73 -0
- package/src/skills/science/references/packages/su2.md +80 -0
- package/src/skills/science/references/packages/sunny-jl.md +73 -0
- package/src/skills/science/references/packages/sw4.md +73 -0
- package/src/skills/science/references/packages/swift.md +88 -0
- package/src/skills/science/references/packages/tdnegf.md +73 -0
- package/src/skills/science/references/packages/tenpy.md +73 -0
- package/src/skills/science/references/packages/thermo.md +73 -0
- package/src/skills/science/references/packages/tkwant.md +73 -0
- package/src/skills/science/references/packages/tvb-root.md +73 -0
- package/src/skills/science/references/packages/uproot5.md +73 -0
- package/src/skills/science/references/packages/vampire.md +80 -0
- package/src/skills/science/references/packages/wannier_tools.md +73 -0
- package/src/skills/science/references/packages/warpx.md +80 -0
- package/src/skills/science/references/packages/wrf.md +73 -0
- package/src/skills/science/references/packages/xtb.md +88 -0
- package/src/skills/science/references/packages/yt.md +73 -0
- package/src/skills/science/references/science-task-brief-template.md +71 -0
- package/src/skills/scout/SKILL.md +83 -425
- package/src/skills/scout/references/literature-scout-template.md +5 -24
- package/src/skills/scout/references/operational-guidance.md +191 -0
- package/src/skills/scout/references/paper-triage-playbook.md +11 -35
- package/src/skills/write/SKILL.md +744 -1246
- package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
- package/src/skills/write/references/oral_package_patterns.md +252 -0
- package/src/skills/write/references/oral_writing_principles.md +291 -0
- package/src/skills/write/references/section_rewrite_checklist.md +234 -0
- package/src/tui/dist/app/AppContainer.js +1314 -27
- package/src/tui/dist/components/Composer.js +26 -1
- package/src/tui/dist/components/ConfigScreen.js +2 -1
- package/src/tui/dist/components/InputPrompt.js +25 -9
- package/src/tui/dist/components/MainContent.js +18 -3
- package/src/tui/dist/components/QuestScreen.js +3 -2
- package/src/tui/dist/components/UtilityScreen.js +37 -0
- package/src/tui/dist/hooks/useSafeInput.js +10 -0
- package/src/tui/dist/index.js +13 -1
- package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
- package/src/tui/dist/lib/api.js +89 -1
- package/src/tui/package.json +1 -1
- package/src/ui/dist/assets/{AnalysisPlugin-BCKAfjba.js → AnalysisPlugin-CA94NGmI.js} +1 -1
- package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
- package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
- package/src/ui/dist/assets/{CodeViewerPlugin-CbaFRrUU.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
- package/src/ui/dist/assets/{DocViewerPlugin-DAjLVeQD.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
- package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
- package/src/ui/dist/assets/{GitDiffViewerPlugin-CQACjoAA.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
- package/src/ui/dist/assets/{GitSnapshotViewer-0r4nLPke.js → GitSnapshotViewer-CweA6VON.js} +2 -2
- package/src/ui/dist/assets/{ImageViewerPlugin-nBOmI2v_.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
- package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
- package/src/ui/dist/assets/{LatexPlugin-ZwtV8pIp.js → LatexPlugin-BQjAaA5J.js} +4 -4
- package/src/ui/dist/assets/{MarkdownViewerPlugin-DKqVfKyW.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
- package/src/ui/dist/assets/{MarketplacePlugin-BwxStZ9D.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
- package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
- package/src/ui/dist/assets/{NotebookEditor-DB9N_T9q.js → NotebookEditor-WFyd8Ybt.js} +3 -3
- package/src/ui/dist/assets/{PdfLoader-eWBONbQP.js → PdfLoader-CLE5u5TS.js} +3 -3
- package/src/ui/dist/assets/{PdfMarkdownPlugin-D22YOZL3.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
- package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
- package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
- package/src/ui/dist/assets/{TextViewerPlugin-C5xqeeUH.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
- package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
- package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
- package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
- package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
- package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
- package/src/ui/dist/assets/{code-WlFHE7z_.js → code-DbsmSd3Y.js} +1 -1
- package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
- package/src/ui/dist/assets/{wrap-text-BC-Hltpd.js → file-jump-queue-DeQBikaw.js} +3 -3
- package/src/ui/dist/assets/{file-socket-CfQPKQKj.js → file-socket-DA5XIx88.js} +1 -1
- package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
- package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
- package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
- package/src/ui/dist/assets/{index-CwNu1aH4.js → index-BsO46tJA.js} +1 -1
- package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
- package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
- package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
- package/src/ui/dist/assets/{project-sync-C9IdzdZW.js → project-sync-DPmWKmKD.js} +1 -1
- package/src/ui/dist/assets/{zoom-out-E_gaeAxL.js → zoom-out-DAukFWen.js} +3 -3
- package/src/ui/dist/index.html +3 -3
- package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
- package/src/skills/baseline/references/memory-playbook.md +0 -40
- package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
- package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
- package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
- package/src/skills/write/references/paper-section-playbook.md +0 -64
- package/src/skills/write/references/reviewer-first-writing.md +0 -64
- package/src/skills/write/references/revision-checklist.md +0 -70
- package/src/skills/write/references/section-contracts.md +0 -82
- package/src/skills/write/references/sentence-level-proofing.md +0 -49
- package/src/ui/dist/assets/AiManusChatView-Bv-Z8YpU.js +0 -204
- package/src/ui/dist/assets/CliPlugin-BCKcpc35.js +0 -109
- package/src/ui/dist/assets/CodeEditorPlugin-DbOfSJ8K.js +0 -2
- package/src/ui/dist/assets/GitCommitViewerPlugin-CIUqbUDO.js +0 -1
- package/src/ui/dist/assets/LabCopilotPanel-BHxOxF4z.js +0 -14
- package/src/ui/dist/assets/LabPlugin-BKoZGs95.js +0 -22
- package/src/ui/dist/assets/NotebookEditor-BEQhaQbt.js +0 -81
- package/src/ui/dist/assets/PdfViewerPlugin-c-RK9DLM.js +0 -17
- package/src/ui/dist/assets/SearchPlugin-CxF9ytAx.js +0 -16
- package/src/ui/dist/assets/VNCViewer-BoLGLnHz.js +0 -11
- package/src/ui/dist/assets/bot-DREQOxzP.js +0 -6
- package/src/ui/dist/assets/chevron-up-C9Qpx4DE.js +0 -6
- package/src/ui/dist/assets/file-content-BZMz3RYp.js +0 -1
- package/src/ui/dist/assets/file-diff-panel-CQhw0jS2.js +0 -1
- package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
- package/src/ui/dist/assets/git-commit-horizontal-DxZ8DCZh.js +0 -6
- package/src/ui/dist/assets/image-Bgl4VIyx.js +0 -6
- package/src/ui/dist/assets/index-BpV6lusQ.css +0 -33
- package/src/ui/dist/assets/index-CBNVuWcP.js +0 -2496
- package/src/ui/dist/assets/index-DrUnlf6K.js +0 -1
- package/src/ui/dist/assets/index-NW-h8VzN.js +0 -1
- package/src/ui/dist/assets/pdf-effect-queue-J8OnM0jE.js +0 -6
- package/src/ui/dist/assets/popover-CLc0pPP8.js +0 -1
- package/src/ui/dist/assets/select-Cs2PmzwL.js +0 -11
- package/src/ui/dist/assets/sigma-ClKcHAXm.js +0 -6
- package/src/ui/dist/assets/trash-DwpbFr3w.js +0 -11
- package/src/ui/dist/assets/useCliAccess-NQ8m0Let.js +0 -1
- package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
|
@@ -0,0 +1,206 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.011_osd
|
|
3
|
+
name: Orthogonal Subspace Decomposition for Generalizable AI-Generated Image Detection
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: Train and evaluate a CLIP-ViT-L/14 detector that uses SVD-based orthogonal
|
|
6
|
+
subspace decomposition (Effort) to generalize across deepfake and synthetic-image
|
|
7
|
+
forgery families on DeepfakeBench and GenImage benchmarks.
|
|
8
|
+
task_description: 'This benchmark packages the "Effort" method for AI-generated image
|
|
9
|
+
detection. The core idea is to decompose CLIP-ViT-L/14 weight matrices via SVD into
|
|
10
|
+
frozen principal components (preserving pre-trained knowledge) and trainable residual
|
|
11
|
+
components (learning forgery patterns), enforcing orthogonality to prevent overfitting
|
|
12
|
+
to seen forgery types. The execution route involves: (1) downloading the CLIP-ViT-L/14
|
|
13
|
+
backbone and pre-trained Effort checkpoints from Google Drive, (2) obtaining deepfake
|
|
14
|
+
datasets externally from DeepfakeBench (FaceForensics++, Celeb-DF-v2, DF40) or GenImage/Chameleon
|
|
15
|
+
for synthetic-image evaluation, (3) training the Effort detector head on one source
|
|
16
|
+
dataset while keeping SVD-principal components frozen, and (4) evaluating cross-dataset
|
|
17
|
+
generalization accuracy across multiple unseen forgery methods. Two codebases are
|
|
18
|
+
bundled: DeepfakeBench (face deepfake detection, Table 1 results) and UniversalFakeDetect_Benchmark
|
|
19
|
+
(general synthetic image detection, Table 2 results). The primary metric is detection
|
|
20
|
+
accuracy on unseen forgery families (e.g., BigGAN, CycleGAN, SimSwap). Datasets
|
|
21
|
+
must be downloaded separately from external sources and are large (tens to hundreds
|
|
22
|
+
of GB). Checkpoints are hosted on Google Drive.
|
|
23
|
+
|
|
24
|
+
'
|
|
25
|
+
capability_tags:
|
|
26
|
+
- research_code_optimization
|
|
27
|
+
- computer_vision
|
|
28
|
+
- deepfake_detection
|
|
29
|
+
- image_forensics
|
|
30
|
+
- benchmark_evaluation
|
|
31
|
+
- clip_finetuning
|
|
32
|
+
aisb_direction: T3
|
|
33
|
+
track_fit:
|
|
34
|
+
- paper_track
|
|
35
|
+
- benchmark_track
|
|
36
|
+
task_mode: experiment_driven
|
|
37
|
+
requires_execution: true
|
|
38
|
+
requires_paper: true
|
|
39
|
+
integrity_level: cas_plus_canary
|
|
40
|
+
snapshot_status: runnable
|
|
41
|
+
support_level: advanced
|
|
42
|
+
cost_band: high
|
|
43
|
+
time_band: 1d+
|
|
44
|
+
difficulty: hard
|
|
45
|
+
data_access: public
|
|
46
|
+
primary_outputs:
|
|
47
|
+
- biggan_accuracy
|
|
48
|
+
- detection_scores
|
|
49
|
+
- benchmark_report
|
|
50
|
+
- cross_dataset_auc
|
|
51
|
+
launch_profiles:
|
|
52
|
+
- id: quick_check
|
|
53
|
+
label: Quick Check (Inference Only)
|
|
54
|
+
description: 'Download a pre-trained Effort checkpoint from Google Drive and run
|
|
55
|
+
DeepfakeBench/training/demo.py on a single image or folder to verify the inference
|
|
56
|
+
pipeline produces fake-probability scores.
|
|
57
|
+
|
|
58
|
+
'
|
|
59
|
+
- id: single_dataset_train
|
|
60
|
+
label: Single-Dataset Train + Test
|
|
61
|
+
description: 'Train the Effort detector on one source dataset (e.g., FaceForensics++)
|
|
62
|
+
using a single GPU, then test on one held-out dataset (e.g., Celeb-DF-v2). Verifies
|
|
63
|
+
the training loop, SVD decomposition, orthogonal/KSV losses, and checkpoint saving.
|
|
64
|
+
|
|
65
|
+
'
|
|
66
|
+
- id: cross_benchmark_eval
|
|
67
|
+
label: Cross-Benchmark Evaluation
|
|
68
|
+
description: 'Evaluate the trained or pre-trained Effort detector across multiple
|
|
69
|
+
unseen forgery datasets (SimSwap, BlendFace, DeepFaceLab, etc. via DF40) to reproduce
|
|
70
|
+
the cross-dataset generalization results from the paper.
|
|
71
|
+
|
|
72
|
+
'
|
|
73
|
+
- id: univfd_benchmark
|
|
74
|
+
label: UniversalFakeDetect Benchmark
|
|
75
|
+
description: 'Use the UniversalFakeDetect_Benchmark/ codebase to reproduce Table
|
|
76
|
+
2 results on general synthetic image detection (GenImage, Chameleon).
|
|
77
|
+
|
|
78
|
+
'
|
|
79
|
+
dataset_download:
|
|
80
|
+
primary_method: mixed
|
|
81
|
+
sources:
|
|
82
|
+
- kind: external_repo
|
|
83
|
+
url: https://github.com/SCLBD/DeepfakeBench
|
|
84
|
+
access: public
|
|
85
|
+
note: 'FaceForensics++, Celeb-DF-v2, and other face deepfake datasets. Pre-processed
|
|
86
|
+
frames and face crops available via DeepfakeBench.
|
|
87
|
+
|
|
88
|
+
'
|
|
89
|
+
- kind: external_repo
|
|
90
|
+
url: https://github.com/YZY-stack/DF40
|
|
91
|
+
access: public
|
|
92
|
+
note: 'DF40 dataset with 40 distinct forgery methods for broader evaluation.
|
|
93
|
+
|
|
94
|
+
'
|
|
95
|
+
- kind: google_drive
|
|
96
|
+
url: https://drive.google.com/drive/folders/19kQwGDjF18uk78EnnypxxOLaG4Aa4v1h?usp=sharing
|
|
97
|
+
access: public
|
|
98
|
+
note: Pre-trained Effort checkpoints (FF++, GenImage, Chameleon).
|
|
99
|
+
- kind: google_drive
|
|
100
|
+
url: https://drive.google.com/drive/folders/1fm3Jd8lFMiSP1qgdmsxfqlJZGpr_bXsx?usp=drive_link
|
|
101
|
+
access: public
|
|
102
|
+
note: CLIP-ViT-L/14 backbone weights required by effort_detector.py.
|
|
103
|
+
notes:
|
|
104
|
+
- Deepfake datasets are tens to hundreds of GB after extraction.
|
|
105
|
+
- GenImage and Chameleon datasets must be obtained separately for Table 2 reproduction.
|
|
106
|
+
- JSON index files for each dataset must be generated or obtained from DeepfakeBench/DF40.
|
|
107
|
+
- CLIP backbone path is hardcoded in effort_detector.py and must be adjusted to
|
|
108
|
+
a local path.
|
|
109
|
+
credential_requirements:
|
|
110
|
+
mode: none
|
|
111
|
+
items: []
|
|
112
|
+
notes:
|
|
113
|
+
- All datasets and checkpoints are publicly available but hosted externally on Google
|
|
114
|
+
Drive and GitHub repos.
|
|
115
|
+
resources:
|
|
116
|
+
minimum:
|
|
117
|
+
cpu_cores: 8
|
|
118
|
+
ram_gb: 32
|
|
119
|
+
disk_gb: 150
|
|
120
|
+
gpu_count: 1
|
|
121
|
+
gpu_vram_gb: 16
|
|
122
|
+
recommended:
|
|
123
|
+
cpu_cores: 16
|
|
124
|
+
ram_gb: 64
|
|
125
|
+
disk_gb: 300
|
|
126
|
+
gpu_count: 4
|
|
127
|
+
gpu_vram_gb: 24
|
|
128
|
+
environment:
|
|
129
|
+
python: 3.7.2
|
|
130
|
+
cuda: '11.3'
|
|
131
|
+
pytorch: 1.12.0
|
|
132
|
+
flash_attn: null
|
|
133
|
+
key_packages:
|
|
134
|
+
- transformers
|
|
135
|
+
- loralib
|
|
136
|
+
- dlib==19.24.0
|
|
137
|
+
- opencv-python==4.6.0.66
|
|
138
|
+
- scikit-learn==1.0.2
|
|
139
|
+
- albumentations==1.1.0
|
|
140
|
+
- timm==0.6.12
|
|
141
|
+
- efficientnet-pytorch==0.7.1
|
|
142
|
+
- openai-clip (from git)
|
|
143
|
+
- kornia
|
|
144
|
+
- einops
|
|
145
|
+
notes:
|
|
146
|
+
- README specifies Python 3.7.2 and PyTorch 1.11, but install.sh installs torch==1.12.0+cu113;
|
|
147
|
+
use install.sh as the authoritative route.
|
|
148
|
+
- install.sh pins numpy==1.21.5, scipy==1.7.3 and many other specific versions.
|
|
149
|
+
- CLIP backbone uses HuggingFace transformers CLIPModel, not the OpenAI CLIP package
|
|
150
|
+
directly for the detector, but OpenAI CLIP is also installed.
|
|
151
|
+
- dlib is required for face landmark extraction during face-deepfake preprocessing.
|
|
152
|
+
risk_flags:
|
|
153
|
+
- external_dataset_dependency
|
|
154
|
+
- external_checkpoint_dependency
|
|
155
|
+
- hardcoded_paths
|
|
156
|
+
- large_dataset_route
|
|
157
|
+
- google_drive_download
|
|
158
|
+
risk_notes:
|
|
159
|
+
- Datasets (FaceForensics++, DF40, GenImage, Chameleon) are not bundled and must be
|
|
160
|
+
downloaded from external sources totaling potentially hundreds of GB.
|
|
161
|
+
- CLIP backbone path is hardcoded as "../models--openai--clip-vit-large-patch14" in
|
|
162
|
+
effort_detector.py and must be manually adjusted.
|
|
163
|
+
- Pre-trained checkpoints are hosted on Google Drive, which may rate-limit or require
|
|
164
|
+
manual browser download.
|
|
165
|
+
- The benchmark was statically audited but no runtime execution was performed during
|
|
166
|
+
packaging; metric values are unverified.
|
|
167
|
+
- install.sh installs torch 1.12 with CUDA 11.3, which may conflict with newer driver
|
|
168
|
+
setups.
|
|
169
|
+
- JSON dataset index files must be generated via preprocessing scripts or obtained
|
|
170
|
+
from DeepfakeBench/DF40 repos.
|
|
171
|
+
recommended_when: 'Use this benchmark when you want a realistic image-forensics optimization
|
|
172
|
+
task involving CLIP-based fine-tuning with SVD orthogonal decomposition, cross-dataset
|
|
173
|
+
generalization evaluation across many forgery families, and large-scale vision datasets.
|
|
174
|
+
Suitable for research into parameter-efficient tuning, deepfake detection robustness,
|
|
175
|
+
and foundation-model adaptation.
|
|
176
|
+
|
|
177
|
+
'
|
|
178
|
+
not_recommended_when: 'Do not use this if you cannot provision 150+ GB of disk for
|
|
179
|
+
datasets and checkpoints, lack a CUDA GPU with at least 16 GB VRAM, need a lightweight
|
|
180
|
+
CPU-only benchmark, or cannot download large files from Google Drive and external
|
|
181
|
+
GitHub repositories.
|
|
182
|
+
|
|
183
|
+
'
|
|
184
|
+
paper:
|
|
185
|
+
title: 'Effort: Efficient Orthogonal Modeling for Generalizable AI-Generated Image
|
|
186
|
+
Detection'
|
|
187
|
+
venue: ICML 2025 Oral
|
|
188
|
+
year: 2025
|
|
189
|
+
url: https://arxiv.org/abs/2411.15633
|
|
190
|
+
download:
|
|
191
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.011_osd.zip
|
|
192
|
+
archive_type: zip
|
|
193
|
+
local_dir_name: paper-11-OSD
|
|
194
|
+
provider: github_release
|
|
195
|
+
repo: ResearAI/DeepScientist
|
|
196
|
+
tag: aisb-v0.0.1
|
|
197
|
+
asset_name: aisb.t3.011_osd.zip
|
|
198
|
+
sha256: db6c786efc3503420d8269cff59b8abd9ac07786364bc130a811615db99364d8
|
|
199
|
+
size_bytes: 29719270
|
|
200
|
+
commercial:
|
|
201
|
+
annual_fee: null
|
|
202
|
+
display:
|
|
203
|
+
palette_seed: obsidian-coral-vision
|
|
204
|
+
art_style: forensic-clean
|
|
205
|
+
accent_priority: high
|
|
206
|
+
image_path: ../image/011_aisb.t3.011_osd.jpg
|
|
@@ -0,0 +1,163 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.011_osd
|
|
3
|
+
name: 正交子空间分解用于可泛化的AI生成图像检测
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 训练并评估一个使用基于SVD的正交子空间分解(Effort)的CLIP-ViT-L/14检测器,以在DeepfakeBench和GenImage基准上跨深度伪造和合成图像伪造家族实现泛化。
|
|
6
|
+
task_description: '本基准将"Effort"方法打包用于AI生成图像检测。核心思想是通过SVD将CLIP-ViT-L/14权重矩阵分解为冻结的主成分(保留预训练知识)和可训练的残差成分(学习伪造模式),并强制正交性以防止对已知伪造类型的过拟合。执行流程包括:(1)从Google Drive下载CLIP-ViT-L/14主干网络和预训练的Effort检查点,(2)从外部获取深度伪造数据集(DeepfakeBench的FaceForensics++、Celeb-DF-v2、DF40)或GenImage/Chameleon用于合成图像评估,(3)在保持SVD主成分冻结的同时,在一个源数据集上训练Effort检测器头部,(4)在多个未见过的伪造方法上评估跨数据集泛化准确率。打包了两个代码库:DeepfakeBench(面部深度伪造检测,表1结果)和UniversalFakeDetect_Benchmark(通用合成图像检测,表2结果)。主要指标是在未见伪造家族上的检测准确率(如BigGAN、CycleGAN、SimSwap)。数据集必须从外部来源单独下载,且体积较大(数十到数百GB)。检查点托管在Google Drive上。
|
|
7
|
+
|
|
8
|
+
'
|
|
9
|
+
capability_tags:
|
|
10
|
+
- research_code_optimization
|
|
11
|
+
- computer_vision
|
|
12
|
+
- deepfake_detection
|
|
13
|
+
- image_forensics
|
|
14
|
+
- benchmark_evaluation
|
|
15
|
+
- clip_finetuning
|
|
16
|
+
aisb_direction: T3
|
|
17
|
+
track_fit:
|
|
18
|
+
- paper_track
|
|
19
|
+
- benchmark_track
|
|
20
|
+
task_mode: experiment_driven
|
|
21
|
+
requires_execution: true
|
|
22
|
+
requires_paper: true
|
|
23
|
+
integrity_level: cas_plus_canary
|
|
24
|
+
snapshot_status: runnable
|
|
25
|
+
support_level: advanced
|
|
26
|
+
cost_band: high
|
|
27
|
+
time_band: 1d+
|
|
28
|
+
difficulty: hard
|
|
29
|
+
data_access: public
|
|
30
|
+
primary_outputs:
|
|
31
|
+
- biggan_accuracy
|
|
32
|
+
- detection_scores
|
|
33
|
+
- benchmark_report
|
|
34
|
+
- cross_dataset_auc
|
|
35
|
+
launch_profiles:
|
|
36
|
+
- id: quick_check
|
|
37
|
+
label: 快速检查(仅推理)
|
|
38
|
+
description: '从Google Drive下载预训练的Effort检查点,并在单个图像或文件夹上运行DeepfakeBench/training/demo.py,以验证推理流程是否产生伪造概率分数。
|
|
39
|
+
|
|
40
|
+
'
|
|
41
|
+
- id: single_dataset_train
|
|
42
|
+
label: 单数据集训练+测试
|
|
43
|
+
description: '使用单个GPU在一个源数据集(如FaceForensics++)上训练Effort检测器,然后在一个保留数据集(如Celeb-DF-v2)上进行测试。验证训练循环、SVD分解、正交/KSV损失和检查点保存功能。
|
|
44
|
+
|
|
45
|
+
'
|
|
46
|
+
- id: cross_benchmark_eval
|
|
47
|
+
label: 跨基准评估
|
|
48
|
+
description: '在多个未见过的伪造数据集(通过DF40的SimSwap、BlendFace、DeepFaceLab等)上评估训练或预训练的Effort检测器,以复现论文中的跨数据集泛化结果。
|
|
49
|
+
|
|
50
|
+
'
|
|
51
|
+
- id: univfd_benchmark
|
|
52
|
+
label: UniversalFakeDetect基准
|
|
53
|
+
description: '使用UniversalFakeDetect_Benchmark/代码库复现表2中关于通用合成图像检测(GenImage、Chameleon)的结果。
|
|
54
|
+
|
|
55
|
+
'
|
|
56
|
+
dataset_download:
|
|
57
|
+
primary_method: mixed
|
|
58
|
+
sources:
|
|
59
|
+
- kind: external_repo
|
|
60
|
+
url: https://github.com/SCLBD/DeepfakeBench
|
|
61
|
+
access: public
|
|
62
|
+
note: 'FaceForensics++、Celeb-DF-v2及其他面部深度伪造数据集。通过DeepfakeBench可获取预处理后的帧和人脸裁剪图像。
|
|
63
|
+
|
|
64
|
+
'
|
|
65
|
+
- kind: external_repo
|
|
66
|
+
url: https://github.com/YZY-stack/DF40
|
|
67
|
+
access: public
|
|
68
|
+
note: DF40数据集,包含40种不同的伪造方法,用于更广泛的评估。
|
|
69
|
+
- kind: google_drive
|
|
70
|
+
url: https://drive.google.com/drive/folders/19kQwGDjF18uk78EnnypxxOLaG4Aa4v1h?usp=sharing
|
|
71
|
+
access: public
|
|
72
|
+
note: 预训练的Effort检查点(FF++、GenImage、Chameleon)。
|
|
73
|
+
- kind: google_drive
|
|
74
|
+
url: https://drive.google.com/drive/folders/1fm3Jd8lFMiSP1qgdmsxfqlJZGpr_bXsx?usp=drive_link
|
|
75
|
+
access: public
|
|
76
|
+
note: effort_detector.py所需的CLIP-ViT-L/14主干网络权重。
|
|
77
|
+
notes:
|
|
78
|
+
- 深度伪造数据集解压后为数十到数百GB。
|
|
79
|
+
- GenImage和Chameleon数据集必须单独获取以复现表2。
|
|
80
|
+
- 每个数据集的JSON索引文件必须通过预处理脚本生成或从DeepfakeBench/DF40获取。
|
|
81
|
+
- CLIP主干路径在effort_detector.py中硬编码,必须调整为本地路径。
|
|
82
|
+
credential_requirements:
|
|
83
|
+
mode: none
|
|
84
|
+
items: []
|
|
85
|
+
notes:
|
|
86
|
+
- 所有数据集和检查点均可公开获取,但托管在外部的Google Drive和GitHub仓库上。
|
|
87
|
+
resources:
|
|
88
|
+
minimum:
|
|
89
|
+
cpu_cores: 8
|
|
90
|
+
ram_gb: 32
|
|
91
|
+
disk_gb: 150
|
|
92
|
+
gpu_count: 1
|
|
93
|
+
gpu_vram_gb: 16
|
|
94
|
+
recommended:
|
|
95
|
+
cpu_cores: 16
|
|
96
|
+
ram_gb: 64
|
|
97
|
+
disk_gb: 300
|
|
98
|
+
gpu_count: 4
|
|
99
|
+
gpu_vram_gb: 24
|
|
100
|
+
environment:
|
|
101
|
+
python: 3.7.2
|
|
102
|
+
cuda: '11.3'
|
|
103
|
+
pytorch: 1.12.0
|
|
104
|
+
flash_attn: null
|
|
105
|
+
key_packages:
|
|
106
|
+
- transformers
|
|
107
|
+
- loralib
|
|
108
|
+
- dlib==19.24.0
|
|
109
|
+
- opencv-python==4.6.0.66
|
|
110
|
+
- scikit-learn==1.0.2
|
|
111
|
+
- albumentations==1.1.0
|
|
112
|
+
- timm==0.6.12
|
|
113
|
+
- efficientnet-pytorch==0.7.1
|
|
114
|
+
- openai-clip (from git)
|
|
115
|
+
- kornia
|
|
116
|
+
- einops
|
|
117
|
+
notes:
|
|
118
|
+
- README指定Python 3.7.2和PyTorch 1.11,但install.sh安装torch==1.12.0+cu113;请以install.sh作为权威安装路径。
|
|
119
|
+
- install.sh固定numpy==1.21.5、scipy==1.7.3及其他众多特定版本。
|
|
120
|
+
- 检测器的CLIP主干使用HuggingFace transformers的CLIPModel,而非直接使用OpenAI CLIP包,但环境中也安装了OpenAI CLIP。
|
|
121
|
+
- dlib用于人脸深度伪造预处理期间的人脸特征点提取。
|
|
122
|
+
risk_flags:
|
|
123
|
+
- external_dataset_dependency
|
|
124
|
+
- external_checkpoint_dependency
|
|
125
|
+
- hardcoded_paths
|
|
126
|
+
- large_dataset_route
|
|
127
|
+
- google_drive_download
|
|
128
|
+
risk_notes:
|
|
129
|
+
- 数据集(FaceForensics++、DF40、GenImage、Chameleon)未打包,必须从外部来源下载,总量可能达数百GB。
|
|
130
|
+
- CLIP主干路径在effort_detector.py中硬编码为"../models--openai--clip-vit-large-patch14",必须手动调整。
|
|
131
|
+
- 预训练检查点托管在Google Drive上,可能会有速率限制或需要手动浏览器下载。
|
|
132
|
+
- 该基准已进行静态审计,但在打包过程中未执行运行时验证;指标值未经验证。
|
|
133
|
+
- install.sh安装torch 1.12配合CUDA 11.3,可能与更新版本的驱动设置冲突。
|
|
134
|
+
- 必须通过预处理脚本生成JSON数据集索引文件,或从DeepfakeBench/DF40仓库获取。
|
|
135
|
+
recommended_when: '当您需要一个贴近实际的图像取证优化任务,涉及基于CLIP的微调与SVD正交分解、跨多个伪造家族的跨数据集泛化评估,以及大规模视觉数据集时,请使用此基准。适用于参数高效微调、深度伪造检测鲁棒性和基础模型适应方面的研究。
|
|
136
|
+
|
|
137
|
+
'
|
|
138
|
+
not_recommended_when: '如果您无法为数据集和检查点提供150GB以上的磁盘空间、缺乏至少16GB显存的CUDA GPU、需要轻量级纯CPU基准,或无法从Google Drive和外部GitHub仓库下载大文件,请勿使用此基准。
|
|
139
|
+
|
|
140
|
+
'
|
|
141
|
+
paper:
|
|
142
|
+
title: 'Effort: Efficient Orthogonal Modeling for Generalizable AI-Generated Image
|
|
143
|
+
Detection'
|
|
144
|
+
venue: ICML 2025 Oral
|
|
145
|
+
year: 2025
|
|
146
|
+
url: https://arxiv.org/abs/2411.15633
|
|
147
|
+
download:
|
|
148
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.011_osd.zip
|
|
149
|
+
archive_type: zip
|
|
150
|
+
local_dir_name: paper-11-OSD
|
|
151
|
+
provider: github_release
|
|
152
|
+
repo: ResearAI/DeepScientist
|
|
153
|
+
tag: aisb-v0.0.1
|
|
154
|
+
asset_name: aisb.t3.011_osd.zip
|
|
155
|
+
sha256: db6c786efc3503420d8269cff59b8abd9ac07786364bc130a811615db99364d8
|
|
156
|
+
size_bytes: 29719270
|
|
157
|
+
commercial:
|
|
158
|
+
annual_fee: null
|
|
159
|
+
display:
|
|
160
|
+
palette_seed: obsidian-coral-vision
|
|
161
|
+
art_style: forensic-clean
|
|
162
|
+
accent_priority: high
|
|
163
|
+
image_path: ../image/011_aisb.t3.011_osd.jpg
|
|
@@ -0,0 +1,206 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.012_efficientqat
|
|
3
|
+
name: 'EfficientQAT: Efficient Quantization-Aware Training for Large Language Models'
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 'Two-stage low-bit quantization-aware training (Block-AP → E2E-QP) for Llama-2/3
|
|
6
|
+
and Mistral families (7B–70B), evaluated via WikiText-2 perplexity, C4 perplexity,
|
|
7
|
+
and zero-shot accuracy on five reasoning benchmarks.
|
|
8
|
+
|
|
9
|
+
'
|
|
10
|
+
task_description: 'This benchmark implements EfficientQAT, a two-stage quantization-aware
|
|
11
|
+
training pipeline for large language models at 2/3/4-bit weight-only precision.
|
|
12
|
+
Stage 1 (Block-AP) trains all parameters—weights, step sizes, and zero points—block-by-block
|
|
13
|
+
using reconstruction loss on 4096 RedPajama samples (context length 2048). Stage
|
|
14
|
+
2 (E2E-QP) freezes the quantized integer weights and fine-tunes only the quantization
|
|
15
|
+
step sizes end-to-end on a target dataset (RedPajama or Alpaca, context length 4096).
|
|
16
|
+
The primary executable anchors are main_block_ap.py and main_e2e_qp.py, with supplementary
|
|
17
|
+
scale-calibration scripts (calibrate_scales.py, calibrate_scales_v2.py). Evaluation
|
|
18
|
+
measures WikiText-2 perplexity, C4 perplexity, and average zero-shot accuracy on
|
|
19
|
+
WinoGrande, PIQA, HellaSwag, ARC-Easy, and ARC-Challenge using lm-eval v0.4.2. Pre-quantized
|
|
20
|
+
checkpoints for many model/bit configurations are available on HuggingFace and can
|
|
21
|
+
be converted to GPTQ or BitBLAS formats via bundled transfer scripts. The paper
|
|
22
|
+
reports that 2-bit Llama-2-70B can be obtained on a single A100-80GB in 41 hours
|
|
23
|
+
with less than 3 points of accuracy degradation. No external evaluation service is required;
|
|
24
|
+
all metrics are computed locally.
|
|
25
|
+
|
|
26
|
+
'
|
|
27
|
+
capability_tags:
|
|
28
|
+
- research_code_optimization
|
|
29
|
+
- large_language_models
|
|
30
|
+
- quantization
|
|
31
|
+
- model_compression
|
|
32
|
+
- efficient_inference
|
|
33
|
+
- quantization_aware_training
|
|
34
|
+
aisb_direction: T3
|
|
35
|
+
track_fit:
|
|
36
|
+
- paper_track
|
|
37
|
+
- benchmark_track
|
|
38
|
+
task_mode: experiment_driven
|
|
39
|
+
requires_execution: true
|
|
40
|
+
requires_paper: true
|
|
41
|
+
integrity_level: cas_plus_canary
|
|
42
|
+
snapshot_status: runnable
|
|
43
|
+
support_level: advanced
|
|
44
|
+
time_band: 1d+
|
|
45
|
+
cost_band: high
|
|
46
|
+
difficulty: hard
|
|
47
|
+
data_access: public
|
|
48
|
+
primary_outputs:
|
|
49
|
+
- wikitext2_ppl
|
|
50
|
+
- c4_ppl
|
|
51
|
+
- quantized_checkpoint
|
|
52
|
+
- avg_accuracy
|
|
53
|
+
launch_profiles:
|
|
54
|
+
- id: calibration_only
|
|
55
|
+
label: Calibration Only
|
|
56
|
+
description: 'Run scale calibration (calibrate_scales.py or calibrate_scales_v2.py)
|
|
57
|
+
on a pre-quantized checkpoint using WikiText-2 train data. Produces updated scale
|
|
58
|
+
parameters without full Block-AP or E2E-QP retraining. Fastest route; requires
|
|
59
|
+
a pre-quantized model on disk.
|
|
60
|
+
|
|
61
|
+
'
|
|
62
|
+
- id: qat_eval
|
|
63
|
+
label: QAT + Eval
|
|
64
|
+
description: 'Run the full two-stage EfficientQAT pipeline: Block-AP block-wise
|
|
65
|
+
training via main_block_ap.py, followed by E2E-QP end-to-end step-size training
|
|
66
|
+
via main_e2e_qp.py, then evaluate WikiText-2/C4 perplexity and zero-shot accuracy
|
|
67
|
+
on five reasoning tasks. This is the paper-faithful route and requires significant
|
|
68
|
+
GPU time (hours to days depending on model size).
|
|
69
|
+
|
|
70
|
+
'
|
|
71
|
+
- id: eval_pretrained
|
|
72
|
+
label: Evaluate Pre-Quantized
|
|
73
|
+
description: 'Download a pre-quantized EfficientQAT checkpoint from HuggingFace
|
|
74
|
+
and evaluate perplexity and zero-shot accuracy without any training. Uses main_block_ap.py
|
|
75
|
+
with --resume_quant.
|
|
76
|
+
|
|
77
|
+
'
|
|
78
|
+
dataset_download:
|
|
79
|
+
primary_method: mixed
|
|
80
|
+
sources:
|
|
81
|
+
- kind: huggingface
|
|
82
|
+
url: https://huggingface.co/datasets/togethercomputer/RedPajama-Data-1T-Sample
|
|
83
|
+
access: public
|
|
84
|
+
note: 'RedPajama calibration data used for both Block-AP (4096 samples, seqlen
|
|
85
|
+
2048) and E2E-QP (4096 samples, seqlen 4096). Downloaded automatically by datautils_block.py.
|
|
86
|
+
|
|
87
|
+
'
|
|
88
|
+
- kind: huggingface
|
|
89
|
+
url: https://huggingface.co/datasets/wikitext
|
|
90
|
+
access: public
|
|
91
|
+
note: 'WikiText-2 (wikitext-2-raw-v1) used for perplexity evaluation and scale
|
|
92
|
+
calibration. Downloaded automatically during eval.
|
|
93
|
+
|
|
94
|
+
'
|
|
95
|
+
- kind: huggingface
|
|
96
|
+
url: https://huggingface.co/ChenMnZ
|
|
97
|
+
access: public
|
|
98
|
+
note: 'Pre-quantized model checkpoints for Llama-2 (7B/13B/70B), Llama-3 (8B/70B),
|
|
99
|
+
Llama-3-Instruct, and Mistral-Large in EQAT/GPTQ/BitBLAS formats. Individual
|
|
100
|
+
checkpoints range from ~2 GB to ~39 GB.
|
|
101
|
+
|
|
102
|
+
'
|
|
103
|
+
- kind: huggingface
|
|
104
|
+
url: https://huggingface.co/datasets/tatsu-lab/alpaca
|
|
105
|
+
access: public
|
|
106
|
+
note: 'Alpaca instruction-tuning dataset, used as alternative E2E-QP training
|
|
107
|
+
data for instruction-tuning scenarios.
|
|
108
|
+
|
|
109
|
+
'
|
|
110
|
+
notes:
|
|
111
|
+
- Full-precision base models (e.g. Llama-2-70B at ~131 GB) must be downloaded separately
|
|
112
|
+
from their original HuggingFace repos if running Block-AP from scratch.
|
|
113
|
+
- Pre-quantized checkpoints are much smaller (e.g. w2g64 Llama-2-70B is ~20 GB).
|
|
114
|
+
- Total disk usage depends heavily on which model families and bit widths are targeted.
|
|
115
|
+
credential_requirements:
|
|
116
|
+
mode: none
|
|
117
|
+
items:
|
|
118
|
+
- HuggingFace account may be needed for gated models (Llama-2, Llama-3) but not
|
|
119
|
+
for the EfficientQAT checkpoints themselves
|
|
120
|
+
notes:
|
|
121
|
+
- Meta Llama model weights require accepting a license on HuggingFace before download.
|
|
122
|
+
- Pre-quantized EfficientQAT checkpoints under ChenMnZ namespace are publicly accessible.
|
|
123
|
+
resources:
|
|
124
|
+
minimum:
|
|
125
|
+
cpu_cores: 16
|
|
126
|
+
ram_gb: 64
|
|
127
|
+
disk_gb: 200
|
|
128
|
+
gpu_count: 1
|
|
129
|
+
gpu_vram_gb: 48
|
|
130
|
+
recommended:
|
|
131
|
+
cpu_cores: 32
|
|
132
|
+
ram_gb: 128
|
|
133
|
+
disk_gb: 500
|
|
134
|
+
gpu_count: 2
|
|
135
|
+
gpu_vram_gb: 80
|
|
136
|
+
environment:
|
|
137
|
+
python: '3.11'
|
|
138
|
+
cuda: null
|
|
139
|
+
pytorch: 2.2.2
|
|
140
|
+
flash_attn: null
|
|
141
|
+
key_packages:
|
|
142
|
+
- bitsandbytes==0.41.0
|
|
143
|
+
- transformers==4.40.1
|
|
144
|
+
- lm-eval==0.4.2
|
|
145
|
+
- accelerate
|
|
146
|
+
- datasets
|
|
147
|
+
notes:
|
|
148
|
+
- See the bundled requirements.txt for the full dependency set.
|
|
149
|
+
- CUDA toolkit version is not pinned in the repo; any version supporting PyTorch
|
|
150
|
+
2.2.2 should work.
|
|
151
|
+
- GPTQModel (v0.9.8 tested) is required only for model format transfer to GPTQ/BitBLAS;
|
|
152
|
+
not needed for core QAT or evaluation.
|
|
153
|
+
- bitsandbytes is used for the AdamW optimizer in E2E-QP training.
|
|
154
|
+
risk_flags:
|
|
155
|
+
- large_model_download
|
|
156
|
+
- high_gpu_memory
|
|
157
|
+
- long_training_time
|
|
158
|
+
- gated_model_access
|
|
159
|
+
risk_notes:
|
|
160
|
+
- 70B model routes require at least one A100-80GB (paper reports 41 hours for 2-bit Llama-2-70B
|
|
161
|
+
Block-AP + E2E-QP) or multi-GPU setups.
|
|
162
|
+
- 7B model routes are feasible on a single 48GB GPU but still take multiple hours
|
|
163
|
+
for full Block-AP + E2E-QP.
|
|
164
|
+
- Full-precision base model weights for Llama-2/3 are gated on HuggingFace and require
|
|
165
|
+
license acceptance.
|
|
166
|
+
- The --off_load_to_disk flag in Block-AP can reduce CPU memory usage at the cost
|
|
167
|
+
of training speed.
|
|
168
|
+
- No benchmark execution was performed during the packaging pass; runtime verification
|
|
169
|
+
is still needed.
|
|
170
|
+
- E2E-QP memory for 2-bit Llama-2-70B is reported as 34.2 GB in the paper.
|
|
171
|
+
recommended_when: 'Use this benchmark when you want an LLM-systems task centered on
|
|
172
|
+
quantization-aware training at aggressive bit widths (2–4 bit), with self-contained
|
|
173
|
+
training and evaluation pipelines covering multiple model scales from 7B to 70B.
|
|
174
|
+
Suitable for evaluating optimization strategies for low-bit QAT, comparing against
|
|
175
|
+
PTQ and Q-PEFT baselines, or producing deployable quantized checkpoints in GPTQ/BitBLAS
|
|
176
|
+
formats.
|
|
177
|
+
|
|
178
|
+
'
|
|
179
|
+
not_recommended_when: 'Do not use this if you lack access to at least one GPU with
|
|
180
|
+
≥48 GB VRAM, if you need sub-hour benchmark turnaround, or if your focus is on small
|
|
181
|
+
models (<7B parameters). Also not suitable if you need weight-activation quantization
|
|
182
|
+
benchmarks (this benchmark is weight-only quantization).
|
|
183
|
+
|
|
184
|
+
'
|
|
185
|
+
paper:
|
|
186
|
+
title: 'EfficientQAT: Efficient Quantization-Aware Training for Large Language Models'
|
|
187
|
+
venue: ACL 2025 Main
|
|
188
|
+
year: 2025
|
|
189
|
+
url: https://arxiv.org/abs/2407.11062
|
|
190
|
+
download:
|
|
191
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.012_efficientqat.zip
|
|
192
|
+
archive_type: zip
|
|
193
|
+
local_dir_name: paper-12-EfficientQAT
|
|
194
|
+
provider: github_release
|
|
195
|
+
repo: ResearAI/DeepScientist
|
|
196
|
+
tag: aisb-v0.0.1
|
|
197
|
+
asset_name: aisb.t3.012_efficientqat.zip
|
|
198
|
+
sha256: 8f53850f12f1bdbc4e3212b21fb51a7479ebb8ab715f3138d96ef1da979b2977
|
|
199
|
+
size_bytes: 107235
|
|
200
|
+
commercial:
|
|
201
|
+
annual_fee: null
|
|
202
|
+
display:
|
|
203
|
+
palette_seed: amber-steel-llm
|
|
204
|
+
art_style: hardware-editorial
|
|
205
|
+
accent_priority: high
|
|
206
|
+
image_path: ../image/012_aisb.t3.012_efficientqat.jpg
|