@researai/deepscientist 1.5.16 → 1.6.0
This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +309 -130
- package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
- package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
- package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
- package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
- package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
- package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
- package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
- package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
- package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
- package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
- package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
- package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
- package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
- package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
- package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
- package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
- package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
- package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
- package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
- package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
- package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
- package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
- package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
- package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
- package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
- package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
- package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
- package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
- package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
- package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
- package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
- package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
- package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
- package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
- package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
- package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
- package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
- package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
- package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
- package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
- package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
- package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
- package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
- package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
- package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
- package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
- package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
- package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
- package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
- package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
- package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
- package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
- package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
- package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
- package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
- package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
- package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
- package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
- package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
- package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
- package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
- package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
- package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
- package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
- package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
- package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
- package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
- package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
- package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
- package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
- package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
- package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
- package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
- package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
- package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
- package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
- package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
- package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
- package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
- package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
- package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
- package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
- package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
- package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
- package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
- package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
- package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
- package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
- package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
- package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
- package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
- package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
- package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
- package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
- package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
- package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
- package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
- package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
- package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
- package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
- package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
- package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
- package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
- package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
- package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
- package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
- package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
- package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
- package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
- package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
- package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
- package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
- package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
- package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
- package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
- package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
- package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
- package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
- package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
- package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
- package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
- package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
- package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
- package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
- package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
- package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
- package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
- package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
- package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
- package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
- package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
- package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
- package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
- package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
- package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
- package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
- package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
- package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
- package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
- package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
- package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
- package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
- package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
- package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
- package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
- package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
- package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
- package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
- package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
- package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
- package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
- package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
- package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
- package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
- package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
- package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
- package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
- package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
- package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
- package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
- package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
- package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
- package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
- package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
- package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
- package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
- package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
- package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
- package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
- package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
- package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
- package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
- package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
- package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
- package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
- package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
- package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
- package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
- package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
- package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
- package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
- package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
- package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
- package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
- package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
- package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
- package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
- package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
- package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
- package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
- package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
- package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
- package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
- package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
- package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
- package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
- package/AISB/image/aisb.b10.climate_earth.svg +16 -0
- package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
- package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
- package/AISB/image/aisb.b2.agent_systems.svg +16 -0
- package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
- package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
- package/AISB/image/aisb.b5.math_proof.svg +16 -0
- package/AISB/image/aisb.b6.research_process.svg +16 -0
- package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
- package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
- package/AISB/image/aisb.b9.material_science.svg +16 -0
- package/README.md +196 -32
- package/bin/ds.js +924 -66
- package/docs/en/00_QUICK_START.md +195 -18
- package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
- package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
- package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
- package/docs/en/05_TUI_GUIDE.md +171 -2
- package/docs/en/07_MEMORY_AND_MCP.md +38 -2
- package/docs/en/09_DOCTOR.md +78 -7
- package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
- package/docs/en/11_LICENSE_AND_RISK.md +4 -0
- package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/en/15_CODEX_PROVIDER_SETUP.md +624 -180
- package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +386 -0
- package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
- package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
- package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
- package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
- package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
- package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
- package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
- package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
- package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
- package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
- package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
- package/docs/en/91_DEVELOPMENT.md +266 -0
- package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
- package/docs/en/README.md +48 -7
- package/docs/images/admin/admin-connectors-health-en.png +0 -0
- package/docs/images/admin/admin-controllers-en.png +0 -0
- package/docs/images/admin/admin-diagnostics-en.png +0 -0
- package/docs/images/admin/admin-errors-en.png +0 -0
- package/docs/images/admin/admin-issues-en.png +0 -0
- package/docs/images/admin/admin-logs-en.png +0 -0
- package/docs/images/admin/admin-quest-detail-en.png +0 -0
- package/docs/images/admin/admin-quests-en.png +0 -0
- package/docs/images/admin/admin-repairs-en.png +0 -0
- package/docs/images/admin/admin-runtime-en.png +0 -0
- package/docs/images/admin/admin-search-en.png +0 -0
- package/docs/images/admin/admin-stats-en.png +0 -0
- package/docs/images/admin/admin-summary-en.png +0 -0
- package/docs/images/connectors/connector-discord-en.png +0 -0
- package/docs/images/connectors/connector-feishu-en.png +0 -0
- package/docs/images/connectors/connector-lingzhu-en.png +0 -0
- package/docs/images/connectors/connector-qq-en.png +0 -0
- package/docs/images/connectors/connector-slack-en.png +0 -0
- package/docs/images/connectors/connector-telegram-en.png +0 -0
- package/docs/images/connectors/connector-weixin-en.png +0 -0
- package/docs/images/connectors/connector-whatsapp-en.png +0 -0
- package/docs/images/settings/settings-baselines-en.png +0 -0
- package/docs/images/settings/settings-config-en.png +0 -0
- package/docs/images/settings/settings-connectors-overview-en.png +0 -0
- package/docs/images/settings/settings-deepxiv-en.png +0 -0
- package/docs/images/settings/settings-mcp-servers-en.png +0 -0
- package/docs/images/settings/settings-plugins-en.png +0 -0
- package/docs/images/settings/settings-runners-en.png +0 -0
- package/docs/zh/00_QUICK_START.md +142 -18
- package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
- package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/zh/05_TUI_GUIDE.md +171 -2
- package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
- package/docs/zh/09_DOCTOR.md +54 -8
- package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
- package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
- package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/zh/15_CODEX_PROVIDER_SETUP.md +552 -181
- package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +384 -0
- package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
- package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
- package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
- package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
- package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
- package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
- package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
- package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
- package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
- package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
- package/docs/zh/README.md +33 -7
- package/install.sh +168 -20
- package/package.json +5 -1
- package/pyproject.toml +2 -1
- package/src/deepscientist/__init__.py +1 -1
- package/src/deepscientist/acp/envelope.py +13 -0
- package/src/deepscientist/admin/__init__.py +3 -0
- package/src/deepscientist/admin/charts.py +681 -0
- package/src/deepscientist/admin/logs.py +119 -0
- package/src/deepscientist/admin/repairs.py +217 -0
- package/src/deepscientist/admin/service.py +1310 -0
- package/src/deepscientist/admin/system_info.py +700 -0
- package/src/deepscientist/admin/tasks.py +465 -0
- package/src/deepscientist/admin/tool_metrics.py +600 -0
- package/src/deepscientist/artifact/guidance.py +8 -4
- package/src/deepscientist/artifact/schemas.py +115 -0
- package/src/deepscientist/artifact/service.py +4268 -260
- package/src/deepscientist/bash_exec/monitor.py +30 -3
- package/src/deepscientist/bash_exec/service.py +134 -1
- package/src/deepscientist/benchstore/__init__.py +4 -0
- package/src/deepscientist/benchstore/prompt_builder.py +224 -0
- package/src/deepscientist/benchstore/service.py +1716 -0
- package/src/deepscientist/bridges/connectors.py +8 -2
- package/src/deepscientist/channels/weixin_ilink.py +8 -1
- package/src/deepscientist/cli.py +92 -17
- package/src/deepscientist/codex_cli_compat.py +187 -74
- package/src/deepscientist/config/models.py +82 -11
- package/src/deepscientist/config/service.py +1077 -93
- package/src/deepscientist/connector/weixin_support.py +48 -17
- package/src/deepscientist/daemon/api/handlers.py +827 -235
- package/src/deepscientist/daemon/api/router.py +81 -1
- package/src/deepscientist/daemon/app.py +1512 -85
- package/src/deepscientist/diagnostics/__init__.py +6 -0
- package/src/deepscientist/diagnostics/runner_failures.py +277 -0
- package/src/deepscientist/doctor.py +407 -56
- package/src/deepscientist/evidence_packets.py +590 -0
- package/src/deepscientist/home.py +52 -4
- package/src/deepscientist/kimi_cli_compat.py +50 -0
- package/src/deepscientist/latex_runtime.py +2 -2
- package/src/deepscientist/mcp/context.py +2 -0
- package/src/deepscientist/mcp/schemas.py +114 -0
- package/src/deepscientist/mcp/server.py +1566 -126
- package/src/deepscientist/memory/service.py +203 -16
- package/src/deepscientist/process_control.py +8 -1
- package/src/deepscientist/prompts/builder.py +850 -88
- package/src/deepscientist/quest/__init__.py +2 -2
- package/src/deepscientist/quest/layout.py +12 -1
- package/src/deepscientist/quest/node_traces.py +10 -0
- package/src/deepscientist/quest/service.py +1852 -161
- package/src/deepscientist/quest/stage_views.py +1 -1
- package/src/deepscientist/runners/__init__.py +18 -0
- package/src/deepscientist/runners/base.py +89 -1
- package/src/deepscientist/runners/builtins.py +13 -1
- package/src/deepscientist/runners/claude.py +391 -0
- package/src/deepscientist/runners/codex.py +480 -35
- package/src/deepscientist/runners/codex_telemetry.py +127 -0
- package/src/deepscientist/runners/kimi.py +334 -0
- package/src/deepscientist/runners/metadata.py +68 -0
- package/src/deepscientist/runners/opencode.py +414 -0
- package/src/deepscientist/runners/runtime_overrides.py +100 -0
- package/src/deepscientist/runners/simple_cli.py +538 -0
- package/src/deepscientist/runtime_storage.py +303 -0
- package/src/deepscientist/shared.py +80 -16
- package/src/deepscientist/skills/installer.py +37 -0
- package/src/deepscientist/skills/registry.py +2 -0
- package/src/deepscientist/tinytex.py +2 -2
- package/src/deepscientist/tui.py +10 -3
- package/src/prompts/benchstore/system.md +77 -0
- package/src/prompts/connectors/qq.md +33 -2
- package/src/prompts/connectors/weixin.md +208 -23
- package/src/prompts/contracts/admin_ops.md +74 -0
- package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
- package/src/prompts/contracts/shared_interaction.md +5 -10
- package/src/prompts/start_setup/system.md +422 -0
- package/src/prompts/system.md +411 -304
- package/src/prompts/system_copilot.md +89 -0
- package/src/skills/analysis-campaign/SKILL.md +239 -578
- package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
- package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
- package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
- package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
- package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
- package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
- package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
- package/src/skills/baseline/SKILL.md +183 -461
- package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
- package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
- package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
- package/src/skills/baseline/references/baseline-plan-template.md +37 -76
- package/src/skills/baseline/references/boundary-cases.md +86 -0
- package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
- package/src/skills/baseline/references/comparability-contract.md +7 -12
- package/src/skills/baseline/references/operational-guidance.md +56 -0
- package/src/skills/baseline/references/route-selection.md +5 -25
- package/src/skills/decision/SKILL.md +113 -306
- package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
- package/src/skills/decision/references/operational-guidance.md +94 -0
- package/src/skills/decision/references/research-route-criteria.md +7 -8
- package/src/skills/decision/references/strategic-decision-template.md +13 -26
- package/src/skills/experiment/SKILL.md +132 -670
- package/src/skills/experiment/references/execution-playbook.md +374 -0
- package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
- package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
- package/src/skills/experiment/references/operational-guidance.md +108 -0
- package/src/skills/finalize/SKILL.md +62 -0
- package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
- package/src/skills/finalize/references/resume-packet-template.md +7 -0
- package/src/skills/idea/SKILL.md +228 -15
- package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
- package/src/skills/idea/references/current-board-packet-template.md +61 -0
- package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
- package/src/skills/idea/references/idea-generation-playbook.md +21 -0
- package/src/skills/idea/references/idea-thinking-flow.md +6 -0
- package/src/skills/idea/references/literature-survey-template.md +3 -0
- package/src/skills/idea/references/objective-contract-template.md +54 -0
- package/src/skills/idea/references/outline-seeding-example.md +56 -0
- package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
- package/src/skills/idea/references/related-work-playbook.md +75 -2
- package/src/skills/idea/references/research-history-playbook.md +114 -0
- package/src/skills/idea/references/selection-gate.md +58 -6
- package/src/skills/intake-audit/SKILL.md +43 -2
- package/src/skills/intake-audit/references/state-audit-template.md +10 -0
- package/src/skills/nature-data/SKILL.md +128 -0
- package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-data/agents/openai.yaml +4 -0
- package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
- package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
- package/src/skills/nature-data/references/policy-principles.md +103 -0
- package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
- package/src/skills/nature-data/references/source-basis.md +54 -0
- package/src/skills/nature-data/references/statement-patterns.md +153 -0
- package/src/skills/nature-figure/SKILL.md +197 -0
- package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-figure/agents/openai.yaml +4 -0
- package/src/skills/nature-figure/evals/evals.json +37 -0
- package/src/skills/nature-figure/references/api.md +428 -0
- package/src/skills/nature-figure/references/backend-selection.md +100 -0
- package/src/skills/nature-figure/references/chart-types.md +281 -0
- package/src/skills/nature-figure/references/common-patterns.md +349 -0
- package/src/skills/nature-figure/references/design-theory.md +436 -0
- package/src/skills/nature-figure/references/figure-contract.md +93 -0
- package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
- package/src/skills/nature-figure/references/qa-contract.md +119 -0
- package/src/skills/nature-figure/references/r-template-index.md +66 -0
- package/src/skills/nature-figure/references/r-workflow.md +161 -0
- package/src/skills/nature-figure/references/tutorials.md +250 -0
- package/src/skills/nature-paper2ppt/SKILL.md +507 -0
- package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/SKILL.md +385 -0
- package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-polishing/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
- package/src/skills/nature-polishing/references/section-moves.md +240 -0
- package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
- package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
- package/src/skills/optimize/SKILL.md +177 -1568
- package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
- package/src/skills/optimize/references/candidate-board-template.md +13 -0
- package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
- package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
- package/src/skills/optimize/references/debug-response-template.md +29 -0
- package/src/skills/optimize/references/frontier-review-template.md +32 -0
- package/src/skills/optimize/references/fusion-playbook.md +36 -0
- package/src/skills/optimize/references/method-brief-template.md +73 -0
- package/src/skills/optimize/references/operational-guidance.md +621 -0
- package/src/skills/optimize/references/optimization-memory-template.md +30 -0
- package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
- package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
- package/src/skills/optimize/references/prompt-patterns.md +49 -0
- package/src/skills/paper-outline/SKILL.md +227 -0
- package/src/skills/paper-outline/references/outline-patterns.md +87 -0
- package/src/skills/paper-plot/SKILL.md +79 -0
- package/src/skills/paper-plot/agents/openai.yaml +4 -0
- package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
- package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
- package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
- package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
- package/src/skills/paper-plot/references/line_training_curve.md +44 -0
- package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
- package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
- package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
- package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
- package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
- package/src/skills/paper-plot/scripts/line_aime.py +94 -0
- package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
- package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
- package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
- package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
- package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
- package/src/skills/rebuttal/SKILL.md +9 -0
- package/src/skills/references/tool-usage-by-stage.md +438 -0
- package/src/skills/review/SKILL.md +105 -7
- package/src/skills/science/PROVENANCE.md +44 -0
- package/src/skills/science/SKILL.md +137 -0
- package/src/skills/science/references/artifact-science-tool.md +110 -0
- package/src/skills/science/references/claim-type-discipline.md +56 -0
- package/src/skills/science/references/domain-index.md +422 -0
- package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
- package/src/skills/science/references/package-check-playbook.md +64 -0
- package/src/skills/science/references/package-index.min.json +3616 -0
- package/src/skills/science/references/packages/abinit.md +80 -0
- package/src/skills/science/references/packages/acts.md +73 -0
- package/src/skills/science/references/packages/aiida-core.md +80 -0
- package/src/skills/science/references/packages/alamode.md +80 -0
- package/src/skills/science/references/packages/amuse.md +88 -0
- package/src/skills/science/references/packages/anndata.md +88 -0
- package/src/skills/science/references/packages/arbor.md +80 -0
- package/src/skills/science/references/packages/arc.md +73 -0
- package/src/skills/science/references/packages/astropy.md +88 -0
- package/src/skills/science/references/packages/astroquery.md +88 -0
- package/src/skills/science/references/packages/atomate2.md +80 -0
- package/src/skills/science/references/packages/atomsmltr.md +73 -0
- package/src/skills/science/references/packages/awkward.md +73 -0
- package/src/skills/science/references/packages/batman.md +88 -0
- package/src/skills/science/references/packages/biopython.md +88 -0
- package/src/skills/science/references/packages/bloqade.md +73 -0
- package/src/skills/science/references/packages/brian2.md +73 -0
- package/src/skills/science/references/packages/bullet3.md +73 -0
- package/src/skills/science/references/packages/calculix.md +80 -0
- package/src/skills/science/references/packages/cantera.md +73 -0
- package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
- package/src/skills/science/references/packages/ccdproc.md +88 -0
- package/src/skills/science/references/packages/celerite2.md +88 -0
- package/src/skills/science/references/packages/cellrank.md +73 -0
- package/src/skills/science/references/packages/cesm.md +80 -0
- package/src/skills/science/references/packages/chemicals.md +73 -0
- package/src/skills/science/references/packages/chempy.md +73 -0
- package/src/skills/science/references/packages/cirq.md +73 -0
- package/src/skills/science/references/packages/coffea.md +73 -0
- package/src/skills/science/references/packages/cp2k.md +88 -0
- package/src/skills/science/references/packages/custodian.md +80 -0
- package/src/skills/science/references/packages/dart.md +73 -0
- package/src/skills/science/references/packages/datamol.md +88 -0
- package/src/skills/science/references/packages/dd4hep.md +73 -0
- package/src/skills/science/references/packages/dealii.md +80 -0
- package/src/skills/science/references/packages/deepchem.md +88 -0
- package/src/skills/science/references/packages/delphes.md +73 -0
- package/src/skills/science/references/packages/devito.md +80 -0
- package/src/skills/science/references/packages/dftb.md +88 -0
- package/src/skills/science/references/packages/dftd4.md +88 -0
- package/src/skills/science/references/packages/dftk-jl.md +80 -0
- package/src/skills/science/references/packages/dolfinx.md +80 -0
- package/src/skills/science/references/packages/drake.md +73 -0
- package/src/skills/science/references/packages/dumux.md +73 -0
- package/src/skills/science/references/packages/elk.md +80 -0
- package/src/skills/science/references/packages/elmerfem.md +80 -0
- package/src/skills/science/references/packages/enzo-e.md +88 -0
- package/src/skills/science/references/packages/espresso.md +80 -0
- package/src/skills/science/references/packages/exoplanet.md +88 -0
- package/src/skills/science/references/packages/fairroot.md +73 -0
- package/src/skills/science/references/packages/fbpic.md +80 -0
- package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
- package/src/skills/science/references/packages/geant4.md +73 -0
- package/src/skills/science/references/packages/geosx.md +80 -0
- package/src/skills/science/references/packages/gprmax.md +80 -0
- package/src/skills/science/references/packages/gromacs.md +80 -0
- package/src/skills/science/references/packages/gwaslab.md +73 -0
- package/src/skills/science/references/packages/gz-sim.md +73 -0
- package/src/skills/science/references/packages/hail.md +88 -0
- package/src/skills/science/references/packages/hiphive.md +80 -0
- package/src/skills/science/references/packages/hoomd-blue.md +80 -0
- package/src/skills/science/references/packages/itensor.md +73 -0
- package/src/skills/science/references/packages/itensors-jl.md +73 -0
- package/src/skills/science/references/packages/jdftx.md +73 -0
- package/src/skills/science/references/packages/jobflow.md +80 -0
- package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
- package/src/skills/science/references/packages/kite.md +80 -0
- package/src/skills/science/references/packages/kratos.md +80 -0
- package/src/skills/science/references/packages/kwant.md +73 -0
- package/src/skills/science/references/packages/lammps.md +80 -0
- package/src/skills/science/references/packages/lightkurve.md +88 -0
- package/src/skills/science/references/packages/limix.md +73 -0
- package/src/skills/science/references/packages/maxwelllink.md +80 -0
- package/src/skills/science/references/packages/mcdc.md +73 -0
- package/src/skills/science/references/packages/meep.md +80 -0
- package/src/skills/science/references/packages/mfem.md +80 -0
- package/src/skills/science/references/packages/mitgcm.md +73 -0
- package/src/skills/science/references/packages/modflow6.md +73 -0
- package/src/skills/science/references/packages/molecool.md +73 -0
- package/src/skills/science/references/packages/mom6.md +73 -0
- package/src/skills/science/references/packages/moose.md +80 -0
- package/src/skills/science/references/packages/mpas-model.md +73 -0
- package/src/skills/science/references/packages/mujoco.md +73 -0
- package/src/skills/science/references/packages/mumax3.md +73 -0
- package/src/skills/science/references/packages/nekrs.md +80 -0
- package/src/skills/science/references/packages/nessi.md +73 -0
- package/src/skills/science/references/packages/nest-simulator.md +73 -0
- package/src/skills/science/references/packages/netket.md +73 -0
- package/src/skills/science/references/packages/neuron.md +73 -0
- package/src/skills/science/references/packages/nextflow.md +88 -0
- package/src/skills/science/references/packages/nwchem.md +88 -0
- package/src/skills/science/references/packages/openbabel.md +88 -0
- package/src/skills/science/references/packages/openems.md +80 -0
- package/src/skills/science/references/packages/openff-toolkit.md +88 -0
- package/src/skills/science/references/packages/openfoam-dev.md +80 -0
- package/src/skills/science/references/packages/openmc.md +73 -0
- package/src/skills/science/references/packages/openmm.md +80 -0
- package/src/skills/science/references/packages/openmoc.md +73 -0
- package/src/skills/science/references/packages/openmx.md +80 -0
- package/src/skills/science/references/packages/opensees.md +80 -0
- package/src/skills/science/references/packages/opensn.md +80 -0
- package/src/skills/science/references/packages/opm-simulators.md +73 -0
- package/src/skills/science/references/packages/oqupy.md +73 -0
- package/src/skills/science/references/packages/packmol.md +80 -0
- package/src/skills/science/references/packages/palabos.md +80 -0
- package/src/skills/science/references/packages/parflow.md +80 -0
- package/src/skills/science/references/packages/pennylane.md +88 -0
- package/src/skills/science/references/packages/perceval.md +73 -0
- package/src/skills/science/references/packages/phono3py.md +73 -0
- package/src/skills/science/references/packages/phonopy.md +73 -0
- package/src/skills/science/references/packages/photutils.md +88 -0
- package/src/skills/science/references/packages/picongpu.md +80 -0
- package/src/skills/science/references/packages/plink-ng.md +88 -0
- package/src/skills/science/references/packages/precice.md +73 -0
- package/src/skills/science/references/packages/psc.md +80 -0
- package/src/skills/science/references/packages/psi4.md +88 -0
- package/src/skills/science/references/packages/pybinding.md +73 -0
- package/src/skills/science/references/packages/pyfr.md +80 -0
- package/src/skills/science/references/packages/pyhf.md +73 -0
- package/src/skills/science/references/packages/pyiron_base.md +80 -0
- package/src/skills/science/references/packages/pylcp.md +73 -0
- package/src/skills/science/references/packages/pylith.md +80 -0
- package/src/skills/science/references/packages/pynbody.md +88 -0
- package/src/skills/science/references/packages/pysam.md +88 -0
- package/src/skills/science/references/packages/pyscf.md +88 -0
- package/src/skills/science/references/packages/q-e.md +73 -0
- package/src/skills/science/references/packages/qibo.md +73 -0
- package/src/skills/science/references/packages/qiskit.md +73 -0
- package/src/skills/science/references/packages/quantica-jl.md +73 -0
- package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
- package/src/skills/science/references/packages/quimb.md +73 -0
- package/src/skills/science/references/packages/qulacs.md +73 -0
- package/src/skills/science/references/packages/qutip.md +73 -0
- package/src/skills/science/references/packages/rdkit.md +88 -0
- package/src/skills/science/references/packages/rmg-py.md +73 -0
- package/src/skills/science/references/packages/root.md +73 -0
- package/src/skills/science/references/packages/scanpy.md +88 -0
- package/src/skills/science/references/packages/scikit-allel.md +88 -0
- package/src/skills/science/references/packages/scikit-bio.md +88 -0
- package/src/skills/science/references/packages/scqubits.md +73 -0
- package/src/skills/science/references/packages/scuff-em.md +80 -0
- package/src/skills/science/references/packages/scvi-tools.md +73 -0
- package/src/skills/science/references/packages/seissol.md +73 -0
- package/src/skills/science/references/packages/sfepy.md +80 -0
- package/src/skills/science/references/packages/sisl.md +73 -0
- package/src/skills/science/references/packages/smilei.md +80 -0
- package/src/skills/science/references/packages/snakemake.md +88 -0
- package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
- package/src/skills/science/references/packages/specutils.md +88 -0
- package/src/skills/science/references/packages/spglib.md +80 -0
- package/src/skills/science/references/packages/squidpy.md +88 -0
- package/src/skills/science/references/packages/starry.md +88 -0
- package/src/skills/science/references/packages/strawberryfields.md +73 -0
- package/src/skills/science/references/packages/su2.md +80 -0
- package/src/skills/science/references/packages/sunny-jl.md +73 -0
- package/src/skills/science/references/packages/sw4.md +73 -0
- package/src/skills/science/references/packages/swift.md +88 -0
- package/src/skills/science/references/packages/tdnegf.md +73 -0
- package/src/skills/science/references/packages/tenpy.md +73 -0
- package/src/skills/science/references/packages/thermo.md +73 -0
- package/src/skills/science/references/packages/tkwant.md +73 -0
- package/src/skills/science/references/packages/tvb-root.md +73 -0
- package/src/skills/science/references/packages/uproot5.md +73 -0
- package/src/skills/science/references/packages/vampire.md +80 -0
- package/src/skills/science/references/packages/wannier_tools.md +73 -0
- package/src/skills/science/references/packages/warpx.md +80 -0
- package/src/skills/science/references/packages/wrf.md +73 -0
- package/src/skills/science/references/packages/xtb.md +88 -0
- package/src/skills/science/references/packages/yt.md +73 -0
- package/src/skills/science/references/science-task-brief-template.md +71 -0
- package/src/skills/scout/SKILL.md +83 -425
- package/src/skills/scout/references/literature-scout-template.md +5 -24
- package/src/skills/scout/references/operational-guidance.md +191 -0
- package/src/skills/scout/references/paper-triage-playbook.md +11 -35
- package/src/skills/write/SKILL.md +744 -1246
- package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
- package/src/skills/write/references/oral_package_patterns.md +252 -0
- package/src/skills/write/references/oral_writing_principles.md +291 -0
- package/src/skills/write/references/section_rewrite_checklist.md +234 -0
- package/src/tui/dist/app/AppContainer.js +1314 -27
- package/src/tui/dist/components/Composer.js +26 -1
- package/src/tui/dist/components/ConfigScreen.js +2 -1
- package/src/tui/dist/components/InputPrompt.js +25 -9
- package/src/tui/dist/components/MainContent.js +18 -3
- package/src/tui/dist/components/QuestScreen.js +3 -2
- package/src/tui/dist/components/UtilityScreen.js +37 -0
- package/src/tui/dist/hooks/useSafeInput.js +10 -0
- package/src/tui/dist/index.js +13 -1
- package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
- package/src/tui/dist/lib/api.js +89 -1
- package/src/tui/package.json +1 -1
- package/src/ui/dist/assets/{AnalysisPlugin-DnSm0GZn.js → AnalysisPlugin-CA94NGmI.js} +1 -1
- package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
- package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
- package/src/ui/dist/assets/{CodeViewerPlugin-itb0tltR.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
- package/src/ui/dist/assets/{DocViewerPlugin-DqKkiCI6.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
- package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
- package/src/ui/dist/assets/{GitDiffViewerPlugin-DxL2ezFG.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
- package/src/ui/dist/assets/{GitSnapshotViewer-B_RQm1YZ.js → GitSnapshotViewer-CweA6VON.js} +2 -2
- package/src/ui/dist/assets/{ImageViewerPlugin-tHqlXY3n.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
- package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
- package/src/ui/dist/assets/{LatexPlugin-B495DTXC.js → LatexPlugin-BQjAaA5J.js} +4 -4
- package/src/ui/dist/assets/{MarkdownViewerPlugin-DG28-61B.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
- package/src/ui/dist/assets/{MarketplacePlugin-BiOGT-Kj.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
- package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
- package/src/ui/dist/assets/{NotebookEditor-CVsj8h_T.js → NotebookEditor-WFyd8Ybt.js} +23 -23
- package/src/ui/dist/assets/{PdfLoader-CASDQmxJ.js → PdfLoader-CLE5u5TS.js} +3 -3
- package/src/ui/dist/assets/{PdfMarkdownPlugin-BFhwoKsY.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
- package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
- package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
- package/src/ui/dist/assets/{TextViewerPlugin-CB4DYfWO.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
- package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
- package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
- package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
- package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
- package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
- package/src/ui/dist/assets/{code-DLC6G24T.js → code-DbsmSd3Y.js} +1 -1
- package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
- package/src/ui/dist/assets/{wrap-text-CwMn-iqb.js → file-jump-queue-DeQBikaw.js} +3 -3
- package/src/ui/dist/assets/{file-socket-Cu4Qln7Y.js → file-socket-DA5XIx88.js} +1 -1
- package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
- package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
- package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
- package/src/ui/dist/assets/{index-wQ7RIIRd.js → index-BsO46tJA.js} +1 -1
- package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
- package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
- package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
- package/src/ui/dist/assets/{project-sync-CsX08Qno.js → project-sync-DPmWKmKD.js} +1 -1
- package/src/ui/dist/assets/{zoom-out-R-GWEhzS.js → zoom-out-DAukFWen.js} +3 -3
- package/src/ui/dist/index.html +3 -3
- package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
- package/src/skills/baseline/references/memory-playbook.md +0 -40
- package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
- package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
- package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
- package/src/skills/write/references/paper-section-playbook.md +0 -64
- package/src/skills/write/references/reviewer-first-writing.md +0 -64
- package/src/skills/write/references/revision-checklist.md +0 -70
- package/src/skills/write/references/section-contracts.md +0 -82
- package/src/skills/write/references/sentence-level-proofing.md +0 -49
- package/src/ui/dist/assets/AiManusChatView-COFACy7V.js +0 -204
- package/src/ui/dist/assets/CliPlugin-CvwCmDQ5.js +0 -109
- package/src/ui/dist/assets/CodeEditorPlugin-cOqSa0xq.js +0 -2
- package/src/ui/dist/assets/GitCommitViewerPlugin-DVgNHBCS.js +0 -1
- package/src/ui/dist/assets/LabCopilotPanel-ClMbq5Yu.js +0 -14
- package/src/ui/dist/assets/LabPlugin-L_SuE8ow.js +0 -22
- package/src/ui/dist/assets/NotebookEditor-C-4Kt1p9.js +0 -81
- package/src/ui/dist/assets/PdfViewerPlugin-DcOzU9vd.js +0 -17
- package/src/ui/dist/assets/SearchPlugin-CHj7M58O.js +0 -16
- package/src/ui/dist/assets/VNCViewer-CjlbyCB3.js +0 -11
- package/src/ui/dist/assets/bot-CFkZY-JP.js +0 -6
- package/src/ui/dist/assets/chevron-up-Dq5ofbht.js +0 -6
- package/src/ui/dist/assets/file-content-Dv4LoZec.js +0 -1
- package/src/ui/dist/assets/file-diff-panel-Denq-lC3.js +0 -1
- package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
- package/src/ui/dist/assets/git-commit-horizontal-BUh6G52n.js +0 -6
- package/src/ui/dist/assets/image-B9HUUddG.js +0 -6
- package/src/ui/dist/assets/index-B2B1sg-M.js +0 -1
- package/src/ui/dist/assets/index-Cgla8biy.css +0 -33
- package/src/ui/dist/assets/index-DRyx7vAc.js +0 -1
- package/src/ui/dist/assets/index-Gbl53BNp.js +0 -2496
- package/src/ui/dist/assets/pdf-effect-queue-ZtnHFCAi.js +0 -6
- package/src/ui/dist/assets/popover-DL6h35vr.js +0 -1
- package/src/ui/dist/assets/select-DvmXt1yY.js +0 -11
- package/src/ui/dist/assets/sigma-7jpXazui.js +0 -6
- package/src/ui/dist/assets/trash-xA7kFt8i.js +0 -11
- package/src/ui/dist/assets/useCliAccess-DsMwDjOp.js +0 -1
- package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
|
@@ -0,0 +1,169 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.007_reasoningiqa
|
|
3
|
+
name: 'RALI: Reasoning-Aligned Lightweight Image Quality Assessment'
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: Evaluate a CLIP-based lightweight IQA scorer (RALI) distilled from reasoning-heavy
|
|
6
|
+
RL-trained multimodal models on standard image quality benchmarks using PLCC, SRCC,
|
|
7
|
+
and MAE.
|
|
8
|
+
task_description: 'This benchmark evaluates RALI, a lightweight no-reference image
|
|
9
|
+
quality assessment (IQA) model that uses CLIP-based contrastive alignment to match
|
|
10
|
+
the generalization of much larger reasoning-based IQA models (e.g., Q-Insight) at
|
|
11
|
+
~4% of their parameters and inference time. The execution route loads pretrained
|
|
12
|
+
RALI checkpoints (CLIP vision encoder, PCA transform, prototype scorer), runs inference
|
|
13
|
+
on IQA benchmark datasets (KONIQ, KADID10K, SPAQ, etc.), and computes Pearson Linear
|
|
14
|
+
Correlation Coefficient (PLCC), Spearman Rank Correlation Coefficient (SRCC), and
|
|
15
|
+
Mean Absolute Error (MAE) against ground-truth subjective quality scores. The primary
|
|
16
|
+
entry point is eval_json.sh / eval_json.py, which scores images from JSON-defined
|
|
17
|
+
test splits and writes per-image predictions to a JSON log. A demo script (demo_rali_score.py)
|
|
18
|
+
provides single-image scoring. No training is required; all checkpoints are pretrained.
|
|
19
|
+
The benchmark tests whether an agent can correctly set up the environment, download
|
|
20
|
+
external checkpoints and dataset images, configure paths, and reproduce the paper''s
|
|
21
|
+
reported correlation metrics.
|
|
22
|
+
|
|
23
|
+
'
|
|
24
|
+
capability_tags:
|
|
25
|
+
- research_code_optimization
|
|
26
|
+
- computer_vision
|
|
27
|
+
- image_quality_assessment
|
|
28
|
+
- representation_learning
|
|
29
|
+
- evaluation
|
|
30
|
+
aisb_direction: T3
|
|
31
|
+
track_fit:
|
|
32
|
+
- paper_track
|
|
33
|
+
- benchmark_track
|
|
34
|
+
task_mode: experiment_driven
|
|
35
|
+
requires_execution: true
|
|
36
|
+
requires_paper: true
|
|
37
|
+
integrity_level: cas_plus_canary
|
|
38
|
+
snapshot_status: runnable
|
|
39
|
+
support_level: turnkey
|
|
40
|
+
time_band: 2-6h
|
|
41
|
+
cost_band: medium
|
|
42
|
+
difficulty: medium
|
|
43
|
+
data_access: public
|
|
44
|
+
primary_outputs:
|
|
45
|
+
- plcc
|
|
46
|
+
- srcc
|
|
47
|
+
- mae
|
|
48
|
+
launch_profiles:
|
|
49
|
+
- id: quick_check
|
|
50
|
+
label: Quick Check
|
|
51
|
+
description: 'Run demo_rali_score.py on a single bundled image to verify that the
|
|
52
|
+
checkpoint loads, PCA and prototype scorer initialize, and a quality score is
|
|
53
|
+
produced. No dataset download required.
|
|
54
|
+
|
|
55
|
+
'
|
|
56
|
+
- id: benchmark_eval
|
|
57
|
+
label: Benchmark Eval
|
|
58
|
+
description: 'Run eval_json.sh on one or more IQA benchmark test splits (e.g., KADID10K,
|
|
59
|
+
KONIQ, SPAQ). Requires downloading pretrained RALI checkpoints from HuggingFace
|
|
60
|
+
and the Data-DeQA-Score dataset images. Produces per-image prediction JSONs and
|
|
61
|
+
computes PLCC, SRCC, MAE.
|
|
62
|
+
|
|
63
|
+
'
|
|
64
|
+
dataset_download:
|
|
65
|
+
primary_method: huggingface
|
|
66
|
+
sources:
|
|
67
|
+
- kind: huggingface
|
|
68
|
+
url: https://huggingface.co/ByteDance/Q-Insight/tree/main/RALI
|
|
69
|
+
access: public
|
|
70
|
+
note: 'RALI pretrained checkpoints (ckpt.pt, pca.pkl, basis.npz, and CLIP fine-tuned
|
|
71
|
+
model under best/). Place under ./checkpoints/.
|
|
72
|
+
|
|
73
|
+
'
|
|
74
|
+
- kind: huggingface
|
|
75
|
+
url: https://huggingface.co/datasets/zhiyuanyou/Data-DeQA-Score/tree/main
|
|
76
|
+
access: public
|
|
77
|
+
note: 'IQA benchmark meta files and source images for KONIQ, KADID10K, SPAQ, and
|
|
78
|
+
others. Place under ./Data-DeQA-Score/. Image directories may total several
|
|
79
|
+
GB.
|
|
80
|
+
|
|
81
|
+
'
|
|
82
|
+
notes:
|
|
83
|
+
- Checkpoint download is ~1-2 GB. Dataset images vary by benchmark; full Data-DeQA-Score
|
|
84
|
+
may exceed 10 GB.
|
|
85
|
+
- The snapshot includes directory stubs (Data-DeQA-Score/KADID10K, Data-DeQA-Score/KONIQ)
|
|
86
|
+
but not the actual images.
|
|
87
|
+
credential_requirements:
|
|
88
|
+
mode: none
|
|
89
|
+
items: []
|
|
90
|
+
notes:
|
|
91
|
+
- All checkpoints and datasets are publicly available on HuggingFace without authentication.
|
|
92
|
+
resources:
|
|
93
|
+
minimum:
|
|
94
|
+
cpu_cores: 8
|
|
95
|
+
ram_gb: 32
|
|
96
|
+
disk_gb: 80
|
|
97
|
+
gpu_count: 1
|
|
98
|
+
gpu_vram_gb: 12
|
|
99
|
+
recommended:
|
|
100
|
+
cpu_cores: 16
|
|
101
|
+
ram_gb: 64
|
|
102
|
+
disk_gb: 150
|
|
103
|
+
gpu_count: 1
|
|
104
|
+
gpu_vram_gb: 24
|
|
105
|
+
environment:
|
|
106
|
+
python: null
|
|
107
|
+
cuda: null
|
|
108
|
+
pytorch: null
|
|
109
|
+
flash_attn: null
|
|
110
|
+
key_packages:
|
|
111
|
+
- transformers
|
|
112
|
+
- torch
|
|
113
|
+
- joblib
|
|
114
|
+
- numpy
|
|
115
|
+
- Pillow
|
|
116
|
+
- tqdm
|
|
117
|
+
notes:
|
|
118
|
+
- setup.sh installs all dependencies. See bundled README and requirements for the
|
|
119
|
+
full dependency set.
|
|
120
|
+
- Uses CLIPModel and CLIPProcessor from HuggingFace transformers.
|
|
121
|
+
- Exact Python/CUDA/PyTorch versions are not pinned; any recent compatible set should
|
|
122
|
+
work.
|
|
123
|
+
risk_flags:
|
|
124
|
+
- external_checkpoint_download
|
|
125
|
+
- external_dataset_download
|
|
126
|
+
- no_training_in_snapshot
|
|
127
|
+
risk_notes:
|
|
128
|
+
- Pretrained RALI checkpoints must be downloaded from HuggingFace (ByteDance/Q-Insight/RALI)
|
|
129
|
+
before any evaluation can run.
|
|
130
|
+
- Dataset images are not bundled; only JSON meta files and directory stubs are included.
|
|
131
|
+
Images must be fetched from Data-DeQA-Score on HuggingFace.
|
|
132
|
+
- No training code is included in the snapshot; this is inference/evaluation only.
|
|
133
|
+
- No benchmark execution was performed during the packaging pass; metric values have
|
|
134
|
+
not been verified at runtime.
|
|
135
|
+
recommended_when: 'Use this benchmark when you want a vision evaluation task with
|
|
136
|
+
pretrained checkpoints and straightforward image-benchmark execution. Good for testing
|
|
137
|
+
an agent''s ability to download external resources, configure paths, and run a self-contained
|
|
138
|
+
PyTorch inference pipeline that produces standard IQA correlation metrics.
|
|
139
|
+
|
|
140
|
+
'
|
|
141
|
+
not_recommended_when: 'Do not use this if you need a large-scale training task, a
|
|
142
|
+
video quality benchmark, or a task that exercises long-horizon multi-stage model
|
|
143
|
+
training. Also not suitable if you want a fully self-contained benchmark with no
|
|
144
|
+
external downloads.
|
|
145
|
+
|
|
146
|
+
'
|
|
147
|
+
paper:
|
|
148
|
+
title: 'Reasoning as Representation: Rethinking Visual Reinforcement Learning in
|
|
149
|
+
Image Quality Assessment'
|
|
150
|
+
venue: ICLR 2026 Oral
|
|
151
|
+
year: 2026
|
|
152
|
+
url: https://arxiv.org/abs/2510.11369
|
|
153
|
+
download:
|
|
154
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.007_reasoningiqa.zip
|
|
155
|
+
archive_type: zip
|
|
156
|
+
local_dir_name: paper-7-ReasoningIQA
|
|
157
|
+
provider: github_release
|
|
158
|
+
repo: ResearAI/DeepScientist
|
|
159
|
+
tag: aisb-v0.0.1
|
|
160
|
+
asset_name: aisb.t3.007_reasoningiqa.zip
|
|
161
|
+
sha256: 91b252c7f1616ea5b8889a80d6c6ba001c92f6b2f5db2998c133f533cdcc6bdf
|
|
162
|
+
size_bytes: 857520
|
|
163
|
+
commercial:
|
|
164
|
+
annual_fee: null
|
|
165
|
+
display:
|
|
166
|
+
palette_seed: cobalt-pearl-contrast
|
|
167
|
+
art_style: crisp-editorial
|
|
168
|
+
accent_priority: medium
|
|
169
|
+
image_path: ../image/007_aisb.t3.007_reasoningiqa.jpg
|
|
@@ -0,0 +1,133 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.007_reasoningiqa
|
|
3
|
+
name: 'RALI: 基于对齐推理的轻量级图像质量评估'
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 评估基于CLIP的轻量级IQA评分模型(RALI),该模型从推理密集型RL训练的多模态模型中蒸馏而来,在标准图像质量基准测试中使用PLCC、SRCC和MAE进行评估。
|
|
6
|
+
task_description: '本基准测试评估RALI,这是一款轻量级无参考图像质量评估(IQA)模型,采用基于CLIP的对比对齐技术,在仅使用约4%参数和推理时间的前提下,达到与大型推理驱动IQA模型(如Q-Insight)相当的泛化能力。执行路线加载预训练的RALI检查点(CLIP视觉编码器、PCA变换、原型评分器),在IQA基准数据集(KONIQ、KADID10K、SPAQ等)上进行推理,并以主观质量评分(ground truth)为参照计算皮尔逊线性相关系数(PLCC)、斯皮尔曼等级相关系数(SRCC)和平均绝对误差(MAE)。主要入口点是eval_json.sh / eval_json.py,对JSON定义的测试分割中的图像进行评分,并将每张图像的预测结果写入JSON日志。演示脚本(demo_rali_score.py)提供单图像评分功能。无需训练,所有检查点均为预训练。本基准测试检验智能体能否正确设置环境、下载外部检查点和数据集图像、配置路径,并复现论文中报告的相关性指标。
|
|
7
|
+
|
|
8
|
+
'
|
|
9
|
+
capability_tags:
|
|
10
|
+
- research_code_optimization
|
|
11
|
+
- computer_vision
|
|
12
|
+
- image_quality_assessment
|
|
13
|
+
- representation_learning
|
|
14
|
+
- evaluation
|
|
15
|
+
aisb_direction: T3
|
|
16
|
+
track_fit:
|
|
17
|
+
- paper_track
|
|
18
|
+
- benchmark_track
|
|
19
|
+
task_mode: experiment_driven
|
|
20
|
+
requires_execution: true
|
|
21
|
+
requires_paper: true
|
|
22
|
+
integrity_level: cas_plus_canary
|
|
23
|
+
snapshot_status: runnable
|
|
24
|
+
support_level: turnkey
|
|
25
|
+
time_band: 2-6h
|
|
26
|
+
cost_band: medium
|
|
27
|
+
difficulty: medium
|
|
28
|
+
data_access: public
|
|
29
|
+
primary_outputs:
|
|
30
|
+
- plcc
|
|
31
|
+
- srcc
|
|
32
|
+
- mae
|
|
33
|
+
launch_profiles:
|
|
34
|
+
- id: quick_check
|
|
35
|
+
label: 快速检查
|
|
36
|
+
description: '运行demo_rali_score.py对单个捆绑图像进行评分,验证检查点加载、PCA和原型评分器初始化,并产生质量评分。无需下载数据集。
|
|
37
|
+
|
|
38
|
+
'
|
|
39
|
+
- id: benchmark_eval
|
|
40
|
+
label: 基准评估
|
|
41
|
+
description: '在一个或多个IQA基准测试分割(如KADID10K、KONIQ、SPAQ)上运行eval_json.sh。需要从HuggingFace下载预训练的RALI检查点和Data-DeQA-Score数据集图像。生成每张图像的预测JSON,并计算PLCC、SRCC、MAE。
|
|
42
|
+
|
|
43
|
+
'
|
|
44
|
+
dataset_download:
|
|
45
|
+
primary_method: huggingface
|
|
46
|
+
sources:
|
|
47
|
+
- kind: huggingface
|
|
48
|
+
url: https://huggingface.co/ByteDance/Q-Insight/tree/main/RALI
|
|
49
|
+
access: public
|
|
50
|
+
note: 'RALI预训练检查点(ckpt.pt、pca.pkl、basis.npz以及best/下的CLIP微调模型)。放置于./checkpoints/目录下。
|
|
51
|
+
|
|
52
|
+
'
|
|
53
|
+
- kind: huggingface
|
|
54
|
+
url: https://huggingface.co/datasets/zhiyuanyou/Data-DeQA-Score/tree/main
|
|
55
|
+
access: public
|
|
56
|
+
note: 'IQA基准测试元文件和KONIQ、KADID10K、SPAQ等数据集的源图像。放置于./Data-DeQA-Score/目录下。图像目录总计可能达数GB。
|
|
57
|
+
|
|
58
|
+
'
|
|
59
|
+
notes:
|
|
60
|
+
- 检查点下载约1-2 GB。数据集图像大小因基准测试而异,完整的Data-DeQA-Score可能超过10 GB。
|
|
61
|
+
- 快照包含目录存根(Data-DeQA-Score/KADID10K、Data-DeQA-Score/KONIQ),但不包含实际图像。
|
|
62
|
+
credential_requirements:
|
|
63
|
+
mode: none
|
|
64
|
+
items: []
|
|
65
|
+
notes:
|
|
66
|
+
- 所有检查点和数据集均可通过HuggingFace公开访问,无需身份验证。
|
|
67
|
+
resources:
|
|
68
|
+
minimum:
|
|
69
|
+
cpu_cores: 8
|
|
70
|
+
ram_gb: 32
|
|
71
|
+
disk_gb: 80
|
|
72
|
+
gpu_count: 1
|
|
73
|
+
gpu_vram_gb: 12
|
|
74
|
+
recommended:
|
|
75
|
+
cpu_cores: 16
|
|
76
|
+
ram_gb: 64
|
|
77
|
+
disk_gb: 150
|
|
78
|
+
gpu_count: 1
|
|
79
|
+
gpu_vram_gb: 24
|
|
80
|
+
environment:
|
|
81
|
+
python: null
|
|
82
|
+
cuda: null
|
|
83
|
+
pytorch: null
|
|
84
|
+
flash_attn: null
|
|
85
|
+
key_packages:
|
|
86
|
+
- transformers
|
|
87
|
+
- torch
|
|
88
|
+
- joblib
|
|
89
|
+
- numpy
|
|
90
|
+
- Pillow
|
|
91
|
+
- tqdm
|
|
92
|
+
notes:
|
|
93
|
+
- setup.sh安装所有依赖项。参见捆绑的README和requirements以了解完整的依赖集合。
|
|
94
|
+
- 使用HuggingFace transformers中的CLIPModel和CLIPProcessor。
|
|
95
|
+
- 未固定精确的Python/CUDA/PyTorch版本,任何近期兼容版本组合均应可用。
|
|
96
|
+
risk_flags:
|
|
97
|
+
- external_checkpoint_download
|
|
98
|
+
- external_dataset_download
|
|
99
|
+
- no_training_in_snapshot
|
|
100
|
+
risk_notes:
|
|
101
|
+
- 必须从HuggingFace(ByteDance/Q-Insight/RALI)下载预训练的RALI检查点后才能运行任何评估。
|
|
102
|
+
- 数据集图像未捆绑,仅包含JSON元文件和目录存根。图像必须从HuggingFace上的Data-DeQA-Score获取。
|
|
103
|
+
- 快照中不包含训练代码,仅用于推理/评估。
|
|
104
|
+
- 打包过程中未执行基准测试,运行时指标值未经核实。
|
|
105
|
+
recommended_when: '当您需要一个视觉评估任务且具备预训练检查点和直接的图像基准执行时使用此基准测试。适合测试智能体下载外部资源、配置路径和运行自包含PyTorch推理管道以产生标准IQA相关性指标的能力。
|
|
106
|
+
|
|
107
|
+
'
|
|
108
|
+
not_recommended_when: '如果需要大规模训练任务、视频质量基准测试或需要长时间多阶段模型训练的任务,请勿使用。也不适合需要完全自包含且无外部下载的基准测试。
|
|
109
|
+
|
|
110
|
+
'
|
|
111
|
+
paper:
|
|
112
|
+
title: 'Reasoning as Representation: Rethinking Visual Reinforcement Learning in
|
|
113
|
+
Image Quality Assessment'
|
|
114
|
+
venue: ICLR 2026 Oral
|
|
115
|
+
year: 2026
|
|
116
|
+
url: https://arxiv.org/abs/2510.11369
|
|
117
|
+
download:
|
|
118
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.007_reasoningiqa.zip
|
|
119
|
+
archive_type: zip
|
|
120
|
+
local_dir_name: paper-7-ReasoningIQA
|
|
121
|
+
provider: github_release
|
|
122
|
+
repo: ResearAI/DeepScientist
|
|
123
|
+
tag: aisb-v0.0.1
|
|
124
|
+
asset_name: aisb.t3.007_reasoningiqa.zip
|
|
125
|
+
sha256: 91b252c7f1616ea5b8889a80d6c6ba001c92f6b2f5db2998c133f533cdcc6bdf
|
|
126
|
+
size_bytes: 857520
|
|
127
|
+
commercial:
|
|
128
|
+
annual_fee: null
|
|
129
|
+
display:
|
|
130
|
+
palette_seed: cobalt-pearl-contrast
|
|
131
|
+
art_style: crisp-editorial
|
|
132
|
+
accent_priority: medium
|
|
133
|
+
image_path: ../image/007_aisb.t3.007_reasoningiqa.jpg
|
|
@@ -0,0 +1,188 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.008_meanflows
|
|
3
|
+
name: Mean Flows for One-step Generative Modeling
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 'Train and evaluate a MeanFlow one-step generative model on CIFAR-10, measuring
|
|
6
|
+
FID-50K via a bundled evaluation script that requires a restored source tree and
|
|
7
|
+
checkpoint.
|
|
8
|
+
|
|
9
|
+
'
|
|
10
|
+
task_description: 'This benchmark covers one-step image generation using the MeanFlow
|
|
11
|
+
framework, which learns an average velocity field (as opposed to instantaneous velocity
|
|
12
|
+
in standard Flow Matching) to enable single-NFE sampling. The packaged snapshot
|
|
13
|
+
includes an evaluation script (eval_cifar10.py) and config but is missing the core
|
|
14
|
+
MeanFlow training source tree (expected at /py-meanflow/meanflow/) and the pretrained
|
|
15
|
+
checkpoint (/checkpoints/cifar10_meanflow.pth). Before any benchmark run, agents
|
|
16
|
+
must restore the upstream MeanFlow codebase (model definitions, train_arg_parser,
|
|
17
|
+
model_configs) and obtain or retrain the CIFAR-10 checkpoint. Once restored, the
|
|
18
|
+
evaluation route generates 50,000 samples with a single forward pass per image (1-NFE)
|
|
19
|
+
using an EMA network, computes FID against CIFAR-10 training images via torchmetrics
|
|
20
|
+
FrechetInceptionDistance, and reports the scalar FID score. The paper reports FID
|
|
21
|
+
3.43 on ImageNet 256×256; the CIFAR-10 route here is a smaller-scale reproduction
|
|
22
|
+
target. Training uses a JVP-based loss with stop-gradient on the target; the original
|
|
23
|
+
paper implements it in JAX, whereas the evaluation script is PyTorch. No pre-training,
|
|
24
|
+
distillation, or curriculum learning is required by the method itself. The optimization
|
|
25
|
+
goal is to minimize FID while maintaining one-step (1-NFE) generation.
|
|
26
|
+
|
|
27
|
+
'
|
|
28
|
+
capability_tags:
|
|
29
|
+
- research_code_optimization
|
|
30
|
+
- generative_modeling
|
|
31
|
+
- diffusion_models
|
|
32
|
+
- computer_vision
|
|
33
|
+
- image_generation
|
|
34
|
+
- flow_matching
|
|
35
|
+
aisb_direction: T3
|
|
36
|
+
track_fit:
|
|
37
|
+
- paper_track
|
|
38
|
+
- benchmark_track
|
|
39
|
+
task_mode: experiment_driven
|
|
40
|
+
requires_execution: true
|
|
41
|
+
requires_paper: true
|
|
42
|
+
integrity_level: cas_plus_canary
|
|
43
|
+
snapshot_status: partial
|
|
44
|
+
support_level: recovery
|
|
45
|
+
cost_band: medium
|
|
46
|
+
time_band: 6-24h
|
|
47
|
+
difficulty: hard
|
|
48
|
+
data_access: public
|
|
49
|
+
primary_outputs:
|
|
50
|
+
- fid
|
|
51
|
+
- generated_samples
|
|
52
|
+
- evaluation_log
|
|
53
|
+
launch_profiles:
|
|
54
|
+
- id: analysis_only
|
|
55
|
+
label: Analysis Only
|
|
56
|
+
description: 'Inspect the preserved eval_cifar10.py, config.yaml, and metric contract
|
|
57
|
+
without running any generation. Useful for understanding the evaluation route
|
|
58
|
+
and planning restoration of the missing source tree.
|
|
59
|
+
|
|
60
|
+
'
|
|
61
|
+
- id: restore_first
|
|
62
|
+
label: Restore First
|
|
63
|
+
description: 'Clone the upstream MeanFlow repository to provide model definitions
|
|
64
|
+
and train_arg_parser, obtain or retrain the CIFAR-10 checkpoint, then run the
|
|
65
|
+
full FID-50K evaluation pipeline via eval_cifar10.py.
|
|
66
|
+
|
|
67
|
+
'
|
|
68
|
+
- id: train_and_eval
|
|
69
|
+
label: Train and Evaluate
|
|
70
|
+
description: 'Restore the full training pipeline, train MeanFlow on CIFAR-10 from
|
|
71
|
+
scratch using the JVP-based average-velocity loss, then evaluate FID-50K. Expect
|
|
72
|
+
multi-hour training on 2× A100 GPUs.
|
|
73
|
+
|
|
74
|
+
'
|
|
75
|
+
dataset_download:
|
|
76
|
+
primary_method: torchvision
|
|
77
|
+
sources:
|
|
78
|
+
- kind: torchvision
|
|
79
|
+
url: https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz
|
|
80
|
+
access: public
|
|
81
|
+
note: 'CIFAR-10 training set (50K images, 32×32). The eval script expects pre-downloaded
|
|
82
|
+
data at /tmp/cifar10_data/cifar10_data with download=False. Use torchvision.datasets.CIFAR10(download=True)
|
|
83
|
+
to fetch automatically.
|
|
84
|
+
|
|
85
|
+
'
|
|
86
|
+
notes:
|
|
87
|
+
- CIFAR-10 is approximately 170 MB compressed, under 1 GB extracted.
|
|
88
|
+
- The pretrained checkpoint (cifar10_meanflow.pth) is not bundled and must be obtained
|
|
89
|
+
or retrained.
|
|
90
|
+
credential_requirements:
|
|
91
|
+
mode: none
|
|
92
|
+
items: []
|
|
93
|
+
notes:
|
|
94
|
+
- No API keys or credentials are needed. CIFAR-10 is freely downloadable.
|
|
95
|
+
resources:
|
|
96
|
+
minimum:
|
|
97
|
+
cpu_cores: 8
|
|
98
|
+
ram_gb: 32
|
|
99
|
+
disk_gb: 60
|
|
100
|
+
gpu_count: 2
|
|
101
|
+
gpu_vram_gb: 40
|
|
102
|
+
recommended:
|
|
103
|
+
cpu_cores: 16
|
|
104
|
+
ram_gb: 64
|
|
105
|
+
disk_gb: 120
|
|
106
|
+
gpu_count: 2
|
|
107
|
+
gpu_vram_gb: 80
|
|
108
|
+
environment:
|
|
109
|
+
python: '3.10'
|
|
110
|
+
cuda: '12.1'
|
|
111
|
+
pytorch: 2.1.0
|
|
112
|
+
flash_attn: null
|
|
113
|
+
key_packages:
|
|
114
|
+
- torchvision
|
|
115
|
+
- torchmetrics
|
|
116
|
+
- numpy
|
|
117
|
+
notes:
|
|
118
|
+
- The original paper implementation uses JAX with jax.jvp for the JVP-based training
|
|
119
|
+
loss; the bundled eval script uses PyTorch with torch.func.jvp.
|
|
120
|
+
- The local reproduction config used two A100 GPUs for FID-50K evaluation.
|
|
121
|
+
- The upstream MeanFlow source tree (model definitions, train_arg_parser, model_configs)
|
|
122
|
+
must be restored before execution.
|
|
123
|
+
- Batch size defaults to 128 for evaluation; adjust based on available VRAM.
|
|
124
|
+
risk_flags:
|
|
125
|
+
- missing_source_tree
|
|
126
|
+
- missing_checkpoint
|
|
127
|
+
- hardcoded_paths
|
|
128
|
+
- no_prior_execution
|
|
129
|
+
risk_notes:
|
|
130
|
+
- The eval script hardcodes paths to /py-meanflow/meanflow/ and /checkpoints/cifar10_meanflow.pth
|
|
131
|
+
which do not exist in the snapshot.
|
|
132
|
+
- The core MeanFlow model code (models/model_configs.py, train_arg_parser.py) is not
|
|
133
|
+
present in the local snapshot and must be sourced from the upstream repository.
|
|
134
|
+
- No benchmark execution was performed during packaging; all metric values are unverified.
|
|
135
|
+
- The README is absent from the current snapshot; rely on AGENTS.md, OPTIMIZATION.md,
|
|
136
|
+
and the paper for guidance.
|
|
137
|
+
- The training route requires JAX if following the paper's implementation, but the
|
|
138
|
+
eval route is PyTorch-based, creating a potential framework mismatch.
|
|
139
|
+
recommended_when: 'Use this benchmark when you want a compact, single-dataset image
|
|
140
|
+
generation task with a clear scalar FID target, one-step (1-NFE) sampling as the
|
|
141
|
+
core constraint, and interest in optimizing flow-based generative models without
|
|
142
|
+
distillation or curriculum learning. Good for agents that can handle code restoration
|
|
143
|
+
and dependency resolution.
|
|
144
|
+
|
|
145
|
+
'
|
|
146
|
+
not_recommended_when: 'Do not use this if you cannot provision at least two modern
|
|
147
|
+
CUDA GPUs (≥40 GB VRAM each) for sample generation and FID scoring, or if you need
|
|
148
|
+
a fully self-contained ready-to-run benchmark without any source tree restoration.
|
|
149
|
+
Also avoid if you require ImageNet-scale results, as this snapshot targets CIFAR-10
|
|
150
|
+
only.
|
|
151
|
+
|
|
152
|
+
'
|
|
153
|
+
paper:
|
|
154
|
+
title: Mean Flows for One-step Generative Modeling
|
|
155
|
+
authors:
|
|
156
|
+
- Zhengyang Geng
|
|
157
|
+
- Mingyang Deng
|
|
158
|
+
- Xingjian Bai
|
|
159
|
+
- J. Zico Kolter
|
|
160
|
+
- Kaiming He
|
|
161
|
+
affiliations:
|
|
162
|
+
- CMU
|
|
163
|
+
- MIT
|
|
164
|
+
venue: arXiv preprint
|
|
165
|
+
year: 2025
|
|
166
|
+
url: https://arxiv.org/abs/2505.13447
|
|
167
|
+
key_results:
|
|
168
|
+
- metric: FID
|
|
169
|
+
value: 3.43
|
|
170
|
+
dataset: ImageNet 256×256
|
|
171
|
+
condition: 1-NFE, trained from scratch, no distillation
|
|
172
|
+
download:
|
|
173
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.008_meanflows.zip
|
|
174
|
+
archive_type: zip
|
|
175
|
+
local_dir_name: paper-8-MeanFlows
|
|
176
|
+
provider: github_release
|
|
177
|
+
repo: ResearAI/DeepScientist
|
|
178
|
+
tag: aisb-v0.0.1
|
|
179
|
+
asset_name: aisb.t3.008_meanflows.zip
|
|
180
|
+
sha256: 3583357776f7b2d323b8a8170a88cb6559c1c90319e5b2947dc84ad1baf822e3
|
|
181
|
+
size_bytes: 100179
|
|
182
|
+
commercial:
|
|
183
|
+
annual_fee: null
|
|
184
|
+
display:
|
|
185
|
+
palette_seed: magenta-slate-ode
|
|
186
|
+
art_style: modern-lab
|
|
187
|
+
accent_priority: high
|
|
188
|
+
image_path: ../image/008_aisb.t3.008_meanflows.jpg
|
|
@@ -0,0 +1,140 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.008_meanflows
|
|
3
|
+
name: 用于一步生成建模的均值流
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 在 CIFAR-10 上训练并评估 MeanFlow 一步生成模型,通过捆绑的评估脚本测量 FID-50K,该脚本需要恢复源代码树和检查点。
|
|
6
|
+
|
|
7
|
+
task_description: 本基准测试涵盖使用 MeanFlow 框架进行的一步图像生成,该框架学习平均速度场(而非标准流匹配中的瞬时速度),以实现单次 NFE 采样。打包的快照包含评估脚本(eval_cifar10.py)和配置文件,但缺少核心 MeanFlow 训练源代码树(位于 /py-meanflow/meanflow/)和预训练检查点(/checkpoints/cifar10_meanflow.pth)。在任何基准测试运行之前,智能体必须恢复上游 MeanFlow 代码库(模型定义、train_arg_parser、model_configs)并获取或重新训练 CIFAR-10 检查点。恢复后,评估路线使用 EMA 网络通过单次前向传递(1-NFE)生成 50,000 个样本,通过 torchmetrics FrechetInceptionDistance 计算相对于 CIFAR-10 训练图像的 FID,并报告标量 FID 分数。论文报告 ImageNet 256×256 上 FID 为 3.43;此处 CIFAR-10 路线是较小规模的复现目标。训练使用基于 JVP 的损失函数和对目标的停止梯度,原始论文使用 JAX 实现,但评估脚本使用 PyTorch。该方法本身不需要预训练、蒸馏或课程学习。优化目标是在保持一步(1-NFE)生成的同时最小化 FID。
|
|
8
|
+
|
|
9
|
+
capability_tags:
|
|
10
|
+
- research_code_optimization
|
|
11
|
+
- generative_modeling
|
|
12
|
+
- diffusion_models
|
|
13
|
+
- computer_vision
|
|
14
|
+
- image_generation
|
|
15
|
+
- flow_matching
|
|
16
|
+
aisb_direction: T3
|
|
17
|
+
track_fit:
|
|
18
|
+
- paper_track
|
|
19
|
+
- benchmark_track
|
|
20
|
+
task_mode: experiment_driven
|
|
21
|
+
requires_execution: true
|
|
22
|
+
requires_paper: true
|
|
23
|
+
integrity_level: cas_plus_canary
|
|
24
|
+
snapshot_status: partial
|
|
25
|
+
support_level: recovery
|
|
26
|
+
cost_band: medium
|
|
27
|
+
time_band: 6-24h
|
|
28
|
+
difficulty: hard
|
|
29
|
+
data_access: public
|
|
30
|
+
primary_outputs:
|
|
31
|
+
- fid
|
|
32
|
+
- generated_samples
|
|
33
|
+
- evaluation_log
|
|
34
|
+
launch_profiles:
|
|
35
|
+
- id: analysis_only
|
|
36
|
+
label: 仅分析
|
|
37
|
+
description: 检查保存的 eval_cifar10.py、config.yaml 和指标合约,无需运行任何生成过程。用于理解评估路线并规划恢复缺失的源代码树。
|
|
38
|
+
|
|
39
|
+
- id: restore_first
|
|
40
|
+
label: 先恢复
|
|
41
|
+
description: 克隆上游 MeanFlow 仓库以提供模型定义和 train_arg_parser,获取或重新训练 CIFAR-10 检查点,然后通过 eval_cifar10.py 运行完整的 FID-50K 评估流程。
|
|
42
|
+
|
|
43
|
+
- id: train_and_eval
|
|
44
|
+
label: 训练并评估
|
|
45
|
+
description: 恢复完整的训练流程,使用基于 JVP 的平均速度损失从头开始在 CIFAR-10 上训练 MeanFlow,然后评估 FID-50K。预计在 2× A100 GPU 上需要数小时训练。
|
|
46
|
+
|
|
47
|
+
dataset_download:
|
|
48
|
+
primary_method: torchvision
|
|
49
|
+
sources:
|
|
50
|
+
- kind: torchvision
|
|
51
|
+
url: https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz
|
|
52
|
+
access: public
|
|
53
|
+
note: CIFAR-10 训练集(50K 张图像,32×32)。评估脚本期望在 /tmp/cifar10_data/cifar10_data 处有预下载的数据,download=False。使用 torchvision.datasets.CIFAR10(download=True) 自动获取。
|
|
54
|
+
|
|
55
|
+
notes:
|
|
56
|
+
- CIFAR-10 压缩后约 170 MB,解压后不到 1 GB。
|
|
57
|
+
- 预训练检查点(cifar10_meanflow.pth)未捆绑,必须获取或重新训练。
|
|
58
|
+
credential_requirements:
|
|
59
|
+
mode: none
|
|
60
|
+
items: []
|
|
61
|
+
notes:
|
|
62
|
+
- 无需 API 密钥或凭证。CIFAR-10 可免费下载。
|
|
63
|
+
resources:
|
|
64
|
+
minimum:
|
|
65
|
+
cpu_cores: 8
|
|
66
|
+
ram_gb: 32
|
|
67
|
+
disk_gb: 60
|
|
68
|
+
gpu_count: 2
|
|
69
|
+
gpu_vram_gb: 40
|
|
70
|
+
recommended:
|
|
71
|
+
cpu_cores: 16
|
|
72
|
+
ram_gb: 64
|
|
73
|
+
disk_gb: 120
|
|
74
|
+
gpu_count: 2
|
|
75
|
+
gpu_vram_gb: 80
|
|
76
|
+
environment:
|
|
77
|
+
python: '3.10'
|
|
78
|
+
cuda: '12.1'
|
|
79
|
+
pytorch: 2.1.0
|
|
80
|
+
flash_attn: null
|
|
81
|
+
key_packages:
|
|
82
|
+
- torchvision
|
|
83
|
+
- torchmetrics
|
|
84
|
+
- numpy
|
|
85
|
+
notes:
|
|
86
|
+
- 原始论文实现使用 JAX 和 jax.jvp 进行基于 JVP 的训练损失;捆绑的评估脚本使用 PyTorch 和 torch.func.jvp。
|
|
87
|
+
- 本地复现配置使用两枚 A100 GPU 进行 FID-50K 评估。
|
|
88
|
+
- 上游 MeanFlow 源代码树(模型定义、train_arg_parser、model_configs)必须在执行前恢复。
|
|
89
|
+
- 评估时的默认批量大小为 128;请根据可用 VRAM 进行调整。
|
|
90
|
+
risk_flags:
|
|
91
|
+
- missing_source_tree
|
|
92
|
+
- missing_checkpoint
|
|
93
|
+
- hardcoded_paths
|
|
94
|
+
- no_prior_execution
|
|
95
|
+
risk_notes:
|
|
96
|
+
- 评估脚本硬编码了 /py-meanflow/meanflow/ 和 /checkpoints/cifar10_meanflow.pth 的路径,这些路径在快照中不存在。
|
|
97
|
+
- 核心 MeanFlow 模型代码(models/model_configs.py、train_arg_parser.py)未出现在本地快照中,必须从上游仓库获取。
|
|
98
|
+
- 打包期间未执行任何基准测试;所有指标值均未验证。
|
|
99
|
+
- 当前快照中没有 README;请参考 AGENTS.md、OPTIMIZATION.md 和论文。
|
|
100
|
+
- 如果遵循论文的实现,训练路线需要 JAX,但评估路线基于 PyTorch,可能存在框架不匹配。
|
|
101
|
+
recommended_when: 当您需要一个紧凑的、单数据集的图像生成任务,具有明确的标量 FID 目标、一步(1-NFE)采样作为核心约束,并对优化基于流的生成模型(无需蒸馏或课程学习)感兴趣时,可使用此基准测试。适合能够处理代码恢复和依赖项解析的智能体。
|
|
102
|
+
|
|
103
|
+
not_recommended_when: 如果无法为样本生成和 FID 评分配置至少两枚现代 CUDA GPU(每枚 ≥40 GB VRAM),或者需要一个完全自包含的、随时可运行的基准测试而无需任何源代码树恢复,请勿使用。如果需要 ImageNet 规模的结果,也应避免,因为此快照仅针对 CIFAR-10。
|
|
104
|
+
|
|
105
|
+
paper:
|
|
106
|
+
title: Mean Flows for One-step Generative Modeling
|
|
107
|
+
authors:
|
|
108
|
+
- Zhengyang Geng
|
|
109
|
+
- Mingyang Deng
|
|
110
|
+
- Xingjian Bai
|
|
111
|
+
- J. Zico Kolter
|
|
112
|
+
- Kaiming He
|
|
113
|
+
affiliations:
|
|
114
|
+
- CMU
|
|
115
|
+
- MIT
|
|
116
|
+
venue: arXiv preprint
|
|
117
|
+
year: 2025
|
|
118
|
+
url: https://arxiv.org/abs/2505.13447
|
|
119
|
+
key_results:
|
|
120
|
+
- metric: FID
|
|
121
|
+
value: 3.43
|
|
122
|
+
dataset: ImageNet 256×256
|
|
123
|
+
condition: 1-NFE, 从头训练, 无蒸馏
|
|
124
|
+
download:
|
|
125
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.008_meanflows.zip
|
|
126
|
+
archive_type: zip
|
|
127
|
+
local_dir_name: paper-8-MeanFlows
|
|
128
|
+
provider: github_release
|
|
129
|
+
repo: ResearAI/DeepScientist
|
|
130
|
+
tag: aisb-v0.0.1
|
|
131
|
+
asset_name: aisb.t3.008_meanflows.zip
|
|
132
|
+
sha256: 3583357776f7b2d323b8a8170a88cb6559c1c90319e5b2947dc84ad1baf822e3
|
|
133
|
+
size_bytes: 100179
|
|
134
|
+
commercial:
|
|
135
|
+
annual_fee: null
|
|
136
|
+
display:
|
|
137
|
+
palette_seed: magenta-slate-ode
|
|
138
|
+
art_style: modern-lab
|
|
139
|
+
accent_priority: high
|
|
140
|
+
image_path: ../image/008_aisb.t3.008_meanflows.jpg
|