@researai/deepscientist 1.5.16 → 1.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +309 -130
- package/AISB/catalog/aisb.b1.agentic_coding.yaml +244 -0
- package/AISB/catalog/aisb.b10.climate_earth.yaml +235 -0
- package/AISB/catalog/aisb.b11.model_efficiency.yaml +231 -0
- package/AISB/catalog/aisb.b12.embodied_ai.yaml +238 -0
- package/AISB/catalog/aisb.b2.agent_systems.yaml +229 -0
- package/AISB/catalog/aisb.b3.self_evolving_rl.yaml +237 -0
- package/AISB/catalog/aisb.b4.lm_reasoning.yaml +240 -0
- package/AISB/catalog/aisb.b5.math_proof.yaml +235 -0
- package/AISB/catalog/aisb.b6.research_process.yaml +243 -0
- package/AISB/catalog/aisb.b7.multimodal_fusion.yaml +232 -0
- package/AISB/catalog/aisb.b8.lifesci_drug.yaml +275 -0
- package/AISB/catalog/aisb.b9.material_science.yaml +237 -0
- package/AISB/catalog/aisb.t3.001_savvy.yaml +159 -0
- package/AISB/catalog/aisb.t3.001_savvy.zh.yaml +121 -0
- package/AISB/catalog/aisb.t3.002_pinet.yaml +189 -0
- package/AISB/catalog/aisb.t3.002_pinet.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.yaml +184 -0
- package/AISB/catalog/aisb.t3.004_decentralattn.zh.yaml +153 -0
- package/AISB/catalog/aisb.t3.005_tsae.yaml +193 -0
- package/AISB/catalog/aisb.t3.005_tsae.zh.yaml +139 -0
- package/AISB/catalog/aisb.t3.006_physense.yaml +194 -0
- package/AISB/catalog/aisb.t3.006_physense.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.yaml +169 -0
- package/AISB/catalog/aisb.t3.007_reasoningiqa.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.008_meanflows.yaml +188 -0
- package/AISB/catalog/aisb.t3.008_meanflows.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.yaml +179 -0
- package/AISB/catalog/aisb.t3.009_scoremissing.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.yaml +221 -0
- package/AISB/catalog/aisb.t3.010_suitabilityfilter.zh.yaml +141 -0
- package/AISB/catalog/aisb.t3.011_osd.yaml +206 -0
- package/AISB/catalog/aisb.t3.011_osd.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.yaml +206 -0
- package/AISB/catalog/aisb.t3.012_efficientqat.zh.yaml +159 -0
- package/AISB/catalog/aisb.t3.013_appl.yaml +152 -0
- package/AISB/catalog/aisb.t3.013_appl.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.014_piguard.yaml +207 -0
- package/AISB/catalog/aisb.t3.014_piguard.zh.yaml +164 -0
- package/AISB/catalog/aisb.t3.015_frspec.yaml +209 -0
- package/AISB/catalog/aisb.t3.015_frspec.zh.yaml +163 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.yaml +166 -0
- package/AISB/catalog/aisb.t3.016_mathfusion.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.yaml +171 -0
- package/AISB/catalog/aisb.t3.017_multimodalglp.zh.yaml +122 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.yaml +206 -0
- package/AISB/catalog/aisb.t3.018_cotsynth.zh.yaml +162 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.yaml +211 -0
- package/AISB/catalog/aisb.t3.019_dyscaleut.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.020_aristotle.yaml +173 -0
- package/AISB/catalog/aisb.t3.020_aristotle.zh.yaml +119 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.yaml +160 -0
- package/AISB/catalog/aisb.t3.021_tokenrecycling.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.yaml +204 -0
- package/AISB/catalog/aisb.t3.022_chainofreasoning.zh.yaml +161 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.yaml +211 -0
- package/AISB/catalog/aisb.t3.023_guidedembed.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.yaml +148 -0
- package/AISB/catalog/aisb.t3.024_outputcentric.zh.yaml +131 -0
- package/AISB/catalog/aisb.t3.025_deeper.yaml +143 -0
- package/AISB/catalog/aisb.t3.025_deeper.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.026_gartkg.yaml +195 -0
- package/AISB/catalog/aisb.t3.026_gartkg.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.027_citeeval.yaml +182 -0
- package/AISB/catalog/aisb.t3.027_citeeval.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.028_sbam.yaml +206 -0
- package/AISB/catalog/aisb.t3.028_sbam.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.yaml +224 -0
- package/AISB/catalog/aisb.t3.029_cdqgeoembed.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.030_processrm.yaml +211 -0
- package/AISB/catalog/aisb.t3.030_processrm.zh.yaml +166 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.yaml +172 -0
- package/AISB/catalog/aisb.t3.031_circuitstability.zh.yaml +134 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.yaml +169 -0
- package/AISB/catalog/aisb.t3.032_ptsolver.zh.yaml +135 -0
- package/AISB/catalog/aisb.t3.033_gcse.yaml +144 -0
- package/AISB/catalog/aisb.t3.033_gcse.zh.yaml +126 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.yaml +183 -0
- package/AISB/catalog/aisb.t3.034_ensemblewm.zh.yaml +146 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.yaml +207 -0
- package/AISB/catalog/aisb.t3.035_moralvalueswa.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.yaml +210 -0
- package/AISB/catalog/aisb.t3.036_weakstrongpref.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.yaml +172 -0
- package/AISB/catalog/aisb.t3.037_dementiamask.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.038_tinysam.yaml +284 -0
- package/AISB/catalog/aisb.t3.038_tinysam.zh.yaml +240 -0
- package/AISB/catalog/aisb.t3.039_calf.yaml +224 -0
- package/AISB/catalog/aisb.t3.039_calf.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.yaml +199 -0
- package/AISB/catalog/aisb.t3.040_graniteguardian.zh.yaml +174 -0
- package/AISB/catalog/aisb.t3.041_amdm.yaml +149 -0
- package/AISB/catalog/aisb.t3.041_amdm.zh.yaml +137 -0
- package/AISB/catalog/aisb.t3.042_xpatch.yaml +216 -0
- package/AISB/catalog/aisb.t3.042_xpatch.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.043_vhm.yaml +268 -0
- package/AISB/catalog/aisb.t3.043_vhm.zh.yaml +193 -0
- package/AISB/catalog/aisb.t3.044_rgvi.yaml +224 -0
- package/AISB/catalog/aisb.t3.044_rgvi.zh.yaml +176 -0
- package/AISB/catalog/aisb.t3.045_pslstm.yaml +203 -0
- package/AISB/catalog/aisb.t3.045_pslstm.zh.yaml +179 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.yaml +208 -0
- package/AISB/catalog/aisb.t3.046_nonstatts.zh.yaml +194 -0
- package/AISB/catalog/aisb.t3.047_timepfn.yaml +156 -0
- package/AISB/catalog/aisb.t3.047_timepfn.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.yaml +148 -0
- package/AISB/catalog/aisb.t3.048_proxyspex.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.yaml +183 -0
- package/AISB/catalog/aisb.t3.049_hogwildinference.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.yaml +214 -0
- package/AISB/catalog/aisb.t3.050_causalpfn.zh.yaml +190 -0
- package/AISB/catalog/aisb.t3.051_flashtp.yaml +169 -0
- package/AISB/catalog/aisb.t3.051_flashtp.zh.yaml +124 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.yaml +155 -0
- package/AISB/catalog/aisb.t3.052_nsdiff.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.053_k2vae.yaml +158 -0
- package/AISB/catalog/aisb.t3.053_k2vae.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.054_timebase.yaml +178 -0
- package/AISB/catalog/aisb.t3.054_timebase.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.055_csbrain.yaml +238 -0
- package/AISB/catalog/aisb.t3.055_csbrain.zh.yaml +184 -0
- package/AISB/catalog/aisb.t3.056_infosam.yaml +224 -0
- package/AISB/catalog/aisb.t3.056_infosam.zh.yaml +189 -0
- package/AISB/catalog/aisb.t3.057_mdreid.yaml +129 -0
- package/AISB/catalog/aisb.t3.057_mdreid.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.yaml +171 -0
- package/AISB/catalog/aisb.t3.058_mindglitch.zh.yaml +145 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.yaml +154 -0
- package/AISB/catalog/aisb.t3.059_selfsupervised.zh.yaml +125 -0
- package/AISB/catalog/aisb.t3.060_iaggad.yaml +121 -0
- package/AISB/catalog/aisb.t3.060_iaggad.zh.yaml +100 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.yaml +136 -0
- package/AISB/catalog/aisb.t3.061_hsgkn.zh.yaml +113 -0
- package/AISB/catalog/aisb.t3.062_visionts.yaml +237 -0
- package/AISB/catalog/aisb.t3.062_visionts.zh.yaml +216 -0
- package/AISB/catalog/aisb.t3.063_tsrag.yaml +162 -0
- package/AISB/catalog/aisb.t3.063_tsrag.zh.yaml +138 -0
- package/AISB/catalog/aisb.t3.064_pir.yaml +221 -0
- package/AISB/catalog/aisb.t3.064_pir.zh.yaml +197 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.yaml +234 -0
- package/AISB/catalog/aisb.t3.065_proteinbinding.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.yaml +267 -0
- package/AISB/catalog/aisb.t3.066_tropicalattention.zh.yaml +229 -0
- package/AISB/catalog/aisb.t3.067_kanad.yaml +193 -0
- package/AISB/catalog/aisb.t3.067_kanad.zh.yaml +167 -0
- package/AISB/catalog/aisb.t3.068_sempo.yaml +187 -0
- package/AISB/catalog/aisb.t3.068_sempo.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.069_treehfd.yaml +129 -0
- package/AISB/catalog/aisb.t3.069_treehfd.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.yaml +224 -0
- package/AISB/catalog/aisb.t3.070_certifiedunlearning.zh.yaml +171 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.yaml +142 -0
- package/AISB/catalog/aisb.t3.071_neuralmjd.zh.yaml +120 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.yaml +181 -0
- package/AISB/catalog/aisb.t3.072_fedgmt.zh.yaml +158 -0
- package/AISB/catalog/aisb.t3.073_rld.yaml +161 -0
- package/AISB/catalog/aisb.t3.073_rld.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.074_lsvi.yaml +163 -0
- package/AISB/catalog/aisb.t3.074_lsvi.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.yaml +201 -0
- package/AISB/catalog/aisb.t3.075_treeslicedentropy.zh.yaml +148 -0
- package/AISB/catalog/aisb.t3.076_aanet.yaml +169 -0
- package/AISB/catalog/aisb.t3.076_aanet.zh.yaml +129 -0
- package/AISB/catalog/aisb.t3.077_cmnn.yaml +199 -0
- package/AISB/catalog/aisb.t3.077_cmnn.zh.yaml +165 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.yaml +146 -0
- package/AISB/catalog/aisb.t3.078_conformalanomaly.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.yaml +131 -0
- package/AISB/catalog/aisb.t3.079_dpfkmeans.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.yaml +169 -0
- package/AISB/catalog/aisb.t3.080_latentscorereweight.zh.yaml +123 -0
- package/AISB/catalog/aisb.t3.081_qmamba.yaml +150 -0
- package/AISB/catalog/aisb.t3.081_qmamba.zh.yaml +117 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.yaml +160 -0
- package/AISB/catalog/aisb.t3.082_onlinellmrouting.zh.yaml +133 -0
- package/AISB/catalog/aisb.t3.083_starformer.yaml +178 -0
- package/AISB/catalog/aisb.t3.083_starformer.zh.yaml +140 -0
- package/AISB/catalog/aisb.t3.084_ift.yaml +139 -0
- package/AISB/catalog/aisb.t3.084_ift.zh.yaml +111 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.yaml +183 -0
- package/AISB/catalog/aisb.t3.085_neuralsurv.zh.yaml +143 -0
- package/AISB/catalog/aisb.t3.086_stella.yaml +197 -0
- package/AISB/catalog/aisb.t3.086_stella.zh.yaml +142 -0
- package/AISB/catalog/aisb.t3.087_moses.yaml +167 -0
- package/AISB/catalog/aisb.t3.087_moses.zh.yaml +132 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.yaml +140 -0
- package/AISB/catalog/aisb.t3.088_channelnorm.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.yaml +730 -0
- package/AISB/catalog/aisb.t3.089_causalvelocity.zh.yaml +668 -0
- package/AISB/catalog/aisb.t3.090_rstib.yaml +144 -0
- package/AISB/catalog/aisb.t3.090_rstib.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.yaml +132 -0
- package/AISB/catalog/aisb.t3.091_timeawarecausal.zh.yaml +107 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.yaml +138 -0
- package/AISB/catalog/aisb.t3.092_kmeanslocalopt.zh.yaml +110 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.yaml +134 -0
- package/AISB/catalog/aisb.t3.093_fedwmsam.zh.yaml +106 -0
- package/AISB/catalog/aisb.t3.094_boundre.yaml +147 -0
- package/AISB/catalog/aisb.t3.094_boundre.zh.yaml +114 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.yaml +153 -0
- package/AISB/catalog/aisb.t3.095_fastfeaturecp.zh.yaml +118 -0
- package/AISB/catalog/aisb.t3.096_m3svm.yaml +189 -0
- package/AISB/catalog/aisb.t3.096_m3svm.zh.yaml +149 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.yaml +212 -0
- package/AISB/catalog/aisb.t3.097_wassersteintl.zh.yaml +169 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.yaml +171 -0
- package/AISB/catalog/aisb.t3.098_xmahalanobis.zh.yaml +127 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.yaml +248 -0
- package/AISB/catalog/aisb.t3.099_ollalanding.zh.yaml +182 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.yaml +179 -0
- package/AISB/catalog/aisb.t3.100_invmissingdata.zh.yaml +150 -0
- package/AISB/catalog/aisb.t3.101_acia.yaml +164 -0
- package/AISB/catalog/aisb.t3.101_acia.zh.yaml +109 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.yaml +178 -0
- package/AISB/catalog/aisb.t3.102_stochasticff.zh.yaml +130 -0
- package/AISB/catalog/aisb.t3.103_qdcp.yaml +150 -0
- package/AISB/catalog/aisb.t3.103_qdcp.zh.yaml +116 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.yaml +137 -0
- package/AISB/catalog/aisb.t3.104_balancedactiveinf.zh.yaml +104 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.yaml +161 -0
- package/AISB/catalog/aisb.t3.105_binaryclasseval.zh.yaml +130 -0
- package/AISB/image/001_aisb.t3.001_savvy.jpg +0 -0
- package/AISB/image/002_aisb.t3.002_pinet.jpg +0 -0
- package/AISB/image/003_aisb.t3.003_dmsqd.jpg +0 -0
- package/AISB/image/004_aisb.t3.004_decentralattn.jpg +0 -0
- package/AISB/image/005_aisb.t3.005_tsae.jpg +0 -0
- package/AISB/image/006_aisb.t3.006_physense.jpg +0 -0
- package/AISB/image/007_aisb.t3.007_reasoningiqa.jpg +0 -0
- package/AISB/image/008_aisb.t3.008_meanflows.jpg +0 -0
- package/AISB/image/009_aisb.t3.009_scoremissing.jpg +0 -0
- package/AISB/image/010_aisb.t3.010_suitabilityfilter.jpg +0 -0
- package/AISB/image/011_aisb.t3.011_osd.jpg +0 -0
- package/AISB/image/012_aisb.t3.012_efficientqat.jpg +0 -0
- package/AISB/image/013_aisb.t3.013_appl.jpg +0 -0
- package/AISB/image/014_aisb.t3.014_piguard.jpg +0 -0
- package/AISB/image/015_aisb.t3.015_frspec.jpg +0 -0
- package/AISB/image/016_aisb.t3.016_mathfusion.jpg +0 -0
- package/AISB/image/017_aisb.t3.017_multimodalglp.jpg +0 -0
- package/AISB/image/018_aisb.t3.018_cotsynth.jpg +0 -0
- package/AISB/image/019_aisb.t3.019_dyscaleut.jpg +0 -0
- package/AISB/image/020_aisb.t3.020_aristotle.jpg +0 -0
- package/AISB/image/021_aisb.t3.021_tokenrecycling.jpg +0 -0
- package/AISB/image/022_aisb.t3.022_chainofreasoning.jpg +0 -0
- package/AISB/image/023_aisb.t3.023_guidedembed.jpg +0 -0
- package/AISB/image/024_aisb.t3.024_outputcentric.jpg +0 -0
- package/AISB/image/025_aisb.t3.025_deeper.jpg +0 -0
- package/AISB/image/026_aisb.t3.026_gartkg.jpg +0 -0
- package/AISB/image/027_aisb.t3.027_citeeval.jpg +0 -0
- package/AISB/image/028_aisb.t3.028_sbam.jpg +0 -0
- package/AISB/image/029_aisb.t3.029_cdqgeoembed.jpg +0 -0
- package/AISB/image/030_aisb.t3.030_processrm.jpg +0 -0
- package/AISB/image/031_aisb.t3.031_circuitstability.jpg +0 -0
- package/AISB/image/032_aisb.t3.032_ptsolver.jpg +0 -0
- package/AISB/image/033_aisb.t3.033_gcse.jpg +0 -0
- package/AISB/image/034_aisb.t3.034_ensemblewm.jpg +0 -0
- package/AISB/image/035_aisb.t3.035_moralvalueswa.jpg +0 -0
- package/AISB/image/036_aisb.t3.036_weakstrongpref.jpg +0 -0
- package/AISB/image/037_aisb.t3.037_dementiamask.jpg +0 -0
- package/AISB/image/038_aisb.t3.038_tinysam.jpg +0 -0
- package/AISB/image/039_aisb.t3.039_calf.jpg +0 -0
- package/AISB/image/040_aisb.t3.040_graniteguardian.jpg +0 -0
- package/AISB/image/041_aisb.t3.041_amdm.jpg +0 -0
- package/AISB/image/042_aisb.t3.042_xpatch.jpg +0 -0
- package/AISB/image/043_aisb.t3.043_vhm.jpg +0 -0
- package/AISB/image/044_aisb.t3.044_rgvi.jpg +0 -0
- package/AISB/image/045_aisb.t3.045_pslstm.jpg +0 -0
- package/AISB/image/046_aisb.t3.046_nonstatts.jpg +0 -0
- package/AISB/image/047_aisb.t3.047_timepfn.jpg +0 -0
- package/AISB/image/048_aisb.t3.048_proxyspex.jpg +0 -0
- package/AISB/image/049_aisb.t3.049_hogwildinference.jpg +0 -0
- package/AISB/image/050_aisb.t3.050_causalpfn.jpg +0 -0
- package/AISB/image/051_aisb.t3.051_flashtp.jpg +0 -0
- package/AISB/image/052_aisb.t3.052_nsdiff.jpg +0 -0
- package/AISB/image/053_aisb.t3.053_k2vae.jpg +0 -0
- package/AISB/image/054_aisb.t3.054_timebase.jpg +0 -0
- package/AISB/image/055_aisb.t3.055_csbrain.jpg +0 -0
- package/AISB/image/056_aisb.t3.056_infosam.jpg +0 -0
- package/AISB/image/057_aisb.t3.057_mdreid.jpg +0 -0
- package/AISB/image/058_aisb.t3.058_mindglitch.jpg +0 -0
- package/AISB/image/059_aisb.t3.059_selfsupervised.jpg +0 -0
- package/AISB/image/060_aisb.t3.060_iaggad.jpg +0 -0
- package/AISB/image/061_aisb.t3.061_hsgkn.jpg +0 -0
- package/AISB/image/062_aisb.t3.062_visionts.jpg +0 -0
- package/AISB/image/063_aisb.t3.063_tsrag.jpg +0 -0
- package/AISB/image/064_aisb.t3.064_pir.jpg +0 -0
- package/AISB/image/065_aisb.t3.065_proteinbinding.jpg +0 -0
- package/AISB/image/066_aisb.t3.066_tropicalattention.jpg +0 -0
- package/AISB/image/067_aisb.t3.067_kanad.jpg +0 -0
- package/AISB/image/068_aisb.t3.068_sempo.jpg +0 -0
- package/AISB/image/069_aisb.t3.069_treehfd.jpg +0 -0
- package/AISB/image/070_aisb.t3.070_certifiedunlearning.jpg +0 -0
- package/AISB/image/071_aisb.t3.071_neuralmjd.jpg +0 -0
- package/AISB/image/072_aisb.t3.072_fedgmt.jpg +0 -0
- package/AISB/image/073_aisb.t3.073_rld.jpg +0 -0
- package/AISB/image/074_aisb.t3.074_lsvi.jpg +0 -0
- package/AISB/image/075_aisb.t3.075_treeslicedentropy.jpg +0 -0
- package/AISB/image/076_aisb.t3.076_aanet.jpg +0 -0
- package/AISB/image/077_aisb.t3.077_cmnn.jpg +0 -0
- package/AISB/image/078_aisb.t3.078_conformalanomaly.jpg +0 -0
- package/AISB/image/079_aisb.t3.079_dpfkmeans.jpg +0 -0
- package/AISB/image/080_aisb.t3.080_latentscorereweight.jpg +0 -0
- package/AISB/image/081_aisb.t3.081_qmamba.jpg +0 -0
- package/AISB/image/082_aisb.t3.082_onlinellmrouting.jpg +0 -0
- package/AISB/image/083_aisb.t3.083_starformer.jpg +0 -0
- package/AISB/image/084_aisb.t3.084_ift.jpg +0 -0
- package/AISB/image/085_aisb.t3.085_neuralsurv.jpg +0 -0
- package/AISB/image/086_aisb.t3.086_stella.jpg +0 -0
- package/AISB/image/087_aisb.t3.087_moses.jpg +0 -0
- package/AISB/image/088_aisb.t3.088_channelnorm.jpg +0 -0
- package/AISB/image/089_aisb.t3.089_causalvelocity.jpg +0 -0
- package/AISB/image/090_aisb.t3.090_rstib.jpg +0 -0
- package/AISB/image/091_aisb.t3.091_timeawarecausal.jpg +0 -0
- package/AISB/image/092_aisb.t3.092_kmeanslocalopt.jpg +0 -0
- package/AISB/image/093_aisb.t3.093_fedwmsam.jpg +0 -0
- package/AISB/image/094_aisb.t3.094_boundre.jpg +0 -0
- package/AISB/image/095_aisb.t3.095_fastfeaturecp.jpg +0 -0
- package/AISB/image/096_aisb.t3.096_m3svm.jpg +0 -0
- package/AISB/image/097_aisb.t3.097_wassersteintl.jpg +0 -0
- package/AISB/image/098_aisb.t3.098_xmahalanobis.jpg +0 -0
- package/AISB/image/099_aisb.t3.099_ollalanding.jpg +0 -0
- package/AISB/image/100_aisb.t3.100_invmissingdata.jpg +0 -0
- package/AISB/image/101_aisb.t3.101_acia.jpg +0 -0
- package/AISB/image/102_aisb.t3.102_stochasticff.jpg +0 -0
- package/AISB/image/103_aisb.t3.103_qdcp.jpg +0 -0
- package/AISB/image/104_aisb.t3.104_balancedactiveinf.jpg +0 -0
- package/AISB/image/105_aisb.t3.105_binaryclasseval.jpg +0 -0
- package/AISB/image/106_aisb.t1.reasoning_lite.jpg +0 -0
- package/AISB/image/107_aisb.t2.paper_audit.jpg +0 -0
- package/AISB/image/108_aisb.t3.multi_gpu_search.jpg +0 -0
- package/AISB/image/109_aisb.t3.tdc_admet.jpg +0 -0
- package/AISB/image/aisb.b1.agentic_coding.svg +16 -0
- package/AISB/image/aisb.b10.climate_earth.svg +16 -0
- package/AISB/image/aisb.b11.model_efficiency.svg +16 -0
- package/AISB/image/aisb.b12.embodied_ai.svg +16 -0
- package/AISB/image/aisb.b2.agent_systems.svg +16 -0
- package/AISB/image/aisb.b3.self_evolving_rl.svg +16 -0
- package/AISB/image/aisb.b4.lm_reasoning.svg +16 -0
- package/AISB/image/aisb.b5.math_proof.svg +16 -0
- package/AISB/image/aisb.b6.research_process.svg +16 -0
- package/AISB/image/aisb.b7.multimodal_fusion.svg +16 -0
- package/AISB/image/aisb.b8.lifesci_drug.svg +16 -0
- package/AISB/image/aisb.b9.material_science.svg +16 -0
- package/README.md +196 -32
- package/bin/ds.js +924 -66
- package/docs/en/00_QUICK_START.md +195 -18
- package/docs/en/01_SETTINGS_REFERENCE.md +468 -96
- package/docs/en/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/en/03_QQ_CONNECTOR_GUIDE.md +14 -3
- package/docs/en/04_LINGZHU_CONNECTOR_GUIDE.md +2 -0
- package/docs/en/05_TUI_GUIDE.md +171 -2
- package/docs/en/07_MEMORY_AND_MCP.md +38 -2
- package/docs/en/09_DOCTOR.md +78 -7
- package/docs/en/10_WEIXIN_CONNECTOR_GUIDE.md +38 -1
- package/docs/en/11_LICENSE_AND_RISK.md +4 -0
- package/docs/en/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/en/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/en/15_CODEX_PROVIDER_SETUP.md +624 -180
- package/docs/en/16_TELEGRAM_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/17_WHATSAPP_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/18_FEISHU_CONNECTOR_GUIDE.md +14 -0
- package/docs/en/21_LOCAL_MODEL_BACKENDS_GUIDE.md +386 -0
- package/docs/en/22_BENCHSTORE_YAML_REFERENCE.md +469 -0
- package/docs/en/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +316 -0
- package/docs/en/24_CLAUDE_CODE_PROVIDER_SETUP.md +469 -0
- package/docs/en/25_OPENCODE_PROVIDER_SETUP.md +653 -0
- package/docs/en/26_CITATION_AND_ATTRIBUTION.md +119 -0
- package/docs/en/27_KIMI_CODE_PROVIDER_SETUP.md +180 -0
- package/docs/en/28_DISCORD_CONNECTOR_GUIDE.md +61 -0
- package/docs/en/29_SLACK_CONNECTOR_GUIDE.md +60 -0
- package/docs/en/30_SETTINGS_CONTROL_CENTER_GUIDE.md +371 -0
- package/docs/en/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/en/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +273 -0
- package/docs/en/33_WORKSPACE_EXPLORER_QA.md +121 -0
- package/docs/en/91_DEVELOPMENT.md +266 -0
- package/docs/en/99_ACKNOWLEDGEMENTS.md +24 -19
- package/docs/en/README.md +48 -7
- package/docs/images/admin/admin-connectors-health-en.png +0 -0
- package/docs/images/admin/admin-controllers-en.png +0 -0
- package/docs/images/admin/admin-diagnostics-en.png +0 -0
- package/docs/images/admin/admin-errors-en.png +0 -0
- package/docs/images/admin/admin-issues-en.png +0 -0
- package/docs/images/admin/admin-logs-en.png +0 -0
- package/docs/images/admin/admin-quest-detail-en.png +0 -0
- package/docs/images/admin/admin-quests-en.png +0 -0
- package/docs/images/admin/admin-repairs-en.png +0 -0
- package/docs/images/admin/admin-runtime-en.png +0 -0
- package/docs/images/admin/admin-search-en.png +0 -0
- package/docs/images/admin/admin-stats-en.png +0 -0
- package/docs/images/admin/admin-summary-en.png +0 -0
- package/docs/images/connectors/connector-discord-en.png +0 -0
- package/docs/images/connectors/connector-feishu-en.png +0 -0
- package/docs/images/connectors/connector-lingzhu-en.png +0 -0
- package/docs/images/connectors/connector-qq-en.png +0 -0
- package/docs/images/connectors/connector-slack-en.png +0 -0
- package/docs/images/connectors/connector-telegram-en.png +0 -0
- package/docs/images/connectors/connector-weixin-en.png +0 -0
- package/docs/images/connectors/connector-whatsapp-en.png +0 -0
- package/docs/images/settings/settings-baselines-en.png +0 -0
- package/docs/images/settings/settings-config-en.png +0 -0
- package/docs/images/settings/settings-connectors-overview-en.png +0 -0
- package/docs/images/settings/settings-deepxiv-en.png +0 -0
- package/docs/images/settings/settings-mcp-servers-en.png +0 -0
- package/docs/images/settings/settings-plugins-en.png +0 -0
- package/docs/images/settings/settings-runners-en.png +0 -0
- package/docs/zh/00_QUICK_START.md +142 -18
- package/docs/zh/01_SETTINGS_REFERENCE.md +219 -98
- package/docs/zh/02_START_RESEARCH_GUIDE.md +26 -5
- package/docs/zh/05_TUI_GUIDE.md +171 -2
- package/docs/zh/07_MEMORY_AND_MCP.md +29 -2
- package/docs/zh/09_DOCTOR.md +54 -8
- package/docs/zh/10_WEIXIN_CONNECTOR_GUIDE.md +24 -1
- package/docs/zh/11_LICENSE_AND_RISK.md +4 -0
- package/docs/zh/12_GUIDED_WORKFLOW_TOUR.md +15 -0
- package/docs/zh/14_PROMPT_SKILLS_AND_MCP_GUIDE.md +9 -0
- package/docs/zh/15_CODEX_PROVIDER_SETUP.md +552 -181
- package/docs/zh/21_LOCAL_MODEL_BACKENDS_GUIDE.md +384 -0
- package/docs/zh/22_BENCHSTORE_YAML_REFERENCE.md +459 -0
- package/docs/zh/23_BENCHSTORE_GITHUB_RELEASES_SPEC.md +287 -0
- package/docs/zh/23_CLAUDE_RUNNER_GUIDE.md +103 -0
- package/docs/zh/24_CLAUDE_CODE_PROVIDER_SETUP.md +460 -0
- package/docs/zh/25_OPENCODE_PROVIDER_SETUP.md +660 -0
- package/docs/zh/26_CITATION_AND_ATTRIBUTION.md +102 -0
- package/docs/zh/27_KIMI_CODE_PROVIDER_SETUP.md +51 -0
- package/docs/zh/{19_LOCAL_BROWSER_AUTH.md → 31_LOCAL_BROWSER_AUTH.md} +1 -1
- package/docs/zh/32_WINDOWS_WSL2_DEPLOYMENT_GUIDE.md +264 -0
- package/docs/zh/33_WORKSPACE_EXPLORER_QA.md +127 -0
- package/docs/zh/99_ACKNOWLEDGEMENTS.md +23 -19
- package/docs/zh/README.md +33 -7
- package/install.sh +168 -20
- package/package.json +5 -1
- package/pyproject.toml +2 -1
- package/src/deepscientist/__init__.py +1 -1
- package/src/deepscientist/acp/envelope.py +13 -0
- package/src/deepscientist/admin/__init__.py +3 -0
- package/src/deepscientist/admin/charts.py +681 -0
- package/src/deepscientist/admin/logs.py +119 -0
- package/src/deepscientist/admin/repairs.py +217 -0
- package/src/deepscientist/admin/service.py +1310 -0
- package/src/deepscientist/admin/system_info.py +700 -0
- package/src/deepscientist/admin/tasks.py +465 -0
- package/src/deepscientist/admin/tool_metrics.py +600 -0
- package/src/deepscientist/artifact/guidance.py +8 -4
- package/src/deepscientist/artifact/schemas.py +115 -0
- package/src/deepscientist/artifact/service.py +4268 -260
- package/src/deepscientist/bash_exec/monitor.py +30 -3
- package/src/deepscientist/bash_exec/service.py +134 -1
- package/src/deepscientist/benchstore/__init__.py +4 -0
- package/src/deepscientist/benchstore/prompt_builder.py +224 -0
- package/src/deepscientist/benchstore/service.py +1716 -0
- package/src/deepscientist/bridges/connectors.py +8 -2
- package/src/deepscientist/channels/weixin_ilink.py +8 -1
- package/src/deepscientist/cli.py +92 -17
- package/src/deepscientist/codex_cli_compat.py +187 -74
- package/src/deepscientist/config/models.py +82 -11
- package/src/deepscientist/config/service.py +1077 -93
- package/src/deepscientist/connector/weixin_support.py +48 -17
- package/src/deepscientist/daemon/api/handlers.py +827 -235
- package/src/deepscientist/daemon/api/router.py +81 -1
- package/src/deepscientist/daemon/app.py +1512 -85
- package/src/deepscientist/diagnostics/__init__.py +6 -0
- package/src/deepscientist/diagnostics/runner_failures.py +277 -0
- package/src/deepscientist/doctor.py +407 -56
- package/src/deepscientist/evidence_packets.py +590 -0
- package/src/deepscientist/home.py +52 -4
- package/src/deepscientist/kimi_cli_compat.py +50 -0
- package/src/deepscientist/latex_runtime.py +2 -2
- package/src/deepscientist/mcp/context.py +2 -0
- package/src/deepscientist/mcp/schemas.py +114 -0
- package/src/deepscientist/mcp/server.py +1566 -126
- package/src/deepscientist/memory/service.py +203 -16
- package/src/deepscientist/process_control.py +8 -1
- package/src/deepscientist/prompts/builder.py +850 -88
- package/src/deepscientist/quest/__init__.py +2 -2
- package/src/deepscientist/quest/layout.py +12 -1
- package/src/deepscientist/quest/node_traces.py +10 -0
- package/src/deepscientist/quest/service.py +1852 -161
- package/src/deepscientist/quest/stage_views.py +1 -1
- package/src/deepscientist/runners/__init__.py +18 -0
- package/src/deepscientist/runners/base.py +89 -1
- package/src/deepscientist/runners/builtins.py +13 -1
- package/src/deepscientist/runners/claude.py +391 -0
- package/src/deepscientist/runners/codex.py +480 -35
- package/src/deepscientist/runners/codex_telemetry.py +127 -0
- package/src/deepscientist/runners/kimi.py +334 -0
- package/src/deepscientist/runners/metadata.py +68 -0
- package/src/deepscientist/runners/opencode.py +414 -0
- package/src/deepscientist/runners/runtime_overrides.py +100 -0
- package/src/deepscientist/runners/simple_cli.py +538 -0
- package/src/deepscientist/runtime_storage.py +303 -0
- package/src/deepscientist/shared.py +80 -16
- package/src/deepscientist/skills/installer.py +37 -0
- package/src/deepscientist/skills/registry.py +2 -0
- package/src/deepscientist/tinytex.py +2 -2
- package/src/deepscientist/tui.py +10 -3
- package/src/prompts/benchstore/system.md +77 -0
- package/src/prompts/connectors/qq.md +33 -2
- package/src/prompts/connectors/weixin.md +208 -23
- package/src/prompts/contracts/admin_ops.md +74 -0
- package/src/prompts/contracts/admin_ops_knowledge.md +138 -0
- package/src/prompts/contracts/shared_interaction.md +5 -10
- package/src/prompts/start_setup/system.md +422 -0
- package/src/prompts/system.md +411 -304
- package/src/prompts/system_copilot.md +89 -0
- package/src/skills/analysis-campaign/SKILL.md +239 -578
- package/src/skills/analysis-campaign/references/artifact-flow-examples.md +102 -0
- package/src/skills/analysis-campaign/references/boundary-cases.md +98 -0
- package/src/skills/analysis-campaign/references/campaign-checklist-template.md +39 -24
- package/src/skills/analysis-campaign/references/campaign-design.md +26 -10
- package/src/skills/analysis-campaign/references/campaign-plan-template.md +53 -54
- package/src/skills/analysis-campaign/references/operational-guidance.md +97 -0
- package/src/skills/analysis-campaign/references/writing-facing-slice-examples.md +10 -20
- package/src/skills/baseline/SKILL.md +183 -461
- package/src/skills/baseline/references/artifact-flow-examples.md +106 -0
- package/src/skills/baseline/references/artifact-payload-examples.md +1 -1
- package/src/skills/baseline/references/baseline-checklist-template.md +27 -35
- package/src/skills/baseline/references/baseline-plan-template.md +37 -76
- package/src/skills/baseline/references/boundary-cases.md +86 -0
- package/src/skills/baseline/references/codebase-audit-checklist.md +2 -6
- package/src/skills/baseline/references/comparability-contract.md +7 -12
- package/src/skills/baseline/references/operational-guidance.md +56 -0
- package/src/skills/baseline/references/route-selection.md +5 -25
- package/src/skills/decision/SKILL.md +113 -306
- package/src/skills/decision/references/checkpoint-memory-template.md +47 -0
- package/src/skills/decision/references/operational-guidance.md +94 -0
- package/src/skills/decision/references/research-route-criteria.md +7 -8
- package/src/skills/decision/references/strategic-decision-template.md +13 -26
- package/src/skills/experiment/SKILL.md +132 -670
- package/src/skills/experiment/references/execution-playbook.md +374 -0
- package/src/skills/experiment/references/main-experiment-checklist-template.md +26 -2
- package/src/skills/experiment/references/main-experiment-plan-template.md +28 -17
- package/src/skills/experiment/references/operational-guidance.md +108 -0
- package/src/skills/finalize/SKILL.md +62 -0
- package/src/skills/finalize/references/checkpoint-memory-template.md +49 -0
- package/src/skills/finalize/references/resume-packet-template.md +7 -0
- package/src/skills/idea/SKILL.md +228 -15
- package/src/skills/idea/references/controlled-brainstorming-playbook.md +78 -0
- package/src/skills/idea/references/current-board-packet-template.md +61 -0
- package/src/skills/idea/references/high-value-idea-sourcing.md +119 -0
- package/src/skills/idea/references/idea-generation-playbook.md +21 -0
- package/src/skills/idea/references/idea-thinking-flow.md +6 -0
- package/src/skills/idea/references/literature-survey-template.md +3 -0
- package/src/skills/idea/references/objective-contract-template.md +54 -0
- package/src/skills/idea/references/outline-seeding-example.md +56 -0
- package/src/skills/idea/references/pre-idea-draft-template.md +105 -0
- package/src/skills/idea/references/related-work-playbook.md +75 -2
- package/src/skills/idea/references/research-history-playbook.md +114 -0
- package/src/skills/idea/references/selection-gate.md +58 -6
- package/src/skills/intake-audit/SKILL.md +43 -2
- package/src/skills/intake-audit/references/state-audit-template.md +10 -0
- package/src/skills/nature-data/SKILL.md +128 -0
- package/src/skills/nature-data/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-data/agents/openai.yaml +4 -0
- package/src/skills/nature-data/references/chinese-author-alignment.md +84 -0
- package/src/skills/nature-data/references/fair-metadata-checklist.md +105 -0
- package/src/skills/nature-data/references/policy-principles.md +103 -0
- package/src/skills/nature-data/references/repository-and-identifiers.md +96 -0
- package/src/skills/nature-data/references/source-basis.md +54 -0
- package/src/skills/nature-data/references/statement-patterns.md +153 -0
- package/src/skills/nature-figure/SKILL.md +197 -0
- package/src/skills/nature-figure/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-figure/agents/openai.yaml +4 -0
- package/src/skills/nature-figure/evals/evals.json +37 -0
- package/src/skills/nature-figure/references/api.md +428 -0
- package/src/skills/nature-figure/references/backend-selection.md +100 -0
- package/src/skills/nature-figure/references/chart-types.md +281 -0
- package/src/skills/nature-figure/references/common-patterns.md +349 -0
- package/src/skills/nature-figure/references/design-theory.md +436 -0
- package/src/skills/nature-figure/references/figure-contract.md +93 -0
- package/src/skills/nature-figure/references/nature-2026-observations.md +112 -0
- package/src/skills/nature-figure/references/qa-contract.md +119 -0
- package/src/skills/nature-figure/references/r-template-index.md +66 -0
- package/src/skills/nature-figure/references/r-workflow.md +161 -0
- package/src/skills/nature-figure/references/tutorials.md +250 -0
- package/src/skills/nature-paper2ppt/SKILL.md +507 -0
- package/src/skills/nature-paper2ppt/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-paper2ppt/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/SKILL.md +385 -0
- package/src/skills/nature-polishing/UPSTREAM_LICENSE.txt +21 -0
- package/src/skills/nature-polishing/agents/openai.yaml +4 -0
- package/src/skills/nature-polishing/references/phrasebank-playbook.md +162 -0
- package/src/skills/nature-polishing/references/section-moves.md +240 -0
- package/src/skills/nature-polishing/references/style-guardrails.md +94 -0
- package/src/skills/nature-polishing/references/writing-strategy.md +148 -0
- package/src/skills/optimize/SKILL.md +177 -1568
- package/src/skills/optimize/references/brief-shaping-playbook.md +95 -0
- package/src/skills/optimize/references/candidate-board-template.md +13 -0
- package/src/skills/optimize/references/candidate-ranking-template.md +51 -0
- package/src/skills/optimize/references/codegen-route-playbook.md +50 -0
- package/src/skills/optimize/references/debug-response-template.md +29 -0
- package/src/skills/optimize/references/frontier-review-template.md +32 -0
- package/src/skills/optimize/references/fusion-playbook.md +36 -0
- package/src/skills/optimize/references/method-brief-template.md +73 -0
- package/src/skills/optimize/references/operational-guidance.md +621 -0
- package/src/skills/optimize/references/optimization-memory-template.md +30 -0
- package/src/skills/optimize/references/optimize-checklist-template.md +18 -0
- package/src/skills/optimize/references/plateau-response-playbook.md +28 -0
- package/src/skills/optimize/references/prompt-patterns.md +49 -0
- package/src/skills/paper-outline/SKILL.md +227 -0
- package/src/skills/paper-outline/references/outline-patterns.md +87 -0
- package/src/skills/paper-plot/SKILL.md +79 -0
- package/src/skills/paper-plot/agents/openai.yaml +4 -0
- package/src/skills/paper-plot/references/bar_grouped_hatch.md +96 -0
- package/src/skills/paper-plot/references/bar_paired_delta.md +72 -0
- package/src/skills/paper-plot/references/line_confidence_band.md +75 -0
- package/src/skills/paper-plot/references/line_loss_with_inset.md +65 -0
- package/src/skills/paper-plot/references/line_training_curve.md +44 -0
- package/src/skills/paper-plot/references/radar_dual_series.md +59 -0
- package/src/skills/paper-plot/references/scatter_broken_axis.md +59 -0
- package/src/skills/paper-plot/references/scatter_tsne_cluster.md +72 -0
- package/src/skills/paper-plot/scripts/bar_memevolve.py +109 -0
- package/src/skills/paper-plot/scripts/bar_spice.py +166 -0
- package/src/skills/paper-plot/scripts/line_aime.py +94 -0
- package/src/skills/paper-plot/scripts/line_loss_inset.py +157 -0
- package/src/skills/paper-plot/scripts/line_selfdistill.py +168 -0
- package/src/skills/paper-plot/scripts/radar_dora.py +151 -0
- package/src/skills/paper-plot/scripts/scatter_break.py +169 -0
- package/src/skills/paper-plot/scripts/scatter_tsne.py +133 -0
- package/src/skills/rebuttal/SKILL.md +9 -0
- package/src/skills/references/tool-usage-by-stage.md +438 -0
- package/src/skills/review/SKILL.md +105 -7
- package/src/skills/science/PROVENANCE.md +44 -0
- package/src/skills/science/SKILL.md +137 -0
- package/src/skills/science/references/artifact-science-tool.md +110 -0
- package/src/skills/science/references/claim-type-discipline.md +56 -0
- package/src/skills/science/references/domain-index.md +422 -0
- package/src/skills/science/references/hpc-via-bash-exec.md +42 -0
- package/src/skills/science/references/package-check-playbook.md +64 -0
- package/src/skills/science/references/package-index.min.json +3616 -0
- package/src/skills/science/references/packages/abinit.md +80 -0
- package/src/skills/science/references/packages/acts.md +73 -0
- package/src/skills/science/references/packages/aiida-core.md +80 -0
- package/src/skills/science/references/packages/alamode.md +80 -0
- package/src/skills/science/references/packages/amuse.md +88 -0
- package/src/skills/science/references/packages/anndata.md +88 -0
- package/src/skills/science/references/packages/arbor.md +80 -0
- package/src/skills/science/references/packages/arc.md +73 -0
- package/src/skills/science/references/packages/astropy.md +88 -0
- package/src/skills/science/references/packages/astroquery.md +88 -0
- package/src/skills/science/references/packages/atomate2.md +80 -0
- package/src/skills/science/references/packages/atomsmltr.md +73 -0
- package/src/skills/science/references/packages/awkward.md +73 -0
- package/src/skills/science/references/packages/batman.md +88 -0
- package/src/skills/science/references/packages/biopython.md +88 -0
- package/src/skills/science/references/packages/bloqade.md +73 -0
- package/src/skills/science/references/packages/brian2.md +73 -0
- package/src/skills/science/references/packages/bullet3.md +73 -0
- package/src/skills/science/references/packages/calculix.md +80 -0
- package/src/skills/science/references/packages/cantera.md +73 -0
- package/src/skills/science/references/packages/cavity-md-ipi.md +80 -0
- package/src/skills/science/references/packages/ccdproc.md +88 -0
- package/src/skills/science/references/packages/celerite2.md +88 -0
- package/src/skills/science/references/packages/cellrank.md +73 -0
- package/src/skills/science/references/packages/cesm.md +80 -0
- package/src/skills/science/references/packages/chemicals.md +73 -0
- package/src/skills/science/references/packages/chempy.md +73 -0
- package/src/skills/science/references/packages/cirq.md +73 -0
- package/src/skills/science/references/packages/coffea.md +73 -0
- package/src/skills/science/references/packages/cp2k.md +88 -0
- package/src/skills/science/references/packages/custodian.md +80 -0
- package/src/skills/science/references/packages/dart.md +73 -0
- package/src/skills/science/references/packages/datamol.md +88 -0
- package/src/skills/science/references/packages/dd4hep.md +73 -0
- package/src/skills/science/references/packages/dealii.md +80 -0
- package/src/skills/science/references/packages/deepchem.md +88 -0
- package/src/skills/science/references/packages/delphes.md +73 -0
- package/src/skills/science/references/packages/devito.md +80 -0
- package/src/skills/science/references/packages/dftb.md +88 -0
- package/src/skills/science/references/packages/dftd4.md +88 -0
- package/src/skills/science/references/packages/dftk-jl.md +80 -0
- package/src/skills/science/references/packages/dolfinx.md +80 -0
- package/src/skills/science/references/packages/drake.md +73 -0
- package/src/skills/science/references/packages/dumux.md +73 -0
- package/src/skills/science/references/packages/elk.md +80 -0
- package/src/skills/science/references/packages/elmerfem.md +80 -0
- package/src/skills/science/references/packages/enzo-e.md +88 -0
- package/src/skills/science/references/packages/espresso.md +80 -0
- package/src/skills/science/references/packages/exoplanet.md +88 -0
- package/src/skills/science/references/packages/fairroot.md +73 -0
- package/src/skills/science/references/packages/fbpic.md +80 -0
- package/src/skills/science/references/packages/fdtdbath-meep.md +80 -0
- package/src/skills/science/references/packages/geant4.md +73 -0
- package/src/skills/science/references/packages/geosx.md +80 -0
- package/src/skills/science/references/packages/gprmax.md +80 -0
- package/src/skills/science/references/packages/gromacs.md +80 -0
- package/src/skills/science/references/packages/gwaslab.md +73 -0
- package/src/skills/science/references/packages/gz-sim.md +73 -0
- package/src/skills/science/references/packages/hail.md +88 -0
- package/src/skills/science/references/packages/hiphive.md +80 -0
- package/src/skills/science/references/packages/hoomd-blue.md +80 -0
- package/src/skills/science/references/packages/itensor.md +73 -0
- package/src/skills/science/references/packages/itensors-jl.md +73 -0
- package/src/skills/science/references/packages/jdftx.md +73 -0
- package/src/skills/science/references/packages/jobflow.md +80 -0
- package/src/skills/science/references/packages/kadanoffbaym-jl.md +73 -0
- package/src/skills/science/references/packages/kite.md +80 -0
- package/src/skills/science/references/packages/kratos.md +80 -0
- package/src/skills/science/references/packages/kwant.md +73 -0
- package/src/skills/science/references/packages/lammps.md +80 -0
- package/src/skills/science/references/packages/lightkurve.md +88 -0
- package/src/skills/science/references/packages/limix.md +73 -0
- package/src/skills/science/references/packages/maxwelllink.md +80 -0
- package/src/skills/science/references/packages/mcdc.md +73 -0
- package/src/skills/science/references/packages/meep.md +80 -0
- package/src/skills/science/references/packages/mfem.md +80 -0
- package/src/skills/science/references/packages/mitgcm.md +73 -0
- package/src/skills/science/references/packages/modflow6.md +73 -0
- package/src/skills/science/references/packages/molecool.md +73 -0
- package/src/skills/science/references/packages/mom6.md +73 -0
- package/src/skills/science/references/packages/moose.md +80 -0
- package/src/skills/science/references/packages/mpas-model.md +73 -0
- package/src/skills/science/references/packages/mujoco.md +73 -0
- package/src/skills/science/references/packages/mumax3.md +73 -0
- package/src/skills/science/references/packages/nekrs.md +80 -0
- package/src/skills/science/references/packages/nessi.md +73 -0
- package/src/skills/science/references/packages/nest-simulator.md +73 -0
- package/src/skills/science/references/packages/netket.md +73 -0
- package/src/skills/science/references/packages/neuron.md +73 -0
- package/src/skills/science/references/packages/nextflow.md +88 -0
- package/src/skills/science/references/packages/nwchem.md +88 -0
- package/src/skills/science/references/packages/openbabel.md +88 -0
- package/src/skills/science/references/packages/openems.md +80 -0
- package/src/skills/science/references/packages/openff-toolkit.md +88 -0
- package/src/skills/science/references/packages/openfoam-dev.md +80 -0
- package/src/skills/science/references/packages/openmc.md +73 -0
- package/src/skills/science/references/packages/openmm.md +80 -0
- package/src/skills/science/references/packages/openmoc.md +73 -0
- package/src/skills/science/references/packages/openmx.md +80 -0
- package/src/skills/science/references/packages/opensees.md +80 -0
- package/src/skills/science/references/packages/opensn.md +80 -0
- package/src/skills/science/references/packages/opm-simulators.md +73 -0
- package/src/skills/science/references/packages/oqupy.md +73 -0
- package/src/skills/science/references/packages/packmol.md +80 -0
- package/src/skills/science/references/packages/palabos.md +80 -0
- package/src/skills/science/references/packages/parflow.md +80 -0
- package/src/skills/science/references/packages/pennylane.md +88 -0
- package/src/skills/science/references/packages/perceval.md +73 -0
- package/src/skills/science/references/packages/phono3py.md +73 -0
- package/src/skills/science/references/packages/phonopy.md +73 -0
- package/src/skills/science/references/packages/photutils.md +88 -0
- package/src/skills/science/references/packages/picongpu.md +80 -0
- package/src/skills/science/references/packages/plink-ng.md +88 -0
- package/src/skills/science/references/packages/precice.md +73 -0
- package/src/skills/science/references/packages/psc.md +80 -0
- package/src/skills/science/references/packages/psi4.md +88 -0
- package/src/skills/science/references/packages/pybinding.md +73 -0
- package/src/skills/science/references/packages/pyfr.md +80 -0
- package/src/skills/science/references/packages/pyhf.md +73 -0
- package/src/skills/science/references/packages/pyiron_base.md +80 -0
- package/src/skills/science/references/packages/pylcp.md +73 -0
- package/src/skills/science/references/packages/pylith.md +80 -0
- package/src/skills/science/references/packages/pynbody.md +88 -0
- package/src/skills/science/references/packages/pysam.md +88 -0
- package/src/skills/science/references/packages/pyscf.md +88 -0
- package/src/skills/science/references/packages/q-e.md +73 -0
- package/src/skills/science/references/packages/qibo.md +73 -0
- package/src/skills/science/references/packages/qiskit.md +73 -0
- package/src/skills/science/references/packages/quantica-jl.md +73 -0
- package/src/skills/science/references/packages/quantumoptics-jl.md +73 -0
- package/src/skills/science/references/packages/quimb.md +73 -0
- package/src/skills/science/references/packages/qulacs.md +73 -0
- package/src/skills/science/references/packages/qutip.md +73 -0
- package/src/skills/science/references/packages/rdkit.md +88 -0
- package/src/skills/science/references/packages/rmg-py.md +73 -0
- package/src/skills/science/references/packages/root.md +73 -0
- package/src/skills/science/references/packages/scanpy.md +88 -0
- package/src/skills/science/references/packages/scikit-allel.md +88 -0
- package/src/skills/science/references/packages/scikit-bio.md +88 -0
- package/src/skills/science/references/packages/scqubits.md +73 -0
- package/src/skills/science/references/packages/scuff-em.md +80 -0
- package/src/skills/science/references/packages/scvi-tools.md +73 -0
- package/src/skills/science/references/packages/seissol.md +73 -0
- package/src/skills/science/references/packages/sfepy.md +80 -0
- package/src/skills/science/references/packages/sisl.md +73 -0
- package/src/skills/science/references/packages/smilei.md +80 -0
- package/src/skills/science/references/packages/snakemake.md +88 -0
- package/src/skills/science/references/packages/specfem3d-globe.md +80 -0
- package/src/skills/science/references/packages/specutils.md +88 -0
- package/src/skills/science/references/packages/spglib.md +80 -0
- package/src/skills/science/references/packages/squidpy.md +88 -0
- package/src/skills/science/references/packages/starry.md +88 -0
- package/src/skills/science/references/packages/strawberryfields.md +73 -0
- package/src/skills/science/references/packages/su2.md +80 -0
- package/src/skills/science/references/packages/sunny-jl.md +73 -0
- package/src/skills/science/references/packages/sw4.md +73 -0
- package/src/skills/science/references/packages/swift.md +88 -0
- package/src/skills/science/references/packages/tdnegf.md +73 -0
- package/src/skills/science/references/packages/tenpy.md +73 -0
- package/src/skills/science/references/packages/thermo.md +73 -0
- package/src/skills/science/references/packages/tkwant.md +73 -0
- package/src/skills/science/references/packages/tvb-root.md +73 -0
- package/src/skills/science/references/packages/uproot5.md +73 -0
- package/src/skills/science/references/packages/vampire.md +80 -0
- package/src/skills/science/references/packages/wannier_tools.md +73 -0
- package/src/skills/science/references/packages/warpx.md +80 -0
- package/src/skills/science/references/packages/wrf.md +73 -0
- package/src/skills/science/references/packages/xtb.md +88 -0
- package/src/skills/science/references/packages/yt.md +73 -0
- package/src/skills/science/references/science-task-brief-template.md +71 -0
- package/src/skills/scout/SKILL.md +83 -425
- package/src/skills/scout/references/literature-scout-template.md +5 -24
- package/src/skills/scout/references/operational-guidance.md +191 -0
- package/src/skills/scout/references/paper-triage-playbook.md +11 -35
- package/src/skills/write/SKILL.md +744 -1246
- package/src/skills/write/references/experiments_analysis_patterns.md +129 -0
- package/src/skills/write/references/oral_package_patterns.md +252 -0
- package/src/skills/write/references/oral_writing_principles.md +291 -0
- package/src/skills/write/references/section_rewrite_checklist.md +234 -0
- package/src/tui/dist/app/AppContainer.js +1314 -27
- package/src/tui/dist/components/Composer.js +26 -1
- package/src/tui/dist/components/ConfigScreen.js +2 -1
- package/src/tui/dist/components/InputPrompt.js +25 -9
- package/src/tui/dist/components/MainContent.js +18 -3
- package/src/tui/dist/components/QuestScreen.js +3 -2
- package/src/tui/dist/components/UtilityScreen.js +37 -0
- package/src/tui/dist/hooks/useSafeInput.js +10 -0
- package/src/tui/dist/index.js +13 -1
- package/src/tui/dist/layouts/DefaultAppLayout.js +11 -8
- package/src/tui/dist/lib/api.js +89 -1
- package/src/tui/package.json +1 -1
- package/src/ui/dist/assets/{AnalysisPlugin-DnSm0GZn.js → AnalysisPlugin-CA94NGmI.js} +1 -1
- package/src/ui/dist/assets/CliPlugin-DHBzphZU.js +79 -0
- package/src/ui/dist/assets/CodeEditorPlugin-BOFwD2rn.js +2 -0
- package/src/ui/dist/assets/{CodeViewerPlugin-itb0tltR.js → CodeViewerPlugin-CqDpgjik.js} +4 -4
- package/src/ui/dist/assets/{DocViewerPlugin-DqKkiCI6.js → DocViewerPlugin-UDBgt8-4.js} +3 -3
- package/src/ui/dist/assets/GitCommitViewerPlugin-BmHtZ0bZ.js +6 -0
- package/src/ui/dist/assets/{GitDiffViewerPlugin-DxL2ezFG.js → GitDiffViewerPlugin-CAxjNorQ.js} +2 -2
- package/src/ui/dist/assets/{GitSnapshotViewer-B_RQm1YZ.js → GitSnapshotViewer-CweA6VON.js} +2 -2
- package/src/ui/dist/assets/{ImageViewerPlugin-tHqlXY3n.js → ImageViewerPlugin-C8wHGvGN.js} +5 -5
- package/src/ui/dist/assets/LabPlugin-COyyLUol.js +32 -0
- package/src/ui/dist/assets/{LatexPlugin-B495DTXC.js → LatexPlugin-BQjAaA5J.js} +4 -4
- package/src/ui/dist/assets/{MarkdownViewerPlugin-DG28-61B.js → MarkdownViewerPlugin-Dy1NE2dI.js} +3 -3
- package/src/ui/dist/assets/{MarketplacePlugin-BiOGT-Kj.js → MarketplacePlugin-DMIZtEJ2.js} +2 -2
- package/src/ui/dist/assets/NotebookEditor-CFHMq_Qt.js +91 -0
- package/src/ui/dist/assets/{NotebookEditor-CVsj8h_T.js → NotebookEditor-WFyd8Ybt.js} +23 -23
- package/src/ui/dist/assets/{PdfLoader-CASDQmxJ.js → PdfLoader-CLE5u5TS.js} +3 -3
- package/src/ui/dist/assets/{PdfMarkdownPlugin-BFhwoKsY.js → PdfMarkdownPlugin-_iNK_H83.js} +1 -1
- package/src/ui/dist/assets/PdfViewerPlugin-DgWsbInT.js +22 -0
- package/src/ui/dist/assets/SearchPlugin-DrZmn5iw.js +11 -0
- package/src/ui/dist/assets/{TextViewerPlugin-CB4DYfWO.js → TextViewerPlugin-D1-T3aC7.js} +4 -4
- package/src/ui/dist/assets/branding/runner-claude.svg +107 -0
- package/src/ui/dist/assets/branding/runner-codex.svg +10 -0
- package/src/ui/dist/assets/branding/runner-kimi.svg +14 -0
- package/src/ui/dist/assets/branding/runner-opencode.svg +7 -0
- package/src/ui/dist/assets/cli-store-CoZ-x5Ip.js +1 -0
- package/src/ui/dist/assets/{code-DLC6G24T.js → code-DbsmSd3Y.js} +1 -1
- package/src/ui/dist/assets/file-diff-panel-DsvyRz47.js +1 -0
- package/src/ui/dist/assets/{wrap-text-CwMn-iqb.js → file-jump-queue-DeQBikaw.js} +3 -3
- package/src/ui/dist/assets/{file-socket-Cu4Qln7Y.js → file-socket-DA5XIx88.js} +1 -1
- package/src/ui/dist/assets/fonts/ds-fonts.css +50 -4
- package/src/ui/dist/assets/images/deepxiv/register-guide.png +0 -0
- package/src/ui/dist/assets/index-39vY9LmZ.js +1 -0
- package/src/ui/dist/assets/{index-wQ7RIIRd.js → index-BsO46tJA.js} +1 -1
- package/src/ui/dist/assets/index-CHzJ2xtB.js +3530 -0
- package/src/ui/dist/assets/index-DH-zxoZ3.css +33 -0
- package/src/ui/dist/assets/{plugin-notebook-HbW2K-1c.js → plugin-notebook-JRhysCqj.js} +2 -2
- package/src/ui/dist/assets/{project-sync-CsX08Qno.js → project-sync-DPmWKmKD.js} +1 -1
- package/src/ui/dist/assets/{zoom-out-R-GWEhzS.js → zoom-out-DAukFWen.js} +3 -3
- package/src/ui/dist/index.html +3 -3
- package/src/skills/analysis-campaign/references/artifact-orchestration.md +0 -58
- package/src/skills/baseline/references/memory-playbook.md +0 -40
- package/src/skills/baseline/references/publishable-baseline-package.md +0 -30
- package/src/skills/write/references/outline-evidence-contract-example.md +0 -107
- package/src/skills/write/references/paper-experiment-matrix-template.md +0 -131
- package/src/skills/write/references/paper-section-playbook.md +0 -64
- package/src/skills/write/references/reviewer-first-writing.md +0 -64
- package/src/skills/write/references/revision-checklist.md +0 -70
- package/src/skills/write/references/section-contracts.md +0 -82
- package/src/skills/write/references/sentence-level-proofing.md +0 -49
- package/src/ui/dist/assets/AiManusChatView-COFACy7V.js +0 -204
- package/src/ui/dist/assets/CliPlugin-CvwCmDQ5.js +0 -109
- package/src/ui/dist/assets/CodeEditorPlugin-cOqSa0xq.js +0 -2
- package/src/ui/dist/assets/GitCommitViewerPlugin-DVgNHBCS.js +0 -1
- package/src/ui/dist/assets/LabCopilotPanel-ClMbq5Yu.js +0 -14
- package/src/ui/dist/assets/LabPlugin-L_SuE8ow.js +0 -22
- package/src/ui/dist/assets/NotebookEditor-C-4Kt1p9.js +0 -81
- package/src/ui/dist/assets/PdfViewerPlugin-DcOzU9vd.js +0 -17
- package/src/ui/dist/assets/SearchPlugin-CHj7M58O.js +0 -16
- package/src/ui/dist/assets/VNCViewer-CjlbyCB3.js +0 -11
- package/src/ui/dist/assets/bot-CFkZY-JP.js +0 -6
- package/src/ui/dist/assets/chevron-up-Dq5ofbht.js +0 -6
- package/src/ui/dist/assets/file-content-Dv4LoZec.js +0 -1
- package/src/ui/dist/assets/file-diff-panel-Denq-lC3.js +0 -1
- package/src/ui/dist/assets/file-jump-queue-DA-SdG__.js +0 -1
- package/src/ui/dist/assets/git-commit-horizontal-BUh6G52n.js +0 -6
- package/src/ui/dist/assets/image-B9HUUddG.js +0 -6
- package/src/ui/dist/assets/index-B2B1sg-M.js +0 -1
- package/src/ui/dist/assets/index-Cgla8biy.css +0 -33
- package/src/ui/dist/assets/index-DRyx7vAc.js +0 -1
- package/src/ui/dist/assets/index-Gbl53BNp.js +0 -2496
- package/src/ui/dist/assets/pdf-effect-queue-ZtnHFCAi.js +0 -6
- package/src/ui/dist/assets/popover-DL6h35vr.js +0 -1
- package/src/ui/dist/assets/select-DvmXt1yY.js +0 -11
- package/src/ui/dist/assets/sigma-7jpXazui.js +0 -6
- package/src/ui/dist/assets/trash-xA7kFt8i.js +0 -11
- package/src/ui/dist/assets/useCliAccess-DsMwDjOp.js +0 -1
- package/src/ui/dist/assets/useFileDiffOverlay-FuhcnKiw.js +0 -1
|
@@ -0,0 +1,183 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.049_hogwildinference
|
|
3
|
+
name: 'Hogwild! Inference: Parallel LLM Generation via Concurrent Attention'
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: 'Benchmark and optimize parallel LLM inference where multiple workers share
|
|
6
|
+
a concurrent KV cache, measuring tokens-per-second throughput and custom CUDA kernel
|
|
7
|
+
latency on L40-class GPUs.
|
|
8
|
+
|
|
9
|
+
'
|
|
10
|
+
task_description: 'This benchmark evaluates a parallel LLM generation system called
|
|
11
|
+
Hogwild! Inference, where multiple LLM "workers" run concurrently with a shared
|
|
12
|
+
Key-Value attention cache, allowing instant cross-attention between workers via
|
|
13
|
+
RoPE position re-rotation. The optimization task is to maximize multi-worker inference
|
|
14
|
+
throughput (tokens_per_second) without breaking correctness or stability of the
|
|
15
|
+
concurrent cache mechanism.
|
|
16
|
+
|
|
17
|
+
The package provides two execution routes: (1) Jupyter notebooks (basic_example,
|
|
18
|
+
full_example, hogwild_with_fast_kernels) that run 2-agent parallel inference on
|
|
19
|
+
open-source reasoning LLMs (e.g. QwQ, DeepSeek-R1) using the Python `shared_cache`
|
|
20
|
+
library and `generation.py`, and (2) a standalone C++/CUDA kernel benchmark (`inference_lib/src/benchmark.cpp`)
|
|
21
|
+
that measures raw attention-kernel latency in microseconds for the custom Flash-Decoding-inspired
|
|
22
|
+
paged attention with per-block query rotation.
|
|
23
|
+
|
|
24
|
+
The fast kernels require compilation via CMake with nvcc (CUDA architectures 80/86/89)
|
|
25
|
+
and were tuned for L40 GPUs. The primary metric `tokens_per_second` is route-backed
|
|
26
|
+
through the kernel benchmark executable but has not been verified end-to-end in
|
|
27
|
+
this packaging pass; runtime execution is required before trusting reported values.
|
|
28
|
+
Model weights (e.g. Llama-3.2-3B for Colab, or larger reasoning models like QwQ-32B)
|
|
29
|
+
must be downloaded from HuggingFace at inference time. No training is involved—this
|
|
30
|
+
is purely an inference-time systems benchmark.
|
|
31
|
+
|
|
32
|
+
'
|
|
33
|
+
capability_tags:
|
|
34
|
+
- research_code_optimization
|
|
35
|
+
- large_language_models
|
|
36
|
+
- parallel_inference
|
|
37
|
+
- systems_efficiency
|
|
38
|
+
- cuda_kernels
|
|
39
|
+
aisb_direction: T3
|
|
40
|
+
track_fit:
|
|
41
|
+
- paper_track
|
|
42
|
+
- benchmark_track
|
|
43
|
+
task_mode: evaluation_driven
|
|
44
|
+
requires_execution: true
|
|
45
|
+
requires_paper: true
|
|
46
|
+
integrity_level: cas_plus_canary
|
|
47
|
+
snapshot_status: partial
|
|
48
|
+
support_level: advanced
|
|
49
|
+
time_band: 1-2d
|
|
50
|
+
cost_band: high
|
|
51
|
+
difficulty: hard
|
|
52
|
+
data_access: public
|
|
53
|
+
primary_outputs:
|
|
54
|
+
- tokens_per_second
|
|
55
|
+
- kernel_latency_us
|
|
56
|
+
- benchmark_logs
|
|
57
|
+
launch_profiles:
|
|
58
|
+
- id: notebook_inference
|
|
59
|
+
label: Notebook Inference
|
|
60
|
+
description: 'Run the bundled Jupyter notebooks (basic_example, full_example, hogwild_with_fast_kernels)
|
|
61
|
+
to perform 2-agent parallel LLM inference with a shared KV cache. Requires a GPU
|
|
62
|
+
with sufficient VRAM for the chosen model. Outputs generation traces and informal
|
|
63
|
+
throughput.
|
|
64
|
+
|
|
65
|
+
'
|
|
66
|
+
- id: kernel_benchmark
|
|
67
|
+
label: CUDA Kernel Benchmark
|
|
68
|
+
description: 'Build the C++ benchmark executable from inference_lib via CMake +
|
|
69
|
+
nvcc, then run it to measure raw attention kernel latency. Produces microsecond-level
|
|
70
|
+
timing for the custom paged-attention kernel with query rotation. Throughput conversion
|
|
71
|
+
to tokens_per_second must be verified manually against end-to-end generation.
|
|
72
|
+
|
|
73
|
+
'
|
|
74
|
+
dataset_download:
|
|
75
|
+
primary_method: huggingface
|
|
76
|
+
sources:
|
|
77
|
+
- kind: huggingface
|
|
78
|
+
url: https://huggingface.co/models
|
|
79
|
+
access: public
|
|
80
|
+
note: 'Model weights (e.g. Llama-3.2-3B, QwQ-32B, DeepSeek-R1) are downloaded
|
|
81
|
+
at inference time via HuggingFace transformers. No separate dataset download
|
|
82
|
+
is required; the benchmark operates on prompted reasoning tasks defined in the
|
|
83
|
+
notebooks.
|
|
84
|
+
|
|
85
|
+
'
|
|
86
|
+
notes:
|
|
87
|
+
- No large offline dataset is needed. Storage is dominated by model weights (7–65
|
|
88
|
+
GB depending on model choice).
|
|
89
|
+
- The evals/ directory contains evaluation scripts for LIMO, LiveCodeBench, and
|
|
90
|
+
OlympiadBench but these are auxiliary.
|
|
91
|
+
credential_requirements:
|
|
92
|
+
mode: none
|
|
93
|
+
items: []
|
|
94
|
+
notes:
|
|
95
|
+
- A HuggingFace token may be needed for gated models like Llama-3.2 but is not required
|
|
96
|
+
for all model choices.
|
|
97
|
+
resources:
|
|
98
|
+
minimum:
|
|
99
|
+
cpu_cores: 8
|
|
100
|
+
ram_gb: 32
|
|
101
|
+
disk_gb: 80
|
|
102
|
+
gpu_count: 1
|
|
103
|
+
gpu_vram_gb: 24
|
|
104
|
+
recommended:
|
|
105
|
+
cpu_cores: 16
|
|
106
|
+
ram_gb: 64
|
|
107
|
+
disk_gb: 150
|
|
108
|
+
gpu_count: 1
|
|
109
|
+
gpu_vram_gb: 48
|
|
110
|
+
environment:
|
|
111
|
+
python: '3.10'
|
|
112
|
+
cuda: '11.8'
|
|
113
|
+
pytorch: 2.6.0
|
|
114
|
+
key_packages:
|
|
115
|
+
- transformers==4.51.3
|
|
116
|
+
- numpy
|
|
117
|
+
- CLI11 (C++ dep, fetched by CMake)
|
|
118
|
+
notes:
|
|
119
|
+
- The fast inference kernels require nvcc in PATH (or CUDACXX set). CMake >= 3.22
|
|
120
|
+
is needed.
|
|
121
|
+
- CUDA architectures 80, 86, 89 are targeted (A100 class, RTX 30-series/A40 class, and L40/RTX 4090 class, respectively).
|
|
122
|
+
- Kernels were specifically optimized for L40 and similar GPUs; performance on other
|
|
123
|
+
architectures may differ.
|
|
124
|
+
- The Colab notebook demonstrates a minimal route with Llama-3.2-3B and limited
|
|
125
|
+
collaboration.
|
|
126
|
+
- pip install -e . inside inference_lib/ builds the Python-bound CUDA extension.
|
|
127
|
+
risk_flags:
|
|
128
|
+
- metric_not_verified_e2e
|
|
129
|
+
- requires_cuda_compilation
|
|
130
|
+
- model_download_at_runtime
|
|
131
|
+
risk_notes:
|
|
132
|
+
- 'The primary metric tokens_per_second is route-backed via the C++ kernel benchmark
|
|
133
|
+
but no end-to-end benchmark execution was performed during packaging. Runtime verification
|
|
134
|
+
is required before trusting metric values.
|
|
135
|
+
|
|
136
|
+
'
|
|
137
|
+
- 'Building the fast kernels requires a working nvcc toolchain and compatible GPU
|
|
138
|
+
architecture. Compilation failures are possible on non-standard CUDA setups.
|
|
139
|
+
|
|
140
|
+
'
|
|
141
|
+
- 'Larger reasoning models (QwQ-32B, DeepSeek-R1) require 48+ GB VRAM; the minimum
|
|
142
|
+
24 GB spec only supports smaller models like Llama-3.2-3B with limited collaboration
|
|
143
|
+
quality.
|
|
144
|
+
|
|
145
|
+
'
|
|
146
|
+
- 'The evals/ directory references external evaluation suites (LIMO, LiveCodeBench,
|
|
147
|
+
OlympiadBench) that may require additional setup not fully documented in the snapshot.
|
|
148
|
+
|
|
149
|
+
'
|
|
150
|
+
recommended_when: 'Use this benchmark when you want an LLM-systems optimization task
|
|
151
|
+
focused on parallel inference throughput, concurrent KV cache design, and custom
|
|
152
|
+
CUDA kernel performance. Suitable for researchers working on inference-time parallelism,
|
|
153
|
+
attention kernel optimization, or multi-agent LLM coordination at the systems level.
|
|
154
|
+
|
|
155
|
+
'
|
|
156
|
+
not_recommended_when: 'Do not use this if you lack access to a modern CUDA GPU (Ampere
|
|
157
|
+
or newer), if you need a training-oriented benchmark, or if you are looking for
|
|
158
|
+
a self-contained accuracy evaluation with automated scoring. The metric surface
|
|
159
|
+
requires manual verification and the kernel build adds significant setup complexity.
|
|
160
|
+
|
|
161
|
+
'
|
|
162
|
+
paper:
|
|
163
|
+
title: 'Hogwild! Inference: Parallel LLM Generation via Concurrent Attention'
|
|
164
|
+
venue: arXiv preprint
|
|
165
|
+
year: 2025
|
|
166
|
+
url: https://arxiv.org/abs/2504.06261
|
|
167
|
+
download:
|
|
168
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.049_hogwildinference.zip
|
|
169
|
+
archive_type: zip
|
|
170
|
+
local_dir_name: paper-49-HogwildInference
|
|
171
|
+
provider: github_release
|
|
172
|
+
repo: ResearAI/DeepScientist
|
|
173
|
+
tag: aisb-v0.0.1
|
|
174
|
+
asset_name: aisb.t3.049_hogwildinference.zip
|
|
175
|
+
sha256: b5cc4e8d0a697683307a664b948af23324ca548c6ce7b8380035fe7410dabcdd
|
|
176
|
+
size_bytes: 226660
|
|
177
|
+
commercial:
|
|
178
|
+
annual_fee: null
|
|
179
|
+
display:
|
|
180
|
+
palette_seed: orange-slate-cache
|
|
181
|
+
art_style: concurrent-systems
|
|
182
|
+
accent_priority: high
|
|
183
|
+
image_path: ../image/049_aisb.t3.049_hogwildinference.jpg
|
|
@@ -0,0 +1,138 @@
|
|
|
1
|
+
schema_version: 1
|
|
2
|
+
id: aisb.t3.049_hogwildinference
|
|
3
|
+
name: 'Hogwild! Inference: Parallel LLM Generation via Concurrent Attention'
|
|
4
|
+
version: 0.1.0
|
|
5
|
+
one_line: '在多个工作进程共享并发 KV 缓存的并行 LLM 推理场景下进行基准测试和优化,测量 L40 级 GPU 上的每秒令牌吞吐量和自定义 CUDA 内核延迟。
|
|
6
|
+
|
|
7
|
+
'
|
|
8
|
+
task_description: '该基准测试评估名为 Hogwild! Inference 的并行 LLM 生成系统,其中多个 LLM"工作进程"通过共享键值注意力缓存并发运行,通过 RoPE 位置重旋转实现工作进程间的即时交叉注意力。优化任务是在不破坏并发缓存机制正确性或稳定性的前提下,最大化多工作进程推理吞吐量(tokens_per_second)。
|
|
9
|
+
|
|
10
|
+
该软件包提供两条执行路径:(1)Jupyter 笔记本(basic_example、full_example、hogwild_with_fast_kernels),使用 Python `shared_cache` 库和 `generation.py` 在开源推理 LLM(如 QwQ、DeepSeek-R1)上运行 2 智能体并行推理;(2)独立 C++/CUDA 内核基准测试(`inference_lib/src/benchmark.cpp`),用于测量自定义 Flash-Decoding 启发的分页注意力(带逐块查询旋转)的原始注意力内核延迟(微秒级)。
|
|
11
|
+
|
|
12
|
+
快速内核需要通过 CMake + nvcc 编译(CUDA 架构 80/86/89),并针对 L40 GPU 进行了优化。主要指标 `tokens_per_second` 通过内核基准测试可执行文件进行了路由支持,但在本次打包过程中未进行端到端验证,需要运行时执行后才能信任报告值。模型权重(如 Colab 用的 Llama-3.2-3B,或更大的推理模型如 QwQ-32B)需要在推理时从 HuggingFace 下载。无需训练——这是纯推理时系统基准测试。
|
|
13
|
+
|
|
14
|
+
'
|
|
15
|
+
capability_tags:
|
|
16
|
+
- research_code_optimization
|
|
17
|
+
- large_language_models
|
|
18
|
+
- parallel_inference
|
|
19
|
+
- systems_efficiency
|
|
20
|
+
- cuda_kernels
|
|
21
|
+
aisb_direction: T3
|
|
22
|
+
track_fit:
|
|
23
|
+
- paper_track
|
|
24
|
+
- benchmark_track
|
|
25
|
+
task_mode: evaluation_driven
|
|
26
|
+
requires_execution: true
|
|
27
|
+
requires_paper: true
|
|
28
|
+
integrity_level: cas_plus_canary
|
|
29
|
+
snapshot_status: partial
|
|
30
|
+
support_level: advanced
|
|
31
|
+
time_band: 1-2d
|
|
32
|
+
cost_band: high
|
|
33
|
+
difficulty: hard
|
|
34
|
+
data_access: public
|
|
35
|
+
primary_outputs:
|
|
36
|
+
- tokens_per_second
|
|
37
|
+
- kernel_latency_us
|
|
38
|
+
- benchmark_logs
|
|
39
|
+
launch_profiles:
|
|
40
|
+
- id: notebook_inference
|
|
41
|
+
label: 笔记本推理
|
|
42
|
+
description: '运行捆绑的 Jupyter 笔记本(basic_example、full_example、hogwild_with_fast_kernels),使用共享 KV 缓存执行 2 智能体并行 LLM 推理。需要具有足够 VRAM 的 GPU 用于所选模型。输出生成轨迹和非正式吞吐量。
|
|
43
|
+
|
|
44
|
+
'
|
|
45
|
+
- id: kernel_benchmark
|
|
46
|
+
label: CUDA 内核基准测试
|
|
47
|
+
description: '通过 CMake + nvcc 从 inference_lib 构建 C++ 基准测试可执行文件,然后运行它来测量原始注意力内核延迟。为自定义分页注意力内核(带查询旋转)生成微秒级计时。将结果换算为 tokens_per_second 吞吐量时,必须对照端到端生成进行手动验证。
|
|
48
|
+
|
|
49
|
+
'
|
|
50
|
+
dataset_download:
|
|
51
|
+
primary_method: huggingface
|
|
52
|
+
sources:
|
|
53
|
+
- kind: huggingface
|
|
54
|
+
url: https://huggingface.co/models
|
|
55
|
+
access: public
|
|
56
|
+
note: '模型权重(如 Llama-3.2-3B、QwQ-32B、DeepSeek-R1)在推理时通过 HuggingFace transformers 下载。不需要单独下载数据集;基准测试在笔记本中定义的提示推理任务上运行。
|
|
57
|
+
|
|
58
|
+
'
|
|
59
|
+
notes:
|
|
60
|
+
- 不需要大型离线数据集。存储主要由模型权重决定(根据模型选择为 7–65 GB)。
|
|
61
|
+
- evals/ 目录包含 LIMO、LiveCodeBench 和 OlympiadBench 的评估脚本,但这些是辅助性的。
|
|
62
|
+
credential_requirements:
|
|
63
|
+
mode: none
|
|
64
|
+
items: []
|
|
65
|
+
notes:
|
|
66
|
+
- 对于 Llama-3.2 等门控模型可能需要 HuggingFace 令牌,但并非所有模型选择都需要。
|
|
67
|
+
resources:
|
|
68
|
+
minimum:
|
|
69
|
+
cpu_cores: 8
|
|
70
|
+
ram_gb: 32
|
|
71
|
+
disk_gb: 80
|
|
72
|
+
gpu_count: 1
|
|
73
|
+
gpu_vram_gb: 24
|
|
74
|
+
recommended:
|
|
75
|
+
cpu_cores: 16
|
|
76
|
+
ram_gb: 64
|
|
77
|
+
disk_gb: 150
|
|
78
|
+
gpu_count: 1
|
|
79
|
+
gpu_vram_gb: 48
|
|
80
|
+
environment:
|
|
81
|
+
python: '3.10'
|
|
82
|
+
cuda: '11.8'
|
|
83
|
+
pytorch: 2.6.0
|
|
84
|
+
key_packages:
|
|
85
|
+
- transformers==4.51.3
|
|
86
|
+
- numpy
|
|
87
|
+
- CLI11 (C++ 依赖,由 CMake 获取)
|
|
88
|
+
notes:
|
|
89
|
+
- 快速推理内核需要 nvcc 在 PATH 中(或设置 CUDACXX)。需要 CMake >= 3.22。
|
|
90
|
+
- 目标是 CUDA 架构 80、86、89(A100、L40、RTX 4090 类)。
|
|
91
|
+
- 内核专门针对 L40 和类似 GPU 进行了优化;其他架构上的性能可能有所不同。
|
|
92
|
+
- Colab 笔记本演示了使用 Llama-3.2-3B 和有限协作的最小路径。
|
|
93
|
+
- 在 inference_lib/ 中运行 pip install -e . 可构建绑定 Python 的 CUDA 扩展。
|
|
94
|
+
risk_flags:
|
|
95
|
+
- metric_not_verified_e2e
|
|
96
|
+
- requires_cuda_compilation
|
|
97
|
+
- model_download_at_runtime
|
|
98
|
+
risk_notes:
|
|
99
|
+
- '主要指标 tokens_per_second 通过 C++ 内核基准测试进行了路由支持,但在打包期间未执行端到端基准测试。在信任指标值之前需要运行时验证。
|
|
100
|
+
|
|
101
|
+
'
|
|
102
|
+
- '构建快速内核需要可用的 nvcc 工具链和兼容的 GPU 架构。在非标准 CUDA 设置上可能出现编译失败。
|
|
103
|
+
|
|
104
|
+
'
|
|
105
|
+
- '更大的推理模型(QwQ-32B、DeepSeek-R1)需要 48+ GB VRAM;最低 24 GB 规格仅支持较小的模型(如 Llama-3.2-3B),协作质量有限。
|
|
106
|
+
|
|
107
|
+
'
|
|
108
|
+
- 'evals/ 目录引用了外部评估套件(LIMO、LiveCodeBench、OlympiadBench),这些可能需要快照中未完全记录的额外设置。
|
|
109
|
+
|
|
110
|
+
'
|
|
111
|
+
recommended_when: '当您需要一个专注于并行推理吞吐量、并发 KV 缓存设计和自定义 CUDA 内核性能的 LLM 系统优化任务时使用此基准测试。适用于从事推理时并行性、注意力内核优化或在系统级别进行多智能体 LLM 协调的研究人员。
|
|
112
|
+
|
|
113
|
+
'
|
|
114
|
+
not_recommended_when: '如果您无法访问现代 CUDA GPU(Ampere 或更新架构),如果您需要以训练为导向的基准测试,或者如果您正在寻找具有自动评分的自包含准确性评估,请不要使用此基准测试。相关指标需要手动验证,内核构建增加了显著的设置复杂性。
|
|
115
|
+
|
|
116
|
+
'
|
|
117
|
+
paper:
|
|
118
|
+
title: 'Hogwild! Inference: Parallel LLM Generation via Concurrent Attention'
|
|
119
|
+
venue: arXiv preprint
|
|
120
|
+
year: 2025
|
|
121
|
+
url: https://arxiv.org/abs/2504.06261
|
|
122
|
+
download:
|
|
123
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.049_hogwildinference.zip
|
|
124
|
+
archive_type: zip
|
|
125
|
+
local_dir_name: paper-49-HogwildInference
|
|
126
|
+
provider: github_release
|
|
127
|
+
repo: ResearAI/DeepScientist
|
|
128
|
+
tag: aisb-v0.0.1
|
|
129
|
+
asset_name: aisb.t3.049_hogwildinference.zip
|
|
130
|
+
sha256: b5cc4e8d0a697683307a664b948af23324ca548c6ce7b8380035fe7410dabcdd
|
|
131
|
+
size_bytes: 226660
|
|
132
|
+
commercial:
|
|
133
|
+
annual_fee: null
|
|
134
|
+
display:
|
|
135
|
+
palette_seed: orange-slate-cache
|
|
136
|
+
art_style: concurrent-systems
|
|
137
|
+
accent_priority: high
|
|
138
|
+
image_path: ../image/049_aisb.t3.049_hogwildinference.jpg
|
|
@@ -0,0 +1,214 @@
|
|
|
1
|
+
id: aisb.t3.050_causalpfn
|
|
2
|
+
name: 'CausalPFN: Amortized Causal Effect Estimation via In-Context Learning'
|
|
3
|
+
version: 0.1.0
|
|
4
|
+
one_line: Transformer-based amortized causal effect estimation using PFN-style in-context
|
|
5
|
+
learning with calibrated uncertainty quantification.
|
|
6
|
+
task_description: 'CausalPFN is a transformer model that amortizes causal effect estimation
|
|
7
|
+
by training once on a large library of simulated data-generating processes (DGPs)
|
|
8
|
+
satisfying the ignorability assumption. Given a new observational dataset, it infers
|
|
9
|
+
causal effects out of the box via in-context learning without task-specific tuning,
|
|
10
|
+
fine-tuning, or hyperparameter optimization. The model estimates both conditional
|
|
11
|
+
average treatment effects (CATE) and average treatment effects (ATE), with a principled
|
|
12
|
+
uncertainty quantification framework producing finite-sample calibrated credible
|
|
13
|
+
intervals. Amortization shifts computational burden from inference to pre-training,
|
|
14
|
+
enabling fast forward-pass-only evaluation on new datasets.
|
|
15
|
+
|
|
16
|
+
'
|
|
17
|
+
task_mode: experiment_driven
|
|
18
|
+
requires_execution: true
|
|
19
|
+
requires_paper: true
|
|
20
|
+
integrity_level: cas_plus_canary
|
|
21
|
+
snapshot_status: external_eval_required
|
|
22
|
+
support_level: recovery
|
|
23
|
+
time_band: 2-8h
|
|
24
|
+
cost_band: medium
|
|
25
|
+
difficulty: medium
|
|
26
|
+
data_access: public
|
|
27
|
+
primary_outputs:
|
|
28
|
+
- ihdp_pehe
|
|
29
|
+
- ihdp_ate_rel_err
|
|
30
|
+
- causal_predictions
|
|
31
|
+
- bootstrap_report
|
|
32
|
+
launch_profiles:
|
|
33
|
+
- id: quick_eval
|
|
34
|
+
label: Quick Eval
|
|
35
|
+
description: Run CausalPFN evaluation on a single supported dataset (e.g., IHDP)
|
|
36
|
+
with default settings. Suitable for verifying installation and basic functionality.
|
|
37
|
+
- id: full_benchmark
|
|
38
|
+
label: Full Benchmark
|
|
39
|
+
description: Run the complete amortized causal-effect benchmark across IHDP, ACIC,
|
|
40
|
+
and Lalonde datasets with bootstrap ensemble aggregation and temperature scaling.
|
|
41
|
+
dataset_download:
|
|
42
|
+
primary_method: pypi
|
|
43
|
+
sources:
|
|
44
|
+
- name: PyPI
|
|
45
|
+
url: https://pypi.org/project/causalpfn/
|
|
46
|
+
archive_type: null
|
|
47
|
+
local_dir_name: null
|
|
48
|
+
- name: HuggingFace Hub
|
|
49
|
+
url: https://huggingface.co/vdblm/causalpfn
|
|
50
|
+
archive_type: null
|
|
51
|
+
local_dir_name: null
|
|
52
|
+
notes:
|
|
53
|
+
- Model weights are downloaded from HuggingFace Hub at runtime.
|
|
54
|
+
- 'Install via: pip install causalpfn'
|
|
55
|
+
- 'Optional dev dependencies: pip install causalpfn[dev]'
|
|
56
|
+
credential_requirements:
|
|
57
|
+
mode: none
|
|
58
|
+
items: []
|
|
59
|
+
notes:
|
|
60
|
+
- HuggingFace Hub access requires network connectivity for model download.
|
|
61
|
+
- Optional HF_TOKEN for rate-limited or private model access.
|
|
62
|
+
resources:
|
|
63
|
+
minimum:
|
|
64
|
+
cpu_cores: 8
|
|
65
|
+
ram_gb: 32
|
|
66
|
+
disk_gb: 50
|
|
67
|
+
gpu_count: 0
|
|
68
|
+
gpu_vram_gb: 0
|
|
69
|
+
notes: CPU-only execution is supported via causalpfn Python API with torch.device('cpu').
|
|
70
|
+
recommended:
|
|
71
|
+
cpu_cores: 16
|
|
72
|
+
ram_gb: 64
|
|
73
|
+
disk_gb: 100
|
|
74
|
+
gpu_count: 1
|
|
75
|
+
gpu_vram_gb: 16
|
|
76
|
+
notes: GPU acceleration recommended for faster inference on large datasets.
|
|
77
|
+
environment:
|
|
78
|
+
python: '3.10'
|
|
79
|
+
cuda: '11.8'
|
|
80
|
+
pytorch: '2.3'
|
|
81
|
+
flash_attn: null
|
|
82
|
+
key_packages:
|
|
83
|
+
- causalpfn>=1.0.0
|
|
84
|
+
- torch>=2.3.0
|
|
85
|
+
- numpy>=1.24.0
|
|
86
|
+
- scikit-learn>=1.3.0
|
|
87
|
+
- faiss-cpu==1.9.0
|
|
88
|
+
- huggingface_hub>=0.20.0
|
|
89
|
+
- tqdm>=4.65.0
|
|
90
|
+
notes:
|
|
91
|
+
- CPU-only execution is viable for minimum resource route.
|
|
92
|
+
- GPU acceleration available via CUDA for inference speedup.
|
|
93
|
+
- Full dependency set available in bundled requirements.txt and pyproject.toml.
|
|
94
|
+
risk_flags:
|
|
95
|
+
- external_model_download
|
|
96
|
+
- bootstrap_variance
|
|
97
|
+
risk_notes:
|
|
98
|
+
- Model weights are fetched from HuggingFace Hub at runtime; ensure network access.
|
|
99
|
+
- Bootstrap ensemble introduces variance across seeds; use provided bootstrap_report
|
|
100
|
+
for diagnostics.
|
|
101
|
+
recommended_when: 'Use this benchmark for causal inference tasks requiring tractable
|
|
102
|
+
local runs, clear effect-estimation metrics (PEHE, ATE relative error), and uncertainty
|
|
103
|
+
quantification. Ideal for uplift modeling, treatment effect estimation from observational
|
|
104
|
+
data, and comparison with specialized causal estimators. Recommended when you need
|
|
105
|
+
a ready-to-use estimator without manual tuning.
|
|
106
|
+
|
|
107
|
+
'
|
|
108
|
+
not_recommended_when: 'Do not use this benchmark if you need a giant multimodal benchmark,
|
|
109
|
+
raw language generation tasks, or image/video understanding. Not suitable when treatment
|
|
110
|
+
assignment is not ignorable or when unobserved confounding is present in the data.
|
|
111
|
+
|
|
112
|
+
'
|
|
113
|
+
paper:
|
|
114
|
+
title: 'CausalPFN: Amortized Causal Effect Estimation via In-Context Learning'
|
|
115
|
+
venue: NeurIPS 2025
|
|
116
|
+
year: 2025
|
|
117
|
+
url: https://arxiv.org/abs/2506.07918
|
|
118
|
+
authors:
|
|
119
|
+
- Vahid Balazadeh
|
|
120
|
+
- Hamidreza Kamkari
|
|
121
|
+
- Valentin Thomas
|
|
122
|
+
- Benson Li
|
|
123
|
+
- Junwei Ma
|
|
124
|
+
- Jesse C. Cresswell
|
|
125
|
+
- Rahul G. Krishnan
|
|
126
|
+
institutions:
|
|
127
|
+
- University of Toronto
|
|
128
|
+
- Vector Institute
|
|
129
|
+
- Layer 6 AI
|
|
130
|
+
display:
|
|
131
|
+
palette_seed: mint-charcoal-causal
|
|
132
|
+
art_style: causal-analytics
|
|
133
|
+
accent_priority: medium
|
|
134
|
+
image_path: ../image/050_aisb.t3.050_causalpfn.jpg
|
|
135
|
+
capability_tags:
|
|
136
|
+
- causal_inference
|
|
137
|
+
- in_context_learning
|
|
138
|
+
- tabular_ml
|
|
139
|
+
- uncertainty_estimation
|
|
140
|
+
- uplift_modeling
|
|
141
|
+
- treatment_effect_estimation
|
|
142
|
+
aisb_direction: T3
|
|
143
|
+
track_fit:
|
|
144
|
+
- paper_track
|
|
145
|
+
- benchmark_track
|
|
146
|
+
code_anchors:
|
|
147
|
+
evaluation:
|
|
148
|
+
- path: eval.py
|
|
149
|
+
description: Main evaluation script for IHDP benchmark with multi-seed bootstrap
|
|
150
|
+
ensemble
|
|
151
|
+
- path: src/causalpfn/evaluation.py
|
|
152
|
+
description: Core evaluation metrics including PEHE and calibration curve calculations
|
|
153
|
+
estimators:
|
|
154
|
+
- path: src/causalpfn/causal_estimator.py
|
|
155
|
+
description: CATEEstimator and ATEEstimator classes with confidence interval estimation
|
|
156
|
+
benchmarks:
|
|
157
|
+
- path: benchmarks/ihdp.py
|
|
158
|
+
description: IHDP benchmark implementation
|
|
159
|
+
- path: benchmarks/acic2016.py
|
|
160
|
+
description: ACIC 2016 benchmark implementation
|
|
161
|
+
- path: benchmarks/lalonde.py
|
|
162
|
+
description: Lalonde benchmark implementation
|
|
163
|
+
- path: benchmarks/hillstrom.py
|
|
164
|
+
description: Hillstrom uplift modeling benchmark
|
|
165
|
+
metric_contract:
|
|
166
|
+
ihdp_pehe:
|
|
167
|
+
origin_path: eval.py
|
|
168
|
+
source_ref: calculate_pehe
|
|
169
|
+
evaluation_protocol:
|
|
170
|
+
code_paths:
|
|
171
|
+
- eval.py
|
|
172
|
+
- src/causalpfn/evaluation.py
|
|
173
|
+
status: code_backed
|
|
174
|
+
provisional: false
|
|
175
|
+
ihdp_ate_rel_err:
|
|
176
|
+
origin_path: eval.py
|
|
177
|
+
source_ref: calculate_ate_rel_error
|
|
178
|
+
evaluation_protocol:
|
|
179
|
+
code_paths:
|
|
180
|
+
- eval.py
|
|
181
|
+
- src/causalpfn/evaluation.py
|
|
182
|
+
status: code_backed
|
|
183
|
+
provisional: false
|
|
184
|
+
evaluation_details:
|
|
185
|
+
bootstrap_ensemble:
|
|
186
|
+
seeds: 2
|
|
187
|
+
subsamples: 3
|
|
188
|
+
subsample_fraction: 0.92
|
|
189
|
+
temperature_values:
|
|
190
|
+
- 0.3
|
|
191
|
+
- 0.5
|
|
192
|
+
- 0.7
|
|
193
|
+
- 0.9
|
|
194
|
+
- 2.0
|
|
195
|
+
- 4.0
|
|
196
|
+
- 8.0
|
|
197
|
+
total_predictions_per_realization: 42
|
|
198
|
+
s_learner:
|
|
199
|
+
regressor: Ridge
|
|
200
|
+
alpha: 0.001
|
|
201
|
+
mu_features: true
|
|
202
|
+
nearest_neighbors: 85
|
|
203
|
+
commercial:
|
|
204
|
+
annual_fee: null
|
|
205
|
+
notes: Apache 2.0 License
|
|
206
|
+
download:
|
|
207
|
+
provider: github_release
|
|
208
|
+
repo: ResearAI/DeepScientist
|
|
209
|
+
tag: aisb-v0.0.1
|
|
210
|
+
asset_name: aisb.t3.050_causalpfn.zip
|
|
211
|
+
url: https://github.com/ResearAI/DeepScientist/releases/download/aisb-v0.0.1/aisb.t3.050_causalpfn.zip
|
|
212
|
+
archive_type: zip
|
|
213
|
+
sha256: d7ba4ba97509f90f00b4f9953b10d76fc5bc56ea116a7141a74a11990ee99a99
|
|
214
|
+
size_bytes: 48053403
|