medsci-skills 4.10.0 → 5.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (103) hide show
  1. package/README.md +26 -13
  2. package/metadata/distribution_files.json +401 -26
  3. package/metadata/distribution_manifest.json +7 -1
  4. package/metadata/skills_catalog.json +67 -1
  5. package/package.json +1 -1
  6. package/skills/architecture-zoo/SKILL.md +100 -0
  7. package/skills/architecture-zoo/references/classification.md +102 -0
  8. package/skills/architecture-zoo/references/detection.md +68 -0
  9. package/skills/architecture-zoo/references/foundation_models.md +87 -0
  10. package/skills/architecture-zoo/references/index.md +55 -0
  11. package/skills/architecture-zoo/references/segmentation.md +110 -0
  12. package/skills/architecture-zoo/references/synthesis.md +71 -0
  13. package/skills/architecture-zoo/skill.yml +36 -0
  14. package/skills/check-reporting/references/appraisal_tools/METRICS_RELOADED.md +36 -0
  15. package/skills/find-journal/POLICY.md +9 -0
  16. package/skills/find-journal/SKILL.md +147 -13
  17. package/skills/find-journal/references/acceptance_signals_schema.md +126 -0
  18. package/skills/find-journal/references/journal_profiles/AJR.md +8 -0
  19. package/skills/find-journal/references/journal_profiles/Clinical_and_Molecular_Hepatology.md +2 -2
  20. package/skills/find-journal/references/journal_profiles/European_Radiology.md +8 -0
  21. package/skills/find-journal/references/journal_profiles/Investigative_Radiology.md +8 -0
  22. package/skills/find-journal/references/journal_profiles/KJR.md +8 -0
  23. package/skills/find-journal/references/journal_profiles/RYAI.md +8 -0
  24. package/skills/find-journal/scripts/acceptance_readiness_challenge/expected/report_ceiling.txt +18 -0
  25. package/skills/find-journal/scripts/acceptance_readiness_challenge/expected/report_clean.txt +10 -0
  26. package/skills/find-journal/scripts/acceptance_readiness_challenge/fixture_ceiling/manuscript.md +16 -0
  27. package/skills/find-journal/scripts/acceptance_readiness_challenge/fixture_clean/manuscript.md +15 -0
  28. package/skills/find-journal/scripts/acceptance_readiness_challenge/problem.md +38 -0
  29. package/skills/find-journal/scripts/acceptance_readiness_challenge/verify.sh +28 -0
  30. package/skills/find-journal/scripts/assess_acceptance_readiness.py +235 -0
  31. package/skills/find-journal/skill.yml +5 -1
  32. package/skills/mllm-eval/SKILL.md +108 -0
  33. package/skills/mllm-eval/scripts/check_mllm_eval_completeness.py +184 -0
  34. package/skills/mllm-eval/scripts/mllm_eval_completeness_challenge/fixture/plan_bad.md +3 -0
  35. package/skills/mllm-eval/scripts/mllm_eval_completeness_challenge/fixture/plan_good.md +9 -0
  36. package/skills/mllm-eval/scripts/mllm_eval_completeness_challenge/problem.md +29 -0
  37. package/skills/mllm-eval/scripts/mllm_eval_completeness_challenge/verify.sh +25 -0
  38. package/skills/mllm-eval/skill.yml +44 -0
  39. package/skills/mllm-eval/tests/test_mllm_eval_completeness.sh +49 -0
  40. package/skills/model-card/SKILL.md +103 -0
  41. package/skills/model-card/references/datasheet_template.md +38 -0
  42. package/skills/model-card/references/metric_dimensions.md +32 -0
  43. package/skills/model-card/references/model_card_template.md +62 -0
  44. package/skills/model-card/scripts/check_model_card_complete.py +202 -0
  45. package/skills/model-card/scripts/check_model_card_complete_challenge/fixture/complete/DATASHEET.md +31 -0
  46. package/skills/model-card/scripts/check_model_card_complete_challenge/fixture/complete/MODEL_CARD.md +48 -0
  47. package/skills/model-card/scripts/check_model_card_complete_challenge/fixture/incomplete/MODEL_CARD.md +28 -0
  48. package/skills/model-card/scripts/check_model_card_complete_challenge/problem.md +31 -0
  49. package/skills/model-card/scripts/check_model_card_complete_challenge/verify.sh +34 -0
  50. package/skills/model-card/skill.yml +41 -0
  51. package/skills/model-card/tests/test_model_card_complete.sh +75 -0
  52. package/skills/model-evaluation/SKILL.md +88 -0
  53. package/skills/model-evaluation/references/metric_guide.md +44 -0
  54. package/skills/model-evaluation/scripts/check_metric_reporting.py +196 -0
  55. package/skills/model-evaluation/scripts/metric_reporting_challenge/fixture/clf_bad.md +2 -0
  56. package/skills/model-evaluation/scripts/metric_reporting_challenge/fixture/clf_good.md +3 -0
  57. package/skills/model-evaluation/scripts/metric_reporting_challenge/fixture/seg_bad.md +2 -0
  58. package/skills/model-evaluation/scripts/metric_reporting_challenge/fixture/seg_good.md +3 -0
  59. package/skills/model-evaluation/scripts/metric_reporting_challenge/problem.md +27 -0
  60. package/skills/model-evaluation/scripts/metric_reporting_challenge/verify.sh +29 -0
  61. package/skills/model-evaluation/skill.yml +43 -0
  62. package/skills/model-evaluation/tests/test_metric_reporting.sh +47 -0
  63. package/skills/model-scaffold/SKILL.md +126 -0
  64. package/skills/model-scaffold/references/training_guide.md +46 -0
  65. package/skills/model-scaffold/scripts/check_training_hygiene.py +254 -0
  66. package/skills/model-scaffold/scripts/scaffold.py +1122 -0
  67. package/skills/model-scaffold/scripts/scaffold_challenge/expected/split_assignment.csv +13 -0
  68. package/skills/model-scaffold/scripts/scaffold_challenge/fixture/manifest.csv +19 -0
  69. package/skills/model-scaffold/scripts/scaffold_challenge/problem.md +44 -0
  70. package/skills/model-scaffold/scripts/scaffold_challenge/verify.sh +105 -0
  71. package/skills/model-scaffold/skill.yml +46 -0
  72. package/skills/model-scaffold/tests/fixtures/bad_evaluate.py +10 -0
  73. package/skills/model-scaffold/tests/fixtures/bad_train.py +9 -0
  74. package/skills/model-scaffold/tests/test_training_hygiene.sh +82 -0
  75. package/skills/model-validation/SKILL.md +146 -0
  76. package/skills/model-validation/scripts/check_split_leakage.py +269 -0
  77. package/skills/model-validation/scripts/check_split_leakage_challenge/expected/clean.txt +9 -0
  78. package/skills/model-validation/scripts/check_split_leakage_challenge/expected/leak.txt +9 -0
  79. package/skills/model-validation/scripts/check_split_leakage_challenge/fixture/split_seed.txt +1 -0
  80. package/skills/model-validation/scripts/check_split_leakage_challenge/fixture/splits_clean.csv +14 -0
  81. package/skills/model-validation/scripts/check_split_leakage_challenge/fixture/splits_leak.csv +15 -0
  82. package/skills/model-validation/scripts/check_split_leakage_challenge/problem.md +39 -0
  83. package/skills/model-validation/scripts/check_split_leakage_challenge/verify.sh +37 -0
  84. package/skills/model-validation/skill.yml +43 -0
  85. package/skills/model-validation/tests/fixtures/leak_subject.csv +6 -0
  86. package/skills/model-validation/tests/fixtures/noseed_clean.csv +5 -0
  87. package/skills/model-validation/tests/fixtures/single_partition.csv +4 -0
  88. package/skills/model-validation/tests/test_split_leakage.sh +78 -0
  89. package/skills/peer-review/SKILL.md +12 -0
  90. package/skills/peer-review/references/domain-probes/mllm_evaluation.md +102 -0
  91. package/skills/peer-review/references/domain-probes/model_development.md +52 -0
  92. package/skills/present-paper/SKILL.md +80 -15
  93. package/skills/present-paper/references/presentation_design_guidelines.md +133 -0
  94. package/skills/present-paper/references/slide_visual_styles/CATALOG.md +43 -0
  95. package/skills/present-paper/references/slide_visual_styles/clinical_blue.md +70 -0
  96. package/skills/present-paper/references/slide_visual_styles/dark_modern.md +66 -0
  97. package/skills/present-paper/references/slide_visual_styles/editorial_mono.md +66 -0
  98. package/skills/present-paper/references/slide_visual_styles/institutional_brand.md +80 -0
  99. package/skills/present-paper/scripts/inspect_pptx_template.py +135 -0
  100. package/skills/self-review/SKILL.md +2 -0
  101. package/skills/self-review/references/domain-probes/mllm_evaluation.md +102 -0
  102. package/skills/self-review/references/domain-probes/model_development.md +52 -0
  103. package/skills/write-paper/references/journal_profiles/Clinical_and_Molecular_Hepatology.md +2 -1
package/README.md CHANGED
@@ -2,14 +2,14 @@
2
2
 
3
3
  # MedSci Skills
4
4
 
5
- **45 skills that actually work.** Built by a physician-researcher, tested on real publications.
5
+ **51 skills that actually work.** Built by a physician-researcher, tested on real publications.
6
6
 
7
- *MedSci Skills is a submission-grade clinical manuscript workflow, not a generic biomedical skill catalog. Its moat is the compliance layer — 38 reporting guidelines and risk-of-bias tools, reference/citation verification, and deterministic integrity gates, before peer review sees the manuscript. It competes on clinical submission reliability, not skill count.*
7
+ *MedSci Skills is an end-to-end research tool for physician and medical-engineering researchers — design → scaffold → validate → publish — for the clinical manuscript and the medical-AI model behind it. Its moat is the compliance layer — 38 reporting guidelines and risk-of-bias tools, reference/citation verification, and deterministic integrity gates before peer review — now extended by a model-engineering lane that scaffolds reproducible, leakage-safe training repos and audits model validation. Clinical AI model research engineering is in scope; a general AI-scientist platform is not. It competes on clinical submission reliability, not skill count.*
8
8
 
9
9
  [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](LICENSE)
10
10
  [![Release](https://img.shields.io/github/v/release/Aperivue/medsci-skills?style=flat-square&color=blue)](https://github.com/Aperivue/medsci-skills/releases/latest)
11
11
  [![CI](https://img.shields.io/github/actions/workflow/status/Aperivue/medsci-skills/validate.yml?branch=main&style=flat-square&label=CI)](https://github.com/Aperivue/medsci-skills/actions/workflows/validate.yml)
12
- ![Skills](https://img.shields.io/badge/Skills-45-brightgreen?style=flat-square)
12
+ ![Skills](https://img.shields.io/badge/Skills-51-brightgreen?style=flat-square)
13
13
  [![npm](https://img.shields.io/npm/v/medsci-skills?style=flat-square&label=npm&color=cb3837)](https://www.npmjs.com/package/medsci-skills)
14
14
  [![Watch the 2-min intro](https://img.shields.io/badge/▶_Watch-2--min_intro-FF0000?style=flat-square&logo=youtube&logoColor=white)](https://youtu.be/MclQ_RIofpE)
15
15
  [![good first issues](https://img.shields.io/github/issues/Aperivue/medsci-skills/good%20first%20issue?style=flat-square&label=good%20first%20issues&color=7057ff)](https://github.com/Aperivue/medsci-skills/contribute)
@@ -42,14 +42,20 @@
42
42
  ## What is MedSci Skills?
43
43
 
44
44
  MedSci Skills is an open-source Claude Code skill collection for **clinical
45
- manuscript preparation**. It helps physician-researchers and biomedical
46
- investigators move from literature search, study design, statistics, and figures to
47
- reporting-guideline compliance, citation/reference auditing, numerical-consistency
48
- checks, and response-to-reviewer workflows — combining agentic writing with
49
- **deterministic integrity gates** for submission-grade biomedical research. It is
50
- **not** a diagnostic tool, an autonomous author, or a general AI-scientist platform;
51
- every output requires human-expert verification. New here? See the
52
- [3 workflows below](#start-here-3-workflows), the [FAQ](docs/faq.md), and the
45
+ research — the manuscript and the medical-AI model alike**. It helps
46
+ physician-researchers and biomedical/medical-engineering investigators move from
47
+ literature search, study design, statistics, and figures to reporting-guideline
48
+ compliance, citation/reference auditing, numerical-consistency checks, and
49
+ response-to-reviewer workflows — combining agentic writing with **deterministic
50
+ integrity gates** for submission-grade biomedical research. As of **v5.0** it adds a
51
+ **model-engineering lane**: choose a paper-grounded architecture, scaffold a
52
+ reproducible, leakage-safe PyTorch training repo, and validate, document, and
53
+ evaluate a medical-imaging or LLM/MLLM model so the work reaches a paper — it
54
+ **integrates** MONAI / nnU-Net, never reimplements them. Clinical AI model research
55
+ engineering is in scope; it is **not** a diagnostic tool, an autonomous author, or a
56
+ general AI-scientist platform, and every output requires human-expert verification.
57
+ New here? See the [3 workflows below](#start-here-3-workflows), the
58
+ [FAQ](docs/faq.md), and the
53
59
  [scope boundary](ROADMAP.md#not-planned--explicitly-out-of-scope).
54
60
 
55
61
  ---
@@ -82,17 +88,18 @@ Restart Claude Code, then start with **`/orchestrate`** — it classifies your r
82
88
 
83
89
  ### Install as a Claude Code plugin
84
90
 
85
- Prefer plugins? One line adds the marketplace; `/plugin` then lets you browse eight category plugins and enable the ones you want:
91
+ Prefer plugins? One line adds the marketplace; `/plugin` then lets you browse nine category plugins and enable the ones you want:
86
92
 
87
93
  ```text
88
94
  /plugin marketplace add Aperivue/medsci-skills
89
- /plugin # browse eight category plugins; enable the ones you want
95
+ /plugin # browse nine category plugins; enable the ones you want
90
96
  ```
91
97
 
92
98
  | Plugin | Covers |
93
99
  |--------|--------|
94
100
  | `medsci-literature` | Literature search, full-text retrieval, Zotero sync, reference-integrity audits |
95
101
  | `medsci-data` | Study design, variable operationalization, sample size, data cleaning, de-identification, codebooks, dataset versioning |
102
+ | `medsci-modeling` | Architecture selection, reproducible model-scaffold repos, model-validation audits, Model Card/Datasheet, model & LLM/MLLM evaluation |
96
103
  | `medsci-analysis` | Statistics, figures, batch/cross-national/replication analysis, meta-analysis |
97
104
  | `medsci-writing` | IMRAD & protocol drafting, AI-pattern removal, AI-search optimization, reviewer responses |
98
105
  | `medsci-review` | Self-review, peer review, reporting-guideline compliance |
@@ -451,6 +458,12 @@ ma-scout -> search-lit -> fulltext-retrieval -> design-study ──> write-proto
451
458
  | **make-figures** | Publication-ready figures and visual abstracts: ROC curves, forest plots, PRISMA/CONSORT/STARD flow diagrams, Kaplan-Meier curves, Bland-Altman plots, confusion matrices, and journal-specific visual/graphical abstracts (python-pptx template-based). Communication-first design principles (Nat Hum Behav 2026 — key message, audience, cognitive load, figure-vs-table decision) and five flow-diagram production lessons (official-template fidelity, VML fallback PDF export, docx XML escape, sequential placeholder mapping, version freeze); critic rubric Section G adds 5 communication-first checks. `--study-type` auto-generates the full required figure set; structured `_figure_manifest.md` output for downstream pipeline consumption; D2 enforced as default for flow diagrams. |
452
459
  | **design-study** | Study design review: identifies analysis unit, cohort logic, data leakage risks, comparator design, validation strategy, and reporting guideline fit. |
453
460
  | **design-ai-benchmarking** | Design and validity review for benchmarking AI system(s) against a human-expert panel: evaluation-question and arm definition, decoupled multi-dimensional rubrics with anchors, planted calibration probes (positive-control / known-bad / instability / mechanism-contradiction), reviewer-panel construction with per-reviewer randomization, inter-rater reliability targets with separate control-item reliability, LLM-as-judge vs human-as-judge adjudication, construct-independence guards, and a structured JSON rating-export schema. Locks the rubric before data collection. |
461
+ | **model-validation** | Design or audit the clinical-validation study for an engineer-built medical-imaging model (segmentation / classification / detection): patient-level split disjointness and the data-leakage taxonomy, tuning-on-test, internal vs genuine external validation, comparator design, single-run vs multi-seed variance, task-correct metric selection (Metrics Reloaded), test-set sizing, and CLAIM 2024 / TRIPOD+AI / STARD-AI reporting fit. Ships a deterministic split-leakage gate that proves patient disjointness by set arithmetic on the emitted split table. Integrates with MONAI / nnU-Net — does not replace them. |
462
+ | **model-scaffold** | Generate a reproducible, runnable PyTorch training repo for a medical-imaging task — segmentation (U-Net), classification, detection, image-to-image synthesis, or self-supervised pretraining — the missing middle link between choosing an architecture and validating a trained model. Emits a patient-level seed-locked split as an auditable artifact, a task-appropriate model, train/evaluate scripts that seed every RNG and infer under eval mode, a config, requirements, a reproducibility record, and a Methods stub with VERIFY placeholders (no fabricated numbers). Reproducibility holds by construction; ships a `check_training_hygiene` AST gate + a network-free build→validate challenge. Integrates with MONAI / nnU-Net / TorchIO / timm / torchvision — does not reimplement them. |
463
+ | **architecture-zoo** | "Which architecture for which research question" decision tool: maps task (classification / segmentation / detection / transfer), modality, data scale, and class imbalance to a paper-grounded architecture shortlist. Curates the foundational curriculum (ResNet / DenseNet / EfficientNet / ViT / Swin; U-Net / 3-D U-Net / Attention & Residual U-Net / nnU-Net / Mask R-CNN; SAM/MedSAM / TotalSegmentator / BiomedCLIP / DINO / MAE / SimCLR) — each with core idea, when-to-use, medical-imaging use, reference implementation, validation setup, and the matching model-scaffold template. Advisory; teaches archetypes, not a live SOTA leaderboard. |
464
+ | **model-card** | Generate the documentation an engineer-built medical-imaging model must carry — a Model Card (Mitchell et al. 2019), a Datasheet for its dataset (Gebru et al. 2021), and a METRIC-informed data-quality pass — filled from user-supplied facts (never fabricated), then verify every required section is present and non-empty with a deterministic completeness gate (`check_model_card_complete`). Model Card / Datasheet are documentation standards vendored as templates, not counted reporting checklists. |
465
+ | **model-evaluation** | Compute and report task-correct held-out metrics for a trained medical-imaging model — segmentation (Dice + a boundary metric HD95/NSD, per structure), classification (AUROC + AUPRC + sensitivity/specificity with bootstrap CIs at the deployment prevalence), or detection (FROC/mAP with a stated IoU criterion) — plus calibration and subgroup slices. Emits a per-case table for analyze-stats and gates the metric choice against Metrics Reloaded / CLAIM 2024 (`check_metric_reporting`). Numbers come only from executed code. |
466
+ | **mllm-eval** | Model-agnostic evaluation harness (closed API or open weights) for an LLM/MLLM on a clinical task — radiology report generation, VQA, clinical text extraction — covering the adjudicated reference standard, clinical-efficacy metrics (RadGraph-F1 / CheXbert-F1 beyond BLEU/ROUGE), faithfulness/hallucination, pretraining-contamination, prompt sensitivity, and a reader study; gates the plan with `check_mllm_eval_completeness` and routes the reviewer audit to the MLLM probe. |
454
467
  | **intake-project** | Classifies new research projects, summarizes current state, identifies missing inputs, and recommends next steps. |
455
468
  | **grant-builder** | Structures grant proposals: significance, innovation, approach, milestones, and consortium roles. |
456
469
  | **present-paper** | Academic presentation preparation: paper analysis, supporting research, speaker scripts, slide note injection, and Q&A prep. |
@@ -396,6 +396,46 @@
396
396
  "size": 1421,
397
397
  "sha256": "912c52e9289a7ccb014aa8a18105b6dfe04c2cc040e970c73b4bbc6b2d8a8a39"
398
398
  },
399
+ {
400
+ "path": "skills/architecture-zoo/SKILL.md",
401
+ "size": 5712,
402
+ "sha256": "ffb9a52d417f309a3b22c8d0f74e6700b67350c0d7a2a2e2c785f0cb4cb066bc"
403
+ },
404
+ {
405
+ "path": "skills/architecture-zoo/references/classification.md",
406
+ "size": 5986,
407
+ "sha256": "035e0fddaccb0e19e23ffd7756b075154f847ee20f9a512cd2a010c0db4210fa"
408
+ },
409
+ {
410
+ "path": "skills/architecture-zoo/references/detection.md",
411
+ "size": 3917,
412
+ "sha256": "60549b53a87dcb149c442498695321e94c28f0c8853316dda995a2dd730dfeec"
413
+ },
414
+ {
415
+ "path": "skills/architecture-zoo/references/foundation_models.md",
416
+ "size": 5267,
417
+ "sha256": "495453b025f1cb13d5ba0bac9be6d3b0d63dd958ea48d2b9e55bc222e9c26786"
418
+ },
419
+ {
420
+ "path": "skills/architecture-zoo/references/index.md",
421
+ "size": 4024,
422
+ "sha256": "d2360eb8635347f0f22be0b0e337a540db865aafdc12678455cf32bc49fd9d3d"
423
+ },
424
+ {
425
+ "path": "skills/architecture-zoo/references/segmentation.md",
426
+ "size": 6508,
427
+ "sha256": "17618fe3d6884cf89b034ededcd69e081a65d7bfd473495eb2ab1fb5d8b15d8b"
428
+ },
429
+ {
430
+ "path": "skills/architecture-zoo/references/synthesis.md",
431
+ "size": 3973,
432
+ "sha256": "b7fec1a55a7b9e2f8eea6979d7bfbda1fc03664aeec0cc89daac8c8f9bdfb8bc"
433
+ },
434
+ {
435
+ "path": "skills/architecture-zoo/skill.yml",
436
+ "size": 2836,
437
+ "sha256": "7d7c727a9fc75383e775feac14faf1c4caad90307ed8ca20859ef499ac17deb0"
438
+ },
399
439
  {
400
440
  "path": "skills/author-strategy/SKILL.md",
401
441
  "size": 9209,
@@ -506,6 +546,11 @@
506
546
  "size": 4373,
507
547
  "sha256": "ee59d959b91c831d34e04853a83a969bb6315e49f692baa904ab8805b8f17147"
508
548
  },
549
+ {
550
+ "path": "skills/check-reporting/references/appraisal_tools/METRICS_RELOADED.md",
551
+ "size": 2384,
552
+ "sha256": "e06267be7ffa5b5e3f52de387b745bf2676f016c29b02a5872d38c68ddf762ec"
553
+ },
509
554
  {
510
555
  "path": "skills/check-reporting/references/checklists/AMSTAR2.md",
511
556
  "size": 4566,
@@ -1023,13 +1068,18 @@
1023
1068
  },
1024
1069
  {
1025
1070
  "path": "skills/find-journal/POLICY.md",
1026
- "size": 4486,
1027
- "sha256": "02de377328f457c57c5edbade8bae40e12c51b4c6ff8ab6293b330c482187ce7"
1071
+ "size": 5255,
1072
+ "sha256": "c2b61b5830844fa3eebe333dc4864acb4d085097e81ba2dbc1ef72dd65bebee3"
1028
1073
  },
1029
1074
  {
1030
1075
  "path": "skills/find-journal/SKILL.md",
1031
- "size": 14455,
1032
- "sha256": "48a95f5ee639e59f00241608b23b3e652395bffaa63a6bccba295e5b3d5a49d6"
1076
+ "size": 22072,
1077
+ "sha256": "45074f6499896700bff0eb20bd91c4076b143bcd39521d56559239edaa8b24d8"
1078
+ },
1079
+ {
1080
+ "path": "skills/find-journal/references/acceptance_signals_schema.md",
1081
+ "size": 6869,
1082
+ "sha256": "620ba1c55272908a16125ba69074491df5246d6cf9afa14e6b08a08e8dc4e866"
1033
1083
  },
1034
1084
  {
1035
1085
  "path": "skills/find-journal/references/journal_profiles/AJNR.md",
@@ -1038,8 +1088,8 @@
1038
1088
  },
1039
1089
  {
1040
1090
  "path": "skills/find-journal/references/journal_profiles/AJR.md",
1041
- "size": 1417,
1042
- "sha256": "ae26a8ea72672a973977a01f7e7a8cdbdc98b5dbcd2a7bc4605bb6eaee1a87fe"
1091
+ "size": 2075,
1092
+ "sha256": "9d9a5ee7b3b2287a6deae8fc06d54dd60b26afa843f5830f7bb5fb2e2ac633f7"
1043
1093
  },
1044
1094
  {
1045
1095
  "path": "skills/find-journal/references/journal_profiles/Abdominal_Radiology.md",
@@ -1098,8 +1148,8 @@
1098
1148
  },
1099
1149
  {
1100
1150
  "path": "skills/find-journal/references/journal_profiles/Clinical_and_Molecular_Hepatology.md",
1101
- "size": 2151,
1102
- "sha256": "7b343dd7628ec9c6efcd4c9afcb66ca35846d48af20c62e58038c437f0405a0a"
1151
+ "size": 2391,
1152
+ "sha256": "7d923a09bc543fe49db28b9b79714958522e2fe1781d60c6f22dc1efcd3ba650"
1103
1153
  },
1104
1154
  {
1105
1155
  "path": "skills/find-journal/references/journal_profiles/Cureus.md",
@@ -1128,8 +1178,8 @@
1128
1178
  },
1129
1179
  {
1130
1180
  "path": "skills/find-journal/references/journal_profiles/European_Radiology.md",
1131
- "size": 1640,
1132
- "sha256": "b71a9fe293c985c47f674459b4a613083749bc8d246d062e2c3afddc988e349c"
1181
+ "size": 2350,
1182
+ "sha256": "fa50a9a9d6012b8c6b75d81a69b950dfbe7db29775c8112bf5fe68d6d5655dfa"
1133
1183
  },
1134
1184
  {
1135
1185
  "path": "skills/find-journal/references/journal_profiles/Hepatology_Communications.md",
@@ -1158,8 +1208,8 @@
1158
1208
  },
1159
1209
  {
1160
1210
  "path": "skills/find-journal/references/journal_profiles/Investigative_Radiology.md",
1161
- "size": 1480,
1162
- "sha256": "ab740ec46a98b92fc243d4770b2a4f6ed400ea5a1f86e0fdffc121cdb2c98fa9"
1211
+ "size": 2118,
1212
+ "sha256": "c218b4e764a070a3297802076c1e6c68e514160cc1efa038552cc271b01af9ce"
1163
1213
  },
1164
1214
  {
1165
1215
  "path": "skills/find-journal/references/journal_profiles/JACC_Advances.md",
@@ -1248,8 +1298,8 @@
1248
1298
  },
1249
1299
  {
1250
1300
  "path": "skills/find-journal/references/journal_profiles/KJR.md",
1251
- "size": 3036,
1252
- "sha256": "a0814e6d62288389db7528b73a25db870ab91635dc4b946fb0c8bf8af47150a3"
1301
+ "size": 4061,
1302
+ "sha256": "0849de001a47038b8bfc92b337285372c80ccf4861162cae876295d82ea4f1c8"
1253
1303
  },
1254
1304
  {
1255
1305
  "path": "skills/find-journal/references/journal_profiles/Korean_Circulation_Journal.md",
@@ -1348,8 +1398,8 @@
1348
1398
  },
1349
1399
  {
1350
1400
  "path": "skills/find-journal/references/journal_profiles/RYAI.md",
1351
- "size": 1601,
1352
- "sha256": "1a6a387ed715a559bb0a7fd535b76ecb9334ff21e43b6c025520ca1167993a5e"
1401
+ "size": 2341,
1402
+ "sha256": "6d85cd675a5e6f395f74865256b7fe937749a4e31cb4c6f8d43d4059cb33a717"
1353
1403
  },
1354
1404
  {
1355
1405
  "path": "skills/find-journal/references/journal_profiles/Radiology.md",
@@ -1396,10 +1446,45 @@
1396
1446
  "size": 1511,
1397
1447
  "sha256": "e2811a46b89f39a7395d98460347ce274ff58ce50138364e8cf96050a05aad91"
1398
1448
  },
1449
+ {
1450
+ "path": "skills/find-journal/scripts/acceptance_readiness_challenge/expected/report_ceiling.txt",
1451
+ "size": 1570,
1452
+ "sha256": "1e84f888350249a3b187d38731a371487232851c6521689e319ef59408ed9448"
1453
+ },
1454
+ {
1455
+ "path": "skills/find-journal/scripts/acceptance_readiness_challenge/expected/report_clean.txt",
1456
+ "size": 350,
1457
+ "sha256": "40b1a3b94cf15d504fc2c04e25f5aa737410a8b2480118dcd3c9cd1927ee825c"
1458
+ },
1459
+ {
1460
+ "path": "skills/find-journal/scripts/acceptance_readiness_challenge/fixture_ceiling/manuscript.md",
1461
+ "size": 717,
1462
+ "sha256": "557ce5c0607024aebae3375e117b1052acace3d1931a3dc8d015a6b9c6043843"
1463
+ },
1464
+ {
1465
+ "path": "skills/find-journal/scripts/acceptance_readiness_challenge/fixture_clean/manuscript.md",
1466
+ "size": 646,
1467
+ "sha256": "77a215d5c5fe8d09035308f04cdf26ab7c2736c53563b71930a2be1941b7061b"
1468
+ },
1469
+ {
1470
+ "path": "skills/find-journal/scripts/acceptance_readiness_challenge/problem.md",
1471
+ "size": 1981,
1472
+ "sha256": "469b518a373f5bef95016dc866f82b0d05395eb26ae162656abf1303495ed71c"
1473
+ },
1474
+ {
1475
+ "path": "skills/find-journal/scripts/acceptance_readiness_challenge/verify.sh",
1476
+ "size": 1232,
1477
+ "sha256": "0c525f322306fd5229269f155179924d80a419301988fff0171115c3b323d795"
1478
+ },
1479
+ {
1480
+ "path": "skills/find-journal/scripts/assess_acceptance_readiness.py",
1481
+ "size": 10959,
1482
+ "sha256": "32930f970f308d95aaf82c61d809a307685668165df4fe2bf7c2b4f5052b3e87"
1483
+ },
1399
1484
  {
1400
1485
  "path": "skills/find-journal/skill.yml",
1401
- "size": 1428,
1402
- "sha256": "0fdf9fdce505cc1d264bdb9c69a4ad6107ea6d510d186385f854636b9f10e609"
1486
+ "size": 1971,
1487
+ "sha256": "8a4ce35c9fccb8a43de5d06bee09b27fc70d2c735d8fa9fce353ec9467fa9936"
1403
1488
  },
1404
1489
  {
1405
1490
  "path": "skills/fulltext-retrieval/SKILL.md",
@@ -2411,6 +2496,241 @@
2411
2496
  "size": 3891,
2412
2497
  "sha256": "d056566bb052bd917b4705fcd4912ef2173d5bd61b83bff4885b847bb824aa83"
2413
2498
  },
2499
+ {
2500
+ "path": "skills/mllm-eval/SKILL.md",
2501
+ "size": 6288,
2502
+ "sha256": "ccf3da2f70b356d432b3d33500f667f9d7858500a9ff325631a9a16f5f300a8b"
2503
+ },
2504
+ {
2505
+ "path": "skills/mllm-eval/scripts/check_mllm_eval_completeness.py",
2506
+ "size": 9380,
2507
+ "sha256": "fe24a9b0dfcce7d826c29be59f2534c768daf73e1e98f545e8a7791bc0709079"
2508
+ },
2509
+ {
2510
+ "path": "skills/mllm-eval/scripts/mllm_eval_completeness_challenge/fixture/plan_bad.md",
2511
+ "size": 202,
2512
+ "sha256": "41cd455b9a747f92506091f0a8fa607e069042c4add683d12b274e6081538ea1"
2513
+ },
2514
+ {
2515
+ "path": "skills/mllm-eval/scripts/mllm_eval_completeness_challenge/fixture/plan_good.md",
2516
+ "size": 795,
2517
+ "sha256": "93b703c163348e766dfbd2d01b2fc7267b57a082652d8bdd839b23646caa99a6"
2518
+ },
2519
+ {
2520
+ "path": "skills/mllm-eval/scripts/mllm_eval_completeness_challenge/problem.md",
2521
+ "size": 1681,
2522
+ "sha256": "dc9ce54a7bd47ff5d3383c76e681760c0891dc503933863948df1cd999a11a0e"
2523
+ },
2524
+ {
2525
+ "path": "skills/mllm-eval/scripts/mllm_eval_completeness_challenge/verify.sh",
2526
+ "size": 1335,
2527
+ "sha256": "7c3afbcd5adecdcdc8a2c9d14251521e2bfa39cbd3f650e77c92f37aabe49c9c"
2528
+ },
2529
+ {
2530
+ "path": "skills/mllm-eval/skill.yml",
2531
+ "size": 3373,
2532
+ "sha256": "72fcc60d62edc95808df7cc0ff283822069caaa61e9163fc8d3f298a3afa3801"
2533
+ },
2534
+ {
2535
+ "path": "skills/model-card/SKILL.md",
2536
+ "size": 5807,
2537
+ "sha256": "070b1ab8391a37bc4ffebadb918b71e83251da2293d119f5b0cfbf28bea0d4c2"
2538
+ },
2539
+ {
2540
+ "path": "skills/model-card/references/datasheet_template.md",
2541
+ "size": 2280,
2542
+ "sha256": "11998d71a43fcdf75d7f3b72cd46de7f9e4d999ac6b0b6febd5a3dee92a7a517"
2543
+ },
2544
+ {
2545
+ "path": "skills/model-card/references/metric_dimensions.md",
2546
+ "size": 3066,
2547
+ "sha256": "70aeb1af8ed7510aff0562c8ac99852a0b1b49de5eb3ef923a1bbeb4f4c051eb"
2548
+ },
2549
+ {
2550
+ "path": "skills/model-card/references/model_card_template.md",
2551
+ "size": 3239,
2552
+ "sha256": "e40ed0b7fd1a7370d22bb74a596048d1e09b75c14f1b2064ba89d06c886cefbd"
2553
+ },
2554
+ {
2555
+ "path": "skills/model-card/scripts/check_model_card_complete.py",
2556
+ "size": 8856,
2557
+ "sha256": "aa1fdc6a88e18696d0dfc23397a8a9141c1219583081deb5e27b822f152d4005"
2558
+ },
2559
+ {
2560
+ "path": "skills/model-card/scripts/check_model_card_complete_challenge/fixture/complete/DATASHEET.md",
2561
+ "size": 2179,
2562
+ "sha256": "1b53763c3017c88de0ddc583fc6a1975400d69d1929852580fd96c7fe08ccc3e"
2563
+ },
2564
+ {
2565
+ "path": "skills/model-card/scripts/check_model_card_complete_challenge/fixture/complete/MODEL_CARD.md",
2566
+ "size": 2785,
2567
+ "sha256": "fbb5ce99d2d144ecb53d1581826758d4aece996351089e7592999873760dcfaf"
2568
+ },
2569
+ {
2570
+ "path": "skills/model-card/scripts/check_model_card_complete_challenge/fixture/incomplete/MODEL_CARD.md",
2571
+ "size": 880,
2572
+ "sha256": "9b017400531316d787b71aaa7bc4a1fc82aa7f782e54df1eda1c34cde8980db4"
2573
+ },
2574
+ {
2575
+ "path": "skills/model-card/scripts/check_model_card_complete_challenge/problem.md",
2576
+ "size": 1853,
2577
+ "sha256": "dc85f56704dfd049cd9807d0ffd77bc1264de69c2b20ca3e691f6eedc6843deb"
2578
+ },
2579
+ {
2580
+ "path": "skills/model-card/scripts/check_model_card_complete_challenge/verify.sh",
2581
+ "size": 1857,
2582
+ "sha256": "8a8ee577857f4333b38313d6a322f02a54d8011698251bbec4e1a7d6bd758b21"
2583
+ },
2584
+ {
2585
+ "path": "skills/model-card/skill.yml",
2586
+ "size": 2877,
2587
+ "sha256": "0d71da374191ca35545b90130d7d30d4693e4bd469014a3b0993063bdfd4b958"
2588
+ },
2589
+ {
2590
+ "path": "skills/model-evaluation/SKILL.md",
2591
+ "size": 5031,
2592
+ "sha256": "17ffde905359e4cffdf747422b7d41c214d2abfcc71e50e1b1e4a689d87fa695"
2593
+ },
2594
+ {
2595
+ "path": "skills/model-evaluation/references/metric_guide.md",
2596
+ "size": 2454,
2597
+ "sha256": "8d09ca7ce9fb9f66ee4942689294d9b12ae1d892ac67769cd68fdc38a4e220ee"
2598
+ },
2599
+ {
2600
+ "path": "skills/model-evaluation/scripts/check_metric_reporting.py",
2601
+ "size": 9564,
2602
+ "sha256": "c33f52ee62ae93417027d0bb0b6cf2a95f5747d52403ab99c075bc64a5e2c593"
2603
+ },
2604
+ {
2605
+ "path": "skills/model-evaluation/scripts/metric_reporting_challenge/fixture/clf_bad.md",
2606
+ "size": 84,
2607
+ "sha256": "571aceb9567454e8bbe12e0967bc4cde4b142da99f6056f7530f3b8723ddf77c"
2608
+ },
2609
+ {
2610
+ "path": "skills/model-evaluation/scripts/metric_reporting_challenge/fixture/clf_good.md",
2611
+ "size": 186,
2612
+ "sha256": "ba44a3b38b4128fa713555c8b332f211e9087e6bc016d80af4c3074c3ca6ef8e"
2613
+ },
2614
+ {
2615
+ "path": "skills/model-evaluation/scripts/metric_reporting_challenge/fixture/seg_bad.md",
2616
+ "size": 119,
2617
+ "sha256": "50c138840976b8fa010cb0ca9fd24fffc7181e275eb6c71e76500da7d2a0420d"
2618
+ },
2619
+ {
2620
+ "path": "skills/model-evaluation/scripts/metric_reporting_challenge/fixture/seg_good.md",
2621
+ "size": 207,
2622
+ "sha256": "903a2dbd61cf56ce8e3d808f867ebd47ba4d6f2bd1542d7482b85477a6876eb0"
2623
+ },
2624
+ {
2625
+ "path": "skills/model-evaluation/scripts/metric_reporting_challenge/problem.md",
2626
+ "size": 1599,
2627
+ "sha256": "1f842374e3569d5fc27d7c26aa7f6bc6be43f7f38d2d9f3e2f9ab62fb29ddd65"
2628
+ },
2629
+ {
2630
+ "path": "skills/model-evaluation/scripts/metric_reporting_challenge/verify.sh",
2631
+ "size": 1235,
2632
+ "sha256": "f819d1333a7206db6383ccbd41c6eadae015004e61ae335e67a3334936c58cc8"
2633
+ },
2634
+ {
2635
+ "path": "skills/model-evaluation/skill.yml",
2636
+ "size": 2921,
2637
+ "sha256": "9713dbab40c54ca88324e7dcd74d3142890f9625ad68d708ba40b0cf57a7b9ee"
2638
+ },
2639
+ {
2640
+ "path": "skills/model-scaffold/SKILL.md",
2641
+ "size": 7686,
2642
+ "sha256": "cede2020d3ceee0e1599cbcfb412230ab9c04b08032c8bbaff620e4129ec6785"
2643
+ },
2644
+ {
2645
+ "path": "skills/model-scaffold/references/training_guide.md",
2646
+ "size": 2661,
2647
+ "sha256": "4a3197a89b8d3473071051f67a7bcf40f71ecf007e942f81e9c40dc48fce1a9c"
2648
+ },
2649
+ {
2650
+ "path": "skills/model-scaffold/scripts/check_training_hygiene.py",
2651
+ "size": 11752,
2652
+ "sha256": "66970049c85e46a0080b5f19eb3b5ac9dfd656a674b6f1698825e968eedd4814"
2653
+ },
2654
+ {
2655
+ "path": "skills/model-scaffold/scripts/scaffold.py",
2656
+ "size": 40470,
2657
+ "sha256": "33569806ecd230aebb9d35c77a27b8480d23329b00f633d7fee9531a7bcec974"
2658
+ },
2659
+ {
2660
+ "path": "skills/model-scaffold/scripts/scaffold_challenge/expected/split_assignment.csv",
2661
+ "size": 144,
2662
+ "sha256": "23949c5c9d179ef152127e0e6b865138169184f95c4e2d5234a65bab3762bd71"
2663
+ },
2664
+ {
2665
+ "path": "skills/model-scaffold/scripts/scaffold_challenge/fixture/manifest.csv",
2666
+ "size": 582,
2667
+ "sha256": "defce0cdce35211f038b139a9ab4214c63b22f3e60ba7ee74fa6bea8fe33aa7f"
2668
+ },
2669
+ {
2670
+ "path": "skills/model-scaffold/scripts/scaffold_challenge/problem.md",
2671
+ "size": 2678,
2672
+ "sha256": "369e98da65cbd16c67f5ff3f17d99b707d713bbf3239409f9921190c85f8f08a"
2673
+ },
2674
+ {
2675
+ "path": "skills/model-scaffold/scripts/scaffold_challenge/verify.sh",
2676
+ "size": 5136,
2677
+ "sha256": "040acee712943e8392b70b40b790438bec056a3a4e7a282f76455d2a2b791447"
2678
+ },
2679
+ {
2680
+ "path": "skills/model-scaffold/skill.yml",
2681
+ "size": 3195,
2682
+ "sha256": "06c4ed02872bfc38abd1c753c02a640a2bfaa1141fbfdd9f8b9ccbe18a148d82"
2683
+ },
2684
+ {
2685
+ "path": "skills/model-validation/SKILL.md",
2686
+ "size": 9347,
2687
+ "sha256": "ecd48672a03923bf1ace63528fd2dbcf138cd880103cc8c40345b3857d66ad1c"
2688
+ },
2689
+ {
2690
+ "path": "skills/model-validation/scripts/check_split_leakage.py",
2691
+ "size": 11616,
2692
+ "sha256": "a207b82abbb5914927e0de25663820c250207b0b1689f8ed17bfe6bda9eed6e2"
2693
+ },
2694
+ {
2695
+ "path": "skills/model-validation/scripts/check_split_leakage_challenge/expected/clean.txt",
2696
+ "size": 358,
2697
+ "sha256": "5d1e203ebc6656c172f60f4cd4eb3954fdbcd77579a6768c6bbd56952a966e6c"
2698
+ },
2699
+ {
2700
+ "path": "skills/model-validation/scripts/check_split_leakage_challenge/expected/leak.txt",
2701
+ "size": 470,
2702
+ "sha256": "34be75bbbabf10073a1fd11587e019491b7319e2030b166a1ab3e82e4899f3c2"
2703
+ },
2704
+ {
2705
+ "path": "skills/model-validation/scripts/check_split_leakage_challenge/fixture/split_seed.txt",
2706
+ "size": 3,
2707
+ "sha256": "084c799cd551dd1d8d5c5f9a5d593b2e931f5e36122ee5c793c1d08a19839cc0"
2708
+ },
2709
+ {
2710
+ "path": "skills/model-validation/scripts/check_split_leakage_challenge/fixture/splits_clean.csv",
2711
+ "size": 150,
2712
+ "sha256": "a4a15320685b58c4868737e40b4df0a07a942b39b5d94611e87d63d22e88aee0"
2713
+ },
2714
+ {
2715
+ "path": "skills/model-validation/scripts/check_split_leakage_challenge/fixture/splits_leak.csv",
2716
+ "size": 145,
2717
+ "sha256": "1bc2cc7b11a7a4a9ddc0168a83eab33ea1b03e3ca98bda5301679a18e19faf53"
2718
+ },
2719
+ {
2720
+ "path": "skills/model-validation/scripts/check_split_leakage_challenge/problem.md",
2721
+ "size": 2347,
2722
+ "sha256": "f140095ec5d190120bf73dc62710b2ccac31c7f7d54307a0854c8438df61940e"
2723
+ },
2724
+ {
2725
+ "path": "skills/model-validation/scripts/check_split_leakage_challenge/verify.sh",
2726
+ "size": 1925,
2727
+ "sha256": "9ae88c109caa1408a3a3b08ea0583fc97ce98b93c909f75d043f08a231e91e61"
2728
+ },
2729
+ {
2730
+ "path": "skills/model-validation/skill.yml",
2731
+ "size": 3079,
2732
+ "sha256": "4891c0698445f98552ab2a2315bc8288a6cc4744f8711e20f939c8af8739e434"
2733
+ },
2414
2734
  {
2415
2735
  "path": "skills/orchestrate/SKILL.md",
2416
2736
  "size": 35203,
@@ -2438,8 +2758,8 @@
2438
2758
  },
2439
2759
  {
2440
2760
  "path": "skills/peer-review/SKILL.md",
2441
- "size": 55415,
2442
- "sha256": "4b75d67b35444eada1a08700b9a0d27e6b8453fbca197893799db77811904b52"
2761
+ "size": 58493,
2762
+ "sha256": "057c39cd131c49eeb1949560a0d510f176a012431a0c8d36dd803061f98e0629"
2443
2763
  },
2444
2764
  {
2445
2765
  "path": "skills/peer-review/references/aczel_2021_reviewer2_patterns.md",
@@ -2481,6 +2801,16 @@
2481
2801
  "size": 11244,
2482
2802
  "sha256": "197cfaa4bdcfe223a0ebfb69c229ccb3852160ab76870ade914eb8997ab684c5"
2483
2803
  },
2804
+ {
2805
+ "path": "skills/peer-review/references/domain-probes/mllm_evaluation.md",
2806
+ "size": 7785,
2807
+ "sha256": "1b63f7d987bc2ba8b9e67008b1713d4e874437f22c46002a12dcda1da0b73d2a"
2808
+ },
2809
+ {
2810
+ "path": "skills/peer-review/references/domain-probes/model_development.md",
2811
+ "size": 10438,
2812
+ "sha256": "263db14ecedfc51caffb8b4966bade4566706b3ae4ce67d0b15840bdbbcdba07"
2813
+ },
2484
2814
  {
2485
2815
  "path": "skills/peer-review/references/domain-probes/narrative_review.md",
2486
2816
  "size": 12598,
@@ -2643,8 +2973,8 @@
2643
2973
  },
2644
2974
  {
2645
2975
  "path": "skills/present-paper/SKILL.md",
2646
- "size": 29247,
2647
- "sha256": "aa8455317bd4996d5b1e0cc9d27c8be33b8112b7826749d87376c161d6cf87d5"
2976
+ "size": 33518,
2977
+ "sha256": "777197edf83a4d242508b366abe24681198467a95950b0acc385ac2714f33cb4"
2648
2978
  },
2649
2979
  {
2650
2980
  "path": "skills/present-paper/references/critic_rubrics/slide.md",
@@ -2661,11 +2991,41 @@
2661
2991
  "size": 15007,
2662
2992
  "sha256": "d0f964af7523ec8bfef50ca627878f8c2cfe58159c2a827c5f7dfd43585cf9ee"
2663
2993
  },
2994
+ {
2995
+ "path": "skills/present-paper/references/presentation_design_guidelines.md",
2996
+ "size": 7460,
2997
+ "sha256": "689d021ff7fc5e04abf93f3d6e1b0646bb5aa86430239b76b51d2224b3b92f0c"
2998
+ },
2664
2999
  {
2665
3000
  "path": "skills/present-paper/references/slide_design_principles.md",
2666
3001
  "size": 10436,
2667
3002
  "sha256": "7f2a5e03c8f2ddbb2d84a163506c5f3a2d1cca1353a694abd7bfb14225324826"
2668
3003
  },
3004
+ {
3005
+ "path": "skills/present-paper/references/slide_visual_styles/CATALOG.md",
3006
+ "size": 3177,
3007
+ "sha256": "78782ce6916212bcae9e1d8513197721a8ac72ed1faa33ce335b36d0c88a828f"
3008
+ },
3009
+ {
3010
+ "path": "skills/present-paper/references/slide_visual_styles/clinical_blue.md",
3011
+ "size": 3249,
3012
+ "sha256": "334ee770935b93a1ddf86c426a8f3da377d2618c0f6553308ccc38e871f26160"
3013
+ },
3014
+ {
3015
+ "path": "skills/present-paper/references/slide_visual_styles/dark_modern.md",
3016
+ "size": 3197,
3017
+ "sha256": "b5adf2331318a1276fa5eedf173a36c056d220fbfa04819a5c4d4d68b1109f68"
3018
+ },
3019
+ {
3020
+ "path": "skills/present-paper/references/slide_visual_styles/editorial_mono.md",
3021
+ "size": 3068,
3022
+ "sha256": "db07e84bbf4d248f0a4837fe22ed61c82e176fe94055b590131e24d25c59f20b"
3023
+ },
3024
+ {
3025
+ "path": "skills/present-paper/references/slide_visual_styles/institutional_brand.md",
3026
+ "size": 4431,
3027
+ "sha256": "c8b04c93bf61072fc6c4ee7d402e107d7375e933d60085bf325d74830896684a"
3028
+ },
2669
3029
  {
2670
3030
  "path": "skills/present-paper/references/slide_visual_styles/nature_lancet.md",
2671
3031
  "size": 7989,
@@ -2691,6 +3051,11 @@
2691
3051
  "size": 6758,
2692
3052
  "sha256": "6eeaf94c396d0f4ff365eaea0408f2fc00f8e2dc75b53a9514214194cb9329f9"
2693
3053
  },
3054
+ {
3055
+ "path": "skills/present-paper/scripts/inspect_pptx_template.py",
3056
+ "size": 5073,
3057
+ "sha256": "648fe3d2904a5ffffb41eb064d1780f605a672dc44618a74b5e3e59c023cb63d"
3058
+ },
2694
3059
  {
2695
3060
  "path": "skills/present-paper/scripts/strip_notes_for_sharing.py",
2696
3061
  "size": 5508,
@@ -2933,8 +3298,8 @@
2933
3298
  },
2934
3299
  {
2935
3300
  "path": "skills/self-review/SKILL.md",
2936
- "size": 94121,
2937
- "sha256": "7222f5bc17832d84a23f1ea63fb090eb9a114c70bec3cf16ff2c7a16b24d0f40"
3301
+ "size": 94657,
3302
+ "sha256": "14c982c492d6305c238737366f0996415133fe02ff9aaad7e2c2207d78d260a2"
2938
3303
  },
2939
3304
  {
2940
3305
  "path": "skills/self-review/references/domain-probes/ai_overclaiming.md",
@@ -2971,6 +3336,16 @@
2971
3336
  "size": 11244,
2972
3337
  "sha256": "197cfaa4bdcfe223a0ebfb69c229ccb3852160ab76870ade914eb8997ab684c5"
2973
3338
  },
3339
+ {
3340
+ "path": "skills/self-review/references/domain-probes/mllm_evaluation.md",
3341
+ "size": 7785,
3342
+ "sha256": "1b63f7d987bc2ba8b9e67008b1713d4e874437f22c46002a12dcda1da0b73d2a"
3343
+ },
3344
+ {
3345
+ "path": "skills/self-review/references/domain-probes/model_development.md",
3346
+ "size": 10438,
3347
+ "sha256": "263db14ecedfc51caffb8b4966bade4566706b3ae4ce67d0b15840bdbbcdba07"
3348
+ },
2974
3349
  {
2975
3350
  "path": "skills/self-review/references/domain-probes/narrative_review.md",
2976
3351
  "size": 12598,
@@ -3418,8 +3793,8 @@
3418
3793
  },
3419
3794
  {
3420
3795
  "path": "skills/write-paper/references/journal_profiles/Clinical_and_Molecular_Hepatology.md",
3421
- "size": 7981,
3422
- "sha256": "666c53f8c68b3a3436beafdb76a3671825802c5d6fe0a92c052db9075848c7da"
3796
+ "size": 8585,
3797
+ "sha256": "b268d9cf8caa255e72ab4cbc7960473de7666e8c65e86cb3d2e41ea6791a0642"
3423
3798
  },
3424
3799
  {
3425
3800
  "path": "skills/write-paper/references/journal_profiles/Diabetes_Metabolism_Journal.md",