medsci-skills 4.10.0 → 4.11.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +8 -2
- package/metadata/distribution_files.json +354 -24
- package/metadata/distribution_manifest.json +7 -1
- package/metadata/skills_catalog.json +61 -1
- package/package.json +1 -1
- package/skills/architecture-zoo/SKILL.md +96 -0
- package/skills/architecture-zoo/references/classification.md +102 -0
- package/skills/architecture-zoo/references/foundation_models.md +87 -0
- package/skills/architecture-zoo/references/index.md +55 -0
- package/skills/architecture-zoo/references/segmentation.md +110 -0
- package/skills/architecture-zoo/skill.yml +36 -0
- package/skills/check-reporting/references/appraisal_tools/METRICS_RELOADED.md +36 -0
- package/skills/find-journal/POLICY.md +9 -0
- package/skills/find-journal/SKILL.md +147 -13
- package/skills/find-journal/references/acceptance_signals_schema.md +126 -0
- package/skills/find-journal/references/journal_profiles/AJR.md +8 -0
- package/skills/find-journal/references/journal_profiles/Clinical_and_Molecular_Hepatology.md +2 -2
- package/skills/find-journal/references/journal_profiles/European_Radiology.md +8 -0
- package/skills/find-journal/references/journal_profiles/Investigative_Radiology.md +8 -0
- package/skills/find-journal/references/journal_profiles/KJR.md +8 -0
- package/skills/find-journal/references/journal_profiles/RYAI.md +8 -0
- package/skills/find-journal/scripts/acceptance_readiness_challenge/expected/report_ceiling.txt +18 -0
- package/skills/find-journal/scripts/acceptance_readiness_challenge/expected/report_clean.txt +10 -0
- package/skills/find-journal/scripts/acceptance_readiness_challenge/fixture_ceiling/manuscript.md +16 -0
- package/skills/find-journal/scripts/acceptance_readiness_challenge/fixture_clean/manuscript.md +15 -0
- package/skills/find-journal/scripts/acceptance_readiness_challenge/problem.md +38 -0
- package/skills/find-journal/scripts/acceptance_readiness_challenge/verify.sh +28 -0
- package/skills/find-journal/scripts/assess_acceptance_readiness.py +235 -0
- package/skills/find-journal/skill.yml +5 -1
- package/skills/mllm-eval/SKILL.md +108 -0
- package/skills/mllm-eval/scripts/check_mllm_eval_completeness.py +184 -0
- package/skills/mllm-eval/scripts/mllm_eval_completeness_challenge/fixture/plan_bad.md +3 -0
- package/skills/mllm-eval/scripts/mllm_eval_completeness_challenge/fixture/plan_good.md +9 -0
- package/skills/mllm-eval/scripts/mllm_eval_completeness_challenge/problem.md +29 -0
- package/skills/mllm-eval/scripts/mllm_eval_completeness_challenge/verify.sh +25 -0
- package/skills/mllm-eval/skill.yml +44 -0
- package/skills/mllm-eval/tests/test_mllm_eval_completeness.sh +49 -0
- package/skills/model-card/SKILL.md +103 -0
- package/skills/model-card/references/datasheet_template.md +38 -0
- package/skills/model-card/references/metric_dimensions.md +32 -0
- package/skills/model-card/references/model_card_template.md +62 -0
- package/skills/model-card/scripts/check_model_card_complete.py +202 -0
- package/skills/model-card/scripts/check_model_card_complete_challenge/fixture/complete/DATASHEET.md +31 -0
- package/skills/model-card/scripts/check_model_card_complete_challenge/fixture/complete/MODEL_CARD.md +48 -0
- package/skills/model-card/scripts/check_model_card_complete_challenge/fixture/incomplete/MODEL_CARD.md +28 -0
- package/skills/model-card/scripts/check_model_card_complete_challenge/problem.md +31 -0
- package/skills/model-card/scripts/check_model_card_complete_challenge/verify.sh +34 -0
- package/skills/model-card/skill.yml +41 -0
- package/skills/model-card/tests/test_model_card_complete.sh +75 -0
- package/skills/model-evaluation/SKILL.md +88 -0
- package/skills/model-evaluation/references/metric_guide.md +44 -0
- package/skills/model-evaluation/scripts/check_metric_reporting.py +196 -0
- package/skills/model-evaluation/scripts/metric_reporting_challenge/fixture/clf_bad.md +2 -0
- package/skills/model-evaluation/scripts/metric_reporting_challenge/fixture/clf_good.md +3 -0
- package/skills/model-evaluation/scripts/metric_reporting_challenge/fixture/seg_bad.md +2 -0
- package/skills/model-evaluation/scripts/metric_reporting_challenge/fixture/seg_good.md +3 -0
- package/skills/model-evaluation/scripts/metric_reporting_challenge/problem.md +27 -0
- package/skills/model-evaluation/scripts/metric_reporting_challenge/verify.sh +29 -0
- package/skills/model-evaluation/skill.yml +43 -0
- package/skills/model-evaluation/tests/test_metric_reporting.sh +47 -0
- package/skills/model-scaffold/SKILL.md +120 -0
- package/skills/model-scaffold/references/training_guide.md +46 -0
- package/skills/model-scaffold/scripts/check_training_hygiene.py +254 -0
- package/skills/model-scaffold/scripts/scaffold.py +495 -0
- package/skills/model-scaffold/scripts/scaffold_challenge/expected/split_assignment.csv +13 -0
- package/skills/model-scaffold/scripts/scaffold_challenge/fixture/manifest.csv +19 -0
- package/skills/model-scaffold/scripts/scaffold_challenge/problem.md +44 -0
- package/skills/model-scaffold/scripts/scaffold_challenge/verify.sh +89 -0
- package/skills/model-scaffold/skill.yml +46 -0
- package/skills/model-scaffold/tests/fixtures/bad_evaluate.py +10 -0
- package/skills/model-scaffold/tests/fixtures/bad_train.py +9 -0
- package/skills/model-scaffold/tests/test_training_hygiene.sh +70 -0
- package/skills/model-validation/SKILL.md +146 -0
- package/skills/model-validation/scripts/check_split_leakage.py +269 -0
- package/skills/model-validation/scripts/check_split_leakage_challenge/expected/clean.txt +9 -0
- package/skills/model-validation/scripts/check_split_leakage_challenge/expected/leak.txt +9 -0
- package/skills/model-validation/scripts/check_split_leakage_challenge/fixture/split_seed.txt +1 -0
- package/skills/model-validation/scripts/check_split_leakage_challenge/fixture/splits_clean.csv +14 -0
- package/skills/model-validation/scripts/check_split_leakage_challenge/fixture/splits_leak.csv +15 -0
- package/skills/model-validation/scripts/check_split_leakage_challenge/problem.md +39 -0
- package/skills/model-validation/scripts/check_split_leakage_challenge/verify.sh +37 -0
- package/skills/model-validation/skill.yml +43 -0
- package/skills/model-validation/tests/fixtures/leak_subject.csv +6 -0
- package/skills/model-validation/tests/fixtures/noseed_clean.csv +5 -0
- package/skills/model-validation/tests/fixtures/single_partition.csv +4 -0
- package/skills/model-validation/tests/test_split_leakage.sh +78 -0
- package/skills/peer-review/SKILL.md +12 -0
- package/skills/peer-review/references/domain-probes/mllm_evaluation.md +102 -0
- package/skills/peer-review/references/domain-probes/model_development.md +52 -0
- package/skills/self-review/SKILL.md +2 -0
- package/skills/self-review/references/domain-probes/mllm_evaluation.md +102 -0
- package/skills/self-review/references/domain-probes/model_development.md +52 -0
- package/skills/write-paper/references/journal_profiles/Clinical_and_Molecular_Hepatology.md +2 -1
package/README.md
CHANGED
|
@@ -2,14 +2,14 @@
|
|
|
2
2
|
|
|
3
3
|
# MedSci Skills
|
|
4
4
|
|
|
5
|
-
**
|
|
5
|
+
**51 skills that actually work.** Built by a physician-researcher, tested on real publications.
|
|
6
6
|
|
|
7
7
|
*MedSci Skills is a submission-grade clinical manuscript workflow, not a generic biomedical skill catalog. Its moat is the compliance layer — 38 reporting guidelines and risk-of-bias tools, reference/citation verification, and deterministic integrity gates, before peer review sees the manuscript. It competes on clinical submission reliability, not skill count.*
|
|
8
8
|
|
|
9
9
|
[](LICENSE)
|
|
10
10
|
[](https://github.com/Aperivue/medsci-skills/releases/latest)
|
|
11
11
|
[](https://github.com/Aperivue/medsci-skills/actions/workflows/validate.yml)
|
|
12
|
-

|
|
13
13
|
[](https://www.npmjs.com/package/medsci-skills)
|
|
14
14
|
[](https://youtu.be/MclQ_RIofpE)
|
|
15
15
|
[](https://github.com/Aperivue/medsci-skills/contribute)
|
|
@@ -451,6 +451,12 @@ ma-scout -> search-lit -> fulltext-retrieval -> design-study ──> write-proto
|
|
|
451
451
|
| **make-figures** | Publication-ready figures and visual abstracts: ROC curves, forest plots, PRISMA/CONSORT/STARD flow diagrams, Kaplan-Meier curves, Bland-Altman plots, confusion matrices, and journal-specific visual/graphical abstracts (python-pptx template-based). Communication-first design principles (Nat Hum Behav 2026 — key message, audience, cognitive load, figure-vs-table decision) and five flow-diagram production lessons (official-template fidelity, VML fallback PDF export, docx XML escape, sequential placeholder mapping, version freeze); critic rubric Section G adds 5 communication-first checks. `--study-type` auto-generates the full required figure set; structured `_figure_manifest.md` output for downstream pipeline consumption; D2 enforced as default for flow diagrams. |
|
|
452
452
|
| **design-study** | Study design review: identifies analysis unit, cohort logic, data leakage risks, comparator design, validation strategy, and reporting guideline fit. |
|
|
453
453
|
| **design-ai-benchmarking** | Design and validity review for benchmarking AI system(s) against a human-expert panel: evaluation-question and arm definition, decoupled multi-dimensional rubrics with anchors, planted calibration probes (positive-control / known-bad / instability / mechanism-contradiction), reviewer-panel construction with per-reviewer randomization, inter-rater reliability targets with separate control-item reliability, LLM-as-judge vs human-as-judge adjudication, construct-independence guards, and a structured JSON rating-export schema. Locks the rubric before data collection. |
|
|
454
|
+
| **model-validation** | Design or audit the clinical-validation study for an engineer-built medical-imaging model (segmentation / classification / detection): patient-level split disjointness and the data-leakage taxonomy, tuning-on-test, internal vs genuine external validation, comparator design, single-run vs multi-seed variance, task-correct metric selection (Metrics Reloaded), test-set sizing, and CLAIM 2024 / TRIPOD+AI / STARD-AI reporting fit. Ships a deterministic split-leakage gate that proves patient disjointness by set arithmetic on the emitted split table. Integrates with MONAI / nnU-Net — does not replace them. |
|
|
455
|
+
| **model-scaffold** | Generate a reproducible, runnable PyTorch training repo for a medical-imaging segmentation task — the missing middle link between choosing an architecture and validating a trained model. Emits a patient-level seed-locked split as an auditable artifact, a configurable U-Net, train/evaluate scripts that seed every RNG and infer under eval mode, a config, requirements, a reproducibility record, and a Methods stub with VERIFY placeholders (no fabricated numbers). Reproducibility holds by construction; ships a `check_training_hygiene` AST gate + a network-free build→validate challenge. Integrates with MONAI / nnU-Net / TorchIO — does not reimplement them. |
|
|
456
|
+
| **architecture-zoo** | "Which architecture for which research question" decision tool: maps task (classification / segmentation / detection / transfer), modality, data scale, and class imbalance to a paper-grounded architecture shortlist. Curates the foundational curriculum (ResNet / DenseNet / EfficientNet / ViT / Swin; U-Net / 3-D U-Net / Attention & Residual U-Net / nnU-Net / Mask R-CNN; SAM/MedSAM / TotalSegmentator / BiomedCLIP / DINO / MAE / SimCLR) — each with core idea, when-to-use, medical-imaging use, reference implementation, validation setup, and the matching model-scaffold template. Advisory; teaches archetypes, not a live SOTA leaderboard. |
|
|
457
|
+
| **model-card** | Generate the documentation an engineer-built medical-imaging model must carry — a Model Card (Mitchell et al. 2019), a Datasheet for its dataset (Gebru et al. 2021), and a METRIC-informed data-quality pass — filled from user-supplied facts (never fabricated), then verify every required section is present and non-empty with a deterministic completeness gate (`check_model_card_complete`). Model Card / Datasheet are documentation standards vendored as templates, not counted reporting checklists. |
|
|
458
|
+
| **model-evaluation** | Compute and report task-correct held-out metrics for a trained medical-imaging model — segmentation (Dice + a boundary metric HD95/NSD, per structure), classification (AUROC + AUPRC + sensitivity/specificity with bootstrap CIs at the deployment prevalence), or detection (FROC/mAP with a stated IoU criterion) — plus calibration and subgroup slices. Emits a per-case table for analyze-stats and gates the metric choice against Metrics Reloaded / CLAIM 2024 (`check_metric_reporting`). Numbers come only from executed code. |
|
|
459
|
+
| **mllm-eval** | Model-agnostic evaluation harness (closed API or open weights) for an LLM/MLLM on a clinical task — radiology report generation, VQA, clinical text extraction — covering the adjudicated reference standard, clinical-efficacy metrics (RadGraph-F1 / CheXbert-F1 beyond BLEU/ROUGE), faithfulness/hallucination, pretraining-contamination, prompt sensitivity, and a reader study; gates the plan with `check_mllm_eval_completeness` and routes the reviewer audit to the MLLM probe. |
|
|
454
460
|
| **intake-project** | Classifies new research projects, summarizes current state, identifies missing inputs, and recommends next steps. |
|
|
455
461
|
| **grant-builder** | Structures grant proposals: significance, innovation, approach, milestones, and consortium roles. |
|
|
456
462
|
| **present-paper** | Academic presentation preparation: paper analysis, supporting research, speaker scripts, slide note injection, and Q&A prep. |
|
|
@@ -396,6 +396,36 @@
|
|
|
396
396
|
"size": 1421,
|
|
397
397
|
"sha256": "912c52e9289a7ccb014aa8a18105b6dfe04c2cc040e970c73b4bbc6b2d8a8a39"
|
|
398
398
|
},
|
|
399
|
+
{
|
|
400
|
+
"path": "skills/architecture-zoo/SKILL.md",
|
|
401
|
+
"size": 5444,
|
|
402
|
+
"sha256": "6d8f81262a42ff24e36dca425511804b9f324d2c900f31f701c703e3d8326729"
|
|
403
|
+
},
|
|
404
|
+
{
|
|
405
|
+
"path": "skills/architecture-zoo/references/classification.md",
|
|
406
|
+
"size": 5986,
|
|
407
|
+
"sha256": "035e0fddaccb0e19e23ffd7756b075154f847ee20f9a512cd2a010c0db4210fa"
|
|
408
|
+
},
|
|
409
|
+
{
|
|
410
|
+
"path": "skills/architecture-zoo/references/foundation_models.md",
|
|
411
|
+
"size": 5267,
|
|
412
|
+
"sha256": "495453b025f1cb13d5ba0bac9be6d3b0d63dd958ea48d2b9e55bc222e9c26786"
|
|
413
|
+
},
|
|
414
|
+
{
|
|
415
|
+
"path": "skills/architecture-zoo/references/index.md",
|
|
416
|
+
"size": 4065,
|
|
417
|
+
"sha256": "a1ed80efcf9a56e0286972ae9b08bd38965bb20a569e3aac5314549dfa6ad5f4"
|
|
418
|
+
},
|
|
419
|
+
{
|
|
420
|
+
"path": "skills/architecture-zoo/references/segmentation.md",
|
|
421
|
+
"size": 6508,
|
|
422
|
+
"sha256": "17618fe3d6884cf89b034ededcd69e081a65d7bfd473495eb2ab1fb5d8b15d8b"
|
|
423
|
+
},
|
|
424
|
+
{
|
|
425
|
+
"path": "skills/architecture-zoo/skill.yml",
|
|
426
|
+
"size": 2889,
|
|
427
|
+
"sha256": "275cfb1d0779028d79d8596879c09b5b6c714859142cb72a12b7ec901acc69e1"
|
|
428
|
+
},
|
|
399
429
|
{
|
|
400
430
|
"path": "skills/author-strategy/SKILL.md",
|
|
401
431
|
"size": 9209,
|
|
@@ -506,6 +536,11 @@
|
|
|
506
536
|
"size": 4373,
|
|
507
537
|
"sha256": "ee59d959b91c831d34e04853a83a969bb6315e49f692baa904ab8805b8f17147"
|
|
508
538
|
},
|
|
539
|
+
{
|
|
540
|
+
"path": "skills/check-reporting/references/appraisal_tools/METRICS_RELOADED.md",
|
|
541
|
+
"size": 2384,
|
|
542
|
+
"sha256": "e06267be7ffa5b5e3f52de387b745bf2676f016c29b02a5872d38c68ddf762ec"
|
|
543
|
+
},
|
|
509
544
|
{
|
|
510
545
|
"path": "skills/check-reporting/references/checklists/AMSTAR2.md",
|
|
511
546
|
"size": 4566,
|
|
@@ -1023,13 +1058,18 @@
|
|
|
1023
1058
|
},
|
|
1024
1059
|
{
|
|
1025
1060
|
"path": "skills/find-journal/POLICY.md",
|
|
1026
|
-
"size":
|
|
1027
|
-
"sha256": "
|
|
1061
|
+
"size": 5255,
|
|
1062
|
+
"sha256": "c2b61b5830844fa3eebe333dc4864acb4d085097e81ba2dbc1ef72dd65bebee3"
|
|
1028
1063
|
},
|
|
1029
1064
|
{
|
|
1030
1065
|
"path": "skills/find-journal/SKILL.md",
|
|
1031
|
-
"size":
|
|
1032
|
-
"sha256": "
|
|
1066
|
+
"size": 22072,
|
|
1067
|
+
"sha256": "45074f6499896700bff0eb20bd91c4076b143bcd39521d56559239edaa8b24d8"
|
|
1068
|
+
},
|
|
1069
|
+
{
|
|
1070
|
+
"path": "skills/find-journal/references/acceptance_signals_schema.md",
|
|
1071
|
+
"size": 6869,
|
|
1072
|
+
"sha256": "620ba1c55272908a16125ba69074491df5246d6cf9afa14e6b08a08e8dc4e866"
|
|
1033
1073
|
},
|
|
1034
1074
|
{
|
|
1035
1075
|
"path": "skills/find-journal/references/journal_profiles/AJNR.md",
|
|
@@ -1038,8 +1078,8 @@
|
|
|
1038
1078
|
},
|
|
1039
1079
|
{
|
|
1040
1080
|
"path": "skills/find-journal/references/journal_profiles/AJR.md",
|
|
1041
|
-
"size":
|
|
1042
|
-
"sha256": "
|
|
1081
|
+
"size": 2075,
|
|
1082
|
+
"sha256": "9d9a5ee7b3b2287a6deae8fc06d54dd60b26afa843f5830f7bb5fb2e2ac633f7"
|
|
1043
1083
|
},
|
|
1044
1084
|
{
|
|
1045
1085
|
"path": "skills/find-journal/references/journal_profiles/Abdominal_Radiology.md",
|
|
@@ -1098,8 +1138,8 @@
|
|
|
1098
1138
|
},
|
|
1099
1139
|
{
|
|
1100
1140
|
"path": "skills/find-journal/references/journal_profiles/Clinical_and_Molecular_Hepatology.md",
|
|
1101
|
-
"size":
|
|
1102
|
-
"sha256": "
|
|
1141
|
+
"size": 2391,
|
|
1142
|
+
"sha256": "7d923a09bc543fe49db28b9b79714958522e2fe1781d60c6f22dc1efcd3ba650"
|
|
1103
1143
|
},
|
|
1104
1144
|
{
|
|
1105
1145
|
"path": "skills/find-journal/references/journal_profiles/Cureus.md",
|
|
@@ -1128,8 +1168,8 @@
|
|
|
1128
1168
|
},
|
|
1129
1169
|
{
|
|
1130
1170
|
"path": "skills/find-journal/references/journal_profiles/European_Radiology.md",
|
|
1131
|
-
"size":
|
|
1132
|
-
"sha256": "
|
|
1171
|
+
"size": 2350,
|
|
1172
|
+
"sha256": "fa50a9a9d6012b8c6b75d81a69b950dfbe7db29775c8112bf5fe68d6d5655dfa"
|
|
1133
1173
|
},
|
|
1134
1174
|
{
|
|
1135
1175
|
"path": "skills/find-journal/references/journal_profiles/Hepatology_Communications.md",
|
|
@@ -1158,8 +1198,8 @@
|
|
|
1158
1198
|
},
|
|
1159
1199
|
{
|
|
1160
1200
|
"path": "skills/find-journal/references/journal_profiles/Investigative_Radiology.md",
|
|
1161
|
-
"size":
|
|
1162
|
-
"sha256": "
|
|
1201
|
+
"size": 2118,
|
|
1202
|
+
"sha256": "c218b4e764a070a3297802076c1e6c68e514160cc1efa038552cc271b01af9ce"
|
|
1163
1203
|
},
|
|
1164
1204
|
{
|
|
1165
1205
|
"path": "skills/find-journal/references/journal_profiles/JACC_Advances.md",
|
|
@@ -1248,8 +1288,8 @@
|
|
|
1248
1288
|
},
|
|
1249
1289
|
{
|
|
1250
1290
|
"path": "skills/find-journal/references/journal_profiles/KJR.md",
|
|
1251
|
-
"size":
|
|
1252
|
-
"sha256": "
|
|
1291
|
+
"size": 4061,
|
|
1292
|
+
"sha256": "0849de001a47038b8bfc92b337285372c80ccf4861162cae876295d82ea4f1c8"
|
|
1253
1293
|
},
|
|
1254
1294
|
{
|
|
1255
1295
|
"path": "skills/find-journal/references/journal_profiles/Korean_Circulation_Journal.md",
|
|
@@ -1348,8 +1388,8 @@
|
|
|
1348
1388
|
},
|
|
1349
1389
|
{
|
|
1350
1390
|
"path": "skills/find-journal/references/journal_profiles/RYAI.md",
|
|
1351
|
-
"size":
|
|
1352
|
-
"sha256": "
|
|
1391
|
+
"size": 2341,
|
|
1392
|
+
"sha256": "6d85cd675a5e6f395f74865256b7fe937749a4e31cb4c6f8d43d4059cb33a717"
|
|
1353
1393
|
},
|
|
1354
1394
|
{
|
|
1355
1395
|
"path": "skills/find-journal/references/journal_profiles/Radiology.md",
|
|
@@ -1396,10 +1436,45 @@
|
|
|
1396
1436
|
"size": 1511,
|
|
1397
1437
|
"sha256": "e2811a46b89f39a7395d98460347ce274ff58ce50138364e8cf96050a05aad91"
|
|
1398
1438
|
},
|
|
1439
|
+
{
|
|
1440
|
+
"path": "skills/find-journal/scripts/acceptance_readiness_challenge/expected/report_ceiling.txt",
|
|
1441
|
+
"size": 1570,
|
|
1442
|
+
"sha256": "1e84f888350249a3b187d38731a371487232851c6521689e319ef59408ed9448"
|
|
1443
|
+
},
|
|
1444
|
+
{
|
|
1445
|
+
"path": "skills/find-journal/scripts/acceptance_readiness_challenge/expected/report_clean.txt",
|
|
1446
|
+
"size": 350,
|
|
1447
|
+
"sha256": "40b1a3b94cf15d504fc2c04e25f5aa737410a8b2480118dcd3c9cd1927ee825c"
|
|
1448
|
+
},
|
|
1449
|
+
{
|
|
1450
|
+
"path": "skills/find-journal/scripts/acceptance_readiness_challenge/fixture_ceiling/manuscript.md",
|
|
1451
|
+
"size": 717,
|
|
1452
|
+
"sha256": "557ce5c0607024aebae3375e117b1052acace3d1931a3dc8d015a6b9c6043843"
|
|
1453
|
+
},
|
|
1454
|
+
{
|
|
1455
|
+
"path": "skills/find-journal/scripts/acceptance_readiness_challenge/fixture_clean/manuscript.md",
|
|
1456
|
+
"size": 646,
|
|
1457
|
+
"sha256": "77a215d5c5fe8d09035308f04cdf26ab7c2736c53563b71930a2be1941b7061b"
|
|
1458
|
+
},
|
|
1459
|
+
{
|
|
1460
|
+
"path": "skills/find-journal/scripts/acceptance_readiness_challenge/problem.md",
|
|
1461
|
+
"size": 1981,
|
|
1462
|
+
"sha256": "469b518a373f5bef95016dc866f82b0d05395eb26ae162656abf1303495ed71c"
|
|
1463
|
+
},
|
|
1464
|
+
{
|
|
1465
|
+
"path": "skills/find-journal/scripts/acceptance_readiness_challenge/verify.sh",
|
|
1466
|
+
"size": 1232,
|
|
1467
|
+
"sha256": "0c525f322306fd5229269f155179924d80a419301988fff0171115c3b323d795"
|
|
1468
|
+
},
|
|
1469
|
+
{
|
|
1470
|
+
"path": "skills/find-journal/scripts/assess_acceptance_readiness.py",
|
|
1471
|
+
"size": 10959,
|
|
1472
|
+
"sha256": "32930f970f308d95aaf82c61d809a307685668165df4fe2bf7c2b4f5052b3e87"
|
|
1473
|
+
},
|
|
1399
1474
|
{
|
|
1400
1475
|
"path": "skills/find-journal/skill.yml",
|
|
1401
|
-
"size":
|
|
1402
|
-
"sha256": "
|
|
1476
|
+
"size": 1971,
|
|
1477
|
+
"sha256": "8a4ce35c9fccb8a43de5d06bee09b27fc70d2c735d8fa9fce353ec9467fa9936"
|
|
1403
1478
|
},
|
|
1404
1479
|
{
|
|
1405
1480
|
"path": "skills/fulltext-retrieval/SKILL.md",
|
|
@@ -2411,6 +2486,241 @@
|
|
|
2411
2486
|
"size": 3891,
|
|
2412
2487
|
"sha256": "d056566bb052bd917b4705fcd4912ef2173d5bd61b83bff4885b847bb824aa83"
|
|
2413
2488
|
},
|
|
2489
|
+
{
|
|
2490
|
+
"path": "skills/mllm-eval/SKILL.md",
|
|
2491
|
+
"size": 6288,
|
|
2492
|
+
"sha256": "ccf3da2f70b356d432b3d33500f667f9d7858500a9ff325631a9a16f5f300a8b"
|
|
2493
|
+
},
|
|
2494
|
+
{
|
|
2495
|
+
"path": "skills/mllm-eval/scripts/check_mllm_eval_completeness.py",
|
|
2496
|
+
"size": 9380,
|
|
2497
|
+
"sha256": "fe24a9b0dfcce7d826c29be59f2534c768daf73e1e98f545e8a7791bc0709079"
|
|
2498
|
+
},
|
|
2499
|
+
{
|
|
2500
|
+
"path": "skills/mllm-eval/scripts/mllm_eval_completeness_challenge/fixture/plan_bad.md",
|
|
2501
|
+
"size": 202,
|
|
2502
|
+
"sha256": "41cd455b9a747f92506091f0a8fa607e069042c4add683d12b274e6081538ea1"
|
|
2503
|
+
},
|
|
2504
|
+
{
|
|
2505
|
+
"path": "skills/mllm-eval/scripts/mllm_eval_completeness_challenge/fixture/plan_good.md",
|
|
2506
|
+
"size": 795,
|
|
2507
|
+
"sha256": "93b703c163348e766dfbd2d01b2fc7267b57a082652d8bdd839b23646caa99a6"
|
|
2508
|
+
},
|
|
2509
|
+
{
|
|
2510
|
+
"path": "skills/mllm-eval/scripts/mllm_eval_completeness_challenge/problem.md",
|
|
2511
|
+
"size": 1681,
|
|
2512
|
+
"sha256": "dc9ce54a7bd47ff5d3383c76e681760c0891dc503933863948df1cd999a11a0e"
|
|
2513
|
+
},
|
|
2514
|
+
{
|
|
2515
|
+
"path": "skills/mllm-eval/scripts/mllm_eval_completeness_challenge/verify.sh",
|
|
2516
|
+
"size": 1335,
|
|
2517
|
+
"sha256": "7c3afbcd5adecdcdc8a2c9d14251521e2bfa39cbd3f650e77c92f37aabe49c9c"
|
|
2518
|
+
},
|
|
2519
|
+
{
|
|
2520
|
+
"path": "skills/mllm-eval/skill.yml",
|
|
2521
|
+
"size": 3373,
|
|
2522
|
+
"sha256": "72fcc60d62edc95808df7cc0ff283822069caaa61e9163fc8d3f298a3afa3801"
|
|
2523
|
+
},
|
|
2524
|
+
{
|
|
2525
|
+
"path": "skills/model-card/SKILL.md",
|
|
2526
|
+
"size": 5807,
|
|
2527
|
+
"sha256": "070b1ab8391a37bc4ffebadb918b71e83251da2293d119f5b0cfbf28bea0d4c2"
|
|
2528
|
+
},
|
|
2529
|
+
{
|
|
2530
|
+
"path": "skills/model-card/references/datasheet_template.md",
|
|
2531
|
+
"size": 2280,
|
|
2532
|
+
"sha256": "11998d71a43fcdf75d7f3b72cd46de7f9e4d999ac6b0b6febd5a3dee92a7a517"
|
|
2533
|
+
},
|
|
2534
|
+
{
|
|
2535
|
+
"path": "skills/model-card/references/metric_dimensions.md",
|
|
2536
|
+
"size": 3066,
|
|
2537
|
+
"sha256": "70aeb1af8ed7510aff0562c8ac99852a0b1b49de5eb3ef923a1bbeb4f4c051eb"
|
|
2538
|
+
},
|
|
2539
|
+
{
|
|
2540
|
+
"path": "skills/model-card/references/model_card_template.md",
|
|
2541
|
+
"size": 3239,
|
|
2542
|
+
"sha256": "e40ed0b7fd1a7370d22bb74a596048d1e09b75c14f1b2064ba89d06c886cefbd"
|
|
2543
|
+
},
|
|
2544
|
+
{
|
|
2545
|
+
"path": "skills/model-card/scripts/check_model_card_complete.py",
|
|
2546
|
+
"size": 8856,
|
|
2547
|
+
"sha256": "aa1fdc6a88e18696d0dfc23397a8a9141c1219583081deb5e27b822f152d4005"
|
|
2548
|
+
},
|
|
2549
|
+
{
|
|
2550
|
+
"path": "skills/model-card/scripts/check_model_card_complete_challenge/fixture/complete/DATASHEET.md",
|
|
2551
|
+
"size": 2179,
|
|
2552
|
+
"sha256": "1b53763c3017c88de0ddc583fc6a1975400d69d1929852580fd96c7fe08ccc3e"
|
|
2553
|
+
},
|
|
2554
|
+
{
|
|
2555
|
+
"path": "skills/model-card/scripts/check_model_card_complete_challenge/fixture/complete/MODEL_CARD.md",
|
|
2556
|
+
"size": 2785,
|
|
2557
|
+
"sha256": "fbb5ce99d2d144ecb53d1581826758d4aece996351089e7592999873760dcfaf"
|
|
2558
|
+
},
|
|
2559
|
+
{
|
|
2560
|
+
"path": "skills/model-card/scripts/check_model_card_complete_challenge/fixture/incomplete/MODEL_CARD.md",
|
|
2561
|
+
"size": 880,
|
|
2562
|
+
"sha256": "9b017400531316d787b71aaa7bc4a1fc82aa7f782e54df1eda1c34cde8980db4"
|
|
2563
|
+
},
|
|
2564
|
+
{
|
|
2565
|
+
"path": "skills/model-card/scripts/check_model_card_complete_challenge/problem.md",
|
|
2566
|
+
"size": 1853,
|
|
2567
|
+
"sha256": "dc85f56704dfd049cd9807d0ffd77bc1264de69c2b20ca3e691f6eedc6843deb"
|
|
2568
|
+
},
|
|
2569
|
+
{
|
|
2570
|
+
"path": "skills/model-card/scripts/check_model_card_complete_challenge/verify.sh",
|
|
2571
|
+
"size": 1857,
|
|
2572
|
+
"sha256": "8a8ee577857f4333b38313d6a322f02a54d8011698251bbec4e1a7d6bd758b21"
|
|
2573
|
+
},
|
|
2574
|
+
{
|
|
2575
|
+
"path": "skills/model-card/skill.yml",
|
|
2576
|
+
"size": 2877,
|
|
2577
|
+
"sha256": "0d71da374191ca35545b90130d7d30d4693e4bd469014a3b0993063bdfd4b958"
|
|
2578
|
+
},
|
|
2579
|
+
{
|
|
2580
|
+
"path": "skills/model-evaluation/SKILL.md",
|
|
2581
|
+
"size": 5031,
|
|
2582
|
+
"sha256": "17ffde905359e4cffdf747422b7d41c214d2abfcc71e50e1b1e4a689d87fa695"
|
|
2583
|
+
},
|
|
2584
|
+
{
|
|
2585
|
+
"path": "skills/model-evaluation/references/metric_guide.md",
|
|
2586
|
+
"size": 2454,
|
|
2587
|
+
"sha256": "8d09ca7ce9fb9f66ee4942689294d9b12ae1d892ac67769cd68fdc38a4e220ee"
|
|
2588
|
+
},
|
|
2589
|
+
{
|
|
2590
|
+
"path": "skills/model-evaluation/scripts/check_metric_reporting.py",
|
|
2591
|
+
"size": 9564,
|
|
2592
|
+
"sha256": "c33f52ee62ae93417027d0bb0b6cf2a95f5747d52403ab99c075bc64a5e2c593"
|
|
2593
|
+
},
|
|
2594
|
+
{
|
|
2595
|
+
"path": "skills/model-evaluation/scripts/metric_reporting_challenge/fixture/clf_bad.md",
|
|
2596
|
+
"size": 84,
|
|
2597
|
+
"sha256": "571aceb9567454e8bbe12e0967bc4cde4b142da99f6056f7530f3b8723ddf77c"
|
|
2598
|
+
},
|
|
2599
|
+
{
|
|
2600
|
+
"path": "skills/model-evaluation/scripts/metric_reporting_challenge/fixture/clf_good.md",
|
|
2601
|
+
"size": 186,
|
|
2602
|
+
"sha256": "ba44a3b38b4128fa713555c8b332f211e9087e6bc016d80af4c3074c3ca6ef8e"
|
|
2603
|
+
},
|
|
2604
|
+
{
|
|
2605
|
+
"path": "skills/model-evaluation/scripts/metric_reporting_challenge/fixture/seg_bad.md",
|
|
2606
|
+
"size": 119,
|
|
2607
|
+
"sha256": "50c138840976b8fa010cb0ca9fd24fffc7181e275eb6c71e76500da7d2a0420d"
|
|
2608
|
+
},
|
|
2609
|
+
{
|
|
2610
|
+
"path": "skills/model-evaluation/scripts/metric_reporting_challenge/fixture/seg_good.md",
|
|
2611
|
+
"size": 207,
|
|
2612
|
+
"sha256": "903a2dbd61cf56ce8e3d808f867ebd47ba4d6f2bd1542d7482b85477a6876eb0"
|
|
2613
|
+
},
|
|
2614
|
+
{
|
|
2615
|
+
"path": "skills/model-evaluation/scripts/metric_reporting_challenge/problem.md",
|
|
2616
|
+
"size": 1599,
|
|
2617
|
+
"sha256": "1f842374e3569d5fc27d7c26aa7f6bc6be43f7f38d2d9f3e2f9ab62fb29ddd65"
|
|
2618
|
+
},
|
|
2619
|
+
{
|
|
2620
|
+
"path": "skills/model-evaluation/scripts/metric_reporting_challenge/verify.sh",
|
|
2621
|
+
"size": 1235,
|
|
2622
|
+
"sha256": "f819d1333a7206db6383ccbd41c6eadae015004e61ae335e67a3334936c58cc8"
|
|
2623
|
+
},
|
|
2624
|
+
{
|
|
2625
|
+
"path": "skills/model-evaluation/skill.yml",
|
|
2626
|
+
"size": 2921,
|
|
2627
|
+
"sha256": "9713dbab40c54ca88324e7dcd74d3142890f9625ad68d708ba40b0cf57a7b9ee"
|
|
2628
|
+
},
|
|
2629
|
+
{
|
|
2630
|
+
"path": "skills/model-scaffold/SKILL.md",
|
|
2631
|
+
"size": 7048,
|
|
2632
|
+
"sha256": "a1612de8a2888667137c3d81100adcb4a6c42d45c73edf93f715fad1da7e179f"
|
|
2633
|
+
},
|
|
2634
|
+
{
|
|
2635
|
+
"path": "skills/model-scaffold/references/training_guide.md",
|
|
2636
|
+
"size": 2661,
|
|
2637
|
+
"sha256": "4a3197a89b8d3473071051f67a7bcf40f71ecf007e942f81e9c40dc48fce1a9c"
|
|
2638
|
+
},
|
|
2639
|
+
{
|
|
2640
|
+
"path": "skills/model-scaffold/scripts/check_training_hygiene.py",
|
|
2641
|
+
"size": 11752,
|
|
2642
|
+
"sha256": "66970049c85e46a0080b5f19eb3b5ac9dfd656a674b6f1698825e968eedd4814"
|
|
2643
|
+
},
|
|
2644
|
+
{
|
|
2645
|
+
"path": "skills/model-scaffold/scripts/scaffold.py",
|
|
2646
|
+
"size": 19327,
|
|
2647
|
+
"sha256": "d37d617d9753faf6cd6f4d9332d896ad3704d4f2dea8578d4d23f02baedbfd09"
|
|
2648
|
+
},
|
|
2649
|
+
{
|
|
2650
|
+
"path": "skills/model-scaffold/scripts/scaffold_challenge/expected/split_assignment.csv",
|
|
2651
|
+
"size": 144,
|
|
2652
|
+
"sha256": "23949c5c9d179ef152127e0e6b865138169184f95c4e2d5234a65bab3762bd71"
|
|
2653
|
+
},
|
|
2654
|
+
{
|
|
2655
|
+
"path": "skills/model-scaffold/scripts/scaffold_challenge/fixture/manifest.csv",
|
|
2656
|
+
"size": 582,
|
|
2657
|
+
"sha256": "defce0cdce35211f038b139a9ab4214c63b22f3e60ba7ee74fa6bea8fe33aa7f"
|
|
2658
|
+
},
|
|
2659
|
+
{
|
|
2660
|
+
"path": "skills/model-scaffold/scripts/scaffold_challenge/problem.md",
|
|
2661
|
+
"size": 2678,
|
|
2662
|
+
"sha256": "369e98da65cbd16c67f5ff3f17d99b707d713bbf3239409f9921190c85f8f08a"
|
|
2663
|
+
},
|
|
2664
|
+
{
|
|
2665
|
+
"path": "skills/model-scaffold/scripts/scaffold_challenge/verify.sh",
|
|
2666
|
+
"size": 4191,
|
|
2667
|
+
"sha256": "f2476dc72772ffa77ba13ed43067a19bf4f9b6fbce9ce49a1726eee2f64d7b21"
|
|
2668
|
+
},
|
|
2669
|
+
{
|
|
2670
|
+
"path": "skills/model-scaffold/skill.yml",
|
|
2671
|
+
"size": 3104,
|
|
2672
|
+
"sha256": "a6284452adbbb533c63dcd294c5b4b7fce7d93e1be381d27323168ac3888ba33"
|
|
2673
|
+
},
|
|
2674
|
+
{
|
|
2675
|
+
"path": "skills/model-validation/SKILL.md",
|
|
2676
|
+
"size": 9347,
|
|
2677
|
+
"sha256": "ecd48672a03923bf1ace63528fd2dbcf138cd880103cc8c40345b3857d66ad1c"
|
|
2678
|
+
},
|
|
2679
|
+
{
|
|
2680
|
+
"path": "skills/model-validation/scripts/check_split_leakage.py",
|
|
2681
|
+
"size": 11616,
|
|
2682
|
+
"sha256": "a207b82abbb5914927e0de25663820c250207b0b1689f8ed17bfe6bda9eed6e2"
|
|
2683
|
+
},
|
|
2684
|
+
{
|
|
2685
|
+
"path": "skills/model-validation/scripts/check_split_leakage_challenge/expected/clean.txt",
|
|
2686
|
+
"size": 358,
|
|
2687
|
+
"sha256": "5d1e203ebc6656c172f60f4cd4eb3954fdbcd77579a6768c6bbd56952a966e6c"
|
|
2688
|
+
},
|
|
2689
|
+
{
|
|
2690
|
+
"path": "skills/model-validation/scripts/check_split_leakage_challenge/expected/leak.txt",
|
|
2691
|
+
"size": 470,
|
|
2692
|
+
"sha256": "34be75bbbabf10073a1fd11587e019491b7319e2030b166a1ab3e82e4899f3c2"
|
|
2693
|
+
},
|
|
2694
|
+
{
|
|
2695
|
+
"path": "skills/model-validation/scripts/check_split_leakage_challenge/fixture/split_seed.txt",
|
|
2696
|
+
"size": 3,
|
|
2697
|
+
"sha256": "084c799cd551dd1d8d5c5f9a5d593b2e931f5e36122ee5c793c1d08a19839cc0"
|
|
2698
|
+
},
|
|
2699
|
+
{
|
|
2700
|
+
"path": "skills/model-validation/scripts/check_split_leakage_challenge/fixture/splits_clean.csv",
|
|
2701
|
+
"size": 150,
|
|
2702
|
+
"sha256": "a4a15320685b58c4868737e40b4df0a07a942b39b5d94611e87d63d22e88aee0"
|
|
2703
|
+
},
|
|
2704
|
+
{
|
|
2705
|
+
"path": "skills/model-validation/scripts/check_split_leakage_challenge/fixture/splits_leak.csv",
|
|
2706
|
+
"size": 145,
|
|
2707
|
+
"sha256": "1bc2cc7b11a7a4a9ddc0168a83eab33ea1b03e3ca98bda5301679a18e19faf53"
|
|
2708
|
+
},
|
|
2709
|
+
{
|
|
2710
|
+
"path": "skills/model-validation/scripts/check_split_leakage_challenge/problem.md",
|
|
2711
|
+
"size": 2347,
|
|
2712
|
+
"sha256": "f140095ec5d190120bf73dc62710b2ccac31c7f7d54307a0854c8438df61940e"
|
|
2713
|
+
},
|
|
2714
|
+
{
|
|
2715
|
+
"path": "skills/model-validation/scripts/check_split_leakage_challenge/verify.sh",
|
|
2716
|
+
"size": 1925,
|
|
2717
|
+
"sha256": "9ae88c109caa1408a3a3b08ea0583fc97ce98b93c909f75d043f08a231e91e61"
|
|
2718
|
+
},
|
|
2719
|
+
{
|
|
2720
|
+
"path": "skills/model-validation/skill.yml",
|
|
2721
|
+
"size": 3079,
|
|
2722
|
+
"sha256": "4891c0698445f98552ab2a2315bc8288a6cc4744f8711e20f939c8af8739e434"
|
|
2723
|
+
},
|
|
2414
2724
|
{
|
|
2415
2725
|
"path": "skills/orchestrate/SKILL.md",
|
|
2416
2726
|
"size": 35203,
|
|
@@ -2438,8 +2748,8 @@
|
|
|
2438
2748
|
},
|
|
2439
2749
|
{
|
|
2440
2750
|
"path": "skills/peer-review/SKILL.md",
|
|
2441
|
-
"size":
|
|
2442
|
-
"sha256": "
|
|
2751
|
+
"size": 58493,
|
|
2752
|
+
"sha256": "057c39cd131c49eeb1949560a0d510f176a012431a0c8d36dd803061f98e0629"
|
|
2443
2753
|
},
|
|
2444
2754
|
{
|
|
2445
2755
|
"path": "skills/peer-review/references/aczel_2021_reviewer2_patterns.md",
|
|
@@ -2481,6 +2791,16 @@
|
|
|
2481
2791
|
"size": 11244,
|
|
2482
2792
|
"sha256": "197cfaa4bdcfe223a0ebfb69c229ccb3852160ab76870ade914eb8997ab684c5"
|
|
2483
2793
|
},
|
|
2794
|
+
{
|
|
2795
|
+
"path": "skills/peer-review/references/domain-probes/mllm_evaluation.md",
|
|
2796
|
+
"size": 7785,
|
|
2797
|
+
"sha256": "1b63f7d987bc2ba8b9e67008b1713d4e874437f22c46002a12dcda1da0b73d2a"
|
|
2798
|
+
},
|
|
2799
|
+
{
|
|
2800
|
+
"path": "skills/peer-review/references/domain-probes/model_development.md",
|
|
2801
|
+
"size": 10438,
|
|
2802
|
+
"sha256": "263db14ecedfc51caffb8b4966bade4566706b3ae4ce67d0b15840bdbbcdba07"
|
|
2803
|
+
},
|
|
2484
2804
|
{
|
|
2485
2805
|
"path": "skills/peer-review/references/domain-probes/narrative_review.md",
|
|
2486
2806
|
"size": 12598,
|
|
@@ -2933,8 +3253,8 @@
|
|
|
2933
3253
|
},
|
|
2934
3254
|
{
|
|
2935
3255
|
"path": "skills/self-review/SKILL.md",
|
|
2936
|
-
"size":
|
|
2937
|
-
"sha256": "
|
|
3256
|
+
"size": 94657,
|
|
3257
|
+
"sha256": "14c982c492d6305c238737366f0996415133fe02ff9aaad7e2c2207d78d260a2"
|
|
2938
3258
|
},
|
|
2939
3259
|
{
|
|
2940
3260
|
"path": "skills/self-review/references/domain-probes/ai_overclaiming.md",
|
|
@@ -2971,6 +3291,16 @@
|
|
|
2971
3291
|
"size": 11244,
|
|
2972
3292
|
"sha256": "197cfaa4bdcfe223a0ebfb69c229ccb3852160ab76870ade914eb8997ab684c5"
|
|
2973
3293
|
},
|
|
3294
|
+
{
|
|
3295
|
+
"path": "skills/self-review/references/domain-probes/mllm_evaluation.md",
|
|
3296
|
+
"size": 7785,
|
|
3297
|
+
"sha256": "1b63f7d987bc2ba8b9e67008b1713d4e874437f22c46002a12dcda1da0b73d2a"
|
|
3298
|
+
},
|
|
3299
|
+
{
|
|
3300
|
+
"path": "skills/self-review/references/domain-probes/model_development.md",
|
|
3301
|
+
"size": 10438,
|
|
3302
|
+
"sha256": "263db14ecedfc51caffb8b4966bade4566706b3ae4ce67d0b15840bdbbcdba07"
|
|
3303
|
+
},
|
|
2974
3304
|
{
|
|
2975
3305
|
"path": "skills/self-review/references/domain-probes/narrative_review.md",
|
|
2976
3306
|
"size": 12598,
|
|
@@ -3418,8 +3748,8 @@
|
|
|
3418
3748
|
},
|
|
3419
3749
|
{
|
|
3420
3750
|
"path": "skills/write-paper/references/journal_profiles/Clinical_and_Molecular_Hepatology.md",
|
|
3421
|
-
"size":
|
|
3422
|
-
"sha256": "
|
|
3751
|
+
"size": 8585,
|
|
3752
|
+
"sha256": "b268d9cf8caa255e72ab4cbc7960473de7666e8c65e86cb3d2e41ea6791a0642"
|
|
3423
3753
|
},
|
|
3424
3754
|
{
|
|
3425
3755
|
"path": "skills/write-paper/references/journal_profiles/Diabetes_Metabolism_Journal.md",
|
|
@@ -1,10 +1,11 @@
|
|
|
1
1
|
{
|
|
2
2
|
"schema_version": 1,
|
|
3
|
-
"version": "4.
|
|
3
|
+
"version": "4.11.0",
|
|
4
4
|
"owned_skills": [
|
|
5
5
|
"academic-aio",
|
|
6
6
|
"add-journal",
|
|
7
7
|
"analyze-stats",
|
|
8
|
+
"architecture-zoo",
|
|
8
9
|
"author-strategy",
|
|
9
10
|
"batch-cohort",
|
|
10
11
|
"calc-sample-size",
|
|
@@ -30,6 +31,11 @@
|
|
|
30
31
|
"manage-project",
|
|
31
32
|
"manage-refs",
|
|
32
33
|
"meta-analysis",
|
|
34
|
+
"mllm-eval",
|
|
35
|
+
"model-card",
|
|
36
|
+
"model-evaluation",
|
|
37
|
+
"model-scaffold",
|
|
38
|
+
"model-validation",
|
|
33
39
|
"orchestrate",
|
|
34
40
|
"peer-review",
|
|
35
41
|
"polish-language",
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"_comment": "AUTO-GENERATED by scripts/gen_skills_catalog_json.py from each skills/<slug>/SKILL.md + skill.yml. Machine-readable skill catalog (single source of truth) consumed by external surfaces such as the aperivue.com storefront to gate skill-list completeness. Do not hand-edit; CI gate: python3 scripts/gen_skills_catalog_json.py --check.",
|
|
3
|
-
"skill_count":
|
|
3
|
+
"skill_count": 51,
|
|
4
4
|
"categories": [
|
|
5
5
|
{
|
|
6
6
|
"key": "literature_references",
|
|
@@ -17,6 +17,7 @@
|
|
|
17
17
|
"key": "data_study_design",
|
|
18
18
|
"label": "Data & Study Design",
|
|
19
19
|
"slugs": [
|
|
20
|
+
"architecture-zoo",
|
|
20
21
|
"calc-sample-size",
|
|
21
22
|
"clean-data",
|
|
22
23
|
"define-variables",
|
|
@@ -24,6 +25,11 @@
|
|
|
24
25
|
"design-ai-benchmarking",
|
|
25
26
|
"design-study",
|
|
26
27
|
"generate-codebook",
|
|
28
|
+
"mllm-eval",
|
|
29
|
+
"model-card",
|
|
30
|
+
"model-evaluation",
|
|
31
|
+
"model-scaffold",
|
|
32
|
+
"model-validation",
|
|
27
33
|
"version-dataset"
|
|
28
34
|
]
|
|
29
35
|
},
|
|
@@ -124,6 +130,15 @@
|
|
|
124
130
|
"maturity": "official",
|
|
125
131
|
"description": "Statistical analysis for medical research papers."
|
|
126
132
|
},
|
|
133
|
+
{
|
|
134
|
+
"slug": "architecture-zoo",
|
|
135
|
+
"category": "data_study_design",
|
|
136
|
+
"category_label": "Data & Study Design",
|
|
137
|
+
"layer": "D",
|
|
138
|
+
"owner_domain": "architecture_reference",
|
|
139
|
+
"maturity": "official",
|
|
140
|
+
"description": "Choose a model architecture for a medical-imaging research question before scaffolding."
|
|
141
|
+
},
|
|
127
142
|
{
|
|
128
143
|
"slug": "author-strategy",
|
|
129
144
|
"category": "project_workflow",
|
|
@@ -349,6 +364,51 @@
|
|
|
349
364
|
"maturity": "official",
|
|
350
365
|
"description": "Systematic review and meta-analysis pipeline for medical research."
|
|
351
366
|
},
|
|
367
|
+
{
|
|
368
|
+
"slug": "mllm-eval",
|
|
369
|
+
"category": "data_study_design",
|
|
370
|
+
"category_label": "Data & Study Design",
|
|
371
|
+
"layer": "D",
|
|
372
|
+
"owner_domain": "model_evaluation",
|
|
373
|
+
"maturity": "official",
|
|
374
|
+
"description": "Design or audit a model-agnostic evaluation harness for an LLM or multimodal LLM on a clinical task (radiology report generation, visual question answering, clinical text extraction/classification) —…"
|
|
375
|
+
},
|
|
376
|
+
{
|
|
377
|
+
"slug": "model-card",
|
|
378
|
+
"category": "data_study_design",
|
|
379
|
+
"category_label": "Data & Study Design",
|
|
380
|
+
"layer": "C",
|
|
381
|
+
"owner_domain": "model_reporting",
|
|
382
|
+
"maturity": "official",
|
|
383
|
+
"description": "Generate the documentation an engineer-built medical-imaging model must carry — a Model Card (Mitchell et al."
|
|
384
|
+
},
|
|
385
|
+
{
|
|
386
|
+
"slug": "model-evaluation",
|
|
387
|
+
"category": "data_study_design",
|
|
388
|
+
"category_label": "Data & Study Design",
|
|
389
|
+
"layer": "B",
|
|
390
|
+
"owner_domain": "model_evaluation",
|
|
391
|
+
"maturity": "official",
|
|
392
|
+
"description": "Compute and report task-correct held-out metrics for a trained medical-imaging model — segmentation (Dice plus a boundary metric such as HD95 or NSD, per structure), classification (AUROC plus AUPRC a…"
|
|
393
|
+
},
|
|
394
|
+
{
|
|
395
|
+
"slug": "model-scaffold",
|
|
396
|
+
"category": "data_study_design",
|
|
397
|
+
"category_label": "Data & Study Design",
|
|
398
|
+
"layer": "B",
|
|
399
|
+
"owner_domain": "model_development",
|
|
400
|
+
"maturity": "official",
|
|
401
|
+
"description": "Generate a reproducible, runnable PyTorch training repo for a medical-imaging segmentation task — the missing middle link between choosing an architecture and validating a trained model."
|
|
402
|
+
},
|
|
403
|
+
{
|
|
404
|
+
"slug": "model-validation",
|
|
405
|
+
"category": "data_study_design",
|
|
406
|
+
"category_label": "Data & Study Design",
|
|
407
|
+
"layer": "D",
|
|
408
|
+
"owner_domain": "model_validation",
|
|
409
|
+
"maturity": "official",
|
|
410
|
+
"description": "Design or audit the clinical-validation study for an engineer-built medical-imaging model (segmentation, classification, or detection) before the validation report or manuscript is written."
|
|
411
|
+
},
|
|
352
412
|
{
|
|
353
413
|
"slug": "orchestrate",
|
|
354
414
|
"category": "project_workflow",
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "medsci-skills",
|
|
3
|
-
"version": "4.
|
|
3
|
+
"version": "4.11.0",
|
|
4
4
|
"description": "MedSci Skills — a medical/scientific research skill suite for AI coding agents (Claude Code, Codex, Cursor, Copilot). The npm package is a terminal-friendly installer shortcut; the canonical distribution remains the GitHub repository and the Claude Code plugin marketplace.",
|
|
5
5
|
"license": "SEE LICENSE IN LICENSE",
|
|
6
6
|
"homepage": "https://github.com/Aperivue/medsci-skills#readme",
|