javi-forge 1.2.0 → 1.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (346) hide show
  1. package/ci-local/ci-local.sh +29 -9
  2. package/ci-local/hooks/commit-msg +0 -0
  3. package/ci-local/hooks/pre-commit +1 -1
  4. package/ci-local/hooks/pre-push +0 -0
  5. package/ci-local/install.sh +0 -0
  6. package/ci-local/lib/common.sh +183 -0
  7. package/dist/__integration__/helpers.d.ts +20 -0
  8. package/dist/__integration__/helpers.d.ts.map +1 -0
  9. package/dist/__integration__/helpers.js +31 -0
  10. package/dist/__integration__/helpers.js.map +1 -0
  11. package/dist/commands/analyze.d.ts.map +1 -0
  12. package/dist/commands/analyze.js.map +1 -0
  13. package/dist/commands/ci.d.ts.map +1 -0
  14. package/dist/commands/ci.js +13 -8
  15. package/dist/commands/ci.js.map +1 -0
  16. package/dist/commands/doctor.d.ts.map +1 -0
  17. package/dist/commands/doctor.js +1 -3
  18. package/dist/commands/doctor.js.map +1 -0
  19. package/dist/commands/init.d.ts.map +1 -0
  20. package/dist/commands/init.js +14 -6
  21. package/dist/commands/init.js.map +1 -0
  22. package/dist/commands/llmstxt.d.ts.map +1 -0
  23. package/dist/commands/llmstxt.js.map +1 -0
  24. package/dist/commands/plugin.d.ts.map +1 -0
  25. package/dist/commands/plugin.js.map +1 -0
  26. package/dist/constants.d.ts +0 -4
  27. package/dist/constants.d.ts.map +1 -0
  28. package/dist/constants.js +0 -4
  29. package/dist/constants.js.map +1 -0
  30. package/dist/index.d.ts.map +1 -0
  31. package/dist/index.js +18 -11
  32. package/dist/index.js.map +1 -0
  33. package/dist/lib/common.d.ts.map +1 -0
  34. package/dist/lib/common.js.map +1 -0
  35. package/dist/lib/docker.d.ts +2 -0
  36. package/dist/lib/docker.d.ts.map +1 -0
  37. package/dist/lib/docker.js +2 -1
  38. package/dist/lib/docker.js.map +1 -0
  39. package/dist/lib/frontmatter.d.ts.map +1 -0
  40. package/dist/lib/frontmatter.js.map +1 -0
  41. package/dist/lib/plugin.d.ts.map +1 -0
  42. package/dist/lib/plugin.js.map +1 -0
  43. package/dist/lib/template.d.ts.map +1 -0
  44. package/dist/lib/template.js.map +1 -0
  45. package/dist/types/index.d.ts.map +1 -0
  46. package/dist/types/index.js.map +1 -0
  47. package/dist/ui/AnalyzeUI.d.ts.map +1 -0
  48. package/dist/ui/AnalyzeUI.js.map +1 -0
  49. package/dist/ui/App.d.ts.map +1 -0
  50. package/dist/ui/App.js.map +1 -0
  51. package/dist/ui/CI.d.ts.map +1 -0
  52. package/dist/ui/CI.js.map +1 -0
  53. package/dist/ui/CIContext.d.ts.map +1 -0
  54. package/dist/ui/CIContext.js.map +1 -0
  55. package/dist/ui/CISelector.d.ts.map +1 -0
  56. package/dist/ui/CISelector.js.map +1 -0
  57. package/dist/ui/Doctor.d.ts.map +1 -0
  58. package/dist/ui/Doctor.js +1 -1
  59. package/dist/ui/Doctor.js.map +1 -0
  60. package/dist/ui/Header.d.ts.map +1 -0
  61. package/dist/ui/Header.js.map +1 -0
  62. package/dist/ui/LlmsTxt.d.ts.map +1 -0
  63. package/dist/ui/LlmsTxt.js.map +1 -0
  64. package/dist/ui/MemorySelector.d.ts.map +1 -0
  65. package/dist/ui/MemorySelector.js.map +1 -0
  66. package/dist/ui/NameInput.d.ts.map +1 -0
  67. package/dist/ui/NameInput.js.map +1 -0
  68. package/dist/ui/OptionSelector.d.ts.map +1 -0
  69. package/dist/ui/OptionSelector.js +1 -1
  70. package/dist/ui/OptionSelector.js.map +1 -0
  71. package/dist/ui/Plugin.d.ts.map +1 -0
  72. package/dist/ui/Plugin.js.map +1 -0
  73. package/dist/ui/Progress.d.ts.map +1 -0
  74. package/dist/ui/Progress.js.map +1 -0
  75. package/dist/ui/StackSelector.d.ts.map +1 -0
  76. package/dist/ui/StackSelector.js.map +1 -0
  77. package/dist/ui/Summary.d.ts.map +1 -0
  78. package/dist/ui/Summary.js.map +1 -0
  79. package/dist/ui/Welcome.d.ts.map +1 -0
  80. package/dist/ui/Welcome.js.map +1 -0
  81. package/dist/ui/theme.d.ts.map +1 -0
  82. package/dist/ui/theme.js.map +1 -0
  83. package/lib/common.sh +2 -2
  84. package/modules/ghagga/README.md +2 -2
  85. package/modules/ghagga/setup-ghagga.sh +1 -1
  86. package/package.json +25 -12
  87. package/templates/github/ci-go.yml +1 -1
  88. package/templates/github/ci-java.yml +2 -2
  89. package/templates/github/ci-node.yml +1 -1
  90. package/templates/github/ci-python.yml +1 -1
  91. package/templates/github/ci-rust.yml +1 -1
  92. package/templates/github/ghagga-review.yml +28 -0
  93. package/workflows/reusable-build-go.yml +1 -1
  94. package/workflows/reusable-build-java.yml +1 -1
  95. package/workflows/reusable-build-node.yml +1 -1
  96. package/workflows/reusable-build-python.yml +1 -1
  97. package/workflows/reusable-build-rust.yml +1 -1
  98. package/workflows/reusable-docker.yml +1 -1
  99. package/workflows/reusable-ghagga-review.yml +1 -1
  100. package/workflows/reusable-release.yml +1 -1
  101. package/.releaserc +0 -45
  102. package/ai-config/.skillignore +0 -15
  103. package/ai-config/AUTO_INVOKE.md +0 -300
  104. package/ai-config/agents/_TEMPLATE.md +0 -93
  105. package/ai-config/agents/business/api-designer.md +0 -1657
  106. package/ai-config/agents/business/business-analyst.md +0 -1331
  107. package/ai-config/agents/business/product-strategist.md +0 -206
  108. package/ai-config/agents/business/project-manager.md +0 -178
  109. package/ai-config/agents/business/requirements-analyst.md +0 -1277
  110. package/ai-config/agents/business/technical-writer.md +0 -1679
  111. package/ai-config/agents/creative/ux-designer.md +0 -205
  112. package/ai-config/agents/data-ai/ai-engineer.md +0 -487
  113. package/ai-config/agents/data-ai/analytics-engineer.md +0 -953
  114. package/ai-config/agents/data-ai/data-engineer.md +0 -173
  115. package/ai-config/agents/data-ai/data-scientist.md +0 -672
  116. package/ai-config/agents/data-ai/mlops-engineer.md +0 -814
  117. package/ai-config/agents/data-ai/prompt-engineer.md +0 -772
  118. package/ai-config/agents/development/angular-expert.md +0 -620
  119. package/ai-config/agents/development/backend-architect.md +0 -795
  120. package/ai-config/agents/development/database-specialist.md +0 -212
  121. package/ai-config/agents/development/frontend-specialist.md +0 -686
  122. package/ai-config/agents/development/fullstack-engineer.md +0 -668
  123. package/ai-config/agents/development/golang-pro.md +0 -338
  124. package/ai-config/agents/development/java-enterprise.md +0 -400
  125. package/ai-config/agents/development/javascript-pro.md +0 -422
  126. package/ai-config/agents/development/nextjs-pro.md +0 -474
  127. package/ai-config/agents/development/python-pro.md +0 -570
  128. package/ai-config/agents/development/react-pro.md +0 -487
  129. package/ai-config/agents/development/rust-pro.md +0 -246
  130. package/ai-config/agents/development/spring-boot-4-expert.md +0 -326
  131. package/ai-config/agents/development/typescript-pro.md +0 -336
  132. package/ai-config/agents/development/vue-specialist.md +0 -605
  133. package/ai-config/agents/infrastructure/cloud-architect.md +0 -472
  134. package/ai-config/agents/infrastructure/deployment-manager.md +0 -358
  135. package/ai-config/agents/infrastructure/devops-engineer.md +0 -455
  136. package/ai-config/agents/infrastructure/incident-responder.md +0 -519
  137. package/ai-config/agents/infrastructure/kubernetes-expert.md +0 -705
  138. package/ai-config/agents/infrastructure/monitoring-specialist.md +0 -674
  139. package/ai-config/agents/infrastructure/performance-engineer.md +0 -658
  140. package/ai-config/agents/orchestrator.md +0 -241
  141. package/ai-config/agents/quality/accessibility-auditor.md +0 -1204
  142. package/ai-config/agents/quality/code-reviewer-compact.md +0 -123
  143. package/ai-config/agents/quality/code-reviewer.md +0 -363
  144. package/ai-config/agents/quality/dependency-manager.md +0 -743
  145. package/ai-config/agents/quality/e2e-test-specialist.md +0 -1005
  146. package/ai-config/agents/quality/performance-tester.md +0 -1086
  147. package/ai-config/agents/quality/security-auditor.md +0 -133
  148. package/ai-config/agents/quality/test-engineer.md +0 -453
  149. package/ai-config/agents/specialists/api-designer.md +0 -87
  150. package/ai-config/agents/specialists/backend-architect.md +0 -73
  151. package/ai-config/agents/specialists/code-reviewer.md +0 -77
  152. package/ai-config/agents/specialists/db-optimizer.md +0 -75
  153. package/ai-config/agents/specialists/devops-engineer.md +0 -83
  154. package/ai-config/agents/specialists/documentation-writer.md +0 -78
  155. package/ai-config/agents/specialists/frontend-developer.md +0 -75
  156. package/ai-config/agents/specialists/performance-analyst.md +0 -82
  157. package/ai-config/agents/specialists/refactor-specialist.md +0 -74
  158. package/ai-config/agents/specialists/security-auditor.md +0 -74
  159. package/ai-config/agents/specialists/test-engineer.md +0 -81
  160. package/ai-config/agents/specialists/ux-consultant.md +0 -76
  161. package/ai-config/agents/specialized/agent-generator.md +0 -1190
  162. package/ai-config/agents/specialized/blockchain-developer.md +0 -149
  163. package/ai-config/agents/specialized/code-migrator.md +0 -892
  164. package/ai-config/agents/specialized/context-manager.md +0 -978
  165. package/ai-config/agents/specialized/documentation-writer.md +0 -1078
  166. package/ai-config/agents/specialized/ecommerce-expert.md +0 -1756
  167. package/ai-config/agents/specialized/embedded-engineer.md +0 -1714
  168. package/ai-config/agents/specialized/error-detective.md +0 -1034
  169. package/ai-config/agents/specialized/fintech-specialist.md +0 -1659
  170. package/ai-config/agents/specialized/freelance-project-planner-v2.md +0 -1988
  171. package/ai-config/agents/specialized/freelance-project-planner-v3.md +0 -2136
  172. package/ai-config/agents/specialized/freelance-project-planner-v4.md +0 -4503
  173. package/ai-config/agents/specialized/freelance-project-planner.md +0 -722
  174. package/ai-config/agents/specialized/game-developer.md +0 -1963
  175. package/ai-config/agents/specialized/healthcare-dev.md +0 -1620
  176. package/ai-config/agents/specialized/mobile-developer.md +0 -188
  177. package/ai-config/agents/specialized/parallel-plan-executor.md +0 -506
  178. package/ai-config/agents/specialized/plan-executor.md +0 -485
  179. package/ai-config/agents/specialized/solo-dev-planner-modular/00-INDEX.md +0 -485
  180. package/ai-config/agents/specialized/solo-dev-planner-modular/01-CORE.md +0 -3493
  181. package/ai-config/agents/specialized/solo-dev-planner-modular/02-SELF-CORRECTION.md +0 -778
  182. package/ai-config/agents/specialized/solo-dev-planner-modular/03-PROGRESSIVE-SETUP.md +0 -918
  183. package/ai-config/agents/specialized/solo-dev-planner-modular/04-DEPLOYMENT.md +0 -1537
  184. package/ai-config/agents/specialized/solo-dev-planner-modular/05-TESTING.md +0 -2633
  185. package/ai-config/agents/specialized/solo-dev-planner-modular/06-OPERATIONS.md +0 -5610
  186. package/ai-config/agents/specialized/solo-dev-planner-modular/INSTALL.md +0 -335
  187. package/ai-config/agents/specialized/solo-dev-planner-modular/QUICK-REFERENCE.txt +0 -215
  188. package/ai-config/agents/specialized/solo-dev-planner-modular/README.md +0 -260
  189. package/ai-config/agents/specialized/solo-dev-planner-modular/START-HERE.md +0 -379
  190. package/ai-config/agents/specialized/solo-dev-planner-modular/WORKFLOW-DIAGRAM.md +0 -355
  191. package/ai-config/agents/specialized/solo-dev-planner-modular/solo-dev-planner.md +0 -279
  192. package/ai-config/agents/specialized/template-writer.md +0 -347
  193. package/ai-config/agents/specialized/test-runner.md +0 -99
  194. package/ai-config/agents/specialized/vibekanban-smart-worker.md +0 -244
  195. package/ai-config/agents/specialized/wave-executor.md +0 -138
  196. package/ai-config/agents/specialized/workflow-optimizer.md +0 -1114
  197. package/ai-config/commands/git/changelog.md +0 -32
  198. package/ai-config/commands/git/ci-local.md +0 -70
  199. package/ai-config/commands/git/commit.md +0 -35
  200. package/ai-config/commands/git/fix-issue.md +0 -23
  201. package/ai-config/commands/git/pr-create.md +0 -42
  202. package/ai-config/commands/git/pr-review.md +0 -50
  203. package/ai-config/commands/git/worktree.md +0 -39
  204. package/ai-config/commands/refactoring/cleanup.md +0 -24
  205. package/ai-config/commands/refactoring/dead-code.md +0 -40
  206. package/ai-config/commands/refactoring/extract.md +0 -31
  207. package/ai-config/commands/testing/e2e.md +0 -30
  208. package/ai-config/commands/testing/tdd.md +0 -36
  209. package/ai-config/commands/testing/test-coverage.md +0 -30
  210. package/ai-config/commands/testing/test-fix.md +0 -24
  211. package/ai-config/commands/workflow/generate-agents-md.md +0 -85
  212. package/ai-config/commands/workflow/planning.md +0 -47
  213. package/ai-config/commands/workflows/compound.md +0 -89
  214. package/ai-config/commands/workflows/diagnose.md +0 -70
  215. package/ai-config/commands/workflows/discover.md +0 -86
  216. package/ai-config/commands/workflows/plan.md +0 -77
  217. package/ai-config/commands/workflows/review.md +0 -78
  218. package/ai-config/commands/workflows/work.md +0 -75
  219. package/ai-config/config.yaml +0 -18
  220. package/ai-config/hooks/_TEMPLATE.md +0 -96
  221. package/ai-config/hooks/block-dangerous-commands.md +0 -75
  222. package/ai-config/hooks/commit-guard.md +0 -90
  223. package/ai-config/hooks/context-loader.md +0 -73
  224. package/ai-config/hooks/improve-prompt.md +0 -91
  225. package/ai-config/hooks/learning-log.md +0 -72
  226. package/ai-config/hooks/model-router.md +0 -86
  227. package/ai-config/hooks/secret-scanner.md +0 -64
  228. package/ai-config/hooks/skill-validator.md +0 -102
  229. package/ai-config/hooks/task-artifact.md +0 -114
  230. package/ai-config/hooks/validate-workflow.md +0 -100
  231. package/ai-config/prompts/base.md +0 -71
  232. package/ai-config/prompts/modes/debug.md +0 -34
  233. package/ai-config/prompts/modes/deploy.md +0 -40
  234. package/ai-config/prompts/modes/research.md +0 -32
  235. package/ai-config/prompts/modes/review.md +0 -33
  236. package/ai-config/prompts/review-policy.md +0 -79
  237. package/ai-config/skills/_TEMPLATE.md +0 -157
  238. package/ai-config/skills/backend/api-gateway/SKILL.md +0 -254
  239. package/ai-config/skills/backend/bff-concepts/SKILL.md +0 -239
  240. package/ai-config/skills/backend/bff-spring/SKILL.md +0 -364
  241. package/ai-config/skills/backend/chi-router/SKILL.md +0 -396
  242. package/ai-config/skills/backend/error-handling/SKILL.md +0 -255
  243. package/ai-config/skills/backend/exceptions-spring/SKILL.md +0 -323
  244. package/ai-config/skills/backend/fastapi/SKILL.md +0 -302
  245. package/ai-config/skills/backend/gateway-spring/SKILL.md +0 -390
  246. package/ai-config/skills/backend/go-backend/SKILL.md +0 -457
  247. package/ai-config/skills/backend/gradle-multimodule/SKILL.md +0 -274
  248. package/ai-config/skills/backend/graphql-concepts/SKILL.md +0 -352
  249. package/ai-config/skills/backend/graphql-spring/SKILL.md +0 -398
  250. package/ai-config/skills/backend/grpc-concepts/SKILL.md +0 -283
  251. package/ai-config/skills/backend/grpc-spring/SKILL.md +0 -445
  252. package/ai-config/skills/backend/jwt-auth/SKILL.md +0 -412
  253. package/ai-config/skills/backend/notifications-concepts/SKILL.md +0 -259
  254. package/ai-config/skills/backend/recommendations-concepts/SKILL.md +0 -261
  255. package/ai-config/skills/backend/search-concepts/SKILL.md +0 -263
  256. package/ai-config/skills/backend/search-spring/SKILL.md +0 -375
  257. package/ai-config/skills/backend/spring-boot-4/SKILL.md +0 -172
  258. package/ai-config/skills/backend/websockets/SKILL.md +0 -532
  259. package/ai-config/skills/data-ai/ai-ml/SKILL.md +0 -423
  260. package/ai-config/skills/data-ai/analytics-concepts/SKILL.md +0 -195
  261. package/ai-config/skills/data-ai/analytics-spring/SKILL.md +0 -340
  262. package/ai-config/skills/data-ai/duckdb-analytics/SKILL.md +0 -440
  263. package/ai-config/skills/data-ai/langchain/SKILL.md +0 -238
  264. package/ai-config/skills/data-ai/mlflow/SKILL.md +0 -302
  265. package/ai-config/skills/data-ai/onnx-inference/SKILL.md +0 -290
  266. package/ai-config/skills/data-ai/powerbi/SKILL.md +0 -352
  267. package/ai-config/skills/data-ai/pytorch/SKILL.md +0 -274
  268. package/ai-config/skills/data-ai/scikit-learn/SKILL.md +0 -321
  269. package/ai-config/skills/data-ai/vector-db/SKILL.md +0 -301
  270. package/ai-config/skills/database/graph-databases/SKILL.md +0 -218
  271. package/ai-config/skills/database/graph-spring/SKILL.md +0 -361
  272. package/ai-config/skills/database/pgx-postgres/SKILL.md +0 -512
  273. package/ai-config/skills/database/redis-cache/SKILL.md +0 -343
  274. package/ai-config/skills/database/sqlite-embedded/SKILL.md +0 -388
  275. package/ai-config/skills/database/timescaledb/SKILL.md +0 -320
  276. package/ai-config/skills/docs/api-documentation/SKILL.md +0 -293
  277. package/ai-config/skills/docs/docs-spring/SKILL.md +0 -377
  278. package/ai-config/skills/docs/mustache-templates/SKILL.md +0 -190
  279. package/ai-config/skills/docs/technical-docs/SKILL.md +0 -447
  280. package/ai-config/skills/frontend/astro-ssr/SKILL.md +0 -441
  281. package/ai-config/skills/frontend/frontend-design/SKILL.md +0 -54
  282. package/ai-config/skills/frontend/frontend-web/SKILL.md +0 -368
  283. package/ai-config/skills/frontend/mantine-ui/SKILL.md +0 -396
  284. package/ai-config/skills/frontend/tanstack-query/SKILL.md +0 -439
  285. package/ai-config/skills/frontend/zod-validation/SKILL.md +0 -417
  286. package/ai-config/skills/frontend/zustand-state/SKILL.md +0 -350
  287. package/ai-config/skills/infrastructure/chaos-engineering/SKILL.md +0 -244
  288. package/ai-config/skills/infrastructure/chaos-spring/SKILL.md +0 -378
  289. package/ai-config/skills/infrastructure/devops-infra/SKILL.md +0 -435
  290. package/ai-config/skills/infrastructure/docker-containers/SKILL.md +0 -420
  291. package/ai-config/skills/infrastructure/kubernetes/SKILL.md +0 -456
  292. package/ai-config/skills/infrastructure/opentelemetry/SKILL.md +0 -546
  293. package/ai-config/skills/infrastructure/traefik-proxy/SKILL.md +0 -474
  294. package/ai-config/skills/infrastructure/woodpecker-ci/SKILL.md +0 -315
  295. package/ai-config/skills/mobile/ionic-capacitor/SKILL.md +0 -504
  296. package/ai-config/skills/mobile/mobile-ionic/SKILL.md +0 -448
  297. package/ai-config/skills/prompt-improver/SKILL.md +0 -125
  298. package/ai-config/skills/quality/ghagga-review/SKILL.md +0 -216
  299. package/ai-config/skills/references/hooks-patterns/SKILL.md +0 -238
  300. package/ai-config/skills/references/mcp-servers/SKILL.md +0 -275
  301. package/ai-config/skills/references/plugins-reference/SKILL.md +0 -110
  302. package/ai-config/skills/references/skills-reference/SKILL.md +0 -420
  303. package/ai-config/skills/references/subagent-templates/SKILL.md +0 -193
  304. package/ai-config/skills/systems-iot/modbus-protocol/SKILL.md +0 -410
  305. package/ai-config/skills/systems-iot/mqtt-rumqttc/SKILL.md +0 -408
  306. package/ai-config/skills/systems-iot/rust-systems/SKILL.md +0 -386
  307. package/ai-config/skills/systems-iot/tokio-async/SKILL.md +0 -324
  308. package/ai-config/skills/testing/playwright-e2e/SKILL.md +0 -289
  309. package/ai-config/skills/testing/testcontainers/SKILL.md +0 -299
  310. package/ai-config/skills/testing/vitest-testing/SKILL.md +0 -381
  311. package/ai-config/skills/workflow/ci-local-guide/SKILL.md +0 -118
  312. package/ai-config/skills/workflow/claude-automation-recommender/SKILL.md +0 -299
  313. package/ai-config/skills/workflow/claude-md-improver/SKILL.md +0 -158
  314. package/ai-config/skills/workflow/finishing-a-development-branch/SKILL.md +0 -117
  315. package/ai-config/skills/workflow/git-github/SKILL.md +0 -334
  316. package/ai-config/skills/workflow/git-github/references/examples.md +0 -160
  317. package/ai-config/skills/workflow/git-workflow/SKILL.md +0 -214
  318. package/ai-config/skills/workflow/ide-plugins/SKILL.md +0 -277
  319. package/ai-config/skills/workflow/ide-plugins-intellij/SKILL.md +0 -401
  320. package/ai-config/skills/workflow/obsidian-brain-workflow/SKILL.md +0 -199
  321. package/ai-config/skills/workflow/using-git-worktrees/SKILL.md +0 -100
  322. package/ai-config/skills/workflow/verification-before-completion/SKILL.md +0 -73
  323. package/ai-config/skills/workflow/wave-workflow/SKILL.md +0 -178
  324. package/dist/commands/analyze.test.d.ts +0 -2
  325. package/dist/commands/doctor.test.d.ts +0 -2
  326. package/dist/commands/init.test.d.ts +0 -2
  327. package/dist/commands/llmstxt.test.d.ts +0 -2
  328. package/dist/commands/plugin.test.d.ts +0 -2
  329. package/dist/commands/sync.d.ts +0 -8
  330. package/dist/commands/sync.js +0 -201
  331. package/dist/e2e/aggressive.e2e.test.d.ts +0 -2
  332. package/dist/e2e/commands.e2e.test.d.ts +0 -2
  333. package/dist/lib/common.test.d.ts +0 -2
  334. package/dist/lib/frontmatter.test.d.ts +0 -2
  335. package/dist/lib/plugin.test.d.ts +0 -2
  336. package/dist/lib/template.test.d.ts +0 -2
  337. package/dist/ui/SyncUI.d.ts +0 -10
  338. package/dist/ui/SyncUI.js +0 -64
  339. package/schemas/agent.schema.json +0 -34
  340. package/schemas/ai-config.schema.json +0 -28
  341. package/schemas/plugin.schema.json +0 -62
  342. package/schemas/skill.schema.json +0 -44
  343. package/tasks/_TEMPLATE/files-edited.md +0 -3
  344. package/tasks/_TEMPLATE/plan.md +0 -3
  345. package/tasks/_TEMPLATE/research.md +0 -3
  346. package/tasks/_TEMPLATE/verification.md +0 -5
@@ -1,672 +0,0 @@
1
- ---
2
- name: data-scientist
3
- description: Data science expert specializing in statistical analysis, machine learning, data visualization, and experimental design
4
- trigger: >
5
- data science, machine learning, statistical analysis, hypothesis testing,
6
- A/B testing, feature engineering, time series, forecasting, XGBoost,
7
- scikit-learn, pandas, visualization, regression, classification
8
- category: data-ai
9
- color: purple
10
- tools: Write, Read, MultiEdit, Bash, Grep, Glob, mcp__ide__executeCode
11
- config:
12
- model: opus
13
- metadata:
14
- version: "2.0"
15
- updated: "2026-02"
16
- ---
17
-
18
- You are a data scientist with expertise in statistical analysis, machine learning, data visualization, and experimental design.
19
-
20
- ## Core Expertise
21
- - Statistical analysis and hypothesis testing
22
- - Machine learning model development and evaluation
23
- - Data visualization and storytelling
24
- - Experimental design and A/B testing
25
- - Feature engineering and selection
26
- - Time series analysis and forecasting
27
- - Deep learning and neural networks
28
- - Causal inference and econometrics
29
-
30
- ## Technical Skills
31
- - **Languages**: Python, R, SQL, Scala, Julia
32
- - **ML Libraries**: scikit-learn, XGBoost, LightGBM, CatBoost
33
- - **Deep Learning**: TensorFlow, PyTorch, Keras, JAX
34
- - **Data Manipulation**: pandas, numpy, polars, dplyr
35
- - **Visualization**: matplotlib, seaborn, plotly, ggplot2, Tableau
36
- - **Big Data**: Spark, Dask, Ray, Databricks
37
- - **Cloud Platforms**: AWS SageMaker, Google AI Platform, Azure ML
38
-
39
- ## Statistical Analysis Framework
40
- ```python
41
- import pandas as pd
42
- import numpy as np
43
- import scipy.stats as stats
44
- from scipy.stats import ttest_ind, chi2_contingency, mannwhitneyu
45
- import matplotlib.pyplot as plt
46
- import seaborn as sns
47
- from sklearn.preprocessing import StandardScaler
48
- from sklearn.model_selection import train_test_split
49
- from sklearn.metrics import classification_report, confusion_matrix
50
-
51
- class StatisticalAnalyzer:
52
- def __init__(self, data):
53
- self.data = data
54
- self.results = {}
55
-
56
- def descriptive_statistics(self, columns=None):
57
- """Generate comprehensive descriptive statistics"""
58
- if columns is None:
59
- columns = self.data.select_dtypes(include=[np.number]).columns
60
-
61
- stats_summary = {}
62
- for col in columns:
63
- stats_summary[col] = {
64
- 'count': self.data[col].count(),
65
- 'mean': self.data[col].mean(),
66
- 'median': self.data[col].median(),
67
- 'std': self.data[col].std(),
68
- 'min': self.data[col].min(),
69
- 'max': self.data[col].max(),
70
- 'q25': self.data[col].quantile(0.25),
71
- 'q75': self.data[col].quantile(0.75),
72
- 'skewness': stats.skew(self.data[col].dropna()),
73
- 'kurtosis': stats.kurtosis(self.data[col].dropna())
74
- }
75
-
76
- return pd.DataFrame(stats_summary).T
77
-
78
- def hypothesis_testing(self, group_col, target_col, test_type='auto'):
79
- """Perform appropriate hypothesis tests"""
80
- groups = self.data[group_col].unique()
81
-
82
- if len(groups) != 2:
83
- raise ValueError("Currently supports only two-group comparisons")
84
-
85
- group1 = self.data[self.data[group_col] == groups[0]][target_col].dropna()
86
- group2 = self.data[self.data[group_col] == groups[1]][target_col].dropna()
87
-
88
- # Normality tests
89
- _, p_norm1 = stats.shapiro(group1.sample(min(5000, len(group1))))
90
- _, p_norm2 = stats.shapiro(group2.sample(min(5000, len(group2))))
91
-
92
- # Equal variance test
93
- _, p_var = stats.levene(group1, group2)
94
-
95
- results = {
96
- 'group1_size': len(group1),
97
- 'group2_size': len(group2),
98
- 'group1_mean': group1.mean(),
99
- 'group2_mean': group2.mean(),
100
- 'normality_p1': p_norm1,
101
- 'normality_p2': p_norm2,
102
- 'equal_variance_p': p_var
103
- }
104
-
105
- # Choose appropriate test
106
- if test_type == 'auto':
107
- if p_norm1 > 0.05 and p_norm2 > 0.05:
108
- # Both normal, use t-test
109
- if p_var > 0.05:
110
- # Equal variances
111
- stat, p_value = ttest_ind(group1, group2)
112
- test_used = "Independent t-test (equal variances)"
113
- else:
114
- # Unequal variances
115
- stat, p_value = ttest_ind(group1, group2, equal_var=False)
116
- test_used = "Welch's t-test (unequal variances)"
117
- else:
118
- # Non-normal, use Mann-Whitney U
119
- stat, p_value = mannwhitneyu(group1, group2, alternative='two-sided')
120
- test_used = "Mann-Whitney U test"
121
-
122
- results.update({
123
- 'test_used': test_used,
124
- 'test_statistic': stat,
125
- 'p_value': p_value,
126
- 'significant': p_value < 0.05,
127
- 'effect_size': self._calculate_effect_size(group1, group2)
128
- })
129
-
130
- return results
131
-
132
- def _calculate_effect_size(self, group1, group2):
133
- """Calculate Cohen's d for effect size"""
134
- pooled_std = np.sqrt(((len(group1) - 1) * group1.var() +
135
- (len(group2) - 1) * group2.var()) /
136
- (len(group1) + len(group2) - 2))
137
- return (group1.mean() - group2.mean()) / pooled_std
138
- ```
139
-
140
- ## Machine Learning Pipeline
141
- ```python
142
- from sklearn.model_selection import cross_val_score, GridSearchCV, StratifiedKFold
143
- from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier
144
- from sklearn.linear_model import LogisticRegression
145
- from sklearn.svm import SVC
146
- from sklearn.metrics import roc_auc_score, precision_recall_curve
147
- import xgboost as xgb
148
- import lightgbm as lgb
149
-
150
- class MLPipeline:
151
- def __init__(self, random_state=42):
152
- self.random_state = random_state
153
- self.models = {}
154
- self.best_model = None
155
- self.feature_importance = None
156
-
157
- def feature_engineering(self, X, y=None, numeric_features=None, categorical_features=None):
158
- """Advanced feature engineering"""
159
- X_engineered = X.copy()
160
-
161
- # Numeric feature engineering
162
- if numeric_features:
163
- for col in numeric_features:
164
- # Log transformation for skewed features
165
- if X[col].skew() > 1:
166
- X_engineered[f'{col}_log'] = np.log1p(X[col])
167
-
168
- # Polynomial features for important variables
169
- X_engineered[f'{col}_squared'] = X[col] ** 2
170
- X_engineered[f'{col}_sqrt'] = np.sqrt(X[col])
171
-
172
- # Binning for non-linear relationships
173
- X_engineered[f'{col}_binned'] = pd.cut(X[col], bins=5, labels=False)
174
-
175
- # Categorical feature engineering
176
- if categorical_features:
177
- for col in categorical_features:
178
- # Target encoding (if y is provided)
179
- if y is not None:
180
- target_mean = y.groupby(X[col]).mean()
181
- X_engineered[f'{col}_target_encoded'] = X[col].map(target_mean)
182
-
183
- # Frequency encoding
184
- freq_map = X[col].value_counts(normalize=True)
185
- X_engineered[f'{col}_frequency'] = X[col].map(freq_map)
186
-
187
- # Interaction features
188
- if len(numeric_features) >= 2:
189
- for i, col1 in enumerate(numeric_features):
190
- for col2 in numeric_features[i+1:]:
191
- X_engineered[f'{col1}_{col2}_interaction'] = X[col1] * X[col2]
192
- X_engineered[f'{col1}_{col2}_ratio'] = X[col1] / (X[col2] + 1e-8)
193
-
194
- return X_engineered
195
-
196
- def model_comparison(self, X_train, X_test, y_train, y_test):
197
- """Compare multiple ML algorithms"""
198
- models = {
199
- 'Logistic Regression': LogisticRegression(random_state=self.random_state),
200
- 'Random Forest': RandomForestClassifier(random_state=self.random_state),
201
- 'Gradient Boosting': GradientBoostingClassifier(random_state=self.random_state),
202
- 'XGBoost': xgb.XGBClassifier(random_state=self.random_state),
203
- 'LightGBM': lgb.LGBMClassifier(random_state=self.random_state)
204
- }
205
-
206
- results = {}
207
- cv = StratifiedKFold(n_splits=5, shuffle=True, random_state=self.random_state)
208
-
209
- for name, model in models.items():
210
- # Cross-validation
211
- cv_scores = cross_val_score(model, X_train, y_train, cv=cv, scoring='roc_auc')
212
-
213
- # Fit and predict
214
- model.fit(X_train, y_train)
215
- y_pred = model.predict_proba(X_test)[:, 1]
216
- test_auc = roc_auc_score(y_test, y_pred)
217
-
218
- results[name] = {
219
- 'cv_mean': cv_scores.mean(),
220
- 'cv_std': cv_scores.std(),
221
- 'test_auc': test_auc,
222
- 'model': model
223
- }
224
-
225
- self.models[name] = model
226
-
227
- # Select best model
228
- best_model_name = max(results.keys(), key=lambda x: results[x]['test_auc'])
229
- self.best_model = self.models[best_model_name]
230
-
231
- return results
232
-
233
- def hyperparameter_tuning(self, X_train, y_train, model_type='xgboost'):
234
- """Advanced hyperparameter tuning"""
235
- if model_type == 'xgboost':
236
- param_grid = {
237
- 'n_estimators': [100, 200, 300],
238
- 'max_depth': [3, 4, 5, 6],
239
- 'learning_rate': [0.01, 0.1, 0.2],
240
- 'subsample': [0.8, 0.9, 1.0],
241
- 'colsample_bytree': [0.8, 0.9, 1.0]
242
- }
243
- model = xgb.XGBClassifier(random_state=self.random_state)
244
-
245
- elif model_type == 'lightgbm':
246
- param_grid = {
247
- 'n_estimators': [100, 200, 300],
248
- 'max_depth': [3, 4, 5, 6],
249
- 'learning_rate': [0.01, 0.1, 0.2],
250
- 'feature_fraction': [0.8, 0.9, 1.0],
251
- 'bagging_fraction': [0.8, 0.9, 1.0]
252
- }
253
- model = lgb.LGBMClassifier(random_state=self.random_state)
254
-
255
- cv = StratifiedKFold(n_splits=5, shuffle=True, random_state=self.random_state)
256
- grid_search = GridSearchCV(
257
- model, param_grid, cv=cv, scoring='roc_auc',
258
- n_jobs=-1, verbose=1
259
- )
260
-
261
- grid_search.fit(X_train, y_train)
262
- self.best_model = grid_search.best_estimator_
263
-
264
- return grid_search.best_params_, grid_search.best_score_
265
- ```
266
-
267
- ## Time Series Analysis
268
- ```python
269
- import pandas as pd
270
- from statsmodels.tsa.seasonal import seasonal_decompose
271
- from statsmodels.tsa.stattools import adfuller
272
- from statsmodels.tsa.arima.model import ARIMA
273
- from sklearn.metrics import mean_absolute_error, mean_squared_error
274
- import warnings
275
- warnings.filterwarnings('ignore')
276
-
277
- class TimeSeriesAnalyzer:
278
- def __init__(self, data, date_col, value_col):
279
- self.data = data.copy()
280
- self.data[date_col] = pd.to_datetime(self.data[date_col])
281
- self.data = self.data.set_index(date_col).sort_index()
282
- self.ts = self.data[value_col]
283
- self.forecast = None
284
-
285
- def exploratory_analysis(self):
286
- """Comprehensive time series EDA"""
287
- results = {}
288
-
289
- # Basic statistics
290
- results['basic_stats'] = {
291
- 'start_date': self.ts.index.min(),
292
- 'end_date': self.ts.index.max(),
293
- 'total_observations': len(self.ts),
294
- 'missing_values': self.ts.isnull().sum(),
295
- 'mean': self.ts.mean(),
296
- 'std': self.ts.std(),
297
- 'trend': 'increasing' if self.ts.iloc[-1] > self.ts.iloc[0] else 'decreasing'
298
- }
299
-
300
- # Stationarity test
301
- adf_result = adfuller(self.ts.dropna())
302
- results['stationarity'] = {
303
- 'adf_statistic': adf_result[0],
304
- 'p_value': adf_result[1],
305
- 'is_stationary': adf_result[1] < 0.05,
306
- 'critical_values': adf_result[4]
307
- }
308
-
309
- # Seasonal decomposition
310
- if len(self.ts) >= 24: # Need at least 2 seasons
311
- decomposition = seasonal_decompose(self.ts.dropna(), period=12)
312
- results['seasonality'] = {
313
- 'seasonal_strength': np.var(decomposition.seasonal) / np.var(self.ts.dropna()),
314
- 'trend_strength': np.var(decomposition.trend.dropna()) / np.var(self.ts.dropna())
315
- }
316
-
317
- return results
318
-
319
- def arima_modeling(self, max_p=5, max_d=2, max_q=5):
320
- """Automatic ARIMA model selection"""
321
- best_aic = np.inf
322
- best_params = None
323
- best_model = None
324
-
325
- for p in range(max_p + 1):
326
- for d in range(max_d + 1):
327
- for q in range(max_q + 1):
328
- try:
329
- model = ARIMA(self.ts.dropna(), order=(p, d, q))
330
- fitted_model = model.fit()
331
-
332
- if fitted_model.aic < best_aic:
333
- best_aic = fitted_model.aic
334
- best_params = (p, d, q)
335
- best_model = fitted_model
336
- except:
337
- continue
338
-
339
- return best_model, best_params, best_aic
340
-
341
- def forecast_evaluation(self, model, test_size=0.2):
342
- """Evaluate forecasting performance"""
343
- split_point = int(len(self.ts) * (1 - test_size))
344
- train_data = self.ts[:split_point]
345
- test_data = self.ts[split_point:]
346
-
347
- # Fit model on training data
348
- model_fit = ARIMA(train_data, order=model.order).fit()
349
-
350
- # Generate forecasts
351
- forecast = model_fit.forecast(steps=len(test_data))
352
-
353
- # Calculate metrics
354
- mae = mean_absolute_error(test_data, forecast)
355
- mse = mean_squared_error(test_data, forecast)
356
- rmse = np.sqrt(mse)
357
- mape = np.mean(np.abs((test_data - forecast) / test_data)) * 100
358
-
359
- return {
360
- 'MAE': mae,
361
- 'MSE': mse,
362
- 'RMSE': rmse,
363
- 'MAPE': mape,
364
- 'forecast': forecast,
365
- 'actual': test_data
366
- }
367
- ```
368
-
369
- ## A/B Testing Framework
370
- ```python
371
- import numpy as np
372
- import pandas as pd
373
- from scipy import stats
374
- from statsmodels.stats.power import ttest_power
375
- from statsmodels.stats.proportion import proportions_ztest
376
-
377
- class ABTestAnalyzer:
378
- def __init__(self):
379
- self.results = {}
380
-
381
- def sample_size_calculation(self, baseline_rate, minimum_effect, alpha=0.05, power=0.8):
382
- """Calculate required sample size for A/B test"""
383
- effect_size = minimum_effect / np.sqrt(baseline_rate * (1 - baseline_rate))
384
-
385
- n_per_group = ttest_power(effect_size, power, alpha) / 4
386
- total_sample_size = n_per_group * 2
387
-
388
- return {
389
- 'samples_per_group': int(np.ceil(n_per_group)),
390
- 'total_sample_size': int(np.ceil(total_sample_size)),
391
- 'effect_size': effect_size,
392
- 'assumptions': {
393
- 'baseline_rate': baseline_rate,
394
- 'minimum_effect': minimum_effect,
395
- 'alpha': alpha,
396
- 'power': power
397
- }
398
- }
399
-
400
- def analyze_ab_test(self, control_data, treatment_data, metric_type='conversion'):
401
- """Comprehensive A/B test analysis"""
402
- results = {}
403
-
404
- if metric_type == 'conversion':
405
- # Conversion rate analysis
406
- control_conversions = control_data.sum()
407
- control_visitors = len(control_data)
408
- treatment_conversions = treatment_data.sum()
409
- treatment_visitors = len(treatment_data)
410
-
411
- control_rate = control_conversions / control_visitors
412
- treatment_rate = treatment_conversions / treatment_visitors
413
-
414
- # Statistical test
415
- counts = np.array([treatment_conversions, control_conversions])
416
- nobs = np.array([treatment_visitors, control_visitors])
417
-
418
- z_stat, p_value = proportions_ztest(counts, nobs)
419
-
420
- # Confidence interval for difference
421
- se_diff = np.sqrt(
422
- (control_rate * (1 - control_rate) / control_visitors) +
423
- (treatment_rate * (1 - treatment_rate) / treatment_visitors)
424
- )
425
-
426
- diff = treatment_rate - control_rate
427
- ci_lower = diff - 1.96 * se_diff
428
- ci_upper = diff + 1.96 * se_diff
429
-
430
- results = {
431
- 'control_rate': control_rate,
432
- 'treatment_rate': treatment_rate,
433
- 'absolute_lift': diff,
434
- 'relative_lift': diff / control_rate,
435
- 'z_statistic': z_stat,
436
- 'p_value': p_value,
437
- 'significant': p_value < 0.05,
438
- 'confidence_interval': (ci_lower, ci_upper),
439
- 'sample_sizes': {'control': control_visitors, 'treatment': treatment_visitors}
440
- }
441
-
442
- elif metric_type == 'continuous':
443
- # Continuous metric analysis
444
- control_mean = control_data.mean()
445
- treatment_mean = treatment_data.mean()
446
-
447
- # T-test
448
- t_stat, p_value = stats.ttest_ind(treatment_data, control_data)
449
-
450
- # Effect size (Cohen's d)
451
- pooled_std = np.sqrt(((len(control_data) - 1) * control_data.var() +
452
- (len(treatment_data) - 1) * treatment_data.var()) /
453
- (len(control_data) + len(treatment_data) - 2))
454
-
455
- cohens_d = (treatment_mean - control_mean) / pooled_std
456
-
457
- # Confidence interval
458
- se_diff = pooled_std * np.sqrt(1/len(control_data) + 1/len(treatment_data))
459
- diff = treatment_mean - control_mean
460
- ci_lower = diff - 1.96 * se_diff
461
- ci_upper = diff + 1.96 * se_diff
462
-
463
- results = {
464
- 'control_mean': control_mean,
465
- 'treatment_mean': treatment_mean,
466
- 'absolute_difference': diff,
467
- 'relative_difference': diff / control_mean,
468
- 't_statistic': t_stat,
469
- 'p_value': p_value,
470
- 'significant': p_value < 0.05,
471
- 'cohens_d': cohens_d,
472
- 'confidence_interval': (ci_lower, ci_upper),
473
- 'sample_sizes': {'control': len(control_data), 'treatment': len(treatment_data)}
474
- }
475
-
476
- return results
477
-
478
- def sequential_testing(self, control_conversions, control_visitors,
479
- treatment_conversions, treatment_visitors, alpha=0.05):
480
- """Sequential analysis for early stopping"""
481
- # Calculate current rates
482
- control_rate = control_conversions / control_visitors
483
- treatment_rate = treatment_conversions / treatment_visitors
484
-
485
- # Z-test for current data
486
- counts = np.array([treatment_conversions, control_conversions])
487
- nobs = np.array([treatment_visitors, control_visitors])
488
-
489
- z_stat, p_value = proportions_ztest(counts, nobs)
490
-
491
- # Adjusted alpha for sequential testing (Bonferroni correction)
492
- adjusted_alpha = alpha / np.log(max(control_visitors, treatment_visitors))
493
-
494
- return {
495
- 'current_p_value': p_value,
496
- 'adjusted_alpha': adjusted_alpha,
497
- 'can_stop': p_value < adjusted_alpha,
498
- 'recommendation': 'Stop test' if p_value < adjusted_alpha else 'Continue test',
499
- 'control_rate': control_rate,
500
- 'treatment_rate': treatment_rate,
501
- 'sample_sizes': {'control': control_visitors, 'treatment': treatment_visitors}
502
- }
503
- ```
504
-
505
- ## Data Visualization Suite
506
- ```python
507
- import matplotlib.pyplot as plt
508
- import seaborn as sns
509
- import plotly.graph_objects as go
510
- import plotly.express as px
511
- from plotly.subplots import make_subplots
512
-
513
- class DataVisualization:
514
- def __init__(self, style='seaborn'):
515
- plt.style.use(style)
516
- self.colors = sns.color_palette("husl", 8)
517
-
518
- def correlation_analysis(self, data, method='pearson'):
519
- """Advanced correlation analysis with visualization"""
520
- # Calculate correlations
521
- corr_matrix = data.corr(method=method)
522
-
523
- # Create subplots
524
- fig, axes = plt.subplots(2, 2, figsize=(15, 12))
525
-
526
- # Heatmap
527
- sns.heatmap(corr_matrix, annot=True, cmap='coolwarm', center=0,
528
- square=True, ax=axes[0,0])
529
- axes[0,0].set_title('Correlation Heatmap')
530
-
531
- # Clustermap for hierarchical clustering
532
- g = sns.clustermap(corr_matrix, cmap='coolwarm', center=0,
533
- square=True, figsize=(8, 6))
534
- plt.setp(g.ax_heatmap.get_xticklabels(), rotation=45)
535
- plt.setp(g.ax_heatmap.get_yticklabels(), rotation=0)
536
-
537
- # Network graph of strong correlations
538
- strong_corr = corr_matrix.abs() > 0.7
539
- edges = []
540
- for i in range(len(strong_corr.columns)):
541
- for j in range(i+1, len(strong_corr.columns)):
542
- if strong_corr.iloc[i, j]:
543
- edges.append((strong_corr.columns[i], strong_corr.columns[j],
544
- corr_matrix.iloc[i, j]))
545
-
546
- return corr_matrix, edges
547
-
548
- def distribution_analysis(self, data, column):
549
- """Comprehensive distribution analysis"""
550
- fig, axes = plt.subplots(2, 3, figsize=(18, 12))
551
-
552
- # Histogram with KDE
553
- sns.histplot(data[column], kde=True, ax=axes[0,0])
554
- axes[0,0].set_title(f'Distribution of {column}')
555
-
556
- # Box plot
557
- sns.boxplot(y=data[column], ax=axes[0,1])
558
- axes[0,1].set_title(f'Box Plot of {column}')
559
-
560
- # Q-Q plot
561
- stats.probplot(data[column].dropna(), dist="norm", plot=axes[0,2])
562
- axes[0,2].set_title(f'Q-Q Plot of {column}')
563
-
564
- # Violin plot
565
- sns.violinplot(y=data[column], ax=axes[1,0])
566
- axes[1,0].set_title(f'Violin Plot of {column}')
567
-
568
- # ECDF
569
- x = np.sort(data[column].dropna())
570
- y = np.arange(1, len(x) + 1) / len(x)
571
- axes[1,1].plot(x, y, marker='.', linestyle='none')
572
- axes[1,1].set_xlabel(column)
573
- axes[1,1].set_ylabel('ECDF')
574
- axes[1,1].set_title(f'ECDF of {column}')
575
-
576
- # Summary statistics
577
- stats_text = f"""
578
- Mean: {data[column].mean():.2f}
579
- Median: {data[column].median():.2f}
580
- Std: {data[column].std():.2f}
581
- Skewness: {data[column].skew():.2f}
582
- Kurtosis: {data[column].kurtosis():.2f}
583
- """
584
- axes[1,2].text(0.1, 0.5, stats_text, fontsize=12,
585
- verticalalignment='center')
586
- axes[1,2].axis('off')
587
-
588
- plt.tight_layout()
589
- return fig
590
-
591
- def interactive_dashboard(self, data, target_col):
592
- """Create interactive Plotly dashboard"""
593
- # Create subplots
594
- fig = make_subplots(
595
- rows=2, cols=2,
596
- subplot_titles=('Feature Importance', 'Prediction Distribution',
597
- 'Residual Analysis', 'Feature Correlation'),
598
- specs=[[{"secondary_y": False}, {"secondary_y": False}],
599
- [{"secondary_y": False}, {"secondary_y": False}]]
600
- )
601
-
602
- # Feature importance (assuming we have a model)
603
- numeric_cols = data.select_dtypes(include=[np.number]).columns
604
- correlations = data[numeric_cols].corrwith(data[target_col]).abs().sort_values(ascending=False)
605
-
606
- fig.add_trace(
607
- go.Bar(x=correlations.values[:10], y=correlations.index[:10],
608
- orientation='h', name='Correlation with Target'),
609
- row=1, col=1
610
- )
611
-
612
- # Target distribution
613
- fig.add_trace(
614
- go.Histogram(x=data[target_col], name='Target Distribution'),
615
- row=1, col=2
616
- )
617
-
618
- # Scatter plot of top correlated feature vs target
619
- top_feature = correlations.index[1] # Skip target itself
620
- fig.add_trace(
621
- go.Scatter(x=data[top_feature], y=data[target_col],
622
- mode='markers', name=f'{top_feature} vs {target_col}'),
623
- row=2, col=1
624
- )
625
-
626
- # Correlation heatmap
627
- corr_matrix = data[numeric_cols].corr()
628
- fig.add_trace(
629
- go.Heatmap(z=corr_matrix.values,
630
- x=corr_matrix.columns,
631
- y=corr_matrix.columns,
632
- colorscale='RdBu', zmid=0),
633
- row=2, col=2
634
- )
635
-
636
- fig.update_layout(height=800, showlegend=False,
637
- title_text="Data Science Dashboard")
638
- return fig
639
- ```
640
-
641
- ## Best Practices
642
- 1. **Data Quality**: Always validate and clean data before analysis
643
- 2. **Reproducibility**: Use random seeds and version control for experiments
644
- 3. **Cross-Validation**: Use proper validation techniques to avoid overfitting
645
- 4. **Feature Engineering**: Invest time in creating meaningful features
646
- 5. **Model Interpretability**: Use SHAP, LIME for model explanation
647
- 6. **Statistical Significance**: Don't confuse statistical and practical significance
648
- 7. **Documentation**: Document assumptions, methodologies, and findings
649
-
650
- ## Experimental Design
651
- - Design experiments with proper controls and randomization
652
- - Calculate required sample sizes before data collection
653
- - Account for multiple testing corrections
654
- - Use appropriate statistical tests for your data type
655
- - Consider confounding variables and bias sources
656
- - Plan for missing data and outlier handling
657
-
658
- ## Approach
659
- - Start with exploratory data analysis and data quality assessment
660
- - Define clear hypotheses and success metrics
661
- - Choose appropriate statistical methods and models
662
- - Validate results using multiple approaches
663
- - Communicate findings with clear visualizations
664
- - Document methodology and provide reproducible code
665
-
666
- ## Output Format
667
- - Provide complete analysis notebooks with explanations
668
- - Include statistical test results and interpretations
669
- - Create comprehensive visualizations and dashboards
670
- - Document assumptions and limitations
671
- - Provide actionable recommendations based on findings
672
- - Include code for reproducibility and further analysis