tech-hub-skills 1.2.0 → 1.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (198) hide show
  1. package/{LICENSE → .claude/LICENSE} +21 -21
  2. package/.claude/README.md +291 -0
  3. package/.claude/bin/cli.js +266 -0
  4. package/{bin → .claude/bin}/copilot.js +182 -182
  5. package/{bin → .claude/bin}/postinstall.js +42 -42
  6. package/{tech_hub_skills/skills → .claude/commands}/README.md +336 -336
  7. package/{tech_hub_skills/skills → .claude/commands}/ai-engineer.md +104 -104
  8. package/{tech_hub_skills/skills → .claude/commands}/aws.md +143 -143
  9. package/{tech_hub_skills/skills → .claude/commands}/azure.md +149 -149
  10. package/{tech_hub_skills/skills → .claude/commands}/backend-developer.md +108 -108
  11. package/{tech_hub_skills/skills → .claude/commands}/code-review.md +399 -399
  12. package/{tech_hub_skills/skills → .claude/commands}/compliance-automation.md +747 -747
  13. package/{tech_hub_skills/skills → .claude/commands}/compliance-officer.md +108 -108
  14. package/{tech_hub_skills/skills → .claude/commands}/data-engineer.md +113 -113
  15. package/{tech_hub_skills/skills → .claude/commands}/data-governance.md +102 -102
  16. package/{tech_hub_skills/skills → .claude/commands}/data-scientist.md +123 -123
  17. package/{tech_hub_skills/skills → .claude/commands}/database-admin.md +109 -109
  18. package/{tech_hub_skills/skills → .claude/commands}/devops.md +160 -160
  19. package/{tech_hub_skills/skills → .claude/commands}/docker.md +160 -160
  20. package/{tech_hub_skills/skills → .claude/commands}/enterprise-dashboard.md +613 -613
  21. package/{tech_hub_skills/skills → .claude/commands}/finops.md +184 -184
  22. package/{tech_hub_skills/skills → .claude/commands}/frontend-developer.md +108 -108
  23. package/{tech_hub_skills/skills → .claude/commands}/gcp.md +143 -143
  24. package/{tech_hub_skills/skills → .claude/commands}/ml-engineer.md +115 -115
  25. package/{tech_hub_skills/skills → .claude/commands}/mlops.md +187 -187
  26. package/{tech_hub_skills/skills → .claude/commands}/network-engineer.md +109 -109
  27. package/{tech_hub_skills/skills → .claude/commands}/optimization-advisor.md +329 -329
  28. package/{tech_hub_skills/skills → .claude/commands}/orchestrator.md +623 -623
  29. package/{tech_hub_skills/skills → .claude/commands}/platform-engineer.md +102 -102
  30. package/{tech_hub_skills/skills → .claude/commands}/process-automation.md +226 -226
  31. package/{tech_hub_skills/skills → .claude/commands}/process-changelog.md +184 -184
  32. package/{tech_hub_skills/skills → .claude/commands}/process-documentation.md +484 -484
  33. package/{tech_hub_skills/skills → .claude/commands}/process-kanban.md +324 -324
  34. package/{tech_hub_skills/skills → .claude/commands}/process-versioning.md +214 -214
  35. package/{tech_hub_skills/skills → .claude/commands}/product-designer.md +104 -104
  36. package/{tech_hub_skills/skills → .claude/commands}/project-starter.md +443 -443
  37. package/{tech_hub_skills/skills → .claude/commands}/qa-engineer.md +109 -109
  38. package/{tech_hub_skills/skills → .claude/commands}/security-architect.md +135 -135
  39. package/{tech_hub_skills/skills → .claude/commands}/sre.md +109 -109
  40. package/{tech_hub_skills/skills → .claude/commands}/system-design.md +126 -126
  41. package/{tech_hub_skills/skills → .claude/commands}/technical-writer.md +101 -101
  42. package/.claude/package.json +46 -0
  43. package/{tech_hub_skills → .claude}/roles/ai-engineer/skills/01-prompt-engineering/README.md +252 -252
  44. package/.claude/roles/ai-engineer/skills/01-prompt-engineering/prompt_ab_tester.py +356 -0
  45. package/.claude/roles/ai-engineer/skills/01-prompt-engineering/prompt_template_manager.py +274 -0
  46. package/.claude/roles/ai-engineer/skills/01-prompt-engineering/token_cost_estimator.py +324 -0
  47. package/{tech_hub_skills → .claude}/roles/ai-engineer/skills/02-rag-pipeline/README.md +448 -448
  48. package/.claude/roles/ai-engineer/skills/02-rag-pipeline/document_chunker.py +336 -0
  49. package/.claude/roles/ai-engineer/skills/02-rag-pipeline/rag_pipeline.sql +213 -0
  50. package/{tech_hub_skills → .claude}/roles/ai-engineer/skills/03-agent-orchestration/README.md +599 -599
  51. package/{tech_hub_skills → .claude}/roles/ai-engineer/skills/04-llm-guardrails/README.md +735 -735
  52. package/{tech_hub_skills → .claude}/roles/ai-engineer/skills/05-vector-embeddings/README.md +711 -711
  53. package/{tech_hub_skills → .claude}/roles/ai-engineer/skills/06-llm-evaluation/README.md +777 -777
  54. package/{tech_hub_skills → .claude}/roles/azure/skills/01-infrastructure-fundamentals/README.md +264 -264
  55. package/{tech_hub_skills → .claude}/roles/azure/skills/02-data-factory/README.md +264 -264
  56. package/{tech_hub_skills → .claude}/roles/azure/skills/03-synapse-analytics/README.md +264 -264
  57. package/{tech_hub_skills → .claude}/roles/azure/skills/04-databricks/README.md +264 -264
  58. package/{tech_hub_skills → .claude}/roles/azure/skills/05-functions/README.md +264 -264
  59. package/{tech_hub_skills → .claude}/roles/azure/skills/06-kubernetes-service/README.md +264 -264
  60. package/{tech_hub_skills → .claude}/roles/azure/skills/07-openai-service/README.md +264 -264
  61. package/{tech_hub_skills → .claude}/roles/azure/skills/08-machine-learning/README.md +264 -264
  62. package/{tech_hub_skills → .claude}/roles/azure/skills/09-storage-adls/README.md +264 -264
  63. package/{tech_hub_skills → .claude}/roles/azure/skills/10-networking/README.md +264 -264
  64. package/{tech_hub_skills → .claude}/roles/azure/skills/11-sql-cosmos/README.md +264 -264
  65. package/{tech_hub_skills → .claude}/roles/azure/skills/12-event-hubs/README.md +264 -264
  66. package/{tech_hub_skills → .claude}/roles/code-review/skills/01-automated-code-review/README.md +394 -394
  67. package/{tech_hub_skills → .claude}/roles/code-review/skills/02-pr-review-workflow/README.md +427 -427
  68. package/{tech_hub_skills → .claude}/roles/code-review/skills/03-code-quality-gates/README.md +518 -518
  69. package/{tech_hub_skills → .claude}/roles/code-review/skills/04-reviewer-assignment/README.md +504 -504
  70. package/{tech_hub_skills → .claude}/roles/code-review/skills/05-review-analytics/README.md +540 -540
  71. package/{tech_hub_skills → .claude}/roles/data-engineer/skills/01-lakehouse-architecture/README.md +550 -550
  72. package/.claude/roles/data-engineer/skills/01-lakehouse-architecture/bronze_ingestion.py +337 -0
  73. package/.claude/roles/data-engineer/skills/01-lakehouse-architecture/medallion_queries.sql +300 -0
  74. package/{tech_hub_skills → .claude}/roles/data-engineer/skills/02-etl-pipeline/README.md +580 -580
  75. package/{tech_hub_skills → .claude}/roles/data-engineer/skills/03-data-quality/README.md +579 -579
  76. package/{tech_hub_skills → .claude}/roles/data-engineer/skills/04-streaming-pipelines/README.md +608 -608
  77. package/{tech_hub_skills → .claude}/roles/data-engineer/skills/05-performance-optimization/README.md +547 -547
  78. package/{tech_hub_skills → .claude}/roles/data-governance/skills/01-data-catalog/README.md +112 -112
  79. package/{tech_hub_skills → .claude}/roles/data-governance/skills/02-data-lineage/README.md +129 -129
  80. package/{tech_hub_skills → .claude}/roles/data-governance/skills/03-data-quality-framework/README.md +182 -182
  81. package/{tech_hub_skills → .claude}/roles/data-governance/skills/04-access-control/README.md +39 -39
  82. package/{tech_hub_skills → .claude}/roles/data-governance/skills/05-master-data-management/README.md +40 -40
  83. package/{tech_hub_skills → .claude}/roles/data-governance/skills/06-compliance-privacy/README.md +46 -46
  84. package/{tech_hub_skills → .claude}/roles/data-scientist/skills/01-eda-automation/README.md +230 -230
  85. package/.claude/roles/data-scientist/skills/01-eda-automation/eda_generator.py +446 -0
  86. package/{tech_hub_skills → .claude}/roles/data-scientist/skills/02-statistical-modeling/README.md +264 -264
  87. package/{tech_hub_skills → .claude}/roles/data-scientist/skills/03-feature-engineering/README.md +264 -264
  88. package/{tech_hub_skills → .claude}/roles/data-scientist/skills/04-predictive-modeling/README.md +264 -264
  89. package/{tech_hub_skills → .claude}/roles/data-scientist/skills/05-customer-analytics/README.md +264 -264
  90. package/{tech_hub_skills → .claude}/roles/data-scientist/skills/06-campaign-analysis/README.md +264 -264
  91. package/{tech_hub_skills → .claude}/roles/data-scientist/skills/07-experimentation/README.md +264 -264
  92. package/{tech_hub_skills → .claude}/roles/data-scientist/skills/08-data-visualization/README.md +264 -264
  93. package/{tech_hub_skills → .claude}/roles/devops/skills/01-cicd-pipeline/README.md +264 -264
  94. package/{tech_hub_skills → .claude}/roles/devops/skills/02-container-orchestration/README.md +264 -264
  95. package/{tech_hub_skills → .claude}/roles/devops/skills/03-infrastructure-as-code/README.md +264 -264
  96. package/{tech_hub_skills → .claude}/roles/devops/skills/04-gitops/README.md +264 -264
  97. package/{tech_hub_skills → .claude}/roles/devops/skills/05-environment-management/README.md +264 -264
  98. package/{tech_hub_skills → .claude}/roles/devops/skills/06-automated-testing/README.md +264 -264
  99. package/{tech_hub_skills → .claude}/roles/devops/skills/07-release-management/README.md +264 -264
  100. package/{tech_hub_skills → .claude}/roles/devops/skills/08-monitoring-alerting/README.md +264 -264
  101. package/{tech_hub_skills → .claude}/roles/devops/skills/09-devsecops/README.md +265 -265
  102. package/{tech_hub_skills → .claude}/roles/finops/skills/01-cost-visibility/README.md +264 -264
  103. package/{tech_hub_skills → .claude}/roles/finops/skills/02-resource-tagging/README.md +264 -264
  104. package/{tech_hub_skills → .claude}/roles/finops/skills/03-budget-management/README.md +264 -264
  105. package/{tech_hub_skills → .claude}/roles/finops/skills/04-reserved-instances/README.md +264 -264
  106. package/{tech_hub_skills → .claude}/roles/finops/skills/05-spot-optimization/README.md +264 -264
  107. package/{tech_hub_skills → .claude}/roles/finops/skills/06-storage-tiering/README.md +264 -264
  108. package/{tech_hub_skills → .claude}/roles/finops/skills/07-compute-rightsizing/README.md +264 -264
  109. package/{tech_hub_skills → .claude}/roles/finops/skills/08-chargeback/README.md +264 -264
  110. package/{tech_hub_skills → .claude}/roles/ml-engineer/skills/01-mlops-pipeline/README.md +566 -566
  111. package/{tech_hub_skills → .claude}/roles/ml-engineer/skills/02-feature-engineering/README.md +655 -655
  112. package/{tech_hub_skills → .claude}/roles/ml-engineer/skills/03-model-training/README.md +704 -704
  113. package/{tech_hub_skills → .claude}/roles/ml-engineer/skills/04-model-serving/README.md +845 -845
  114. package/{tech_hub_skills → .claude}/roles/ml-engineer/skills/05-model-monitoring/README.md +874 -874
  115. package/{tech_hub_skills → .claude}/roles/mlops/skills/01-ml-pipeline-orchestration/README.md +264 -264
  116. package/{tech_hub_skills → .claude}/roles/mlops/skills/02-experiment-tracking/README.md +264 -264
  117. package/{tech_hub_skills → .claude}/roles/mlops/skills/03-model-registry/README.md +264 -264
  118. package/{tech_hub_skills → .claude}/roles/mlops/skills/04-feature-store/README.md +264 -264
  119. package/{tech_hub_skills → .claude}/roles/mlops/skills/05-model-deployment/README.md +264 -264
  120. package/{tech_hub_skills → .claude}/roles/mlops/skills/06-model-observability/README.md +264 -264
  121. package/{tech_hub_skills → .claude}/roles/mlops/skills/07-data-versioning/README.md +264 -264
  122. package/{tech_hub_skills → .claude}/roles/mlops/skills/08-ab-testing/README.md +264 -264
  123. package/{tech_hub_skills → .claude}/roles/mlops/skills/09-automated-retraining/README.md +264 -264
  124. package/{tech_hub_skills → .claude}/roles/platform-engineer/skills/01-internal-developer-platform/README.md +153 -153
  125. package/{tech_hub_skills → .claude}/roles/platform-engineer/skills/02-self-service-infrastructure/README.md +57 -57
  126. package/{tech_hub_skills → .claude}/roles/platform-engineer/skills/03-slo-sli-management/README.md +59 -59
  127. package/{tech_hub_skills → .claude}/roles/platform-engineer/skills/04-developer-experience/README.md +57 -57
  128. package/{tech_hub_skills → .claude}/roles/platform-engineer/skills/05-incident-management/README.md +73 -73
  129. package/{tech_hub_skills → .claude}/roles/platform-engineer/skills/06-capacity-management/README.md +59 -59
  130. package/{tech_hub_skills → .claude}/roles/product-designer/skills/01-requirements-discovery/README.md +407 -407
  131. package/{tech_hub_skills → .claude}/roles/product-designer/skills/02-user-research/README.md +382 -382
  132. package/{tech_hub_skills → .claude}/roles/product-designer/skills/03-brainstorming-ideation/README.md +437 -437
  133. package/{tech_hub_skills → .claude}/roles/product-designer/skills/04-ux-design/README.md +496 -496
  134. package/{tech_hub_skills → .claude}/roles/product-designer/skills/05-product-market-fit/README.md +376 -376
  135. package/{tech_hub_skills → .claude}/roles/product-designer/skills/06-stakeholder-management/README.md +412 -412
  136. package/{tech_hub_skills → .claude}/roles/security-architect/skills/01-pii-detection/README.md +319 -319
  137. package/{tech_hub_skills → .claude}/roles/security-architect/skills/02-threat-modeling/README.md +264 -264
  138. package/{tech_hub_skills → .claude}/roles/security-architect/skills/03-infrastructure-security/README.md +264 -264
  139. package/{tech_hub_skills → .claude}/roles/security-architect/skills/04-iam/README.md +264 -264
  140. package/{tech_hub_skills → .claude}/roles/security-architect/skills/05-application-security/README.md +264 -264
  141. package/{tech_hub_skills → .claude}/roles/security-architect/skills/06-secrets-management/README.md +264 -264
  142. package/{tech_hub_skills → .claude}/roles/security-architect/skills/07-security-monitoring/README.md +264 -264
  143. package/{tech_hub_skills → .claude}/roles/system-design/skills/01-architecture-patterns/README.md +337 -337
  144. package/{tech_hub_skills → .claude}/roles/system-design/skills/02-requirements-engineering/README.md +264 -264
  145. package/{tech_hub_skills → .claude}/roles/system-design/skills/03-scalability/README.md +264 -264
  146. package/{tech_hub_skills → .claude}/roles/system-design/skills/04-high-availability/README.md +264 -264
  147. package/{tech_hub_skills → .claude}/roles/system-design/skills/05-cost-optimization-design/README.md +264 -264
  148. package/{tech_hub_skills → .claude}/roles/system-design/skills/06-api-design/README.md +264 -264
  149. package/{tech_hub_skills → .claude}/roles/system-design/skills/07-observability-architecture/README.md +264 -264
  150. package/{tech_hub_skills → .claude}/roles/system-design/skills/08-process-automation/PROCESS_TEMPLATE.md +336 -336
  151. package/{tech_hub_skills → .claude}/roles/system-design/skills/08-process-automation/README.md +521 -521
  152. package/.claude/roles/system-design/skills/08-process-automation/ai_prompt_generator.py +744 -0
  153. package/.claude/roles/system-design/skills/08-process-automation/automation_recommender.py +688 -0
  154. package/.claude/roles/system-design/skills/08-process-automation/plan_generator.py +679 -0
  155. package/.claude/roles/system-design/skills/08-process-automation/process_analyzer.py +528 -0
  156. package/.claude/roles/system-design/skills/08-process-automation/process_parser.py +684 -0
  157. package/.claude/roles/system-design/skills/08-process-automation/role_matcher.py +615 -0
  158. package/.claude/skills/README.md +336 -0
  159. package/.claude/skills/ai-engineer.md +104 -0
  160. package/.claude/skills/aws.md +143 -0
  161. package/.claude/skills/azure.md +149 -0
  162. package/.claude/skills/backend-developer.md +108 -0
  163. package/.claude/skills/code-review.md +399 -0
  164. package/.claude/skills/compliance-automation.md +747 -0
  165. package/.claude/skills/compliance-officer.md +108 -0
  166. package/.claude/skills/data-engineer.md +113 -0
  167. package/.claude/skills/data-governance.md +102 -0
  168. package/.claude/skills/data-scientist.md +123 -0
  169. package/.claude/skills/database-admin.md +109 -0
  170. package/.claude/skills/devops.md +160 -0
  171. package/.claude/skills/docker.md +160 -0
  172. package/.claude/skills/enterprise-dashboard.md +613 -0
  173. package/.claude/skills/finops.md +184 -0
  174. package/.claude/skills/frontend-developer.md +108 -0
  175. package/.claude/skills/gcp.md +143 -0
  176. package/.claude/skills/ml-engineer.md +115 -0
  177. package/.claude/skills/mlops.md +187 -0
  178. package/.claude/skills/network-engineer.md +109 -0
  179. package/.claude/skills/optimization-advisor.md +329 -0
  180. package/.claude/skills/orchestrator.md +623 -0
  181. package/.claude/skills/platform-engineer.md +102 -0
  182. package/.claude/skills/process-automation.md +226 -0
  183. package/.claude/skills/process-changelog.md +184 -0
  184. package/.claude/skills/process-documentation.md +484 -0
  185. package/.claude/skills/process-kanban.md +324 -0
  186. package/.claude/skills/process-versioning.md +214 -0
  187. package/.claude/skills/product-designer.md +104 -0
  188. package/.claude/skills/project-starter.md +443 -0
  189. package/.claude/skills/qa-engineer.md +109 -0
  190. package/.claude/skills/security-architect.md +135 -0
  191. package/.claude/skills/sre.md +109 -0
  192. package/.claude/skills/system-design.md +126 -0
  193. package/.claude/skills/technical-writer.md +101 -0
  194. package/.gitattributes +2 -0
  195. package/GITHUB_COPILOT.md +106 -0
  196. package/README.md +192 -291
  197. package/package.json +16 -46
  198. package/bin/cli.js +0 -241
@@ -1,264 +1,264 @@
1
- # Skill 02: Azure Data Factory
2
-
3
- ## 🎯 Overview
4
- Pipeline creation, integration runtime, linked services
5
-
6
- ## 🔗 Connections
7
- - **Data Engineer**: Data foundation and pipelines (de-01, de-02, de-03)
8
- - **Security Architect**: Compliance, PII detection, access control (sa-01, sa-02)
9
- - **ML Engineer**: Model lifecycle and serving (ml-01, ml-04)
10
- - **AI Engineer**: LLM integration and automation (ai-01, ai-02, ai-07)
11
- - **MLOps**: Experiment tracking and monitoring (mo-01, mo-03, mo-06)
12
- - **FinOps**: Cost optimization and tracking (fo-01, fo-07)
13
- - **DevOps**: CI/CD, containerization, monitoring (do-01, do-03, do-08)
14
- - **System Design**: Architecture patterns (sd-01)
15
- - **Dependencies**: de-02
16
-
17
- ## 🛠️ Tools Included
18
-
19
- ### 1. Primary Implementation Script
20
- Core implementation for azure data factory.
21
-
22
- ### 2. Configuration Manager
23
- Manage configuration and settings for azure data factory.
24
-
25
- ### 3. Integration Connector
26
- Connect with other Tech Hub skills and external services.
27
-
28
- ### 4. Monitoring & Metrics
29
- Track performance, costs, and quality metrics.
30
-
31
- ### 5. Automation Scripts
32
- Automate common workflows and tasks.
33
-
34
- ## 📊 Key Metrics
35
- - Implementation quality score
36
- - Performance benchmarks
37
- - Cost efficiency
38
- - Security compliance rate
39
- - Integration test coverage
40
-
41
- ## 🚀 Quick Start
42
-
43
- ```python
44
- # Example implementation for Azure Data Factory
45
- from azure import 02_data_factory
46
-
47
- # Initialize
48
- service = 02DataFactoryService()
49
-
50
- # Execute
51
- result = service.execute(
52
- config={
53
- "environment": "production",
54
- "enable_monitoring": True
55
- }
56
- )
57
-
58
- print(f"Status: {result.status}")
59
- print(f"Metrics: {result.metrics}")
60
- ```
61
-
62
- ## 📚 Best Practices
63
-
64
- ### Cost Optimization (FinOps Integration)
65
-
66
- 1. **Monitor Resource Costs**
67
- - Track costs per execution
68
- - Set budget alerts
69
- - Optimize resource utilization
70
- - Reference: FinOps fo-01 (Cost Monitoring)
71
-
72
- 2. **Right-size Resources**
73
- - Use appropriate compute sizes
74
- - Implement auto-scaling
75
- - Leverage spot/reserved instances where applicable
76
- - Reference: FinOps fo-06, fo-07
77
-
78
- ### Security & Privacy (Security Architect Integration)
79
-
80
- 3. **Implement Access Control**
81
- - Use least privilege principle
82
- - Enable Azure AD authentication
83
- - Audit access logs
84
- - Reference: Security Architect sa-02 (IAM), sa-04
85
-
86
- 4. **Data Protection**
87
- - Encrypt data at rest and in transit
88
- - Scan for PII before processing
89
- - Implement data retention policies
90
- - Reference: Security Architect sa-01 (PII Detection)
91
-
92
- ### Quality & Governance (Data Engineer Integration)
93
-
94
- 5. **Ensure Data Quality**
95
- - Validate inputs and outputs
96
- - Implement quality gates
97
- - Monitor data freshness
98
- - Reference: Data Engineer de-03 (Data Quality)
99
-
100
- ### Lifecycle Management (MLOps Integration)
101
-
102
- 6. **Version Control**
103
- - Version all configurations
104
- - Track changes over time
105
- - Enable rollback capability
106
- - Reference: MLOps mo-03 (Versioning)
107
-
108
- 7. **Continuous Monitoring**
109
- - Track performance metrics
110
- - Set up alerting
111
- - Monitor for drift
112
- - Reference: MLOps mo-06 (Monitoring)
113
-
114
- ### Deployment & Operations (DevOps Integration)
115
-
116
- 8. **Automate Deployment**
117
- - Implement CI/CD pipelines
118
- - Use infrastructure as code
119
- - Enable blue-green deployments
120
- - Reference: DevOps do-01 (CI/CD), do-03 (IaC)
121
-
122
- 9. **Observability**
123
- - Implement distributed tracing
124
- - Set up dashboards
125
- - Enable logging and metrics
126
- - Reference: DevOps do-08 (Monitoring)
127
-
128
- ### Azure-Specific Best Practices
129
-
130
- 10. **Leverage Azure Services**
131
- - Use managed services where possible
132
- - Implement Azure Policy for governance
133
- - Enable Azure Monitor integration
134
- - Use managed identities for authentication
135
-
136
- ## 💰 Cost Optimization Examples
137
-
138
- ### Cost Tracking
139
- ```python
140
- from finops_tracker import CostTracker
141
-
142
- tracker = CostTracker()
143
-
144
- @tracker.track_costs
145
- def run_operation(params):
146
- # Your operation here
147
- result = execute_operation(params)
148
- return result
149
-
150
- # Monthly report
151
- report = tracker.monthly_report()
152
- print(f"Total cost: ${report.total_cost:.2f}")
153
- print(f"Cost per operation: ${report.avg_cost:.4f}")
154
- ```
155
-
156
- ## 🔒 Security Best Practices Examples
157
-
158
- ### Access Control Implementation
159
- ```python
160
- from azure.identity import DefaultAzureCredential
161
- from security_manager import AccessControl
162
-
163
- credential = DefaultAzureCredential()
164
- access_control = AccessControl(credential)
165
-
166
- # Validate access before operation
167
- @access_control.require_role("operator")
168
- def sensitive_operation(data):
169
- # Operation logic
170
- return process_data(data)
171
- ```
172
-
173
- ## 📊 Enhanced Metrics & Monitoring
174
-
175
- | Metric Category | Metric | Target | Tool |
176
- |-----------------|--------|--------|------|
177
- | **Performance** | Execution time (p95) | <5s | Azure Monitor |
178
- | | Success rate | >99% | Custom metrics |
179
- | **Cost** | Cost per operation | <$0.05 | FinOps dashboard |
180
- | | Resource utilization | >75% | Azure Monitor |
181
- | **Quality** | Error rate | <1% | App Insights |
182
- | | Data quality score | >95% | Quality tracker |
183
- | **Security** | Access violations | 0 | Security logs |
184
- | | Compliance score | 100% | Audit system |
185
-
186
- ## 🚀 Deployment Pipeline
187
-
188
- ### CI/CD Example
189
- ```yaml
190
- # .github/workflows/deploy-02-data-factory.yml
191
- name: Deploy Azure Data Factory
192
-
193
- on:
194
- push:
195
- paths:
196
- - 'azure/skills/02-data-factory/**'
197
- branches:
198
- - main
199
-
200
- jobs:
201
- test:
202
- runs-on: ubuntu-latest
203
- steps:
204
- - uses: actions/checkout@v3
205
- - name: Run tests
206
- run: pytest tests/ -v
207
- - name: Security scan
208
- run: python scripts/security_scan.py
209
- - name: Cost validation
210
- run: python scripts/validate_costs.py
211
-
212
- deploy:
213
- needs: test
214
- runs-on: ubuntu-latest
215
- steps:
216
- - name: Deploy to Azure
217
- run: |
218
- az deployment group create \
219
- --resource-group rg-azure \
220
- --template-file infra/main.bicep
221
- - name: Monitor deployment
222
- run: python scripts/monitor_health.py --duration 10m
223
- ```
224
-
225
- ## 🔄 Integration Workflow
226
-
227
- ### End-to-End Process
228
- ```
229
- 1. Input Validation
230
-
231
- 2. Security Checks (sa-01, sa-02)
232
-
233
- 3. Main Processing
234
-
235
- 4. Quality Validation (de-03)
236
-
237
- 5. Cost Tracking (fo-01)
238
-
239
- 6. Monitoring & Logging (do-08)
240
-
241
- 7. Output Delivery
242
- ```
243
-
244
- ## 🎯 Quick Wins
245
-
246
- 1. **Enable cost tracking** - Monitor spending from day one
247
- 2. **Implement security scanning** - Catch vulnerabilities early
248
- 3. **Set up monitoring** - Full visibility into operations
249
- 4. **Automate deployment** - Faster, safer releases
250
- 5. **Add quality gates** - Prevent bad data from propagating
251
- 6. **Enable caching** - Reduce redundant operations
252
- 7. **Implement retries** - Improve reliability
253
- 8. **Set up alerting** - Know about issues immediately
254
-
255
- ## 🔗 Related Skills
256
- - de-02
257
-
258
- ---
259
-
260
- **Skill ID**: `02-data-factory`
261
- **Complexity**: Medium
262
- **Dependencies**: de-02
263
- **Business Value**: High
264
- **Estimated Implementation Time**: 4-8 hours
1
+ # Skill 02: Azure Data Factory
2
+
3
+ ## 🎯 Overview
4
+ Pipeline creation, integration runtime, linked services
5
+
6
+ ## 🔗 Connections
7
+ - **Data Engineer**: Data foundation and pipelines (de-01, de-02, de-03)
8
+ - **Security Architect**: Compliance, PII detection, access control (sa-01, sa-02)
9
+ - **ML Engineer**: Model lifecycle and serving (ml-01, ml-04)
10
+ - **AI Engineer**: LLM integration and automation (ai-01, ai-02, ai-07)
11
+ - **MLOps**: Experiment tracking and monitoring (mo-01, mo-03, mo-06)
12
+ - **FinOps**: Cost optimization and tracking (fo-01, fo-07)
13
+ - **DevOps**: CI/CD, containerization, monitoring (do-01, do-03, do-08)
14
+ - **System Design**: Architecture patterns (sd-01)
15
+ - **Dependencies**: de-02
16
+
17
+ ## 🛠️ Tools Included
18
+
19
+ ### 1. Primary Implementation Script
20
+ Core implementation for Azure Data Factory.
21
+
22
+ ### 2. Configuration Manager
23
+ Manage configuration and settings for Azure Data Factory.
24
+
25
+ ### 3. Integration Connector
26
+ Connect with other Tech Hub skills and external services.
27
+
28
+ ### 4. Monitoring & Metrics
29
+ Track performance, costs, and quality metrics.
30
+
31
+ ### 5. Automation Scripts
32
+ Automate common workflows and tasks.
33
+
34
+ ## 📊 Key Metrics
35
+ - Implementation quality score
36
+ - Performance benchmarks
37
+ - Cost efficiency
38
+ - Security compliance rate
39
+ - Integration test coverage
40
+
41
+ ## 🚀 Quick Start
42
+
43
+ ```python
44
+ # Example implementation for Azure Data Factory
45
+ from azure.data_factory import DataFactoryService
46
+
47
+ # Initialize
48
+ service = DataFactoryService()
49
+
50
+ # Execute
51
+ result = service.execute(
52
+ config={
53
+ "environment": "production",
54
+ "enable_monitoring": True
55
+ }
56
+ )
57
+
58
+ print(f"Status: {result.status}")
59
+ print(f"Metrics: {result.metrics}")
60
+ ```
61
+
62
+ ## 📚 Best Practices
63
+
64
+ ### Cost Optimization (FinOps Integration)
65
+
66
+ 1. **Monitor Resource Costs**
67
+ - Track costs per execution
68
+ - Set budget alerts
69
+ - Optimize resource utilization
70
+ - Reference: FinOps fo-01 (Cost Monitoring)
71
+
72
+ 2. **Right-size Resources**
73
+ - Use appropriate compute sizes
74
+ - Implement auto-scaling
75
+ - Leverage spot/reserved instances where applicable
76
+ - Reference: FinOps fo-06, fo-07
77
+
78
+ ### Security & Privacy (Security Architect Integration)
79
+
80
+ 3. **Implement Access Control**
81
+ - Use least privilege principle
82
+ - Enable Microsoft Entra ID (formerly Azure AD) authentication
83
+ - Audit access logs
84
+ - Reference: Security Architect sa-02 (Threat Modeling), sa-04 (IAM)
85
+
86
+ 4. **Data Protection**
87
+ - Encrypt data at rest and in transit
88
+ - Scan for PII before processing
89
+ - Implement data retention policies
90
+ - Reference: Security Architect sa-01 (PII Detection)
91
+
92
+ ### Quality & Governance (Data Engineer Integration)
93
+
94
+ 5. **Ensure Data Quality**
95
+ - Validate inputs and outputs
96
+ - Implement quality gates
97
+ - Monitor data freshness
98
+ - Reference: Data Engineer de-03 (Data Quality)
99
+
100
+ ### Lifecycle Management (MLOps Integration)
101
+
102
+ 6. **Version Control**
103
+ - Version all configurations
104
+ - Track changes over time
105
+ - Enable rollback capability
106
+ - Reference: MLOps mo-03 (Model Registry)
107
+
108
+ 7. **Continuous Monitoring**
109
+ - Track performance metrics
110
+ - Set up alerting
111
+ - Monitor for drift
112
+ - Reference: MLOps mo-06 (Monitoring)
113
+
114
+ ### Deployment & Operations (DevOps Integration)
115
+
116
+ 8. **Automate Deployment**
117
+ - Implement CI/CD pipelines
118
+ - Use infrastructure as code
119
+ - Enable blue-green deployments
120
+ - Reference: DevOps do-01 (CI/CD), do-03 (IaC)
121
+
122
+ 9. **Observability**
123
+ - Implement distributed tracing
124
+ - Set up dashboards
125
+ - Enable logging and metrics
126
+ - Reference: DevOps do-08 (Monitoring)
127
+
128
+ ### Azure-Specific Best Practices
129
+
130
+ 10. **Leverage Azure Services**
131
+ - Use managed services where possible
132
+ - Implement Azure Policy for governance
133
+ - Enable Azure Monitor integration
134
+ - Use managed identities for authentication
135
+
136
+ ## 💰 Cost Optimization Examples
137
+
138
+ ### Cost Tracking
139
+ ```python
140
+ from finops_tracker import CostTracker
141
+
142
+ tracker = CostTracker()
143
+
144
+ @tracker.track_costs
145
+ def run_operation(params):
146
+ # Your operation here
147
+ result = execute_operation(params)
148
+ return result
149
+
150
+ # Monthly report
151
+ report = tracker.monthly_report()
152
+ print(f"Total cost: ${report.total_cost:.2f}")
153
+ print(f"Cost per operation: ${report.avg_cost:.4f}")
154
+ ```
155
+
156
+ ## 🔒 Security Best Practices Examples
157
+
158
+ ### Access Control Implementation
159
+ ```python
160
+ from azure.identity import DefaultAzureCredential
161
+ from security_manager import AccessControl
162
+
163
+ credential = DefaultAzureCredential()
164
+ access_control = AccessControl(credential)
165
+
166
+ # Validate access before operation
167
+ @access_control.require_role("operator")
168
+ def sensitive_operation(data):
169
+ # Operation logic
170
+ return process_data(data)
171
+ ```
172
+
173
+ ## 📊 Enhanced Metrics & Monitoring
174
+
175
+ | Metric Category | Metric | Target | Tool |
176
+ |-----------------|--------|--------|------|
177
+ | **Performance** | Execution time (p95) | <5s | Azure Monitor |
178
+ | | Success rate | >99% | Custom metrics |
179
+ | **Cost** | Cost per operation | <$0.05 | FinOps dashboard |
180
+ | | Resource utilization | >75% | Azure Monitor |
181
+ | **Quality** | Error rate | <1% | App Insights |
182
+ | | Data quality score | >95% | Quality tracker |
183
+ | **Security** | Access violations | 0 | Security logs |
184
+ | | Compliance score | 100% | Audit system |
185
+
186
+ ## 🚀 Deployment Pipeline
187
+
188
+ ### CI/CD Example
189
+ ```yaml
190
+ # .github/workflows/deploy-02-data-factory.yml
191
+ name: Deploy Azure Data Factory
192
+
193
+ on:
194
+ push:
195
+ paths:
196
+ - 'azure/skills/02-data-factory/**'
197
+ branches:
198
+ - main
199
+
200
+ jobs:
201
+ test:
202
+ runs-on: ubuntu-latest
203
+ steps:
204
+ - uses: actions/checkout@v3
205
+ - name: Run tests
206
+ run: pytest tests/ -v
207
+ - name: Security scan
208
+ run: python scripts/security_scan.py
209
+ - name: Cost validation
210
+ run: python scripts/validate_costs.py
211
+
212
+ deploy:
213
+ needs: test
214
+ runs-on: ubuntu-latest
215
+ steps:
216
+ - name: Deploy to Azure
217
+ run: |
218
+ az deployment group create \
219
+ --resource-group rg-azure \
220
+ --template-file infra/main.bicep
221
+ - name: Monitor deployment
222
+ run: python scripts/monitor_health.py --duration 10m
223
+ ```
224
+
225
+ ## 🔄 Integration Workflow
226
+
227
+ ### End-to-End Process
228
+ ```
229
+ 1. Input Validation
230
+
231
+ 2. Security Checks (sa-01, sa-02)
232
+
233
+ 3. Main Processing
234
+
235
+ 4. Quality Validation (de-03)
236
+
237
+ 5. Cost Tracking (fo-01)
238
+
239
+ 6. Monitoring & Logging (do-08)
240
+
241
+ 7. Output Delivery
242
+ ```
243
+
244
+ ## 🎯 Quick Wins
245
+
246
+ 1. **Enable cost tracking** - Monitor spending from day one
247
+ 2. **Implement security scanning** - Catch vulnerabilities early
248
+ 3. **Set up monitoring** - Full visibility into operations
249
+ 4. **Automate deployment** - Faster, safer releases
250
+ 5. **Add quality gates** - Prevent bad data from propagating
251
+ 6. **Enable caching** - Reduce redundant operations
252
+ 7. **Implement retries** - Improve reliability
253
+ 8. **Set up alerting** - Know about issues immediately
254
+
255
+ ## 🔗 Related Skills
256
+ - de-02
257
+
258
+ ---
259
+
260
+ **Skill ID**: `02-data-factory`
261
+ **Complexity**: Medium
262
+ **Dependencies**: de-02
263
+ **Business Value**: High
264
+ **Estimated Implementation Time**: 4-8 hours