@ngxtm/devkit 3.7.0 → 3.8.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/merged-commands/3d-web-experience.md +254 -0
- package/merged-commands/ab-test-setup.md +232 -0
- package/merged-commands/accessibility-compliance-accessibility-audit.md +42 -0
- package/merged-commands/active-directory-attacks.md +383 -0
- package/merged-commands/address-github-comments.md +55 -0
- package/merged-commands/aesthetic.md +134 -0
- package/merged-commands/agent-evaluation.md +64 -0
- package/merged-commands/agent-framework-azure-hosted-agents.md +332 -0
- package/merged-commands/agent-manager-skill.md +40 -0
- package/merged-commands/agent-memory-mcp.md +82 -0
- package/merged-commands/agent-memory-systems.md +67 -0
- package/merged-commands/agent-orchestration-improve-agent.md +349 -0
- package/merged-commands/agent-orchestration-multi-agent-optimize.md +239 -0
- package/merged-commands/agent-tool-builder.md +53 -0
- package/merged-commands/agile-product-owner.md +31 -0
- package/merged-commands/ai-agents-architect.md +90 -0
- package/merged-commands/ai-artist.md +75 -0
- package/merged-commands/ai-engineer.md +171 -0
- package/merged-commands/ai-multimodal.md +109 -0
- package/merged-commands/ai-product.md +54 -0
- package/merged-commands/ai-wrapper-product.md +273 -0
- package/merged-commands/airflow-dag-patterns.md +41 -0
- package/merged-commands/algolia-search.md +66 -0
- package/merged-commands/algorithmic-art.md +405 -0
- package/merged-commands/analytics-tracking.md +404 -0
- package/merged-commands/angular-architect.md +97 -0
- package/merged-commands/angular-migration.md +428 -0
- package/merged-commands/anti-reversing-techniques.md +42 -0
- package/merged-commands/api-design-principles.md +37 -0
- package/merged-commands/api-designer.md +101 -0
- package/merged-commands/api-documentation-generator.md +484 -0
- package/merged-commands/api-documenter.md +184 -0
- package/merged-commands/api-fuzzing-bug-bounty.md +433 -0
- package/merged-commands/api-patterns.md +81 -0
- package/merged-commands/api-security-best-practices.md +907 -0
- package/merged-commands/api-testing-observability-api-mock.md +46 -0
- package/merged-commands/app-builder.md +75 -0
- package/merged-commands/app-store-optimization.md +403 -0
- package/merged-commands/application-performance-performance-optimization.md +154 -0
- package/merged-commands/architect-review.md +174 -0
- package/merged-commands/architecture-decision-records.md +441 -0
- package/merged-commands/architecture-designer.md +89 -0
- package/merged-commands/architecture-patterns.md +37 -0
- package/merged-commands/architecture.md +55 -0
- package/merged-commands/arm-cortex-expert.md +306 -0
- package/merged-commands/artifacts-builder.md +74 -0
- package/merged-commands/ask-questions-if-underspecified.md +81 -0
- package/merged-commands/async-python-patterns.md +39 -0
- package/merged-commands/atlassian-mcp.md +100 -0
- package/merged-commands/attack-tree-construction.md +38 -0
- package/merged-commands/auth-implementation-patterns.md +39 -0
- package/merged-commands/automate-whatsapp.md +257 -0
- package/merged-commands/autonomous-agent-patterns.md +761 -0
- package/merged-commands/autonomous-agents.md +68 -0
- package/merged-commands/avalonia-layout-zafiro.md +59 -0
- package/merged-commands/avalonia-viewmodels-zafiro.md +29 -0
- package/merged-commands/avalonia-zafiro-development.md +29 -0
- package/merged-commands/aws-agentic-ai.md +117 -0
- package/merged-commands/aws-cdk-development.md +278 -0
- package/merged-commands/aws-cost-operations.md +317 -0
- package/merged-commands/aws-penetration-testing.md +405 -0
- package/merged-commands/aws-serverless-eda.md +757 -0
- package/merged-commands/aws-serverless.md +323 -0
- package/merged-commands/aws-skills.md +22 -0
- package/merged-commands/azd-deployment.md +296 -0
- package/merged-commands/azure-ai-agents-python.md +277 -0
- package/merged-commands/azure-ai-search-python.md +198 -0
- package/merged-commands/azure-ai-voicelive-skill.md +294 -0
- package/merged-commands/azure-functions.md +42 -0
- package/merged-commands/backend-architect.md +333 -0
- package/merged-commands/backend-dev-guidelines.md +342 -0
- package/merged-commands/backend-development-feature-development.md +180 -0
- package/merged-commands/backend-development.md +155 -0
- package/merged-commands/backend-security-coder.md +156 -0
- package/merged-commands/backtesting-frameworks.md +39 -0
- package/merged-commands/bash-defensive-patterns.md +43 -0
- package/merged-commands/bash-linux.md +199 -0
- package/merged-commands/bash-pro.md +310 -0
- package/merged-commands/bats-testing-patterns.md +34 -0
- package/merged-commands/bazel-build-optimization.md +397 -0
- package/merged-commands/beautiful-prose.md +22 -0
- package/merged-commands/behavioral-modes.md +242 -0
- package/merged-commands/best-practices.md +500 -0
- package/merged-commands/better-auth.md +204 -0
- package/merged-commands/billing-automation.md +42 -0
- package/merged-commands/binary-analysis-patterns.md +450 -0
- package/merged-commands/blockchain-developer.md +208 -0
- package/merged-commands/blockrun.md +292 -0
- package/merged-commands/brainstorming.md +230 -0
- package/merged-commands/brand-guidelines-anthropic.md +73 -0
- package/merged-commands/brand-guidelines-community.md +73 -0
- package/merged-commands/brand-guidelines.md +73 -0
- package/merged-commands/broken-authentication.md +476 -0
- package/merged-commands/browser-automation.md +70 -0
- package/merged-commands/browser-extension-builder.md +261 -0
- package/merged-commands/building-ai-agent-on-cloudflare.md +391 -0
- package/merged-commands/building-mcp-server-on-cloudflare.md +265 -0
- package/merged-commands/bullmq-specialist.md +57 -0
- package/merged-commands/bun-development.md +691 -0
- package/merged-commands/burp-suite-testing.md +380 -0
- package/merged-commands/business-analyst.md +182 -0
- package/merged-commands/busybox-on-windows.md +30 -0
- package/merged-commands/c-pro.md +56 -0
- package/merged-commands/c4-architecture-c4-architecture.md +389 -0
- package/merged-commands/c4-code.md +244 -0
- package/merged-commands/c4-component.md +153 -0
- package/merged-commands/c4-container.md +171 -0
- package/merged-commands/c4-context.md +150 -0
- package/merged-commands/canvas-design.md +130 -0
- package/merged-commands/cc-skill-backend-patterns.md +584 -0
- package/merged-commands/cc-skill-clickhouse-io.md +431 -0
- package/merged-commands/cc-skill-coding-standards.md +522 -0
- package/merged-commands/cc-skill-continuous-learning.md +10 -0
- package/merged-commands/cc-skill-frontend-patterns.md +633 -0
- package/merged-commands/cc-skill-project-guidelines-example.md +352 -0
- package/merged-commands/cc-skill-security-review.md +496 -0
- package/merged-commands/cc-skill-strategic-compact.md +10 -0
- package/merged-commands/changelog-automation.md +38 -0
- package/merged-commands/changelog-generator.md +104 -0
- package/merged-commands/chaos-engineer.md +98 -0
- package/merged-commands/chrome-devtools.md +407 -0
- package/merged-commands/cicd-automation-workflow-automate.md +51 -0
- package/merged-commands/clarity-gate.md +22 -0
- package/merged-commands/claude-ally-health.md +22 -0
- package/merged-commands/claude-code-guide.md +68 -0
- package/merged-commands/claude-d3js-skill.md +820 -0
- package/merged-commands/claude-scientific-skills.md +22 -0
- package/merged-commands/claude-speed-reader.md +22 -0
- package/merged-commands/claude-win11-speckit-update-skill.md +22 -0
- package/merged-commands/clean-code.md +201 -0
- package/merged-commands/clerk-auth.md +56 -0
- package/merged-commands/cli-developer.md +97 -0
- package/merged-commands/cloud-architect.md +135 -0
- package/merged-commands/cloud-penetration-testing.md +501 -0
- package/merged-commands/cloudflare-expert.md +227 -0
- package/merged-commands/code-documentation-code-explain.md +46 -0
- package/merged-commands/code-documentation-doc-generate.md +48 -0
- package/merged-commands/code-documentation.md +263 -0
- package/merged-commands/code-documenter.md +95 -0
- package/merged-commands/code-refactoring-context-restore.md +179 -0
- package/merged-commands/code-refactoring-refactor-clean.md +51 -0
- package/merged-commands/code-refactoring-tech-debt.md +386 -0
- package/merged-commands/code-refactoring.md +209 -0
- package/merged-commands/code-review-ai-ai-review.md +450 -0
- package/merged-commands/code-review-checklist.md +444 -0
- package/merged-commands/code-review-excellence.md +40 -0
- package/merged-commands/code-review.md +121 -0
- package/merged-commands/code-reviewer.md +178 -0
- package/merged-commands/codebase-cleanup-deps-audit.md +51 -0
- package/merged-commands/codebase-cleanup-refactor-clean.md +51 -0
- package/merged-commands/codebase-cleanup-tech-debt.md +386 -0
- package/merged-commands/codex-review.md +37 -0
- package/merged-commands/commit.md +171 -0
- package/merged-commands/competitive-ads-extractor.md +293 -0
- package/merged-commands/competitive-landscape.md +34 -0
- package/merged-commands/competitor-alternatives.md +750 -0
- package/merged-commands/comprehensive-review-full-review.md +146 -0
- package/merged-commands/comprehensive-review-pr-enhance.md +46 -0
- package/merged-commands/computer-use-agents.md +315 -0
- package/merged-commands/concise-planning.md +62 -0
- package/merged-commands/conductor-implement.md +388 -0
- package/merged-commands/conductor-manage.md +39 -0
- package/merged-commands/conductor-new-track.md +433 -0
- package/merged-commands/conductor-revert.md +372 -0
- package/merged-commands/conductor-setup.md +426 -0
- package/merged-commands/conductor-status.md +338 -0
- package/merged-commands/conductor-validator.md +62 -0
- package/merged-commands/content-creator.md +248 -0
- package/merged-commands/content-marketer.md +170 -0
- package/merged-commands/content-research-writer.md +538 -0
- package/merged-commands/context-compression.md +266 -0
- package/merged-commands/context-degradation.md +238 -0
- package/merged-commands/context-driven-development.md +400 -0
- package/merged-commands/context-engineering.md +107 -0
- package/merged-commands/context-fundamentals.md +192 -0
- package/merged-commands/context-management-context-restore.md +179 -0
- package/merged-commands/context-management-context-save.md +177 -0
- package/merged-commands/context-manager.md +185 -0
- package/merged-commands/context-optimization.md +186 -0
- package/merged-commands/context-window-management.md +53 -0
- package/merged-commands/context7-auto-research.md +36 -0
- package/merged-commands/conversation-memory.md +61 -0
- package/merged-commands/copy-editing.md +439 -0
- package/merged-commands/copywriting.md +225 -0
- package/merged-commands/core-components.md +264 -0
- package/merged-commands/cosmos-db-python-skill.md +198 -0
- package/merged-commands/cost-optimization.md +286 -0
- package/merged-commands/cpp-pro.md +59 -0
- package/merged-commands/cqrs-implementation.md +35 -0
- package/merged-commands/create-pr.md +192 -0
- package/merged-commands/crewai.md +243 -0
- package/merged-commands/csharp-developer.md +94 -0
- package/merged-commands/csharp-pro.md +59 -0
- package/merged-commands/culture-index.md +43 -0
- package/merged-commands/customer-support.md +170 -0
- package/merged-commands/daily-news-report.md +356 -0
- package/merged-commands/data-engineer.md +224 -0
- package/merged-commands/data-engineering-data-driven-feature.md +182 -0
- package/merged-commands/data-engineering-data-pipeline.md +201 -0
- package/merged-commands/data-quality-frameworks.md +40 -0
- package/merged-commands/data-scientist.md +199 -0
- package/merged-commands/data-storytelling.md +465 -0
- package/merged-commands/database-admin.md +165 -0
- package/merged-commands/database-architect.md +268 -0
- package/merged-commands/database-cloud-optimization-cost-optimize.md +44 -0
- package/merged-commands/database-design.md +52 -0
- package/merged-commands/database-migration.md +436 -0
- package/merged-commands/database-migrations-migration-observability.md +420 -0
- package/merged-commands/database-migrations-sql-migrations.md +53 -0
- package/merged-commands/database-optimizer.md +167 -0
- package/merged-commands/databases.md +232 -0
- package/merged-commands/dbt-transformation-patterns.md +34 -0
- package/merged-commands/debugger.md +49 -0
- package/merged-commands/debugging-strategies.md +34 -0
- package/merged-commands/debugging-toolkit-smart-debug.md +197 -0
- package/merged-commands/debugging-wizard.md +93 -0
- package/merged-commands/debugging.md +84 -0
- package/merged-commands/deep-research.md +114 -0
- package/merged-commands/defi-protocol-templates.md +466 -0
- package/merged-commands/dependency-management-deps-audit.md +44 -0
- package/merged-commands/dependency-upgrade.md +421 -0
- package/merged-commands/deployment-engineer.md +170 -0
- package/merged-commands/deployment-pipeline-design.md +371 -0
- package/merged-commands/deployment-procedures.md +241 -0
- package/merged-commands/deployment-validation-config-validate.md +496 -0
- package/merged-commands/design-md.md +178 -0
- package/merged-commands/design-orchestration.md +167 -0
- package/merged-commands/developer-growth-analysis.md +322 -0
- package/merged-commands/devops-engineer.md +92 -0
- package/merged-commands/devops-troubleshooter.md +161 -0
- package/merged-commands/devops.md +285 -0
- package/merged-commands/discord-bot-architect.md +277 -0
- package/merged-commands/dispatching-parallel-agents.md +180 -0
- package/merged-commands/distributed-debugging-debug-trace.md +44 -0
- package/merged-commands/distributed-tracing.md +450 -0
- package/merged-commands/django-expert.md +89 -0
- package/merged-commands/django-pro.md +180 -0
- package/merged-commands/doc-coauthoring.md +375 -0
- package/merged-commands/docker-expert.md +409 -0
- package/merged-commands/docs-architect.md +98 -0
- package/merged-commands/docs-seeker.md +102 -0
- package/merged-commands/documentation-generation-doc-generate.md +48 -0
- package/merged-commands/documentation-templates.md +194 -0
- package/merged-commands/docx-official.md +197 -0
- package/merged-commands/docx.md +197 -0
- package/merged-commands/domain-name-brainstormer.md +212 -0
- package/merged-commands/dotnet-architect.md +197 -0
- package/merged-commands/dotnet-backend-patterns.md +37 -0
- package/merged-commands/dotnet-core-expert.md +96 -0
- package/merged-commands/dx-optimizer.md +83 -0
- package/merged-commands/e2e-testing-patterns.md +41 -0
- package/merged-commands/elixir-pro.md +59 -0
- package/merged-commands/email-sequence.md +925 -0
- package/merged-commands/email-systems.md +54 -0
- package/merged-commands/embedded-systems.md +98 -0
- package/merged-commands/embedding-strategies.md +491 -0
- package/merged-commands/employment-contract-templates.md +39 -0
- package/merged-commands/environment-setup-guide.md +479 -0
- package/merged-commands/error-debugging-error-analysis.md +47 -0
- package/merged-commands/error-debugging-error-trace.md +43 -0
- package/merged-commands/error-debugging-multi-agent-review.md +216 -0
- package/merged-commands/error-detective.md +53 -0
- package/merged-commands/error-diagnostics-error-analysis.md +47 -0
- package/merged-commands/error-diagnostics-error-trace.md +48 -0
- package/merged-commands/error-diagnostics-smart-debug.md +197 -0
- package/merged-commands/error-handling-patterns.md +35 -0
- package/merged-commands/ethical-hacking-methodology.md +466 -0
- package/merged-commands/evaluation.md +238 -0
- package/merged-commands/event-sourcing-architect.md +58 -0
- package/merged-commands/event-store-design.md +449 -0
- package/merged-commands/exa-search.md +36 -0
- package/merged-commands/executing-plans.md +76 -0
- package/merged-commands/expo-app-design.md +22 -0
- package/merged-commands/expo-deployment.md +72 -0
- package/merged-commands/fal-audio.md +22 -0
- package/merged-commands/fal-generate.md +22 -0
- package/merged-commands/fal-image-edit.md +22 -0
- package/merged-commands/fal-platform.md +22 -0
- package/merged-commands/fal-upscale.md +22 -0
- package/merged-commands/fal-workflow.md +22 -0
- package/merged-commands/fastapi-expert.md +93 -0
- package/merged-commands/fastapi-pro.md +192 -0
- package/merged-commands/fastapi-router.md +52 -0
- package/merged-commands/fastapi-templates.md +32 -0
- package/merged-commands/feature-forge.md +90 -0
- package/merged-commands/ffuf-claude-skill.md +22 -0
- package/merged-commands/file-organizer.md +250 -0
- package/merged-commands/file-path-traversal.md +486 -0
- package/merged-commands/file-uploads.md +22 -0
- package/merged-commands/find-bugs.md +86 -0
- package/merged-commands/fine-tuning-expert.md +98 -0
- package/merged-commands/finishing-a-development-branch.md +200 -0
- package/merged-commands/firebase.md +56 -0
- package/merged-commands/firecrawl-scraper.md +37 -0
- package/merged-commands/firmware-analyst.md +320 -0
- package/merged-commands/fix-review.md +53 -0
- package/merged-commands/fixing.md +72 -0
- package/merged-commands/flutter-expert.md +200 -0
- package/merged-commands/form-cro.md +441 -0
- package/merged-commands/foundry-iq-agent.md +15 -0
- package/merged-commands/foundry-iq-python.md +275 -0
- package/merged-commands/foundry-nextgen-frontend.md +555 -0
- package/merged-commands/foundry-sdk-python.md +290 -0
- package/merged-commands/fp-ts-errors.md +856 -0
- package/merged-commands/fp-ts-pragmatic.md +598 -0
- package/merged-commands/fp-ts-react.md +796 -0
- package/merged-commands/framework-migration-code-migrate.md +48 -0
- package/merged-commands/framework-migration-deps-upgrade.md +48 -0
- package/merged-commands/framework-migration-legacy-modernize.md +132 -0
- package/merged-commands/free-tool-strategy.md +576 -0
- package/merged-commands/frontend-design.md +272 -0
- package/merged-commands/frontend-dev-guidelines.md +359 -0
- package/merged-commands/frontend-developer.md +171 -0
- package/merged-commands/frontend-development.md +399 -0
- package/merged-commands/frontend-mobile-development-component-scaffold.md +403 -0
- package/merged-commands/frontend-mobile-security-xss-scan.md +322 -0
- package/merged-commands/frontend-security-coder.md +170 -0
- package/merged-commands/frontend-slides.md +770 -0
- package/merged-commands/full-stack-orchestration-full-stack-feature.md +135 -0
- package/merged-commands/fullstack-guardian.md +99 -0
- package/merged-commands/game-developer.md +94 -0
- package/merged-commands/game-development.md +167 -0
- package/merged-commands/gcp-cloud-run.md +288 -0
- package/merged-commands/gdpr-data-handling.md +33 -0
- package/merged-commands/geo-fundamentals.md +156 -0
- package/merged-commands/git-advanced-workflows.md +412 -0
- package/merged-commands/git-pr-workflows-git-workflow.md +140 -0
- package/merged-commands/git-pr-workflows-onboard.md +416 -0
- package/merged-commands/git-pr-workflows-pr-enhance.md +48 -0
- package/merged-commands/git-pushing.md +33 -0
- package/merged-commands/github-actions-templates.md +345 -0
- package/merged-commands/github-workflow-automation.md +846 -0
- package/merged-commands/gitlab-ci-patterns.md +283 -0
- package/merged-commands/gitops-workflow.md +303 -0
- package/merged-commands/go-concurrency-patterns.md +33 -0
- package/merged-commands/godot-gdscript-patterns.md +33 -0
- package/merged-commands/golang-pro.md +179 -0
- package/merged-commands/google-adk-python.md +243 -0
- package/merged-commands/grafana-dashboards.md +381 -0
- package/merged-commands/graphql-architect.md +182 -0
- package/merged-commands/graphql.md +68 -0
- package/merged-commands/haskell-pro.md +56 -0
- package/merged-commands/helm-chart-scaffolding.md +34 -0
- package/merged-commands/hr-pro.md +126 -0
- package/merged-commands/html-injection-testing.md +498 -0
- package/merged-commands/hubspot-integration.md +42 -0
- package/merged-commands/hugging-face-cli.md +198 -0
- package/merged-commands/hugging-face-jobs.md +1038 -0
- package/merged-commands/hybrid-cloud-architect.md +168 -0
- package/merged-commands/hybrid-cloud-networking.md +238 -0
- package/merged-commands/hybrid-search-implementation.md +32 -0
- package/merged-commands/i18n-localization.md +154 -0
- package/merged-commands/idor-testing.md +442 -0
- package/merged-commands/image-enhancer.md +99 -0
- package/merged-commands/imagen.md +77 -0
- package/merged-commands/incident-responder.md +213 -0
- package/merged-commands/incident-response-incident-response.md +168 -0
- package/merged-commands/incident-response-smart-fix.md +29 -0
- package/merged-commands/incident-runbook-templates.md +395 -0
- package/merged-commands/infinite-gratitude.md +26 -0
- package/merged-commands/inngest.md +55 -0
- package/merged-commands/interactive-portfolio.md +223 -0
- package/merged-commands/internal-comms-anthropic.md +32 -0
- package/merged-commands/internal-comms-community.md +32 -0
- package/merged-commands/internal-comms.md +32 -0
- package/merged-commands/invoice-organizer.md +446 -0
- package/merged-commands/ios-developer.md +219 -0
- package/merged-commands/issue-creator.md +137 -0
- package/merged-commands/istio-traffic-management.md +337 -0
- package/merged-commands/iterate-pr.md +150 -0
- package/merged-commands/java-architect.md +95 -0
- package/merged-commands/java-pro.md +177 -0
- package/merged-commands/javascript-mastery.md +645 -0
- package/merged-commands/javascript-pro.md +57 -0
- package/merged-commands/javascript-testing-patterns.md +35 -0
- package/merged-commands/javascript-typescript-typescript-scaffold.md +361 -0
- package/merged-commands/javascript-typescript.md +142 -0
- package/merged-commands/jira-issues.md +181 -0
- package/merged-commands/job-application.md +90 -0
- package/merged-commands/julia-pro.md +209 -0
- package/merged-commands/k8s-manifest-generator.md +35 -0
- package/merged-commands/k8s-security-policies.md +346 -0
- package/merged-commands/kaizen.md +730 -0
- package/merged-commands/kotlin-specialist.md +94 -0
- package/merged-commands/kpi-dashboard-design.md +440 -0
- package/merged-commands/kubernetes-architect.md +170 -0
- package/merged-commands/kubernetes-specialist.md +117 -0
- package/merged-commands/langchain-architecture.md +350 -0
- package/merged-commands/langfuse.md +238 -0
- package/merged-commands/langgraph.md +287 -0
- package/merged-commands/laravel-specialist.md +101 -0
- package/merged-commands/last30days.md +421 -0
- package/merged-commands/launch-strategy.md +344 -0
- package/merged-commands/lead-research-assistant.md +199 -0
- package/merged-commands/learn.md +476 -0
- package/merged-commands/legacy-modernizer.md +53 -0
- package/merged-commands/legal-advisor.md +70 -0
- package/merged-commands/linear-claude-skill.md +543 -0
- package/merged-commands/linkerd-patterns.md +321 -0
- package/merged-commands/lint-and-validate.md +45 -0
- package/merged-commands/linux-privilege-escalation.md +504 -0
- package/merged-commands/linux-shell-scripting.md +504 -0
- package/merged-commands/llm-app-patterns.md +760 -0
- package/merged-commands/llm-application-dev-ai-assistant.md +35 -0
- package/merged-commands/llm-application-dev-langchain-agent.md +246 -0
- package/merged-commands/llm-application-dev-prompt-optimize.md +37 -0
- package/merged-commands/llm-application-dev.md +216 -0
- package/merged-commands/llm-evaluation.md +483 -0
- package/merged-commands/loki-mode.md +721 -0
- package/merged-commands/machine-learning-ops-ml-pipeline.md +314 -0
- package/merged-commands/makepad-skills.md +22 -0
- package/merged-commands/malware-analyst.md +247 -0
- package/merged-commands/markdown-novel-viewer.md +281 -0
- package/merged-commands/market-sizing-analysis.md +425 -0
- package/merged-commands/marketing-ideas.md +221 -0
- package/merged-commands/marketing-psychology.md +255 -0
- package/merged-commands/mcp-builder.md +236 -0
- package/merged-commands/mcp-developer.md +94 -0
- package/merged-commands/mcp-management.md +209 -0
- package/merged-commands/media-processing.md +358 -0
- package/merged-commands/meeting-insights-analyzer.md +327 -0
- package/merged-commands/memory-forensics.md +491 -0
- package/merged-commands/memory-safety-patterns.md +33 -0
- package/merged-commands/memory-systems.md +228 -0
- package/merged-commands/mermaid-expert.md +59 -0
- package/merged-commands/mermaidjs-v11.md +115 -0
- package/merged-commands/metasploit-framework.md +478 -0
- package/merged-commands/micro-saas-launcher.md +212 -0
- package/merged-commands/microservices-architect.md +102 -0
- package/merged-commands/microservices-patterns.md +35 -0
- package/merged-commands/minecraft-bukkit-pro.md +126 -0
- package/merged-commands/ml-engineer.md +168 -0
- package/merged-commands/ml-pipeline-workflow.md +257 -0
- package/merged-commands/ml-pipeline.md +111 -0
- package/merged-commands/mlops-engineer.md +219 -0
- package/merged-commands/mobile-design.md +284 -0
- package/merged-commands/mobile-developer.md +205 -0
- package/merged-commands/mobile-development.md +212 -0
- package/merged-commands/mobile-security-coder.md +184 -0
- package/merged-commands/modern-javascript-patterns.md +35 -0
- package/merged-commands/monitoring-expert.md +92 -0
- package/merged-commands/monorepo-architect.md +61 -0
- package/merged-commands/monorepo-management.md +35 -0
- package/merged-commands/moodle-external-api-development.md +597 -0
- package/merged-commands/mtls-configuration.md +359 -0
- package/merged-commands/multi-agent-brainstorming.md +256 -0
- package/merged-commands/multi-agent-patterns.md +262 -0
- package/merged-commands/multi-cloud-architecture.md +189 -0
- package/merged-commands/multi-platform-apps-multi-platform.md +203 -0
- package/merged-commands/n8n-code-python.md +750 -0
- package/merged-commands/n8n-mcp-tools-expert.md +654 -0
- package/merged-commands/n8n-node-configuration.md +796 -0
- package/merged-commands/nanobanana-ppt-skills.md +22 -0
- package/merged-commands/neon-postgres.md +56 -0
- package/merged-commands/nestjs-expert.md +552 -0
- package/merged-commands/network-101.md +342 -0
- package/merged-commands/network-engineer.md +169 -0
- package/merged-commands/nextjs-app-router-patterns.md +33 -0
- package/merged-commands/nextjs-best-practices.md +203 -0
- package/merged-commands/nextjs-developer.md +97 -0
- package/merged-commands/nextjs-supabase-auth.md +56 -0
- package/merged-commands/nft-standards.md +395 -0
- package/merged-commands/nodejs-backend-patterns.md +35 -0
- package/merged-commands/nodejs-best-practices.md +333 -0
- package/merged-commands/nosql-expert.md +111 -0
- package/merged-commands/notebooklm-skill.md +269 -0
- package/merged-commands/notebooklm.md +269 -0
- package/merged-commands/notion-template-business.md +216 -0
- package/merged-commands/nx-workspace-patterns.md +464 -0
- package/merged-commands/observability-engineer.md +237 -0
- package/merged-commands/observability-monitoring-monitor-setup.md +48 -0
- package/merged-commands/observability-monitoring-slo-implement.md +43 -0
- package/merged-commands/observe-whatsapp.md +109 -0
- package/merged-commands/obsidian-clipper-template-creator.md +64 -0
- package/merged-commands/on-call-handoff-patterns.md +453 -0
- package/merged-commands/onboarding-cro.md +433 -0
- package/merged-commands/openapi-spec-generation.md +33 -0
- package/merged-commands/page-cro.md +343 -0
- package/merged-commands/paid-ads.md +551 -0
- package/merged-commands/pandas-pro.md +96 -0
- package/merged-commands/parallel-agents.md +175 -0
- package/merged-commands/payment-integration.md +77 -0
- package/merged-commands/paypal-integration.md +479 -0
- package/merged-commands/paywall-upgrade-cro.md +570 -0
- package/merged-commands/pci-compliance.md +478 -0
- package/merged-commands/pdf-official.md +294 -0
- package/merged-commands/pdf.md +294 -0
- package/merged-commands/pentest-checklist.md +334 -0
- package/merged-commands/pentest-commands.md +438 -0
- package/merged-commands/performance-engineer.md +180 -0
- package/merged-commands/performance-profiling.md +143 -0
- package/merged-commands/performance-testing-review-ai-review.md +450 -0
- package/merged-commands/performance-testing-review-multi-agent-review.md +216 -0
- package/merged-commands/personal-tool-builder.md +289 -0
- package/merged-commands/php-pro.md +63 -0
- package/merged-commands/plaid-fintech.md +50 -0
- package/merged-commands/plan-writing.md +152 -0
- package/merged-commands/planning-with-files.md +211 -0
- package/merged-commands/planning.md +95 -0
- package/merged-commands/plans-kanban.md +166 -0
- package/merged-commands/playwright-expert.md +87 -0
- package/merged-commands/playwright-skill.md +453 -0
- package/merged-commands/podcast-generation.md +121 -0
- package/merged-commands/popup-cro.md +346 -0
- package/merged-commands/posix-shell-pro.md +304 -0
- package/merged-commands/postgres-best-practices.md +57 -0
- package/merged-commands/postgres-pro.md +98 -0
- package/merged-commands/postgresql.md +230 -0
- package/merged-commands/postmortem-writing.md +386 -0
- package/merged-commands/powershell-windows.md +167 -0
- package/merged-commands/pptx-official.md +484 -0
- package/merged-commands/pptx.md +484 -0
- package/merged-commands/pricing-strategy.md +356 -0
- package/merged-commands/prisma-expert.md +355 -0
- package/merged-commands/privilege-escalation-methods.md +333 -0
- package/merged-commands/problem-solving.md +96 -0
- package/merged-commands/product-manager-toolkit.md +351 -0
- package/merged-commands/product-strategist.md +26 -0
- package/merged-commands/production-code-audit.md +540 -0
- package/merged-commands/programmatic-seo.md +351 -0
- package/merged-commands/projection-patterns.md +33 -0
- package/merged-commands/prometheus-configuration.md +404 -0
- package/merged-commands/prompt-caching.md +61 -0
- package/merged-commands/prompt-engineer.md +272 -0
- package/merged-commands/prompt-engineering-patterns.md +213 -0
- package/merged-commands/prompt-engineering.md +171 -0
- package/merged-commands/prompt-library.md +322 -0
- package/merged-commands/protocol-reverse-engineering.md +29 -0
- package/merged-commands/pydantic-models.md +58 -0
- package/merged-commands/pypict-skill.md +22 -0
- package/merged-commands/python-development-python-scaffold.md +331 -0
- package/merged-commands/python-development.md +139 -0
- package/merged-commands/python-packaging.md +36 -0
- package/merged-commands/python-patterns.md +441 -0
- package/merged-commands/python-performance-optimization.md +36 -0
- package/merged-commands/python-pro.md +158 -0
- package/merged-commands/python-testing-patterns.md +37 -0
- package/merged-commands/qa-regression.md +337 -0
- package/merged-commands/quant-analyst.md +53 -0
- package/merged-commands/radix-ui-design-system.md +847 -0
- package/merged-commands/raffle-winner-picker.md +159 -0
- package/merged-commands/rag-architect.md +100 -0
- package/merged-commands/rag-engineer.md +90 -0
- package/merged-commands/rag-implementation.md +421 -0
- package/merged-commands/rails-expert.md +97 -0
- package/merged-commands/react-best-practices.md +121 -0
- package/merged-commands/react-expert.md +98 -0
- package/merged-commands/react-flow-node.md +66 -0
- package/merged-commands/react-modernization.md +34 -0
- package/merged-commands/react-native-architecture.md +33 -0
- package/merged-commands/react-native-expert.md +88 -0
- package/merged-commands/react-patterns.md +198 -0
- package/merged-commands/react-state-management.md +441 -0
- package/merged-commands/react-ui-patterns.md +289 -0
- package/merged-commands/readme.md +775 -0
- package/merged-commands/receiving-code-review.md +213 -0
- package/merged-commands/red-team-tactics.md +199 -0
- package/merged-commands/red-team-tools.md +310 -0
- package/merged-commands/reference-builder.md +188 -0
- package/merged-commands/referral-program.md +602 -0
- package/merged-commands/remotion-best-practices.md +45 -0
- package/merged-commands/repomix.md +275 -0
- package/merged-commands/requesting-code-review.md +105 -0
- package/merged-commands/research-engineer.md +135 -0
- package/merged-commands/research.md +191 -0
- package/merged-commands/reverse-engineer.md +173 -0
- package/merged-commands/risk-manager.md +61 -0
- package/merged-commands/risk-metrics-calculation.md +33 -0
- package/merged-commands/ruby-pro.md +56 -0
- package/merged-commands/rust-async-patterns.md +33 -0
- package/merged-commands/rust-engineer.md +96 -0
- package/merged-commands/rust-pro.md +178 -0
- package/merged-commands/saga-orchestration.md +496 -0
- package/merged-commands/sales-automator.md +55 -0
- package/merged-commands/salesforce-developer.md +105 -0
- package/merged-commands/salesforce-development.md +51 -0
- package/merged-commands/sast-configuration.md +212 -0
- package/merged-commands/scala-pro.md +82 -0
- package/merged-commands/scanning-tools.md +589 -0
- package/merged-commands/schema-markup.md +360 -0
- package/merged-commands/screen-reader-testing.md +33 -0
- package/merged-commands/screenshots.md +401 -0
- package/merged-commands/scroll-experience.md +263 -0
- package/merged-commands/search-specialist.md +80 -0
- package/merged-commands/secrets-management.md +364 -0
- package/merged-commands/secure-code-guardian.md +93 -0
- package/merged-commands/security-auditor.md +169 -0
- package/merged-commands/security-bluebook-builder.md +22 -0
- package/merged-commands/security-compliance-compliance-check.md +55 -0
- package/merged-commands/security-requirement-extraction.md +33 -0
- package/merged-commands/security-reviewer.md +94 -0
- package/merged-commands/security-scanning-security-dependencies.md +43 -0
- package/merged-commands/security-scanning-security-hardening.md +147 -0
- package/merged-commands/security-scanning-security-sast.md +495 -0
- package/merged-commands/segment-cdp.md +50 -0
- package/merged-commands/senior-architect.md +209 -0
- package/merged-commands/senior-backend.md +209 -0
- package/merged-commands/senior-computer-vision.md +226 -0
- package/merged-commands/senior-data-engineer.md +226 -0
- package/merged-commands/senior-data-scientist.md +226 -0
- package/merged-commands/senior-devops.md +209 -0
- package/merged-commands/senior-frontend.md +209 -0
- package/merged-commands/senior-fullstack.md +209 -0
- package/merged-commands/senior-ml-engineer.md +226 -0
- package/merged-commands/senior-prompt-engineer.md +226 -0
- package/merged-commands/senior-qa.md +209 -0
- package/merged-commands/senior-secops.md +209 -0
- package/merged-commands/senior-security.md +209 -0
- package/merged-commands/seo-audit.md +487 -0
- package/merged-commands/seo-authority-builder.md +136 -0
- package/merged-commands/seo-cannibalization-detector.md +123 -0
- package/merged-commands/seo-content-auditor.md +83 -0
- package/merged-commands/seo-content-planner.md +108 -0
- package/merged-commands/seo-content-refresher.md +118 -0
- package/merged-commands/seo-content-writer.md +96 -0
- package/merged-commands/seo-fundamentals.md +173 -0
- package/merged-commands/seo-keyword-strategist.md +95 -0
- package/merged-commands/seo-meta-optimizer.md +92 -0
- package/merged-commands/seo-snippet-hunter.md +114 -0
- package/merged-commands/seo-structure-architect.md +108 -0
- package/merged-commands/sequential-thinking.md +94 -0
- package/merged-commands/server-management.md +161 -0
- package/merged-commands/service-mesh-expert.md +58 -0
- package/merged-commands/service-mesh-observability.md +395 -0
- package/merged-commands/sharp-edges.md +70 -0
- package/merged-commands/shellcheck-configuration.md +466 -0
- package/merged-commands/shodan-reconnaissance.md +503 -0
- package/merged-commands/shopify-apps.md +42 -0
- package/merged-commands/shopify-development.md +366 -0
- package/merged-commands/shopify-expert.md +102 -0
- package/merged-commands/signup-flow-cro.md +355 -0
- package/merged-commands/similarity-search-patterns.md +33 -0
- package/merged-commands/skill-creator.md +356 -0
- package/merged-commands/skill-developer.md +426 -0
- package/merged-commands/skill-rails-upgrade.md +408 -0
- package/merged-commands/skill-seekers.md +22 -0
- package/merged-commands/skill-share.md +80 -0
- package/merged-commands/slack-bot-builder.md +264 -0
- package/merged-commands/slack-gif-creator.md +254 -0
- package/merged-commands/slo-implementation.md +341 -0
- package/merged-commands/smtp-penetration-testing.md +500 -0
- package/merged-commands/social-content.md +807 -0
- package/merged-commands/software-architecture.md +75 -0
- package/merged-commands/solidity-security.md +34 -0
- package/merged-commands/spark-engineer.md +100 -0
- package/merged-commands/spark-optimization.md +427 -0
- package/merged-commands/spec-miner.md +88 -0
- package/merged-commands/spring-boot-engineer.md +104 -0
- package/merged-commands/sql-injection-testing.md +448 -0
- package/merged-commands/sql-optimization-patterns.md +35 -0
- package/merged-commands/sql-pro.md +173 -0
- package/merged-commands/sqlmap-database-pentesting.md +400 -0
- package/merged-commands/sre-engineer.md +98 -0
- package/merged-commands/ssh-penetration-testing.md +488 -0
- package/merged-commands/startup-analyst.md +328 -0
- package/merged-commands/startup-business-analyst-business-case.md +487 -0
- package/merged-commands/startup-business-analyst-financial-projections.md +353 -0
- package/merged-commands/startup-business-analyst-market-opportunity.md +240 -0
- package/merged-commands/startup-financial-modeling.md +467 -0
- package/merged-commands/startup-metrics-framework.md +34 -0
- package/merged-commands/stitch-ui-design.md +378 -0
- package/merged-commands/stride-analysis-patterns.md +33 -0
- package/merged-commands/stripe-integration.md +454 -0
- package/merged-commands/subagent-driven-development.md +240 -0
- package/merged-commands/superpowers-lab.md +22 -0
- package/merged-commands/swift-expert.md +94 -0
- package/merged-commands/swiftui-expert-skill.md +275 -0
- package/merged-commands/systematic-debugging.md +296 -0
- package/merged-commands/systems-programming-rust-project.md +440 -0
- package/merged-commands/tailwind-design-system.md +33 -0
- package/merged-commands/tailwind-patterns.md +269 -0
- package/merged-commands/tavily-web.md +36 -0
- package/merged-commands/tdd-orchestrator.md +205 -0
- package/merged-commands/tdd-workflow.md +149 -0
- package/merged-commands/tdd-workflows-tdd-cycle.md +221 -0
- package/merged-commands/tdd-workflows-tdd-green.md +73 -0
- package/merged-commands/tdd-workflows-tdd-red.md +164 -0
- package/merged-commands/tdd-workflows-tdd-refactor.md +187 -0
- package/merged-commands/team-collaboration-issue.md +37 -0
- package/merged-commands/team-collaboration-standup-notes.md +44 -0
- package/merged-commands/team-composition-analysis.md +413 -0
- package/merged-commands/telegram-bot-builder.md +254 -0
- package/merged-commands/telegram-mini-app.md +279 -0
- package/merged-commands/template-skill.md +6 -0
- package/merged-commands/temporal-python-pro.md +370 -0
- package/merged-commands/temporal-python-testing.md +170 -0
- package/merged-commands/terraform-engineer.md +97 -0
- package/merged-commands/terraform-module-library.md +261 -0
- package/merged-commands/terraform-skill.md +517 -0
- package/merged-commands/terraform-specialist.md +166 -0
- package/merged-commands/test-automator.md +224 -0
- package/merged-commands/test-driven-development.md +371 -0
- package/merged-commands/test-fixing.md +119 -0
- package/merged-commands/test-master.md +104 -0
- package/merged-commands/testing-patterns.md +259 -0
- package/merged-commands/theme-factory.md +59 -0
- package/merged-commands/threat-mitigation-mapping.md +33 -0
- package/merged-commands/threat-modeling-expert.md +60 -0
- package/merged-commands/threejs-skills.md +22 -0
- package/merged-commands/threejs.md +89 -0
- package/merged-commands/tool-design.md +318 -0
- package/merged-commands/top-web-vulnerabilities.md +543 -0
- package/merged-commands/track-management.md +38 -0
- package/merged-commands/trigger-dev.md +67 -0
- package/merged-commands/turborepo-caching.md +419 -0
- package/merged-commands/tutorial-engineer.md +139 -0
- package/merged-commands/twilio-communications.md +295 -0
- package/merged-commands/typescript-advanced-types.md +35 -0
- package/merged-commands/typescript-expert.md +429 -0
- package/merged-commands/typescript-pro.md +55 -0
- package/merged-commands/ui-design-system.md +32 -0
- package/merged-commands/ui-skills.md +22 -0
- package/merged-commands/ui-styling.md +321 -0
- package/merged-commands/ui-ux-designer.md +209 -0
- package/merged-commands/ui-ux-pro-max.md +351 -0
- package/merged-commands/ui-visual-validator.md +214 -0
- package/merged-commands/unit-testing-test-generate.md +319 -0
- package/merged-commands/unity-developer.md +230 -0
- package/merged-commands/unity-ecs-patterns.md +33 -0
- package/merged-commands/unreal-engine-cpp-pro.md +114 -0
- package/merged-commands/upgrading-expo.md +118 -0
- package/merged-commands/upstash-qstash.md +68 -0
- package/merged-commands/using-git-worktrees.md +217 -0
- package/merged-commands/using-neon.md +84 -0
- package/merged-commands/using-superpowers.md +87 -0
- package/merged-commands/uv-package-manager.md +37 -0
- package/merged-commands/ux-researcher-designer.md +30 -0
- package/merged-commands/varlock-claude-skill.md +22 -0
- package/merged-commands/vector-database-engineer.md +60 -0
- package/merged-commands/vector-index-tuning.md +42 -0
- package/merged-commands/vercel-deploy-claimable.md +120 -0
- package/merged-commands/vercel-deploy.md +22 -0
- package/merged-commands/vercel-deployment.md +79 -0
- package/merged-commands/verification-before-completion.md +139 -0
- package/merged-commands/vexor.md +22 -0
- package/merged-commands/video-downloader.md +106 -0
- package/merged-commands/viral-generator-builder.md +199 -0
- package/merged-commands/voice-agents.md +68 -0
- package/merged-commands/voice-ai-development.md +302 -0
- package/merged-commands/voice-ai-engine-development.md +721 -0
- package/merged-commands/vue-expert-js.md +91 -0
- package/merged-commands/vue-expert.md +374 -0
- package/merged-commands/vulnerability-scanner.md +276 -0
- package/merged-commands/wcag-audit-patterns.md +41 -0
- package/merged-commands/web-artifacts-builder.md +74 -0
- package/merged-commands/web-design-guidelines.md +36 -0
- package/merged-commands/web-frameworks.md +324 -0
- package/merged-commands/web-performance-optimization.md +646 -0
- package/merged-commands/web3-testing.md +427 -0
- package/merged-commands/webapp-testing.md +96 -0
- package/merged-commands/websocket-engineer.md +96 -0
- package/merged-commands/windows-privilege-escalation.md +496 -0
- package/merged-commands/wireshark-analysis.md +497 -0
- package/merged-commands/wordpress-penetration-testing.md +485 -0
- package/merged-commands/wordpress-pro.md +105 -0
- package/merged-commands/workflow-automation.md +68 -0
- package/merged-commands/workflow-orchestration-patterns.md +333 -0
- package/merged-commands/workflow-patterns.md +38 -0
- package/merged-commands/writing-plans.md +116 -0
- package/merged-commands/writing-skills.md +125 -0
- package/merged-commands/x-article-publisher-skill.md +22 -0
- package/merged-commands/xlsx-official.md +289 -0
- package/merged-commands/xlsx.md +289 -0
- package/merged-commands/xss-html-injection.md +499 -0
- package/merged-commands/youtube-transcript.md +415 -0
- package/merged-commands/zapier-make-patterns.md +67 -0
- package/merged-commands/zustand-store.md +68 -0
- package/package.json +1 -1
- package/scripts/merge-commands.js +21 -0
|
@@ -0,0 +1,760 @@
|
|
|
1
|
+
---
|
|
2
|
+
name: llm-app-patterns
|
|
3
|
+
description: "Production-ready patterns for building LLM applications. Covers RAG pipelines, agent architectures, prompt IDEs, and LLMOps monitoring. Use when designing AI applications, implementing RAG, building agents, or setting up LLM observability."
|
|
4
|
+
---
|
|
5
|
+
|
|
6
|
+
# 🤖 LLM Application Patterns
|
|
7
|
+
|
|
8
|
+
> Production-ready patterns for building LLM applications, inspired by [Dify](https://github.com/langgenius/dify) and industry best practices.
|
|
9
|
+
|
|
10
|
+
## When to Use This Skill
|
|
11
|
+
|
|
12
|
+
Use this skill when:
|
|
13
|
+
|
|
14
|
+
- Designing LLM-powered applications
|
|
15
|
+
- Implementing RAG (Retrieval-Augmented Generation)
|
|
16
|
+
- Building AI agents with tools
|
|
17
|
+
- Setting up LLMOps monitoring
|
|
18
|
+
- Choosing between agent architectures
|
|
19
|
+
|
|
20
|
+
---
|
|
21
|
+
|
|
22
|
+
## 1. RAG Pipeline Architecture
|
|
23
|
+
|
|
24
|
+
### Overview
|
|
25
|
+
|
|
26
|
+
RAG (Retrieval-Augmented Generation) grounds LLM responses in your data.
|
|
27
|
+
|
|
28
|
+
```
|
|
29
|
+
┌─────────────┐     ┌─────────────┐     ┌─────────────┐
|
|
30
|
+
│   Ingest    │────▶│  Retrieve   │────▶│  Generate   │
|
|
31
|
+
│  Documents  │     │   Context   │     │  Response   │
|
|
32
|
+
└─────────────┘     └─────────────┘     └─────────────┘
|
|
33
|
+
       │                   │                   │
|
|
34
|
+
       ▼                   ▼                   ▼
|
|
35
|
+
  ┌─────────┐        ┌───────────┐       ┌───────────┐
|
|
36
|
+
  │ Chunking│        │  Vector   │       │    LLM    │
|
|
37
|
+
  │Embedding│        │  Search   │       │  + Context│
|
|
38
|
+
  └─────────┘        └───────────┘       └───────────┘
|
|
39
|
+
```
|
|
40
|
+
|
|
41
|
+
### 1.1 Document Ingestion
|
|
42
|
+
|
|
43
|
+
```python
|
|
44
|
+
# Chunking strategies
|
|
45
|
+
class ChunkingStrategy:
|
|
46
|
+
# Fixed-size chunks (simple but may break context)
|
|
47
|
+
FIXED_SIZE = "fixed_size" # e.g., 512 tokens
|
|
48
|
+
|
|
49
|
+
# Semantic chunking (preserves meaning)
|
|
50
|
+
SEMANTIC = "semantic" # Split on paragraphs/sections
|
|
51
|
+
|
|
52
|
+
# Recursive splitting (tries multiple separators)
|
|
53
|
+
RECURSIVE = "recursive" # ["\n\n", "\n", " ", ""]
|
|
54
|
+
|
|
55
|
+
# Document-aware (respects structure)
|
|
56
|
+
DOCUMENT_AWARE = "document_aware" # Headers, lists, etc.
|
|
57
|
+
|
|
58
|
+
# Recommended settings
|
|
59
|
+
CHUNK_CONFIG = {
|
|
60
|
+
"chunk_size": 512, # tokens
|
|
61
|
+
"chunk_overlap": 50, # token overlap between chunks
|
|
62
|
+
"separators": ["\n\n", "\n", ". ", " "],
|
|
63
|
+
}
|
|
64
|
+
```
|
|
65
|
+
|
|
66
|
+
### 1.2 Embedding & Storage
|
|
67
|
+
|
|
68
|
+
```python
|
|
69
|
+
# Vector database selection
|
|
70
|
+
VECTOR_DB_OPTIONS = {
|
|
71
|
+
"pinecone": {
|
|
72
|
+
"use_case": "Production, managed service",
|
|
73
|
+
"scale": "Billions of vectors",
|
|
74
|
+
"features": ["Hybrid search", "Metadata filtering"]
|
|
75
|
+
},
|
|
76
|
+
"weaviate": {
|
|
77
|
+
"use_case": "Self-hosted, multi-modal",
|
|
78
|
+
"scale": "Millions of vectors",
|
|
79
|
+
"features": ["GraphQL API", "Modules"]
|
|
80
|
+
},
|
|
81
|
+
"chromadb": {
|
|
82
|
+
"use_case": "Development, prototyping",
|
|
83
|
+
"scale": "Thousands of vectors",
|
|
84
|
+
"features": ["Simple API", "In-memory option"]
|
|
85
|
+
},
|
|
86
|
+
"pgvector": {
|
|
87
|
+
"use_case": "Existing Postgres infrastructure",
|
|
88
|
+
"scale": "Millions of vectors",
|
|
89
|
+
"features": ["SQL integration", "ACID compliance"]
|
|
90
|
+
}
|
|
91
|
+
}
|
|
92
|
+
|
|
93
|
+
# Embedding model selection
|
|
94
|
+
EMBEDDING_MODELS = {
|
|
95
|
+
"openai/text-embedding-3-small": {
|
|
96
|
+
"dimensions": 1536,
|
|
97
|
+
"cost": "$0.02/1M tokens",
|
|
98
|
+
"quality": "Good for most use cases"
|
|
99
|
+
},
|
|
100
|
+
"openai/text-embedding-3-large": {
|
|
101
|
+
"dimensions": 3072,
|
|
102
|
+
"cost": "$0.13/1M tokens",
|
|
103
|
+
"quality": "Best for complex queries"
|
|
104
|
+
},
|
|
105
|
+
"local/bge-large": {
|
|
106
|
+
"dimensions": 1024,
|
|
107
|
+
"cost": "Free (compute only)",
|
|
108
|
+
"quality": "Comparable to OpenAI small"
|
|
109
|
+
}
|
|
110
|
+
}
|
|
111
|
+
```
|
|
112
|
+
|
|
113
|
+
### 1.3 Retrieval Strategies
|
|
114
|
+
|
|
115
|
+
```python
|
|
116
|
+
# Basic semantic search
|
|
117
|
+
def semantic_search(query: str, top_k: int = 5):
|
|
118
|
+
query_embedding = embed(query)
|
|
119
|
+
results = vector_db.similarity_search(
|
|
120
|
+
query_embedding,
|
|
121
|
+
top_k=top_k
|
|
122
|
+
)
|
|
123
|
+
return results
|
|
124
|
+
|
|
125
|
+
# Hybrid search (semantic + keyword)
|
|
126
|
+
def hybrid_search(query: str, top_k: int = 5, alpha: float = 0.5):
|
|
127
|
+
"""
|
|
128
|
+
alpha=1.0: Pure semantic
|
|
129
|
+
alpha=0.0: Pure keyword (BM25)
|
|
130
|
+
alpha=0.5: Balanced
|
|
131
|
+
"""
|
|
132
|
+
semantic_results = vector_db.similarity_search(query)
|
|
133
|
+
keyword_results = bm25_search(query)
|
|
134
|
+
|
|
135
|
+
# Reciprocal Rank Fusion
|
|
136
|
+
return rrf_merge(semantic_results, keyword_results, alpha)
|
|
137
|
+
|
|
138
|
+
# Multi-query retrieval
|
|
139
|
+
def multi_query_retrieval(query: str):
|
|
140
|
+
"""Generate multiple query variations for better recall"""
|
|
141
|
+
queries = llm.generate_query_variations(query, n=3)
|
|
142
|
+
all_results = []
|
|
143
|
+
for q in queries:
|
|
144
|
+
all_results.extend(semantic_search(q))
|
|
145
|
+
return deduplicate(all_results)
|
|
146
|
+
|
|
147
|
+
# Contextual compression
|
|
148
|
+
def compressed_retrieval(query: str):
|
|
149
|
+
"""Retrieve then compress to relevant parts only"""
|
|
150
|
+
docs = semantic_search(query, top_k=10)
|
|
151
|
+
compressed = llm.extract_relevant_parts(docs, query)
|
|
152
|
+
return compressed
|
|
153
|
+
```
|
|
154
|
+
|
|
155
|
+
### 1.4 Generation with Context
|
|
156
|
+
|
|
157
|
+
```python
|
|
158
|
+
RAG_PROMPT_TEMPLATE = """
|
|
159
|
+
Answer the user's question based ONLY on the following context.
|
|
160
|
+
If the context doesn't contain enough information, say "I don't have enough information to answer that."
|
|
161
|
+
|
|
162
|
+
Context:
|
|
163
|
+
{context}
|
|
164
|
+
|
|
165
|
+
Question: {question}
|
|
166
|
+
|
|
167
|
+
Answer:"""
|
|
168
|
+
|
|
169
|
+
def generate_with_rag(question: str):
|
|
170
|
+
# Retrieve
|
|
171
|
+
context_docs = hybrid_search(question, top_k=5)
|
|
172
|
+
context = "\n\n".join([doc.content for doc in context_docs])
|
|
173
|
+
|
|
174
|
+
# Generate
|
|
175
|
+
prompt = RAG_PROMPT_TEMPLATE.format(
|
|
176
|
+
context=context,
|
|
177
|
+
question=question
|
|
178
|
+
)
|
|
179
|
+
|
|
180
|
+
response = llm.generate(prompt)
|
|
181
|
+
|
|
182
|
+
# Return with citations
|
|
183
|
+
return {
|
|
184
|
+
"answer": response,
|
|
185
|
+
"sources": [doc.metadata for doc in context_docs]
|
|
186
|
+
}
|
|
187
|
+
```
|
|
188
|
+
|
|
189
|
+
---
|
|
190
|
+
|
|
191
|
+
## 2. Agent Architectures
|
|
192
|
+
|
|
193
|
+
### 2.1 ReAct Pattern (Reasoning + Acting)
|
|
194
|
+
|
|
195
|
+
```
|
|
196
|
+
Thought: I need to search for information about X
|
|
197
|
+
Action: search("X")
|
|
198
|
+
Observation: [search results]
|
|
199
|
+
Thought: Based on the results, I should...
|
|
200
|
+
Action: calculate(...)
|
|
201
|
+
Observation: [calculation result]
|
|
202
|
+
Thought: I now have enough information
|
|
203
|
+
Final Answer: The answer is...
|
|
204
|
+
```
|
|
205
|
+
|
|
206
|
+
```python
|
|
207
|
+
REACT_PROMPT = """
|
|
208
|
+
You are an AI assistant that can use tools to answer questions.
|
|
209
|
+
|
|
210
|
+
Available tools:
|
|
211
|
+
{tools_description}
|
|
212
|
+
|
|
213
|
+
Use this format:
|
|
214
|
+
Thought: [your reasoning about what to do next]
|
|
215
|
+
Action: [tool_name(arguments)]
|
|
216
|
+
Observation: [tool result - this will be filled in]
|
|
217
|
+
... (repeat Thought/Action/Observation as needed)
|
|
218
|
+
Thought: I have enough information to answer
|
|
219
|
+
Final Answer: [your final response]
|
|
220
|
+
|
|
221
|
+
Question: {question}
|
|
222
|
+
"""
|
|
223
|
+
|
|
224
|
+
class ReActAgent:
|
|
225
|
+
def __init__(self, tools: list, llm):
|
|
226
|
+
self.tools = {t.name: t for t in tools}
|
|
227
|
+
self.llm = llm
|
|
228
|
+
self.max_iterations = 10
|
|
229
|
+
|
|
230
|
+
def run(self, question: str) -> str:
|
|
231
|
+
prompt = REACT_PROMPT.format(
|
|
232
|
+
tools_description=self._format_tools(),
|
|
233
|
+
question=question
|
|
234
|
+
)
|
|
235
|
+
|
|
236
|
+
for _ in range(self.max_iterations):
|
|
237
|
+
response = self.llm.generate(prompt)
|
|
238
|
+
|
|
239
|
+
if "Final Answer:" in response:
|
|
240
|
+
return self._extract_final_answer(response)
|
|
241
|
+
|
|
242
|
+
action = self._parse_action(response)
|
|
243
|
+
observation = self._execute_tool(action)
|
|
244
|
+
prompt += f"\nObservation: {observation}\n"
|
|
245
|
+
|
|
246
|
+
return "Max iterations reached"
|
|
247
|
+
```
|
|
248
|
+
|
|
249
|
+
### 2.2 Function Calling Pattern
|
|
250
|
+
|
|
251
|
+
```python
|
|
252
|
+
# Define tools as functions with schemas
|
|
253
|
+
TOOLS = [
|
|
254
|
+
{
|
|
255
|
+
"name": "search_web",
|
|
256
|
+
"description": "Search the web for current information",
|
|
257
|
+
"parameters": {
|
|
258
|
+
"type": "object",
|
|
259
|
+
"properties": {
|
|
260
|
+
"query": {
|
|
261
|
+
"type": "string",
|
|
262
|
+
"description": "Search query"
|
|
263
|
+
}
|
|
264
|
+
},
|
|
265
|
+
"required": ["query"]
|
|
266
|
+
}
|
|
267
|
+
},
|
|
268
|
+
{
|
|
269
|
+
"name": "calculate",
|
|
270
|
+
"description": "Perform mathematical calculations",
|
|
271
|
+
"parameters": {
|
|
272
|
+
"type": "object",
|
|
273
|
+
"properties": {
|
|
274
|
+
"expression": {
|
|
275
|
+
"type": "string",
|
|
276
|
+
"description": "Math expression to evaluate"
|
|
277
|
+
}
|
|
278
|
+
},
|
|
279
|
+
"required": ["expression"]
|
|
280
|
+
}
|
|
281
|
+
}
|
|
282
|
+
]
|
|
283
|
+
|
|
284
|
+
class FunctionCallingAgent:
|
|
285
|
+
def run(self, question: str) -> str:
|
|
286
|
+
messages = [{"role": "user", "content": question}]
|
|
287
|
+
|
|
288
|
+
while True:
|
|
289
|
+
response = self.llm.chat(
|
|
290
|
+
messages=messages,
|
|
291
|
+
tools=TOOLS,
|
|
292
|
+
tool_choice="auto"
|
|
293
|
+
)
|
|
294
|
+
|
|
295
|
+
if response.tool_calls:
|
|
296
|
+
for tool_call in response.tool_calls:
|
|
297
|
+
result = self._execute_tool(
|
|
298
|
+
tool_call.name,
|
|
299
|
+
tool_call.arguments
|
|
300
|
+
)
|
|
301
|
+
messages.append({
|
|
302
|
+
"role": "tool",
|
|
303
|
+
"tool_call_id": tool_call.id,
|
|
304
|
+
"content": str(result)
|
|
305
|
+
})
|
|
306
|
+
else:
|
|
307
|
+
return response.content
|
|
308
|
+
```
|
|
309
|
+
|
|
310
|
+
### 2.3 Plan-and-Execute Pattern
|
|
311
|
+
|
|
312
|
+
```python
|
|
313
|
+
class PlanAndExecuteAgent:
|
|
314
|
+
"""
|
|
315
|
+
1. Create a plan (list of steps)
|
|
316
|
+
2. Execute each step
|
|
317
|
+
3. Replan if needed
|
|
318
|
+
"""
|
|
319
|
+
|
|
320
|
+
def run(self, task: str) -> str:
|
|
321
|
+
# Planning phase
|
|
322
|
+
plan = self.planner.create_plan(task)
|
|
323
|
+
# Returns: ["Step 1: ...", "Step 2: ...", ...]
|
|
324
|
+
|
|
325
|
+
results = []
|
|
326
|
+
for step in plan:
|
|
327
|
+
# Execute each step
|
|
328
|
+
result = self.executor.execute(step, context=results)
|
|
329
|
+
results.append(result)
|
|
330
|
+
|
|
331
|
+
# Check if replan needed
|
|
332
|
+
if self._needs_replan(task, results):
|
|
333
|
+
new_plan = self.planner.replan(
|
|
334
|
+
task,
|
|
335
|
+
completed=results,
|
|
336
|
+
remaining=plan[len(results):]
|
|
337
|
+
)
|
|
338
|
+
plan = new_plan
|
|
339
|
+
|
|
340
|
+
# Synthesize final answer
|
|
341
|
+
return self.synthesizer.summarize(task, results)
|
|
342
|
+
```
|
|
343
|
+
|
|
344
|
+
### 2.4 Multi-Agent Collaboration
|
|
345
|
+
|
|
346
|
+
```python
|
|
347
|
+
class AgentTeam:
|
|
348
|
+
"""
|
|
349
|
+
Specialized agents collaborating on complex tasks
|
|
350
|
+
"""
|
|
351
|
+
|
|
352
|
+
def __init__(self):
|
|
353
|
+
self.agents = {
|
|
354
|
+
"researcher": ResearchAgent(),
|
|
355
|
+
"analyst": AnalystAgent(),
|
|
356
|
+
"writer": WriterAgent(),
|
|
357
|
+
"critic": CriticAgent()
|
|
358
|
+
}
|
|
359
|
+
self.coordinator = CoordinatorAgent()
|
|
360
|
+
|
|
361
|
+
def solve(self, task: str) -> str:
|
|
362
|
+
# Coordinator assigns subtasks
|
|
363
|
+
assignments = self.coordinator.decompose(task)
|
|
364
|
+
|
|
365
|
+
results = {}
|
|
366
|
+
for assignment in assignments:
|
|
367
|
+
agent = self.agents[assignment.agent]
|
|
368
|
+
result = agent.execute(
|
|
369
|
+
assignment.subtask,
|
|
370
|
+
context=results
|
|
371
|
+
)
|
|
372
|
+
results[assignment.id] = result
|
|
373
|
+
|
|
374
|
+
# Critic reviews
|
|
375
|
+
critique = self.agents["critic"].review(results)
|
|
376
|
+
|
|
377
|
+
if critique.needs_revision:
|
|
378
|
+
# Iterate with feedback
|
|
379
|
+
return self.solve_with_feedback(task, results, critique)
|
|
380
|
+
|
|
381
|
+
return self.coordinator.synthesize(results)
|
|
382
|
+
```
|
|
383
|
+
|
|
384
|
+
---
|
|
385
|
+
|
|
386
|
+
## 3. Prompt IDE Patterns
|
|
387
|
+
|
|
388
|
+
### 3.1 Prompt Templates with Variables
|
|
389
|
+
|
|
390
|
+
```python
|
|
391
|
+
class PromptTemplate:
|
|
392
|
+
def __init__(self, template: str, variables: list[str]):
|
|
393
|
+
self.template = template
|
|
394
|
+
self.variables = variables
|
|
395
|
+
|
|
396
|
+
def format(self, **kwargs) -> str:
|
|
397
|
+
# Validate all variables provided
|
|
398
|
+
missing = set(self.variables) - set(kwargs.keys())
|
|
399
|
+
if missing:
|
|
400
|
+
raise ValueError(f"Missing variables: {missing}")
|
|
401
|
+
|
|
402
|
+
return self.template.format(**kwargs)
|
|
403
|
+
|
|
404
|
+
def with_examples(self, examples: list[dict]) -> str:
|
|
405
|
+
"""Add few-shot examples"""
|
|
406
|
+
example_text = "\n\n".join([
|
|
407
|
+
f"Input: {ex['input']}\nOutput: {ex['output']}"
|
|
408
|
+
for ex in examples
|
|
409
|
+
])
|
|
410
|
+
return f"{example_text}\n\n{self.template}"
|
|
411
|
+
|
|
412
|
+
# Usage
|
|
413
|
+
summarizer = PromptTemplate(
|
|
414
|
+
template="Summarize the following text in {style} style:\n\n{text}",
|
|
415
|
+
variables=["style", "text"]
|
|
416
|
+
)
|
|
417
|
+
|
|
418
|
+
prompt = summarizer.format(
|
|
419
|
+
style="professional",
|
|
420
|
+
text="Long article content..."
|
|
421
|
+
)
|
|
422
|
+
```
|
|
423
|
+
|
|
424
|
+
### 3.2 Prompt Versioning & A/B Testing
|
|
425
|
+
|
|
426
|
+
```python
|
|
427
|
+
class PromptRegistry:
|
|
428
|
+
def __init__(self, db):
|
|
429
|
+
self.db = db
|
|
430
|
+
|
|
431
|
+
def register(self, name: str, template: str, version: str):
|
|
432
|
+
"""Store prompt with version"""
|
|
433
|
+
self.db.save({
|
|
434
|
+
"name": name,
|
|
435
|
+
"template": template,
|
|
436
|
+
"version": version,
|
|
437
|
+
"created_at": datetime.now(),
|
|
438
|
+
"metrics": {}
|
|
439
|
+
})
|
|
440
|
+
|
|
441
|
+
def get(self, name: str, version: str = "latest") -> str:
|
|
442
|
+
"""Retrieve specific version"""
|
|
443
|
+
return self.db.get(name, version)
|
|
444
|
+
|
|
445
|
+
def ab_test(self, name: str, user_id: str) -> str:
|
|
446
|
+
"""Return variant based on user bucket"""
|
|
447
|
+
variants = self.db.get_all_versions(name)
|
|
448
|
+
bucket = hash(user_id) % len(variants)
|
|
449
|
+
return variants[bucket]
|
|
450
|
+
|
|
451
|
+
def record_outcome(self, prompt_id: str, outcome: dict):
|
|
452
|
+
"""Track prompt performance"""
|
|
453
|
+
self.db.update_metrics(prompt_id, outcome)
|
|
454
|
+
```
|
|
455
|
+
|
|
456
|
+
### 3.3 Prompt Chaining
|
|
457
|
+
|
|
458
|
+
```python
|
|
459
|
+
class PromptChain:
|
|
460
|
+
"""
|
|
461
|
+
Chain prompts together, passing output as input to next
|
|
462
|
+
"""
|
|
463
|
+
|
|
464
|
+
def __init__(self, steps: list[dict]):
|
|
465
|
+
self.steps = steps
|
|
466
|
+
|
|
467
|
+
def run(self, initial_input: str) -> dict:
|
|
468
|
+
context = {"input": initial_input}
|
|
469
|
+
results = []
|
|
470
|
+
|
|
471
|
+
for step in self.steps:
|
|
472
|
+
prompt = step["prompt"].format(**context)
|
|
473
|
+
output = llm.generate(prompt)
|
|
474
|
+
|
|
475
|
+
# Parse output if needed
|
|
476
|
+
if step.get("parser"):
|
|
477
|
+
output = step["parser"](output)
|
|
478
|
+
|
|
479
|
+
context[step["output_key"]] = output
|
|
480
|
+
results.append({
|
|
481
|
+
"step": step["name"],
|
|
482
|
+
"output": output
|
|
483
|
+
})
|
|
484
|
+
|
|
485
|
+
return {
|
|
486
|
+
"final_output": context[self.steps[-1]["output_key"]],
|
|
487
|
+
"intermediate_results": results
|
|
488
|
+
}
|
|
489
|
+
|
|
490
|
+
# Example: Research → Analyze → Summarize
|
|
491
|
+
chain = PromptChain([
|
|
492
|
+
{
|
|
493
|
+
"name": "research",
|
|
494
|
+
"prompt": "Research the topic: {input}",
|
|
495
|
+
"output_key": "research"
|
|
496
|
+
},
|
|
497
|
+
{
|
|
498
|
+
"name": "analyze",
|
|
499
|
+
"prompt": "Analyze these findings:\n{research}",
|
|
500
|
+
"output_key": "analysis"
|
|
501
|
+
},
|
|
502
|
+
{
|
|
503
|
+
"name": "summarize",
|
|
504
|
+
"prompt": "Summarize this analysis in 3 bullet points:\n{analysis}",
|
|
505
|
+
"output_key": "summary"
|
|
506
|
+
}
|
|
507
|
+
])
|
|
508
|
+
```
|
|
509
|
+
|
|
510
|
+
---
|
|
511
|
+
|
|
512
|
+
## 4. LLMOps & Observability
|
|
513
|
+
|
|
514
|
+
### 4.1 Metrics to Track
|
|
515
|
+
|
|
516
|
+
```python
|
|
517
|
+
LLM_METRICS = {
|
|
518
|
+
# Performance
|
|
519
|
+
"latency_p50": "50th percentile response time",
|
|
520
|
+
"latency_p99": "99th percentile response time",
|
|
521
|
+
"tokens_per_second": "Generation speed",
|
|
522
|
+
|
|
523
|
+
# Quality
|
|
524
|
+
"user_satisfaction": "Thumbs up/down ratio",
|
|
525
|
+
"task_completion": "% tasks completed successfully",
|
|
526
|
+
"hallucination_rate": "% responses with factual errors",
|
|
527
|
+
|
|
528
|
+
# Cost
|
|
529
|
+
"cost_per_request": "Average $ per API call",
|
|
530
|
+
"tokens_per_request": "Average tokens used",
|
|
531
|
+
"cache_hit_rate": "% requests served from cache",
|
|
532
|
+
|
|
533
|
+
# Reliability
|
|
534
|
+
"error_rate": "% failed requests",
|
|
535
|
+
"timeout_rate": "% requests that timed out",
|
|
536
|
+
"retry_rate": "% requests needing retry"
|
|
537
|
+
}
|
|
538
|
+
```
|
|
539
|
+
|
|
540
|
+
### 4.2 Logging & Tracing
|
|
541
|
+
|
|
542
|
+
```python
|
|
543
|
+
import logging
|
|
544
|
+
from opentelemetry import trace
|
|
545
|
+
|
|
546
|
+
tracer = trace.get_tracer(__name__)
|
|
547
|
+
|
|
548
|
+
class LLMLogger:
|
|
549
|
+
def log_request(self, request_id: str, data: dict):
|
|
550
|
+
"""Log LLM request for debugging and analysis"""
|
|
551
|
+
log_entry = {
|
|
552
|
+
"request_id": request_id,
|
|
553
|
+
"timestamp": datetime.now().isoformat(),
|
|
554
|
+
"model": data["model"],
|
|
555
|
+
"prompt": data["prompt"][:500], # Truncate for storage
|
|
556
|
+
"prompt_tokens": data["prompt_tokens"],
|
|
557
|
+
"temperature": data.get("temperature", 1.0),
|
|
558
|
+
"user_id": data.get("user_id"),
|
|
559
|
+
}
|
|
560
|
+
logging.info(f"LLM_REQUEST: {json.dumps(log_entry)}")
|
|
561
|
+
|
|
562
|
+
def log_response(self, request_id: str, data: dict):
|
|
563
|
+
"""Log LLM response"""
|
|
564
|
+
log_entry = {
|
|
565
|
+
"request_id": request_id,
|
|
566
|
+
"completion_tokens": data["completion_tokens"],
|
|
567
|
+
"total_tokens": data["total_tokens"],
|
|
568
|
+
"latency_ms": data["latency_ms"],
|
|
569
|
+
"finish_reason": data["finish_reason"],
|
|
570
|
+
"cost_usd": self._calculate_cost(data),
|
|
571
|
+
}
|
|
572
|
+
logging.info(f"LLM_RESPONSE: {json.dumps(log_entry)}")
|
|
573
|
+
|
|
574
|
+
# Distributed tracing
|
|
575
|
+
@tracer.start_as_current_span("llm_call")
|
|
576
|
+
def call_llm(prompt: str) -> str:
|
|
577
|
+
span = trace.get_current_span()
|
|
578
|
+
span.set_attribute("prompt.length", len(prompt))
|
|
579
|
+
|
|
580
|
+
response = llm.generate(prompt)
|
|
581
|
+
|
|
582
|
+
span.set_attribute("response.length", len(response))
|
|
583
|
+
span.set_attribute("tokens.total", response.usage.total_tokens)
|
|
584
|
+
|
|
585
|
+
return response.content
|
|
586
|
+
```
|
|
587
|
+
|
|
588
|
+
### 4.3 Evaluation Framework
|
|
589
|
+
|
|
590
|
+
```python
|
|
591
|
+
class LLMEvaluator:
    """
    Evaluate LLM outputs for quality
    """

    def evaluate_response(self,
                          question: str,
                          response: str,
                          ground_truth: str = None) -> dict:
        """Score a single response along several quality dimensions.

        Args:
            question: The prompt the response is meant to answer.
            response: The model output being evaluated.
            ground_truth: Optional expected answer. When it is not ``None``
                (an empty string counts as a real expectation) an
                ``"accuracy"`` score is added.

        Returns:
            Dict with ``relevance``, ``coherence``, ``groundedness`` and
            ``safety`` scores, plus ``accuracy`` when a ground truth is given.
        """
        scores = {}

        # Relevance: Does it answer the question?
        scores["relevance"] = self._score_relevance(question, response)

        # Coherence: Is it well-structured?
        scores["coherence"] = self._score_coherence(response)

        # Groundedness: scored from the response alone, since no context is
        # passed in here.
        scores["groundedness"] = self._score_groundedness(response)

        # Accuracy: Does it match ground truth?
        # Compare against None explicitly so an expected empty answer ("")
        # is still scored instead of being silently skipped.
        if ground_truth is not None:
            scores["accuracy"] = self._score_accuracy(response, ground_truth)

        # Harmfulness: Is it safe?
        scores["safety"] = self._score_safety(response)

        return scores

    def run_benchmark(self, test_cases: list[dict]) -> dict:
        """Run evaluation on test set

        Args:
            test_cases: Dicts with a required ``"prompt"`` key and an
                optional ``"expected"`` key used as the ground truth.

        Returns:
            Whatever ``self._aggregate_scores`` produces from the per-case
            score dicts.
        """
        results = []
        for case in test_cases:
            response = llm.generate(case["prompt"])
            scores = self.evaluate_response(
                question=case["prompt"],
                response=response,
                ground_truth=case.get("expected"),
            )
            results.append(scores)

        return self._aggregate_scores(results)
|
|
633
|
+
```
|
|
634
|
+
|
|
635
|
+
---
|
|
636
|
+
|
|
637
|
+
## 5. Production Patterns
|
|
638
|
+
|
|
639
|
+
### 5.1 Caching Strategy
|
|
640
|
+
|
|
641
|
+
```python
|
|
642
|
+
import hashlib
|
|
643
|
+
from functools import lru_cache
|
|
644
|
+
|
|
645
|
+
class LLMCache:
    """Redis-backed cache for LLM completions keyed by model, prompt and options."""

    def __init__(self, redis_client, ttl_seconds=3600):
        """Store the Redis client and the expiry applied to cached entries.

        Args:
            redis_client: Object providing ``get(key)`` and
                ``setex(key, ttl, value)``.
            ttl_seconds: Lifetime of each cached entry, in seconds.
        """
        self.redis = redis_client
        self.ttl = ttl_seconds

    def _cache_key(self, prompt: str, model: str, **kwargs) -> str:
        """Generate deterministic cache key

        The key is the SHA-256 hex digest of the model, the prompt and the
        JSON-serialized keyword arguments (sorted by key so argument order
        does not change the digest).
        """
        content = f"{model}:{prompt}:{json.dumps(kwargs, sort_keys=True)}"
        return hashlib.sha256(content.encode()).hexdigest()

    def get_or_generate(self, prompt: str, model: str, **kwargs) -> str:
        """Return a cached completion, generating one on a cache miss.

        Args:
            prompt: Prompt text.
            model: Model identifier passed to ``llm.generate``.
            **kwargs: Extra generation options; they are part of the cache key.

        Returns:
            The cached value (decoded when stored as bytes) or the freshly
            generated response.
        """
        key = self._cache_key(prompt, model, **kwargs)

        # Check cache. Only None means "miss": a cached empty completion is
        # still a hit and must not trigger a new generation.
        cached = self.redis.get(key)
        if cached is not None:
            # Clients may return bytes or already-decoded str.
            return cached.decode() if isinstance(cached, bytes) else cached

        # Generate
        response = llm.generate(prompt, model=model, **kwargs)

        # Cache (only cache deterministic outputs)
        if kwargs.get("temperature", 1.0) == 0:
            self.redis.setex(key, self.ttl, response)

        return response
|
|
671
|
+
```
|
|
672
|
+
|
|
673
|
+
### 5.2 Rate Limiting & Retry
|
|
674
|
+
|
|
675
|
+
```python
|
|
676
|
+
import time

from tenacity import retry, retry_if_exception, stop_after_attempt, wait_exponential
|
|
678
|
+
|
|
679
|
+
class RateLimiter:
    """Blocking limiter that tracks call times over a 60-second window."""

    def __init__(self, requests_per_minute: int):
        """Remember the per-minute budget and start with no recorded calls."""
        self.rpm = requests_per_minute
        self.timestamps = []

    def acquire(self):
        """Record a call, sleeping first when the window is already full."""
        now = time.time()

        # Keep only calls made within the last 60 seconds.
        recent = list(filter(lambda stamp: now - stamp < 60, self.timestamps))
        self.timestamps = recent

        window_full = len(recent) >= self.rpm
        if window_full:
            # Sleep until the oldest recorded call is 60 seconds old.
            oldest = recent[0]
            time.sleep(60 - (now - oldest))

        # Stamp with the time after any wait, not the time of entry.
        self.timestamps.append(time.time())
|
|
696
|
+
|
|
697
|
+
# Retry with exponential backoff
|
|
698
|
+
def _is_retryable(exc: BaseException) -> bool:
    """Return True for rate-limit errors and for API errors with a 5xx status."""
    if isinstance(exc, RateLimitError):
        return True
    if isinstance(exc, APIError):
        # A missing or None status code is treated as non-retryable.
        return (getattr(exc, "status_code", None) or 0) >= 500
    return False


@retry(
    # Without an explicit predicate tenacity retries on ANY exception, which
    # would also retry client (4xx) errors that can never succeed.
    retry=retry_if_exception(_is_retryable),
    wait=wait_exponential(multiplier=1, min=4, max=60),
    stop=stop_after_attempt(5)
)
def call_llm_with_retry(prompt: str) -> str:
    """Call ``llm.generate`` with exponential backoff on transient failures.

    Rate-limit errors and server-side (status >= 500) API errors are retried
    for up to 5 attempts, waiting between 4 and 60 seconds. Client errors and
    any other exception propagate immediately without a retry.

    Args:
        prompt: Text sent to ``llm.generate``.

    Returns:
        The value returned by ``llm.generate``.
    """
    return llm.generate(prompt)
|
|
711
|
+
```
|
|
712
|
+
|
|
713
|
+
### 5.3 Fallback Strategy
|
|
714
|
+
|
|
715
|
+
```python
|
|
716
|
+
class LLMWithFallback:
    """Try a primary model first, then each fallback model in order."""

    def __init__(self, primary: str, fallbacks: list[str]):
        """Store the model names.

        Args:
            primary: Model tried first.
            fallbacks: Models tried, in order, after the primary fails.
        """
        self.primary = primary
        self.fallbacks = fallbacks

    def generate(self, prompt: str, **kwargs) -> str:
        """Return the first successful generation across the configured models.

        Args:
            prompt: Text sent to ``llm.generate``.
            **kwargs: Extra options forwarded unchanged to ``llm.generate``.

        Returns:
            The result of the first model call that does not fail.

        Raises:
            AllModelsFailedError: When every model raised ``RateLimitError``
                or ``APIError``; the last such error is attached as the cause.
        """
        # Unpacking accepts any iterable of fallbacks, not only a list.
        models = [self.primary, *self.fallbacks]
        last_error = None

        for model in models:
            try:
                return llm.generate(prompt, model=model, **kwargs)
            except (RateLimitError, APIError) as e:
                logging.warning(f"Model {model} failed: {e}")
                last_error = e

        # Raised outside any `except`, so chain explicitly or the underlying
        # failure would be lost from the traceback.
        raise AllModelsFailedError("All models exhausted") from last_error


# Usage
llm_client = LLMWithFallback(
    primary="gpt-4-turbo",
    fallbacks=["gpt-3.5-turbo", "claude-3-sonnet"],
)
|
|
738
|
+
```
|
|
739
|
+
|
|
740
|
+
---
|
|
741
|
+
|
|
742
|
+
## Architecture Decision Matrix
|
|
743
|
+
|
|
744
|
+
| Pattern | Use When | Complexity | Cost |
|
|
745
|
+
| :------------------- | :--------------- | :--------- | :-------- |
|
|
746
|
+
| **Simple RAG** | FAQ, docs search | Low | Low |
|
|
747
|
+
| **Hybrid RAG** | Mixed queries | Medium | Medium |
|
|
748
|
+
| **ReAct Agent** | Multi-step tasks | Medium | Medium |
|
|
749
|
+
| **Function Calling** | Structured tools | Low | Low |
|
|
750
|
+
| **Plan-Execute** | Complex tasks | High | High |
|
|
751
|
+
| **Multi-Agent** | Research tasks | Very High | Very High |
|
|
752
|
+
|
|
753
|
+
---
|
|
754
|
+
|
|
755
|
+
## Resources
|
|
756
|
+
|
|
757
|
+
- [Dify Platform](https://github.com/langgenius/dify)
|
|
758
|
+
- [LangChain Docs](https://python.langchain.com/)
|
|
759
|
+
- [LlamaIndex](https://www.llamaindex.ai/)
|
|
760
|
+
- [Anthropic Cookbook](https://github.com/anthropics/anthropic-cookbook)
|