@jhm1909/ag-kit 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.agent/ARCHITECTURE.md +189 -0
- package/.agent/known-registries.json +181 -0
- package/.agent/mcp_config.json +19 -0
- package/.agent/rules/clean-code.md +107 -0
- package/.agent/rules/documents.md +177 -0
- package/.agent/rules/git-workflow.md +68 -0
- package/.agent/rules/nano-banana.md +46 -0
- package/.agent/rules/research.md +35 -0
- package/.agent/rules/skill-loading.md +100 -0
- package/.agent/rules/skill-suggestion.md +47 -0
- package/.agent/rules/testing.md +52 -0
- package/.agent/rules/workflow-advisor.md +108 -0
- package/.agent/rules/workflow-skill-convention.md +127 -0
- package/.agent/skills/ai-engineer/SKILL.md +824 -0
- package/.agent/skills/ai-engineer/references/agentic-patterns.md +329 -0
- package/.agent/skills/ai-engineer/references/evaluation.md +493 -0
- package/.agent/skills/ai-engineer/references/llm.md +490 -0
- package/.agent/skills/ai-engineer/references/rag-advanced.md +444 -0
- package/.agent/skills/ai-engineer/references/serving-optimization.md +531 -0
- package/.agent/skills/ai-engineer/vector-db/README.md +137 -0
- package/.agent/skills/app-builder/SKILL.md +75 -0
- package/.agent/skills/app-builder/agent-coordination.md +71 -0
- package/.agent/skills/app-builder/feature-building.md +53 -0
- package/.agent/skills/app-builder/project-detection.md +34 -0
- package/.agent/skills/app-builder/scaffolding.md +118 -0
- package/.agent/skills/app-builder/tech-stack.md +41 -0
- package/.agent/skills/app-builder/templates/SKILL.md +39 -0
- package/.agent/skills/app-builder/templates/astro-static/TEMPLATE.md +76 -0
- package/.agent/skills/app-builder/templates/chrome-extension/TEMPLATE.md +92 -0
- package/.agent/skills/app-builder/templates/cli-tool/TEMPLATE.md +88 -0
- package/.agent/skills/app-builder/templates/electron-desktop/TEMPLATE.md +88 -0
- package/.agent/skills/app-builder/templates/express-api/TEMPLATE.md +83 -0
- package/.agent/skills/app-builder/templates/flutter-app/TEMPLATE.md +90 -0
- package/.agent/skills/app-builder/templates/monorepo-turborepo/TEMPLATE.md +90 -0
- package/.agent/skills/app-builder/templates/nextjs-fullstack/TEMPLATE.md +122 -0
- package/.agent/skills/app-builder/templates/nextjs-saas/TEMPLATE.md +122 -0
- package/.agent/skills/app-builder/templates/nextjs-static/TEMPLATE.md +169 -0
- package/.agent/skills/app-builder/templates/nuxt-app/TEMPLATE.md +134 -0
- package/.agent/skills/app-builder/templates/python-fastapi/TEMPLATE.md +83 -0
- package/.agent/skills/app-builder/templates/react-native-app/TEMPLATE.md +119 -0
- package/.agent/skills/backend-developer/SKILL.md +763 -0
- package/.agent/skills/backend-developer/references/general-patterns.md +65 -0
- package/.agent/skills/backend-developer/references/go-echo.md +68 -0
- package/.agent/skills/backend-developer/references/go-gin.md +76 -0
- package/.agent/skills/backend-developer/references/java-springboot.md +83 -0
- package/.agent/skills/backend-developer/references/node-express.md +64 -0
- package/.agent/skills/backend-developer/references/node-nestjs.md +69 -0
- package/.agent/skills/backend-developer/references/python-django.md +67 -0
- package/.agent/skills/backend-developer/references/python-fastapi.md +80 -0
- package/.agent/skills/blockchain-engineer/SKILL.md +975 -0
- package/.agent/skills/blockchain-engineer/references/deployment.md +28 -0
- package/.agent/skills/blockchain-engineer/references/evm.md +14 -0
- package/.agent/skills/blockchain-engineer/references/mechanisms.md +32 -0
- package/.agent/skills/blockchain-engineer/references/solidity.md +32 -0
- package/.agent/skills/business-analysis/SKILL.md +85 -0
- package/.agent/skills/business-analysis/references/best-practices/diagrams.md +141 -0
- package/.agent/skills/business-analysis/references/domains/ai-agent.md +94 -0
- package/.agent/skills/business-analysis/references/domains/blockchain-dapp.md +86 -0
- package/.agent/skills/business-analysis/references/domains/ecommerce.md +77 -0
- package/.agent/skills/business-analysis/references/domains/education.md +42 -0
- package/.agent/skills/business-analysis/references/domains/fintech.md +44 -0
- package/.agent/skills/business-analysis/references/domains/fnb.md +82 -0
- package/.agent/skills/business-analysis/references/domains/healthtech.md +44 -0
- package/.agent/skills/business-analysis/references/domains/internal-tools.md +38 -0
- package/.agent/skills/business-analysis/references/domains/marketplace.md +52 -0
- package/.agent/skills/business-analysis/references/domains/saas.md +36 -0
- package/.agent/skills/business-analysis/references/workflows/collaboration.md +41 -0
- package/.agent/skills/business-analysis/scripts/verify_mermaid.py +86 -0
- package/.agent/skills/business-analysis/templates/brd.md +46 -0
- package/.agent/skills/business-analysis/templates/change-request.md +41 -0
- package/.agent/skills/business-analysis/templates/prd-functional.md +38 -0
- package/.agent/skills/business-analysis/templates/use-case.md +40 -0
- package/.agent/skills/business-analysis/templates/user-story-detailed.md +36 -0
- package/.agent/skills/code-review/SKILL.md +113 -0
- package/.agent/skills/code-review/references/code-review-reception.md +209 -0
- package/.agent/skills/code-review/references/differential_review.md +59 -0
- package/.agent/skills/code-review/references/requesting-code-review.md +105 -0
- package/.agent/skills/code-review/references/spec_compliance.md +43 -0
- package/.agent/skills/code-review/references/verification-before-completion.md +139 -0
- package/.agent/skills/context-engineering/SKILL.md +68 -0
- package/.agent/skills/context-engineering/references/context-compression.md +84 -0
- package/.agent/skills/context-engineering/references/context-degradation.md +93 -0
- package/.agent/skills/context-engineering/references/context-fundamentals.md +75 -0
- package/.agent/skills/context-engineering/references/context-optimization.md +82 -0
- package/.agent/skills/context-engineering/references/evaluation.md +89 -0
- package/.agent/skills/context-engineering/references/memory-systems.md +88 -0
- package/.agent/skills/context-engineering/references/multi-agent-patterns.md +90 -0
- package/.agent/skills/context-engineering/references/project-development.md +97 -0
- package/.agent/skills/context-engineering/references/tool-design.md +86 -0
- package/.agent/skills/debugging/SKILL.md +60 -0
- package/.agent/skills/debugging/references/defense-in-depth.md +130 -0
- package/.agent/skills/debugging/references/root-cause-tracing.md +177 -0
- package/.agent/skills/debugging/references/systematic-debugging.md +295 -0
- package/.agent/skills/debugging/references/verification-before-completion.md +142 -0
- package/.agent/skills/designer/SKILL.md +159 -0
- package/.agent/skills/designer/concepts/apple-glass.md +48 -0
- package/.agent/skills/designer/concepts/aurora-gradients.md +26 -0
- package/.agent/skills/designer/concepts/bento-grids.md +14 -0
- package/.agent/skills/designer/concepts/claymorphism.md +27 -0
- package/.agent/skills/designer/concepts/neo-brutalism.md +32 -0
- package/.agent/skills/designer/data/app-interface.csv +31 -0
- package/.agent/skills/designer/data/charts.csv +26 -0
- package/.agent/skills/designer/data/colors.csv +162 -0
- package/.agent/skills/designer/data/design.csv +1776 -0
- package/.agent/skills/designer/data/icons.csv +106 -0
- package/.agent/skills/designer/data/landing.csv +35 -0
- package/.agent/skills/designer/data/products.csv +162 -0
- package/.agent/skills/designer/data/react-performance.csv +45 -0
- package/.agent/skills/designer/data/styles.csv +85 -0
- package/.agent/skills/designer/data/typography.csv +74 -0
- package/.agent/skills/designer/data/ui-reasoning.csv +162 -0
- package/.agent/skills/designer/data/ux-guidelines.csv +100 -0
- package/.agent/skills/designer/references/accessibility.md +172 -0
- package/.agent/skills/designer/references/branding.md +88 -0
- package/.agent/skills/designer/references/color-theory.md +139 -0
- package/.agent/skills/designer/references/creation.md +118 -0
- package/.agent/skills/designer/references/design-systems.md +219 -0
- package/.agent/skills/designer/references/frontend_design_aesthetics.md +57 -0
- package/.agent/skills/designer/references/layout.md +200 -0
- package/.agent/skills/designer/references/motion.md +92 -0
- package/.agent/skills/designer/references/review.md +100 -0
- package/.agent/skills/designer/references/trends.md +209 -0
- package/.agent/skills/designer/references/typography.md +190 -0
- package/.agent/skills/designer/scripts/remove_background.py +135 -0
- package/.agent/skills/designer/scripts/ui-search/__pycache__/core.cpython-314.pyc +0 -0
- package/.agent/skills/designer/scripts/ui-search/__pycache__/design_system.cpython-314.pyc +0 -0
- package/.agent/skills/designer/scripts/ui-search/core.py +217 -0
- package/.agent/skills/designer/scripts/ui-search/design_system.py +1067 -0
- package/.agent/skills/designer/scripts/ui-search/search.py +114 -0
- package/.agent/skills/designer/templates/design-motion-spec.md +30 -0
- package/.agent/skills/devops-engineer/SKILL.md +90 -0
- package/.agent/skills/devops-engineer/docker-compose/README.md +47 -0
- package/.agent/skills/devops-engineer/references/ci-cd-pipelines.md +76 -0
- package/.agent/skills/devops-engineer/references/cloud-providers.md +57 -0
- package/.agent/skills/devops-engineer/references/codebase-normalization.md +104 -0
- package/.agent/skills/devops-engineer/references/container-orchestration.md +69 -0
- package/.agent/skills/devops-engineer/references/iac-tools.md +63 -0
- package/.agent/skills/devops-engineer/references/observability-security.md +45 -0
- package/.agent/skills/devops-engineer/references/vercel-supabase.md +17 -0
- package/.agent/skills/devops-engineer/templates/release-notes.md +8 -0
- package/.agent/skills/frontend-developer/SKILL.md +125 -0
- package/.agent/skills/frontend-developer/react-nextjs/README.md +90 -0
- package/.agent/skills/frontend-developer/references/angular.md +52 -0
- package/.agent/skills/frontend-developer/references/composition_patterns.md +60 -0
- package/.agent/skills/frontend-developer/references/core-performance.md +68 -0
- package/.agent/skills/frontend-developer/references/modern-signals.md +43 -0
- package/.agent/skills/frontend-developer/references/react_performance_rules.md +55 -0
- package/.agent/skills/frontend-developer/references/vue-nuxt.md +55 -0
- package/.agent/skills/frontend-developer/scripts/validate_compliance.py +65 -0
- package/.agent/skills/frontend-developer/threejs/README.md +89 -0
- package/.agent/skills/frontend-developer/threejs/animation.md +552 -0
- package/.agent/skills/frontend-developer/threejs/fundamentals.md +488 -0
- package/.agent/skills/frontend-developer/threejs/geometry.md +548 -0
- package/.agent/skills/frontend-developer/threejs/interaction.md +660 -0
- package/.agent/skills/frontend-developer/threejs/lighting.md +481 -0
- package/.agent/skills/frontend-developer/threejs/loaders.md +623 -0
- package/.agent/skills/frontend-developer/threejs/materials.md +520 -0
- package/.agent/skills/frontend-developer/threejs/postprocessing.md +602 -0
- package/.agent/skills/frontend-developer/threejs/router.json +181 -0
- package/.agent/skills/frontend-developer/threejs/shaders.md +642 -0
- package/.agent/skills/frontend-developer/threejs/textures.md +628 -0
- package/.agent/skills/game-development/2d-games/SKILL.md +119 -0
- package/.agent/skills/game-development/3d-games/SKILL.md +135 -0
- package/.agent/skills/game-development/SKILL.md +167 -0
- package/.agent/skills/game-development/game-art/SKILL.md +185 -0
- package/.agent/skills/game-development/game-audio/SKILL.md +190 -0
- package/.agent/skills/game-development/game-design/SKILL.md +129 -0
- package/.agent/skills/game-development/mobile-games/SKILL.md +108 -0
- package/.agent/skills/game-development/multiplayer/SKILL.md +132 -0
- package/.agent/skills/game-development/pc-games/SKILL.md +144 -0
- package/.agent/skills/game-development/vr-ar/SKILL.md +123 -0
- package/.agent/skills/game-development/web-games/SKILL.md +150 -0
- package/.agent/skills/lead-architect/SKILL.md +85 -0
- package/.agent/skills/lead-architect/references/application-architecture.md +70 -0
- package/.agent/skills/lead-architect/references/infrastructure.md +51 -0
- package/.agent/skills/lead-architect/references/process.md +42 -0
- package/.agent/skills/lead-architect/references/system-architecture.md +62 -0
- package/.agent/skills/lead-architect/references/web-fullstack.md +82 -0
- package/.agent/skills/lead-architect/templates/adr.md +62 -0
- package/.agent/skills/lead-architect/templates/rfc.md +46 -0
- package/.agent/skills/lead-architect/templates/sdd.md +62 -0
- package/.agent/skills/lead-architect/templates/technical-spec.md +61 -0
- package/.agent/skills/marketer/SKILL.md +66 -0
- package/.agent/skills/marketer/remotion-best-practices/SKILL.md +58 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/3d.md +86 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/animations.md +29 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/assets/charts-bar-chart.tsx +173 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/assets/text-animations-typewriter.tsx +100 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/assets/text-animations-word-highlight.tsx +108 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/assets.md +78 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/audio.md +172 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/calculate-metadata.md +104 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/can-decode.md +75 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/charts.md +58 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/compositions.md +146 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/display-captions.md +126 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/extract-frames.md +229 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/fonts.md +152 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/get-audio-duration.md +58 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/get-video-dimensions.md +68 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/get-video-duration.md +58 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/gifs.md +138 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/images.md +130 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/import-srt-captions.md +67 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/lottie.md +68 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/measuring-dom-nodes.md +35 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/measuring-text.md +143 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/sequencing.md +106 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/tailwind.md +11 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/text-animations.md +20 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/timing.md +179 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/transcribe-captions.md +19 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/transitions.md +122 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/trimming.md +53 -0
- package/.agent/skills/marketer/remotion-best-practices/rules/videos.md +171 -0
- package/.agent/skills/mcp-builder/SKILL.md +76 -0
- package/.agent/skills/mcp-builder/references/evaluation.md +602 -0
- package/.agent/skills/mcp-builder/references/mcp_best_practices.md +249 -0
- package/.agent/skills/mcp-builder/references/node_mcp_server.md +970 -0
- package/.agent/skills/mcp-builder/references/python_mcp_server.md +719 -0
- package/.agent/skills/mobile-developer/SKILL.md +83 -0
- package/.agent/skills/mobile-developer/api-routes/SKILL.md +389 -0
- package/.agent/skills/mobile-developer/building-ui/SKILL.md +335 -0
- package/.agent/skills/mobile-developer/building-ui/references/animations.md +220 -0
- package/.agent/skills/mobile-developer/building-ui/references/controls.md +270 -0
- package/.agent/skills/mobile-developer/building-ui/references/form-sheet.md +227 -0
- package/.agent/skills/mobile-developer/building-ui/references/gradients.md +106 -0
- package/.agent/skills/mobile-developer/building-ui/references/icons.md +213 -0
- package/.agent/skills/mobile-developer/building-ui/references/media.md +198 -0
- package/.agent/skills/mobile-developer/building-ui/references/route-structure.md +229 -0
- package/.agent/skills/mobile-developer/building-ui/references/search.md +248 -0
- package/.agent/skills/mobile-developer/building-ui/references/storage.md +121 -0
- package/.agent/skills/mobile-developer/building-ui/references/tabs.md +368 -0
- package/.agent/skills/mobile-developer/building-ui/references/visual-effects.md +197 -0
- package/.agent/skills/mobile-developer/building-ui/references/webgpu-three.md +605 -0
- package/.agent/skills/mobile-developer/cicd-workflows/SKILL.md +107 -0
- package/.agent/skills/mobile-developer/cicd-workflows/scripts/fetch.js +109 -0
- package/.agent/skills/mobile-developer/cicd-workflows/scripts/package.json +11 -0
- package/.agent/skills/mobile-developer/cicd-workflows/scripts/validate.js +84 -0
- package/.agent/skills/mobile-developer/data-fetching/SKILL.md +508 -0
- package/.agent/skills/mobile-developer/deployment/SKILL.md +207 -0
- package/.agent/skills/mobile-developer/deployment/references/app-store-metadata.md +479 -0
- package/.agent/skills/mobile-developer/deployment/references/ios-app-store.md +355 -0
- package/.agent/skills/mobile-developer/deployment/references/play-store.md +246 -0
- package/.agent/skills/mobile-developer/deployment/references/testflight.md +58 -0
- package/.agent/skills/mobile-developer/deployment/references/workflows.md +200 -0
- package/.agent/skills/mobile-developer/dev-client/SKILL.md +181 -0
- package/.agent/skills/mobile-developer/tailwind-setup/SKILL.md +501 -0
- package/.agent/skills/mobile-developer/upgrading-expo/SKILL.md +116 -0
- package/.agent/skills/mobile-developer/upgrading-expo/references/new-architecture.md +79 -0
- package/.agent/skills/mobile-developer/upgrading-expo/references/react-19.md +79 -0
- package/.agent/skills/mobile-developer/upgrading-expo/references/react-compiler.md +59 -0
- package/.agent/skills/mobile-developer/use-dom/SKILL.md +434 -0
- package/.agent/skills/modern-python/SKILL.md +122 -0
- package/.agent/skills/project-manager/SKILL.md +110 -0
- package/.agent/skills/project-manager/references/ba-collaboration.md +62 -0
- package/.agent/skills/project-manager/references/discovery_process.md +52 -0
- package/.agent/skills/project-manager/references/jobs_to_be_done.md +51 -0
- package/.agent/skills/project-manager/references/prd_development.md +52 -0
- package/.agent/skills/project-manager/references/rules-guide.md +55 -0
- package/.agent/skills/project-manager/references/skill-creation.md +98 -0
- package/.agent/skills/project-manager/references/strategic-frameworks.md +62 -0
- package/.agent/skills/project-manager/references/task-decomposition.md +194 -0
- package/.agent/skills/project-manager/references/workflows-guide.md +44 -0
- package/.agent/skills/project-manager/router.json +160 -0
- package/.agent/skills/project-manager/scripts/compare_skill.py +177 -0
- package/.agent/skills/project-manager/scripts/encoding_utils.py +36 -0
- package/.agent/skills/project-manager/scripts/init_skill.py +190 -0
- package/.agent/skills/project-manager/scripts/quick_validate.py +123 -0
- package/.agent/skills/project-manager/templates/pm-strategy-one-pager.md +6 -0
- package/.agent/skills/project-manager/templates/prd-strategic.md +38 -0
- package/.agent/skills/project-manager/templates/skill-questionnaire.md +118 -0
- package/.agent/skills/project-manager/templates/user-story-simple.md +14 -0
- package/.agent/skills/prompt-engineer/SKILL.md +319 -0
- package/.agent/skills/prompt-engineer/skill-creator/README.md +47 -0
- package/.agent/skills/qa-tester/SKILL.md +142 -0
- package/.agent/skills/qa-tester/assets/README.md +8 -0
- package/.agent/skills/qa-tester/references/accessibility_testing.md +35 -0
- package/.agent/skills/qa-tester/references/agent_browser.md +38 -0
- package/.agent/skills/qa-tester/references/automation/api_testing.md +23 -0
- package/.agent/skills/qa-tester/references/automation/best_practices.md +14 -0
- package/.agent/skills/qa-tester/references/automation/jest_vitest.md +26 -0
- package/.agent/skills/qa-tester/references/automation/playwright.md +30 -0
- package/.agent/skills/qa-tester/references/e2e_testing.md +46 -0
- package/.agent/skills/qa-tester/references/integration_testing.md +39 -0
- package/.agent/skills/qa-tester/references/performance_testing.md +44 -0
- package/.agent/skills/qa-tester/references/property_based_testing.md +44 -0
- package/.agent/skills/qa-tester/references/security_audit.md +53 -0
- package/.agent/skills/qa-tester/references/security_testing.md +30 -0
- package/.agent/skills/qa-tester/references/sharp_edges.md +49 -0
- package/.agent/skills/qa-tester/references/static_analysis.md +52 -0
- package/.agent/skills/qa-tester/references/supply_chain_audit.md +54 -0
- package/.agent/skills/qa-tester/references/test_case_standards.md +96 -0
- package/.agent/skills/qa-tester/references/test_report_template.md +32 -0
- package/.agent/skills/qa-tester/references/unit_testing.md +50 -0
- package/.agent/skills/qa-tester/references/visual_testing.md +32 -0
- package/.agent/skills/qa-tester/templates/uat-plan.md +34 -0
- package/.agent/skills/research-first/SKILL.md +118 -0
- package/.agent/skills-manifest.json +264 -0
- package/.agent/workflows/absorb.md +176 -0
- package/.agent/workflows/bootstrap.md +91 -0
- package/.agent/workflows/brainstorm.md +168 -0
- package/.agent/workflows/break-tasks.md +77 -0
- package/.agent/workflows/commit.md +349 -0
- package/.agent/workflows/custom-behavior.md +64 -0
- package/.agent/workflows/debug.md +65 -0
- package/.agent/workflows/development.md +49 -0
- package/.agent/workflows/documentation.md +221 -0
- package/.agent/workflows/gen-tests.md +53 -0
- package/.agent/workflows/guide.md +196 -0
- package/.agent/workflows/implement-feature.md +182 -0
- package/.agent/workflows/install-skill.md +193 -0
- package/.agent/workflows/qa.md +54 -0
- package/.agent/workflows/ui-ux-design.md +108 -0
- package/LICENSE +21 -0
- package/README.md +258 -0
- package/cli/index.js +345 -0
- package/cli/migrate-skills.js +113 -0
- package/cli/verify.js +291 -0
- package/package.json +49 -0
|
@@ -0,0 +1,490 @@
|
|
|
1
|
+
# LLM Fundamentals
|
|
2
|
+
|
|
3
|
+
Core concepts for working with Large Language Models.
|
|
4
|
+
|
|
5
|
+
## 1. Tokenization
|
|
6
|
+
|
|
7
|
+
### Understanding Tokens
|
|
8
|
+
|
|
9
|
+
```python
|
|
10
|
+
import tiktoken
|
|
11
|
+
|
|
12
|
+
# Different models use different tokenizers (tiktoken only ships OpenAI encodings; cl100k_base is just a rough approximation for Claude)
|
|
13
|
+
encodings = {
|
|
14
|
+
"gpt-4": tiktoken.encoding_for_model("gpt-4"),
|
|
15
|
+
"claude": tiktoken.get_encoding("cl100k_base"),
|
|
16
|
+
}
|
|
17
|
+
|
|
18
|
+
def count_tokens(text: str, model: str = "gpt-4") -> int:
|
|
19
|
+
encoding = encodings[model]
|
|
20
|
+
return len(encoding.encode(text))
|
|
21
|
+
|
|
22
|
+
def show_tokens(text: str, model: str = "gpt-4"):
|
|
23
|
+
"""Visualize how text is tokenized"""
|
|
24
|
+
encoding = encodings[model]
|
|
25
|
+
tokens = encoding.encode(text)
|
|
26
|
+
|
|
27
|
+
print(f"Text: {text}")
|
|
28
|
+
print(f"Tokens ({len(tokens)}):")
|
|
29
|
+
for token in tokens:
|
|
30
|
+
decoded = encoding.decode([token])
|
|
31
|
+
print(f" {token:6d} → '{decoded}'")
|
|
32
|
+
|
|
33
|
+
# Example
|
|
34
|
+
show_tokens("Hello, world!")
|
|
35
|
+
# 9906 → 'Hello'
|
|
36
|
+
# 11 → ','
|
|
37
|
+
# 1917 → ' world'
|
|
38
|
+
# 0 → '!'
|
|
39
|
+
```
|
|
40
|
+
|
|
41
|
+
### Token Budgeting
|
|
42
|
+
|
|
43
|
+
| Model | Context | Output | ~Words/Token |
|
|
44
|
+
|:------|:--------|:-------|:-------------|
|
|
45
|
+
| GPT-4o | 128k | 4k | 0.75 |
|
|
46
|
+
| GPT-4 | 8k-32k | 4k-8k | 0.75 |
|
|
47
|
+
| Claude 3.5 Sonnet | 200k | 4k | 0.75 |
|
|
48
|
+
| Claude 3 Opus | 200k | 4k | 0.75 |
|
|
49
|
+
| Llama 3 | 8k-128k | 8k | 0.75 |
|
|
50
|
+
|
|
51
|
+
**Rule of thumb:** 100 tokens ≈ 75 words ≈ 1 paragraph
|
|
52
|
+
|
|
53
|
+
### Managing Context Windows
|
|
54
|
+
|
|
55
|
+
```python
|
|
56
|
+
class ContextWindow:
|
|
57
|
+
def __init__(self, max_tokens: int = 8000, reserve_output: int = 2000):
|
|
58
|
+
self.max_tokens = max_tokens
|
|
59
|
+
self.reserve_output = reserve_output
|
|
60
|
+
self.available = max_tokens - reserve_output
|
|
61
|
+
self.messages = []
|
|
62
|
+
|
|
63
|
+
def add_message(self, role: str, content: str) -> bool:
|
|
64
|
+
msg_tokens = count_tokens(content)
|
|
65
|
+
current = sum(count_tokens(m["content"]) for m in self.messages)
|
|
66
|
+
|
|
67
|
+
if current + msg_tokens > self.available:
|
|
68
|
+
# Need to compress or remove
|
|
69
|
+
self._make_space(msg_tokens)
|
|
70
|
+
|
|
71
|
+
self.messages.append({"role": role, "content": content})
|
|
72
|
+
return True
|
|
73
|
+
|
|
74
|
+
def _make_space(self, needed: int):
|
|
75
|
+
"""Remove or summarize old messages"""
|
|
76
|
+
while True:
|
|
77
|
+
current = sum(count_tokens(m["content"]) for m in self.messages)
|
|
78
|
+
if current + needed <= self.available:
|
|
79
|
+
break
|
|
80
|
+
|
|
81
|
+
# Remove oldest non-system message
|
|
82
|
+
for i, msg in enumerate(self.messages):
|
|
83
|
+
if msg["role"] != "system":
|
|
84
|
+
self.messages.pop(i)
|
|
85
|
+
break
|
|
86
|
+
```
|
|
87
|
+
|
|
88
|
+
## 2. API Integration
|
|
89
|
+
|
|
90
|
+
### OpenAI
|
|
91
|
+
|
|
92
|
+
```python
|
|
93
|
+
from openai import OpenAI
|
|
94
|
+
import os
|
|
95
|
+
|
|
96
|
+
client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
|
|
97
|
+
|
|
98
|
+
# Basic completion
|
|
99
|
+
response = client.chat.completions.create(
|
|
100
|
+
model="gpt-4",
|
|
101
|
+
messages=[
|
|
102
|
+
{"role": "system", "content": "You are a helpful assistant."},
|
|
103
|
+
{"role": "user", "content": "Hello!"}
|
|
104
|
+
],
|
|
105
|
+
temperature=0.7,
|
|
106
|
+
max_tokens=500
|
|
107
|
+
)
|
|
108
|
+
|
|
109
|
+
print(response.choices[0].message.content)
|
|
110
|
+
|
|
111
|
+
# Streaming
|
|
112
|
+
stream = client.chat.completions.create(
|
|
113
|
+
model="gpt-4",
|
|
114
|
+
messages=[{"role": "user", "content": "Tell me a story"}],
|
|
115
|
+
stream=True
|
|
116
|
+
)
|
|
117
|
+
|
|
118
|
+
for chunk in stream:
|
|
119
|
+
if chunk.choices[0].delta.content:
|
|
120
|
+
print(chunk.choices[0].delta.content, end="")
|
|
121
|
+
```
|
|
122
|
+
|
|
123
|
+
### Anthropic
|
|
124
|
+
|
|
125
|
+
```python
|
|
126
|
+
from anthropic import Anthropic
|
|
127
|
+
|
|
128
|
+
client = Anthropic(api_key=os.getenv("ANTHROPIC_API_KEY"))
|
|
129
|
+
|
|
130
|
+
response = client.messages.create(
|
|
131
|
+
model="claude-3-sonnet-20240229",
|
|
132
|
+
max_tokens=1000,
|
|
133
|
+
messages=[{
|
|
134
|
+
"role": "user",
|
|
135
|
+
"content": "Hello!"
|
|
136
|
+
}]
|
|
137
|
+
)
|
|
138
|
+
|
|
139
|
+
print(response.content[0].text)
|
|
140
|
+
```
|
|
141
|
+
|
|
142
|
+
### Unified Interface
|
|
143
|
+
|
|
144
|
+
```python
|
|
145
|
+
class LLMProvider:
|
|
146
|
+
def __init__(self, provider: str, model: str):
|
|
147
|
+
self.provider = provider
|
|
148
|
+
self.model = model
|
|
149
|
+
|
|
150
|
+
if provider == "openai":
|
|
151
|
+
self.client = OpenAI()
|
|
152
|
+
elif provider == "anthropic":
|
|
153
|
+
self.client = Anthropic()
|
|
154
|
+
|
|
155
|
+
def complete(self, messages: list, **kwargs) -> str:
|
|
156
|
+
if self.provider == "openai":
|
|
157
|
+
response = self.client.chat.completions.create(
|
|
158
|
+
model=self.model,
|
|
159
|
+
messages=messages,
|
|
160
|
+
**kwargs
|
|
161
|
+
)
|
|
162
|
+
return response.choices[0].message.content
|
|
163
|
+
|
|
164
|
+
elif self.provider == "anthropic":
|
|
165
|
+
response = self.client.messages.create(
|
|
166
|
+
model=self.model,
|
|
167
|
+
messages=messages,
|
|
168
|
+
max_tokens=kwargs.get("max_tokens", 1000)
|
|
169
|
+
)
|
|
170
|
+
return response.content[0].text
|
|
171
|
+
```
|
|
172
|
+
|
|
173
|
+
## 3. Generation Parameters
|
|
174
|
+
|
|
175
|
+
### Temperature
|
|
176
|
+
|
|
177
|
+
Controls randomness/creativity:
|
|
178
|
+
|
|
179
|
+
- **0.0-0.3**: Near-deterministic (0.0 is effectively greedy decoding), good for extraction, classification
|
|
180
|
+
- **0.4-0.7**: Balanced, good for general conversation
|
|
181
|
+
- **0.8-1.2**: Creative, good for brainstorming, writing
|
|
182
|
+
|
|
183
|
+
```python
|
|
184
|
+
# Classification: low temperature
|
|
185
|
+
result = llm.classify(text, labels, temperature=0.1)
|
|
186
|
+
|
|
187
|
+
# Creative writing: higher temperature
|
|
188
|
+
story = llm.generate(prompt, temperature=0.9)
|
|
189
|
+
```
|
|
190
|
+
|
|
191
|
+
### Top-p (Nucleus Sampling)
|
|
192
|
+
|
|
193
|
+
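Alternative to temperature. Only sample from the smallest set of most-likely tokens whose cumulative probability reaches `p` (e.g. `top_p=0.9` keeps the top 90% of the probability mass). Adjust either temperature or top-p, not both at once.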
|
|
194
|
+
|
|
195
|
+
```python
|
|
196
|
+
# Only consider tokens in top 90% probability mass
|
|
197
|
+
response = llm.complete(prompt, top_p=0.9)
|
|
198
|
+
```
|
|
199
|
+
|
|
200
|
+
### Max Tokens
|
|
201
|
+
|
|
202
|
+
Always set appropriate limits to control cost:
|
|
203
|
+
|
|
204
|
+
```python
|
|
205
|
+
# Quick answer
|
|
206
|
+
short = llm.complete(prompt, max_tokens=100)
|
|
207
|
+
|
|
208
|
+
# Detailed response
|
|
209
|
+
long = llm.complete(prompt, max_tokens=2000)
|
|
210
|
+
```
|
|
211
|
+
|
|
212
|
+
### Frequency/Presence Penalty
|
|
213
|
+
|
|
214
|
+
Reduce repetition:
|
|
215
|
+
|
|
216
|
+
```python
|
|
217
|
+
response = llm.complete(
|
|
218
|
+
prompt,
|
|
219
|
+
frequency_penalty=0.5, # Reduce repetition of same tokens
|
|
220
|
+
presence_penalty=0.5 # Encourage new topics
|
|
221
|
+
)
|
|
222
|
+
```
|
|
223
|
+
|
|
224
|
+
## 4. Structured Output
|
|
225
|
+
|
|
226
|
+
### JSON Mode
|
|
227
|
+
|
|
228
|
+
```python
|
|
229
|
+
# OpenAI JSON mode
|
|
230
|
+
response = client.chat.completions.create(
|
|
231
|
+
model="gpt-4",
|
|
232
|
+
messages=[{
|
|
233
|
+
"role": "user",
|
|
234
|
+
"content": f"Extract entities from: {text}"
|
|
235
|
+
}],
|
|
236
|
+
response_format={"type": "json_object"}
|
|
237
|
+
)
|
|
238
|
+
|
|
239
|
+
entities = json.loads(response.choices[0].message.content)
|
|
240
|
+
```
|
|
241
|
+
|
|
242
|
+
### Function Calling
|
|
243
|
+
|
|
244
|
+
```python
|
|
245
|
+
functions = [
|
|
246
|
+
{
|
|
247
|
+
"name": "get_weather",
|
|
248
|
+
"description": "Get current weather for a location",
|
|
249
|
+
"parameters": {
|
|
250
|
+
"type": "object",
|
|
251
|
+
"properties": {
|
|
252
|
+
"location": {
|
|
253
|
+
"type": "string",
|
|
254
|
+
"description": "City name"
|
|
255
|
+
},
|
|
256
|
+
"unit": {
|
|
257
|
+
"type": "string",
|
|
258
|
+
"enum": ["celsius", "fahrenheit"]
|
|
259
|
+
}
|
|
260
|
+
},
|
|
261
|
+
"required": ["location"]
|
|
262
|
+
}
|
|
263
|
+
}
|
|
264
|
+
]
|
|
265
|
+
|
|
266
|
+
response = client.chat.completions.create(
|
|
267
|
+
model="gpt-4",
|
|
268
|
+
messages=[{"role": "user", "content": "What's the weather in Paris?"}],
|
|
269
|
+
functions=functions,
|
|
270
|
+
function_call="auto"
|
|
271
|
+
)
|
|
272
|
+
|
|
273
|
+
# Check if function was called
|
|
274
|
+
if response.choices[0].message.function_call:
|
|
275
|
+
function_call = response.choices[0].message.function_call
|
|
276
|
+
args = json.loads(function_call.arguments)
|
|
277
|
+
result = get_weather(**args)
|
|
278
|
+
```
|
|
279
|
+
|
|
280
|
+
### Pydantic Integration
|
|
281
|
+
|
|
282
|
+
```python
|
|
283
|
+
from typing import Literal

from pydantic import BaseModel, Field


class Analysis(BaseModel):
    """Structured result the model must return for a piece of text."""

    sentiment: Literal["positive", "negative", "neutral"]
    confidence: float = Field(ge=0, le=1)
    topics: list[str] = Field(max_length=5)  # at most five topics


# Generate schema. `max_length` on a list field is Pydantic v2 syntax, and in
# v2 `.schema()` is deprecated in favour of `model_json_schema()`.
schema = Analysis.model_json_schema()

# Use in function calling
functions = [{
    "name": "analyze",
    "parameters": schema,
}]

response = client.chat.completions.create(
    model="gpt-4",
    messages=[{"role": "user", "content": text}],
    # `functions=` / `function_call=` are deprecated; pass the schema as a
    # tool and force the model to call it.
    tools=[{"type": "function", "function": spec} for spec in functions],
    tool_choice={"type": "function", "function": {"name": "analyze"}},
)

# Parse result: decode the JSON arguments and validate them against the model
# in a single step (raises pydantic.ValidationError on bad or malformed data).
result = Analysis.model_validate_json(
    response.choices[0].message.tool_calls[0].function.arguments
)
|
|
311
|
+
```
|
|
312
|
+
|
|
313
|
+
## 5. Embeddings
|
|
314
|
+
|
|
315
|
+
### Generating Embeddings
|
|
316
|
+
|
|
317
|
+
```python
|
|
318
|
+
# OpenAI
|
|
319
|
+
# Single input: `response.data` carries one item whose `.embedding` is the vector.
response = client.embeddings.create(
    input="The food was delicious!",
    model="text-embedding-3-small",
)
embedding = response.data[0].embedding

# Batch processing: pass a list of strings and collect one vector per item.
texts = ["text 1", "text 2", "text 3"]
response = client.embeddings.create(
    input=texts,
    model="text-embedding-3-small",
)
embeddings = [item.embedding for item in response.data]
|
|
332
|
+
```
|
|
333
|
+
|
|
334
|
+
### Similarity Calculation
|
|
335
|
+
|
|
336
|
+
```python
|
|
337
|
+
import numpy as np
|
|
338
|
+
|
|
339
|
+
def cosine_similarity(a: list, b: list) -> float:
    """Return the cosine similarity between two vectors.

    Args:
        a: First vector (any sequence NumPy can convert to a numeric array).
        b: Second vector, with the same length as ``a``.

    Returns:
        The cosine of the angle between ``a`` and ``b`` as a built-in
        ``float``. When either vector has zero magnitude the similarity is
        mathematically undefined; ``0.0`` is returned instead of ``nan``.

    Raises:
        ValueError: If NumPy cannot take the dot product of the two inputs
            (for example, vectors of different lengths).
    """
    a, b = np.asarray(a, dtype=float), np.asarray(b, dtype=float)
    denominator = np.linalg.norm(a) * np.linalg.norm(b)
    if denominator == 0:
        # Avoid 0/0, which would produce nan together with a RuntimeWarning.
        return 0.0
    return float(np.dot(a, b) / denominator)
|
|
343
|
+
|
|
344
|
+
def euclidean_distance(a: list, b: list) -> float:
    """Return the L2 (Euclidean) distance between two vectors.

    Args:
        a: First vector (any sequence NumPy can convert to a numeric array).
        b: Second vector, with the same shape as ``a``.

    Returns:
        The distance as a built-in ``float``.

    Raises:
        ValueError: If the two inputs do not have the same shape. Without this
            check NumPy would silently broadcast some mismatched inputs
            (e.g. length 1 against length 3) and return a meaningless value.
    """
    a, b = np.asarray(a, dtype=float), np.asarray(b, dtype=float)
    if a.shape != b.shape:
        raise ValueError(f"shape mismatch: {a.shape} vs {b.shape}")
    return float(np.linalg.norm(a - b))
|
|
347
|
+
|
|
348
|
+
# Example
|
|
349
|
+
# Embed three sentences: the first two are paraphrases, the third is unrelated.
emb1, emb2, emb3 = (
    get_embedding(sentence)
    for sentence in (
        "The cat sat on the mat",
        "A feline rested on the rug",
        "Stock markets rallied today",
    )
)

print(cosine_similarity(emb1, emb2))  # High similarity
print(cosine_similarity(emb1, emb3))  # Low similarity
|
|
355
|
+
```
|
|
356
|
+
|
|
357
|
+
### Embedding Models Comparison
|
|
358
|
+
|
|
359
|
+
| Model | Dimensions | Cost | Best For |
|
|
360
|
+
|:------|:-----------|:-----|:---------|
|
|
361
|
+
| text-embedding-3-small | 1536 | Low | General purpose, high volume |
|
|
362
|
+
| text-embedding-3-large | 3072 | Medium | High accuracy needs |
|
|
363
|
+
| text-embedding-ada-002 | 1536 | Low | Legacy compatibility |
|
|
364
|
+
| voyage-2 | 1024 | Medium | Domain-specific (code, finance) |
|
|
365
|
+
| e5-mistral | 4096 | Self-hosted | Privacy-sensitive |
|
|
366
|
+
|
|
367
|
+
## 6. Error Handling
|
|
368
|
+
|
|
369
|
+
### Common Errors
|
|
370
|
+
|
|
371
|
+
```python
|
|
372
|
+
from openai import (
    APIError,
    APITimeoutError,
    AuthenticationError,
    RateLimitError,
)


# NOTE(review): `retry` looks like tenacity's decorator, which by default
# retries on every raised exception (including AuthenticationError below);
# narrow it with the `retry=` predicate if that is not intended - confirm.
@retry(stop=stop_after_attempt(3), wait=wait_exponential(multiplier=1, min=4, max=10))
def robust_completion(prompt: str):
    """Request a chat completion, degrading gracefully on common API errors.

    Args:
        prompt: The user message to send.

    Returns:
        The completion from "gpt-4"; on a timeout, a shorter completion from
        "gpt-3.5-turbo"; on any other API error, whatever
        ``get_cached_response(prompt)`` returns.

    Raises:
        RateLimitError: Re-raised so the retry decorator can back off.
        AuthenticationError: Re-raised after logging; the API key is invalid.
    """
    try:
        return client.chat.completions.create(
            model="gpt-4",
            messages=[{"role": "user", "content": prompt}],
        )

    # The specific errors below are all subclasses of APIError, so they must
    # be handled BEFORE the generic APIError clause or they are unreachable.
    except RateLimitError:
        # Will retry with backoff
        raise

    except AuthenticationError:
        logger.critical("Invalid API key")
        raise

    # `openai.Timeout` is the HTTP timeout *configuration* class, not an
    # exception; request timeouts are raised as APITimeoutError.
    except APITimeoutError:
        # Shorten request or use faster model
        return client.chat.completions.create(
            model="gpt-3.5-turbo",
            messages=[{"role": "user", "content": prompt}],
            max_tokens=500,  # Shorter response
        )

    except APIError as e:
        logger.error(f"API error: {e}")
        # Fallback to cached response
        return get_cached_response(prompt)
|
|
407
|
+
```
|
|
408
|
+
|
|
409
|
+
## 7. Cost Optimization
|
|
410
|
+
|
|
411
|
+
### Caching
|
|
412
|
+
|
|
413
|
+
```python
|
|
414
|
+
from functools import lru_cache
|
|
415
|
+
import hashlib
|
|
416
|
+
|
|
417
|
+
def hash_prompt(prompt: str) -> str:
    """Return the hexadecimal SHA-256 digest of ``prompt`` (UTF-8 encoded)."""
    digest = hashlib.sha256()
    digest.update(prompt.encode("utf-8"))
    return digest.hexdigest()
|
|
419
|
+
|
|
420
|
+
class LLMCache:
    """In-memory cache of LLM responses keyed by ``hash_prompt(prompt)``.

    Entries live in a plain dict and are never evicted.
    """

    def __init__(self):
        # Maps prompt hash -> cached response text.
        self.cache: dict[str, str] = {}

    def get(self, prompt: str) -> str | None:
        """Return the cached response for ``prompt``, or None if absent."""
        key = hash_prompt(prompt)
        return self.cache.get(key)

    def set(self, prompt: str, response: str):
        """Store ``response`` as the cached answer for ``prompt``."""
        key = hash_prompt(prompt)
        self.cache[key] = response

    def complete_with_cache(self, prompt: str) -> str:
        """Return the cached response, calling the LLM only on a cache miss."""
        cached = self.get(prompt)
        # Compare against None rather than truthiness: an empty-string
        # response is a valid cached value and must not trigger a new call.
        if cached is not None:
            return cached

        response = llm.complete(prompt)
        self.set(prompt, response)
        return response
|
|
440
|
+
```
|
|
441
|
+
|
|
442
|
+
### Model Selection
|
|
443
|
+
|
|
444
|
+
```python
|
|
445
|
+
# Generation settings for each routing tier, keyed by tier name.
TIER_CONFIG = {
    "fast": dict(model="gpt-3.5-turbo", max_tokens=500, temperature=0.3),
    "balanced": dict(model="claude-3-sonnet", max_tokens=1000, temperature=0.5),
    "quality": dict(model="gpt-4", max_tokens=2000, temperature=0.7),
}
|
|
462
|
+
|
|
463
|
+
def route_by_complexity(query: str) -> dict:
    """Use a cheap model to classify complexity and return that tier's settings.

    Args:
        query: The user query to route.

    Returns:
        The ``TIER_CONFIG`` entry for the predicted tier. If the classifier
        returns a label that is not a known tier (after trimming whitespace
        and lower-casing), the "balanced" tier is used instead of raising
        ``KeyError``.
    """
    classification = llm.classify(
        query,
        # Derive the label set from the config so the two cannot drift apart.
        classes=list(TIER_CONFIG),
        model="gpt-3.5-turbo",
    )
    # Model-produced labels may differ in case or carry stray whitespace.
    label = str(classification).strip().lower()
    return TIER_CONFIG.get(label, TIER_CONFIG["balanced"])
|
|
471
|
+
```
|
|
472
|
+
|
|
473
|
+
## 8. Best Practices
|
|
474
|
+
|
|
475
|
+
### Do's ✅
|
|
476
|
+
- Set `max_tokens` to control costs
|
|
477
|
+
- Use streaming for better UX
|
|
478
|
+
- Implement retries with exponential backoff
|
|
479
|
+
- Cache frequent queries
|
|
480
|
+
- Monitor token usage
|
|
481
|
+
- Validate outputs
|
|
482
|
+
- Use structured output when possible
|
|
483
|
+
|
|
484
|
+
### Don'ts ❌
|
|
485
|
+
- Send PII to third-party APIs without sanitization
|
|
486
|
+
- Rely on exact output formatting (use JSON mode)
|
|
487
|
+
- Hardcode prompts (use templates)
|
|
488
|
+
- Ignore rate limits
|
|
489
|
+
- Send entire conversation history (summarize instead)
|
|
490
|
+
- Use high temperature for critical tasks
|