agent-cli 0.72.6__tar.gz → 0.73.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (364)
  1. {agent_cli-0.72.6 → agent_cli-0.73.0}/PKG-INFO +15 -5
  2. {agent_cli-0.72.6 → agent_cli-0.73.0}/README.md +12 -4
  3. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_extras.json +4 -2
  4. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/memory.txt +51 -7
  5. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/rag.txt +51 -7
  6. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/memory/proxy.py +6 -1
  7. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/rag_proxy.py +10 -5
  8. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/api.py +2 -0
  9. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/client.py +2 -1
  10. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/opts.py +8 -0
  11. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/rag/api.py +2 -1
  12. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/sync_extras.py +2 -2
  13. {agent_cli-0.72.6 → agent_cli-0.73.0}/docker/docker-compose.yml +3 -0
  14. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/memory.md +1 -0
  15. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/rag-proxy.md +1 -0
  16. {agent_cli-0.72.6 → agent_cli-0.73.0}/pyproject.toml +4 -2
  17. {agent_cli-0.72.6 → agent_cli-0.73.0}/uv.lock +4 -0
  18. {agent_cli-0.72.6 → agent_cli-0.73.0}/.claude/skills/agent-cli-dev/SKILL.md +0 -0
  19. {agent_cli-0.72.6 → agent_cli-0.73.0}/.claude/skills/agent-cli-dev/examples.md +0 -0
  20. {agent_cli-0.72.6 → agent_cli-0.73.0}/.claude-plugin/README.md +0 -0
  21. {agent_cli-0.72.6 → agent_cli-0.73.0}/.claude-plugin/marketplace.json +0 -0
  22. {agent_cli-0.72.6 → agent_cli-0.73.0}/.claude-plugin/plugin.json +0 -0
  23. {agent_cli-0.72.6 → agent_cli-0.73.0}/.claude-plugin/skills/agent-cli-dev/SKILL.md +0 -0
  24. {agent_cli-0.72.6 → agent_cli-0.73.0}/.claude-plugin/skills/agent-cli-dev/examples.md +0 -0
  25. {agent_cli-0.72.6 → agent_cli-0.73.0}/.cursorrules +0 -0
  26. {agent_cli-0.72.6 → agent_cli-0.73.0}/.dockerignore +0 -0
  27. {agent_cli-0.72.6 → agent_cli-0.73.0}/.env.example +0 -0
  28. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/logo.svg +0 -0
  29. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/release-drafter.yml +0 -0
  30. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/renovate.json +0 -0
  31. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/scripts/check_extras_sync.py +0 -0
  32. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/scripts/sync_requirements.py +0 -0
  33. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/workflows/automerge.yml +0 -0
  34. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/workflows/docker.yml +0 -0
  35. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/workflows/docs.yml +0 -0
  36. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/workflows/markdown-code-runner.yml +0 -0
  37. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/workflows/pytest.yml +0 -0
  38. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/workflows/release-drafter.yml +0 -0
  39. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/workflows/release.yml +0 -0
  40. {agent_cli-0.72.6 → agent_cli-0.73.0}/.github/workflows/toc.yaml +0 -0
  41. {agent_cli-0.72.6 → agent_cli-0.73.0}/.gitignore +0 -0
  42. {agent_cli-0.72.6 → agent_cli-0.73.0}/.jscpd.json +0 -0
  43. {agent_cli-0.72.6 → agent_cli-0.73.0}/.pre-commit-config.yaml +0 -0
  44. {agent_cli-0.72.6 → agent_cli-0.73.0}/.prompts/docs-review.md +0 -0
  45. {agent_cli-0.72.6 → agent_cli-0.73.0}/.prompts/pr-review.md +0 -0
  46. {agent_cli-0.72.6 → agent_cli-0.73.0}/CLAUDE.md +0 -0
  47. {agent_cli-0.72.6 → agent_cli-0.73.0}/LICENSE +0 -0
  48. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/__init__.py +0 -0
  49. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/__main__.py +0 -0
  50. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/.gitkeep +0 -0
  51. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/audio.txt +0 -0
  52. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/faster-whisper.txt +0 -0
  53. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/kokoro.txt +0 -0
  54. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/llm.txt +0 -0
  55. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/mlx-whisper.txt +0 -0
  56. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/piper.txt +0 -0
  57. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/server.txt +0 -0
  58. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/speed.txt +0 -0
  59. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/vad.txt +0 -0
  60. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_requirements/wyoming.txt +0 -0
  61. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/_tools.py +0 -0
  62. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/__init__.py +0 -0
  63. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/_voice_agent_common.py +0 -0
  64. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/assistant.py +0 -0
  65. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/autocorrect.py +0 -0
  66. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/chat.py +0 -0
  67. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/memory/__init__.py +0 -0
  68. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/memory/add.py +0 -0
  69. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/speak.py +0 -0
  70. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/transcribe.py +0 -0
  71. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/transcribe_daemon.py +0 -0
  72. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/agents/voice_edit.py +0 -0
  73. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/api.py +0 -0
  74. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/cli.py +0 -0
  75. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/config.py +0 -0
  76. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/config_cmd.py +0 -0
  77. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/constants.py +0 -0
  78. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/__init__.py +0 -0
  79. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/audio.py +0 -0
  80. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/audio_format.py +0 -0
  81. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/chroma.py +0 -0
  82. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/deps.py +0 -0
  83. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/openai_proxy.py +0 -0
  84. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/process.py +0 -0
  85. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/reranker.py +0 -0
  86. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/sse.py +0 -0
  87. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/transcription_logger.py +0 -0
  88. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/utils.py +0 -0
  89. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/vad.py +0 -0
  90. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/core/watch.py +0 -0
  91. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/__init__.py +0 -0
  92. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/cli.py +0 -0
  93. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/coding_agents/__init__.py +0 -0
  94. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/coding_agents/aider.py +0 -0
  95. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/coding_agents/base.py +0 -0
  96. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/coding_agents/claude.py +0 -0
  97. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/coding_agents/codex.py +0 -0
  98. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/coding_agents/continue_dev.py +0 -0
  99. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/coding_agents/copilot.py +0 -0
  100. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/coding_agents/cursor_agent.py +0 -0
  101. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/coding_agents/gemini.py +0 -0
  102. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/coding_agents/opencode.py +0 -0
  103. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/coding_agents/registry.py +0 -0
  104. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/editors/__init__.py +0 -0
  105. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/editors/base.py +0 -0
  106. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/editors/cursor.py +0 -0
  107. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/editors/emacs.py +0 -0
  108. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/editors/jetbrains.py +0 -0
  109. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/editors/nano.py +0 -0
  110. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/editors/neovim.py +0 -0
  111. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/editors/registry.py +0 -0
  112. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/editors/sublime.py +0 -0
  113. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/editors/vim.py +0 -0
  114. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/editors/vscode.py +0 -0
  115. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/editors/zed.py +0 -0
  116. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/project.py +0 -0
  117. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/registry.py +0 -0
  118. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/skill/SKILL.md +0 -0
  119. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/skill/examples.md +0 -0
  120. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/terminals/__init__.py +0 -0
  121. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/terminals/apple_terminal.py +0 -0
  122. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/terminals/base.py +0 -0
  123. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/terminals/gnome.py +0 -0
  124. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/terminals/iterm2.py +0 -0
  125. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/terminals/kitty.py +0 -0
  126. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/terminals/registry.py +0 -0
  127. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/terminals/tmux.py +0 -0
  128. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/terminals/warp.py +0 -0
  129. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/terminals/zellij.py +0 -0
  130. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/dev/worktree.py +0 -0
  131. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/docs_gen.py +0 -0
  132. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/example-config.toml +0 -0
  133. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/install/__init__.py +0 -0
  134. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/install/common.py +0 -0
  135. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/install/extras.py +0 -0
  136. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/install/hotkeys.py +0 -0
  137. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/install/services.py +0 -0
  138. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/__init__.py +0 -0
  139. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/_files.py +0 -0
  140. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/_filters.py +0 -0
  141. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/_git.py +0 -0
  142. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/_indexer.py +0 -0
  143. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/_ingest.py +0 -0
  144. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/_persistence.py +0 -0
  145. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/_prompt.py +0 -0
  146. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/_retrieval.py +0 -0
  147. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/_store.py +0 -0
  148. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/_streaming.py +0 -0
  149. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/_tasks.py +0 -0
  150. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/engine.py +0 -0
  151. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/entities.py +0 -0
  152. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/memory/models.py +0 -0
  153. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/py.typed +0 -0
  154. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/rag/__init__.py +0 -0
  155. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/rag/_indexer.py +0 -0
  156. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/rag/_indexing.py +0 -0
  157. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/rag/_prompt.py +0 -0
  158. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/rag/_retriever.py +0 -0
  159. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/rag/_store.py +0 -0
  160. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/rag/_utils.py +0 -0
  161. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/rag/client.py +0 -0
  162. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/rag/engine.py +0 -0
  163. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/rag/models.py +0 -0
  164. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/.runtime/.gitkeep +0 -0
  165. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/__init__.py +0 -0
  166. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/check_plugin_skill_sync.py +0 -0
  167. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/linux-hotkeys/README.md +0 -0
  168. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/linux-hotkeys/toggle-autocorrect.sh +0 -0
  169. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/linux-hotkeys/toggle-transcription.sh +0 -0
  170. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/linux-hotkeys/toggle-voice-edit.sh +0 -0
  171. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/macos-hotkeys/README.md +0 -0
  172. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/macos-hotkeys/skhd-config-example +0 -0
  173. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/macos-hotkeys/toggle-autocorrect.sh +0 -0
  174. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/macos-hotkeys/toggle-transcription.sh +0 -0
  175. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/macos-hotkeys/toggle-voice-edit.sh +0 -0
  176. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/nvidia-asr-server/README.md +0 -0
  177. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/nvidia-asr-server/pyproject.toml +0 -0
  178. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/nvidia-asr-server/server.py +0 -0
  179. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/nvidia-asr-server/shell.nix +0 -0
  180. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/nvidia-asr-server/uv.lock +0 -0
  181. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/run-openwakeword.sh +0 -0
  182. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/run-piper-windows.ps1 +0 -0
  183. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/run-piper.sh +0 -0
  184. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/run-whisper-linux.sh +0 -0
  185. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/run-whisper-macos.sh +0 -0
  186. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/run-whisper-windows.ps1 +0 -0
  187. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/run-whisper.sh +0 -0
  188. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/run_faster_whisper_server.py +0 -0
  189. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/setup-linux-hotkeys.sh +0 -0
  190. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/setup-linux.sh +0 -0
  191. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/setup-macos-hotkeys.sh +0 -0
  192. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/setup-macos.sh +0 -0
  193. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/setup-windows.ps1 +0 -0
  194. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/start-all-services-windows.ps1 +0 -0
  195. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/scripts/start-all-services.sh +0 -0
  196. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/__init__.py +0 -0
  197. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/cli.py +0 -0
  198. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/common.py +0 -0
  199. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/model_manager.py +0 -0
  200. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/model_registry.py +0 -0
  201. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/proxy/__init__.py +0 -0
  202. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/proxy/api.py +0 -0
  203. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/streaming.py +0 -0
  204. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/tts/__init__.py +0 -0
  205. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/tts/api.py +0 -0
  206. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/tts/backends/__init__.py +0 -0
  207. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/tts/backends/base.py +0 -0
  208. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/tts/backends/kokoro.py +0 -0
  209. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/tts/backends/piper.py +0 -0
  210. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/tts/model_manager.py +0 -0
  211. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/tts/model_registry.py +0 -0
  212. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/tts/wyoming_handler.py +0 -0
  213. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/whisper/__init__.py +0 -0
  214. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/whisper/api.py +0 -0
  215. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/whisper/backends/__init__.py +0 -0
  216. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/whisper/backends/base.py +0 -0
  217. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/whisper/backends/faster_whisper.py +0 -0
  218. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/whisper/backends/mlx.py +0 -0
  219. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/whisper/languages.py +0 -0
  220. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/whisper/model_manager.py +0 -0
  221. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/whisper/model_registry.py +0 -0
  222. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/server/whisper/wyoming_handler.py +0 -0
  223. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/services/__init__.py +0 -0
  224. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/services/_wyoming_utils.py +0 -0
  225. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/services/asr.py +0 -0
  226. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/services/llm.py +0 -0
  227. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/services/tts.py +0 -0
  228. {agent_cli-0.72.6 → agent_cli-0.73.0}/agent_cli/services/wake_word.py +0 -0
  229. {agent_cli-0.72.6 → agent_cli-0.73.0}/docker/memory-proxy.Dockerfile +0 -0
  230. {agent_cli-0.72.6 → agent_cli-0.73.0}/docker/rag-proxy.Dockerfile +0 -0
  231. {agent_cli-0.72.6 → agent_cli-0.73.0}/docker/transcribe-proxy.Dockerfile +0 -0
  232. {agent_cli-0.72.6 → agent_cli-0.73.0}/docker/tts.Dockerfile +0 -0
  233. {agent_cli-0.72.6 → agent_cli-0.73.0}/docker/whisper.Dockerfile +0 -0
  234. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/CNAME +0 -0
  235. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/architecture/index.md +0 -0
  236. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/architecture/memory.md +0 -0
  237. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/architecture/rag.md +0 -0
  238. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/assistant.md +0 -0
  239. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/autocorrect.md +0 -0
  240. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/chat.md +0 -0
  241. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/config.md +0 -0
  242. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/dev.md +0 -0
  243. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/index.md +0 -0
  244. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/install-extras.md +0 -0
  245. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/install-hotkeys.md +0 -0
  246. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/install-services.md +0 -0
  247. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/server/index.md +0 -0
  248. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/server/transcribe-proxy.md +0 -0
  249. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/server/tts.md +0 -0
  250. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/server/whisper.md +0 -0
  251. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/speak.md +0 -0
  252. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/start-services.md +0 -0
  253. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/transcribe-daemon.md +0 -0
  254. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/transcribe.md +0 -0
  255. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/commands/voice-edit.md +0 -0
  256. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/configuration.md +0 -0
  257. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/getting-started.md +0 -0
  258. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/iOS_Shortcut_Guide.md +0 -0
  259. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/index.md +0 -0
  260. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/installation/docker.md +0 -0
  261. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/installation/index.md +0 -0
  262. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/installation/linux.md +0 -0
  263. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/installation/macos.md +0 -0
  264. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/installation/nixos.md +0 -0
  265. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/installation/windows.md +0 -0
  266. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/logo-clean.svg +0 -0
  267. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/overrides/partials/integrations/analytics/custom.html +0 -0
  268. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/run_markdown_code_runner.py +0 -0
  269. {agent_cli-0.72.6 → agent_cli-0.73.0}/docs/system-integration.md +0 -0
  270. {agent_cli-0.72.6 → agent_cli-0.73.0}/example.agent-cli-config.toml +0 -0
  271. {agent_cli-0.72.6 → agent_cli-0.73.0}/justfile +0 -0
  272. {agent_cli-0.72.6 → agent_cli-0.73.0}/shell.nix +0 -0
  273. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/__init__.py +0 -0
  274. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/__init__.py +0 -0
  275. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_fix_my_text.py +0 -0
  276. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_interactive.py +0 -0
  277. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_interactive_extra.py +0 -0
  278. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_memory_add.py +0 -0
  279. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_speak.py +0 -0
  280. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_speak_e2e.py +0 -0
  281. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_transcribe.py +0 -0
  282. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_transcribe_agent.py +0 -0
  283. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_transcribe_daemon.py +0 -0
  284. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_transcribe_e2e.py +0 -0
  285. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_transcribe_recovery.py +0 -0
  286. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_tts_common.py +0 -0
  287. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_tts_common_extra.py +0 -0
  288. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_voice_agent_common.py +0 -0
  289. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_voice_edit.py +0 -0
  290. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_voice_edit_e2e.py +0 -0
  291. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/agents/test_wake_word_assistant.py +0 -0
  292. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/conftest.py +0 -0
  293. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/core/__init__.py +0 -0
  294. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/core/test_audio_format.py +0 -0
  295. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/core/test_chroma.py +0 -0
  296. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/core/test_sse.py +0 -0
  297. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/core/test_vad.py +0 -0
  298. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/core/test_watch.py +0 -0
  299. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/dev/__init__.py +0 -0
  300. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/dev/test_cli.py +0 -0
  301. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/dev/test_coding_agents.py +0 -0
  302. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/dev/test_editors.py +0 -0
  303. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/dev/test_project.py +0 -0
  304. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/dev/test_terminals.py +0 -0
  305. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/dev/test_verification.py +0 -0
  306. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/dev/test_worktree.py +0 -0
  307. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/install/__init__.py +0 -0
  308. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/install/test_extras.py +0 -0
  309. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/__init__.py +0 -0
  310. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/test_api_health.py +0 -0
  311. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/test_api_integration_liveish.py +0 -0
  312. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/test_client.py +0 -0
  313. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/test_engine.py +0 -0
  314. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/test_files.py +0 -0
  315. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/test_filters.py +0 -0
  316. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/test_git_integration.py +0 -0
  317. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/test_indexer.py +0 -0
  318. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/test_memory_integration.py +0 -0
  319. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/test_proxy_passthrough.py +0 -0
  320. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/test_store.py +0 -0
  321. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/memory/test_utils.py +0 -0
  322. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/mocks/__init__.py +0 -0
  323. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/mocks/audio.py +0 -0
  324. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/mocks/llm.py +0 -0
  325. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/mocks/wyoming.py +0 -0
  326. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/rag/__init__.py +0 -0
  327. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/rag/test_api.py +0 -0
  328. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/rag/test_engine.py +0 -0
  329. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/rag/test_history.py +0 -0
  330. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/rag/test_indexer.py +0 -0
  331. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/rag/test_indexing.py +0 -0
  332. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/rag/test_rag_client.py +0 -0
  333. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/rag/test_rag_integration_liveish.py +0 -0
  334. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/rag/test_rag_proxy_passthrough.py +0 -0
  335. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/rag/test_retriever.py +0 -0
  336. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/rag/test_store.py +0 -0
  337. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/rag/test_utils.py +0 -0
  338. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_api.py +0 -0
  339. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_api_integration.py +0 -0
  340. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_asr.py +0 -0
  341. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_asr_recovery.py +0 -0
  342. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_audio_e2e.py +0 -0
  343. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_cli.py +0 -0
  344. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_config.py +0 -0
  345. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_config_cmd.py +0 -0
  346. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_docs_gen.py +0 -0
  347. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_env_vars.py +0 -0
  348. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_json_output.py +0 -0
  349. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_llm.py +0 -0
  350. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_llm_gemini.py +0 -0
  351. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_memory_tools.py +0 -0
  352. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_mlx_backend.py +0 -0
  353. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_process_manager.py +0 -0
  354. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_requires_extras.py +0 -0
  355. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_server_streaming.py +0 -0
  356. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_server_tts.py +0 -0
  357. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_server_whisper.py +0 -0
  358. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_services.py +0 -0
  359. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_tools.py +0 -0
  360. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_tts.py +0 -0
  361. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_utils.py +0 -0
  362. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_wake_word.py +0 -0
  363. {agent_cli-0.72.6 → agent_cli-0.73.0}/tests/test_wyoming_utils.py +0 -0
  364. {agent_cli-0.72.6 → agent_cli-0.73.0}/zensical.toml +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: agent-cli
3
- Version: 0.72.6
3
+ Version: 0.73.0
4
4
  Summary: A suite of AI-powered command-line tools for text correction, audio transcription, and voice assistance.
5
5
  Project-URL: Homepage, https://github.com/basnijholt/agent-cli
6
6
  Author-email: Bas Nijholt <bas@nijho.lt>
@@ -54,6 +54,7 @@ Requires-Dist: fastapi[standard]; extra == 'memory'
54
54
  Requires-Dist: huggingface-hub>=0.20.0; extra == 'memory'
55
55
  Requires-Dist: onnxruntime>=1.17.0; extra == 'memory'
56
56
  Requires-Dist: openai>=1.0.0; extra == 'memory'
57
+ Requires-Dist: pydantic-ai-slim[google,openai]>=0.1.1; extra == 'memory'
57
58
  Requires-Dist: pyyaml>=6.0.0; extra == 'memory'
58
59
  Requires-Dist: transformers>=4.30.0; extra == 'memory'
59
60
  Requires-Dist: watchfiles>=0.21.0; extra == 'memory'
@@ -70,6 +71,7 @@ Requires-Dist: huggingface-hub>=0.20.0; extra == 'rag'
70
71
  Requires-Dist: markitdown[docx,pdf,pptx]>=0.1.3; extra == 'rag'
71
72
  Requires-Dist: onnxruntime>=1.17.0; extra == 'rag'
72
73
  Requires-Dist: openai>=1.0.0; extra == 'rag'
74
+ Requires-Dist: pydantic-ai-slim[google,openai]>=0.1.1; extra == 'rag'
73
75
  Requires-Dist: transformers>=4.30.0; extra == 'rag'
74
76
  Requires-Dist: watchfiles>=0.21.0; extra == 'rag'
75
77
  Provides-Extra: server
@@ -2064,8 +2066,12 @@ uv tool install "agent-cli[vad]" -p 3.13
2064
2066
  │ [env var: OPENAI_API_KEY] │
2065
2067
  ╰────────────────────────────────────────────────────────────────────────────────────────╯
2066
2068
  ╭─ LLM Configuration ────────────────────────────────────────────────────────────────────╮
2067
- │ --embedding-model TEXT Embedding model to use for vectorization.
2068
- [default: text-embedding-3-small]
2069
+ │ --embedding-base-url TEXT Base URL for embedding API. Falls back to
2070
+ --openai-base-url if not set. Useful when using
2071
+ │ different providers for chat vs embeddings. │
2072
+ │ [env var: EMBEDDING_BASE_URL] │
2073
+ │ --embedding-model TEXT Embedding model to use for vectorization. │
2074
+ │ [default: text-embedding-3-small] │
2069
2075
  ╰────────────────────────────────────────────────────────────────────────────────────────╯
2070
2076
  ╭─ Server Configuration ─────────────────────────────────────────────────────────────────╮
2071
2077
  │ --host TEXT Host/IP to bind API servers to. │
@@ -2227,8 +2233,12 @@ The `memory proxy` command is the core feature—a middleware server that gives
2227
2233
  │ [env var: OPENAI_API_KEY] │
2228
2234
  ╰────────────────────────────────────────────────────────────────────────────────────────╯
2229
2235
  ╭─ LLM Configuration ────────────────────────────────────────────────────────────────────╮
2230
- │ --embedding-model TEXT Embedding model to use for vectorization. │
2231
- │ [default: text-embedding-3-small] │
2236
+ │ --embedding-base-url TEXT Base URL for embedding API. Falls back to │
2237
+ │ --openai-base-url if not set. Useful when using │
2238
+ │ different providers for chat vs embeddings. │
2239
+ │ [env var: EMBEDDING_BASE_URL] │
2240
+ │ --embedding-model TEXT Embedding model to use for vectorization. │
2241
+ │ [default: text-embedding-3-small] │
2232
2242
  ╰────────────────────────────────────────────────────────────────────────────────────────╯
2233
2243
  ╭─ Server Configuration ─────────────────────────────────────────────────────────────────╮
2234
2244
  │ --host TEXT Host/IP to bind API servers to. │
@@ -1974,8 +1974,12 @@ uv tool install "agent-cli[vad]" -p 3.13
1974
1974
  │ [env var: OPENAI_API_KEY] │
1975
1975
  ╰────────────────────────────────────────────────────────────────────────────────────────╯
1976
1976
  ╭─ LLM Configuration ────────────────────────────────────────────────────────────────────╮
1977
- │ --embedding-model TEXT Embedding model to use for vectorization. │
1978
- │ [default: text-embedding-3-small] │
1977
+ │ --embedding-base-url TEXT Base URL for embedding API. Falls back to │
1978
+ │ --openai-base-url if not set. Useful when using │
1979
+ │ different providers for chat vs embeddings. │
1980
+ │ [env var: EMBEDDING_BASE_URL] │
1981
+ │ --embedding-model TEXT Embedding model to use for vectorization. │
1982
+ │ [default: text-embedding-3-small] │
1979
1983
  ╰────────────────────────────────────────────────────────────────────────────────────────╯
1980
1984
  ╭─ Server Configuration ─────────────────────────────────────────────────────────────────╮
1981
1985
  │ --host TEXT Host/IP to bind API servers to. │
@@ -2137,8 +2141,12 @@ The `memory proxy` command is the core feature—a middleware server that gives
2137
2141
  │ [env var: OPENAI_API_KEY] │
2138
2142
  ╰────────────────────────────────────────────────────────────────────────────────────────╯
2139
2143
  ╭─ LLM Configuration ────────────────────────────────────────────────────────────────────╮
2140
- │ --embedding-model TEXT Embedding model to use for vectorization. │
2141
- │ [default: text-embedding-3-small] │
2144
+ │ --embedding-base-url TEXT Base URL for embedding API. Falls back to │
2145
+ │ --openai-base-url if not set. Useful when using │
2146
+ │ different providers for chat vs embeddings. │
2147
+ │ [env var: EMBEDDING_BASE_URL] │
2148
+ │ --embedding-model TEXT Embedding model to use for vectorization. │
2149
+ │ [default: text-embedding-3-small] │
2142
2150
  ╰────────────────────────────────────────────────────────────────────────────────────────╯
2143
2151
  ╭─ Server Configuration ─────────────────────────────────────────────────────────────────╮
2144
2152
  │ --host TEXT Host/IP to bind API servers to. │
@@ -29,7 +29,8 @@
29
29
  "Long-term memory proxy",
30
30
  [
31
31
  "chromadb",
32
- "yaml"
32
+ "yaml",
33
+ "pydantic_ai"
33
34
  ]
34
35
  ],
35
36
  "mlx-whisper": [
@@ -43,7 +44,8 @@
43
44
  "rag": [
44
45
  "RAG proxy (ChromaDB, embeddings)",
45
46
  [
46
- "chromadb"
47
+ "chromadb",
48
+ "pydantic_ai"
47
49
  ]
48
50
  ],
49
51
  "server": [
@@ -6,6 +6,7 @@ annotated-types==0.7.0
6
6
  # via pydantic
7
7
  anyio==4.12.1
8
8
  # via
9
+ # google-genai
9
10
  # httpx
10
11
  # openai
11
12
  # starlette
@@ -37,16 +38,18 @@ click==8.3.1
37
38
  # typer
38
39
  # typer-slim
39
40
  # uvicorn
40
- colorama==0.4.6 ; os_name == 'nt' or sys_platform == 'win32'
41
+ colorama==0.4.6
41
42
  # via
42
43
  # build
43
44
  # click
45
+ # griffe
44
46
  # tqdm
45
47
  # uvicorn
46
48
  coloredlogs==15.0.1
47
49
  # via onnxruntime
48
50
  distro==1.9.0
49
51
  # via
52
+ # google-genai
50
53
  # openai
51
54
  # posthog
52
55
  dnspython==2.8.0
@@ -75,10 +78,18 @@ flatbuffers==25.12.19
75
78
  # via onnxruntime
76
79
  fsspec==2026.1.0
77
80
  # via huggingface-hub
81
+ genai-prices==0.0.51
82
+ # via pydantic-ai-slim
78
83
  google-auth==2.47.0
79
- # via kubernetes
84
+ # via
85
+ # google-genai
86
+ # kubernetes
87
+ google-genai==1.58.0
88
+ # via pydantic-ai-slim
80
89
  googleapis-common-protos==1.72.0
81
90
  # via opentelemetry-exporter-otlp-proto-grpc
91
+ griffe==1.15.0
92
+ # via pydantic-ai-slim
82
93
  grpcio==1.76.0
83
94
  # via
84
95
  # chromadb
@@ -99,7 +110,11 @@ httpx==0.28.1
99
110
  # chromadb
100
111
  # fastapi
101
112
  # fastapi-cloud-cli
113
+ # genai-prices
114
+ # google-genai
102
115
  # openai
116
+ # pydantic-ai-slim
117
+ # pydantic-graph
103
118
  huggingface-hub==0.36.0
104
119
  # via
105
120
  # agent-cli
@@ -127,6 +142,8 @@ jsonschema-specifications==2025.9.1
127
142
  # via jsonschema
128
143
  kubernetes==34.1.0
129
144
  # via chromadb
145
+ logfire-api==4.18.0
146
+ # via pydantic-graph
130
147
  markdown-it-py==4.0.0
131
148
  # via rich
132
149
  markupsafe==3.0.3
@@ -149,13 +166,16 @@ onnxruntime==1.20.1
149
166
  # agent-cli
150
167
  # chromadb
151
168
  openai==2.15.0
152
- # via agent-cli
169
+ # via
170
+ # agent-cli
171
+ # pydantic-ai-slim
153
172
  opentelemetry-api==1.39.1
154
173
  # via
155
174
  # chromadb
156
175
  # opentelemetry-exporter-otlp-proto-grpc
157
176
  # opentelemetry-sdk
158
177
  # opentelemetry-semantic-conventions
178
+ # pydantic-ai-slim
159
179
  opentelemetry-exporter-otlp-proto-common==1.39.1
160
180
  # via opentelemetry-exporter-otlp-proto-grpc
161
181
  opentelemetry-exporter-otlp-proto-grpc==1.39.1
@@ -203,13 +223,21 @@ pydantic==2.12.5
203
223
  # chromadb
204
224
  # fastapi
205
225
  # fastapi-cloud-cli
226
+ # genai-prices
227
+ # google-genai
206
228
  # openai
229
+ # pydantic-ai-slim
207
230
  # pydantic-extra-types
231
+ # pydantic-graph
208
232
  # pydantic-settings
233
+ pydantic-ai-slim==1.42.0
234
+ # via agent-cli
209
235
  pydantic-core==2.41.5
210
236
  # via pydantic
211
237
  pydantic-extra-types==2.11.0
212
238
  # via fastapi
239
+ pydantic-graph==1.42.0
240
+ # via pydantic-ai-slim
213
241
  pydantic-settings==2.12.0
214
242
  # via fastapi
215
243
  pygments==2.19.2
@@ -246,13 +274,18 @@ referencing==0.37.0
246
274
  # jsonschema
247
275
  # jsonschema-specifications
248
276
  regex==2026.1.15
249
- # via transformers
277
+ # via
278
+ # tiktoken
279
+ # transformers
250
280
  requests==2.32.5
251
281
  # via
282
+ # google-auth
283
+ # google-genai
252
284
  # huggingface-hub
253
285
  # kubernetes
254
286
  # posthog
255
287
  # requests-oauthlib
288
+ # tiktoken
256
289
  # transformers
257
290
  requests-oauthlib==2.0.0
258
291
  # via kubernetes
@@ -291,13 +324,19 @@ six==1.17.0
291
324
  # posthog
292
325
  # python-dateutil
293
326
  sniffio==1.3.1
294
- # via openai
327
+ # via
328
+ # google-genai
329
+ # openai
295
330
  starlette==0.50.0
296
331
  # via fastapi
297
332
  sympy==1.14.0
298
333
  # via onnxruntime
299
334
  tenacity==9.1.2
300
- # via chromadb
335
+ # via
336
+ # chromadb
337
+ # google-genai
338
+ tiktoken==0.12.0
339
+ # via pydantic-ai-slim
301
340
  tokenizers==0.22.2
302
341
  # via
303
342
  # chromadb
@@ -323,6 +362,7 @@ typing-extensions==4.15.0
323
362
  # anyio
324
363
  # chromadb
325
364
  # fastapi
365
+ # google-genai
326
366
  # grpcio
327
367
  # huggingface-hub
328
368
  # openai
@@ -342,6 +382,8 @@ typing-extensions==4.15.0
342
382
  typing-inspection==0.4.2
343
383
  # via
344
384
  # pydantic
385
+ # pydantic-ai-slim
386
+ # pydantic-graph
345
387
  # pydantic-settings
346
388
  urllib3==2.3.0
347
389
  # via
@@ -363,6 +405,8 @@ watchfiles==1.1.1
363
405
  websocket-client==1.9.0
364
406
  # via kubernetes
365
407
  websockets==15.0.1
366
- # via uvicorn
408
+ # via
409
+ # google-genai
410
+ # uvicorn
367
411
  zipp==3.23.0
368
412
  # via importlib-metadata
@@ -6,6 +6,7 @@ annotated-types==0.7.0
6
6
  # via pydantic
7
7
  anyio==4.12.1
8
8
  # via
9
+ # google-genai
9
10
  # httpx
10
11
  # openai
11
12
  # starlette
@@ -49,10 +50,11 @@ click==8.3.1
49
50
  # uvicorn
50
51
  cobble==0.1.4
51
52
  # via mammoth
52
- colorama==0.4.6 ; os_name == 'nt' or sys_platform == 'win32'
53
+ colorama==0.4.6
53
54
  # via
54
55
  # build
55
56
  # click
57
+ # griffe
56
58
  # tqdm
57
59
  # uvicorn
58
60
  coloredlogs==15.0.1
@@ -63,6 +65,7 @@ defusedxml==0.7.1
63
65
  # via markitdown
64
66
  distro==1.9.0
65
67
  # via
68
+ # google-genai
66
69
  # openai
67
70
  # posthog
68
71
  dnspython==2.8.0
@@ -91,10 +94,18 @@ flatbuffers==25.12.19
91
94
  # via onnxruntime
92
95
  fsspec==2026.1.0
93
96
  # via huggingface-hub
97
+ genai-prices==0.0.51
98
+ # via pydantic-ai-slim
94
99
  google-auth==2.47.0
95
- # via kubernetes
100
+ # via
101
+ # google-genai
102
+ # kubernetes
103
+ google-genai==1.58.0
104
+ # via pydantic-ai-slim
96
105
  googleapis-common-protos==1.72.0
97
106
  # via opentelemetry-exporter-otlp-proto-grpc
107
+ griffe==1.15.0
108
+ # via pydantic-ai-slim
98
109
  grpcio==1.76.0
99
110
  # via
100
111
  # chromadb
@@ -115,7 +126,11 @@ httpx==0.28.1
115
126
  # chromadb
116
127
  # fastapi
117
128
  # fastapi-cloud-cli
129
+ # genai-prices
130
+ # google-genai
118
131
  # openai
132
+ # pydantic-ai-slim
133
+ # pydantic-graph
119
134
  huggingface-hub==0.36.0
120
135
  # via
121
136
  # agent-cli
@@ -143,6 +158,8 @@ jsonschema-specifications==2025.9.1
143
158
  # via jsonschema
144
159
  kubernetes==34.1.0
145
160
  # via chromadb
161
+ logfire-api==4.18.0
162
+ # via pydantic-graph
146
163
  lxml==6.0.2
147
164
  # via
148
165
  # markitdown
@@ -180,13 +197,16 @@ onnxruntime==1.20.1
180
197
  # magika
181
198
  # markitdown
182
199
  openai==2.15.0
183
- # via agent-cli
200
+ # via
201
+ # agent-cli
202
+ # pydantic-ai-slim
184
203
  opentelemetry-api==1.39.1
185
204
  # via
186
205
  # chromadb
187
206
  # opentelemetry-exporter-otlp-proto-grpc
188
207
  # opentelemetry-sdk
189
208
  # opentelemetry-semantic-conventions
209
+ # pydantic-ai-slim
190
210
  opentelemetry-exporter-otlp-proto-common==1.39.1
191
211
  # via opentelemetry-exporter-otlp-proto-grpc
192
212
  opentelemetry-exporter-otlp-proto-grpc==1.39.1
@@ -240,13 +260,21 @@ pydantic==2.12.5
240
260
  # chromadb
241
261
  # fastapi
242
262
  # fastapi-cloud-cli
263
+ # genai-prices
264
+ # google-genai
243
265
  # openai
266
+ # pydantic-ai-slim
244
267
  # pydantic-extra-types
268
+ # pydantic-graph
245
269
  # pydantic-settings
270
+ pydantic-ai-slim==1.42.0
271
+ # via agent-cli
246
272
  pydantic-core==2.41.5
247
273
  # via pydantic
248
274
  pydantic-extra-types==2.11.0
249
275
  # via fastapi
276
+ pydantic-graph==1.42.0
277
+ # via pydantic-ai-slim
250
278
  pydantic-settings==2.12.0
251
279
  # via fastapi
252
280
  pygments==2.19.2
@@ -285,14 +313,19 @@ referencing==0.37.0
285
313
  # jsonschema
286
314
  # jsonschema-specifications
287
315
  regex==2026.1.15
288
- # via transformers
316
+ # via
317
+ # tiktoken
318
+ # transformers
289
319
  requests==2.32.5
290
320
  # via
321
+ # google-auth
322
+ # google-genai
291
323
  # huggingface-hub
292
324
  # kubernetes
293
325
  # markitdown
294
326
  # posthog
295
327
  # requests-oauthlib
328
+ # tiktoken
296
329
  # transformers
297
330
  requests-oauthlib==2.0.0
298
331
  # via kubernetes
@@ -332,7 +365,9 @@ six==1.17.0
332
365
  # posthog
333
366
  # python-dateutil
334
367
  sniffio==1.3.1
335
- # via openai
368
+ # via
369
+ # google-genai
370
+ # openai
336
371
  soupsieve==2.8.1
337
372
  # via beautifulsoup4
338
373
  starlette==0.50.0
@@ -340,7 +375,11 @@ starlette==0.50.0
340
375
  sympy==1.14.0
341
376
  # via onnxruntime
342
377
  tenacity==9.1.2
343
- # via chromadb
378
+ # via
379
+ # chromadb
380
+ # google-genai
381
+ tiktoken==0.12.0
382
+ # via pydantic-ai-slim
344
383
  tokenizers==0.22.2
345
384
  # via
346
385
  # chromadb
@@ -367,6 +406,7 @@ typing-extensions==4.15.0
367
406
  # beautifulsoup4
368
407
  # chromadb
369
408
  # fastapi
409
+ # google-genai
370
410
  # grpcio
371
411
  # huggingface-hub
372
412
  # openai
@@ -387,6 +427,8 @@ typing-extensions==4.15.0
387
427
  typing-inspection==0.4.2
388
428
  # via
389
429
  # pydantic
430
+ # pydantic-ai-slim
431
+ # pydantic-graph
390
432
  # pydantic-settings
391
433
  urllib3==2.3.0
392
434
  # via
@@ -408,7 +450,9 @@ watchfiles==1.1.1
408
450
  websocket-client==1.9.0
409
451
  # via kubernetes
410
452
  websockets==15.0.1
411
- # via uvicorn
453
+ # via
454
+ # google-genai
455
+ # uvicorn
412
456
  xlsxwriter==3.2.9
413
457
  # via python-pptx
414
458
  zipp==3.23.0
@@ -23,6 +23,7 @@ def proxy(
23
23
  rich_help_panel="Memory Configuration",
24
24
  ),
25
25
  openai_base_url: str | None = opts.OPENAI_BASE_URL,
26
+ embedding_base_url: str | None = opts.EMBEDDING_BASE_URL,
26
27
  embedding_model: str = opts.EMBEDDING_MODEL,
27
28
  openai_api_key: str | None = opts.OPENAI_API_KEY,
28
29
  default_top_k: int = typer.Option(
@@ -135,12 +136,15 @@ def proxy(
135
136
  entries_dir, _ = ensure_store_dirs(memory_path)
136
137
  if openai_base_url is None:
137
138
  openai_base_url = constants.DEFAULT_OPENAI_BASE_URL
139
+ effective_embedding_url = embedding_base_url or openai_base_url
138
140
 
139
141
  console.print(f"[bold green]Starting Memory Proxy on {host}:{port}[/bold green]")
140
142
  console.print(f" 💾 Memory store: [blue]{memory_path}[/blue]")
141
143
  console.print(f" 📁 Entries: [blue]{entries_dir}[/blue]")
142
144
  console.print(f" 🤖 Backend: [blue]{openai_base_url}[/blue]")
143
- console.print(f" 🧠 Embeddings: Using [blue]{embedding_model}[/blue]")
145
+ console.print(
146
+ f" 🧠 Embeddings: [blue]{embedding_model}[/blue] via [blue]{effective_embedding_url}[/blue]",
147
+ )
144
148
  console.print(f" 🔍 Memory top_k: [blue]{default_top_k}[/blue] entries per query")
145
149
  console.print(f" 🧹 Max entries per conversation: [blue]{max_entries}[/blue]")
146
150
  console.print(
@@ -154,6 +158,7 @@ def proxy(
154
158
  fastapi_app = create_app(
155
159
  memory_path,
156
160
  openai_base_url,
161
+ embedding_base_url=effective_embedding_url,
157
162
  embedding_model=embedding_model,
158
163
  embedding_api_key=openai_api_key,
159
164
  chat_api_key=openai_api_key,
@@ -32,6 +32,7 @@ def rag_proxy(
32
32
  rich_help_panel="RAG Configuration",
33
33
  ),
34
34
  openai_base_url: str | None = opts.OPENAI_BASE_URL,
35
+ embedding_base_url: str | None = opts.EMBEDDING_BASE_URL,
35
36
  embedding_model: str = opts.EMBEDDING_MODEL,
36
37
  openai_api_key: str | None = opts.OPENAI_API_KEY,
37
38
  limit: int = typer.Option(
@@ -138,22 +139,26 @@ def rag_proxy(
138
139
 
139
140
  if openai_base_url is None:
140
141
  openai_base_url = constants.DEFAULT_OPENAI_BASE_URL
142
+ effective_embedding_url = embedding_base_url or openai_base_url
141
143
 
142
144
  console.print(f"[bold green]Starting RAG Proxy on {host}:{port}[/bold green]")
143
145
  console.print(f" 📂 Docs: [blue]{docs_folder}[/blue]")
144
146
  console.print(f" 💾 DB: [blue]{chroma_path}[/blue]")
145
147
  console.print(f" 🤖 Backend: [blue]{openai_base_url}[/blue]")
146
- console.print(f" 🧠 Embeddings: Using [blue]{embedding_model}[/blue]")
148
+ console.print(
149
+ f" 🧠 Embeddings: [blue]{embedding_model}[/blue] via [blue]{effective_embedding_url}[/blue]",
150
+ )
147
151
  console.print(f" 🔍 Limit: [blue]{limit}[/blue] chunks per query")
148
152
 
149
153
  fastapi_app = create_app(
150
154
  docs_folder,
151
155
  chroma_path,
152
156
  openai_base_url,
153
- embedding_model,
154
- openai_api_key,
155
- openai_api_key,
156
- limit,
157
+ embedding_base_url=effective_embedding_url,
158
+ embedding_model=embedding_model,
159
+ embedding_api_key=openai_api_key,
160
+ chat_api_key=openai_api_key,
161
+ limit=limit,
157
162
  enable_rag_tools=enable_rag_tools,
158
163
  )
159
164
 
@@ -22,6 +22,7 @@ LOGGER = logging.getLogger(__name__)
22
22
  def create_app(
23
23
  memory_path: Path,
24
24
  openai_base_url: str,
25
+ embedding_base_url: str | None = None,
25
26
  embedding_model: str = DEFAULT_OPENAI_EMBEDDING_MODEL,
26
27
  embedding_api_key: str | None = None,
27
28
  chat_api_key: str | None = None,
@@ -39,6 +40,7 @@ def create_app(
39
40
  client = MemoryClient(
40
41
  memory_path=memory_path,
41
42
  openai_base_url=openai_base_url,
43
+ embedding_base_url=embedding_base_url,
42
44
  embedding_model=embedding_model,
43
45
  embedding_api_key=embedding_api_key,
44
46
  chat_api_key=chat_api_key,
@@ -41,6 +41,7 @@ class MemoryClient:
41
41
  self,
42
42
  memory_path: Path,
43
43
  openai_base_url: str,
44
+ embedding_base_url: str | None = None,
44
45
  embedding_model: str = DEFAULT_OPENAI_EMBEDDING_MODEL,
45
46
  embedding_api_key: str | None = None,
46
47
  chat_api_key: str | None = None,
@@ -74,7 +75,7 @@ class MemoryClient:
74
75
  self.collection: Collection = init_memory_collection(
75
76
  self.memory_path,
76
77
  embedding_model=embedding_model,
77
- openai_base_url=self.openai_base_url,
78
+ openai_base_url=embedding_base_url or self.openai_base_url,
78
79
  openai_api_key=embedding_api_key,
79
80
  )
80
81
 
@@ -109,6 +109,14 @@ EMBEDDING_MODEL: str = typer.Option(
109
109
  help="Embedding model to use for vectorization.",
110
110
  rich_help_panel="LLM Configuration",
111
111
  )
112
+ EMBEDDING_BASE_URL: str | None = typer.Option(
113
+ None,
114
+ "--embedding-base-url",
115
+ envvar="EMBEDDING_BASE_URL",
116
+ help="Base URL for embedding API. Falls back to `--openai-base-url` if not set. "
117
+ "Useful when using different providers for chat vs embeddings.",
118
+ rich_help_panel="LLM Configuration",
119
+ )
112
120
 
113
121
  # --- ASR (Audio) Configuration ---
114
122
  # General ASR
@@ -32,6 +32,7 @@ def create_app(
32
32
  docs_folder: Path,
33
33
  chroma_path: Path,
34
34
  openai_base_url: str,
35
+ embedding_base_url: str | None = None,
35
36
  embedding_model: str = DEFAULT_OPENAI_EMBEDDING_MODEL,
36
37
  embedding_api_key: str | None = None,
37
38
  chat_api_key: str | None = None,
@@ -47,7 +48,7 @@ def create_app(
47
48
  chroma_path,
48
49
  name="docs",
49
50
  embedding_model=embedding_model,
50
- openai_base_url=openai_base_url,
51
+ openai_base_url=embedding_base_url or openai_base_url,
51
52
  openai_api_key=embedding_api_key,
52
53
  )
53
54
 
@@ -35,8 +35,8 @@ EXTRA_METADATA: dict[str, tuple[str, list[str]]] = {
35
35
  "llm": ("LLM framework (pydantic-ai)", ["pydantic_ai"]),
36
36
  "llm-core": ("Minimal LLM support for Docker images", ["pydantic_ai"]),
37
37
  # Feature extras
38
- "rag": ("RAG proxy (ChromaDB, embeddings)", ["chromadb"]),
39
- "memory": ("Long-term memory proxy", ["chromadb", "yaml"]),
38
+ "rag": ("RAG proxy (ChromaDB, embeddings)", ["chromadb", "pydantic_ai"]),
39
+ "memory": ("Long-term memory proxy", ["chromadb", "yaml", "pydantic_ai"]),
40
40
  "vad": ("Voice Activity Detection (silero-vad)", ["silero_vad"]),
41
41
  "whisper": ("Local Whisper ASR (faster-whisper)", ["faster_whisper"]),
42
42
  "whisper-mlx": ("MLX Whisper for Apple Silicon", ["mlx_whisper"]),
@@ -46,6 +46,7 @@
46
46
  # RAG_LIMIT - Number of document chunks per query (default: 3)
47
47
  # RAG_ENABLE_TOOLS - Enable read_full_document tool (default: true)
48
48
  # EMBEDDING_MODEL - Embedding model for RAG/memory (default: text-embedding-3-small)
49
+ # EMBEDDING_BASE_URL - Separate endpoint for embeddings (falls back to OPENAI_BASE_URL)
49
50
  #
50
51
  # MEMORY_PORT - Memory proxy port (default: 8100)
51
52
  # MEMORY_TOP_K - Number of memories per query (default: 5)
@@ -262,6 +263,7 @@ services:
262
263
  - RAG_LIMIT=${RAG_LIMIT:-3}
263
264
  - RAG_ENABLE_TOOLS=${RAG_ENABLE_TOOLS:-true}
264
265
  - EMBEDDING_MODEL=${EMBEDDING_MODEL:-text-embedding-3-small}
266
+ - EMBEDDING_BASE_URL=${EMBEDDING_BASE_URL:-}
265
267
  - LOG_LEVEL=${LOG_LEVEL:-info}
266
268
  # OpenAI-compatible backend configuration
267
269
  - OPENAI_BASE_URL=${OPENAI_BASE_URL:-http://ollama:11434/v1}
@@ -295,6 +297,7 @@ services:
295
297
  - MEMORY_SUMMARIZATION=${MEMORY_SUMMARIZATION:-true}
296
298
  - MEMORY_GIT_VERSIONING=${MEMORY_GIT_VERSIONING:-true}
297
299
  - EMBEDDING_MODEL=${EMBEDDING_MODEL:-text-embedding-3-small}
300
+ - EMBEDDING_BASE_URL=${EMBEDDING_BASE_URL:-}
298
301
  - LOG_LEVEL=${LOG_LEVEL:-info}
299
302
  # OpenAI-compatible backend configuration
300
303
  - OPENAI_BASE_URL=${OPENAI_BASE_URL:-http://ollama:11434/v1}
@@ -98,6 +98,7 @@ agent-cli chat --openai-base-url http://localhost:8100/v1 --llm-provider openai
98
98
 
99
99
  | Option | Default | Description |
100
100
  |--------|---------|-------------|
101
+ | `--embedding-base-url` | - | Base URL for embedding API. Falls back to `--openai-base-url` if not set. Useful when using different providers for chat vs embeddings. |
101
102
  | `--embedding-model` | `text-embedding-3-small` | Embedding model to use for vectorization. |
102
103
 
103
104
  ### Server Configuration
@@ -78,6 +78,7 @@ agent-cli chat --openai-base-url http://localhost:8000/v1 --llm-provider openai
78
78
 
79
79
  | Option | Default | Description |
80
80
  |--------|---------|-------------|
81
+ | `--embedding-base-url` | - | Base URL for embedding API. Falls back to `--openai-base-url` if not set. Useful when using different providers for chat vs embeddings. |
81
82
  | `--embedding-model` | `text-embedding-3-small` | Embedding model to use for vectorization. |
82
83
 
83
84
  ### Server Configuration