PyPI - docpilot-cli - Versions diffs - 1.0.3__tar.gz → 1.0.4__tar.gz - Mend

docpilot-cli 1.0.3.tar.gz → 1.0.4.tar.gz

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (20) hide show

{docpilot_cli-1.0.3/src/docpilot_cli.egg-info → docpilot_cli-1.0.4}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: docpilot-cli
-Version: 1.0.3
+Version: 1.0.4
 Summary: A local-first RAG pipeline CLI tool
 Requires-Python: >=3.12
 Description-Content-Type: text/markdown

{docpilot_cli-1.0.3 → docpilot_cli-1.0.4}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [project]
 name = "docpilot-cli"
-version = "1.0.3"
+version = "1.0.4"
 description = "A local-first RAG pipeline CLI tool"
 readme = "README.md"
 requires-python = ">=3.12"
@@ -22,7 +22,6 @@ dependencies = [
 [project.scripts]
 docpilot = "docpilot.cli:app"
 [tool.setuptools.packages.find]
 where = ["src"]

{docpilot_cli-1.0.3 → docpilot_cli-1.0.4}/src/docpilot/chat.py RENAMED Viewed

@@ -2,6 +2,7 @@ from langchain_ollama.llms import OllamaLLM as Ollama
 from langchain_core.prompts import ChatPromptTemplate
 from langchain_core.output_parsers import StrOutputParser
 import os
+from rich.console import Console
 from . import store
 from langchain_chroma import Chroma
 from langchain_ollama import OllamaEmbeddings
@@ -10,22 +11,21 @@ config = store.load_config()
 retrieval_k = int(config.get("retrieval_k", 6))
 max_context_chars = int(config.get("max_context_chars", 3500))
 max_doc_chars = int(config.get("max_doc_chars", 700))
+console = Console()
 model = Ollama(
     model=config.get("default_model", "deepseek-coder-v2"),
-    num_predict=int(config.get("num_predict", 192)),
+    num_predict=int(config.get("num_predict", 400)),
     num_ctx=int(config.get("num_ctx", 2048)),
     num_thread=int(config.get("num_thread", max(1, (os.cpu_count() or 4) - 1))),
     temperature=float(config.get("temperature", 0.1)),
 )
 def _get_vectorstore():
     """Get vectorstore for the active project."""
     embeddings = OllamaEmbeddings(model=config.get("default_embed_model", "mxbai-embed-large:335m"))
     db_location = store.get_active_project_path()
     return Chroma(collection_name="documents", persist_directory=str(db_location), embedding_function=embeddings)
-retriever = None
 # Query Transformation Chain
 rewrite_template = """You are an AI assistant helping to formulate a search query for a vector database.
@@ -37,7 +37,7 @@ rewrite_prompt = ChatPromptTemplate.from_template(rewrite_template)
 rewrite_chain = rewrite_prompt | model | StrOutputParser()
 template = """
-You are an assistant for answering questions based on the following ingested documents.
+You are an assistant named docpilot for answering questions based on the following ingested documents.
 Use the information in the documents to answer the question as best as you can.
 If you don't know the answer, say you don't know.
 Always use the information in the documents and never make up an answer.
@@ -77,7 +77,7 @@ def askai(question):
         max_doc_chars=max_doc_chars,
     )
     if rag_text == "":
-        print("NO RAG obtained add some documents to ingest")
+        console.print("[italic blue]Note  - NO RAG obtained add some documents to ingest[/italic blue]")
     result = chain.invoke({"reviews": rag_text, "question": question})
     return result

{docpilot_cli-1.0.3 → docpilot_cli-1.0.4}/src/docpilot/cli.py RENAMED Viewed

@@ -120,7 +120,8 @@ def show():
     info_panel = Panel(
         f"[bold]Version:[/bold]     [cyan]{PROJECT_VERSION}[/cyan]\n"
-        f"[bold]Description:[/bold] [cyan]{PROJECT_DESCRIPTION}[/cyan]",
+        f"[bold]Description:[/bold] [cyan]{PROJECT_DESCRIPTION}[/cyan]\n"
+        f"[bold italic][yellow]Developed by Aswin Ashok as an open source project[/yellow]",
         border_style="cyan",
         title="[bold green]System Info[/bold green]",
         padding=(1, 2)

{docpilot_cli-1.0.3 → docpilot_cli-1.0.4}/src/docpilot/scrape.py RENAMED Viewed

@@ -4,9 +4,14 @@ from urllib.parse import urljoin, urlparse
 from concurrent.futures import ThreadPoolExecutor, as_completed
 from collections import deque
 import time
+from importlib.metadata import version, PackageNotFoundError
+try:
+    __version__ = version("docpilot-cli")
+except PackageNotFoundError:
+    __version__ = "unknown"
-REQUEST_HEADERS = {"User-Agent": "docpilot/0.0.1 (+https://github.com/foss-hack/docpilot)"}
+REQUEST_HEADERS = {"User-Agent": f"docpilot/{__version__} (+https://pypi.org/project/docpilot-cli/)"}
 MAX_RETRIES = 4
 BACKOFF_SECONDS = 0.8

{docpilot_cli-1.0.3 → docpilot_cli-1.0.4}/src/docpilot/store.py RENAMED Viewed

@@ -1,3 +1,6 @@
+from chromadb.utils import embedding_functions
+from bs4 import element
+from rich.console import Console
 import tomllib
 import tomli_w
 from pathlib import Path
@@ -8,6 +11,7 @@ path = Path.home() / ".docpilot"
 CONFIG_PATH = path / "config.toml"
 PROJECTS_DIR = path / "projects"
+console = Console()
 def _get_available_models():
     try:
@@ -28,8 +32,8 @@ DEFAULT_CONFIG = {
     "retrieval_k": 6,
     "max_context_chars": 3500,
     "max_doc_chars": 700,
-    "num_predict": 192,
-    "num_ctx": 2048,
+    "num_predict": 500,
+    "num_ctx": 4096,
     "num_thread": max(1, (os.cpu_count() or 4) - 1),
     "temperature": 0.1,
 }
@@ -39,9 +43,6 @@ def check_ollama_connection():
     try:
         ollama.list()
     except Exception:
-        from rich.console import Console
-        console = Console()
         console.print("\n[bold red]❌ Error: Could not connect to Ollama.[/bold red]")
         console.print("[yellow]Please ensure the Ollama application is running and try again.[/yellow]\n")
         import sys
@@ -51,6 +52,9 @@ def check_ollama_connection():
 def init_config():
     """Initialize config file with defaults if it doesn't exist."""
+    if path.exists():
+        if not CONFIG_PATH.exists():
+            console.print("[bold red]Config file lost, recreating it!")
     if not CONFIG_PATH.exists():
         CONFIG_PATH.parent.mkdir(parents=True, exist_ok=True)
         PROJECTS_DIR.mkdir(parents=True, exist_ok=True)
@@ -69,7 +73,22 @@ def interactive_setup(first_time=False):
         console.print("\n[bold cyan]🚀 Welcome to Docpilot! Let's do a quick setup.[/bold cyan]")
     else:
         console.print("\n[bold cyan]⚙️  Docpilot Model Setup[/bold cyan]")
+    #Finding and handling error of embeding model
+    embedding_modelfound=0
+    embedsupportedmodel = [
+    "all-minilm",
+    "snowflake-arctic-embed",
+    "bge-m3",
+    "bge-large",
+    "paraphrase-multilingual",
+    "mxbai-embed-large",
+    "mxbai-embed-large:latest",
+    "mxbai-embed-large:335m",
+    "nomic-embed-text",
+    ]
+    embedmodelfound=[]
+    embed_model=""
     models = _get_available_models()
     if not models:
         console.print("[yellow]No local Ollama models found! Using default fallbacks.[/yellow]")
@@ -77,15 +96,56 @@ def interactive_setup(first_time=False):
         embed_model = Prompt.ask("Enter embedding model name", default="mxbai-embed-large:335m")
         chat_model = Prompt.ask("Enter chat model name", default="qwen2.5:latest")
     else:
-        # Smart defaults based on names
-        embed_guess = next((m for m in models if "embed" in m.lower()), models[0])
-        chat_guess = next((m for m in models if "embed" not in m.lower()), models[1] if len(models) > 1 else models[0])
-        embed_model = Prompt.ask(
-            "Select your [bold green]embedding model[/bold green]", choices=models, default=embed_guess
-        )
-        chat_model = Prompt.ask("Select your [bold blue]chat model[/bold blue]", choices=models, default=chat_guess)
+        for i in models:
+            for j in embedsupportedmodel:
+                if i.lower()==j.lower():
+                    embedding_modelfound=1
+                    embedmodelfound.append(j)
+                    break
+        if not embedding_modelfound:
+            console.print("[bold yellow]Embedding model not found and is not encouraged to use this way")
+            while True:
+                userquestion = Prompt.ask("[blue]Run ollama pull mxbai-embed-large to fix this(y/n).[/blue]").lower()
+                if userquestion == "y":
+                    os.system("ollama pull mxbai-embed-large")
+                    embed_model="mxbai-embed-large"
+                    break
+                elif userquestion == "n":
+                    console.print("[red]Exiting...[/red]")
+                    exit()
+                else:
+                    console.print("Enter a valid option to continue")
+        #Asking embedding model if model not latestly downloaded
+        if embed_model == "":
+            embed_model = Prompt.ask(
+              "Select your [bold green]embedding model[/bold green]", choices=embedmodelfound, default=embedmodelfound[0]
+            )
+        #Chat Model
+        chatspecific_models=list(set(models)-set(embedsupportedmodel))
+        console.print("[bold yellow]Available chat Models:[/bold yellow]")
+        for i in range(len(chatspecific_models)):
+            console.print(f"[bold green]{i}:->{chatspecific_models[i]} .[/bold green]")
+        #Smart choice for model
+        chat_model=str()
+        if not chatspecific_models:
+            chatspecific_models = models # Fallback if they only have embedding models downloaded
+        chat_guess = next((m for m in models if "embed" not in m.lower()), chatspecific_models[1] if len(chatspecific_models) > 1 else chatspecific_models[0])
+        while True:
+            chatmodelanswer = Prompt.ask("Select your [bold blue]chat model[/bold blue]", default=chat_guess)
+            if chatmodelanswer.isdigit():
+                if int(chatmodelanswer)<len(chatspecific_models):
+                    chat_model=chatspecific_models[int(chatmodelanswer)]
+                    break
+                else:
+                    console.print("[red]Invalid model number. Try again.")
+            else:
+                if check_exist(chatmodelanswer,chatspecific_models):
+                    chat_model = chatmodelanswer
+                    break
+                else:
+                    console.print("[red]Invalid Option... try again")
     config = load_config() if not first_time else DEFAULT_CONFIG.copy()
     config["default_embed_model"] = embed_model
     config["default_model"] = chat_model
@@ -93,6 +153,11 @@ def interactive_setup(first_time=False):
     console.print(f"[bold green]✓ Configuration saved to {CONFIG_PATH}[/bold green]\n")
     return load_config()
+def check_exist(name,listname):
+    for i in listname:
+        if name == i.lower():
+            return True
+    return False
 def load_config():
     if not CONFIG_PATH.exists():

{docpilot_cli-1.0.3 → docpilot_cli-1.0.4/src/docpilot_cli.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: docpilot-cli
-Version: 1.0.3
+Version: 1.0.4
 Summary: A local-first RAG pipeline CLI tool
 Requires-Python: >=3.12
 Description-Content-Type: text/markdown