ragxo 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
ragxo/client.py CHANGED
@@ -20,7 +20,26 @@ class Document(BaseModel):
     id: int
 
 class Ragxo:
+    """
+    A RAG (Retrieval-Augmented Generation) system that combines vector search with LLM responses.
+
+    Attributes:
+        dimension (int): Dimension of the embedding vectors
+        collection_name (str): Name of the Milvus collection
+        db_path (str): Path to the Milvus database
+        processing_fn (list): List of preprocessing functions
+        embedding_fn (Callable): Function to generate embeddings
+        system_prompt (str): System prompt for LLM
+        model (str): LLM model name
+    """
+
     def __init__(self, dimension: int) -> None:
+        """
+        Initialize the Ragxo instance.
+
+        Args:
+            dimension (int): Dimension of the embedding vectors
+        """
         self.dimension = dimension
         self.collection_name = "ragx"
         os.makedirs("ragx_artifacts", exist_ok=True)
@@ -34,28 +53,105 @@ class Ragxo:
         self.model = "gpt-4o-mini"
 
     def add_preprocess(self, fn: Callable) -> Self:
+        """
+        Add a preprocessing function to the pipeline.
+
+        Args:
+            fn (Callable): Function that takes and returns a string
+
+        Returns:
+            Self: The current instance for method chaining
+        """
         self.processing_fn.append(fn)
         return self
 
     def add_llm_response_fn(self, fn: Callable) -> Self:
+        """
+        Add a function to process LLM responses.
+
+        Args:
+            fn (Callable): Function to process LLM responses
+
+        Returns:
+            Self: The current instance for method chaining
+        """
         self.llm_response_fn = fn
         return self
 
     def add_embedding_fn(self, fn: Callable) -> Self:
+        """
+        Set the embedding function for vector generation.
+
+        Args:
+            fn (Callable): Function that converts text to embeddings
+
+        Returns:
+            Self: The current instance for method chaining
+
+        Raises:
+            ValueError: If fn is None
+        """
         if not fn:
             raise ValueError("Embedding function cannot be None")
         self.embedding_fn = fn
         return self
 
     def add_system_prompt(self, prompt: str) -> Self:
+        """
+        Set the system prompt for LLM interactions.
+
+        Args:
+            prompt (str): System prompt text
+
+        Returns:
+            Self: The current instance for method chaining
+        """
         self.system_prompt = prompt
         return self
 
-    def add_model(self, model: str) -> Self:
+    def add_model(self, model: str, limit: int = 10,
+                  temperature: float = 0.5,
+                  max_tokens: int = 1000,
+                  top_p: float = 1.0,
+                  frequency_penalty: float = 0.0,
+                  presence_penalty: float = 0.0) -> Self:
+        """
+        Configure the LLM model and its parameters.
+
+        Args:
+            model (str): Name of the LLM model
+            limit (int): Maximum number of results to return from vector search
+            temperature (float): Sampling temperature
+            max_tokens (int): Maximum tokens in response
+            top_p (float): Nucleus sampling parameter
+            frequency_penalty (float): Frequency penalty parameter
+            presence_penalty (float): Presence penalty parameter
+
+        Returns:
+            Self: The current instance for method chaining
+        """
         self.model = model
+        self.limit = limit
+        self.temperature = temperature
+        self.max_tokens = max_tokens
+        self.top_p = top_p
+        self.frequency_penalty = frequency_penalty
+        self.presence_penalty = presence_penalty
         return self
 
     def index(self, data: list[Document]) -> Self:
+        """
+        Index documents into the vector database.
+
+        Args:
+            data (list[Document]): List of documents to index
+
+        Returns:
+            Self: The current instance for method chaining
+
+        Raises:
+            ValueError: If embedding function is not set
+        """
         if not self.embedding_fn:
             raise ValueError("Embedding function not set")
 
@@ -83,6 +179,20 @@ class Ragxo:
         return self
 
     def query(self, query: str, output_fields: list[str] = ['text', 'metadata'], limit: int = 10) -> list[list[dict]]:
+        """
+        Search the vector database for similar documents.
+
+        Args:
+            query (str): Search query
+            output_fields (list[str]): Fields to return in results
+            limit (int): Maximum number of results
+
+        Returns:
+            list[list[dict]]: Search results
+
+        Raises:
+            ValueError: If embedding function is not set
+        """
         if not self.embedding_fn:
             raise ValueError("Embedding function not set. Please call add_embedding_fn first.")
 
@@ -240,17 +350,23 @@ class Ragxo:
             raise
 
     def generate_llm_response(self,
-                              query: str,
-                              limit: int = 10,
-                              data: list[dict] = None,
-                              temperature: float = 0.5,
-                              max_tokens: int = 1000,
-                              top_p: float = 1.0,
-                              frequency_penalty: float = 0.0,
-                              presence_penalty: float = 0.0,
-                              ) -> ChatCompletion:
+                              query: str,
+                              data: list[dict] = None) -> ChatCompletion:
+        """
+        Generate LLM response based on query and retrieved data.
+
+        Args:
+            query (str): User query
+            data (list[dict], optional): Retrieved documents. If None, performs a new query
+
+        Returns:
+            ChatCompletion: LLM response
+
+        Raises:
+            ValueError: If system prompt is not set
+        """
         if data is None:
-            data = self.query(query, limit=limit)[0]
+            data = self.query(query, limit=self.limit)[0]
 
         if not self.system_prompt:
             raise ValueError("System prompt not set. Please call add_system_prompt first.")
@@ -261,11 +377,11 @@ class Ragxo:
                 {"role": "system", "content": self.system_prompt},
                 {"role": "user", "content": "query: {} data: {}".format(query, data)}
             ],
-            temperature=temperature,
-            max_tokens=max_tokens,
-            top_p=top_p,
-            frequency_penalty=frequency_penalty,
-            presence_penalty=presence_penalty,
+            temperature=self.temperature,
+            max_tokens=self.max_tokens,
+            top_p=self.top_p,
+            frequency_penalty=self.frequency_penalty,
+            presence_penalty=self.presence_penalty,
         )
 
         return response
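The net effect of the client.py changes above: the retrieval limit and sampling parameters are now configured once on `add_model` and stored as instance attributes, and `generate_llm_response` reads them from the instance instead of accepting them on every call. A minimal usage sketch of the 0.1.8 call shape (the `embed` stub is a placeholder for illustration, not part of the package; any callable returning vectors of the declared dimension works):

```python
from ragxo import Ragxo

def embed(text: str) -> list[float]:
    # Placeholder embedding for illustration; a real pipeline would call an
    # embedding model here (e.g. the get_embeddings helper from the README).
    return [0.0] * 768

client = (
    Ragxo(dimension=768)
    .add_embedding_fn(embed)
    .add_system_prompt("Answer using only the provided data.")
    # New in 0.1.8: the retrieval limit and sampling parameters are stored on
    # the client here rather than passed to generate_llm_response per call.
    .add_model("gpt-4o-mini", limit=5, temperature=0.2, max_tokens=500)
)

# generate_llm_response now takes only the query (plus optional pre-retrieved
# data) and reads limit/temperature/etc. from the attributes set by add_model.
response = client.generate_llm_response("What is the capital of France?")
```

Note that, per the hunks above, `self.limit` and the sampling attributes are assigned only in `add_model`, so in this version `add_model` must be called before `generate_llm_response` even when the default model is acceptable.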
{ragxo-0.1.6.dist-info → ragxo-0.1.8.dist-info}/METADATA RENAMED
@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: ragxo
-Version: 0.1.6
+Version: 0.1.8
 Summary: A RAG (Retrieval-Augmented Generation) toolkit with Milvus integration
 Home-page: https://github.com/yourusername/ragx
 License: MIT
@@ -20,9 +20,11 @@ Classifier: Topic :: Software Development :: Libraries :: Python Modules
 Requires-Dist: boto3 (>=1.36.14,<2.0.0)
 Requires-Dist: dill (>=0.3.9,<0.4.0)
 Requires-Dist: milvus (>=2.3.9,<3.0.0)
+Requires-Dist: mocker (>=1.1.1,<2.0.0)
 Requires-Dist: openai (>=1.61.1,<2.0.0)
 Requires-Dist: pydantic (>=2.10.6,<3.0.0)
 Requires-Dist: pymilvus (>=2.5.4,<3.0.0)
+Requires-Dist: pytest-mock (>=3.14.0,<4.0.0)
 Project-URL: Repository, https://github.com/yourusername/ragx
 Description-Content-Type: text/markdown
 
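Alongside the version bump, 0.1.8 adds `pytest-mock` (and `mocker`) to the requirements, which suggests test-time stubbing of external calls. A hypothetical test sketch using pytest-mock's `mocker` fixture, in the spirit these dependencies suggest (the test is illustrative only and is not shipped with the package):

```python
from ragxo import Ragxo, Document

def test_index_and_query_with_stubbed_embeddings(mocker):
    # Stub the embedding function so the test never calls a real embedding API.
    fake_embed = mocker.Mock(return_value=[0.0] * 8)

    client = Ragxo(dimension=8)
    client.add_embedding_fn(fake_embed)
    client.index([Document(text="Paris is the capital of France",
                           metadata={"source": "test"}, id=1)])
    client.query("capital of France", limit=1)

    # At least one embedding for the indexed document and one for the query
    # (assumed call pattern).
    assert fake_embed.call_count >= 2
```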
@@ -65,7 +67,7 @@ def preprocess_text_remove_special_chars(text: str) -> str:
     return re.sub(r'[^a-zA-Z0-9\s]', '', text)
 
 def get_embeddings(text: str) -> list[float]:
-    return openai.embeddings.create(text=text, model="text-embedding-ada-002").data[0].embedding
+    return openai.embeddings.create(input=text, model="text-embedding-ada-002").data[0].embedding
 
 ragxo_client = Ragxo(dimension=768)
 
@@ -74,7 +76,14 @@ ragxo_client.add_preprocess(preprocess_text_remove_special_chars)
 ragxo_client.add_embedding_fn(get_embeddings)
 
 ragxo_client.add_system_prompt("You are a helpful assistant that can answer questions about the data provided.")
-ragxo_client.add_model("gpt-4o-mini")
+ragxo_client.add_model(
+    "gpt-4o-mini",
+    temperature=0.5,
+    max_tokens=1000,
+    top_p=1.0,
+    frequency_penalty=0.0,
+    presence_penalty=0.0
+)
 
 ragxo_client.index([
     Document(text="Capital of France is Paris", metadata={"source": "example"}, id=1),
@@ -92,16 +101,10 @@ ragxo_client.export("my_rag_v1.0.0")
 ```python
 loaded_ragxo_client = Ragxo.load("my_rag_v1.0.0")
 
-results = loaded_ragxo_client.query("What is the capital of France?")
+vector_search_results = loaded_ragxo_client.query("What is the capital of France?")
 
 llm_response = loaded_ragxo_client.generate_llm_response(
-    "What is the capital of France?",
-    limit=10,
-    temperature=0.5,
-    max_tokens=1000,
-    top_p=1.0,
-    frequency_penalty=0.0,
-    presence_penalty=0.0)
+    "What is the capital of France?")
 
 ```
 
ragxo-0.1.8.dist-info/RECORD ADDED
@@ -0,0 +1,5 @@
+ragxo/__init__.py,sha256=0VVe-z4XkkGQLQIG0hF0Hyf87_RgX0E4T9TRwwTkbmE,68
+ragxo/client.py,sha256=5AvARwpm4ux-7nWRLs4k5lDFhkgbjl6B9yNjdxcK8vo,12766
+ragxo-0.1.8.dist-info/METADATA,sha256=4uo_8ewStWVyYQYtpfktLz9i8jVfQPReeZxAxfhrWQ4,6227
+ragxo-0.1.8.dist-info/WHEEL,sha256=Nq82e9rUAnEjt98J6MlVmMCZb-t9cYE2Ir1kpBmnWfs,88
+ragxo-0.1.8.dist-info/RECORD,,
ragxo-0.1.6.dist-info/RECORD DELETED
@@ -1,5 +0,0 @@
-ragxo/__init__.py,sha256=0VVe-z4XkkGQLQIG0hF0Hyf87_RgX0E4T9TRwwTkbmE,68
-ragxo/client.py,sha256=M4777mj6oPdRIm9TvqIwXoQuJUMc7Ywczlykutd6c70,9068
-ragxo-0.1.6.dist-info/METADATA,sha256=1W4vJeY0awkXbtM0o3dyhFRHEY8VLHwkXrm55KECbg4,6141
-ragxo-0.1.6.dist-info/WHEEL,sha256=Nq82e9rUAnEjt98J6MlVmMCZb-t9cYE2Ir1kpBmnWfs,88
-ragxo-0.1.6.dist-info/RECORD,,
{ragxo-0.1.6.dist-info → ragxo-0.1.8.dist-info}/WHEEL RENAMED
File without changes