ragxo 0.1.5__tar.gz → 0.1.7__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: ragxo
3
- Version: 0.1.5
3
+ Version: 0.1.7
4
4
  Summary: A RAG (Retrieval-Augmented Generation) toolkit with Milvus integration
5
5
  Home-page: https://github.com/yourusername/ragx
6
6
  License: MIT
@@ -20,13 +20,17 @@ Classifier: Topic :: Software Development :: Libraries :: Python Modules
20
20
  Requires-Dist: boto3 (>=1.36.14,<2.0.0)
21
21
  Requires-Dist: dill (>=0.3.9,<0.4.0)
22
22
  Requires-Dist: milvus (>=2.3.9,<3.0.0)
23
+ Requires-Dist: mocker (>=1.1.1,<2.0.0)
23
24
  Requires-Dist: openai (>=1.61.1,<2.0.0)
24
25
  Requires-Dist: pydantic (>=2.10.6,<3.0.0)
25
26
  Requires-Dist: pymilvus (>=2.5.4,<3.0.0)
27
+ Requires-Dist: pytest-mock (>=3.14.0,<4.0.0)
26
28
  Project-URL: Repository, https://github.com/yourusername/ragx
27
29
  Description-Content-Type: text/markdown
28
30
 
29
- # RagXO 🚀
31
+ # RagXO
32
+
33
+ Export, version and reuse your RAG pipeline everywhere 🚀
30
34
 
31
35
  [![PyPI version](https://badge.fury.io/py/ragxo.svg)](https://badge.fury.io/py/ragxo)
32
36
  [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
@@ -49,6 +53,61 @@ RagXO extends the capabilities of traditional RAG (Retrieval-Augmented Generatio
49
53
  pip install ragxo
50
54
  ```
51
55
 
56
+ ## Quickstart 🚀
57
+
58
+ ### Build a RAG pipeline
59
+
60
+ ```python
61
+ import re
+ import openai
+ from ragxo import Ragxo, Document
62
+
63
+ def preprocess_text_lower(text: str) -> str:
64
+ return text.lower()
65
+
66
+ def preprocess_text_remove_special_chars(text: str) -> str:
67
+ return re.sub(r'[^a-zA-Z0-9\s]', '', text)
68
+
69
+ def get_embeddings(text: str) -> list[float]:
70
+ return openai.embeddings.create(input=text, model="text-embedding-ada-002").data[0].embedding
71
+
72
+ ragxo_client = Ragxo(dimension=1536)  # text-embedding-ada-002 vectors are 1536-dimensional
73
+
74
+ ragxo_client.add_preprocess(preprocess_text_lower)
75
+ ragxo_client.add_preprocess(preprocess_text_remove_special_chars)
76
+ ragxo_client.add_embedding_fn(get_embeddings)
77
+
78
+ ragxo_client.add_system_prompt("You are a helpful assistant that can answer questions about the data provided.")
79
+ ragxo_client.add_model("gpt-4o-mini")
80
+
81
+ ragxo_client.index([
82
+ Document(text="Capital of France is Paris", metadata={"source": "example"}, id=1),
83
+ Document(text="Capital of Germany is Berlin", metadata={"source": "example"}, id=2),
84
+ Document(text="Capital of Italy is Rome", metadata={"source": "example"}, id=3),
85
+ ])
86
+
87
+ ragxo_client.export("my_rag_v1.0.0")
88
+
89
+ ```
90
+
91
+
92
+ ### Load a RAG pipeline
93
+
94
+ ```python
95
+ loaded_ragxo_client = Ragxo.load("my_rag_v1.0.0")
96
+
97
+ results = loaded_ragxo_client.query("What is the capital of France?")
98
+
99
+ llm_response = loaded_ragxo_client.generate_llm_response(
100
+ "What is the capital of France?",
101
+ limit=10,
102
+ temperature=0.5,
103
+ max_tokens=1000,
104
+ top_p=1.0,
105
+ frequency_penalty=0.0,
106
+ presence_penalty=0.0)
107
+
108
+ ```
109
+
110
+
52
111
  ## Usage Guide 📚
53
112
 
54
113
  ### Import
@@ -1,4 +1,6 @@
1
- # RagXO 🚀
1
+ # RagXO
2
+
3
+ Export, version and reuse your RAG pipeline everywhere 🚀
2
4
 
3
5
  [![PyPI version](https://badge.fury.io/py/ragxo.svg)](https://badge.fury.io/py/ragxo)
4
6
  [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
@@ -21,6 +23,61 @@ RagXO extends the capabilities of traditional RAG (Retrieval-Augmented Generatio
21
23
  pip install ragxo
22
24
  ```
23
25
 
26
+ ## Quickstart 🚀
27
+
28
+ ### Build a RAG pipeline
29
+
30
+ ```python
31
+ import re
+ import openai
+ from ragxo import Ragxo, Document
32
+
33
+ def preprocess_text_lower(text: str) -> str:
34
+ return text.lower()
35
+
36
+ def preprocess_text_remove_special_chars(text: str) -> str:
37
+ return re.sub(r'[^a-zA-Z0-9\s]', '', text)
38
+
39
+ def get_embeddings(text: str) -> list[float]:
40
+ return openai.embeddings.create(input=text, model="text-embedding-ada-002").data[0].embedding
41
+
42
+ ragxo_client = Ragxo(dimension=1536)  # text-embedding-ada-002 vectors are 1536-dimensional
43
+
44
+ ragxo_client.add_preprocess(preprocess_text_lower)
45
+ ragxo_client.add_preprocess(preprocess_text_remove_special_chars)
46
+ ragxo_client.add_embedding_fn(get_embeddings)
47
+
48
+ ragxo_client.add_system_prompt("You are a helpful assistant that can answer questions about the data provided.")
49
+ ragxo_client.add_model("gpt-4o-mini")
50
+
51
+ ragxo_client.index([
52
+ Document(text="Capital of France is Paris", metadata={"source": "example"}, id=1),
53
+ Document(text="Capital of Germany is Berlin", metadata={"source": "example"}, id=2),
54
+ Document(text="Capital of Italy is Rome", metadata={"source": "example"}, id=3),
55
+ ])
56
+
57
+ ragxo_client.export("my_rag_v1.0.0")
58
+
59
+ ```
60
+
61
+
62
+ ### Load a RAG pipeline
63
+
64
+ ```python
65
+ loaded_ragxo_client = Ragxo.load("my_rag_v1.0.0")
66
+
67
+ results = loaded_ragxo_client.query("What is the capital of France?")
68
+
69
+ llm_response = loaded_ragxo_client.generate_llm_response(
70
+ "What is the capital of France?",
71
+ limit=10,
72
+ temperature=0.5,
73
+ max_tokens=1000,
74
+ top_p=1.0,
75
+ frequency_penalty=0.0,
76
+ presence_penalty=0.0)
77
+
78
+ ```
79
+
80
+
24
81
  ## Usage Guide 📚
25
82
 
26
83
  ### Import
@@ -1,6 +1,6 @@
1
1
  [tool.poetry]
2
2
  name = "ragxo"
3
- version = "0.1.5"
3
+ version = "0.1.7"
4
4
  description = "A RAG (Retrieval-Augmented Generation) toolkit with Milvus integration"
5
5
  authors = ["Mohamed Sadek <mohamedfawzydes@gmail.com>"]
6
6
  readme = "README.md"
@@ -26,6 +26,8 @@ pydantic = "^2.10.6"
26
26
  dill = "^0.3.9"
27
27
  openai = "^1.61.1"
28
28
  boto3 = "^1.36.14"
29
+ pytest-mock = "^3.14.0"
30
+ mocker = "^1.1.1"
29
31
 
30
32
  [tool.poetry.group.dev.dependencies]
31
33
  pytest = "^8.3.4"
@@ -37,6 +37,10 @@ class Ragxo:
37
37
  self.processing_fn.append(fn)
38
38
  return self
39
39
 
40
+ def add_llm_response_fn(self, fn: Callable) -> Self:
41
+ self.llm_response_fn = fn
42
+ return self
43
+
40
44
  def add_embedding_fn(self, fn: Callable) -> Self:
41
45
  if not fn:
42
46
  raise ValueError("Embedding function cannot be None")
@@ -47,8 +51,19 @@ class Ragxo:
47
51
  self.system_prompt = prompt
48
52
  return self
49
53
 
50
- def add_model(self, model: str) -> Self:
54
+ def add_model(self, model: str, limit: int = 10,
55
+ temperature: float = 0.5,
56
+ max_tokens: int = 1000,
57
+ top_p: float = 1.0,
58
+ frequency_penalty: float = 0.0,
59
+ presence_penalty: float = 0.0) -> Self:
51
60
  self.model = model
61
+ self.limit = limit
62
+ self.temperature = temperature
63
+ self.max_tokens = max_tokens
64
+ self.top_p = top_p
65
+ self.frequency_penalty = frequency_penalty
66
+ self.presence_penalty = presence_penalty
52
67
  return self
53
68
 
54
69
  def index(self, data: list[Document]) -> Self:
@@ -78,7 +93,7 @@ class Ragxo:
78
93
  ])
79
94
  return self
80
95
 
81
- def query(self, query: str, output_fields: list[str] = ['text', 'metadata']) -> list[list[dict]]:
96
+ def query(self, query: str, output_fields: list[str] = ['text', 'metadata'], limit: int = 10) -> list[list[dict]]:
82
97
  if not self.embedding_fn:
83
98
  raise ValueError("Embedding function not set. Please call add_embedding_fn first.")
84
99
 
@@ -91,7 +106,7 @@ class Ragxo:
91
106
  return self.client.search(
92
107
  collection_name=self.collection_name,
93
108
  data=[embedding],
94
- limit=10,
109
+ limit=limit,
95
110
  output_fields=output_fields
96
111
  )
97
112
 
@@ -235,9 +250,11 @@ class Ragxo:
235
250
  logger.error(f"Error in S3 load: {e}")
236
251
  raise
237
252
 
238
- def generate_llm_response(self, query: str, data: list[dict] = None) -> ChatCompletion:
253
+ def generate_llm_response(self,
254
+ query: str,
255
+ data: list[dict] = None) -> ChatCompletion:
239
256
  if data is None:
240
- data = self.query(query)[0]
257
+ data = self.query(query, limit=self.limit)[0]
241
258
 
242
259
  if not self.system_prompt:
243
260
  raise ValueError("System prompt not set. Please call add_system_prompt first.")
@@ -247,7 +264,12 @@ class Ragxo:
247
264
  messages=[
248
265
  {"role": "system", "content": self.system_prompt},
249
266
  {"role": "user", "content": "query: {} data: {}".format(query, data)}
250
- ]
267
+ ],
268
+ temperature=self.temperature,
269
+ max_tokens=self.max_tokens,
270
+ top_p=self.top_p,
271
+ frequency_penalty=self.frequency_penalty,
272
+ presence_penalty=self.presence_penalty,
251
273
  )
252
274
 
253
275
  return response
File without changes