sf-vector-sdk 0.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,476 @@
1
+ Metadata-Version: 2.4
2
+ Name: sf-vector-sdk
3
+ Version: 0.2.0
4
+ Summary: Python SDK for the Vector Gateway service (embeddings and vector search)
5
+ Requires-Python: >=3.11
6
+ Requires-Dist: redis>=5.0.0
7
+ Provides-Extra: dev
8
+ Requires-Dist: pytest-asyncio>=0.21.0; extra == 'dev'
9
+ Requires-Dist: pytest>=7.0.0; extra == 'dev'
10
+ Requires-Dist: ruff>=0.1.0; extra == 'dev'
11
+ Description-Content-Type: text/markdown
12
+
13
+ # Vector SDK for Python
14
+
15
+ A lightweight Python client for submitting embedding requests and vector search queries to the Vector Gateway service.
16
+
17
+ ## Overview
18
+
19
+ The Vector SDK provides a simple interface for generating embeddings and running vector searches through the centralized Vector Gateway service. It communicates with the gateway directly over Redis Streams, which keeps it lightweight and makes it suitable for any Python service that can reach the shared Redis VM.
20
+
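+ In practice you only use the client API, but it helps to know what happens underneath: the SDK serializes each request, appends it to a Redis stream that the gateway consumes, and then waits for the gateway to publish a result. A minimal sketch of that idea with the `redis` package (the stream name, payload shape, and result handling below are illustrative assumptions, not the SDK's actual wire format):
+
+ ```python
+ import json
+ import redis
+
+ r = redis.Redis.from_url("redis://your-redis-host:6379")
+
+ # Hypothetical stream name and payload; the real schema is owned by the SDK and gateway.
+ entry_id = r.xadd(
+     "vector:requests:normal",
+     {"payload": json.dumps({"texts": [{"id": "doc1", "text": "hello"}]})},
+ )
+ # The gateway reads the stream, generates embeddings, and writes a result
+ # that the SDK then picks up (e.g. from a per-request result key).
+ ```
+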
21
+ **Key Features:**
22
+ - Simple, Pythonic API with namespace-based organization
23
+ - Intuitive namespaces: `client.embeddings`, `client.search`, `client.db`, and `client.structured_embeddings`
24
+ - Asynchronous request submission with optional waiting
25
+ - Full type hints and documentation
26
+ - Multiple embedding model support (Google Vertex AI and OpenAI)
27
+ - Client-side model validation before submission
28
+ - Minimal dependencies (just Redis)
29
+
30
+ ## Installation
31
+
32
+ ### From Source (Monorepo)
33
+
34
+ ```bash
35
+ cd packages/py/vector-sdk
36
+ pip install -e .
37
+ # Or with uv
38
+ uv pip install -e .
39
+ ```
40
+
41
+ ### From Package Registry (when published)
42
+
43
+ ```bash
44
+ pip install sf-vector-sdk
45
+ ```
46
+
47
+ ## Quick Start
48
+
49
+ ### Basic Usage
50
+
51
+ ```python
52
+ from vector_sdk import VectorClient
+
+ # Create client
+ client = VectorClient(
+     redis_url="redis://your-redis-host:6379",
+     http_url="http://localhost:8080",  # Required for db operations
+ )
+
+ # Create embeddings
+ result = client.embeddings.create_and_wait(
+     texts=[
+         {"id": "doc1", "text": "Introduction to machine learning"},
+         {"id": "doc2", "text": "Deep neural networks explained"},
+     ],
+     content_type="topic",
+ )
+ print(f"Processed: {result.processed_count}, Failed: {result.failed_count}")
+
+ # Vector search
+ search_result = client.search.query_and_wait(
+     query_text="What is machine learning?",
+     database="turbopuffer",
+     namespace="topics",
+     top_k=10,
+ )
+ for match in search_result.matches:
+     print(f"{match.id}: {match.score}")
+
+ # Direct database lookup (no embedding)
+ docs = client.db.get_by_ids(
+     ids=["doc1"],
+     database="turbopuffer",
+     namespace="topics",
+ )
+
+ client.close()
88
+ ```
89
+
90
+ ### With Storage Configuration
91
+
92
+ ```python
93
+ from vector_sdk import VectorClient, StorageConfig, MongoDBStorage, TurboPufferStorage
94
+
95
+ client = VectorClient(redis_url="redis://your-redis-host:6379")
96
+
97
+ # Create embeddings with storage configuration
98
+ result = client.embeddings.create_and_wait(
+     texts=[
+         {
+             "id": "tool123",
+             "text": "Term: Photosynthesis. Definition: The process by which plants convert sunlight into energy.",
+             "document": {
+                 "toolId": "tool123",
+                 "toolCollection": "FlashCard",
+                 "userId": "user456",
+                 "contentHash": "abc123",
+             },
+         }
+     ],
+     content_type="flashcard",
+     priority="high",
+     storage=StorageConfig(
+         mongodb=MongoDBStorage(
+             database="events_new",
+             collection="tool_vectors",
+             embedding_field="toolEmbedding",
+             upsert_key="contentHash",
+         ),
+         turbopuffer=TurboPufferStorage(
+             namespace="tool_vectors",
+             id_field="_id",
+             metadata=["toolId", "toolCollection", "userId"],
+         ),
+     ),
+     metadata={"source": "my-service"},
+ )
128
+
129
+ client.close()
130
+ ```
131
+
132
+ ### Context Manager
133
+
134
+ ```python
135
+ with VectorClient(redis_url="redis://localhost:6379") as client:
+     result = client.embeddings.create_and_wait(
+         texts=[{"id": "doc1", "text": "Hello world"}],
+         content_type="document",
+     )
+ # Connection automatically closed
141
+ ```
142
+
143
+ ## API Reference
144
+
145
+ ### VectorClient
146
+
147
+ The main client class providing namespaced access to all SDK functionality.
148
+
149
+ #### Constructor
150
+
151
+ ```python
152
+ client = VectorClient(
+     redis_url="redis://localhost:6379",
+     http_url="http://localhost:8080",  # Optional, required for db operations
+ )
156
+ ```
157
+
158
+ ### Namespaces
159
+
160
+ #### `client.embeddings`
161
+
162
+ Embedding generation operations.
163
+
164
+ | Method | Description |
165
+ |--------|-------------|
166
+ | `create(texts, content_type, ...)` | Submit embedding request, return request ID |
167
+ | `wait_for(request_id, timeout)` | Wait for request completion |
168
+ | `create_and_wait(texts, content_type, ...)` | Submit and wait for result |
169
+ | `get_queue_depth()` | Get current queue depth for each priority |
170
+
171
+ ```python
172
+ # Async: create and wait separately
173
+ request_id = client.embeddings.create(texts, content_type)
174
+ result = client.embeddings.wait_for(request_id)
175
+
176
+ # Sync: create and wait in one call
177
+ result = client.embeddings.create_and_wait(texts, content_type)
178
+
179
+ # Check queue depth
180
+ depths = client.embeddings.get_queue_depth()
181
+ ```
182
+
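+ `get_queue_depth()` is useful for pacing background work. A hedged sketch (the exact return shape is not pinned down in this README; the code below assumes a mapping of priority name to pending-request count):
+
+ ```python
+ import time
+
+ # Assumption: get_queue_depth() returns something like {"critical": 0, "high": 12, ...}.
+ depths = client.embeddings.get_queue_depth()
+ while depths.get("low", 0) > 1000:  # illustrative threshold, not an SDK constant
+     time.sleep(5)  # back off before submitting more backfill work
+     depths = client.embeddings.get_queue_depth()
+ ```
+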
183
+ #### `client.search`
184
+
185
+ Vector similarity search operations.
186
+
187
+ | Method | Description |
188
+ |--------|-------------|
189
+ | `query(query_text, database, ...)` | Submit search query, return request ID |
190
+ | `wait_for(request_id, timeout)` | Wait for query completion |
191
+ | `query_and_wait(query_text, database, ...)` | Submit and wait for result |
192
+
193
+ ```python
194
+ # Vector search with semantic similarity
195
+ result = client.search.query_and_wait(
+     query_text="What is machine learning?",
+     database="turbopuffer",
+     namespace="topics",
+     top_k=10,
+     include_metadata=True,
+ )
202
+ ```
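+
+ As with embeddings, you can also split submission and waiting (parameter names follow the table above; the timeout value is illustrative):
+
+ ```python
+ # Submit the query now, collect the result later
+ request_id = client.search.query(
+     query_text="What is machine learning?",
+     database="turbopuffer",
+     namespace="topics",
+ )
+ result = client.search.wait_for(request_id, timeout=30)
+ ```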
203
+
204
+ #### `client.db`
205
+
206
+ Direct database operations (no embedding required). Requires `http_url`.
207
+
208
+ | Method | Description |
209
+ |--------|-------------|
210
+ | `get_by_ids(ids, database, ...)` | Lookup documents by ID |
211
+ | `find_by_metadata(filters, database, ...)` | Search by metadata filters |
212
+ | `clone(id, source_namespace, destination_namespace)` | Clone document between namespaces |
213
+ | `delete(id, namespace)` | Delete document from namespace |
214
+
+ ```python
+ # Lookup by IDs
+ result = client.db.get_by_ids(
+     ids=["doc1", "doc2"],
+     database="turbopuffer",
+     namespace="topics",
+ )
+
+ # Find by metadata
+ result = client.db.find_by_metadata(
+     filters={"userId": "user123"},
+     database="mongodb",
+     collection="vectors",
+     database_name="mydb",
+ )
+
+ # Clone between namespaces
+ result = client.db.clone("doc1", "ns1", "ns2")
+
+ # Delete
+ result = client.db.delete("doc1", "ns1")
+ ```
+
215
+ #### `client.structured_embeddings`
216
+
217
+ Type-safe embedding for known tool types (FlashCard, TestQuestion, etc.) with automatic text extraction, content hash computation, and database routing.
218
+
219
+ | Method | Description |
220
+ |--------|-------------|
221
+ | `embed_flashcard(data, metadata)` | Embed a flashcard, return request ID |
222
+ | `embed_flashcard_and_wait(data, metadata, timeout)` | Embed and wait for result |
223
+ | `embed_test_question(data, metadata)` | Embed a test question, return request ID |
224
+ | `embed_test_question_and_wait(data, metadata, timeout)` | Embed and wait for result |
225
+ | `embed_spaced_test_question(data, metadata)` | Embed a spaced test question, return request ID |
226
+ | `embed_spaced_test_question_and_wait(data, metadata, timeout)` | Embed and wait for result |
227
+ | `embed_audio_recap(data, metadata)` | Embed an audio recap section, return request ID |
228
+ | `embed_audio_recap_and_wait(data, metadata, timeout)` | Embed and wait for result |
229
+
230
+ ```python
231
+ from vector_sdk import VectorClient, ToolMetadata, TestQuestionInput
232
+
233
+ client = VectorClient(redis_url="redis://localhost:6379")
234
+
235
+ # Embed a flashcard - SDK handles text extraction, hashing, and routing
236
+ result = client.structured_embeddings.embed_flashcard_and_wait(
+     data={"type": "BASIC", "term": "Mitochondria", "definition": "The powerhouse of the cell"},
+     metadata=ToolMetadata(tool_id="tool123", user_id="user456", topic_id="topic789"),
+ )
+
+ # Embed a test question
+ result = client.structured_embeddings.embed_test_question_and_wait(
+     data=TestQuestionInput(
+         question="What is the capital?",
+         answers=[...],
+         question_type="multiplechoice",
+     ),
+     metadata=ToolMetadata(tool_id="tool456"),
+ )
250
+ ```
251
+
252
+ **Database Routing:**
253
+
254
+ Set the `STRUCTURED_EMBEDDING_DATABASE_ROUTER` environment variable:
255
+
256
+ | Value | Behavior |
257
+ |-------|----------|
258
+ | `dual` | Write to both TurboPuffer AND Pinecone if both have `enabled: True` |
259
+ | `turbopuffer` | Only write to TurboPuffer |
260
+ | `pinecone` | Only write to Pinecone |
261
+ | (unset) | Defaults to `turbopuffer` |
262
+
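+ The variable is normally set in the service's deployment environment; for local experimentation you can also set it in-process (this assumes the router reads the variable when a structured embedding is submitted):
+
+ ```python
+ import os
+
+ # Assumption: the value is consulted at submission time, so setting it before
+ # calling client.structured_embeddings.* is enough for a local test.
+ os.environ["STRUCTURED_EMBEDDING_DATABASE_ROUTER"] = "dual"
+ ```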
263
285
+
286
+ ### Types
287
+
288
+ #### Result Types
289
+
290
+ ```python
291
+ @dataclass
+ class EmbeddingResult:
+     request_id: str
+     status: str  # "success", "partial", "failed"
+     processed_count: int
+     failed_count: int
+     errors: list[EmbeddingError]
+     timing: Optional[TimingBreakdown]
+     completed_at: datetime
+
+     @property
+     def is_success(self) -> bool: ...
+     @property
+     def is_partial(self) -> bool: ...
+     @property
+     def is_failed(self) -> bool: ...
+
+ @dataclass
+ class QueryResult:
+     request_id: str
+     status: str  # "success", "failed"
+     matches: list[VectorMatch]
+     error: Optional[str]
+     timing: Optional[QueryTiming]
+     completed_at: datetime
+
+ @dataclass
+ class VectorMatch:
+     id: str
+     score: float  # Similarity score (0-1, higher is more similar)
+     metadata: Optional[dict]
+     vector: Optional[list[float]]
323
+ ```
324
+
325
+ ## Priority Levels
326
+
327
+ | Priority | Use Case | Description |
328
+ |----------|----------|-------------|
329
+ | `critical` | Real-time user requests | Reserved quota, processed first |
330
+ | `high` | New content embeddings | Standard processing priority |
331
+ | `normal` | Updates, re-embeddings | Default priority |
332
+ | `low` | Backfill, batch jobs | Processed when capacity available |
333
+
334
+ ```python
335
+ result = client.embeddings.create_and_wait(texts, content_type="topic", priority="critical")
336
+ ```
337
+
338
+ ## Embedding Models
339
+
340
+ ### Supported Models
341
+
342
+ | Model | Provider | Dimensions | Custom Dims |
343
+ |-------|----------|------------|-------------|
344
+ | `gemini-embedding-001` | Google | 3072 | No |
345
+ | `text-embedding-004` | Google | 768 | No |
346
+ | `text-multilingual-embedding-002` | Google | 768 | No |
347
+ | `text-embedding-3-small` | OpenAI | 1536 | Yes |
348
+ | `text-embedding-3-large` | OpenAI | 3072 | Yes |
349
+
350
+ ### Using a Specific Model
351
+
352
+ ```python
353
+ result = client.embeddings.create_and_wait(
354
+     texts=[{"id": "doc1", "text": "Hello world"}],
+     content_type="document",
+     embedding_model="text-embedding-3-small",
+     embedding_dimensions=512,  # Custom dimensions (only for models that support it)
358
+ )
359
+ ```
360
+
361
+ ## Content Hash
362
+
363
+ The SDK provides deterministic content hashing and text extraction helpers for learning tools.
364
+
365
+ ```python
366
+ from vector_sdk import compute_content_hash, extract_tool_text
367
+
368
+ # Compute hash for a FlashCard
369
+ content_hash = compute_content_hash(
+     "FlashCard",
+     {"type": "BASIC", "term": "Mitochondria", "definition": "The powerhouse of the cell"},
+ )
+
+ # Extract text for embedding
+ text = extract_tool_text(
+     "FlashCard",
+     {"type": "BASIC", "term": "Mitochondria", "definition": "The powerhouse of the cell"},
+ )
379
+ ```
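+
+ Because the hash is deterministic, it can serve as an idempotency key. The sketch below reuses the field names from the storage configuration example above (`contentHash` matching `upsert_key="contentHash"`); it is illustrative, not a required document shape:
+
+ ```python
+ from vector_sdk import compute_content_hash
+
+ card = {"type": "BASIC", "term": "Mitochondria", "definition": "The powerhouse of the cell"}
+
+ # Re-embedding identical content yields the same hash, so the storage layer can
+ # upsert on contentHash instead of inserting duplicates.
+ document = {
+     "toolId": "tool123",
+     "toolCollection": "FlashCard",
+     "contentHash": compute_content_hash("FlashCard", card),
+ }
+ ```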
380
+
381
+ ## Migration from EmbeddingClient
382
+
383
+ The SDK now uses a namespace-based API with `VectorClient`. The old `EmbeddingClient` is preserved for backward compatibility.
384
+
385
+ ### Method Mapping
386
+
387
+ | Old (EmbeddingClient) | New (VectorClient) |
388
+ |----------------------|-------------------|
389
+ | `submit()` | `client.embeddings.create()` |
390
+ | `wait_for_result()` | `client.embeddings.wait_for()` |
391
+ | `submit_and_wait()` | `client.embeddings.create_and_wait()` |
392
+ | `get_queue_depth()` | `client.embeddings.get_queue_depth()` |
393
+ | `query()` | `client.search.query()` |
394
+ | `wait_for_query_result()` | `client.search.wait_for()` |
395
+ | `query_and_wait()` | `client.search.query_and_wait()` |
396
+ | `lookup_by_ids()` | `client.db.get_by_ids()` |
397
+ | `search_by_metadata()` | `client.db.find_by_metadata()` |
398
+ | `clone_from_namespace()` | `client.db.clone()` |
399
+ | `delete_from_namespace()` | `client.db.delete()` |
400
+
401
+ ### Migration Example
402
+
403
+ ```python
404
+ # Old API (still works, emits deprecation warnings)
405
+ from vector_sdk import EmbeddingClient
406
+
407
+ client = EmbeddingClient("redis://localhost:6379")
408
+ result = client.submit_and_wait(texts, content_type)
409
+ client.close()
410
+
411
+ # New API (recommended)
412
+ from vector_sdk import VectorClient
413
+
414
+ client = VectorClient(redis_url="redis://localhost:6379")
415
+ result = client.embeddings.create_and_wait(texts, content_type)
416
+ client.close()
417
+ ```
418
+
419
+ ## Error Handling
420
+
421
+ ```python
422
+ from vector_sdk import VectorClient, ModelValidationError
423
+
424
+ try:
+     with VectorClient(redis_url="redis://localhost:6379") as client:
+         result = client.embeddings.create_and_wait(
+             texts=[{"id": "doc1", "text": "Hello"}],
+             content_type="test",
+             embedding_model="text-embedding-3-small",
+             timeout=30,
+         )
+
+         if result.is_success:
+             print("Success!")
+         elif result.is_partial:
+             print("Partial success. Errors:")
+             for err in result.errors:
+                 print(f" - {err.id}: {err.error}")
+
+ except ModelValidationError as e:
+     print(f"Model validation failed: {e}")
+ except TimeoutError as e:
+     print(f"Request timed out: {e}")
+ except ValueError as e:
+     print(f"Invalid input: {e}")
446
+ ```
447
+
448
+ ## Best Practices
449
+
450
+ ### 1. Use Appropriate Priority
451
+
452
+ ```python
453
+ # Use appropriate priority levels
454
+ client.embeddings.create(texts, content_type="backfill", priority="low")
455
+ client.embeddings.create(texts, content_type="userRequest", priority="critical")
456
+ ```
457
+
458
+ ### 2. Batch Your Requests
459
+
460
+ ```python
461
+ # Batch multiple texts per request for efficiency
462
+ texts = [{"id": doc.id, "text": doc.text} for doc in documents]
463
+ client.embeddings.create(texts, content_type)
464
+ ```
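+
+ For very large corpora, you may want to submit in chunks and collect the results afterwards. A sketch (the chunk size is an illustrative choice, not an SDK limit):
+
+ ```python
+ CHUNK_SIZE = 100  # illustrative
+ request_ids = [
+     client.embeddings.create(texts[i:i + CHUNK_SIZE], content_type, priority="low")
+     for i in range(0, len(texts), CHUNK_SIZE)
+ ]
+
+ # Collect results once everything is queued
+ results = [client.embeddings.wait_for(rid) for rid in request_ids]
+ ```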
465
+
466
+ ### 3. Use Context Managers
467
+
468
+ ```python
469
+ with VectorClient(redis_url="redis://...") as client:
+     # Client automatically closed on exit
+     pass
472
+ ```
473
+
474
+ ## License
475
+
476
+ Proprietary - All rights reserved.
@@ -0,0 +1,27 @@
1
+ vector_sdk/__init__.py,sha256=Fq4Pqq-xbDX_4M_lQhw6DVXAggUB-bjscNrUk8GEk2o,6632
2
+ vector_sdk/client.py,sha256=NQFGHyR1aM0UToRFy6e9Xm_v6mk0opqzKN8UlHu97n0,17186
3
+ vector_sdk/content_types.py,sha256=krvFOR58iUZPfYlEVsk0sXD6_ANAFbxEBQGNpt1YPDU,7381
4
+ vector_sdk/types.py,sha256=rQgA2z3ls21vY-DRPZgfmm8gYFkWJk1dQaJI-nbc0no,25514
5
+ vector_sdk/generated/embedding_pipeline/content_types/v1/content_types_pb2.py,sha256=HOyqisydOUgjQ2yEcLdAuW4O46ghcL7W--Sykc9Iwzc,5962
6
+ vector_sdk/generated/embedding_pipeline/content_types/v1/content_types_pb2.pyi,sha256=fOw6liHkiXSEyvEZ_QKexDUgFNhbemuGuk52hwQ5pnQ,6738
7
+ vector_sdk/generated/embedding_pipeline/db/vectors/v1/vectors_pb2.py,sha256=xwujSU8GXborGSDgKoRHQq_DL5CA6YAGX8L_Om35lRc,7057
8
+ vector_sdk/generated/embedding_pipeline/db/vectors/v1/vectors_pb2.pyi,sha256=lxZ27fReDhHv2mKDCiPvKpicXuJObZX2zpfVYuGTk3I,8068
9
+ vector_sdk/generated/embedding_pipeline/query/v1/query_pb2.py,sha256=E7uzz9w9xQlGbe_ZfO2MN_H8B-xpyFkkyixlDfaoGv0,5579
10
+ vector_sdk/generated/embedding_pipeline/query/v1/query_pb2.pyi,sha256=a-rWfFQVAdZM5jK1qHB0bUiuSo6brcB-zUIHQezi0I8,5598
11
+ vector_sdk/generated/embedding_pipeline/tools/v1/tools_pb2.py,sha256=i2VcFAoa8xVFsiXTxseDnZwpwl6iYv4CgwNV18mHHqU,2266
12
+ vector_sdk/generated/embedding_pipeline/tools/v1/tools_pb2.pyi,sha256=KlMGcmAOXgCxVUmtqlyir_fNyRan9Bm3VEv4yGsWgHk,1453
13
+ vector_sdk/hash/__init__.py,sha256=xyy3ezP4o58IkfUr2Kk-YwuAVtNH5uUG6QyUIed4Psw,691
14
+ vector_sdk/hash/hasher.py,sha256=BjQ5d-dhJy2Smo-dssss2JDHcIfHjsvf08O_1h7Dq2I,7976
15
+ vector_sdk/hash/types.py,sha256=QWSmGhbNcYZsRPZKWxgHC-XBOf-OBtE3XMGoTb2hm9Y,1785
16
+ vector_sdk/namespaces/__init__.py,sha256=S9dJfB39s2zjYOpFn9Fvf8bk7mLKcXk5aPatKOA-xO0,374
17
+ vector_sdk/namespaces/base.py,sha256=lioZBcd43mijnN0JwTMMEpQ6whiAjaueTDAAIZS1JM0,1156
18
+ vector_sdk/namespaces/db.py,sha256=a5sEHrfy1xAjRjyM9qfZxr3IznZVA8BnY5W1Hq5jr4I,7230
19
+ vector_sdk/namespaces/embeddings.py,sha256=7hH0hvBAeDf-ypTtOzUAqzc3W6wci_dbt_ZPavcRVyU,8950
20
+ vector_sdk/namespaces/search.py,sha256=bwtZ_rTiP6q-dg8oOM5YA6taDHSphO88aq7RSuzc-tQ,8894
21
+ vector_sdk/structured/__init__.py,sha256=eRiH-V6U-TSl98peoGdsRQukTysW9ZhTsous0fwHU-I,1468
22
+ vector_sdk/structured/router.py,sha256=F3O1TYtbVFCPqVWCCYCt5QcRffX5WPlPQ7K3KlayooQ,5792
23
+ vector_sdk/structured/structured_embeddings.py,sha256=Z93Bcf38fpk8jhQvXTeioxt-yyhtQXo1fMoUKqgVlus,13031
24
+ vector_sdk/structured/tool_config.py,sha256=sv0mRNUcuPO9C8Oh0_Y52YTyakbLk6gjrBW0C04Jt_w,7462
25
+ sf_vector_sdk-0.2.0.dist-info/METADATA,sha256=HA0KnQ9SAIRYk7M-g_IOn5o1y1yL7ISpQS0j_T7u0tw,13671
26
+ sf_vector_sdk-0.2.0.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
27
+ sf_vector_sdk-0.2.0.dist-info/RECORD,,
@@ -0,0 +1,4 @@
1
+ Wheel-Version: 1.0
2
+ Generator: hatchling 1.28.0
3
+ Root-Is-Purelib: true
4
+ Tag: py3-none-any