DeepFabric: deepfabric-4.4.1-py3-none-any.whl → deepfabric-4.6.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (39)
  1. deepfabric/__init__.py +8 -0
  2. deepfabric/auth.py +8 -2
  3. deepfabric/builders.py +2 -2
  4. deepfabric/builders_agent.py +18 -6
  5. deepfabric/cli.py +292 -13
  6. deepfabric/cloud_upload.py +884 -0
  7. deepfabric/config.py +47 -20
  8. deepfabric/config_manager.py +2 -2
  9. deepfabric/dataset.py +302 -0
  10. deepfabric/evaluation/backends/__init__.py +2 -0
  11. deepfabric/evaluation/backends/llm_eval_backend.py +527 -0
  12. deepfabric/evaluation/backends/ollama_backend.py +3 -3
  13. deepfabric/evaluation/backends/tool_call_parsers.py +7 -7
  14. deepfabric/evaluation/backends/transformers_backend.py +73 -16
  15. deepfabric/evaluation/evaluator.py +41 -7
  16. deepfabric/evaluation/evaluators/builtin/tool_calling.py +13 -8
  17. deepfabric/evaluation/inference.py +77 -5
  18. deepfabric/evaluation/metrics.py +4 -0
  19. deepfabric/evaluation/parser.py +8 -8
  20. deepfabric/evaluation/reporters/cloud_reporter.py +19 -6
  21. deepfabric/exceptions.py +14 -0
  22. deepfabric/generator.py +8 -4
  23. deepfabric/graph.py +38 -0
  24. deepfabric/hf_hub.py +1 -1
  25. deepfabric/loader.py +554 -0
  26. deepfabric/schemas.py +7 -7
  27. deepfabric/topic_manager.py +4 -0
  28. deepfabric/training/__init__.py +24 -5
  29. deepfabric/training/callback.py +43 -1
  30. deepfabric/training/dataset_utils.py +223 -0
  31. deepfabric/training/metrics_sender.py +50 -16
  32. deepfabric/tui.py +9 -1
  33. deepfabric/utils.py +14 -0
  34. deepfabric/validation.py +1 -1
  35. {deepfabric-4.4.1.dist-info → deepfabric-4.6.0.dist-info}/METADATA +84 -177
  36. {deepfabric-4.4.1.dist-info → deepfabric-4.6.0.dist-info}/RECORD +39 -34
  37. {deepfabric-4.4.1.dist-info → deepfabric-4.6.0.dist-info}/WHEEL +0 -0
  38. {deepfabric-4.4.1.dist-info → deepfabric-4.6.0.dist-info}/entry_points.txt +0 -0
  39. {deepfabric-4.4.1.dist-info → deepfabric-4.6.0.dist-info}/licenses/LICENSE +0 -0
deepfabric/config.py CHANGED
```diff
@@ -119,13 +119,13 @@ class TopicsConfig(BaseModel):
 class ConversationConfig(BaseModel):
     """Configuration for conversation structure in generation."""
 
-    type: Literal["basic", "chain_of_thought"] = Field(
+    type: Literal["basic", "cot"] = Field(
         default="basic",
-        description="Base conversation type: basic (simple chat), chain_of_thought (with reasoning)",
+        description="Base conversation type: basic (simple chat), cot (with reasoning)",
     )
     reasoning_style: Literal["freetext", "agent", "structured", "hybrid"] | None = Field(
         default=None,
-        description="Reasoning style for chain_of_thought: freetext or agent. Note: 'structured' and 'hybrid' are deprecated.",
+        description="Reasoning style for cot: freetext or agent. Note: 'structured' and 'hybrid' are deprecated.",
     )
     agent_mode: Literal["single_turn", "multi_turn"] | None = Field(
         default=None,
@@ -159,15 +159,14 @@ class ConversationConfig(BaseModel):
     @model_validator(mode="after")
     def validate_configuration(self):
         """Validate that configuration combinations are consistent."""
-        if self.reasoning_style is not None and self.type != "chain_of_thought":
+        if self.reasoning_style is not None and self.type != "cot":
             raise ValueError(
-                f"reasoning_style can only be set when type='chain_of_thought', "
-                f"got type='{self.type}'"
+                f"reasoning_style can only be set when type='cot', got type='{self.type}'"
             )
 
-        if self.type == "chain_of_thought" and self.reasoning_style is None:
+        if self.type == "cot" and self.reasoning_style is None:
             raise ValueError(
-                "reasoning_style must be specified when type='chain_of_thought'. "
+                "reasoning_style must be specified when type='cot'. "
                 "Choose from: 'freetext' or 'agent'"
             )
```
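The rename is breaking: configs written for 4.4.1 with `type="chain_of_thought"` now fail validation. A minimal sketch of the new contract, assuming `ConversationConfig` is importable from `deepfabric.config` as the file path above suggests:

```python
# Sketch only: exercises the renamed literal and both validator branches
# from the hunk above. Values are illustrative.
from deepfabric.config import ConversationConfig

# Valid in 4.6.0: "cot" replaces "chain_of_thought" and must be paired
# with a reasoning_style.
cfg = ConversationConfig(type="cot", reasoning_style="freetext")

# Each of these raises ValueError under the validator above:
# ConversationConfig(type="basic", reasoning_style="agent")  # style without cot
# ConversationConfig(type="cot")                             # cot without style
```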
```diff
@@ -346,16 +345,37 @@ class KaggleConfig(BaseModel):
     version_notes: str | None = Field(None, description="Version notes for dataset update")
 
 
+class DeepFabricCloudConfig(BaseModel):
+    """Configuration for DeepFabric Cloud integration."""
+
+    graph: str | None = Field(
+        default=None,
+        description="DeepFabric Cloud graph handle (e.g., username/graph-name)",
+    )
+    dataset: str | None = Field(
+        default=None,
+        description="DeepFabric Cloud dataset handle (e.g., username/dataset-name)",
+    )
+    description: str | None = Field(
+        default=None,
+        description="Description for uploaded resources",
+    )
+    tags: list[str] = Field(
+        default_factory=list,
+        description="Tags for uploaded resources",
+    )
+
+
 class EvaluationConfig(BaseModel):
     """Configuration for model evaluation."""
 
-    conversation_type: Literal["basic", "chain_of_thought"] = Field(
+    conversation_type: Literal["basic", "cot"] = Field(
         ...,
         description="Conversation type (must match dataset generation)",
     )
     reasoning_style: Literal["freetext", "agent", "structured", "hybrid"] | None = Field(
         default=None,
-        description="Reasoning style for chain_of_thought type",
+        description="Reasoning style for cot type",
     )
 
     @field_validator("reasoning_style", mode="before")
```
```diff
@@ -419,15 +439,15 @@ class EvaluationConfig(BaseModel):
     @model_validator(mode="after")
     def validate_evaluation_config(self) -> "EvaluationConfig":
         """Validate evaluation configuration consistency."""
-        if self.reasoning_style is not None and self.conversation_type != "chain_of_thought":
+        if self.reasoning_style is not None and self.conversation_type != "cot":
             raise ValueError(
-                f"reasoning_style can only be set when conversation_type='chain_of_thought', "
+                f"reasoning_style can only be set when conversation_type='cot', "
                 f"got conversation_type='{self.conversation_type}'"
             )
 
-        if self.conversation_type == "chain_of_thought" and self.reasoning_style is None:
+        if self.conversation_type == "cot" and self.reasoning_style is None:
             raise ValueError(
-                "reasoning_style must be specified when conversation_type='chain_of_thought'. "
+                "reasoning_style must be specified when conversation_type='cot'. "
                 "Choose from: 'freetext' or 'agent'"
             )
 
@@ -457,6 +477,9 @@ class DeepFabricConfig(BaseModel):
     evaluation: EvaluationConfig | None = Field(None, description="Evaluation configuration")
     huggingface: HuggingFaceConfig | None = Field(None, description="Hugging Face configuration")
     kaggle: KaggleConfig | None = Field(None, description="Kaggle configuration")
+    deepfabric_cloud: DeepFabricCloudConfig | None = Field(
+        None, description="DeepFabric Cloud configuration"
+    )
 
     @classmethod
     def _detect_old_format(cls, config_dict: dict) -> bool:
@@ -663,6 +686,10 @@ See documentation for full examples.
         """Get Kaggle configuration."""
         return self.kaggle.model_dump() if self.kaggle else {}
 
+    def get_deepfabric_cloud_config(self) -> dict:
+        """Get DeepFabric Cloud configuration."""
+        return self.deepfabric_cloud.model_dump() if self.deepfabric_cloud else {}
+
     def get_configured_providers(self) -> set[str]:
         """Get the set of LLM providers configured in this config."""
         providers = set()
```
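As with `get_kaggle_config()` directly above it, the new accessor returns a plain dict and falls back to an empty dict when the section is absent, so callers can chain `.get(...)` without a None check. A sketch, assuming `config` is a populated `DeepFabricConfig`:

```python
# Sketch: both branches of the accessor added above.
cloud_cfg = config.get_deepfabric_cloud_config()

# With a deepfabric_cloud section: a model_dump() dict, e.g.
#   {"graph": "alice/topic-graph", "dataset": None, "description": None, "tags": []}
# Without one: {}
dataset_handle = cloud_cfg.get("dataset")  # safe either way
```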
```diff
@@ -808,13 +835,13 @@ class DataEngineConfig(BaseModel):
         default=None,
         description="Rate limiting and retry configuration",
     )
-    conversation_type: Literal["basic", "chain_of_thought"] = Field(
+    conversation_type: Literal["basic", "cot"] = Field(
         default="basic",
         description="Base conversation type",
     )
     reasoning_style: Literal["freetext", "agent", "structured", "hybrid"] | None = Field(
         default=None,
-        description="Reasoning style for chain_of_thought type",
+        description="Reasoning style for cot type",
     )
 
     @field_validator("reasoning_style", mode="before")
@@ -839,15 +866,15 @@ class DataEngineConfig(BaseModel):
 
     @model_validator(mode="after")
     def validate_configuration(self):
-        if self.reasoning_style is not None and self.conversation_type != "chain_of_thought":
+        if self.reasoning_style is not None and self.conversation_type != "cot":
             raise ValueError(
-                f"reasoning_style can only be set when conversation_type='chain_of_thought', "
+                f"reasoning_style can only be set when conversation_type='cot', "
                 f"got conversation_type='{self.conversation_type}'"
             )
 
-        if self.conversation_type == "chain_of_thought" and self.reasoning_style is None:
+        if self.conversation_type == "cot" and self.reasoning_style is None:
             raise ValueError(
-                "reasoning_style must be specified when conversation_type='chain_of_thought'. "
+                "reasoning_style must be specified when conversation_type='cot'. "
                 "Choose from: 'freetext' or 'agent'"
             )
 
```
deepfabric/config_manager.py CHANGED
```diff
@@ -63,8 +63,8 @@ def load_config(  # noqa: PLR0913
         output_save_as: Path to save dataset
         include_system_message: Include system message in dataset
         mode: Topic generation mode (tree or graph)
-        conversation_type: Base conversation type (basic, chain_of_thought)
-        reasoning_style: Reasoning style for chain_of_thought (freetext, agent)
+        conversation_type: Base conversation type (basic, cot)
+        reasoning_style: Reasoning style for cot (freetext, agent)
         agent_mode: Agent mode (single_turn, multi_turn)
 
     Returns:
```
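Only the parameter documentation changes here, but it reflects the same breaking rename: callers of `load_config` must now pass the short literal. A hypothetical call shape (the full signature is not visible in this diff, so other parameters are omitted):

```python
# Hypothetical: parameter names are taken from the docstring hunk above;
# load_config takes more parameters than shown (hence the # noqa: PLR0913).
config = load_config(
    mode="graph",
    conversation_type="cot",   # was "chain_of_thought" in 4.4.1
    reasoning_style="agent",
    agent_mode="multi_turn",
)
```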
deepfabric/dataset.py ADDED
```diff
@@ -0,0 +1,302 @@
+"""Native DeepFabric Dataset implementation.
+
+This module provides a simple, maintainable Dataset class with no external
+dependencies (beyond stdlib). It supports column-oriented access patterns
+similar to HuggingFace datasets.
+"""
+
+import json
+import random
+
+from collections.abc import Callable, Iterator
+from typing import Any, overload
+
+
+class Dataset:
+    """A simple, native dataset class that stores data as a list of dicts
+    with column-oriented access patterns.
+
+    Examples:
+        >>> ds = Dataset([{"text": "hello"}, {"text": "world"}])
+        >>> len(ds)
+        2
+        >>> ds["text"]
+        ['hello', 'world']
+        >>> ds[0]
+        {'text': 'hello'}
+        >>> ds[0:1]
+        Dataset with 1 samples
+    """
+
+    def __init__(self, data: list[dict[str, Any]], metadata: dict | None = None):
+        """Initialize dataset from list of sample dicts.
+
+        Args:
+            data: List of sample dictionaries
+            metadata: Optional metadata (source, path, etc.)
+        """
+        self._data = data
+        self._metadata = metadata or {}
+        self._columns: list[str] | None = None
+
+    @property
+    def column_names(self) -> list[str]:
+        """Return list of column names."""
+        if self._columns is None:
+            if self._data:
+                # Collect all unique keys across samples
+                all_keys: set[str] = set()
+                for sample in self._data:
+                    all_keys.update(sample.keys())
+                self._columns = sorted(all_keys)
+            else:
+                self._columns = []
+        return self._columns
+
+    @property
+    def num_rows(self) -> int:
+        """Return number of samples (alias for len)."""
+        return len(self._data)
+
+    def __len__(self) -> int:
+        """Return number of samples."""
+        return len(self._data)
+
+    @overload
+    def __getitem__(self, key: str) -> list[Any]: ...
+
+    @overload
+    def __getitem__(self, key: int) -> dict[str, Any]: ...
+
+    @overload
+    def __getitem__(self, key: slice) -> "Dataset": ...
+
+    def __getitem__(self, key: str | int | slice) -> Any:
+        """Access by column name, index, or slice.
+
+        Args:
+            key: Column name (str), row index (int), or slice
+
+        Returns:
+            - For str: list of values for that column
+            - For int: dict for that sample
+            - For slice: new Dataset with selected samples
+
+        Examples:
+            >>> ds["messages"]  # Get column as list
+            >>> ds[0]  # Get first sample as dict
+            >>> ds[0:10]  # Get first 10 samples as new Dataset
+        """
+        if isinstance(key, str):
+            # Column access - return list of values
+            return [sample.get(key) for sample in self._data]
+        if isinstance(key, int):
+            # Single sample access
+            if key < 0:
+                key = len(self._data) + key
+            if key < 0 or key >= len(self._data):
+                raise IndexError(
+                    f"Index {key} out of range for dataset with {len(self._data)} samples"
+                )
+            return self._data[key]
+        if isinstance(key, slice):
+            # Slice access - return new Dataset
+            return Dataset(self._data[key], self._metadata.copy())
+        raise TypeError(f"Invalid key type: {type(key)}. Expected str, int, or slice.")
+
+    def __iter__(self) -> Iterator[dict[str, Any]]:
+        """Iterate over samples."""
+        return iter(self._data)
+
+    def __repr__(self) -> str:
+        """Return string representation."""
+        cols = ", ".join(self.column_names[:5])
+        if len(self.column_names) > 5:  # noqa: PLR2004
+            cols += ", ..."
+        return f"Dataset(num_rows={len(self)}, columns=[{cols}])"
+
+    def split(
+        self,
+        test_size: float = 0.1,
+        seed: int | None = None,
+    ) -> dict[str, "Dataset"]:
+        """Split dataset into train and test sets.
+
+        Args:
+            test_size: Fraction of data for test set (0.0 to 1.0)
+            seed: Random seed for reproducibility
+
+        Returns:
+            Dict with "train" and "test" Dataset instances
+
+        Examples:
+            >>> splits = ds.split(test_size=0.1, seed=42)
+            >>> train_ds = splits["train"]
+            >>> test_ds = splits["test"]
+        """
+        if not 0.0 < test_size < 1.0:
+            raise ValueError("test_size must be between 0.0 and 1.0 (exclusive)")
+
+        # Use a local Random instance to avoid affecting global state
+        rng = random.Random(seed)  # noqa: S311 # nosec
+
+        # Create shuffled indices
+        indices = list(range(len(self._data)))
+        rng.shuffle(indices)
+
+        # Calculate split point
+        split_idx = int(len(indices) * (1 - test_size))
+
+        train_indices = indices[:split_idx]
+        test_indices = indices[split_idx:]
+
+        return {
+            "train": self.select(train_indices),
+            "test": self.select(test_indices),
+        }
+
+    def select(self, indices: list[int]) -> "Dataset":
+        """Select samples by indices.
+
+        Args:
+            indices: List of integer indices to select
+
+        Returns:
+            New Dataset with selected samples
+        """
+        return Dataset([self._data[i] for i in indices], self._metadata.copy())
+
+    def shuffle(self, seed: int | None = None) -> "Dataset":
+        """Return a shuffled copy of the dataset.
+
+        Args:
+            seed: Random seed for reproducibility
+
+        Returns:
+            New Dataset with shuffled samples
+        """
+        rng = random.Random(seed)  # nosec # noqa: S311
+        indices = list(range(len(self._data)))
+        rng.shuffle(indices)
+        return self.select(indices)
+
+    def map(self, fn: Callable[[dict[str, Any]], dict[str, Any]]) -> "Dataset":
+        """Apply function to each sample.
+
+        Args:
+            fn: Function that takes a sample dict and returns a new sample dict
+
+        Returns:
+            New Dataset with transformed samples
+
+        Examples:
+            >>> ds.map(lambda x: {"text": x["text"].upper()})
+        """
+        return Dataset([fn(sample) for sample in self._data], self._metadata.copy())
+
+    def filter(self, fn: Callable[[dict[str, Any]], bool]) -> "Dataset":
+        """Filter samples by predicate function.
+
+        Args:
+            fn: Function that takes a sample dict and returns True to keep
+
+        Returns:
+            New Dataset with filtered samples
+
+        Examples:
+            >>> ds.filter(lambda x: len(x["text"]) > 10)
+        """
+        return Dataset([s for s in self._data if fn(s)], self._metadata.copy())
+
+    def to_list(self) -> list[dict[str, Any]]:
+        """Return data as list of dicts.
+
+        Returns:
+            Copy of internal data as list of dictionaries
+        """
+        return self._data.copy()
+
+    def to_hf(self) -> Any:
+        """Convert to HuggingFace Dataset for use with TRL/transformers.
+
+        Returns:
+            A HuggingFace datasets.Dataset instance
+
+        Raises:
+            ImportError: If the 'datasets' package is not installed
+
+        Examples:
+            >>> from deepfabric import load_dataset
+            >>> ds = load_dataset("data.jsonl")
+            >>> hf_ds = ds.to_hf()
+            >>> trainer = SFTTrainer(train_dataset=hf_ds, ...)
+        """
+        try:
+            from datasets import Dataset as HFDataset  # noqa: PLC0415
+        except ImportError:
+            raise ImportError(
+                "The 'datasets' package is required for to_hf(). "
+                "Install it with: pip install datasets"
+            ) from None
+
+        return HFDataset.from_list(self._data)
+
+    def to_jsonl(self, path: str) -> None:
+        """Save dataset to JSONL file.
+
+        Args:
+            path: File path to save to
+        """
+        with open(path, "w", encoding="utf-8") as f:
+            for sample in self._data:
+                f.write(json.dumps(sample, ensure_ascii=False) + "\n")
+
+    @classmethod
+    def from_jsonl(cls, path: str) -> "Dataset":
+        """Load dataset from JSONL file.
+
+        Args:
+            path: File path to load from
+
+        Returns:
+            New Dataset loaded from file
+        """
+        data = []
+        with open(path, encoding="utf-8") as f:
+            for line in f:
+                if line.strip():
+                    data.append(json.loads(line))
+        return cls(data, metadata={"source": "jsonl", "path": path})
+
+    @classmethod
+    def from_list(cls, data: list[dict[str, Any]]) -> "Dataset":
+        """Create dataset from list of dicts.
+
+        Args:
+            data: List of sample dictionaries
+
+        Returns:
+            New Dataset from the provided data
+        """
+        return cls(data)
+
+
+class DatasetDict(dict):
+    """Dictionary of Dataset objects for train/test/validation splits.
+
+    A simple dict subclass that provides typed access to Dataset values.
+
+    Examples:
+        >>> dd = DatasetDict({"train": train_ds, "test": test_ds})
+        >>> dd["train"]
+        Dataset(num_rows=100, columns=[...])
+    """
+
+    def __getitem__(self, key: str) -> Dataset:
+        """Get Dataset by split name."""
+        return super().__getitem__(key)
+
+    def __repr__(self) -> str:
+        """Return string representation."""
+        splits = ", ".join(f"{k}: {len(v)} rows" for k, v in self.items())
+        return f"DatasetDict({{{splits}}})"
```
deepfabric/evaluation/backends/__init__.py CHANGED
```diff
@@ -1,5 +1,6 @@
 """Inference backend implementations."""
 
+from .llm_eval_backend import LLMEvalBackend
 from .ollama_backend import OllamaBackend
 from .tool_call_parsers import (
     GenericToolCallParser,
@@ -18,6 +19,7 @@ from .transformers_backend import TransformersBackend
 __all__ = [
     "TransformersBackend",
     "OllamaBackend",
+    "LLMEvalBackend",
     # Tool call parsers
     "ToolCallParser",
     "ToolCallParserRegistry",
```