PyPI - sdg-hub - Versions diffs - 0.1.0a2__tar.gz → 0.1.0a3__tar.gz - Mend

sdg-hub 0.1.0a2__tar.gz → 0.1.0a3__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (164) hide show

{sdg_hub-0.1.0a2 → sdg_hub-0.1.0a3}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: sdg_hub
-Version: 0.1.0a2
+Version: 0.1.0a3
 Summary: Synthetic Data Generation
 Author-email: Red Hat AI Innovation <abhandwa@redhat.com>
 License: Apache-2.0

{sdg_hub-0.1.0a2 → sdg_hub-0.1.0a3}/examples/data-generation-with-llama-70b/data-generation-with-llama-70b.ipynb RENAMED Viewed

@@ -35,7 +35,7 @@
     "Before running this notebook, you'll need to:\n",
     "\n",
     "```bash \n",
-    "pip install git+https://github.com/Red-Hat-AI-Innovation-Team/sdg_hub.git\n",
+    "pip install sdg-hub==0.1.0a2\n",
     "```"
    ]
   },

{sdg_hub-0.1.0a2 → sdg_hub-0.1.0a3}/examples/inference_time_scaling/prm_with_vllm.ipynb RENAMED Viewed

@@ -20,6 +20,18 @@
     "from sdg_hub.blocks.rmblocks import PRMBlock"
    ]
   },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Install sdg-hub\n",
+    "\n",
+    "\n",
+    "```bash \n",
+    "pip install sdg-hub==0.1.0a2\n",
+    "```"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {},

{sdg_hub-0.1.0a2 → sdg_hub-0.1.0a3}/examples/instructlab/knowledge/document_pre_processing.ipynb RENAMED Viewed

@@ -15,10 +15,11 @@
    "metadata": {},
    "source": [
     "### Install SDG\n",
-    " - git clone https://github.com/Red-Hat-AI-Innovation-Team/SDG-Research.git && cd SDG-Research\n",
-    " - pip install -r requirements.txt\n",
-    " - pip install -e .\n",
-    " - pip install rich datasets tabulate transformers"
+    "\n",
+    "```bash \n",
+    "pip install sdg-hub==0.1.0a2\n",
+    "pip install rich datasets tabulate transformers\n",
+    "```"
    ]
   },
   {

{sdg_hub-0.1.0a2 → sdg_hub-0.1.0a3}/examples/instructlab/knowledge/knowledge_generation_and_mixing.ipynb RENAMED Viewed

@@ -15,10 +15,10 @@
    "metadata": {},
    "source": [
     "### Install SDG\n",
-    " - git clone https://github.com/Red-Hat-AI-Innovation-Team/SDG-Research.git && cd SDG-Research\n",
-    " - pip install -r requirements.txt\n",
-    " - pip install -e .\n",
-    " - pip install rich datasets tabulate transformers\n",
+    "```bash \n",
+    "pip install sdg-hub==0.1.0a2\n",
+    "pip install rich datasets tabulate transformers\n",
+    "```\n",
     " - If you haven't already, run the document pre-processing notebook to create the seed data"
    ]
   },

{sdg_hub-0.1.0a2 → sdg_hub-0.1.0a3}/examples/instructlab/skills/unstructed_to_structured.ipynb RENAMED Viewed

@@ -41,6 +41,17 @@
     "The end goal is to create training data that will help align the model with your specific needs, whether that's matching your company's communication style, following particular protocols, or handling specialized tasks in your preferred way."
    ]
   },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Install sdg-hub\n",
+    "\n",
+    "```bash \n",
+    "pip install sdg-hub==0.1.0a2\n",
+    "```"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {},
@@ -404,7 +415,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.12.9"
+   "version": "3.10.16"
   }
  },
  "nbformat": 4,

{sdg_hub-0.1.0a2 → sdg_hub-0.1.0a3}/examples/instructlab/skills/unstructed_to_structured_lls.ipynb RENAMED Viewed

@@ -41,6 +41,17 @@
     "The end goal is to create training data that will help align the model with your specific needs, whether that's matching your company's communication style, following particular protocols, or handling specialized tasks in your preferred way."
    ]
   },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Install sdg-hub\n",
+    "\n",
+    "```bash \n",
+    "pip install sdg-hub==0.1.0a2\n",
+    "```"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {},

{sdg_hub-0.1.0a2 → sdg_hub-0.1.0a3}/examples/knowledge_generation_using_nemotron/knowledge_sdg.ipynb RENAMED Viewed

@@ -16,7 +16,14 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "### Installing Vllm\n",
+    "## Install sdg-hub\n",
+    "\n",
+    "```bash \n",
+    "pip install sdg-hub==0.1.0a2\n",
+    "```\n",
+    "\n",
+    "\n",
+    "## Installing Vllm\n",
     "\n",
     "- Clone vllm repo\n",
     "- Checkout PR #15008\n",

{sdg_hub-0.1.0a2 → sdg_hub-0.1.0a3}/src/sdg_hub/_version.py RENAMED Viewed

@@ -17,5 +17,5 @@ __version__: str
 __version_tuple__: VERSION_TUPLE
 version_tuple: VERSION_TUPLE
-__version__ = version = '0.1.0a2'
+__version__ = version = '0.1.0a3'
 __version_tuple__ = version_tuple = (0, 1, 0)

{sdg_hub-0.1.0a2 → sdg_hub-0.1.0a3}/src/sdg_hub/flow.py RENAMED Viewed

@@ -38,10 +38,37 @@ class Flow(ABC):
         self.base_path = str(resources.files(__package__))
         self.registered_blocks = BlockRegistry.get_registry()
+    def _getFilePath(self, dirs, filename):
+        """
+        Find a named configuration file.
+        Files are checked in the following order
+            - an absolute path is always used as-is
+            - checked relative to the directories in "dirs"
+            - relative to the current directory
+        Args:
+            dirs (list): Directories in which to search for "filename"
+            filename (str): The path to the configuration file.
+        Returns:
+            Selected file path
+        """
+        if os.path.isabs(filename):
+            return filename
+        for d in dirs:
+            full_file_path = os.path.join(d, filename)
+            if os.path.isfile(full_file_path):
+                return full_file_path
+        # If not found above then return the path unchanged i.e.
+        # assume the path is relative to the current directory
+        return filename
     def get_flow_from_file(self, yaml_path: str) -> list:
         yaml_path_relative_to_base = os.path.join(self.base_path, yaml_path)
         if os.path.isfile(yaml_path_relative_to_base):
             yaml_path = yaml_path_relative_to_base
+        yaml_dir = os.path.dirname(yaml_path)
         try:
             with open(yaml_path, "r", encoding="utf-8") as yaml_file:
@@ -86,33 +113,23 @@ class Flow(ABC):
             # update config path to absolute path
             if "config_path" in block["block_config"]:
-                config_path_relative_to_base = os.path.join(
-                    self.base_path, block["block_config"]["config_path"]
+                block["block_config"]["config_path"] = self._getFilePath(
+                    [yaml_dir, self.base_path], block["block_config"]["config_path"]
                 )
-                if os.path.isfile(config_path_relative_to_base):
-                    block["block_config"]["config_path"] = config_path_relative_to_base
             # update config paths to absolute paths - this might be a list or a dict
             if "config_paths" in block["block_config"]:
                 if isinstance(block["block_config"]["config_paths"], dict):
                     for key, path in block["block_config"]["config_paths"].items():
-                        config_path_relative_to_base = os.path.join(
-                            self.base_path, path
+                        block["block_config"]["config_paths"][key] = self._getFilePath(
+                            [yaml_dir, self.base_path], path
                         )
-                        if os.path.isfile(config_path_relative_to_base):
-                            block["block_config"]["config_paths"][key] = (
-                                config_path_relative_to_base
-                            )
-                if isinstance(block["block_config"]["config_paths"], list):
+                elif isinstance(block["block_config"]["config_paths"], list):
                     for i, path in enumerate(block["block_config"]["config_paths"]):
-                        config_path_relative_to_base = os.path.join(
-                            self.base_path, path
+                        block["block_config"]["config_paths"][i] = self._getFilePath(
+                            [yaml_dir, self.base_path], path
                         )
-                        if os.path.isfile(config_path_relative_to_base):
-                            block["block_config"]["config_paths"][i] = (
-                                config_path_relative_to_base
-                            )
             if "operation" in block["block_config"]:
                 block["block_config"]["operation"] = OPERATOR_MAP[

{sdg_hub-0.1.0a2 → sdg_hub-0.1.0a3}/src/sdg_hub.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: sdg_hub
-Version: 0.1.0a2
+Version: 0.1.0a3
 Summary: Synthetic Data Generation
 Author-email: Red Hat AI Innovation <abhandwa@redhat.com>
 License: Apache-2.0

{sdg_hub-0.1.0a2 → sdg_hub-0.1.0a3}/src/sdg_hub.egg-info/SOURCES.txt RENAMED Viewed

@@ -10,7 +10,6 @@ README.md
 pyproject.toml
 requirements-dev.txt
 requirements.txt
-test.ipynb
 tox.ini
 .github/actionlint.yaml
 .github/dependabot.yml
@@ -55,9 +54,6 @@ scripts/docparser.py
 scripts/docparser_v2.py
 scripts/flow_runner.py
 scripts/ruff.sh
-scripts/test_freeform_skills.py
-scripts/test_grounded_skills.py
-scripts/test_knowledge.py
 src/sdg_hub/__init__.py
 src/sdg_hub/_version.py
 src/sdg_hub/flow.py
@@ -145,14 +141,14 @@ src/sdg_hub/flows/generation/skills/synth_grounded_skills.yaml
 src/sdg_hub/flows/generation/skills/synth_skills.yaml
 src/sdg_hub/utils/__init__.py
 src/sdg_hub/utils/chunking.py
-src/sdg_hub/utils/datamixing.py
 src/sdg_hub/utils/datautils.py
 src/sdg_hub/utils/docprocessor.py
-src/sdg_hub/utils/json.py
-src/sdg_hub/utils/models.py
 src/sdg_hub/utils/parse_and_convert.py
-src/sdg_hub/utils/taxonomy.py
 tests/__init__.py
 tests/test_chunking.py
 tests/test_filterblock.py
+tests/test_flow.py
+tests/testdata/test_config_1.yaml
+tests/testdata/test_flow_1.yaml
+tests/testdata/test_flow_2.yaml
 tests/testdata/testdata.py

sdg_hub-0.1.0a3/tests/test_flow.py ADDED Viewed

@@ -0,0 +1,74 @@
+# Standard
+from unittest.mock import MagicMock, patch
+import os
+import unittest
+# Third Party
+import yaml
+# First Party
+from sdg_hub.flow import Flow
+class TestFlow(unittest.TestCase):
+    def setUp(self):
+        self.flow = Flow(MagicMock())
+    def test_config_relative_to_flow(self):
+        flow = self.flow.get_flow_from_file("tests/testdata/test_flow_1.yaml")
+        block = flow[0]["block_type"](**flow[0]["block_config"])
+        self.assertEqual(block.block_config["introduction"], "intro")
+    def test_config_relative_to_package(self):
+        with open(
+            "tests/testdata/test_flow_1.yaml", "r", encoding="utf-8"
+        ) as yaml_file:
+            y = yaml.safe_load(yaml_file)
+        y[0]["block_config"]["config_path"] = (
+            "configs/skills/simple_generate_qa_freeform.yaml"
+        )
+        with patch("yaml.safe_load", new_callable=MagicMock) as mock_safe_load:
+            mock_safe_load.return_value = y
+            flow = self.flow.get_flow_from_file("tests/testdata/test_flow_1.yaml")
+        block = flow[0]["block_type"](**flow[0]["block_config"])
+        self.assertEqual(
+            block.block_config["introduction"],
+            "Develop a series of question and answer pairs to perform a task.",
+        )
+    def test_config_absolute(self):
+        with open(
+            "tests/testdata/test_flow_1.yaml", "r", encoding="utf-8"
+        ) as yaml_file:
+            y = yaml.safe_load(yaml_file)
+        y[0]["block_config"]["config_path"] = os.path.abspath(
+            "src/sdg_hub/configs/skills/simple_generate_qa_freeform.yaml"
+        )
+        with patch("yaml.safe_load", new_callable=MagicMock) as mock_safe_load:
+            mock_safe_load.return_value = y
+            flow = self.flow.get_flow_from_file("tests/testdata/test_flow_1.yaml")
+        block = flow[0]["block_type"](**flow[0]["block_config"])
+        self.assertEqual(
+            block.block_config["introduction"],
+            "Develop a series of question and answer pairs to perform a task.",
+        )
+    def test_config_list_mix(self):
+        with open(
+            "tests/testdata/test_flow_2.yaml", "r", encoding="utf-8"
+        ) as yaml_file:
+            y = yaml.safe_load(yaml_file)
+        y[0]["block_config"]["config_paths"]["k3"] = os.path.abspath(
+            "src/sdg_hub/configs/skills/simple_generate_qa_freeform.yaml"
+        )
+        with patch("yaml.safe_load", new_callable=MagicMock) as mock_safe_load:
+            mock_safe_load.return_value = y
+            flow = self.flow.get_flow_from_file("tests/testdata/test_flow_2.yaml")
+        block = flow[0]["block_type"](**flow[0]["block_config"])
+        self.assertEqual(block.block_config["introduction"], "intro")
+        self.assertEqual(len(block.prompt_template), 3)

sdg_hub-0.1.0a3/tests/testdata/test_config_1.yaml ADDED Viewed

@@ -0,0 +1,7 @@
+system: system
+introduction: intro
+principles: principles
+examples: The task is {{task_description}}.
+generation: Provide a single question and answer pair based on the examples.
+start_tags: [""]
+end_tags: [""]

sdg_hub-0.1.0a3/tests/testdata/test_flow_1.yaml ADDED Viewed

@@ -0,0 +1,7 @@
+- block_type: LLMBlock
+  block_config:
+    block_name: gen_skill_freeform
+    config_path: ./test_config_1.yaml
+    model_id: blank/model
+    output_cols:
+      - output

sdg_hub-0.1.0a3/tests/testdata/test_flow_2.yaml ADDED Viewed

@@ -0,0 +1,10 @@
+- block_type: ConditionalLLMBlock
+  block_config:
+    block_name: gen_skill_freeform
+    config_paths:
+      k1: ./test_config_1.yaml
+      k2: configs/skills/simple_generate_qa_freeform.yaml
+    model_id: blank/model
+    output_cols:
+      - output
+    selector_column_name: route

sdg_hub-0.1.0a2/scripts/test_freeform_skills.py DELETED Viewed

@@ -1,61 +0,0 @@
-# Third Party
-from datasets import Dataset
-from openai import OpenAI
-# First Party
-from sdg_hub.sdg import SDG
-from sdg_hub.flow import Flow
-from sdg_hub.pipeline import Pipeline
-# for vLLM endpoints, the api_key remains "EMPTY"
-openai_api_key = "EMPTY"
-openai_api_base = "Add model endpoint here"
-client = OpenAI(
-    api_key=openai_api_key,
-    base_url=openai_api_base,
-)
-models = client.models.list()
-teacher_model = models.data[0].id
-samples = [
-    {
-        "seed_question": """Could you help me write a formal email to inquire about the progress of my internship application?""",
-        "task_description": "Writing formal emails",
-        "seed_response": """Subject: Inquiry Regarding the Status of My Internship Application
-Dear [Recipient's Name],
-I hope this email finds you well. I am writing to inquire about the current status of my internship application with [Company Name]. I submitted my application on [date of application] for the [Internship Title] position.
-I am very interested in the opportunity to learn and grow as an intern at [Company Name], and I am eager to contribute my skills and enthusiasm to your team. I understand that the internship selection process may take some time, and I appreciate your consideration of my application.
-If there are any additional steps I need to take or further information you require from me, please let me know. I am more than happy to provide any necessary documentation or complete additional tasks to facilitate the decision-making process.
-I am excited about the prospect of joining [Company Name] and contributing to the [specific project, team, or aspect of the company] based on my background in [mention relevant skills or experiences]. I am confident that this internship will provide me with valuable experience and growth opportunities.
-Thank you for your time and consideration. I look forward to hearing from you regarding the next steps in the internship application process.
-Sincerely,
-[Your Full Name]
-[Your Contact Information]""",
-    }
-]
-ds = Dataset.from_list(samples)
-skills_flow = Flow(client, 1).get_flow_from_file(
-    DEFAULT_FLOW_FILE_MAP["SynthSkillsFlow"]
-)
-skills_pipe = Pipeline(skills_flow)
-sdg = SDG([skills_pipe])
-gen_data = sdg.generate(ds)
-print(gen_data)
-print(gen_data[0])

sdg_hub-0.1.0a2/scripts/test_grounded_skills.py DELETED Viewed

@@ -1,109 +0,0 @@
-# Third Party
-from datasets import Dataset
-from openai import OpenAI
-# First Party
-from sdg_hub.sdg import SDG
-from sdg_hub.flow import Flow
-from sdg_hub.pipeline import Pipeline
-# for vLLM endpoints, the api_key remains "EMPTY"
-openai_api_key = "EMPTY"
-openai_api_base = "Add model endpoint here"
-client = OpenAI(
-    api_key=openai_api_key,
-    base_url=openai_api_base,
-)
-models = client.models.list()
-teacher_model = models.data[0].id
-samples = [
-    {
-        "seed_context": """*Ms. Thompson:* Good morning, everyone. Today, we''re here to discuss
-    our customer journey mapping and analysis. I believe this is crucial to understanding
-    our customers'' experiences and improving our services.
-    *Mr. Patel:* I agree, Lisa. We should start by identifying all touchpoints in
-    our customer journey, from initial contact to post-sale support.
-    *Ms. Rodriguez:* Yes, and let''s not forget about the emotional aspect of the
-    journey. How do our customers feel at each stage? What are their pain points?
-    *Mr. Kim:* We can use data from our CRM system to track the customer journey and
-    gather insights. This will help us create a detailed, data-driven map.
-    *Ms. Johnson:* Once we have the map, we can analyze it to identify areas for improvement.
-    Perhaps there are steps where customers drop off or express dissatisfaction.
-    *Mr. Davis:* We should also consider the customer''s perspective. Conducting interviews
-    or surveys can provide valuable insights into their thoughts and feelings.
-    *Ms. Brown:* Absolutely. And once we''ve identified areas for improvement, we
-    can develop strategies to address them. This might involve redesigning certain
-    touchpoints, enhancing our communication, or streamlining processes.
-    *Mr. Smith:* And we must remember to measure the impact of any changes we make.
-    By tracking key performance indicators, we can determine whether our efforts are
-    successful.
-    *Ms. Thompson:* Great suggestions, everyone. Let''s divide into teams to tackle
-    different aspects of the customer journey. Team 1 will focus on pre-sale touchpoints,
-    Team 2 on sales, and Team 3 on post-sale support.
-    *Mr. Patel:* Sounds good. We''ll reconvene in a week to share our findings and
-    discuss next steps.""",
-        "seed_question": """Generate a company wide email based on the given meeting transcript""",
-        "task_description": "Writing emails based on minutes of meeting",
-        "seed_response": """Subject: Recap and Next Steps - Customer Journey Mapping and Analysis\n\
-    \nDear [Company Name] Team,\n\nI hope this email finds you well. Yesterday, we\
-    \ gathered to discuss our customer journey mapping and analysis, aiming to understand\
-    \ our customers' experiences and identify opportunities for improvement. The discussions\
-    \ were fruitful, and I want to share a brief overview of the key points and outcomes.\n\
-    \n1. **Identifying Touchpoints:**\n   Mr. Patel suggested mapping all touchpoints\
-    \ in our customer journey, from initial contact to post-sale support.\n\n2. **Emotional\
-    \ Aspect and Pain Points:**\n   Ms. Rodriguez emphasized the importance of considering\
-    \ the emotional aspect of the journey and identifying customers' pain points at\
-    \ each stage.\n\n3. **Data-Driven Mapping:**\n   Mr. Kim proposed using data from\
-    \ our CRM system to create a detailed, data-driven customer journey map.\n\n4.\
-    \ **Customer Perspective:**\n   Ms. Johnson recommended gathering insights from\
-    \ the customer's perspective through interviews or surveys.\n\n5. **Analysis and\
-    \ Improvement:**\n   Ms. Brown suggested analyzing the customer journey map to\
-    \ identify areas for improvement and developing strategies to address them.\n\n\
-    6. **Measuring Impact:**\n   Mr. Smith stressed the need to measure the impact\
-    \ of any changes made by tracking key performance indicators.\n\nTo facilitate\
-    \ a comprehensive analysis, we have divided into teams to tackle different aspects\
-    \ of the customer journey:\n\n* Team 1: Pre-sale touchpoints\n* Team 2: Sales\n\
-    * Team 3: Post-sale support\n\nEach team will share their findings and discuss\
-    \ next steps in a week.\n\nYour engagement and insights have been invaluable in\
-    \ understanding our customers' experiences and identifying opportunities for improvement.\
-    \ I look forward to our continued collaboration as we work towards enhancing our\
-    \ services and delivering exceptional customer experiences.\n\nBest regards,\n\
-    \n[Your Full Name]\n[Your Position]\n[Company Name]""",
-    }
-]
-ds = Dataset.from_list(samples)
-skills_flow = Flow(client, 10).get_flow_from_file(
-    DEFAULT_FLOW_FILE_MAP["SynthGroundedSkillsFlow"]
-)
-skills_pipe = Pipeline(skills_flow)
-sdg = SDG([skills_pipe])
-gen_data = sdg.generate(ds)
-print(gen_data)
-print(gen_data[0])

sdg_hub-0.1.0a2/scripts/test_knowledge.py DELETED Viewed

@@ -1,52 +0,0 @@
-# Standard
-import operator
-# Third Party
-from datasets import Dataset
-from openai import OpenAI
-# First Party
-from sdg_hub.sdg import SDG
-from sdg_hub.flow import Flow
-from sdg_hub.pipeline import Pipeline
-# Please don't add you vLLM endpoint key here
-openai_api_key = "EMPTY"
-openai_api_base = "Add model endpoint here"
-client = OpenAI(
-    api_key=openai_api_key,
-    base_url=openai_api_base,
-)
-models = client.models.list()
-teacher_model = models.data[0].id
-samples = [
-    {
-        "icl_query_1": "what is the location of the tubal tonsils?",
-        "icl_response_1": "The location of the tubal tonsils is the roof of the pharynx.",
-        "icl_query_2": "How long does the adenoid grow?",
-        "task_description": "Teaching about human anatomy, specifically tonsils",
-        "icl_response_2": "The adenoid grows until the age of 5, starts to shrink at the age of 7 and becomes small in adulthood.",
-        "icl_query_3": "What is the immune systems first line of defense against ingested or inhaled foreign pathogens?",
-        "icl_response_3": "The tonsils are the immune systems first line of defense.",
-        "document": "The **tonsils** are a set of lymphoid organs facing into the aerodigestive tract, which is known as Waldeyer's tonsillar ring and consists of the adenoid tonsil or pharyngeal tonsil, two tubal tonsils, two palatine tonsils, and the lingual tonsils. These organs play an important role in the immune system. When used unqualified, the term most commonly refers specifically to the palatine tonsils, which are two lymphoid organs situated at either side of the back of the human throat. The palatine tonsils and the adenoid tonsil are organs consisting of lymphoepithelial tissue located near the oropharynx and nasopharynx parts of the throat",
-        "domain": "textbook",
-    }
-]
-ds = Dataset.from_list(samples)
-mmlu_flow = Flow(client, 1).get_flow_from_file(DEFAULT_FLOW_FILE_MAP["MMLUBenchFlow"])
-knowledge_flow = Flow(client, 1).get_flow_from_file(
-    DEFAULT_FLOW_FILE_MAP["SynthKnowledgeFlow"]
-)
-knowledge_pipe = Pipeline(knowledge_flow)
-mmlu_pipe = Pipeline(mmlu_flow)
-sdg = SDG([mmlu_pipe, knowledge_pipe])
-mmlubench_data = sdg.generate(ds)
-print(mmlubench_data)
-print(mmlubench_data[0])

sdg-hub 0.1.0a2__tar.gz → 0.1.0a3__tar.gz

sdg-hub 0.1.0a2__tar.gz → 0.1.0a3__tar.gz