PyPI - edsl - Versions diffs - 0.1.38__py3-none-any.whl → 0.1.38.dev1__py3-none-any.whl - Mend

edsl 0.1.38__py3-none-any.whl → 0.1.38.dev1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (86) hide show

edsl/Base.py +34 -63
edsl/BaseDiff.py +7 -7
edsl/__init__.py +1 -2
edsl/__version__.py +1 -1
edsl/agents/Agent.py +11 -23
edsl/agents/AgentList.py +23 -86
edsl/agents/Invigilator.py +7 -18
edsl/agents/InvigilatorBase.py +19 -0
edsl/agents/PromptConstructor.py +4 -5
edsl/auto/SurveyCreatorPipeline.py +1 -1
edsl/auto/utilities.py +1 -1
edsl/base/Base.py +13 -3
edsl/config.py +0 -8
edsl/conjure/AgentConstructionMixin.py +160 -0
edsl/conjure/Conjure.py +62 -0
edsl/conjure/InputData.py +659 -0
edsl/conjure/InputDataCSV.py +48 -0
edsl/conjure/InputDataMixinQuestionStats.py +182 -0
edsl/conjure/InputDataPyRead.py +91 -0
edsl/conjure/InputDataSPSS.py +8 -0
edsl/conjure/InputDataStata.py +8 -0
edsl/conjure/QuestionOptionMixin.py +76 -0
edsl/conjure/QuestionTypeMixin.py +23 -0
edsl/conjure/RawQuestion.py +65 -0
edsl/conjure/SurveyResponses.py +7 -0
edsl/conjure/__init__.py +9 -0
edsl/conjure/examples/placeholder.txt +0 -0
edsl/{utilities → conjure}/naming_utilities.py +1 -1
edsl/conjure/utilities.py +201 -0
edsl/coop/coop.py +7 -77
edsl/data/Cache.py +17 -45
edsl/data/CacheEntry.py +3 -8
edsl/data/RemoteCacheSync.py +19 -0
edsl/enums.py +0 -2
edsl/exceptions/agents.py +0 -4
edsl/inference_services/GoogleService.py +15 -7
edsl/inference_services/registry.py +0 -2
edsl/jobs/Jobs.py +559 -110
edsl/jobs/buckets/TokenBucket.py +0 -3
edsl/jobs/interviews/Interview.py +7 -7
edsl/jobs/runners/JobsRunnerAsyncio.py +28 -156
edsl/jobs/runners/JobsRunnerStatus.py +196 -194
edsl/jobs/tasks/TaskHistory.py +19 -27
edsl/language_models/LanguageModel.py +90 -52
edsl/language_models/ModelList.py +14 -67
edsl/language_models/registry.py +4 -57
edsl/notebooks/Notebook.py +8 -7
edsl/prompts/Prompt.py +3 -8
edsl/questions/QuestionBase.py +30 -38
edsl/questions/QuestionBaseGenMixin.py +1 -1
edsl/questions/QuestionBasePromptsMixin.py +17 -0
edsl/questions/QuestionExtract.py +4 -3
edsl/questions/QuestionFunctional.py +3 -10
edsl/questions/derived/QuestionTopK.py +0 -2
edsl/questions/question_registry.py +6 -36
edsl/results/Dataset.py +15 -146
edsl/results/DatasetExportMixin.py +217 -231
edsl/results/DatasetTree.py +4 -134
edsl/results/Result.py +16 -31
edsl/results/Results.py +65 -159
edsl/scenarios/FileStore.py +13 -187
edsl/scenarios/Scenario.py +18 -73
edsl/scenarios/ScenarioList.py +76 -251
edsl/surveys/MemoryPlan.py +1 -1
edsl/surveys/Rule.py +5 -1
edsl/surveys/RuleCollection.py +1 -1
edsl/surveys/Survey.py +19 -25
edsl/surveys/SurveyFlowVisualizationMixin.py +9 -67
edsl/surveys/instructions/ChangeInstruction.py +7 -9
edsl/surveys/instructions/Instruction.py +7 -21
edsl/templates/error_reporting/interview_details.html +3 -3
edsl/templates/error_reporting/interviews.html +9 -18
edsl/utilities/utilities.py +0 -15
{edsl-0.1.38.dist-info → edsl-0.1.38.dev1.dist-info}/METADATA +1 -2
{edsl-0.1.38.dist-info → edsl-0.1.38.dev1.dist-info}/RECORD +77 -71
edsl/exceptions/cache.py +0 -5
edsl/inference_services/PerplexityService.py +0 -163
edsl/jobs/JobsChecks.py +0 -147
edsl/jobs/JobsPrompts.py +0 -268
edsl/jobs/JobsRemoteInferenceHandler.py +0 -239
edsl/results/CSSParameterizer.py +0 -108
edsl/results/TableDisplay.py +0 -198
edsl/results/table_display.css +0 -78
edsl/scenarios/ScenarioJoin.py +0 -127
{edsl-0.1.38.dist-info → edsl-0.1.38.dev1.dist-info}/LICENSE +0 -0
{edsl-0.1.38.dist-info → edsl-0.1.38.dev1.dist-info}/WHEEL +0 -0

edsl/scenarios/FileStore.py CHANGED Viewed

@@ -14,87 +14,18 @@ from edsl.utilities.decorators import add_edsl_version, remove_edsl_version
 from edsl.utilities.utilities import is_notebook
-def view_csv(csv_path):
-    import pandas as pd
-    df = pd.read_csv(csv_path)
-    return df
-def view_html(html_path):
-    import os
-    import subprocess
-    from IPython.display import IFrame, display, HTML
-    if os.path.exists(html_path):
-        if is_notebook():
-            # Display the HTML inline in Jupyter Notebook
-            display(IFrame(src=html_path, width=700, height=600))
-            display(
-                HTML(
-                    f'<a href="{html_path}" target="_blank">Open HTML in a new tab</a>'
-                )
-            )
-        else:
-            try:
-                if (os_name := os.name) == "posix":
-                    # Open with the default browser on macOS
-                    subprocess.run(["open", html_path], check=True)
-                elif os_name == "nt":
-                    # Open with the default browser on Windows
-                    os.startfile(html_path)
-                else:
-                    # Open with the default browser on Linux
-                    subprocess.run(["xdg-open", html_path], check=True)
-            except Exception as e:
-                print(f"Error opening HTML file: {e}")
-    else:
-        print("HTML file was not found.")
-def view_html(html_path):
-    import os
-    from IPython.display import display, HTML
-    if is_notebook():
-        with open(html_path, "r") as f:
-            html_content = f.read()
-        display(HTML(html_content))
-    else:
-        if os.path.exists(html_path):
-            try:
-                if (os_name := os.name) == "posix":
-                    subprocess.run(["open", html_path], check=True)
-                elif os_name == "nt":
-                    os.startfile(html_path)
-                else:
-                    subprocess.run(["xdg-open", html_path], check=True)
-            except Exception as e:
-                print(f"Error opening file: {e}")
-        else:
-            print("File was not created successfully.")
 def view_pdf(pdf_path):
     import os
     import subprocess
-    import os
-    from IPython.display import HTML, display
     if is_notebook():
-        # Convert to absolute path if needed
-        with open(pdf_path, "rb") as f:
-            base64_pdf = base64.b64encode(f.read()).decode("utf-8")
-        html = f"""
-        <iframe
-            src="data:application/pdf;base64,{base64_pdf}"
-            width="800px"
-            height="800px"
-            type="application/pdf"
-        ></iframe>
-        """
-        display(HTML(html))
+        from IPython.display import IFrame
+        from IPython.display import display, HTML
+        # Replace 'path/to/your/file.pdf' with the actual path to your PDF file
+        IFrame(pdf_path, width=700, height=600)
+        display(HTML(f'<a href="{pdf_path}" target="_blank">Open PDF</a>'))
+        return
     if os.path.exists(pdf_path):
         try:
@@ -112,8 +43,6 @@ def view_pdf(pdf_path):
 class FileStore(Scenario):
-    __documentation__ = "https://docs.expectedparrot.com/en/latest/filestore.html"
     def __init__(
         self,
         path: Optional[str] = None,
@@ -126,10 +55,7 @@ class FileStore(Scenario):
     ):
         if path is None and "filename" in kwargs:
             path = kwargs["filename"]
-        self._path = path  # Store the original path privately
-        self._temp_path = None  # Track any generated temporary file
+        self.path = path
         self.suffix = suffix or path.split(".")[-1]
         self.binary = binary or False
         self.mime_type = (
@@ -139,7 +65,7 @@ class FileStore(Scenario):
         self.external_locations = external_locations or {}
         super().__init__(
             {
-                "path": path,
+                "path": self.path,
                 "base64_string": self.base64_string,
                 "binary": self.binary,
                 "suffix": self.suffix,
@@ -148,110 +74,17 @@ class FileStore(Scenario):
             }
         )
-    @property
-    def path(self) -> str:
-        """
-        Property that returns a valid path to the file content.
-        If the original path doesn't exist, generates a temporary file from the base64 content.
-        """
-        # Check if original path exists and is accessible
-        if self._path and os.path.isfile(self._path):
-            return self._path
-        # If we already have a valid temporary file, use it
-        if self._temp_path and os.path.isfile(self._temp_path):
-            return self._temp_path
-        # Generate a new temporary file from base64 content
-        self._temp_path = self.to_tempfile(self.suffix)
-        return self._temp_path
     def __str__(self):
         return "FileStore: self.path"
     @classmethod
-    def example(cls, example_type="text"):
-        import textwrap
+    def example(self):
         import tempfile
-        if example_type == "png" or example_type == "image":
-            import importlib.resources
-            from pathlib import Path
-            # Get package root directory
-            package_root = Path(__file__).parent.parent.parent
-            logo_path = package_root / "static" / "logo.png"
-            return cls(str(logo_path))
-        if example_type == "text":
-            with tempfile.NamedTemporaryFile(suffix=".txt", delete=False) as f:
-                f.write(b"Hello, World!")
-            return cls(path=f.name)
+        with tempfile.NamedTemporaryFile(suffix=".txt", delete=False) as f:
+            f.write(b"Hello, World!")
-        elif example_type == "csv":
-            from edsl.results.Results import Results
-            r = Results.example()
-            with tempfile.NamedTemporaryFile(suffix=".csv", delete=False) as f:
-                r.to_csv(filename=f.name)
-            return cls(f.name)
-        elif example_type == "pdf":
-            pdf_string = textwrap.dedent(
-                """\
-            %PDF-1.4
-            1 0 obj
-            << /Type /Catalog /Pages 2 0 R >>
-            endobj
-            2 0 obj
-            << /Type /Pages /Kids [3 0 R] /Count 1 >>
-            endobj
-            3 0 obj
-            << /Type /Page /Parent 2 0 R /MediaBox [0 0 612 792] /Contents 4 0 R >>
-            endobj
-            4 0 obj
-            << /Length 44 >>
-            stream
-            BT
-            /F1 24 Tf
-            100 700 Td
-            (Hello, World!) Tj
-            ET
-            endstream
-            endobj
-            5 0 obj
-            << /Type /Font /Subtype /Type1 /BaseFont /Helvetica >>
-            endobj
-            6 0 obj
-            << /ProcSet [/PDF /Text] /Font << /F1 5 0 R >> >>
-            endobj
-            xref
-            0 7
-            0000000000 65535 f
-            0000000010 00000 n
-            0000000053 00000 n
-            0000000100 00000 n
-            0000000173 00000 n
-            0000000232 00000 n
-            0000000272 00000 n
-            trailer
-            << /Size 7 /Root 1 0 R >>
-            startxref
-            318
-            %%EOF"""
-            )
-            with tempfile.NamedTemporaryFile(suffix=".pdf", delete=False) as f:
-                f.write(pdf_string.encode())
-            return cls(f.name)
-        elif example_type == "html":
-            with tempfile.NamedTemporaryFile(suffix=".html", delete=False) as f:
-                f.write("<html><body><h1>Test</h1></body></html>".encode())
-            return cls(f.name)
+        return self(path=f.name)
     @property
     def size(self) -> int:
@@ -353,16 +186,9 @@ class FileStore(Scenario):
         return temp_file.name
     def view(self, max_size: int = 300) -> None:
-        # with self.open() as f:
-        if self.suffix == "csv":
-            return view_csv(self.path)
         if self.suffix == "pdf":
             view_pdf(self.path)
-        if self.suffix == "html":
-            view_html(self.path)
         if self.suffix == "png" or self.suffix == "jpg" or self.suffix == "jpeg":
             if is_notebook():
                 from IPython.display import Image

edsl/scenarios/Scenario.py CHANGED Viewed

@@ -4,7 +4,6 @@ from __future__ import annotations
 import copy
 import hashlib
 import os
-import json
 from collections import UserDict
 from typing import Union, List, Optional, Generator
 from uuid import uuid4
@@ -15,30 +14,12 @@ from edsl.utilities.decorators import add_edsl_version, remove_edsl_version
 from edsl.exceptions.scenarios import ScenarioError
-class DisplayJSON:
-    def __init__(self, dict):
-        self.text = json.dumps(dict, indent=4)
-    def __repr__(self):
-        return self.text
-class DisplayYAML:
-    def __init__(self, dict):
-        import yaml
-        self.text = yaml.dump(dict)
-    def __repr__(self):
-        return self.text
 class Scenario(Base, UserDict, ScenarioHtmlMixin):
     """A Scenario is a dictionary of keys/values.
     They can be used parameterize EDSL questions."""
-    __documentation__ = "https://docs.expectedparrot.com/en/latest/scenarios.html"
+    __doc__ = "https://docs.expectedparrot.com/en/latest/scenarios.html"
     def __init__(self, data: Union[dict, None] = None, name: str = None):
         """Initialize a new Scenario.
@@ -156,23 +137,7 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
                 new_scenario[key] = value
         return new_scenario
-    def table(self, tablefmt: str = "grid") -> str:
-        from edsl.results.Dataset import Dataset
-        keys = [key for key, value in self.items()]
-        values = [value for key, value in self.items()]
-        d = Dataset([{"key": keys}, {"value": values}])
-        return d.table(tablefmt=tablefmt)
-    def json(self):
-        return DisplayJSON(self.to_dict(add_edsl_version=False))
-    def yaml(self):
-        import yaml
-        return DisplayYAML(self.to_dict(add_edsl_version=False))
-    def to_dict(self, add_edsl_version=True) -> dict:
+    def _to_dict(self) -> dict:
         """Convert a scenario to a dictionary.
         Example:
@@ -180,24 +145,26 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
         >>> s = Scenario({"food": "wood chips"})
         >>> s.to_dict()
         {'food': 'wood chips', 'edsl_version': '...', 'edsl_class_name': 'Scenario'}
-        >>> s.to_dict(add_edsl_version = False)
-        {'food': 'wood chips'}
         """
         from edsl.scenarios.FileStore import FileStore
         d = self.data.copy()
         for key, value in d.items():
             if isinstance(value, FileStore):
-                d[key] = value.to_dict(add_edsl_version=add_edsl_version)
-        if add_edsl_version:
-            from edsl import __version__
+                d[key] = value.to_dict()
+        return d
-            d["edsl_version"] = __version__
-            d["edsl_class_name"] = "Scenario"
+    @add_edsl_version
+    def to_dict(self) -> dict:
+        """Convert a scenario to a dictionary.
-        return d
+        Example:
+        >>> s = Scenario({"food": "wood chips"})
+        >>> s.to_dict()
+        {'food': 'wood chips', 'edsl_version': '...', 'edsl_class_name': 'Scenario'}
+        """
+        return self._to_dict()
     def __hash__(self) -> int:
         """
@@ -211,7 +178,7 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
         """
         from edsl.utilities.utilities import dict_hash
-        return dict_hash(self.to_dict(add_edsl_version=False))
+        return dict_hash(self._to_dict())
     def print(self):
         from rich import print_json
@@ -220,35 +187,13 @@ class Scenario(Base, UserDict, ScenarioHtmlMixin):
         print_json(json.dumps(self.to_dict()))
     def __repr__(self):
+        # return "Scenario(" + reprlib.repr(self.data) + ")"
         return "Scenario(" + repr(self.data) + ")"
-    def to_dataset(self) -> "Dataset":
-        # d = Dataset([{'a.b':[1,2,3,4]}])
-        from edsl.results.Dataset import Dataset
-        keys = [key for key, value in self.items()]
-        values = [value for key, value in self.items()]
-        return Dataset([{"key": keys}, {"value": values}])
     def _repr_html_(self):
-        from tabulate import tabulate
-        import reprlib
-        d = self.to_dict(add_edsl_version=False)
-        # return self.to_dataset()
-        r = reprlib.Repr()
-        r.maxstring = 70
-        data = [[k, r.repr(v)] for k, v in d.items()]
-        from tabulate import tabulate
-        if hasattr(self, "__documentation__"):
-            footer = f"<a href='{self.__documentation__}'>(docs)</a></p>"
-        else:
-            footer = ""
+        from edsl.utilities.utilities import data_to_html
-        table = str(tabulate(data, headers=["keys", "values"], tablefmt="html"))
-        return f"<pre>{table}</pre>" + footer
+        return data_to_html(self.to_dict())
     def select(self, list_of_keys: List[str]) -> "Scenario":
         """Select a subset of keys from a scenario.

edsl 0.1.38__py3-none-any.whl → 0.1.38.dev1__py3-none-any.whl

edsl 0.1.38__py3-none-any.whl → 0.1.38.dev1__py3-none-any.whl