PyPI - edsl - Versions diffs - 0.1.37.dev5__py3-none-any.whl → 0.1.38__py3-none-any.whl - Mend

edsl 0.1.37.dev5__py3-none-any.whl → 0.1.38__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (86) hide show

edsl/Base.py +63 -34
edsl/BaseDiff.py +7 -7
edsl/__init__.py +2 -1
edsl/__version__.py +1 -1
edsl/agents/Agent.py +23 -11
edsl/agents/AgentList.py +86 -23
edsl/agents/Invigilator.py +18 -7
edsl/agents/InvigilatorBase.py +0 -19
edsl/agents/PromptConstructor.py +5 -4
edsl/auto/SurveyCreatorPipeline.py +1 -1
edsl/auto/utilities.py +1 -1
edsl/base/Base.py +3 -13
edsl/config.py +8 -0
edsl/coop/coop.py +89 -19
edsl/data/Cache.py +45 -17
edsl/data/CacheEntry.py +8 -3
edsl/data/RemoteCacheSync.py +0 -19
edsl/enums.py +2 -0
edsl/exceptions/agents.py +4 -0
edsl/exceptions/cache.py +5 -0
edsl/inference_services/GoogleService.py +7 -15
edsl/inference_services/PerplexityService.py +163 -0
edsl/inference_services/registry.py +2 -0
edsl/jobs/Jobs.py +110 -559
edsl/jobs/JobsChecks.py +147 -0
edsl/jobs/JobsPrompts.py +268 -0
edsl/jobs/JobsRemoteInferenceHandler.py +239 -0
edsl/jobs/buckets/TokenBucket.py +3 -0
edsl/jobs/interviews/Interview.py +7 -7
edsl/jobs/runners/JobsRunnerAsyncio.py +156 -28
edsl/jobs/runners/JobsRunnerStatus.py +194 -196
edsl/jobs/tasks/TaskHistory.py +27 -19
edsl/language_models/LanguageModel.py +52 -90
edsl/language_models/ModelList.py +67 -14
edsl/language_models/registry.py +57 -4
edsl/notebooks/Notebook.py +7 -8
edsl/prompts/Prompt.py +8 -3
edsl/questions/QuestionBase.py +38 -30
edsl/questions/QuestionBaseGenMixin.py +1 -1
edsl/questions/QuestionBasePromptsMixin.py +0 -17
edsl/questions/QuestionExtract.py +3 -4
edsl/questions/QuestionFunctional.py +10 -3
edsl/questions/derived/QuestionTopK.py +2 -0
edsl/questions/question_registry.py +36 -6
edsl/results/CSSParameterizer.py +108 -0
edsl/results/Dataset.py +146 -15
edsl/results/DatasetExportMixin.py +231 -217
edsl/results/DatasetTree.py +134 -4
edsl/results/Result.py +31 -16
edsl/results/Results.py +159 -65
edsl/results/TableDisplay.py +198 -0
edsl/results/table_display.css +78 -0
edsl/scenarios/FileStore.py +187 -13
edsl/scenarios/Scenario.py +73 -18
edsl/scenarios/ScenarioJoin.py +127 -0
edsl/scenarios/ScenarioList.py +251 -76
edsl/surveys/MemoryPlan.py +1 -1
edsl/surveys/Rule.py +1 -5
edsl/surveys/RuleCollection.py +1 -1
edsl/surveys/Survey.py +25 -19
edsl/surveys/SurveyFlowVisualizationMixin.py +67 -9
edsl/surveys/instructions/ChangeInstruction.py +9 -7
edsl/surveys/instructions/Instruction.py +21 -7
edsl/templates/error_reporting/interview_details.html +3 -3
edsl/templates/error_reporting/interviews.html +18 -9
edsl/{conjure → utilities}/naming_utilities.py +1 -1
edsl/utilities/utilities.py +15 -0
{edsl-0.1.37.dev5.dist-info → edsl-0.1.38.dist-info}/METADATA +2 -1
{edsl-0.1.37.dev5.dist-info → edsl-0.1.38.dist-info}/RECORD +71 -77
edsl/conjure/AgentConstructionMixin.py +0 -160
edsl/conjure/Conjure.py +0 -62
edsl/conjure/InputData.py +0 -659
edsl/conjure/InputDataCSV.py +0 -48
edsl/conjure/InputDataMixinQuestionStats.py +0 -182
edsl/conjure/InputDataPyRead.py +0 -91
edsl/conjure/InputDataSPSS.py +0 -8
edsl/conjure/InputDataStata.py +0 -8
edsl/conjure/QuestionOptionMixin.py +0 -76
edsl/conjure/QuestionTypeMixin.py +0 -23
edsl/conjure/RawQuestion.py +0 -65
edsl/conjure/SurveyResponses.py +0 -7
edsl/conjure/__init__.py +0 -9
edsl/conjure/examples/placeholder.txt +0 -0
edsl/conjure/utilities.py +0 -201
{edsl-0.1.37.dev5.dist-info → edsl-0.1.38.dist-info}/LICENSE +0 -0
{edsl-0.1.37.dev5.dist-info → edsl-0.1.38.dist-info}/WHEEL +0 -0

edsl/scenarios/ScenarioJoin.py ADDED Viewed

@@ -0,0 +1,127 @@
+from __future__ import annotations
+from typing import Union, TYPE_CHECKING
+# if TYPE_CHECKING:
+from edsl.scenarios.ScenarioList import ScenarioList
+from edsl.scenarios.Scenario import Scenario
+class ScenarioJoin:
+    """Handles join operations between two ScenarioLists.
+    This class encapsulates all join-related logic, making it easier to maintain
+    and extend with other join types (inner, right, full) in the future.
+    Keys of the joined scenarios are laid out in first-seen order (left list
+    first, then right list) so the result does not depend on set iteration order.
+    """
+    def __init__(self, left: "ScenarioList", right: "ScenarioList"):
+        """Initialize join operation with two ScenarioLists.
+        Args:
+            left: The left ScenarioList
+            right: The right ScenarioList
+        """
+        self.left = left
+        self.right = right
+    def left_join(self, by: Union[str, list[str]]) -> ScenarioList:
+        """Perform a left join between the two ScenarioLists.
+        Each left scenario yields exactly one joined scenario. Keys that only exist
+        on the right are filled from the matching right scenario, or left as None
+        when nothing matches. When several right scenarios share the same join
+        values, the last one in the right list is the one used.
+        Args:
+            by: String or list of strings representing the key(s) to join on. Cannot be empty.
+        Returns:
+            A new ScenarioList containing the joined scenarios
+        Raises:
+            ValueError: If by is empty or if any join keys don't exist in both ScenarioLists
+        """
+        self._validate_join_keys(by)
+        by_keys = [by] if isinstance(by, str) else by
+        other_dict = self._create_lookup_dict(self.right, by_keys)
+        # Use an ordered key list rather than a set so column order is reproducible.
+        all_keys = self._get_ordered_keys()
+        return ScenarioList(
+            self._create_joined_scenarios(by_keys, other_dict, all_keys)
+        )
+    def _validate_join_keys(self, by: Union[str, list[str]]) -> None:
+        """Validate join keys exist in both ScenarioLists.
+        Only the first scenario of each list is inspected. An empty list
+        contributes no keys, so every join key is then reported as missing.
+        Raises:
+            ValueError: If by is empty or a join key is absent from either side.
+        """
+        if not by:
+            raise ValueError(
+                "Join keys cannot be empty. Please specify at least one key to join on."
+            )
+        by_keys = [by] if isinstance(by, str) else by
+        left_keys = set(next(iter(self.left)).keys()) if self.left else set()
+        right_keys = set(next(iter(self.right)).keys()) if self.right else set()
+        missing_left = set(by_keys) - left_keys
+        missing_right = set(by_keys) - right_keys
+        if missing_left or missing_right:
+            missing = missing_left | missing_right
+            raise ValueError(f"Join key(s) {missing} not found in both ScenarioLists")
+    @staticmethod
+    def _get_key_tuple(scenario: Scenario, keys: list[str]) -> tuple:
+        """Create a tuple of values for the join keys."""
+        return tuple(scenario[k] for k in keys)
+    def _create_lookup_dict(self, scenarios: ScenarioList, by_keys: list[str]) -> dict:
+        """Create a lookup dictionary for the right scenarios.
+        Maps each join-value tuple to a scenario; a later scenario with the same
+        tuple replaces an earlier one.
+        """
+        return {
+            self._get_key_tuple(scenario, by_keys): scenario for scenario in scenarios
+        }
+    def _get_all_keys(self) -> set:
+        """Get all unique keys from both ScenarioLists (unordered)."""
+        all_keys = set()
+        for scenario in self.left:
+            all_keys.update(scenario.keys())
+        for scenario in self.right:
+            all_keys.update(scenario.keys())
+        return all_keys
+    def _get_ordered_keys(self) -> list[str]:
+        """Get all unique keys from both ScenarioLists in first-seen order."""
+        # A dict keeps insertion order and ignores repeats, unlike a set.
+        ordered: dict = {}
+        for scenario in self.left:
+            ordered.update(dict.fromkeys(scenario.keys()))
+        for scenario in self.right:
+            ordered.update(dict.fromkeys(scenario.keys()))
+        return list(ordered)
+    def _create_joined_scenarios(
+        self, by_keys: list[str], other_dict: dict, all_keys: Union[set, list[str]]
+    ) -> list[Scenario]:
+        """Create the joined scenarios, one per left scenario."""
+        new_scenarios = []
+        for scenario in self.left:
+            # Start from an all-None row, then overlay the left values.
+            new_scenario = {key: None for key in all_keys}
+            new_scenario.update(scenario)
+            key_tuple = self._get_key_tuple(scenario, by_keys)
+            if matching_scenario := other_dict.get(key_tuple):
+                self._handle_matching_scenario(
+                    new_scenario, scenario, matching_scenario, by_keys
+                )
+            new_scenarios.append(Scenario(new_scenario))
+        return new_scenarios
+    def _handle_matching_scenario(
+        self,
+        new_scenario: dict,
+        left_scenario: Scenario,
+        right_scenario: Scenario,
+        by_keys: list[str],
+    ) -> None:
+        """Handle merging of matching scenarios and conflict warnings.
+        Mutates new_scenario in place: right-only keys are copied over, while keys
+        present on both sides keep the left value (a warning is printed when the
+        two values differ and the key is not a join key).
+        """
+        left_keys = set(left_scenario.keys())
+        right_keys = set(right_scenario.keys())
+        # Walk the left scenario's own key order so warnings come out in a stable order.
+        for key in left_scenario.keys():
+            if key not in right_keys or key in by_keys:
+                continue
+            if left_scenario[key] != right_scenario[key]:
+                join_conditions = [f"{k}='{left_scenario[k]}'" for k in by_keys]
+                print(
+                    f"Warning: Conflicting values for key '{key}' where "
+                    f"{' AND '.join(join_conditions)}. "
+                    f"Keeping left value: {left_scenario[key]} "
+                    f"(discarding: {right_scenario[key]})"
+                )
+        # Only update with non-overlapping keys from matching scenario
+        new_scenario.update(
+            {k: right_scenario[k] for k in right_scenario.keys() if k not in left_keys}
+        )

edsl/scenarios/ScenarioList.py CHANGED Viewed

@@ -20,7 +20,7 @@ from edsl.scenarios.Scenario import Scenario
 from edsl.scenarios.ScenarioListPdfMixin import ScenarioListPdfMixin
 from edsl.scenarios.ScenarioListExportMixin import ScenarioListExportMixin
-from edsl.conjure.naming_utilities import sanitize_string
+from edsl.utilities.naming_utilities import sanitize_string
 from edsl.utilities.utilities import is_valid_variable_name
@@ -31,6 +31,10 @@ class ScenarioListMixin(ScenarioListPdfMixin, ScenarioListExportMixin):
 class ScenarioList(Base, UserList, ScenarioListMixin):
     """Class for creating a list of scenarios to be used in a survey."""
+    __documentation__ = (
+        "https://docs.expectedparrot.com/en/latest/scenarios.html#scenariolist"
+    )
     def __init__(self, data: Optional[list] = None, codebook: Optional[dict] = None):
         """Initialize the ScenarioList class."""
         if data is not None:
@@ -239,7 +243,10 @@ class ScenarioList(Base, UserList, ScenarioListMixin):
         """
         from edsl.utilities.utilities import dict_hash
-        return dict_hash(self._to_dict(sort=True))
+        return dict_hash(self.to_dict(sort=True, add_edsl_version=False))
+    def __eq__(self, other: Any) -> bool:
+        """Return True when `other` hashes to the same value as this ScenarioList.
+        Unhashable operands (for example a plain list) compare unequal instead of
+        letting hash() raise TypeError out of an equality test.
+        """
+        try:
+            other_hash = hash(other)
+        except TypeError:
+            return False
+        return hash(self) == other_hash
     def __repr__(self):
         return f"ScenarioList({self.data})"
@@ -282,41 +289,49 @@ class ScenarioList(Base, UserList, ScenarioListMixin):
         random.shuffle(self.data)
         return self
-    def _repr_html_(self) -> str:
-        from edsl.utilities.utilities import data_to_html
-        data = self.to_dict()
-        _ = data.pop("edsl_version")
-        _ = data.pop("edsl_class_name")
-        for s in data["scenarios"]:
-            _ = s.pop("edsl_version")
-            _ = s.pop("edsl_class_name")
-        for scenario in data["scenarios"]:
-            for key, value in scenario.items():
-                if hasattr(value, "to_dict"):
-                    data[key] = value.to_dict()
-        return data_to_html(data)
-    def tally(self, field) -> dict:
-        """Return a tally of the values in the field.
-        Example:
-        >>> s = ScenarioList([Scenario({'a': 1, 'b': 1}), Scenario({'a': 1, 'b': 2})])
-        >>> s.tally('b')
-        {1: 1, 2: 1}
-        """
-        return dict(Counter([scenario[field] for scenario in self]))
-    def sample(self, n: int, seed="edsl") -> ScenarioList:
+    def _repr_html_(self):
+        """Return an HTML representation of the ScenarioList.
+        The output is the HTML summary followed by a link to the documentation page.
+        """
+        docs_link = f"<a href={self.__documentation__}>(docs)</a>"
+        summary_html = str(self.summary(format="html"))
+        return summary_html + docs_link
+    # def _repr_html_(self) -> str:
+    # from edsl.utilities.utilities import data_to_html
+    # data = self.to_dict()
+    # _ = data.pop("edsl_version")
+    # _ = data.pop("edsl_class_name")
+    # for s in data["scenarios"]:
+    #     _ = s.pop("edsl_version")
+    #     _ = s.pop("edsl_class_name")
+    # for scenario in data["scenarios"]:
+    #     for key, value in scenario.items():
+    #         if hasattr(value, "to_dict"):
+    #             data[key] = value.to_dict()
+    # return data_to_html(data)
+    # def tally(self, field) -> dict:
+    #     """Return a tally of the values in the field.
+    #     Example:
+    #     >>> s = ScenarioList([Scenario({'a': 1, 'b': 1}), Scenario({'a': 1, 'b': 2})])
+    #     >>> s.tally('b')
+    #     {1: 1, 2: 1}
+    #     """
+    #     return dict(Counter([scenario[field] for scenario in self]))
+    def sample(self, n: int, seed: Optional[str] = None) -> ScenarioList:
         """Return a random sample from the ScenarioList
+        Args:
+            n: Number of scenarios to draw (without replacement, via random.sample).
+            seed: When not None, passed to random.seed() before sampling, which
+                reseeds the module-level generator. Falsy seeds such as 0 or ""
+                are honoured too.
         >>> s = ScenarioList.from_list("a", [1,2,3,4,5,6])
-        >>> s.sample(3)
+        >>> s.sample(3, seed = "edsl")
         ScenarioList([Scenario({'a': 2}), Scenario({'a': 1}), Scenario({'a': 3})])
         """
-        random.seed(seed)
+        if seed is not None:
+            random.seed(seed)
         return ScenarioList(random.sample(self.data, n))
@@ -564,6 +579,47 @@ class ScenarioList(Base, UserList, ScenarioListMixin):
             func = lambda x: x
         return cls([Scenario({name: func(value)}) for value in values])
+    def table(self, *fields, tablefmt=None, pretty_labels=None) -> str:
+        """Return the ScenarioList as a table.
+        Args:
+            *fields: Passed through to the table method of the converted Dataset.
+            tablefmt: Optional format name; must be one of tabulate's
+                `tabulate_formats` when given.
+            pretty_labels: Passed through to the table method of the converted Dataset.
+        Raises:
+            ValueError: If tablefmt is given but is not a known tabulate format.
+        """
+        from tabulate import tabulate_formats
+        if tablefmt is not None and tablefmt not in tabulate_formats:
+            # Build one message string: passing two arguments to ValueError makes
+            # str(exc) render as a tuple.
+            raise ValueError(
+                f"Invalid table format: {tablefmt}. "
+                f"Valid formats are: {tabulate_formats}"
+            )
+        return self.to_dataset().table(
+            *fields, tablefmt=tablefmt, pretty_labels=pretty_labels
+        )
+    def tree(self, node_list: Optional[List[str]] = None) -> str:
+        """Return the ScenarioList as a tree.
+        Converts the list with to_dataset() and delegates to that object's tree().
+        Args:
+            node_list: Passed through unchanged to the Dataset's tree method.
+        """
+        return self.to_dataset().tree(node_list)
+    def _summary(self):
+        """Return a small dict describing this list: class name, size and scenario keys."""
+        return {
+            "EDSL Class name": "ScenarioList",
+            "# Scenarios": len(self),
+            "Scenario Keys": list(self.parameters),
+        }
+    def reorder_keys(self, new_order):
+        """Return a new ScenarioList whose scenarios list their keys in `new_order`.
+        Each scenario is rebuilt from exactly the keys named in new_order, so a key
+        missing from a scenario raises KeyError and keys not listed are left out.
+        Example:
+        >>> s = ScenarioList([Scenario({'a': 1, 'b': 2}), Scenario({'a': 3, 'b': 4})])
+        >>> s.reorder_keys(['b', 'a'])
+        ScenarioList([Scenario({'b': 2, 'a': 1}), Scenario({'b': 4, 'a': 3})])
+        """
+        return ScenarioList(
+            [Scenario({key: scenario[key] for key in new_order}) for scenario in self]
+        )
     def to_dataset(self) -> "Dataset":
         """
         >>> s = ScenarioList.from_list("a", [1,2,3])
@@ -579,16 +635,32 @@ class ScenarioList(Base, UserList, ScenarioListMixin):
         data = [{key: [scenario[key] for scenario in self.data]} for key in keys]
         return Dataset(data)
-    def split(
-        self, field: str, split_on: str, index: int, new_name: Optional[str] = None
+    def unpack(
+        self, field: str, new_names: Optional[List[str]] = None, keep_original=True
     ) -> ScenarioList:
-        """Split a scenario fiel in multiple fields."""
-        if new_name is None:
-            new_name = field + "_split_" + str(index)
+        """Unpack a field into multiple fields.
+        Args:
+            field: Name of the field whose value is unpacked.
+            new_names: Names for the new fields. When omitted, names of the form
+                "<field>_<i>" are generated from the length of the first scenario's value.
+                When exactly one name is given, the whole value is copied under it.
+            keep_original: When False, the original field is deleted from each scenario.
+        Returns:
+            A new ScenarioList; an empty ScenarioList when there is nothing to unpack.
+        Example:
+        >>> s = ScenarioList([Scenario({'a': 1, 'b': [2, True]}), Scenario({'a': 3, 'b': [3, False]})])
+        >>> s.unpack('b')
+        ScenarioList([Scenario({'a': 1, 'b': [2, True], 'b_0': 2, 'b_1': True}), Scenario({'a': 3, 'b': [3, False], 'b_0': 3, 'b_1': False})])
+        >>> s.unpack('b', new_names=['c', 'd'], keep_original=False)
+        ScenarioList([Scenario({'a': 1, 'c': 2, 'd': True}), Scenario({'a': 3, 'c': 3, 'd': False})])
+        """
+        if not new_names:
+            # Default names are inferred from the first scenario; an empty list has
+            # no first scenario, so return early instead of raising IndexError.
+            if not self.data:
+                return ScenarioList([])
+            new_names = [f"{field}_{i}" for i in range(len(self[0][field]))]
         new_scenarios = []
         for scenario in self:
             new_scenario = scenario.copy()
-            new_scenario[new_name] = scenario[field].split(split_on)[index]
+            if len(new_names) == 1:
+                new_scenario[new_names[0]] = scenario[field]
+            else:
+                for i, new_name in enumerate(new_names):
+                    new_scenario[new_name] = scenario[field][i]
+            if not keep_original:
+                del new_scenario[field]
             new_scenarios.append(new_scenario)
         return ScenarioList(new_scenarios)
@@ -901,33 +973,32 @@ class ScenarioList(Base, UserList, ScenarioListMixin):
         return cls.from_excel(temp_filename, sheet_name=sheet_name)
     @classmethod
-    def from_csv(cls, source: Union[str, urllib.parse.ParseResult]) -> ScenarioList:
-        """Create a ScenarioList from a CSV file or URL.
+    def from_delimited_file(
+        cls, source: Union[str, urllib.parse.ParseResult], delimiter: str = ","
+    ) -> ScenarioList:
+        """Create a ScenarioList from a delimited file (CSV/TSV) or URL.
         Args:
-            source: A string representing either a local file path or a URL to a CSV file,
+            source: A string representing either a local file path or a URL to a delimited file,
                     or a urllib.parse.ParseResult object for a URL.
+            delimiter: The delimiter used in the file. Defaults to ',' for CSV files.
+                    Use '\t' for TSV files.
         Returns:
-            ScenarioList: A ScenarioList object containing the data from the CSV.
+            ScenarioList: A ScenarioList object containing the data from the file.
         Example:
+            # For CSV files
-        >>> import tempfile
-        >>> import os
-        >>> with tempfile.NamedTemporaryFile(delete=False, mode='w', suffix='.csv') as f:
-        ...     _ = f.write("name,age,location\\nAlice,30,New York\\nBob,25,Los Angeles\\n")
-        ...     temp_filename = f.name
-        >>> scenario_list = ScenarioList.from_csv(temp_filename)
-        >>> len(scenario_list)
-        2
-        >>> scenario_list[0]['name']
-        'Alice'
-        >>> scenario_list[1]['age']
-        '25'
+            >>> with open('data.csv', 'w') as f:
+            ...     _ = f.write('name,age\\nAlice,30\\nBob,25\\n')
+            >>> scenario_list = ScenarioList.from_delimited_file('data.csv')
+            # For TSV files
+            >>> with open('data.tsv', 'w') as f:
+            ...     _ = f.write('name\\tage\\nAlice\t30\\nBob\t25\\n')
+            >>> scenario_list = ScenarioList.from_delimited_file('data.tsv', delimiter='\\t')
-        >>> url = "https://example.com/data.csv"
-        >>> ## scenario_list_from_url = ScenarioList.from_csv(url)
         """
         from edsl.scenarios.Scenario import Scenario
@@ -940,42 +1011,129 @@ class ScenarioList(Base, UserList, ScenarioListMixin):
         if isinstance(source, str) and is_url(source):
             with urllib.request.urlopen(source) as response:
-                csv_content = response.read().decode("utf-8")
-            csv_file = StringIO(csv_content)
+                file_content = response.read().decode("utf-8")
+            file_obj = StringIO(file_content)
         elif isinstance(source, urllib.parse.ParseResult):
             with urllib.request.urlopen(source.geturl()) as response:
-                csv_content = response.read().decode("utf-8")
-            csv_file = StringIO(csv_content)
+                file_content = response.read().decode("utf-8")
+            file_obj = StringIO(file_content)
         else:
-            csv_file = open(source, "r")
+            file_obj = open(source, "r")
         try:
-            reader = csv.reader(csv_file)
+            reader = csv.reader(file_obj, delimiter=delimiter)
             header = next(reader)
             observations = [Scenario(dict(zip(header, row))) for row in reader]
         finally:
-            csv_file.close()
+            file_obj.close()
         return cls(observations)
-    def _to_dict(self, sort=False) -> dict:
-        if sort:
-            data = sorted(self, key=lambda x: hash(x))
-        else:
-            data = self
-        return {"scenarios": [s._to_dict() for s in data]}
+    # Convenience methods for specific file types
+    @classmethod
+    def from_csv(cls, source: Union[str, urllib.parse.ParseResult]) -> ScenarioList:
+        """Create a ScenarioList from a CSV file or URL.
+        Thin wrapper that calls from_delimited_file with a comma delimiter.
+        Args:
+            source: Passed through unchanged to from_delimited_file.
+        """
+        return cls.from_delimited_file(source, delimiter=",")
-    @add_edsl_version
-    def to_dict(self) -> dict[str, Any]:
-        """Return the `ScenarioList` as a dictionary.
+    def left_join(self, other: ScenarioList, by: Union[str, list[str]]) -> ScenarioList:
+        """Perform a left join with another ScenarioList, following SQL join semantics.
-        Example:
+        Args:
+            other: The ScenarioList to join with
+            by: String or list of strings representing the key(s) to join on. Cannot be empty.
+        Returns:
+            The ScenarioList produced by ScenarioJoin(self, other).left_join(by).
+        Raises:
+            ValueError: Raised by ScenarioJoin when by is empty or a join key is
+                missing from either list.
+        >>> s1 = ScenarioList([Scenario({'name': 'Alice', 'age': 30}), Scenario({'name': 'Bob', 'age': 25})])
+        >>> s2 = ScenarioList([Scenario({'name': 'Alice', 'location': 'New York'}), Scenario({'name': 'Charlie', 'location': 'Los Angeles'})])
+        >>> s3 = s1.left_join(s2, 'name')
+        >>> s3 == ScenarioList([Scenario({'age': 30, 'location': 'New York', 'name': 'Alice'}), Scenario({'age': 25, 'location': None, 'name': 'Bob'})])
+        True
+        """
+        # Imported here rather than at module level; ScenarioJoin itself imports
+        # ScenarioList, so a top-level import would presumably be circular.
+        from edsl.scenarios.ScenarioJoin import ScenarioJoin
+        sj = ScenarioJoin(self, other)
+        return sj.left_join(by)
+        # # Validate join keys
+        # if not by:
+        #     raise ValueError(
+        #         "Join keys cannot be empty. Please specify at least one key to join on."
+        #     )
+        # # Convert single string to list for consistent handling
+        # by_keys = [by] if isinstance(by, str) else by
+        # # Verify all join keys exist in both ScenarioLists
+        # left_keys = set(next(iter(self)).keys()) if self else set()
+        # right_keys = set(next(iter(other)).keys()) if other else set()
+        # missing_left = set(by_keys) - left_keys
+        # missing_right = set(by_keys) - right_keys
+        # if missing_left or missing_right:
+        #     missing = missing_left | missing_right
+        #     raise ValueError(f"Join key(s) {missing} not found in both ScenarioLists")
+        # # Create lookup dictionary from the other ScenarioList
+        # def get_key_tuple(scenario: Scenario, keys: list[str]) -> tuple:
+        #     return tuple(scenario[k] for k in keys)
+        # other_dict = {get_key_tuple(scenario, by_keys): scenario for scenario in other}
+        # # Collect all possible keys (like SQL combining all columns)
+        # all_keys = set()
+        # for scenario in self:
+        #     all_keys.update(scenario.keys())
+        # for scenario in other:
+        #     all_keys.update(scenario.keys())
+        # new_scenarios = []
+        # for scenario in self:
+        #     new_scenario = {
+        #         key: None for key in all_keys
+        #     }  # Start with nulls (like SQL)
+        #     new_scenario.update(scenario)  # Add all left values
+        #     key_tuple = get_key_tuple(scenario, by_keys)
+        #     if matching_scenario := other_dict.get(key_tuple):
+        #         # Check for overlapping keys with different values
+        #         overlapping_keys = set(scenario.keys()) & set(matching_scenario.keys())
+        #         for key in overlapping_keys:
+        #             if key not in by_keys and scenario[key] != matching_scenario[key]:
+        #                 join_conditions = [f"{k}='{scenario[k]}'" for k in by_keys]
+        #                 print(
+        #                     f"Warning: Conflicting values for key '{key}' where {' AND '.join(join_conditions)}. "
+        #                     f"Keeping left value: {scenario[key]} (discarding: {matching_scenario[key]})"
+        #                 )
+        #         # Only update with non-overlapping keys from matching scenario
+        #         new_keys = set(matching_scenario.keys()) - set(scenario.keys())
+        #         new_scenario.update({k: matching_scenario[k] for k in new_keys})
+        #     new_scenarios.append(Scenario(new_scenario))
+        # return ScenarioList(new_scenarios)
+    @classmethod
+    def from_tsv(cls, source: Union[str, urllib.parse.ParseResult]) -> ScenarioList:
+        """Create a ScenarioList from a TSV file or URL.
+        Thin wrapper that calls from_delimited_file with a tab delimiter.
+        Args:
+            source: Passed through unchanged to from_delimited_file.
+        """
+        return cls.from_delimited_file(source, delimiter="\t")
+    def to_dict(self, sort=False, add_edsl_version=True) -> dict:
+        """Return the ScenarioList as a dictionary.
+        Args:
+            sort: When True, scenarios are emitted in order of their hash.
+            add_edsl_version: When True, add "edsl_version" and "edsl_class_name"
+                to the result; the flag is also forwarded to each scenario's to_dict.
         >>> s = ScenarioList([Scenario({'food': 'wood chips'}), Scenario({'food': 'wood-fired pizza'})])
         >>> s.to_dict()
         {'scenarios': [{'food': 'wood chips', 'edsl_version': '...', 'edsl_class_name': 'Scenario'}, {'food': 'wood-fired pizza', 'edsl_version': '...', 'edsl_class_name': 'Scenario'}], 'edsl_version': '...', 'edsl_class_name': 'ScenarioList'}
         """
-        return {"scenarios": [s.to_dict() for s in self]}
+        scenarios = sorted(self, key=hash) if sort else self
+        result = {
+            "scenarios": [
+                scenario.to_dict(add_edsl_version=add_edsl_version)
+                for scenario in scenarios
+            ]
+        }
+        if not add_edsl_version:
+            return result
+        from edsl import __version__
+        result["edsl_version"] = __version__
+        result["edsl_class_name"] = self.__class__.__name__
+        return result
     @classmethod
     def gen(cls, scenario_dicts_list: List[dict]) -> ScenarioList:
@@ -1061,7 +1219,7 @@ class ScenarioList(Base, UserList, ScenarioListMixin):
         elif isinstance(key, int):
             return super().__getitem__(key)
         else:
-            return self._to_dict()[key]
+            return self.to_dict(add_edsl_version=False)[key]
     def to_agent_list(self):
         """Convert the ScenarioList to an AgentList.
@@ -1074,8 +1232,25 @@ class ScenarioList(Base, UserList, ScenarioListMixin):
         """
         from edsl.agents.AgentList import AgentList
         from edsl.agents.Agent import Agent
+        import warnings
+        agents = []
+        for scenario in self:
+            new_scenario = scenario.copy().data
+            if "name" in new_scenario:
+                # "name" is passed to Agent as its name, so the value is also kept
+                # as a trait under a different key.
+                name = new_scenario.pop("name")
+                proposed_agent_name = "agent_name"
+                # Append underscores only while the candidate key is already taken.
+                # Looping on "not in" never terminates when the key is free.
+                while proposed_agent_name in new_scenario:
+                    proposed_agent_name += "_"
+                warnings.warn(
+                    f"The 'name' field is reserved for the agent's name---putting this value in {proposed_agent_name}"
+                )
+                new_scenario[proposed_agent_name] = name
+                agents.append(Agent(traits=new_scenario, name=name))
+            else:
+                agents.append(Agent(traits=new_scenario))
-        return AgentList([Agent(traits=s.data) for s in self])
+        return AgentList(agents)
     def chunk(
         self,

edsl/surveys/MemoryPlan.py CHANGED Viewed

@@ -143,7 +143,7 @@ class MemoryPlan(UserDict):
         for question in prior_questions:
             self.add_single_memory(focal_question, question)
-    def to_dict(self) -> dict:
+    def to_dict(self, add_edsl_version=True) -> dict:
         """Serialize the memory plan to a dictionary.
         >>> mp = MemoryPlan.example()

edsl/surveys/Rule.py CHANGED Viewed

@@ -148,10 +148,7 @@ class Rule:
     def _checks(self):
         pass
-    # def _to_dict(self):
-    # @add_edsl_version
-    def to_dict(self):
+    def to_dict(self, add_edsl_version=True):
         """Convert the rule to a dictionary for serialization.
         >>> r = Rule.example()
@@ -166,7 +163,6 @@ class Rule:
             "question_name_to_index": self.question_name_to_index,
             "before_rule": self.before_rule,
         }
-        # return self._to_dict()
     @classmethod
     @remove_edsl_version

edsl/surveys/RuleCollection.py CHANGED Viewed

@@ -46,7 +46,7 @@ class RuleCollection(UserList):
         """
         return f"RuleCollection(rules={self.data}, num_questions={self.num_questions})"
-    def to_dict(self):
+    def to_dict(self, add_edsl_version=True):
         """Create a dictionary representation of the RuleCollection object."""
         return {
             "rules": [rule.to_dict() for rule in self],

edsl 0.1.37.dev5__py3-none-any.whl → 0.1.38__py3-none-any.whl

edsl 0.1.37.dev5__py3-none-any.whl → 0.1.38__py3-none-any.whl