PyPI - edsl - Versions diffs - 0.1.49__py3-none-any.whl → 0.1.51__py3-none-any.whl - Mend

edsl 0.1.49 (py3-none-any.whl) → 0.1.51 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (257)

edsl/__init__.py +124 -53
edsl/__version__.py +1 -1
edsl/agents/agent.py +21 -21
edsl/agents/agent_list.py +2 -5
edsl/agents/exceptions.py +119 -5
edsl/base/__init__.py +10 -35
edsl/base/base_class.py +71 -36
edsl/base/base_exception.py +204 -0
edsl/base/data_transfer_models.py +1 -1
edsl/base/exceptions.py +94 -0
edsl/buckets/__init__.py +15 -1
edsl/buckets/bucket_collection.py +3 -4
edsl/buckets/exceptions.py +107 -0
edsl/buckets/model_buckets.py +1 -2
edsl/buckets/token_bucket.py +11 -6
edsl/buckets/token_bucket_api.py +27 -12
edsl/buckets/token_bucket_client.py +9 -7
edsl/caching/cache.py +12 -4
edsl/caching/cache_entry.py +10 -9
edsl/caching/exceptions.py +113 -7
edsl/caching/remote_cache_sync.py +6 -7
edsl/caching/sql_dict.py +20 -14
edsl/cli.py +43 -0
edsl/config/__init__.py +1 -1
edsl/config/config_class.py +32 -6
edsl/conversation/Conversation.py +8 -4
edsl/conversation/car_buying.py +1 -3
edsl/conversation/exceptions.py +58 -0
edsl/conversation/mug_negotiation.py +2 -8
edsl/coop/__init__.py +28 -6
edsl/coop/coop.py +120 -29
edsl/coop/coop_functions.py +1 -1
edsl/coop/ep_key_handling.py +1 -1
edsl/coop/exceptions.py +188 -9
edsl/coop/price_fetcher.py +5 -8
edsl/coop/utils.py +4 -6
edsl/dataset/__init__.py +5 -4
edsl/dataset/dataset.py +177 -86
edsl/dataset/dataset_operations_mixin.py +98 -76
edsl/dataset/dataset_tree.py +11 -7
edsl/dataset/display/table_display.py +0 -2
edsl/dataset/display/table_renderers.py +6 -4
edsl/dataset/exceptions.py +125 -0
edsl/dataset/file_exports.py +18 -11
edsl/dataset/r/ggplot.py +13 -6
edsl/display/__init__.py +27 -0
edsl/display/core.py +147 -0
edsl/display/plugin.py +189 -0
edsl/display/utils.py +52 -0
edsl/inference_services/__init__.py +9 -1
edsl/inference_services/available_model_cache_handler.py +1 -1
edsl/inference_services/available_model_fetcher.py +5 -6
edsl/inference_services/data_structures.py +10 -7
edsl/inference_services/exceptions.py +132 -1
edsl/inference_services/inference_service_abc.py +2 -2
edsl/inference_services/inference_services_collection.py +2 -6
edsl/inference_services/registry.py +4 -3
edsl/inference_services/service_availability.py +4 -3
edsl/inference_services/services/anthropic_service.py +4 -1
edsl/inference_services/services/aws_bedrock.py +13 -12
edsl/inference_services/services/azure_ai.py +12 -10
edsl/inference_services/services/deep_infra_service.py +1 -4
edsl/inference_services/services/deep_seek_service.py +1 -5
edsl/inference_services/services/google_service.py +7 -3
edsl/inference_services/services/groq_service.py +1 -1
edsl/inference_services/services/mistral_ai_service.py +4 -2
edsl/inference_services/services/ollama_service.py +1 -1
edsl/inference_services/services/open_ai_service.py +7 -5
edsl/inference_services/services/perplexity_service.py +6 -2
edsl/inference_services/services/test_service.py +8 -7
edsl/inference_services/services/together_ai_service.py +2 -3
edsl/inference_services/services/xai_service.py +1 -1
edsl/instructions/__init__.py +1 -1
edsl/instructions/change_instruction.py +7 -5
edsl/instructions/exceptions.py +61 -0
edsl/instructions/instruction.py +6 -2
edsl/instructions/instruction_collection.py +6 -4
edsl/instructions/instruction_handler.py +12 -15
edsl/interviews/ReportErrors.py +0 -3
edsl/interviews/__init__.py +9 -2
edsl/interviews/answering_function.py +11 -13
edsl/interviews/exception_tracking.py +15 -8
edsl/interviews/exceptions.py +79 -0
edsl/interviews/interview.py +33 -30
edsl/interviews/interview_status_dictionary.py +4 -2
edsl/interviews/interview_status_log.py +2 -1
edsl/interviews/interview_task_manager.py +5 -5
edsl/interviews/request_token_estimator.py +5 -2
edsl/interviews/statistics.py +3 -4
edsl/invigilators/__init__.py +7 -1
edsl/invigilators/exceptions.py +79 -0
edsl/invigilators/invigilator_base.py +0 -1
edsl/invigilators/invigilators.py +9 -13
edsl/invigilators/prompt_constructor.py +1 -5
edsl/invigilators/prompt_helpers.py +8 -4
edsl/invigilators/question_instructions_prompt_builder.py +1 -1
edsl/invigilators/question_option_processor.py +9 -5
edsl/invigilators/question_template_replacements_builder.py +3 -2
edsl/jobs/__init__.py +42 -5
edsl/jobs/async_interview_runner.py +25 -23
edsl/jobs/check_survey_scenario_compatibility.py +11 -10
edsl/jobs/data_structures.py +8 -5
edsl/jobs/exceptions.py +177 -8
edsl/jobs/fetch_invigilator.py +1 -1
edsl/jobs/jobs.py +74 -69
edsl/jobs/jobs_checks.py +6 -7
edsl/jobs/jobs_component_constructor.py +4 -4
edsl/jobs/jobs_pricing_estimation.py +4 -3
edsl/jobs/jobs_remote_inference_logger.py +5 -4
edsl/jobs/jobs_runner_asyncio.py +3 -4
edsl/jobs/jobs_runner_status.py +8 -9
edsl/jobs/remote_inference.py +27 -24
edsl/jobs/results_exceptions_handler.py +10 -7
edsl/key_management/__init__.py +3 -1
edsl/key_management/exceptions.py +62 -0
edsl/key_management/key_lookup.py +1 -1
edsl/key_management/key_lookup_builder.py +37 -14
edsl/key_management/key_lookup_collection.py +2 -0
edsl/language_models/__init__.py +1 -1
edsl/language_models/exceptions.py +302 -14
edsl/language_models/language_model.py +9 -8
edsl/language_models/model.py +4 -4
edsl/language_models/model_list.py +1 -1
edsl/language_models/price_manager.py +1 -1
edsl/language_models/raw_response_handler.py +14 -9
edsl/language_models/registry.py +17 -21
edsl/language_models/repair.py +0 -6
edsl/language_models/unused/fake_openai_service.py +0 -1
edsl/load_plugins.py +69 -0
edsl/logger.py +146 -0
edsl/notebooks/__init__.py +24 -1
edsl/notebooks/exceptions.py +82 -0
edsl/notebooks/notebook.py +7 -3
edsl/notebooks/notebook_to_latex.py +1 -2
edsl/plugins/__init__.py +63 -0
edsl/plugins/built_in/export_example.py +50 -0
edsl/plugins/built_in/pig_latin.py +67 -0
edsl/plugins/cli.py +372 -0
edsl/plugins/cli_typer.py +283 -0
edsl/plugins/exceptions.py +31 -0
edsl/plugins/hookspec.py +51 -0
edsl/plugins/plugin_host.py +128 -0
edsl/plugins/plugin_manager.py +633 -0
edsl/plugins/plugins_registry.py +168 -0
edsl/prompts/__init__.py +24 -1
edsl/prompts/exceptions.py +107 -5
edsl/prompts/prompt.py +15 -7
edsl/questions/HTMLQuestion.py +5 -11
edsl/questions/Quick.py +0 -1
edsl/questions/__init__.py +6 -4
edsl/questions/answer_validator_mixin.py +318 -323
edsl/questions/compose_questions.py +3 -3
edsl/questions/descriptors.py +11 -50
edsl/questions/exceptions.py +278 -22
edsl/questions/loop_processor.py +7 -5
edsl/questions/prompt_templates/question_list.jinja +3 -0
edsl/questions/question_base.py +46 -19
edsl/questions/question_base_gen_mixin.py +2 -2
edsl/questions/question_base_prompts_mixin.py +13 -7
edsl/questions/question_budget.py +503 -98
edsl/questions/question_check_box.py +660 -160
edsl/questions/question_dict.py +345 -194
edsl/questions/question_extract.py +401 -61
edsl/questions/question_free_text.py +80 -14
edsl/questions/question_functional.py +119 -9
edsl/questions/{derived/question_likert_five.py → question_likert_five.py} +2 -2
edsl/questions/{derived/question_linear_scale.py → question_linear_scale.py} +3 -4
edsl/questions/question_list.py +275 -28
edsl/questions/question_matrix.py +643 -96
edsl/questions/question_multiple_choice.py +219 -51
edsl/questions/question_numerical.py +361 -32
edsl/questions/question_rank.py +401 -124
edsl/questions/question_registry.py +7 -5
edsl/questions/{derived/question_top_k.py → question_top_k.py} +3 -3
edsl/questions/{derived/question_yes_no.py → question_yes_no.py} +3 -4
edsl/questions/register_questions_meta.py +2 -2
edsl/questions/response_validator_abc.py +13 -15
edsl/questions/response_validator_factory.py +10 -12
edsl/questions/templates/dict/answering_instructions.jinja +1 -0
edsl/questions/templates/rank/question_presentation.jinja +1 -1
edsl/results/__init__.py +1 -1
edsl/results/exceptions.py +141 -7
edsl/results/report.py +1 -2
edsl/results/result.py +11 -9
edsl/results/results.py +480 -321
edsl/results/results_selector.py +8 -4
edsl/scenarios/PdfExtractor.py +2 -2
edsl/scenarios/construct_download_link.py +69 -35
edsl/scenarios/directory_scanner.py +33 -14
edsl/scenarios/document_chunker.py +1 -1
edsl/scenarios/exceptions.py +238 -14
edsl/scenarios/file_methods.py +1 -1
edsl/scenarios/file_store.py +7 -3
edsl/scenarios/handlers/__init__.py +17 -0
edsl/scenarios/handlers/docx_file_store.py +0 -5
edsl/scenarios/handlers/pdf_file_store.py +0 -1
edsl/scenarios/handlers/pptx_file_store.py +0 -5
edsl/scenarios/handlers/py_file_store.py +0 -1
edsl/scenarios/handlers/sql_file_store.py +1 -4
edsl/scenarios/handlers/sqlite_file_store.py +0 -1
edsl/scenarios/handlers/txt_file_store.py +1 -1
edsl/scenarios/scenario.py +1 -3
edsl/scenarios/scenario_list.py +179 -27
edsl/scenarios/scenario_list_pdf_tools.py +1 -0
edsl/scenarios/scenario_selector.py +0 -1
edsl/surveys/__init__.py +3 -4
edsl/surveys/dag/__init__.py +4 -2
edsl/surveys/descriptors.py +1 -1
edsl/surveys/edit_survey.py +1 -0
edsl/surveys/exceptions.py +165 -9
edsl/surveys/memory/__init__.py +5 -3
edsl/surveys/memory/memory_management.py +1 -0
edsl/surveys/memory/memory_plan.py +6 -15
edsl/surveys/rules/__init__.py +5 -3
edsl/surveys/rules/rule.py +1 -2
edsl/surveys/rules/rule_collection.py +1 -1
edsl/surveys/survey.py +12 -24
edsl/surveys/survey_css.py +3 -3
edsl/surveys/survey_export.py +6 -3
edsl/surveys/survey_flow_visualization.py +10 -1
edsl/surveys/survey_simulator.py +2 -1
edsl/tasks/__init__.py +23 -1
edsl/tasks/exceptions.py +72 -0
edsl/tasks/question_task_creator.py +3 -3
edsl/tasks/task_creators.py +1 -3
edsl/tasks/task_history.py +8 -10
edsl/tasks/task_status_log.py +1 -2
edsl/tokens/__init__.py +29 -1
edsl/tokens/exceptions.py +37 -0
edsl/tokens/interview_token_usage.py +3 -2
edsl/tokens/token_usage.py +4 -3
edsl/utilities/__init__.py +21 -1
edsl/utilities/decorators.py +1 -2
edsl/utilities/markdown_to_docx.py +2 -2
edsl/utilities/markdown_to_pdf.py +1 -1
edsl/utilities/repair_functions.py +0 -1
edsl/utilities/restricted_python.py +0 -1
edsl/utilities/template_loader.py +2 -3
edsl/utilities/utilities.py +8 -29
{edsl-0.1.49.dist-info → edsl-0.1.51.dist-info}/METADATA +32 -2
edsl-0.1.51.dist-info/RECORD +365 -0
edsl-0.1.51.dist-info/entry_points.txt +3 -0
edsl/dataset/smart_objects.py +0 -96
edsl/exceptions/BaseException.py +0 -21
edsl/exceptions/__init__.py +0 -54
edsl/exceptions/configuration.py +0 -16
edsl/exceptions/general.py +0 -34
edsl/questions/derived/__init__.py +0 -0
edsl/study/ObjectEntry.py +0 -173
edsl/study/ProofOfWork.py +0 -113
edsl/study/SnapShot.py +0 -80
edsl/study/Study.py +0 -520
edsl/study/__init__.py +0 -6
edsl/utilities/interface.py +0 -135
edsl-0.1.49.dist-info/RECORD +0 -347
{edsl-0.1.49.dist-info → edsl-0.1.51.dist-info}/LICENSE +0 -0
{edsl-0.1.49.dist-info → edsl-0.1.51.dist-info}/WHEEL +0 -0

edsl/questions/question_matrix.py CHANGED Viewed

@@ -1,9 +1,26 @@
+"""
+question_matrix.py
+Module implementing the matrix question type with Pydantic validation
+"""
 from __future__ import annotations
-from typing import Union, Optional, Dict, List, Any
+from typing import (
+    Union,
+    Optional,
+    Dict,
+    List,
+    Any,
+    Type,
+    Literal
+)
+import random
+import json
+import re
-from pydantic import BaseModel, Field, field_validator
+from pydantic import BaseModel, Field, create_model, ValidationError, model_validator
 from jinja2 import Template
-import random
 from .question_base import QuestionBase
 from .descriptors import (
     QuestionOptionsDescriptor,
@@ -14,56 +31,201 @@ from .response_validator_abc import ResponseValidatorABC
 from .decorators import inject_exception
 from .exceptions import (
-    QuestionAnswerValidationError,
     QuestionCreationValidationError,
+    QuestionAnswerValidationError,
 )
+class MatrixResponseBase(BaseModel):
+    """
+    Base model for matrix question responses.
+    Attributes:
+        answer: A dictionary mapping each item to a selected option
+        comment: Optional comment about the selections
+        generated_tokens: Optional token usage data
+    Examples:
+        >>> # Valid response with two items
+        >>> model = MatrixResponseBase(answer={"Item1": 1, "Item2": 2})
+        >>> model.answer
+        {'Item1': 1, 'Item2': 2}
+        >>> # Valid response with a comment
+        >>> model = MatrixResponseBase(
+        ...     answer={"Item1": "Yes", "Item2": "No"},
+        ...     comment="This is my reasoning"
+        ... )
+        >>> model.comment
+        'This is my reasoning'
+    """
+    answer: Dict[str, Any]
+    comment: Optional[str] = None
+    generated_tokens: Optional[Any] = None
 def create_matrix_response(
     question_items: List[str],
     question_options: List[Union[int, str, float]],
     permissive: bool = False,
-):
-    """Create a response model for matrix questions.
-    The response model validates that:
-    1. All question items are answered
-    2. Each answer is from the allowed options
+) -> Type[BaseModel]:
     """
-    if permissive:
-        class MatrixResponse(BaseModel):
-            answer: Dict[str, Any]
-            comment: Optional[str] = None
-            generated_tokens: Optional[Any] = None
+    Create a dynamic Pydantic model for matrix questions with appropriate validation.
+    Args:
+        question_items: List of items that need responses
+        question_options: List of allowed options for each item
+        permissive: If True, allows any values and additional items
+    Returns:
+        A Pydantic model class for validating matrix responses
+    Examples:
+        >>> # Create a model for a 2x3 matrix
+        >>> Model = create_matrix_response(
+        ...     ["Item1", "Item2"],
+        ...     [1, 2, 3]
+        ... )
+        >>> # Valid response
+        >>> response = Model(answer={"Item1": 1, "Item2": 2})
+        >>> isinstance(response.answer, BaseModel)
+        True
+        >>> response.answer.Item1
+        1
+        >>> response.answer.Item2
+        2
+        >>> # Invalid: missing an item
+        >>> try:
+        ...     Model(answer={"Item1": 1})
+        ... except Exception:
+        ...     print("Validation error occurred")
+        Validation error occurred
+        >>> # Invalid: invalid option value
+        >>> try:
+        ...     Model(answer={"Item1": 4, "Item2": 2})
+        ... except Exception:
+        ...     print("Validation error occurred")
+        Validation error occurred
+    """
+    # Convert question_options to a tuple for Literal type
+    option_tuple = tuple(question_options)
+    # If non-permissive, build a Literal for each valid option
+    # e.g. Literal[1,2,3] or Literal["Yes","No"] or a mix
+    if not permissive:
+        # If question_options is empty (edge case), fall back to 'Any'
+        if question_options:
+            AllowedOptions = Literal[option_tuple]  # type: ignore
+        else:
+            AllowedOptions = Any
     else:
-        class MatrixResponse(BaseModel):
-            answer: Dict[str, Union[int, str, float]] = Field(
-                ..., description="Mapping of items to selected options"
-            )
-            comment: Optional[str] = None
-            generated_tokens: Optional[Any] = None
-            @field_validator("answer")
-            def validate_answer(cls, v, values, **kwargs):
-                # Check that all items have responses
-                if not all(item in v for item in question_items):
-                    missing = set(question_items) - set(v.keys())
-                    raise ValueError(f"Missing responses for items: {missing}")
-                # Check that all responses are valid options
-                if not all(answer in question_options for answer in v.values()):
-                    invalid = [ans for ans in v.values() if ans not in question_options]
-                    raise ValueError(f"Invalid options selected: {invalid}")
-                return v
+        # Permissive => let each item be anything
+        AllowedOptions = Any
+    # Build field definitions for the answer submodel
+    field_definitions = {}
+    for item in question_items:
+        field_definitions[item] = (AllowedOptions, Field(...))  # required field
+    # Dynamically create the submodel
+    MatrixAnswerSubModel = create_model(
+        "MatrixAnswerSubModel",
+        __base__=BaseModel,
+        **field_definitions
+    )
+    # Create the full response model with custom validation
+    class MatrixResponse(MatrixResponseBase):
+        """
+        Model for matrix question responses with validation for specific items and options.
+        """
+        answer: MatrixAnswerSubModel  # Use the dynamically created submodel
+        @model_validator(mode='after')
+        def validate_matrix_constraints(self):
+            """
+            Validates that:
+            1. All required items have responses
+            2. All responses are valid options
+            3. No unexpected items are included (unless permissive)
+            """
+            matrix_answer = self.answer.model_dump()
+            # Check that all required items have responses
+            missing_items = [item for item in question_items if item not in matrix_answer]
+            if missing_items and not permissive:
+                missing_str = ", ".join(missing_items)
+                validation_error = ValidationError.from_exception_data(
+                    title='MatrixResponse',
+                    line_errors=[{
+                        'type': 'value_error',
+                        'loc': ('answer',),
+                        'msg': f'Missing responses for items: {missing_str}',
+                        'input': matrix_answer,
+                        'ctx': {'missing_items': missing_items}
+                    }]
+                )
+                raise QuestionAnswerValidationError(
+                    message=f"Missing responses for items: {missing_str}",
+                    data=self.model_dump(),
+                    model=self.__class__,
+                    pydantic_error=validation_error
+                )
+            # Check that all responses are valid options
+            if not permissive:
+                invalid_items = {}
+                for item, value in matrix_answer.items():
+                    if value not in option_tuple:
+                        invalid_items[item] = value
+                if invalid_items:
+                    items_str = ", ".join(f"{k}: {v}" for k, v in invalid_items.items())
+                    validation_error = ValidationError.from_exception_data(
+                        title='MatrixResponse',
+                        line_errors=[{
+                            'type': 'value_error',
+                            'loc': ('answer',),
+                            'msg': f'Invalid options selected: {items_str}',
+                            'input': matrix_answer,
+                            'ctx': {'invalid_items': invalid_items, 'allowed_options': option_tuple}
+                        }]
+                    )
+                    raise QuestionAnswerValidationError(
+                        message=f"Invalid options selected: {items_str}. Allowed options: {option_tuple}",
+                        data=self.model_dump(),
+                        model=self.__class__,
+                        pydantic_error=validation_error
+                    )
+            return self
+        class Config:
+            # If permissive=True, allow extra fields in the answer dict
+            extra = "allow" if permissive else "forbid"
+            @staticmethod
+            def json_schema_extra(schema: dict, model: BaseModel) -> None:
+                # Add the options to the schema for better documentation
+                if "properties" in schema and "answer" in schema["properties"]:
+                    schema["properties"]["answer"]["description"] = "Matrix responses for each item"
+                    if "properties" in schema["properties"]["answer"]:
+                        for _, prop in schema["properties"]["answer"]["properties"].items():
+                            prop["enum"] = list(question_options)
     return MatrixResponse
 class MatrixResponseValidator(ResponseValidatorABC):
+    """
+    Validator for matrix question responses that attempts to fix invalid responses.
+    This validator tries multiple approaches to recover valid matrix responses from
+    malformed inputs, including JSON parsing, remapping numeric keys, and extracting
+    structured data from text.
+    """
     required_params = ["question_items", "question_options", "permissive"]
     valid_examples = [
@@ -72,8 +234,17 @@ class MatrixResponseValidator(ResponseValidatorABC):
             {
                 "question_items": ["Item1", "Item2"],
                 "question_options": [1, 2, 3],
+                "permissive": False
             },
-        )
+        ),
+        (
+            {"answer": {"Item1": "Yes", "Item2": "No"}},
+            {
+                "question_items": ["Item1", "Item2"],
+                "question_options": ["Yes", "No", "Maybe"],
+                "permissive": False
+            },
+        ),
     ]
     invalid_examples = [
@@ -82,57 +253,415 @@ class MatrixResponseValidator(ResponseValidatorABC):
             {
                 "question_items": ["Item1", "Item2"],
                 "question_options": [1, 2, 3],
+                "permissive": False
             },
-            "Missing responses for some items",
+            "Missing responses for items",
         ),
         (
             {"answer": {"Item1": 4, "Item2": 5}},
             {
                 "question_items": ["Item1", "Item2"],
                 "question_options": [1, 2, 3],
+                "permissive": False
             },
             "Invalid options selected",
         ),
     ]
     def fix(self, response, verbose=False):
+        """
+        Attempts to fix an invalid matrix response by trying multiple parsing strategies.
+        Args:
+            response: The invalid response to fix
+            verbose: Whether to print verbose debugging information
+        Returns:
+            A fixed response dict if fixable, otherwise the original response
+        """
         if verbose:
             print(f"Fixing matrix response: {response}")
-        # If we have generated tokens, try to parse them
-        if "generated_tokens" in response:
+        # If response doesn't have an answer field, nothing to do
+        if "answer" not in response:
+            if verbose:
+                print("Response has no answer field, cannot fix")
+            return response
+        # Strategy 1: If we have generated_tokens, try to parse them as JSON
+        if "generated_tokens" in response and response["generated_tokens"]:
             try:
-                import json
-                fixed = json.loads(response["generated_tokens"])
-                if isinstance(fixed, dict):
-                    # Map numeric keys to question items
-                    mapped_answer = {}
-                    for idx, item in enumerate(self.question_items):
-                        if str(idx) in fixed:
-                            mapped_answer[item] = fixed[str(idx)]
-                    if (
-                        mapped_answer
-                    ):  # Only return if we successfully mapped some answers
-                        return {"answer": mapped_answer}
-            except:
-                pass
-        # If answer uses numeric keys, map them to question items
-        if "answer" in response and isinstance(response["answer"], dict):
-            if all(str(key).isdigit() for key in response["answer"].keys()):
+                # Try to parse generated_tokens as JSON
+                tokens_text = str(response["generated_tokens"])
+                json_match = re.search(r'\{.*\}', tokens_text, re.DOTALL)
+                if json_match:
+                    json_str = json_match.group(0)
+                    fixed = json.loads(json_str)
+                    if isinstance(fixed, dict):
+                        # Map numeric keys to question items if needed
+                        if all(str(k).isdigit() for k in fixed.keys()):
+                            if verbose:
+                                print(f"JSON extraction found numeric keys: {fixed}")
+                                print(f"Question items: {self.question_items}")
+                                print(f"Question options: {self.question_options}")
+                            # Special handling for case when numeric keys directly represent option indices
+                            # This is the case we're trying to fix: {"0": 1, "1": 3, "2": 0} maps to options at those indices
+                            direct_mapped_answer = {}
+                            if verbose:
+                                print(f"Attempting to map numeric key/value format in JSON: {fixed}")
+                            for idx, item in enumerate(self.question_items):
+                                if str(idx) in fixed:
+                                    # Get the option index directly from the value
+                                    option_idx = fixed[str(idx)]
+                                    # Convert to int if needed
+                                    if isinstance(option_idx, str) and option_idx.isdigit():
+                                        option_idx = int(option_idx)
+                                    if verbose:
+                                        print(f"Item {item} at index {idx} maps to value {option_idx}")
+                                    if isinstance(option_idx, (int, float)) and 0 <= option_idx < len(self.question_options):
+                                        direct_mapped_answer[item] = self.question_options[option_idx]
+                                        if verbose:
+                                            print(f"Mapped option_idx {option_idx} to {self.question_options[option_idx]}")
+                            if direct_mapped_answer and len(direct_mapped_answer) == len(self.question_items):
+                                proposed_data = {
+                                    "answer": direct_mapped_answer,
+                                    "comment": response.get("comment"),
+                                    "generated_tokens": response.get("generated_tokens")
+                                }
+                                if verbose:
+                                    print(f"Created direct option mapping from JSON: {proposed_data}")
+                                try:
+                                    self.response_model(**proposed_data)
+                                    if verbose:
+                                        print(f"Successfully fixed with direct option mapping from JSON: {proposed_data}")
+                                    return proposed_data
+                                except Exception as e:
+                                    if verbose:
+                                        print(f"Direct option mapping from JSON failed validation: {e}")
+                            # Try the standard approach as well
+                            mapped_answer = {}
+                            for idx, item in enumerate(self.question_items):
+                                if str(idx) in fixed:
+                                    # Get the value (column index) from the response
+                                    value_idx = fixed[str(idx)]
+                                    # Convert to int if it's a digit string
+                                    if isinstance(value_idx, str) and value_idx.isdigit():
+                                        value_idx = int(value_idx)
+                                    # Convert column index to actual option value
+                                    if isinstance(value_idx, (int, float)) and 0 <= value_idx < len(self.question_options):
+                                        option_value = self.question_options[value_idx]
+                                        mapped_answer[item] = option_value
+                                    else:
+                                        # If the value is already a valid option, use it directly
+                                        if value_idx in self.question_options:
+                                            mapped_answer[item] = value_idx
+                                        else:
+                                            # Last resort - try to use it as a direct value even if not in options
+                                            mapped_answer[item] = value_idx
+                            if mapped_answer and (len(mapped_answer) == len(self.question_items) or self.permissive):
+                                proposed_data = {
+                                    "answer": mapped_answer,
+                                    "comment": response.get("comment"),
+                                    "generated_tokens": response.get("generated_tokens")
+                                }
+                                try:
+                                    # Validate the fixed response
+                                    self.response_model(**proposed_data)
+                                    if verbose:
+                                        print(f"Successfully fixed by parsing JSON: {proposed_data}")
+                                    return proposed_data
+                                except Exception as e:
+                                    if verbose:
+                                        print(f"Fixed response failed validation: {e}")
+                                # Try again with string values for all options
+                                text_mapped_answer = {}
+                                for item_name, option_value in mapped_answer.items():
+                                    text_mapped_answer[item_name] = str(option_value)
+                                proposed_data = {
+                                    "answer": text_mapped_answer,
+                                    "comment": response.get("comment"),
+                                    "generated_tokens": response.get("generated_tokens")
+                                }
+                                try:
+                                    self.response_model(**proposed_data)
+                                    if verbose:
+                                        print(f"Successfully fixed with string conversion from JSON: {proposed_data}")
+                                    return proposed_data
+                                except Exception as e:
+                                    if verbose:
+                                        print(f"String conversion from JSON failed validation: {e}")
+                        else:
+                            # The JSON already has string keys, use directly
+                            proposed_data = {
+                                "answer": fixed,
+                                "comment": response.get("comment"),
+                                "generated_tokens": response.get("generated_tokens")
+                            }
+                            try:
+                                self.response_model(**proposed_data)
+                                if verbose:
+                                    print(f"Successfully fixed by direct JSON: {proposed_data}")
+                                return proposed_data
+                            except Exception as e:
+                                if verbose:
+                                    print(f"Fixed response failed validation: {e}")
+                                # If validation failed, check if we need to map string keys to item names
+                                # This handles cases where the model responded with something like {"Row 0": 1, "Row 1": 2}
+                                # instead of using the exact item names
+                                item_map = {}
+                                for item in self.question_items:
+                                    # Create various forms of the item name that might appear in responses
+                                    item_variants = [
+                                        item.lower(),
+                                        item.upper(),
+                                        item.strip(),
+                                        f"Row {self.question_items.index(item)}",
+                                        f"Item {self.question_items.index(item)}",
+                                        f"{self.question_items.index(item)}"
+                                    ]
+                                    for key in fixed.keys():
+                                        if isinstance(key, str):
+                                            key_lower = key.lower().strip()
+                                            if key_lower in item_variants or item.lower() in key_lower:
+                                                item_map[key] = item
+                                if item_map:
+                                    mapped_answer = {}
+                                    for key, value in fixed.items():
+                                        if key in item_map:
+                                            # Handle both numeric indices and direct values
+                                            if isinstance(value, (int, float)) and 0 <= value < len(self.question_options):
+                                                mapped_answer[item_map[key]] = self.question_options[value]
+                                            else:
+                                                mapped_answer[item_map[key]] = value
+                                    if mapped_answer:
+                                        proposed_data = {
+                                            "answer": mapped_answer,
+                                            "comment": response.get("comment"),
+                                            "generated_tokens": response.get("generated_tokens")
+                                        }
+                                        try:
+                                            self.response_model(**proposed_data)
+                                            if verbose:
+                                                print(f"Successfully fixed by mapping item names: {proposed_data}")
+                                            return proposed_data
+                                        except Exception as e:
+                                            if verbose:
+                                                print(f"Item-mapped response failed validation: {e}")
+            except (ValueError, KeyError, TypeError, json.JSONDecodeError) as e:
+                if verbose:
+                    print(f"JSON parsing failed: {e}")
+                # Continue to other strategies
+        # Strategy 2: If answer uses numeric keys, map them to question items
+        if isinstance(response.get("answer"), dict):
+            answer_dict = response["answer"]
+            if all(str(k).isdigit() for k in answer_dict.keys()):
+                if verbose:
+                    print(f"Processing answer with numeric keys: {answer_dict}")
+                    print(f"Question items: {self.question_items}")
+                    print(f"Question options: {self.question_options}")
                 mapped_answer = {}
                 for idx, item in enumerate(self.question_items):
-                    if str(idx) in response["answer"]:
-                        mapped_answer[item] = response["answer"][str(idx)]
-                if mapped_answer:  # Only update if we successfully mapped some answers
-                    response["answer"] = mapped_answer
+                    if str(idx) in answer_dict:
+                        # Get the value (column index) from the response
+                        value_idx = answer_dict[str(idx)]
+                        # Convert to int if it's a digit string
+                        if isinstance(value_idx, str) and value_idx.isdigit():
+                            value_idx = int(value_idx)
+                        if verbose:
+                            print(f"Processing item {item} at index {idx}, value_idx={value_idx}")
+                        # Convert column index to actual option value
+                        if isinstance(value_idx, (int, float)) and 0 <= value_idx < len(self.question_options):
+                            option_value = self.question_options[value_idx]
+                            mapped_answer[item] = option_value
+                            if verbose:
+                                print(f"Mapped column index {value_idx} to option '{option_value}'")
+                        else:
+                            # If the value is already a valid option, use it directly
+                            if value_idx in self.question_options:
+                                mapped_answer[item] = value_idx
+                                if verbose:
+                                    print(f"Used direct option value '{value_idx}'")
+                            else:
+                                # Last resort - try to use it as a direct value even if not in options
+                                # (this helps with permissive mode)
+                                mapped_answer[item] = value_idx
+                                if verbose:
+                                    print(f"Used non-option value '{value_idx}' as direct value")
+                if mapped_answer and len(mapped_answer) == len(self.question_items):
+                    if verbose:
+                        print(f"Created complete mapped answer: {mapped_answer}")
+                    proposed_data = {
+                        "answer": mapped_answer,
+                        "comment": response.get("comment"),
+                        "generated_tokens": response.get("generated_tokens")
+                    }
+                    try:
+                        self.response_model(**proposed_data)
+                        if verbose:
+                            print(f"Successfully fixed by mapping numeric keys: {proposed_data}")
+                        return proposed_data
+                    except Exception as e:
+                        if verbose:
+                            print(f"Fixed response failed validation: {e}")
+                    # Try again with string values for the options
+                    text_mapped_answer = {}
+                    for item_name, option_value in mapped_answer.items():
+                        text_mapped_answer[item_name] = str(option_value)
+                    proposed_data = {
+                        "answer": text_mapped_answer,
+                        "comment": response.get("comment"),
+                        "generated_tokens": response.get("generated_tokens")
+                    }
+                    try:
+                        self.response_model(**proposed_data)
+                        if verbose:
+                            print(f"Successfully fixed with string conversion: {proposed_data}")
+                        return proposed_data
+                    except Exception as e:
+                        if verbose:
+                            print(f"String conversion failed validation: {e}")
+                # Special handling for case when numeric keys directly represent option indices
+                # This is the case we're trying to fix: {"0": 1, "1": 3, "2": 0} maps to options at those indices
+                direct_mapped_answer = {}
+                if verbose:
+                    print(f"Attempting to map numeric key/value format in answer: {answer_dict}")
+                for idx, item in enumerate(self.question_items):
+                    if str(idx) in answer_dict:
+                        # Get the option index directly from the value
+                        option_idx = answer_dict[str(idx)]
+                        # Convert to int if needed
+                        if isinstance(option_idx, str) and option_idx.isdigit():
+                            option_idx = int(option_idx)
+                        if verbose:
+                            print(f"Item {item} at index {idx} maps to value {option_idx}")
+                        if isinstance(option_idx, (int, float)) and 0 <= option_idx < len(self.question_options):
+                            direct_mapped_answer[item] = self.question_options[option_idx]
+                            if verbose:
+                                print(f"Mapped option_idx {option_idx} to {self.question_options[option_idx]}")
+                if direct_mapped_answer and len(direct_mapped_answer) == len(self.question_items):
+                    proposed_data = {
+                        "answer": direct_mapped_answer,
+                        "comment": response.get("comment"),
+                        "generated_tokens": response.get("generated_tokens")
+                    }
+                    if verbose:
+                        print(f"Created direct option mapping: {proposed_data}")
+                    try:
+                        self.response_model(**proposed_data)
+                        if verbose:
+                            print(f"Successfully fixed with direct option mapping: {proposed_data}")
+                        return proposed_data
+                    except Exception as e:
+                        if verbose:
+                            print(f"Direct option mapping failed validation: {e}")
+        # Strategy 3: If answer is a string, try to extract a structured response
+        if isinstance(response.get("answer"), str):
+            answer_text = response["answer"]
+            # Try to extract item-option pairs using regex
+            pairs = re.findall(r'([^:,]+):\s*([^,]+)', answer_text)
+            if pairs:
+                extracted = {}
+                for item, option in pairs:
+                    item = item.strip()
+                    option = option.strip()
+                    # Match the item name with the closest question item
+                    best_match = None
+                    for q_item in self.question_items:
+                        if q_item.lower() in item.lower():
+                            best_match = q_item
+                            break
+                    if best_match:
+                        # Try to match the option with question options
+                        matched_option = None
+                        for q_option in self.question_options:
+                            q_option_str = str(q_option)
+                            if q_option_str == option or q_option_str in option:
+                                matched_option = q_option
+                                break
+                        if matched_option is not None:
+                            extracted[best_match] = matched_option
+                if extracted and (len(extracted) == len(self.question_items) or self.permissive):
+                    proposed_data = {
+                        "answer": extracted,
+                        "comment": response.get("comment"),
+                        "generated_tokens": response.get("generated_tokens")
+                    }
+                    try:
+                        self.response_model(**proposed_data)
+                        if verbose:
+                            print(f"Successfully fixed by extracting pairs: {proposed_data}")
+                        return proposed_data
+                    except Exception as e:
+                        if verbose:
+                            print(f"Fixed response failed validation: {e}")
+        # If we got here, we couldn't fix the response
+        if verbose:
+            print("Could not fix matrix response, returning original")
         return response
 class QuestionMatrix(QuestionBase):
-    """A question that presents a matrix/grid where multiple items are rated using the same scale."""
+    """
+    A question that presents a matrix/grid where multiple items are rated
+    or selected from the same set of options.
+    This question type allows respondents to provide an answer for each row
+    in a grid, selecting from the same set of options for each row. It's often
+    used for Likert scales, ratings grids, or any scenario where multiple items
+    need to be rated using the same scale.
+    Examples:
+        >>> # Create a happiness rating matrix
+        >>> question = QuestionMatrix(
+        ...     question_name="happiness_matrix",
+        ...     question_text="Rate your happiness with each aspect:",
+        ...     question_items=["Work", "Family", "Social life"],
+        ...     question_options=[1, 2, 3, 4, 5],
+        ...     option_labels={1: "Very unhappy", 3: "Neutral", 5: "Very happy"}
+        ... )
+        >>> # The response is a dict matching each item to a rating
+        >>> response = {"answer": {"Work": 4, "Family": 5, "Social life": 3}}
+    """
     question_type = "matrix"
     question_text: str = QuestionTextDescriptor()
@@ -155,18 +684,19 @@ class QuestionMatrix(QuestionBase):
         question_presentation: Optional[str] = None,
         permissive: bool = False,
     ):
-        """Initialize a matrix question.
+        """
+        Initialize a matrix question.
         Args:
             question_name: The name of the question
             question_text: The text of the question
-            question_items: List of items to be rated
-            question_options: List of rating options
-            option_labels: Optional mapping of options to their labels
+            question_items: List of items to be rated or answered (rows)
+            question_options: Possible answer options for each item (columns)
+            option_labels: Optional mapping of options to labels (e.g. {1: "Sad", 5: "Happy"})
             include_comment: Whether to include a comment field
-            answering_instructions: Optional custom instructions
-            question_presentation: Optional custom presentation
-            permissive: Whether to strictly validate responses
+            answering_instructions: Custom instructions template
+            question_presentation: Custom presentation template
+            permissive: Whether to allow any values & extra items instead of strictly checking
         """
         self.question_name = question_name
@@ -186,14 +716,42 @@ class QuestionMatrix(QuestionBase):
         self.question_presentation = question_presentation
         self.permissive = permissive
-    def create_response_model(self):
+    def create_response_model(self) -> Type[BaseModel]:
+        """
+        Returns the pydantic model for validating responses to this question.
+        The model is dynamically created based on the question's configuration,
+        including allowed items, options, and permissiveness.
+        """
         return create_matrix_response(
-            self.question_items, self.question_options, self.permissive
+            self.question_items,
+            self.question_options,
+            self.permissive
         )
+    def _simulate_answer(self) -> dict:
+        """
+        Simulate a random valid answer for testing purposes.
+        Returns:
+            A valid simulated response with random selections
+        """
+        return {
+            "answer": {
+                item: random.choice(self.question_options)
+                for item in self.question_items
+            },
+            "comment": "Sample matrix response"
+        }
     @property
     def question_html_content(self) -> str:
-        """Generate HTML representation of the matrix question."""
+        """
+        Generate an HTML representation of the matrix question.
+        Returns:
+            HTML content string for rendering the question
+        """
         template = Template(
             """
         <table class="matrix-question">
@@ -225,7 +783,6 @@ class QuestionMatrix(QuestionBase):
         </table>
         """
         )
         return template.render(
             question_name=self.question_name,
             question_items=self.question_items,
@@ -236,7 +793,12 @@ class QuestionMatrix(QuestionBase):
     @classmethod
     @inject_exception
     def example(cls) -> QuestionMatrix:
-        """Return an example matrix question."""
+        """
+        Return an example matrix question.
+        Returns:
+            An example QuestionMatrix instance for happiness ratings by family size
+        """
         return cls(
             question_name="child_happiness",
             question_text="How happy would you be with different numbers of children?",
@@ -248,19 +810,4 @@ class QuestionMatrix(QuestionBase):
             ],
             question_options=[1, 2, 3, 4, 5],
             option_labels={1: "Very sad", 3: "Neutral", 5: "Extremely happy"},
-        )
-    def _simulate_answer(self) -> dict:
-        """Simulate a random valid answer."""
-        return {
-            "answer": {
-                item: random.choice(self.question_options)
-                for item in self.question_items
-            }
-        }
-if __name__ == "__main__":
-    import doctest
-    doctest.testmod(optionflags=doctest.ELLIPSIS)
+        )

edsl 0.1.49__py3-none-any.whl → 0.1.51__py3-none-any.whl

edsl 0.1.49py3-none-any.whl → 0.1.51py3-none-any.whl