PyPI - edsl - Versions diffs - 0.1.50__py3-none-any.whl → 0.1.51__py3-none-any.whl - Mend

edsl-0.1.50-py3-none-any.whl → edsl-0.1.51-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (109)

edsl/__version__.py +1 -1
edsl/base/base_exception.py +2 -2
edsl/buckets/bucket_collection.py +1 -1
edsl/buckets/exceptions.py +32 -0
edsl/buckets/token_bucket_api.py +26 -10
edsl/caching/cache.py +5 -2
edsl/caching/remote_cache_sync.py +5 -5
edsl/caching/sql_dict.py +12 -11
edsl/config/__init__.py +1 -1
edsl/config/config_class.py +4 -2
edsl/conversation/Conversation.py +7 -4
edsl/conversation/car_buying.py +1 -3
edsl/conversation/mug_negotiation.py +2 -6
edsl/coop/__init__.py +11 -8
edsl/coop/coop.py +13 -13
edsl/coop/coop_functions.py +1 -1
edsl/coop/ep_key_handling.py +1 -1
edsl/coop/price_fetcher.py +2 -2
edsl/coop/utils.py +2 -2
edsl/dataset/dataset.py +144 -63
edsl/dataset/dataset_operations_mixin.py +14 -6
edsl/dataset/dataset_tree.py +3 -3
edsl/dataset/display/table_renderers.py +6 -3
edsl/dataset/file_exports.py +4 -4
edsl/dataset/r/ggplot.py +3 -3
edsl/inference_services/available_model_fetcher.py +2 -2
edsl/inference_services/data_structures.py +5 -5
edsl/inference_services/inference_service_abc.py +1 -1
edsl/inference_services/inference_services_collection.py +1 -1
edsl/inference_services/service_availability.py +3 -3
edsl/inference_services/services/azure_ai.py +3 -3
edsl/inference_services/services/google_service.py +1 -1
edsl/inference_services/services/test_service.py +1 -1
edsl/instructions/change_instruction.py +5 -4
edsl/instructions/instruction.py +1 -0
edsl/instructions/instruction_collection.py +5 -4
edsl/instructions/instruction_handler.py +10 -8
edsl/interviews/exception_tracking.py +1 -1
edsl/interviews/interview.py +1 -1
edsl/interviews/interview_status_dictionary.py +1 -1
edsl/interviews/interview_task_manager.py +2 -2
edsl/interviews/request_token_estimator.py +3 -2
edsl/interviews/statistics.py +2 -2
edsl/invigilators/invigilators.py +2 -2
edsl/jobs/__init__.py +39 -2
edsl/jobs/async_interview_runner.py +1 -1
edsl/jobs/check_survey_scenario_compatibility.py +5 -5
edsl/jobs/data_structures.py +2 -2
edsl/jobs/jobs.py +2 -2
edsl/jobs/jobs_checks.py +5 -5
edsl/jobs/jobs_component_constructor.py +2 -2
edsl/jobs/jobs_pricing_estimation.py +1 -1
edsl/jobs/jobs_runner_asyncio.py +2 -2
edsl/jobs/remote_inference.py +1 -1
edsl/jobs/results_exceptions_handler.py +2 -2
edsl/language_models/language_model.py +5 -1
edsl/notebooks/__init__.py +24 -1
edsl/notebooks/exceptions.py +82 -0
edsl/notebooks/notebook.py +7 -3
edsl/notebooks/notebook_to_latex.py +1 -1
edsl/prompts/__init__.py +23 -2
edsl/prompts/prompt.py +1 -1
edsl/questions/__init__.py +4 -4
edsl/questions/answer_validator_mixin.py +0 -5
edsl/questions/compose_questions.py +2 -2
edsl/questions/descriptors.py +1 -1
edsl/questions/question_base.py +32 -3
edsl/questions/question_base_prompts_mixin.py +4 -4
edsl/questions/question_budget.py +503 -102
edsl/questions/question_check_box.py +658 -156
edsl/questions/question_dict.py +176 -2
edsl/questions/question_extract.py +401 -61
edsl/questions/question_free_text.py +77 -9
edsl/questions/question_functional.py +118 -9
edsl/questions/{derived/question_likert_five.py → question_likert_five.py} +2 -2
edsl/questions/{derived/question_linear_scale.py → question_linear_scale.py} +3 -4
edsl/questions/question_list.py +246 -26
edsl/questions/question_matrix.py +586 -73
edsl/questions/question_multiple_choice.py +213 -47
edsl/questions/question_numerical.py +360 -29
edsl/questions/question_rank.py +401 -124
edsl/questions/question_registry.py +3 -3
edsl/questions/{derived/question_top_k.py → question_top_k.py} +3 -3
edsl/questions/{derived/question_yes_no.py → question_yes_no.py} +3 -4
edsl/questions/register_questions_meta.py +2 -1
edsl/questions/response_validator_abc.py +6 -2
edsl/questions/response_validator_factory.py +10 -12
edsl/results/report.py +1 -1
edsl/results/result.py +7 -4
edsl/results/results.py +471 -271
edsl/results/results_selector.py +2 -2
edsl/scenarios/construct_download_link.py +3 -3
edsl/scenarios/scenario.py +1 -2
edsl/scenarios/scenario_list.py +41 -23
edsl/surveys/survey_css.py +3 -3
edsl/surveys/survey_simulator.py +2 -1
edsl/tasks/__init__.py +22 -2
edsl/tasks/exceptions.py +72 -0
edsl/tasks/task_history.py +3 -3
edsl/tokens/__init__.py +27 -1
edsl/tokens/exceptions.py +37 -0
edsl/tokens/interview_token_usage.py +3 -2
edsl/tokens/token_usage.py +4 -3
{edsl-0.1.50.dist-info → edsl-0.1.51.dist-info}/METADATA +1 -1
{edsl-0.1.50.dist-info → edsl-0.1.51.dist-info}/RECORD +108 -106
edsl/questions/derived/__init__.py +0 -0
{edsl-0.1.50.dist-info → edsl-0.1.51.dist-info}/LICENSE +0 -0
{edsl-0.1.50.dist-info → edsl-0.1.51.dist-info}/WHEEL +0 -0
{edsl-0.1.50.dist-info → edsl-0.1.51.dist-info}/entry_points.txt +0 -0

edsl/questions/question_check_box.py CHANGED Viewed

@@ -1,8 +1,9 @@
 from __future__ import annotations
 from typing import Any, Optional, TYPE_CHECKING
+import random
 from jinja2 import Template
-from pydantic import BaseModel, Field
+from pydantic import BaseModel, Field, model_validator, ValidationError
 from typing import List, Literal, Annotated
 from .exceptions import QuestionAnswerValidationError
@@ -17,9 +18,45 @@ from .decorators import inject_exception
 from .response_validator_abc import ResponseValidatorABC
 if TYPE_CHECKING:
-    from .data_structures import (
-        BaseResponse,
-    )
+    pass
+class CheckboxResponse(BaseModel):
+    """
+    Base Pydantic model for validating checkbox responses.
+    This model defines the structure and validation rules for responses to
+    checkbox questions, ensuring that selected options are properly formatted
+    as a list of choices.
+    Attributes:
+        answer: List of selected choices
+        comment: Optional comment provided with the answer
+        generated_tokens: Optional raw LLM output for token tracking
+    Examples:
+        >>> # Valid response with list of options
+        >>> response = CheckboxResponse(answer=[0, 1])
+        >>> response.answer
+        [0, 1]
+        >>> # Valid response with comment
+        >>> response = CheckboxResponse(answer=[1], comment="This is my choice")
+        >>> response.answer
+        [1]
+        >>> response.comment
+        'This is my choice'
+        >>> # Invalid non-list answer
+        >>> try:
+        ...     CheckboxResponse(answer=1)
+        ... except Exception as e:
+        ...     print("Validation error occurred")
+        Validation error occurred
+    """
+    answer: List[Any]
+    comment: Optional[str] = None
+    generated_tokens: Optional[Any] = None
 def create_checkbox_response_model(
@@ -30,40 +67,218 @@ def create_checkbox_response_model(
 ):
     """
     Dynamically create a CheckboxResponse model with a predefined list of choices.
-    :param choices: A list of allowed values for the answer field.
-    :param include_comment: Whether to include a comment field in the model.
-    :return: A new Pydantic model class.
+    This function creates a customized Pydantic model for checkbox questions that
+    validates both the format of the response and any constraints on selection count.
+    Args:
+        choices: A list of allowed values for the answer field
+        min_selections: Optional minimum number of selections required
+        max_selections: Optional maximum number of selections allowed
+        permissive: If True, constraints are not enforced
+    Returns:
+        A new Pydantic model class with appropriate validation
+    Examples:
+        >>> # Create model with constraints
+        >>> choices = [0, 1, 2, 3]
+        >>> ConstrainedModel = create_checkbox_response_model(
+        ...     choices=choices,
+        ...     min_selections=1,
+        ...     max_selections=2
+        ... )
+        >>> # Valid response within constraints
+        >>> response = ConstrainedModel(answer=[0, 1])
+        >>> response.answer
+        [0, 1]
+        >>> # Too few selections fails validation
+        >>> try:
+        ...     ConstrainedModel(answer=[])
+        ... except Exception as e:
+        ...     "at least 1" in str(e)
+        True
+        >>> # Too many selections fails validation
+        >>> try:
+        ...     ConstrainedModel(answer=[0, 1, 2])
+        ... except Exception as e:
+        ...     "at most 2" in str(e)
+        True
+        >>> # Invalid choice fails validation
+        >>> try:
+        ...     ConstrainedModel(answer=[4])
+        ... except Exception as e:
+        ...     any(x in str(e) for x in ["Invalid choice", "not a valid enumeration member", "validation error"])
+        True
+        >>> # Permissive model ignores constraints
+        >>> PermissiveModel = create_checkbox_response_model(
+        ...     choices=choices,
+        ...     min_selections=1,
+        ...     max_selections=2,
+        ...     permissive=True
+        ... )
+        >>> response = PermissiveModel(answer=[0, 1, 2])
+        >>> len(response.answer)
+        3
     """
     # Convert the choices list to a tuple for use with Literal
     choice_tuple = tuple(choices)
-    field_params = {}
-    if min_selections is not None and not permissive:
-        field_params["min_items"] = min_selections
-    if max_selections is not None and not permissive:
-        field_params["max_items"] = max_selections
-    class CheckboxResponse(BaseModel):
-        answer: Annotated[
-            List[Literal[choice_tuple]],
-            Field(..., **field_params),
-        ] = Field(..., description="List of selected choices")
-        comment: Optional[str] = Field(None, description="Optional comment field")
-        generated_tokens: Optional[Any] = Field(default=None)
-        class Config:
-            @staticmethod
-            def json_schema_extra(schema: dict, model: BaseModel) -> None:
-                # Add the list of choices to the schema for better documentation
-                for prop in schema.get("properties", {}).values():
-                    if prop.get("title") == "answer":
-                        prop["items"] = {"enum": choices}
-    return CheckboxResponse
+    if permissive:
+        # For permissive mode, we still validate the choice values but ignore count constraints
+        class PermissiveCheckboxResponse(CheckboxResponse):
+            """Checkbox response model with choices validation but no count constraints."""
+            answer: Annotated[
+                List[Literal[choice_tuple]],
+                Field(description="List of selected choices"),
+            ]
+            @model_validator(mode='after')
+            def validate_choices(self):
+                """Validate that each selected choice is valid."""
+                for choice in self.answer:
+                    if choice not in choices:
+                        validation_error = ValidationError.from_exception_data(
+                            title='CheckboxResponse',
+                            line_errors=[{
+                                'type': 'value_error',
+                                'loc': ('answer',),
+                                'msg': f'Invalid choice: {choice}. Must be one of: {choices}',
+                                'input': choice,
+                                'ctx': {'error': 'Invalid choice'}
+                            }]
+                        )
+                        raise QuestionAnswerValidationError(
+                            message=f"Invalid choice: {choice}. Must be one of: {choices}",
+                            data=self.model_dump(),
+                            model=self.__class__,
+                            pydantic_error=validation_error
+                        )
+                return self
+        return PermissiveCheckboxResponse
+    else:
+        # For non-permissive mode, enforce both choice values and count constraints
+        class ConstrainedCheckboxResponse(CheckboxResponse):
+            """Checkbox response model with both choice and count constraints."""
+            answer: Annotated[
+                List[Literal[choice_tuple]],
+                Field(description="List of selected choices"),
+            ]
+            @model_validator(mode='after')
+            def validate_selection_count(self):
+                """Validate that the number of selections meets constraints."""
+                if min_selections is not None and len(self.answer) < min_selections:
+                    validation_error = ValidationError.from_exception_data(
+                        title='CheckboxResponse',
+                        line_errors=[{
+                            'type': 'value_error',
+                            'loc': ('answer',),
+                            'msg': f'Must select at least {min_selections} option(s)',
+                            'input': self.answer,
+                            'ctx': {'error': 'Too few selections'}
+                        }]
+                    )
+                    raise QuestionAnswerValidationError(
+                        message=f"Must select at least {min_selections} option(s), got {len(self.answer)}",
+                        data=self.model_dump(),
+                        model=self.__class__,
+                        pydantic_error=validation_error
+                    )
+                if max_selections is not None and len(self.answer) > max_selections:
+                    validation_error = ValidationError.from_exception_data(
+                        title='CheckboxResponse',
+                        line_errors=[{
+                            'type': 'value_error',
+                            'loc': ('answer',),
+                            'msg': f'Must select at most {max_selections} option(s)',
+                            'input': self.answer,
+                            'ctx': {'error': 'Too many selections'}
+                        }]
+                    )
+                    raise QuestionAnswerValidationError(
+                        message=f"Must select at most {max_selections} option(s), got {len(self.answer)}",
+                        data=self.model_dump(),
+                        model=self.__class__,
+                        pydantic_error=validation_error
+                    )
+                # Also validate that each choice is valid
+                for choice in self.answer:
+                    if choice not in choices:
+                        validation_error = ValidationError.from_exception_data(
+                            title='CheckboxResponse',
+                            line_errors=[{
+                                'type': 'value_error',
+                                'loc': ('answer',),
+                                'msg': f'Invalid choice: {choice}. Must be one of: {choices}',
+                                'input': choice,
+                                'ctx': {'error': 'Invalid choice'}
+                            }]
+                        )
+                        raise QuestionAnswerValidationError(
+                            message=f"Invalid choice: {choice}. Must be one of: {choices}",
+                            data=self.model_dump(),
+                            model=self.__class__,
+                            pydantic_error=validation_error
+                        )
+                return self
+        return ConstrainedCheckboxResponse
 class CheckBoxResponseValidator(ResponseValidatorABC):
+    """
+    Validator for checkbox question responses.
+    This class implements the validation and fixing logic for checkbox responses.
+    It ensures that responses contain valid selections from the available options
+    and that the number of selections meets any constraints.
+    Attributes:
+        required_params: List of required parameters for validation.
+        valid_examples: Examples of valid responses for testing.
+        invalid_examples: Examples of invalid responses for testing.
+    Examples:
+        >>> from edsl import QuestionCheckBox
+        >>> q = QuestionCheckBox.example()
+        >>> validator = q.response_validator
+        >>> # Fix string to list
+        >>> response = {"answer": 1}
+        >>> fixed = validator.fix(response)
+        >>> isinstance(fixed["answer"], list)
+        True
+        >>> # Extract selections from text
+        >>> response = {"generated_tokens": "I choose options 0 and 2"}
+        >>> fixed = validator.fix(response)
+        >>> sorted(fixed["answer"])
+        [0, 2]
+        >>> # Fix comma-separated list
+        >>> response = {"generated_tokens": "0, 1, 3"}
+        >>> fixed = validator.fix(response)
+        >>> sorted(fixed["answer"])
+        [0, 1, 3]
+        >>> # Preserve comments when fixing
+        >>> response = {"answer": 1, "comment": "My explanation"}
+        >>> fixed = validator.fix(response)
+        >>> "comment" in fixed and fixed["comment"] == "My explanation"
+        True
+    """
     required_params = [
         "question_options",
         "min_selections",
@@ -80,12 +295,12 @@ class CheckBoxResponseValidator(ResponseValidatorABC):
         (
             {"answer": [-1]},
             {"question_options": ["Good", "Great", "OK", "Bad"]},
-            "Answer code must be a non-negative integer",
+            "Invalid choice",
         ),
         (
             {"answer": 1},
             {"question_options": ["Good", "Great", "OK", "Bad"]},
-            "Answer code must be a list",
+            "value is not a valid list",
         ),
         (
             {"answer": [1, 2, 3, 4]},
@@ -94,84 +309,217 @@ class CheckBoxResponseValidator(ResponseValidatorABC):
                 "min_selections": 1,
                 "max_selections": 2,
             },
-            "Too many options selected",
+            "Must select at most 2",
         ),
     ]
     def fix(self, response, verbose=False):
+        """
+        Fix common issues in checkbox responses.
+        This method attempts to extract valid selections from responses with
+        format issues. It can handle:
+        1. Single values that should be lists
+        2. Comma-separated strings in answer field or generated_tokens
+        3. Finding option indices mentioned in text
+        Args:
+            response: The response dictionary to fix
+            verbose: If True, print information about the fixing process
+        Returns:
+            A fixed version of the response dictionary with a valid list of selections
+        Notes:
+            - First tries to convert to a list if the answer is not already a list
+            - Then tries to parse comma-separated values from answer or generated_tokens
+            - Finally tries to find option indices mentioned in the text
+            - Preserves any comment in the original response
+        """
         if verbose:
             print("Invalid response of QuestionCheckBox was: ", response)
-        response_text = response.get("generated_tokens")
-        if response_text is None or response_text == "":  # nothing to be done
-            return response
-        # Maybe it's a comma separated list?
-        proposed_list = response_text.split(",")
-        proposed_list = [item.strip() for item in proposed_list]
-        if verbose:
-            print("Using code? ", self.use_code)
-        if self.use_code:
-            try:
-                proposed_list = [int(i) for i in proposed_list]
-            except ValueError:
-                # print("Could not convert to int")
-                pass
-        if verbose:
-            print("Proposed solution is: ", proposed_list)
-        # print(f"Ivalid generated tokens was was: {response_text}")
-        if "comment" in response:
-            proposed_data = {
-                "answer": proposed_list,
-                "comment": response["comment"],
-                "generated_tokens": response.get("generated_tokens", None),
-            }
-        else:
+        # Check if answer exists and is a comma-separated string (common LLM output format)
+        if "answer" in response and isinstance(response["answer"], str) and "," in response["answer"]:
+            if verbose:
+                print(f"Parsing comma-separated answer string: {response['answer']}")
+            # Split by commas and strip whitespace
+            proposed_list = response["answer"].split(",")
+            proposed_list = [item.strip() for item in proposed_list]
+            # Try to convert to integers if use_code is True
+            if self.use_code:
+                try:
+                    proposed_list = [int(i) for i in proposed_list]
+                except ValueError:
+                    # If we can't convert to integers, try to match values to indices
+                    if verbose:
+                        print("Could not convert comma-separated values to integers, trying to match options")
+                    # Try to match option text values to their indices
+                    index_map = {}
+                    for i, option in enumerate(self.question_options):
+                        index_map[option.lower().strip()] = i
+                    converted_list = []
+                    for item in proposed_list:
+                        item_lower = item.lower().strip()
+                        if item_lower in index_map:
+                            converted_list.append(index_map[item_lower])
+                    if converted_list:
+                        proposed_list = converted_list
+            if verbose:
+                print("Proposed solution from comma separation is: ", proposed_list)
             proposed_data = {
                 "answer": proposed_list,
-                "generated_tokens": response.get("generated_tokens", None),
+                "comment": response.get("comment"),
+                "generated_tokens": response.get("generated_tokens"),
             }
-        try:
-            self.response_model(**proposed_data)
-            print("Proposed solution is valid")
-            print("Returning proposed data: ", proposed_data)
-            return proposed_data
-        except Exception as e:
-            if verbose:
-                print(f"Proposed solution {proposed_data} is invalid. Error: {e}")
-            # return response
-        if verbose:
-            print("Now seeing if responses show up in the answer")
-        matches = []
-        for index, option in enumerate(self.question_options):
-            if self.use_code:
-                if str(index) in response_text:
-                    matches.append(index)
-            else:
-                if option in response_text:
-                    matches.append(index)
-        proposed_data = {
-            "answer": matches,
-            "comment": response.get("comment", None),
-            "generated_tokens": response.get("generated_tokens", None),
-        }
-        try:
-            self.response_model(**proposed_data)
-            return proposed_data
-        except Exception as e:
+            # Try validating with the proposed solution
+            try:
+                validated = self._base_validate(proposed_data)
+                return validated.model_dump()
+            except Exception as e:
+                if verbose:
+                    print(f"Comma-separated solution invalid: {e}")
+        # If answer exists but is not a list, convert it to a list
+        elif "answer" in response and not isinstance(response["answer"], list):
             if verbose:
-                print(f"Proposed solution {proposed_data} is invalid. Error: {e}")
-            return response
-    def custom_validate(self, response) -> 'BaseResponse':
-        if response.answer is None:
-            raise QuestionAnswerValidationError("Answer is missing.")
-        return response.dict()
+                print(f"Converting non-list answer {response['answer']} to a list")
+            answer_value = response["answer"]
+            response = {**response, "answer": [answer_value]}
+            # Try validating the fixed response
+            try:
+                validated = self._base_validate(response)
+                return validated.model_dump()
+            except Exception:
+                if verbose:
+                    print("Converting to list didn't fix the issue")
+        # Try parsing from generated_tokens if present
+        response_text = response.get("generated_tokens")
+        if response_text and isinstance(response_text, str):
+            # Try comma-separated list first
+            if "," in response_text:
+                proposed_list = response_text.split(",")
+                proposed_list = [item.strip() for item in proposed_list]
+                if self.use_code:
+                    try:
+                        proposed_list = [int(i) for i in proposed_list]
+                    except ValueError:
+                        # If we can't convert to integers, try to match values to indices
+                        if verbose:
+                            print("Could not convert comma-separated values to integers, trying to match options")
+                        # Try to match option text values to their indices
+                        index_map = {}
+                        for i, option in enumerate(self.question_options):
+                            index_map[option.lower().strip()] = i
+                        converted_list = []
+                        for item in proposed_list:
+                            item_lower = item.lower().strip()
+                            if item_lower in index_map:
+                                converted_list.append(index_map[item_lower])
+                        if converted_list:
+                            proposed_list = converted_list
+                if verbose:
+                    print("Proposed solution from comma separation is: ", proposed_list)
+                proposed_data = {
+                    "answer": proposed_list,
+                    "comment": response.get("comment"),
+                    "generated_tokens": response.get("generated_tokens"),
+                }
+                # Try validating with the proposed solution
+                try:
+                    validated = self._base_validate(proposed_data)
+                    return validated.model_dump()
+                except Exception as e:
+                    if verbose:
+                        print(f"Comma-separated solution invalid: {e}")
+            # Try finding option indices mentioned in the text
+            matches = []
+            for index, option in enumerate(self.question_options):
+                if self.use_code:
+                    if str(index) in response_text:
+                        matches.append(index)
+                else:
+                    if option in response_text:
+                        matches.append(option)
+            if matches:
+                if verbose:
+                    print(f"Found options mentioned in text: {matches}")
+                proposed_data = {
+                    "answer": matches,
+                    "comment": response.get("comment"),
+                    "generated_tokens": response.get("generated_tokens"),
+                }
+                # Try validating with the proposed solution
+                try:
+                    validated = self._base_validate(proposed_data)
+                    return validated.model_dump()
+                except Exception as e:
+                    if verbose:
+                        print(f"Text matching solution invalid: {e}")
+        # If nothing worked, return the original response
+        return response
 class QuestionCheckBox(QuestionBase):
-    """This question prompts the agent to select options from a list."""
+    """
+    A question that prompts the agent to select multiple options from a list.
+    QuestionCheckBox allows agents to select one or more items from a predefined
+    list of options. It's useful for "select all that apply" scenarios, multi-select
+    preferences, or any question where multiple valid selections are possible.
+    Attributes:
+        question_type (str): Identifier for this question type, set to "checkbox".
+        purpose (str): Brief description of when to use this question type.
+        question_options: List of available options to select from.
+        min_selections: Optional minimum number of selections required.
+        max_selections: Optional maximum number of selections allowed.
+        _response_model: Initially None, set by create_response_model().
+        response_validator_class: Class used to validate and fix responses.
+    Examples:
+        >>> # Basic creation works
+        >>> q = QuestionCheckBox.example()
+        >>> q.question_type
+        'checkbox'
+        >>> # Create preferences question with selection constraints
+        >>> q = QuestionCheckBox(
+        ...     question_name="favorite_fruits",
+        ...     question_text="Which fruits do you like?",
+        ...     question_options=["Apple", "Banana", "Cherry", "Durian", "Elderberry"],
+        ...     min_selections=1,
+        ...     max_selections=3
+        ... )
+        >>> q.question_options
+        ['Apple', 'Banana', 'Cherry', 'Durian', 'Elderberry']
+        >>> q.min_selections
+        1
+        >>> q.max_selections
+        3
+    """
     question_type = "checkbox"
     purpose = "When options are known and limited"
@@ -195,13 +543,41 @@ class QuestionCheckBox(QuestionBase):
         answering_instructions: Optional[str] = None,
         permissive: bool = False,
     ):
-        """Instantiate a new QuestionCheckBox.
-        :param question_name: The name of the question.
-        :param question_text: The text of the question.
-        :param question_options: The options the respondent should select from.
-        :param min_selections: The minimum number of options that must be selected.
-        :param max_selections: The maximum number of options that must be selected.
+        """
+        Initialize a new checkbox question.
+        Args:
+            question_name: Identifier for the question, used in results and templates.
+                          Must be a valid Python variable name.
+            question_text: The actual text of the question to be asked.
+            question_options: List of options the agent can select from.
+            min_selections: Optional minimum number of options that must be selected.
+            max_selections: Optional maximum number of options that can be selected.
+            include_comment: Whether to allow comments with the answer.
+            use_code: If True, use indices (0,1,2...) instead of option text values.
+            question_presentation: Optional custom presentation template.
+            answering_instructions: Optional additional instructions.
+            permissive: If True, ignore selection count constraints during validation.
+        Examples:
+            >>> q = QuestionCheckBox(
+            ...     question_name="symptoms",
+            ...     question_text="Select all symptoms you are experiencing:",
+            ...     question_options=["Fever", "Cough", "Headache", "Fatigue"],
+            ...     min_selections=1
+            ... )
+            >>> q.question_name
+            'symptoms'
+            >>> # Question with both min and max
+            >>> q = QuestionCheckBox(
+            ...     question_name="pizza_toppings",
+            ...     question_text="Choose 2-4 toppings for your pizza:",
+            ...     question_options=["Cheese", "Pepperoni", "Mushroom", "Onion",
+            ...                       "Sausage", "Bacon", "Pineapple"],
+            ...     min_selections=2,
+            ...     max_selections=4
+            ... )
         """
         self.question_name = question_name
         self.question_text = question_text
@@ -217,18 +593,35 @@ class QuestionCheckBox(QuestionBase):
         self.answering_instructions = answering_instructions
     def create_response_model(self):
+        """
+        Create a response model with the appropriate constraints.
+        This method creates a Pydantic model customized with the options and
+        selection count constraints specified for this question instance.
+        Returns:
+            A Pydantic model class tailored to this question's constraints.
+        Examples:
+            >>> q = QuestionCheckBox.example()
+            >>> model = q.create_response_model()
+            >>> model(answer=[0, 2])  # Select first and third options
+            ConstrainedCheckboxResponse(answer=[0, 2], comment=None, generated_tokens=None)
+        """
         if not self._use_code:
+            # Use option text values as valid choices
             return create_checkbox_response_model(
                 self.question_options,
                 min_selections=self.min_selections,
-                max_selections=self.max_selections,  # include_comment=self._include_comment
+                max_selections=self.max_selections,
                 permissive=self.permissive,
             )
         else:
+            # Use option indices (0, 1, 2...) as valid choices
             return create_checkbox_response_model(
                 list(range(len(self.question_options))),
                 min_selections=self.min_selections,
-                max_selections=self.max_selections,  # include_comment=self._include_comment
+                max_selections=self.max_selections,
                 permissive=self.permissive,
             )
@@ -236,10 +629,27 @@ class QuestionCheckBox(QuestionBase):
         self, answer_codes, scenario: "Scenario" = None
     ):
         """
-        Translate the answer code to the actual answer.
-        For example, for question options ["a", "b", "c"],the answer codes are 0, 1, and 2.
-        The LLM will respond with [0,1] and this code will translate it to ["a","b"].
+        Translate the answer codes to the actual answer text.
+        For checkbox questions with use_code=True, the agent responds with
+        option indices (e.g., [0, 1]) which need to be translated to their
+        corresponding option text values (e.g., ["Option A", "Option B"]).
+        Args:
+            answer_codes: List of selected option indices or values
+            scenario: Optional scenario with variables for template rendering
+        Returns:
+            List of selected option texts
+        Examples:
+            >>> q = QuestionCheckBox(
+            ...     question_name="example",
+            ...     question_text="Select options:",
+            ...     question_options=["A", "B", "C"]
+            ... )
+            >>> q._translate_answer_code_to_answer([0, 2])
+            ['A', 'C']
         """
         scenario = scenario or Scenario()
         translated_options = [
@@ -253,38 +663,73 @@ class QuestionCheckBox(QuestionBase):
                 translated_codes.append(answer_code)
         return translated_codes
-    # def _simulate_answer(self, human_readable=True) -> dict[str, Union[int, str]]:
-    #     """Simulate a valid answer for debugging purposes."""
-    #     from edsl.utilities.utilities import random_string
-    #     min_selections = self.min_selections or 1
-    #     max_selections = self.max_selections or len(self.question_options)
-    #     num_selections = random.randint(min_selections, max_selections)
-    #     if human_readable:
-    #         # Select a random number of options from self.question_options
-    #         selected_options = random.sample(self.question_options, num_selections)
-    #         answer = {
-    #             "answer": selected_options,
-    #             "comment": random_string(),
-    #         }
-    #     else:
-    #         # Select a random number of indices from the range of self.question_options
-    #         selected_indices = random.sample(
-    #             range(len(self.question_options)), num_selections
-    #         )
-    #         answer = {
-    #             "answer": selected_indices,
-    #             "comment": random_string(),
-    #         }
-    #     return answer
+    def _simulate_answer(self, human_readable=True):
+        """
+        Simulate a valid answer for debugging purposes.
+        This method generates a random valid answer for the checkbox question,
+        useful for testing and demonstrations.
+        Args:
+            human_readable: If True, return option text values; if False, return indices
+        Returns:
+            A dictionary with a valid random answer
+        Examples:
+            >>> q = QuestionCheckBox.example()
+            >>> answer = q._simulate_answer(human_readable=False)
+            >>> len(answer["answer"]) >= q.min_selections
+            True
+            >>> len(answer["answer"]) <= q.max_selections
+            True
+        """
+        from edsl.utilities.utilities import random_string
+        min_sel = self.min_selections or 1
+        max_sel = self.max_selections or len(self.question_options)
+        # Ensure we don't try to select more options than available
+        max_sel = min(max_sel, len(self.question_options))
+        min_sel = min(min_sel, max_sel)
+        num_selections = random.randint(min_sel, max_sel)
+        if human_readable:
+            # Select a random number of options from self.question_options
+            selected_options = random.sample(self.question_options, num_selections)
+            answer = {
+                "answer": selected_options,
+                "comment": random_string(),
+            }
+        else:
+            # Select a random number of indices from the range of self.question_options
+            selected_indices = random.sample(
+                range(len(self.question_options)), num_selections
+            )
+            answer = {
+                "answer": selected_indices,
+                "comment": random_string(),
+            }
+        return answer
     @property
     def question_html_content(self) -> str:
+        """
+        Generate HTML content for rendering the question in web interfaces.
+        This property generates HTML markup for the question when it needs to be
+        displayed in web interfaces or HTML contexts. For a checkbox question,
+        this is a set of checkbox input elements, one for each option.
+        Returns:
+            str: HTML markup for rendering the question.
+        """
         instructions = ""
         if self.min_selections is not None:
             instructions += f"Select at least {self.min_selections} option(s). "
         if self.max_selections is not None:
             instructions += f"Select at most {self.max_selections} option(s)."
         question_html_content = Template(
             """
         <p>{{ instructions }}</p>
@@ -308,7 +753,30 @@ class QuestionCheckBox(QuestionBase):
     @classmethod
     @inject_exception
     def example(cls, include_comment=False, use_code=True) -> QuestionCheckBox:
-        """Return an example checkbox question."""
+        """
+        Create an example instance of a checkbox question.
+        This class method creates a predefined example of a checkbox question
+        for demonstration, testing, and documentation purposes.
+        Args:
+            include_comment: Whether to include a comment field with the answer.
+            use_code: Whether to use indices (True) or values (False) for answer codes.
+        Returns:
+            QuestionCheckBox: An example checkbox question.
+        Examples:
+            >>> q = QuestionCheckBox.example()
+            >>> q.question_name
+            'never_eat'
+            >>> len(q.question_options)
+            5
+            >>> q.min_selections
+            2
+            >>> q.max_selections
+            5
+        """
         return cls(
             question_name="never_eat",
             question_text="Which of the following foods would you eat if you had to?",
@@ -327,31 +795,65 @@ class QuestionCheckBox(QuestionBase):
 def main():
-    """Create an example QuestionCheckBox and test its methods."""
-    from edsl.questions.QuestionCheckBox import QuestionCheckBox
+    """
+    Demonstrate the functionality of the QuestionCheckBox class.
+    This function creates an example checkbox question and demonstrates its
+    key features including validation, serialization, and answer simulation.
+    It's primarily intended for testing and development purposes.
+    Note:
+        This function will be executed when the module is run directly,
+        but not when imported.
+    """
+    print("Creating a QuestionCheckBox example...")
     q = QuestionCheckBox.example()
-    q.question_text
-    q.question_options
-    q.question_name
-    # validate an answer
-    q._validate_answer({"answer": [1, 2], "comment": "I like custard"})
-    # translate answer code
-    q._translate_answer_code_to_answer([1, 2])
-    # simulate answer
-    q._simulate_answer()
-    q._simulate_answer(human_readable=False)
-    q._validate_answer(q._simulate_answer(human_readable=False))
-    # serialization (inherits from Question)
-    q.to_dict()
-    assert q.from_dict(q.to_dict()) == q
+    print(f"Question text: {q.question_text}")
+    print(f"Question name: {q.question_name}")
+    print(f"Question options: {q.question_options}")
+    print(f"Min selections: {q.min_selections}")
+    print(f"Max selections: {q.max_selections}")
+    # Validate an answer
+    print("\nValidating an answer...")
+    valid_answer = {"answer": [1, 2], "comment": "I like these foods"}
+    validated = q._validate_answer(valid_answer)
+    print(f"Validated answer: {validated}")
+    # Translate answer codes
+    print("\nTranslating answer codes...")
+    translated = q._translate_answer_code_to_answer([1, 2])
+    print(f"Translated answer: {translated}")
+    # Simulate answers
+    print("\nSimulating answers...")
+    simulated_human = q._simulate_answer(human_readable=True)
+    print(f"Simulated human-readable answer: {simulated_human}")
+    simulated_codes = q._simulate_answer(human_readable=False)
+    print(f"Simulated code answer: {simulated_codes}")
+    # Validate simulated answer
+    validated_simulated = q._validate_answer(simulated_codes)
+    print(f"Validated simulated answer: {validated_simulated}")
+    # Serialization demonstration
+    print("\nTesting serialization...")
+    serialized = q.to_dict()
+    print(f"Serialized question (keys): {list(serialized.keys())}")
+    deserialized = QuestionBase.from_dict(serialized)
+    print(f"Deserialization successful: {deserialized.question_text == q.question_text}")
+    # Run doctests
+    print("\nRunning doctests...")
     import doctest
     doctest.testmod(optionflags=doctest.ELLIPSIS)
+    print("Doctests completed")
 if __name__ == "__main__":
     import doctest
     doctest.testmod(optionflags=doctest.ELLIPSIS)
+    # Uncomment to run demonstration
+    # main()

edsl 0.1.50__py3-none-any.whl → 0.1.51__py3-none-any.whl

edsl 0.1.50__py3-none-any.whl → 0.1.51__py3-none-any.whl