edsl 0.1.39.dev3__py3-none-any.whl → 0.1.39.dev5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (341)
  1. edsl/Base.py +413 -332
  2. edsl/BaseDiff.py +260 -260
  3. edsl/TemplateLoader.py +24 -24
  4. edsl/__init__.py +57 -49
  5. edsl/__version__.py +1 -1
  6. edsl/agents/Agent.py +1071 -867
  7. edsl/agents/AgentList.py +551 -413
  8. edsl/agents/Invigilator.py +284 -233
  9. edsl/agents/InvigilatorBase.py +257 -270
  10. edsl/agents/PromptConstructor.py +272 -354
  11. edsl/agents/QuestionInstructionPromptBuilder.py +128 -0
  12. edsl/agents/QuestionTemplateReplacementsBuilder.py +137 -0
  13. edsl/agents/__init__.py +2 -3
  14. edsl/agents/descriptors.py +99 -99
  15. edsl/agents/prompt_helpers.py +129 -129
  16. edsl/agents/question_option_processor.py +172 -0
  17. edsl/auto/AutoStudy.py +130 -117
  18. edsl/auto/StageBase.py +243 -230
  19. edsl/auto/StageGenerateSurvey.py +178 -178
  20. edsl/auto/StageLabelQuestions.py +125 -125
  21. edsl/auto/StagePersona.py +61 -61
  22. edsl/auto/StagePersonaDimensionValueRanges.py +88 -88
  23. edsl/auto/StagePersonaDimensionValues.py +74 -74
  24. edsl/auto/StagePersonaDimensions.py +69 -69
  25. edsl/auto/StageQuestions.py +74 -73
  26. edsl/auto/SurveyCreatorPipeline.py +21 -21
  27. edsl/auto/utilities.py +218 -224
  28. edsl/base/Base.py +279 -279
  29. edsl/config.py +177 -157
  30. edsl/conversation/Conversation.py +290 -290
  31. edsl/conversation/car_buying.py +59 -58
  32. edsl/conversation/chips.py +95 -95
  33. edsl/conversation/mug_negotiation.py +81 -81
  34. edsl/conversation/next_speaker_utilities.py +93 -93
  35. edsl/coop/CoopFunctionsMixin.py +15 -0
  36. edsl/coop/ExpectedParrotKeyHandler.py +125 -0
  37. edsl/coop/PriceFetcher.py +54 -54
  38. edsl/coop/__init__.py +2 -2
  39. edsl/coop/coop.py +1106 -1028
  40. edsl/coop/utils.py +131 -131
  41. edsl/data/Cache.py +573 -555
  42. edsl/data/CacheEntry.py +230 -233
  43. edsl/data/CacheHandler.py +168 -149
  44. edsl/data/RemoteCacheSync.py +186 -78
  45. edsl/data/SQLiteDict.py +292 -292
  46. edsl/data/__init__.py +5 -4
  47. edsl/data/orm.py +10 -10
  48. edsl/data_transfer_models.py +74 -73
  49. edsl/enums.py +202 -175
  50. edsl/exceptions/BaseException.py +21 -21
  51. edsl/exceptions/__init__.py +54 -54
  52. edsl/exceptions/agents.py +54 -42
  53. edsl/exceptions/cache.py +5 -5
  54. edsl/exceptions/configuration.py +16 -16
  55. edsl/exceptions/coop.py +10 -10
  56. edsl/exceptions/data.py +14 -14
  57. edsl/exceptions/general.py +34 -34
  58. edsl/exceptions/inference_services.py +5 -0
  59. edsl/exceptions/jobs.py +33 -33
  60. edsl/exceptions/language_models.py +63 -63
  61. edsl/exceptions/prompts.py +15 -15
  62. edsl/exceptions/questions.py +109 -91
  63. edsl/exceptions/results.py +29 -29
  64. edsl/exceptions/scenarios.py +29 -22
  65. edsl/exceptions/surveys.py +37 -37
  66. edsl/inference_services/AnthropicService.py +106 -87
  67. edsl/inference_services/AvailableModelCacheHandler.py +184 -0
  68. edsl/inference_services/AvailableModelFetcher.py +215 -0
  69. edsl/inference_services/AwsBedrock.py +118 -120
  70. edsl/inference_services/AzureAI.py +215 -217
  71. edsl/inference_services/DeepInfraService.py +18 -18
  72. edsl/inference_services/GoogleService.py +143 -148
  73. edsl/inference_services/GroqService.py +20 -20
  74. edsl/inference_services/InferenceServiceABC.py +80 -147
  75. edsl/inference_services/InferenceServicesCollection.py +138 -97
  76. edsl/inference_services/MistralAIService.py +120 -123
  77. edsl/inference_services/OllamaService.py +18 -18
  78. edsl/inference_services/OpenAIService.py +236 -224
  79. edsl/inference_services/PerplexityService.py +160 -163
  80. edsl/inference_services/ServiceAvailability.py +135 -0
  81. edsl/inference_services/TestService.py +90 -89
  82. edsl/inference_services/TogetherAIService.py +172 -170
  83. edsl/inference_services/data_structures.py +134 -0
  84. edsl/inference_services/models_available_cache.py +118 -118
  85. edsl/inference_services/rate_limits_cache.py +25 -25
  86. edsl/inference_services/registry.py +41 -41
  87. edsl/inference_services/write_available.py +10 -10
  88. edsl/jobs/AnswerQuestionFunctionConstructor.py +223 -0
  89. edsl/jobs/Answers.py +43 -56
  90. edsl/jobs/FetchInvigilator.py +47 -0
  91. edsl/jobs/InterviewTaskManager.py +98 -0
  92. edsl/jobs/InterviewsConstructor.py +50 -0
  93. edsl/jobs/Jobs.py +823 -898
  94. edsl/jobs/JobsChecks.py +172 -147
  95. edsl/jobs/JobsComponentConstructor.py +189 -0
  96. edsl/jobs/JobsPrompts.py +270 -268
  97. edsl/jobs/JobsRemoteInferenceHandler.py +311 -239
  98. edsl/jobs/JobsRemoteInferenceLogger.py +239 -0
  99. edsl/jobs/RequestTokenEstimator.py +30 -0
  100. edsl/jobs/__init__.py +1 -1
  101. edsl/jobs/async_interview_runner.py +138 -0
  102. edsl/jobs/buckets/BucketCollection.py +104 -63
  103. edsl/jobs/buckets/ModelBuckets.py +65 -65
  104. edsl/jobs/buckets/TokenBucket.py +283 -251
  105. edsl/jobs/buckets/TokenBucketAPI.py +211 -0
  106. edsl/jobs/buckets/TokenBucketClient.py +191 -0
  107. edsl/jobs/check_survey_scenario_compatibility.py +85 -0
  108. edsl/jobs/data_structures.py +120 -0
  109. edsl/jobs/decorators.py +35 -0
  110. edsl/jobs/interviews/Interview.py +396 -661
  111. edsl/jobs/interviews/InterviewExceptionCollection.py +99 -99
  112. edsl/jobs/interviews/InterviewExceptionEntry.py +186 -186
  113. edsl/jobs/interviews/InterviewStatistic.py +63 -63
  114. edsl/jobs/interviews/InterviewStatisticsCollection.py +25 -25
  115. edsl/jobs/interviews/InterviewStatusDictionary.py +78 -78
  116. edsl/jobs/interviews/InterviewStatusLog.py +92 -92
  117. edsl/jobs/interviews/ReportErrors.py +66 -66
  118. edsl/jobs/interviews/interview_status_enum.py +9 -9
  119. edsl/jobs/jobs_status_enums.py +9 -0
  120. edsl/jobs/loggers/HTMLTableJobLogger.py +304 -0
  121. edsl/jobs/results_exceptions_handler.py +98 -0
  122. edsl/jobs/runners/JobsRunnerAsyncio.py +151 -466
  123. edsl/jobs/runners/JobsRunnerStatus.py +297 -330
  124. edsl/jobs/tasks/QuestionTaskCreator.py +244 -242
  125. edsl/jobs/tasks/TaskCreators.py +64 -64
  126. edsl/jobs/tasks/TaskHistory.py +470 -450
  127. edsl/jobs/tasks/TaskStatusLog.py +23 -23
  128. edsl/jobs/tasks/task_status_enum.py +161 -163
  129. edsl/jobs/tokens/InterviewTokenUsage.py +27 -27
  130. edsl/jobs/tokens/TokenUsage.py +34 -34
  131. edsl/language_models/ComputeCost.py +63 -0
  132. edsl/language_models/LanguageModel.py +626 -668
  133. edsl/language_models/ModelList.py +164 -155
  134. edsl/language_models/PriceManager.py +127 -0
  135. edsl/language_models/RawResponseHandler.py +106 -0
  136. edsl/language_models/RegisterLanguageModelsMeta.py +184 -184
  137. edsl/language_models/ServiceDataSources.py +0 -0
  138. edsl/language_models/__init__.py +2 -3
  139. edsl/language_models/fake_openai_call.py +15 -15
  140. edsl/language_models/fake_openai_service.py +61 -61
  141. edsl/language_models/key_management/KeyLookup.py +63 -0
  142. edsl/language_models/key_management/KeyLookupBuilder.py +273 -0
  143. edsl/language_models/key_management/KeyLookupCollection.py +38 -0
  144. edsl/language_models/key_management/__init__.py +0 -0
  145. edsl/language_models/key_management/models.py +131 -0
  146. edsl/language_models/model.py +256 -0
  147. edsl/language_models/repair.py +156 -156
  148. edsl/language_models/utilities.py +65 -64
  149. edsl/notebooks/Notebook.py +263 -258
  150. edsl/notebooks/NotebookToLaTeX.py +142 -0
  151. edsl/notebooks/__init__.py +1 -1
  152. edsl/prompts/Prompt.py +352 -362
  153. edsl/prompts/__init__.py +2 -2
  154. edsl/questions/ExceptionExplainer.py +77 -0
  155. edsl/questions/HTMLQuestion.py +103 -0
  156. edsl/questions/QuestionBase.py +518 -664
  157. edsl/questions/QuestionBasePromptsMixin.py +221 -217
  158. edsl/questions/QuestionBudget.py +227 -227
  159. edsl/questions/QuestionCheckBox.py +359 -359
  160. edsl/questions/QuestionExtract.py +180 -182
  161. edsl/questions/QuestionFreeText.py +113 -114
  162. edsl/questions/QuestionFunctional.py +166 -166
  163. edsl/questions/QuestionList.py +223 -231
  164. edsl/questions/QuestionMatrix.py +265 -0
  165. edsl/questions/QuestionMultipleChoice.py +330 -286
  166. edsl/questions/QuestionNumerical.py +151 -153
  167. edsl/questions/QuestionRank.py +314 -324
  168. edsl/questions/Quick.py +41 -41
  169. edsl/questions/SimpleAskMixin.py +74 -73
  170. edsl/questions/__init__.py +27 -26
  171. edsl/questions/{AnswerValidatorMixin.py → answer_validator_mixin.py} +334 -289
  172. edsl/questions/compose_questions.py +98 -98
  173. edsl/questions/data_structures.py +20 -0
  174. edsl/questions/decorators.py +21 -21
  175. edsl/questions/derived/QuestionLikertFive.py +76 -76
  176. edsl/questions/derived/QuestionLinearScale.py +90 -87
  177. edsl/questions/derived/QuestionTopK.py +93 -93
  178. edsl/questions/derived/QuestionYesNo.py +82 -82
  179. edsl/questions/descriptors.py +427 -413
  180. edsl/questions/loop_processor.py +149 -0
  181. edsl/questions/prompt_templates/question_budget.jinja +13 -13
  182. edsl/questions/prompt_templates/question_checkbox.jinja +32 -32
  183. edsl/questions/prompt_templates/question_extract.jinja +11 -11
  184. edsl/questions/prompt_templates/question_free_text.jinja +3 -3
  185. edsl/questions/prompt_templates/question_linear_scale.jinja +11 -11
  186. edsl/questions/prompt_templates/question_list.jinja +17 -17
  187. edsl/questions/prompt_templates/question_multiple_choice.jinja +33 -33
  188. edsl/questions/prompt_templates/question_numerical.jinja +36 -36
  189. edsl/questions/{QuestionBaseGenMixin.py → question_base_gen_mixin.py} +168 -161
  190. edsl/questions/question_registry.py +177 -177
  191. edsl/questions/{RegisterQuestionsMeta.py → register_questions_meta.py} +71 -71
  192. edsl/questions/{ResponseValidatorABC.py → response_validator_abc.py} +188 -174
  193. edsl/questions/response_validator_factory.py +34 -0
  194. edsl/questions/settings.py +12 -12
  195. edsl/questions/templates/budget/answering_instructions.jinja +7 -7
  196. edsl/questions/templates/budget/question_presentation.jinja +7 -7
  197. edsl/questions/templates/checkbox/answering_instructions.jinja +10 -10
  198. edsl/questions/templates/checkbox/question_presentation.jinja +22 -22
  199. edsl/questions/templates/extract/answering_instructions.jinja +7 -7
  200. edsl/questions/templates/likert_five/answering_instructions.jinja +10 -10
  201. edsl/questions/templates/likert_five/question_presentation.jinja +11 -11
  202. edsl/questions/templates/linear_scale/answering_instructions.jinja +5 -5
  203. edsl/questions/templates/linear_scale/question_presentation.jinja +5 -5
  204. edsl/questions/templates/list/answering_instructions.jinja +3 -3
  205. edsl/questions/templates/list/question_presentation.jinja +5 -5
  206. edsl/questions/templates/matrix/__init__.py +1 -0
  207. edsl/questions/templates/matrix/answering_instructions.jinja +5 -0
  208. edsl/questions/templates/matrix/question_presentation.jinja +20 -0
  209. edsl/questions/templates/multiple_choice/answering_instructions.jinja +9 -9
  210. edsl/questions/templates/multiple_choice/question_presentation.jinja +11 -11
  211. edsl/questions/templates/numerical/answering_instructions.jinja +6 -6
  212. edsl/questions/templates/numerical/question_presentation.jinja +6 -6
  213. edsl/questions/templates/rank/answering_instructions.jinja +11 -11
  214. edsl/questions/templates/rank/question_presentation.jinja +15 -15
  215. edsl/questions/templates/top_k/answering_instructions.jinja +8 -8
  216. edsl/questions/templates/top_k/question_presentation.jinja +22 -22
  217. edsl/questions/templates/yes_no/answering_instructions.jinja +6 -6
  218. edsl/questions/templates/yes_no/question_presentation.jinja +11 -11
  219. edsl/results/CSSParameterizer.py +108 -108
  220. edsl/results/Dataset.py +587 -424
  221. edsl/results/DatasetExportMixin.py +594 -731
  222. edsl/results/DatasetTree.py +295 -275
  223. edsl/results/MarkdownToDocx.py +122 -0
  224. edsl/results/MarkdownToPDF.py +111 -0
  225. edsl/results/Result.py +557 -465
  226. edsl/results/Results.py +1183 -1165
  227. edsl/results/ResultsExportMixin.py +45 -43
  228. edsl/results/ResultsGGMixin.py +121 -121
  229. edsl/results/TableDisplay.py +125 -198
  230. edsl/results/TextEditor.py +50 -0
  231. edsl/results/__init__.py +2 -2
  232. edsl/results/file_exports.py +252 -0
  233. edsl/results/{ResultsFetchMixin.py → results_fetch_mixin.py} +33 -33
  234. edsl/results/{Selector.py → results_selector.py} +145 -135
  235. edsl/results/{ResultsToolsMixin.py → results_tools_mixin.py} +98 -98
  236. edsl/results/smart_objects.py +96 -0
  237. edsl/results/table_data_class.py +12 -0
  238. edsl/results/table_display.css +77 -77
  239. edsl/results/table_renderers.py +118 -0
  240. edsl/results/tree_explore.py +115 -115
  241. edsl/scenarios/ConstructDownloadLink.py +109 -0
  242. edsl/scenarios/DocumentChunker.py +102 -0
  243. edsl/scenarios/DocxScenario.py +16 -0
  244. edsl/scenarios/FileStore.py +511 -632
  245. edsl/scenarios/PdfExtractor.py +40 -0
  246. edsl/scenarios/Scenario.py +498 -601
  247. edsl/scenarios/ScenarioHtmlMixin.py +65 -64
  248. edsl/scenarios/ScenarioList.py +1458 -1287
  249. edsl/scenarios/ScenarioListExportMixin.py +45 -52
  250. edsl/scenarios/ScenarioListPdfMixin.py +239 -261
  251. edsl/scenarios/__init__.py +3 -4
  252. edsl/scenarios/directory_scanner.py +96 -0
  253. edsl/scenarios/file_methods.py +85 -0
  254. edsl/scenarios/handlers/__init__.py +13 -0
  255. edsl/scenarios/handlers/csv.py +38 -0
  256. edsl/scenarios/handlers/docx.py +76 -0
  257. edsl/scenarios/handlers/html.py +37 -0
  258. edsl/scenarios/handlers/json.py +111 -0
  259. edsl/scenarios/handlers/latex.py +5 -0
  260. edsl/scenarios/handlers/md.py +51 -0
  261. edsl/scenarios/handlers/pdf.py +68 -0
  262. edsl/scenarios/handlers/png.py +39 -0
  263. edsl/scenarios/handlers/pptx.py +105 -0
  264. edsl/scenarios/handlers/py.py +294 -0
  265. edsl/scenarios/handlers/sql.py +313 -0
  266. edsl/scenarios/handlers/sqlite.py +149 -0
  267. edsl/scenarios/handlers/txt.py +33 -0
  268. edsl/scenarios/{ScenarioJoin.py → scenario_join.py} +131 -127
  269. edsl/scenarios/scenario_selector.py +156 -0
  270. edsl/shared.py +1 -1
  271. edsl/study/ObjectEntry.py +173 -173
  272. edsl/study/ProofOfWork.py +113 -113
  273. edsl/study/SnapShot.py +80 -80
  274. edsl/study/Study.py +521 -528
  275. edsl/study/__init__.py +4 -4
  276. edsl/surveys/ConstructDAG.py +92 -0
  277. edsl/surveys/DAG.py +148 -148
  278. edsl/surveys/EditSurvey.py +221 -0
  279. edsl/surveys/InstructionHandler.py +100 -0
  280. edsl/surveys/Memory.py +31 -31
  281. edsl/surveys/MemoryManagement.py +72 -0
  282. edsl/surveys/MemoryPlan.py +244 -244
  283. edsl/surveys/Rule.py +327 -326
  284. edsl/surveys/RuleCollection.py +385 -387
  285. edsl/surveys/RuleManager.py +172 -0
  286. edsl/surveys/Simulator.py +75 -0
  287. edsl/surveys/Survey.py +1280 -1801
  288. edsl/surveys/SurveyCSS.py +273 -261
  289. edsl/surveys/SurveyExportMixin.py +259 -259
  290. edsl/surveys/{SurveyFlowVisualizationMixin.py → SurveyFlowVisualization.py} +181 -179
  291. edsl/surveys/SurveyQualtricsImport.py +284 -284
  292. edsl/surveys/SurveyToApp.py +141 -0
  293. edsl/surveys/__init__.py +5 -3
  294. edsl/surveys/base.py +53 -53
  295. edsl/surveys/descriptors.py +60 -56
  296. edsl/surveys/instructions/ChangeInstruction.py +48 -49
  297. edsl/surveys/instructions/Instruction.py +56 -65
  298. edsl/surveys/instructions/InstructionCollection.py +82 -77
  299. edsl/templates/error_reporting/base.html +23 -23
  300. edsl/templates/error_reporting/exceptions_by_model.html +34 -34
  301. edsl/templates/error_reporting/exceptions_by_question_name.html +16 -16
  302. edsl/templates/error_reporting/exceptions_by_type.html +16 -16
  303. edsl/templates/error_reporting/interview_details.html +115 -115
  304. edsl/templates/error_reporting/interviews.html +19 -19
  305. edsl/templates/error_reporting/overview.html +4 -4
  306. edsl/templates/error_reporting/performance_plot.html +1 -1
  307. edsl/templates/error_reporting/report.css +73 -73
  308. edsl/templates/error_reporting/report.html +117 -117
  309. edsl/templates/error_reporting/report.js +25 -25
  310. edsl/tools/__init__.py +1 -1
  311. edsl/tools/clusters.py +192 -192
  312. edsl/tools/embeddings.py +27 -27
  313. edsl/tools/embeddings_plotting.py +118 -118
  314. edsl/tools/plotting.py +112 -112
  315. edsl/tools/summarize.py +18 -18
  316. edsl/utilities/PrettyList.py +56 -0
  317. edsl/utilities/SystemInfo.py +28 -28
  318. edsl/utilities/__init__.py +22 -22
  319. edsl/utilities/ast_utilities.py +25 -25
  320. edsl/utilities/data/Registry.py +6 -6
  321. edsl/utilities/data/__init__.py +1 -1
  322. edsl/utilities/data/scooter_results.json +1 -1
  323. edsl/utilities/decorators.py +77 -77
  324. edsl/utilities/gcp_bucket/cloud_storage.py +96 -96
  325. edsl/utilities/interface.py +627 -627
  326. edsl/utilities/is_notebook.py +18 -0
  327. edsl/utilities/is_valid_variable_name.py +11 -0
  328. edsl/utilities/naming_utilities.py +263 -263
  329. edsl/utilities/remove_edsl_version.py +24 -0
  330. edsl/utilities/repair_functions.py +28 -28
  331. edsl/utilities/restricted_python.py +70 -70
  332. edsl/utilities/utilities.py +436 -424
  333. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev5.dist-info}/LICENSE +21 -21
  334. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev5.dist-info}/METADATA +13 -11
  335. edsl-0.1.39.dev5.dist-info/RECORD +358 -0
  336. {edsl-0.1.39.dev3.dist-info → edsl-0.1.39.dev5.dist-info}/WHEEL +1 -1
  337. edsl/language_models/KeyLookup.py +0 -30
  338. edsl/language_models/registry.py +0 -190
  339. edsl/language_models/unused/ReplicateBase.py +0 -83
  340. edsl/results/ResultsDBMixin.py +0 -238
  341. edsl-0.1.39.dev3.dist-info/RECORD +0 -277
@@ -0,0 +1,184 @@
1
import os
import sqlite3
import tempfile
from dataclasses import dataclass
from datetime import datetime, timedelta
from pathlib import Path
from typing import List, Optional, Union, get_args

from platformdirs import user_cache_dir

from edsl.enums import InferenceServiceLiteral
from edsl.inference_services.data_structures import LanguageModelInfo, AvailableModels
12
+
13
+
14
class AvailableModelCacheHandler:
    """SQLite-backed cache of which models each inference service offers.

    Each row stores (timestamp, model_name, service_name); the
    (model_name, service_name) pair is UNIQUE and its timestamp is refreshed
    on every insert, so :meth:`models` can skip entries older than the
    validity window.
    """

    MAX_ROWS = 1000  # soft row cap, enforced by _prune_old_entries
    CACHE_VALIDITY_HOURS = 48

    def __init__(
        self,
        cache_validity_hours: int = 48,
        verbose: bool = False,
        testing_db_name: Optional[str] = None,
    ):
        """Open (or create) the cache database.

        :param cache_validity_hours: how long a cached entry stays fresh.
        :param verbose: print diagnostic messages.
        :param testing_db_name: when given, put the DB in a throwaway
            temporary directory instead of the per-user cache directory.
        """
        self.cache_validity_hours = cache_validity_hours
        self.verbose = verbose

        if testing_db_name:
            self.cache_dir = Path(tempfile.mkdtemp())
            self.db_path = self.cache_dir / testing_db_name
        else:
            self.cache_dir = Path(user_cache_dir("edsl", "model_availability"))
            self.db_path = self.cache_dir / "available_models.db"
        self.cache_dir.mkdir(parents=True, exist_ok=True)

        if os.path.exists(self.db_path):
            if self.verbose:
                print(f"Using existing cache DB: {self.db_path}")
        else:
            self._initialize_db()

    @property
    def path_to_db(self):
        """Filesystem path of the SQLite database."""
        return self.db_path

    @staticmethod
    def _now_stamp() -> str:
        """Current time as ISO-8601 text ("YYYY-MM-DD HH:MM:SS.ffffff").

        Timestamps are stored and compared as TEXT; this format sorts
        chronologically under plain string comparison, and matches what the
        (now deprecated, Python 3.12+) sqlite3 datetime adapter used to write.
        """
        return datetime.now().isoformat(sep=" ")

    def _initialize_db(self):
        """Initialize the SQLite database with the required schema."""
        with sqlite3.connect(self.db_path) as conn:
            cursor = conn.cursor()
            # Drop the old table if it exists (schema migration).
            cursor.execute("DROP TABLE IF EXISTS model_cache")
            cursor.execute(
                """
                CREATE TABLE IF NOT EXISTS model_cache (
                    timestamp DATETIME NOT NULL,
                    model_name TEXT NOT NULL,
                    service_name TEXT NOT NULL,
                    UNIQUE(model_name, service_name)
                )
                """
            )
            conn.commit()

    def _prune_old_entries(self, conn: sqlite3.Connection):
        """Delete oldest entries when MAX_ROWS is exceeded."""
        cursor = conn.cursor()
        cursor.execute("SELECT COUNT(*) FROM model_cache")
        count = cursor.fetchone()[0]

        if count > self.MAX_ROWS:
            cursor.execute(
                """
                DELETE FROM model_cache
                WHERE rowid IN (
                    SELECT rowid
                    FROM model_cache
                    ORDER BY timestamp ASC
                    LIMIT ?
                )
                """,
                (count - self.MAX_ROWS,),
            )
            conn.commit()

    @classmethod
    def example_models(cls) -> List["LanguageModelInfo"]:
        """Two sample entries, handy for demos and tests."""
        return [
            LanguageModelInfo(
                "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo", "deep_infra"
            ),
            LanguageModelInfo("openai/gpt-4", "openai"),
        ]

    def add_models_to_cache(self, models_data: List["LanguageModelInfo"]):
        """Add new models to the cache, updating timestamps for existing entries."""
        # Write the timestamp as explicit ISO text; relying on sqlite3's
        # implicit datetime adapter is deprecated since Python 3.12.
        current_time = self._now_stamp()

        with sqlite3.connect(self.db_path) as conn:
            cursor = conn.cursor()
            for model in models_data:
                cursor.execute(
                    """
                    INSERT INTO model_cache (timestamp, model_name, service_name)
                    VALUES (?, ?, ?)
                    ON CONFLICT(model_name, service_name)
                    DO UPDATE SET timestamp = excluded.timestamp
                    """,
                    (current_time, model.model_name, model.service_name),
                )

            # self._prune_old_entries(conn)  # pruning currently disabled
            conn.commit()

    def reset_cache(self):
        """Clear all entries from the cache."""
        with sqlite3.connect(self.db_path) as conn:
            cursor = conn.cursor()
            cursor.execute("DELETE FROM model_cache")
            conn.commit()

    @property
    def num_cache_entries(self):
        """Return the number of entries in the cache."""
        with sqlite3.connect(self.db_path) as conn:
            cursor = conn.cursor()
            cursor.execute("SELECT COUNT(*) FROM model_cache")
            count = cursor.fetchone()[0]
        return count

    def models(
        self,
        service: Optional["InferenceServiceLiteral"] = None,
    ) -> Union[None, "AvailableModels"]:
        """Return the available models within the cache validity period.

        :param service: if given, restrict results to that service.
        :return: AvailableModels of fresh entries, or None when none exist.
        """
        with sqlite3.connect(self.db_path) as conn:
            cursor = conn.cursor()
            # BUG FIX: the cutoff used to be a Unix-epoch float, but the
            # stored timestamps are TEXT; SQLite orders every REAL below
            # every TEXT, so "timestamp > ?" was always true and entries
            # never expired. Compare ISO text against ISO text instead.
            cutoff = (
                datetime.now() - timedelta(hours=self.cache_validity_hours)
            ).isoformat(sep=" ")

            if self.verbose:
                print(f"Fetching all with timestamp greater than {cutoff}")

            # BUG FIX: DISTINCT dropped — SQLite rejects ORDER BY on a column
            # that is not in a DISTINCT result set, and the UNIQUE constraint
            # on (model_name, service_name) already guarantees distinct rows.
            cursor.execute(
                """
                SELECT model_name, service_name
                FROM model_cache
                WHERE timestamp > ?
                ORDER BY timestamp DESC
                """,
                (cutoff,),
            )

            results = cursor.fetchall()
            if not results:
                if self.verbose:
                    print("No results found in cache DB.")
                return None

            matching_models = [
                LanguageModelInfo(model_name=row[0], service_name=row[1])
                for row in results
            ]

            if self.verbose:
                print(f"Found {len(matching_models)} models in cache DB.")
            if service:
                matching_models = [
                    model for model in matching_models if model.service_name == service
                ]

            return AvailableModels(matching_models)
173
+
174
+
175
+ if __name__ == "__main__":
176
+ import doctest
177
+
178
+ doctest.testmod()
179
+ # cache_handler = AvailableModelCacheHandler(verbose=True)
180
+ # models_data = cache_handler.example_models()
181
+ # cache_handler.add_models_to_cache(models_data)
182
+ # print(cache_handler.models())
183
+ # cache_handler.clear_cache()
184
+ # print(cache_handler.models())
@@ -0,0 +1,215 @@
1
+ from typing import Any, List, Tuple, Optional, Dict, TYPE_CHECKING, Union, Generator
2
+ from concurrent.futures import ThreadPoolExecutor, as_completed
3
+ from collections import UserList
4
+
5
+ from edsl.inference_services.ServiceAvailability import ServiceAvailability
6
+ from edsl.inference_services.InferenceServiceABC import InferenceServiceABC
7
+ from edsl.inference_services.data_structures import ModelNamesList
8
+ from edsl.enums import InferenceServiceLiteral
9
+
10
+ from edsl.inference_services.data_structures import LanguageModelInfo
11
+ from edsl.inference_services.AvailableModelCacheHandler import (
12
+ AvailableModelCacheHandler,
13
+ )
14
+
15
+
16
+ from edsl.inference_services.data_structures import AvailableModels
17
+
18
+
19
class AvailableModelFetcher:
    """Fetches available models from the various services.

    Results are cached on disk (SQLite, via AvailableModelCacheHandler)
    unless ``use_cache=False``.
    """

    service_availability = ServiceAvailability()
    CACHE_VALIDITY_HOURS = 48  # Cache validity period in hours

    def __init__(
        self,
        services: List["InferenceServiceABC"],
        added_models: Dict[str, List[str]],
        verbose: bool = False,
        use_cache: bool = True,
    ):
        """
        :param services: service instances to query.
        :param added_models: extra model names to append, keyed by service name.
        :param verbose: print diagnostic messages.
        :param use_cache: when False, every lookup hits the services directly.
        """
        self.services = services
        self.added_models = added_models
        # Map each service's string identifier to its instance for lookups.
        self._service_map = {
            service._inference_service_: service for service in services
        }
        self.verbose = verbose
        self.cache_handler = AvailableModelCacheHandler() if use_cache else None

    @property
    def num_cache_entries(self):
        """Row count of the underlying cache (requires use_cache=True)."""
        return self.cache_handler.num_cache_entries

    @property
    def path_to_db(self):
        """Path to the cache database (requires use_cache=True)."""
        return self.cache_handler.path_to_db

    def reset_cache(self):
        """Empty the cache, if one is in use."""
        if self.cache_handler:
            self.cache_handler.reset_cache()

    def available(
        self,
        service: Optional["InferenceServiceABC"] = None,
        force_refresh: bool = False,
    ) -> List["LanguageModelInfo"]:
        """
        Get available models from all services, using cached data when available.

        :param service: Optional[InferenceServiceABC] - If specified, only fetch models for this service.
        :param force_refresh: bypass the cache and query the services directly.

        >>> from edsl.inference_services.OpenAIService import OpenAIService
        >>> af = AvailableModelFetcher([OpenAIService()], {})
        >>> af.available(service="openai")
        [LanguageModelInfo(model_name='...', service_name='openai'), ...]

        Returns a list of [model, service_name, index] entries.
        """
        if service:  # they passed a specific service
            matching_models, _ = self.get_available_models_by_service(
                service=service, force_refresh=force_refresh
            )
            return matching_models

        # No specific service: fetch them all.
        # BUG FIX: force_refresh was previously dropped on this path.
        return self._get_all_models(force_refresh=force_refresh)

    def get_available_models_by_service(
        self,
        service: Union["InferenceServiceABC", "InferenceServiceLiteral"],
        force_refresh: bool = False,
    ) -> Tuple["AvailableModels", "InferenceServiceLiteral"]:
        """Get models for a single service, preferring cached data.

        :param service: InferenceServiceABC - e.g., OpenAIService or "openai"
        :return: Tuple[List[LanguageModelInfo], InferenceServiceLiteral]
        """
        if isinstance(service, str):
            service = self._fetch_service_by_service_name(service)

        # BUG FIX: with use_cache=False there is no cache handler; the old
        # code dereferenced it unconditionally and raised AttributeError.
        models_from_cache = None
        if not force_refresh and self.cache_handler is not None:
            models_from_cache = self.cache_handler.models(
                service=service._inference_service_
            )
            if self.verbose:
                print(
                    "Searching cache for models with service name:",
                    service._inference_service_,
                )
                print("Got models from cache:", models_from_cache)

        if models_from_cache:
            return models_from_cache, service._inference_service_
        return self.get_available_models_by_service_fresh(service)

    def get_available_models_by_service_fresh(
        self, service: Union["InferenceServiceABC", "InferenceServiceLiteral"]
    ) -> Tuple["AvailableModels", "InferenceServiceLiteral"]:
        """Get models for a single service. This method always fetches fresh data.

        :param service: InferenceServiceABC - e.g., OpenAIService or "openai"
        :return: Tuple[List[LanguageModelInfo], InferenceServiceLiteral]
        """
        if isinstance(service, str):
            service = self._fetch_service_by_service_name(service)

        service_models: "ModelNamesList" = (
            self.service_availability.get_service_available(service, warn=False)
        )
        service_name = service._inference_service_

        if not service_models:
            import warnings

            warnings.warn(f"No models found for service {service_name}")
            return [], service_name

        models_list = AvailableModels(
            [
                LanguageModelInfo(
                    model_name=model_name,
                    service_name=service_name,
                )
                for model_name in service_models
            ]
        )
        # BUG FIX: only update the cache when one exists (use_cache=True).
        if self.cache_handler is not None:
            self.cache_handler.add_models_to_cache(models_list)
        return models_list, service_name

    def _fetch_service_by_service_name(
        self, service_name: "InferenceServiceLiteral"
    ) -> "InferenceServiceABC":
        """The service name is the _inference_service_ attribute of the service."""
        if service_name in self._service_map:
            return self._service_map[service_name]
        raise ValueError(f"Service {service_name} not found")

    def _get_all_models(self, force_refresh=False) -> List["LanguageModelInfo"]:
        """Query every service concurrently and merge the results."""
        if not self.services:  # ThreadPoolExecutor rejects max_workers=0
            return AvailableModels([])

        all_models = []
        with ThreadPoolExecutor(max_workers=min(len(self.services), 10)) as executor:
            future_to_service = {
                executor.submit(
                    self.get_available_models_by_service, service, force_refresh
                ): service
                for service in self.services
            }

            for future in as_completed(future_to_service):
                # BUG FIX: resolve the service from the map up front; the old
                # code referenced a name that was unbound whenever
                # future.result() raised, turning any failure into a NameError.
                service_name = future_to_service[future]._inference_service_
                try:
                    models, service_name = future.result()
                    all_models.extend(models)

                    # Add any additional models for this service
                    for model in self.added_models.get(service_name, []):
                        all_models.append(
                            LanguageModelInfo(
                                model_name=model, service_name=service_name
                            )
                        )

                except Exception as exc:
                    print(f"Service query failed for service {service_name}: {exc}")
                    continue

        return AvailableModels(all_models)
190
+
191
+
192
def main():
    """Manual smoke test: fetch and print every model OpenAI reports."""
    from edsl.inference_services.OpenAIService import OpenAIService

    verbose_fetcher = AvailableModelFetcher([OpenAIService()], {}, verbose=True)
    # print(verbose_fetcher.available(service="openai"))

    quiet_fetcher = AvailableModelFetcher([OpenAIService()], {})
    all_models = quiet_fetcher._get_all_models(force_refresh=True)
    print(all_models)
201
+
202
+
203
+ if __name__ == "__main__":
204
+ import doctest
205
+
206
+ doctest.testmod(optionflags=doctest.ELLIPSIS)
207
+ # main()
208
+
209
+ # from edsl.inference_services.OpenAIService import OpenAIService
210
+
211
+ # af = AvailableModelFetcher([OpenAIService()], {}, verbose=True)
212
+ # # print(af.available(service="openai"))
213
+
214
+ # all_models = AvailableModelFetcher([OpenAIService()], {})._get_all_models()
215
+ # print(all_models)
@@ -1,120 +1,118 @@
1
- import os
2
- from typing import Any, List, Optional
3
- import re
4
- import boto3
5
- from botocore.exceptions import ClientError
6
- from edsl.inference_services.InferenceServiceABC import InferenceServiceABC
7
- from edsl.language_models.LanguageModel import LanguageModel
8
- import json
9
- from edsl.utilities.utilities import fix_partial_correct_response
10
-
11
-
12
- class AwsBedrockService(InferenceServiceABC):
13
- """AWS Bedrock service class."""
14
-
15
- _inference_service_ = "bedrock"
16
- _env_key_name_ = (
17
- "AWS_ACCESS_KEY_ID" # or any other environment key for AWS credentials
18
- )
19
- key_sequence = ["output", "message", "content", 0, "text"]
20
- input_token_name = "inputTokens"
21
- output_token_name = "outputTokens"
22
- usage_sequence = ["usage"]
23
- model_exclude_list = [
24
- "ai21.j2-grande-instruct",
25
- "ai21.j2-jumbo-instruct",
26
- "ai21.j2-mid",
27
- "ai21.j2-mid-v1",
28
- "ai21.j2-ultra",
29
- "ai21.j2-ultra-v1",
30
- ]
31
- _models_list_cache: List[str] = []
32
-
33
- @classmethod
34
- def available(cls):
35
- """Fetch available models from AWS Bedrock."""
36
-
37
- region = os.getenv("AWS_REGION", "us-east-1")
38
-
39
- if not cls._models_list_cache:
40
- client = boto3.client("bedrock", region_name=region)
41
- all_models_ids = [
42
- x["modelId"] for x in client.list_foundation_models()["modelSummaries"]
43
- ]
44
- else:
45
- all_models_ids = cls._models_list_cache
46
-
47
- return [m for m in all_models_ids if m not in cls.model_exclude_list]
48
-
49
- @classmethod
50
- def create_model(
51
- cls, model_name: str = "amazon.titan-tg1-large", model_class_name=None
52
- ) -> LanguageModel:
53
- if model_class_name is None:
54
- model_class_name = cls.to_class_name(model_name)
55
-
56
- class LLM(LanguageModel):
57
- """
58
- Child class of LanguageModel for interacting with AWS Bedrock models.
59
- """
60
-
61
- key_sequence = cls.key_sequence
62
- usage_sequence = cls.usage_sequence
63
- _inference_service_ = cls._inference_service_
64
- _model_ = model_name
65
- _parameters_ = {
66
- "temperature": 0.5,
67
- "max_tokens": 512,
68
- "top_p": 0.9,
69
- }
70
- input_token_name = cls.input_token_name
71
- output_token_name = cls.output_token_name
72
- _rpm = cls.get_rpm(cls)
73
- _tpm = cls.get_tpm(cls)
74
-
75
- async def async_execute_model_call(
76
- self,
77
- user_prompt: str,
78
- system_prompt: str = "",
79
- files_list: Optional[List["FileStore"]] = None,
80
- ) -> dict[str, Any]:
81
- """Calls the AWS Bedrock API and returns the API response."""
82
-
83
- api_token = (
84
- self.api_token
85
- ) # call to check the if env variables are set.
86
-
87
- region = os.getenv("AWS_REGION", "us-east-1")
88
- client = boto3.client("bedrock-runtime", region_name=region)
89
-
90
- conversation = [
91
- {
92
- "role": "user",
93
- "content": [{"text": user_prompt}],
94
- }
95
- ]
96
- system = [
97
- {
98
- "text": system_prompt,
99
- }
100
- ]
101
- try:
102
- response = client.converse(
103
- modelId=self._model_,
104
- messages=conversation,
105
- inferenceConfig={
106
- "maxTokens": self.max_tokens,
107
- "temperature": self.temperature,
108
- "topP": self.top_p,
109
- },
110
- # system=system,
111
- additionalModelRequestFields={},
112
- )
113
- return response
114
- except (ClientError, Exception) as e:
115
- print(e)
116
- return {"error": str(e)}
117
-
118
- LLM.__name__ = model_class_name
119
-
120
- return LLM
1
+ import os
2
+ from typing import Any, List, Optional
3
+ import re
4
+ import boto3
5
+ from botocore.exceptions import ClientError
6
+ from edsl.inference_services.InferenceServiceABC import InferenceServiceABC
7
+ from edsl.language_models.LanguageModel import LanguageModel
8
+ import json
9
+ from edsl.utilities.utilities import fix_partial_correct_response
10
+
11
+
12
class AwsBedrockService(InferenceServiceABC):
    """AWS Bedrock service class.

    Builds LanguageModel subclasses that call Bedrock's `converse` API.
    """

    _inference_service_ = "bedrock"
    _env_key_name_ = (
        "AWS_ACCESS_KEY_ID"  # or any other environment key for AWS credentials
    )
    # Path into the converse() response dict where the generated text lives.
    key_sequence = ["output", "message", "content", 0, "text"]
    input_token_name = "inputTokens"
    output_token_name = "outputTokens"
    usage_sequence = ["usage"]
    # Legacy Jurassic-2 models that should not be offered to callers.
    model_exclude_list = [
        "ai21.j2-grande-instruct",
        "ai21.j2-jumbo-instruct",
        "ai21.j2-mid",
        "ai21.j2-mid-v1",
        "ai21.j2-ultra",
        "ai21.j2-ultra-v1",
    ]
    # Class-level cache of model ids so repeated available() calls skip AWS.
    _models_list_cache: List[str] = []

    @classmethod
    def available(cls):
        """Fetch available model ids from AWS Bedrock, excluding legacy models.

        Results are cached on the class after the first successful fetch.
        """

        region = os.getenv("AWS_REGION", "us-east-1")

        if not cls._models_list_cache:
            client = boto3.client("bedrock", region_name=region)
            all_models_ids = [
                x["modelId"] for x in client.list_foundation_models()["modelSummaries"]
            ]
            # Populate the cache so subsequent calls avoid the AWS round-trip.
            # (Previously the cache was checked but never written, so it was
            # permanently empty and every call hit the API.)
            cls._models_list_cache = all_models_ids
        else:
            all_models_ids = cls._models_list_cache

        return [m for m in all_models_ids if m not in cls.model_exclude_list]

    @classmethod
    def create_model(
        cls, model_name: str = "amazon.titan-tg1-large", model_class_name=None
    ) -> LanguageModel:
        """Return a LanguageModel subclass bound to the given Bedrock model id."""
        if model_class_name is None:
            model_class_name = cls.to_class_name(model_name)

        class LLM(LanguageModel):
            """
            Child class of LanguageModel for interacting with AWS Bedrock models.
            """

            key_sequence = cls.key_sequence
            usage_sequence = cls.usage_sequence
            _inference_service_ = cls._inference_service_
            _model_ = model_name
            _parameters_ = {
                "temperature": 0.5,
                "max_tokens": 512,
                "top_p": 0.9,
            }
            input_token_name = cls.input_token_name
            output_token_name = cls.output_token_name

            async def async_execute_model_call(
                self,
                user_prompt: str,
                system_prompt: str = "",
                files_list: Optional[List["FileStore"]] = None,
            ) -> dict[str, Any]:
                """Calls the AWS Bedrock API and returns the API response."""

                api_token = (
                    self.api_token
                )  # call to check the if env variables are set.

                region = os.getenv("AWS_REGION", "us-east-1")
                client = boto3.client("bedrock-runtime", region_name=region)

                conversation = [
                    {
                        "role": "user",
                        "content": [{"text": user_prompt}],
                    }
                ]
                # NOTE(review): `system` is built but never sent — the
                # `system=system` kwarg below is commented out, so the system
                # prompt is currently ignored by Bedrock. Confirm intent.
                system = [
                    {
                        "text": system_prompt,
                    }
                ]
                try:
                    response = client.converse(
                        modelId=self._model_,
                        messages=conversation,
                        inferenceConfig={
                            "maxTokens": self.max_tokens,
                            "temperature": self.temperature,
                            "topP": self.top_p,
                        },
                        # system=system,
                        additionalModelRequestFields={},
                    )
                    return response
                except Exception as e:
                    # ClientError is a subclass of Exception, so the former
                    # `(ClientError, Exception)` tuple was redundant.
                    print(e)
                    return {"error": str(e)}

        LLM.__name__ = model_class_name

        return LLM