lionagi 0.5.5__py3-none-any.whl → 0.6.0__py3-none-any.whl
Sign up to get free protection for your applications and to get access to all the features.
- lionagi/__init__.py +16 -24
- lionagi/{core/_class_registry.py → _class_registry.py} +51 -10
- lionagi/_errors.py +35 -0
- lionagi/libs/__init__.py +3 -0
- lionagi/libs/compress/__init__.py +3 -0
- lionagi/libs/compress/models.py +6 -2
- lionagi/libs/compress/utils.py +4 -16
- lionagi/libs/file/__init__.py +3 -0
- lionagi/libs/file/chunk.py +4 -0
- lionagi/libs/file/file_ops.py +4 -0
- lionagi/libs/file/params.py +4 -41
- lionagi/libs/file/process.py +4 -0
- lionagi/libs/file/save.py +5 -1
- lionagi/libs/{parse/flatten → nested}/flatten.py +4 -0
- lionagi/libs/{parse/nested → nested}/nfilter.py +4 -0
- lionagi/libs/{parse/nested → nested}/nget.py +6 -1
- lionagi/libs/{parse/nested → nested}/ninsert.py +5 -1
- lionagi/libs/{parse/nested → nested}/nmerge.py +4 -0
- lionagi/libs/{parse/nested → nested}/npop.py +5 -2
- lionagi/libs/{parse/nested → nested}/nset.py +6 -1
- lionagi/libs/{parse/flatten → nested}/unflatten.py +4 -0
- lionagi/libs/{parse/nested → nested}/utils.py +5 -1
- lionagi/libs/package/__init__.py +3 -0
- lionagi/libs/package/imports.py +6 -2
- lionagi/libs/package/management.py +7 -3
- lionagi/libs/package/params.py +4 -0
- lionagi/libs/package/system.py +4 -0
- lionagi/libs/parse.py +30 -0
- lionagi/libs/{parse/json → schema}/as_readable.py +10 -4
- lionagi/libs/{parse/string_parse/code_block.py → schema/extract_code_block.py} +4 -0
- lionagi/libs/{parse/string_parse/docstring.py → schema/extract_docstring.py} +4 -0
- lionagi/libs/{parse/string_parse/function_.py → schema/function_to_schema.py} +21 -9
- lionagi/libs/{parse/json/schema.py → schema/json_schema.py} +5 -1
- lionagi/libs/validate/common_field_validators.py +170 -0
- lionagi/libs/{parse/validate/keys.py → validate/fuzzy_match_keys.py} +42 -8
- lionagi/libs/{parse/validate/mapping.py → validate/fuzzy_validate_mapping.py} +41 -6
- lionagi/libs/{string_similarity/algorithms.py → validate/string_similarity.py} +115 -1
- lionagi/libs/{parse/validate/boolean.py → validate/validate_boolean.py} +42 -3
- lionagi/operations/__init__.py +13 -3
- lionagi/operations/brainstorm/__init__.py +3 -3
- lionagi/operations/brainstorm/brainstorm.py +33 -19
- lionagi/operations/brainstorm/prompt.py +4 -0
- lionagi/operations/plan/__init__.py +4 -0
- lionagi/operations/plan/plan.py +16 -13
- lionagi/operations/plan/prompt.py +4 -0
- lionagi/operations/select/__init__.py +4 -0
- lionagi/operations/select/prompt.py +4 -0
- lionagi/operations/select/select.py +1 -1
- lionagi/operations/select/utils.py +4 -4
- lionagi/{strategies → operations/strategies}/base.py +6 -2
- lionagi/{strategies → operations/strategies}/concurrent.py +8 -5
- lionagi/{strategies → operations/strategies}/concurrent_chunk.py +6 -3
- lionagi/{strategies → operations/strategies}/concurrent_sequential_chunk.py +8 -4
- lionagi/{strategies → operations/strategies}/params.py +10 -6
- lionagi/{strategies → operations/strategies}/sequential.py +6 -2
- lionagi/{strategies → operations/strategies}/sequential_chunk.py +7 -3
- lionagi/{strategies → operations/strategies}/sequential_concurrent_chunk.py +9 -4
- lionagi/{strategies → operations/strategies}/utils.py +6 -3
- lionagi/{core/models/__init__.py → operations/types.py} +3 -1
- lionagi/operations/utils.py +6 -3
- lionagi/operatives/action/function_calling.py +136 -0
- lionagi/operatives/action/manager.py +239 -0
- lionagi/operatives/action/request_response_model.py +90 -0
- lionagi/operatives/action/tool.py +141 -0
- lionagi/{protocols/operatives/action.py → operatives/action/utils.py} +52 -90
- lionagi/{core → operatives}/forms/base.py +9 -4
- lionagi/{core → operatives}/forms/form.py +8 -13
- lionagi/{core → operatives}/forms/report.py +5 -3
- lionagi/operatives/instruct/base.py +79 -0
- lionagi/operatives/instruct/instruct.py +105 -0
- lionagi/operatives/instruct/instruct_collection.py +52 -0
- lionagi/operatives/instruct/node.py +13 -0
- lionagi/{protocols/operatives → operatives/instruct}/prompts.py +0 -34
- lionagi/{protocols/operatives → operatives/instruct}/reason.py +14 -7
- lionagi/{integrations/anthropic_/version.py → operatives/manager.py} +5 -1
- lionagi/operatives/models/field_model.py +194 -0
- lionagi/operatives/models/model_params.py +307 -0
- lionagi/{core → operatives}/models/note.py +20 -28
- lionagi/{core → operatives}/models/operable_model.py +153 -71
- lionagi/{core → operatives}/models/schema_model.py +4 -3
- lionagi/{protocols/operatives → operatives}/operative.py +10 -7
- lionagi/{protocols/operatives → operatives}/step.py +67 -26
- lionagi/operatives/types.py +69 -0
- lionagi/protocols/_adapter.py +224 -0
- lionagi/protocols/_concepts.py +94 -0
- lionagi/protocols/generic/element.py +460 -0
- lionagi/protocols/generic/event.py +177 -0
- lionagi/protocols/generic/log.py +237 -0
- lionagi/{core → protocols}/generic/pile.py +172 -131
- lionagi/protocols/generic/processor.py +316 -0
- lionagi/protocols/generic/progression.py +500 -0
- lionagi/protocols/graph/edge.py +166 -0
- lionagi/protocols/graph/graph.py +290 -0
- lionagi/protocols/graph/node.py +109 -0
- lionagi/protocols/mail/exchange.py +116 -0
- lionagi/protocols/mail/mail.py +25 -0
- lionagi/protocols/mail/mailbox.py +47 -0
- lionagi/protocols/mail/manager.py +168 -0
- lionagi/protocols/mail/package.py +55 -0
- lionagi/protocols/messages/action_request.py +165 -0
- lionagi/protocols/messages/action_response.py +132 -0
- lionagi/{core/communication → protocols/messages}/assistant_response.py +55 -79
- lionagi/protocols/messages/base.py +73 -0
- lionagi/protocols/messages/instruction.py +582 -0
- lionagi/protocols/messages/manager.py +429 -0
- lionagi/protocols/messages/message.py +216 -0
- lionagi/protocols/messages/system.py +115 -0
- lionagi/protocols/messages/templates/assistant_response.jinja2 +6 -0
- lionagi/{core/communication → protocols/messages}/templates/instruction_message.jinja2 +2 -2
- lionagi/protocols/types.py +96 -0
- lionagi/service/__init__.py +10 -12
- lionagi/service/endpoints/base.py +517 -0
- lionagi/service/endpoints/chat_completion.py +102 -0
- lionagi/service/endpoints/match_endpoint.py +60 -0
- lionagi/service/endpoints/rate_limited_processor.py +145 -0
- lionagi/service/endpoints/token_calculator.py +209 -0
- lionagi/service/imodel.py +263 -96
- lionagi/service/manager.py +45 -0
- lionagi/service/providers/anthropic_/messages.py +64 -0
- lionagi/service/providers/groq_/chat_completions.py +56 -0
- lionagi/service/providers/openai_/chat_completions.py +62 -0
- lionagi/service/providers/openrouter_/chat_completions.py +62 -0
- lionagi/service/providers/perplexity_/__init__.py +3 -0
- lionagi/service/providers/perplexity_/chat_completions.py +40 -0
- lionagi/session/__init__.py +3 -0
- lionagi/session/branch.py +1287 -0
- lionagi/session/session.py +296 -0
- lionagi/settings.py +62 -118
- lionagi/utils.py +2386 -0
- lionagi/version.py +1 -1
- {lionagi-0.5.5.dist-info → lionagi-0.6.0.dist-info}/METADATA +7 -6
- lionagi-0.6.0.dist-info/RECORD +160 -0
- lionagi/core/action/action_manager.py +0 -289
- lionagi/core/action/base.py +0 -109
- lionagi/core/action/function_calling.py +0 -153
- lionagi/core/action/tool.py +0 -202
- lionagi/core/action/types.py +0 -16
- lionagi/core/communication/action_request.py +0 -163
- lionagi/core/communication/action_response.py +0 -149
- lionagi/core/communication/base_mail.py +0 -49
- lionagi/core/communication/instruction.py +0 -376
- lionagi/core/communication/message.py +0 -286
- lionagi/core/communication/message_manager.py +0 -543
- lionagi/core/communication/system.py +0 -116
- lionagi/core/communication/templates/assistant_response.jinja2 +0 -2
- lionagi/core/communication/types.py +0 -27
- lionagi/core/communication/utils.py +0 -256
- lionagi/core/forms/types.py +0 -13
- lionagi/core/generic/component.py +0 -422
- lionagi/core/generic/edge.py +0 -163
- lionagi/core/generic/element.py +0 -199
- lionagi/core/generic/graph.py +0 -377
- lionagi/core/generic/log.py +0 -151
- lionagi/core/generic/log_manager.py +0 -320
- lionagi/core/generic/node.py +0 -11
- lionagi/core/generic/progression.py +0 -395
- lionagi/core/generic/types.py +0 -23
- lionagi/core/generic/utils.py +0 -53
- lionagi/core/models/base.py +0 -28
- lionagi/core/models/field_model.py +0 -145
- lionagi/core/models/model_params.py +0 -194
- lionagi/core/models/types.py +0 -19
- lionagi/core/session/branch.py +0 -130
- lionagi/core/session/branch_mixins.py +0 -581
- lionagi/core/session/session.py +0 -163
- lionagi/core/session/types.py +0 -8
- lionagi/core/typing/__init__.py +0 -9
- lionagi/core/typing/_concepts.py +0 -173
- lionagi/core/typing/_id.py +0 -104
- lionagi/core/typing/_pydantic.py +0 -33
- lionagi/core/typing/_typing.py +0 -54
- lionagi/integrations/__init__.py +0 -0
- lionagi/integrations/_services.py +0 -17
- lionagi/integrations/anthropic_/AnthropicModel.py +0 -268
- lionagi/integrations/anthropic_/AnthropicService.py +0 -127
- lionagi/integrations/anthropic_/anthropic_max_output_token_data.yaml +0 -12
- lionagi/integrations/anthropic_/anthropic_price_data.yaml +0 -34
- lionagi/integrations/anthropic_/api_endpoints/api_request.py +0 -277
- lionagi/integrations/anthropic_/api_endpoints/data_models.py +0 -40
- lionagi/integrations/anthropic_/api_endpoints/match_response.py +0 -119
- lionagi/integrations/anthropic_/api_endpoints/messages/request/message_models.py +0 -14
- lionagi/integrations/anthropic_/api_endpoints/messages/request/request_body.py +0 -74
- lionagi/integrations/anthropic_/api_endpoints/messages/response/__init__.py +0 -0
- lionagi/integrations/anthropic_/api_endpoints/messages/response/content_models.py +0 -32
- lionagi/integrations/anthropic_/api_endpoints/messages/response/response_body.py +0 -101
- lionagi/integrations/anthropic_/api_endpoints/messages/response/usage_models.py +0 -25
- lionagi/integrations/groq_/GroqModel.py +0 -325
- lionagi/integrations/groq_/GroqService.py +0 -156
- lionagi/integrations/groq_/api_endpoints/__init__.py +0 -0
- lionagi/integrations/groq_/api_endpoints/data_models.py +0 -187
- lionagi/integrations/groq_/api_endpoints/groq_request.py +0 -288
- lionagi/integrations/groq_/api_endpoints/match_response.py +0 -106
- lionagi/integrations/groq_/api_endpoints/response_utils.py +0 -105
- lionagi/integrations/groq_/groq_max_output_token_data.yaml +0 -21
- lionagi/integrations/groq_/groq_price_data.yaml +0 -58
- lionagi/integrations/groq_/groq_rate_limits.yaml +0 -105
- lionagi/integrations/groq_/version.py +0 -5
- lionagi/integrations/litellm_/imodel.py +0 -76
- lionagi/integrations/ollama_/OllamaModel.py +0 -244
- lionagi/integrations/ollama_/OllamaService.py +0 -142
- lionagi/integrations/ollama_/api_endpoints/api_request.py +0 -179
- lionagi/integrations/ollama_/api_endpoints/chat_completion/message_models.py +0 -31
- lionagi/integrations/ollama_/api_endpoints/chat_completion/request_body.py +0 -46
- lionagi/integrations/ollama_/api_endpoints/chat_completion/response_body.py +0 -67
- lionagi/integrations/ollama_/api_endpoints/chat_completion/tool_models.py +0 -49
- lionagi/integrations/ollama_/api_endpoints/completion/__init__.py +0 -0
- lionagi/integrations/ollama_/api_endpoints/completion/request_body.py +0 -72
- lionagi/integrations/ollama_/api_endpoints/completion/response_body.py +0 -59
- lionagi/integrations/ollama_/api_endpoints/data_models.py +0 -15
- lionagi/integrations/ollama_/api_endpoints/embedding/__init__.py +0 -0
- lionagi/integrations/ollama_/api_endpoints/embedding/request_body.py +0 -33
- lionagi/integrations/ollama_/api_endpoints/embedding/response_body.py +0 -29
- lionagi/integrations/ollama_/api_endpoints/match_data_model.py +0 -62
- lionagi/integrations/ollama_/api_endpoints/match_response.py +0 -190
- lionagi/integrations/ollama_/api_endpoints/model/copy_model.py +0 -13
- lionagi/integrations/ollama_/api_endpoints/model/create_model.py +0 -28
- lionagi/integrations/ollama_/api_endpoints/model/delete_model.py +0 -11
- lionagi/integrations/ollama_/api_endpoints/model/list_model.py +0 -60
- lionagi/integrations/ollama_/api_endpoints/model/pull_model.py +0 -34
- lionagi/integrations/ollama_/api_endpoints/model/push_model.py +0 -35
- lionagi/integrations/ollama_/api_endpoints/model/show_model.py +0 -36
- lionagi/integrations/ollama_/api_endpoints/option_models.py +0 -68
- lionagi/integrations/openai_/OpenAIModel.py +0 -419
- lionagi/integrations/openai_/OpenAIService.py +0 -435
- lionagi/integrations/openai_/__init__.py +0 -0
- lionagi/integrations/openai_/api_endpoints/__init__.py +0 -3
- lionagi/integrations/openai_/api_endpoints/api_request.py +0 -277
- lionagi/integrations/openai_/api_endpoints/audio/__init__.py +0 -9
- lionagi/integrations/openai_/api_endpoints/audio/speech_models.py +0 -34
- lionagi/integrations/openai_/api_endpoints/audio/transcription_models.py +0 -136
- lionagi/integrations/openai_/api_endpoints/audio/translation_models.py +0 -41
- lionagi/integrations/openai_/api_endpoints/audio/types.py +0 -41
- lionagi/integrations/openai_/api_endpoints/batch/__init__.py +0 -17
- lionagi/integrations/openai_/api_endpoints/batch/batch_models.py +0 -146
- lionagi/integrations/openai_/api_endpoints/batch/cancel_batch.py +0 -7
- lionagi/integrations/openai_/api_endpoints/batch/create_batch.py +0 -26
- lionagi/integrations/openai_/api_endpoints/batch/list_batch.py +0 -37
- lionagi/integrations/openai_/api_endpoints/batch/request_object_models.py +0 -65
- lionagi/integrations/openai_/api_endpoints/batch/retrieve_batch.py +0 -7
- lionagi/integrations/openai_/api_endpoints/batch/types.py +0 -4
- lionagi/integrations/openai_/api_endpoints/chat_completions/__init__.py +0 -1
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/__init__.py +0 -39
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/message_models.py +0 -121
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/request_body.py +0 -221
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/response_format.py +0 -71
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/stream_options.py +0 -14
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/tool_choice_models.py +0 -17
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/tool_models.py +0 -54
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/types.py +0 -18
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/__init__.py +0 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/choice_models.py +0 -62
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/function_models.py +0 -16
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/log_prob_models.py +0 -47
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/message_models.py +0 -25
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/response_body.py +0 -99
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/types.py +0 -8
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/usage_models.py +0 -24
- lionagi/integrations/openai_/api_endpoints/chat_completions/util.py +0 -46
- lionagi/integrations/openai_/api_endpoints/data_models.py +0 -23
- lionagi/integrations/openai_/api_endpoints/embeddings/__init__.py +0 -3
- lionagi/integrations/openai_/api_endpoints/embeddings/request_body.py +0 -79
- lionagi/integrations/openai_/api_endpoints/embeddings/response_body.py +0 -67
- lionagi/integrations/openai_/api_endpoints/files/__init__.py +0 -11
- lionagi/integrations/openai_/api_endpoints/files/delete_file.py +0 -20
- lionagi/integrations/openai_/api_endpoints/files/file_models.py +0 -56
- lionagi/integrations/openai_/api_endpoints/files/list_files.py +0 -27
- lionagi/integrations/openai_/api_endpoints/files/retrieve_file.py +0 -9
- lionagi/integrations/openai_/api_endpoints/files/upload_file.py +0 -38
- lionagi/integrations/openai_/api_endpoints/fine_tuning/__init__.py +0 -37
- lionagi/integrations/openai_/api_endpoints/fine_tuning/cancel_jobs.py +0 -9
- lionagi/integrations/openai_/api_endpoints/fine_tuning/create_jobs.py +0 -133
- lionagi/integrations/openai_/api_endpoints/fine_tuning/fine_tuning_job_checkpoint_models.py +0 -58
- lionagi/integrations/openai_/api_endpoints/fine_tuning/fine_tuning_job_event_models.py +0 -31
- lionagi/integrations/openai_/api_endpoints/fine_tuning/fine_tuning_job_models.py +0 -140
- lionagi/integrations/openai_/api_endpoints/fine_tuning/list_fine_tuning_checkpoints.py +0 -51
- lionagi/integrations/openai_/api_endpoints/fine_tuning/list_fine_tuning_events.py +0 -42
- lionagi/integrations/openai_/api_endpoints/fine_tuning/list_fine_tuning_jobs.py +0 -31
- lionagi/integrations/openai_/api_endpoints/fine_tuning/retrieve_jobs.py +0 -9
- lionagi/integrations/openai_/api_endpoints/fine_tuning/training_format.py +0 -30
- lionagi/integrations/openai_/api_endpoints/images/__init__.py +0 -9
- lionagi/integrations/openai_/api_endpoints/images/image_edit_models.py +0 -69
- lionagi/integrations/openai_/api_endpoints/images/image_models.py +0 -56
- lionagi/integrations/openai_/api_endpoints/images/image_variation_models.py +0 -56
- lionagi/integrations/openai_/api_endpoints/images/response_body.py +0 -30
- lionagi/integrations/openai_/api_endpoints/match_data_model.py +0 -197
- lionagi/integrations/openai_/api_endpoints/match_response.py +0 -336
- lionagi/integrations/openai_/api_endpoints/models/__init__.py +0 -7
- lionagi/integrations/openai_/api_endpoints/models/delete_fine_tuned_model.py +0 -17
- lionagi/integrations/openai_/api_endpoints/models/models_models.py +0 -31
- lionagi/integrations/openai_/api_endpoints/models/retrieve_model.py +0 -9
- lionagi/integrations/openai_/api_endpoints/moderations/__init__.py +0 -3
- lionagi/integrations/openai_/api_endpoints/moderations/request_body.py +0 -20
- lionagi/integrations/openai_/api_endpoints/moderations/response_body.py +0 -139
- lionagi/integrations/openai_/api_endpoints/uploads/__init__.py +0 -19
- lionagi/integrations/openai_/api_endpoints/uploads/add_upload_part.py +0 -11
- lionagi/integrations/openai_/api_endpoints/uploads/cancel_upload.py +0 -7
- lionagi/integrations/openai_/api_endpoints/uploads/complete_upload.py +0 -18
- lionagi/integrations/openai_/api_endpoints/uploads/create_upload.py +0 -17
- lionagi/integrations/openai_/api_endpoints/uploads/uploads_models.py +0 -52
- lionagi/integrations/openai_/image_token_calculator/__init__.py +0 -0
- lionagi/integrations/openai_/image_token_calculator/image_token_calculator.py +0 -98
- lionagi/integrations/openai_/image_token_calculator/openai_image_token_data.yaml +0 -15
- lionagi/integrations/openai_/openai_max_output_token_data.yaml +0 -12
- lionagi/integrations/openai_/openai_price_data.yaml +0 -26
- lionagi/integrations/openai_/version.py +0 -1
- lionagi/integrations/pandas_/__init__.py +0 -24
- lionagi/integrations/pandas_/extend_df.py +0 -61
- lionagi/integrations/pandas_/read.py +0 -103
- lionagi/integrations/pandas_/remove_rows.py +0 -61
- lionagi/integrations/pandas_/replace_keywords.py +0 -65
- lionagi/integrations/pandas_/save.py +0 -131
- lionagi/integrations/pandas_/search_keywords.py +0 -69
- lionagi/integrations/pandas_/to_df.py +0 -196
- lionagi/integrations/pandas_/update_cells.py +0 -54
- lionagi/integrations/perplexity_/PerplexityModel.py +0 -274
- lionagi/integrations/perplexity_/PerplexityService.py +0 -118
- lionagi/integrations/perplexity_/api_endpoints/__init__.py +0 -0
- lionagi/integrations/perplexity_/api_endpoints/api_request.py +0 -171
- lionagi/integrations/perplexity_/api_endpoints/chat_completions/__init__.py +0 -0
- lionagi/integrations/perplexity_/api_endpoints/chat_completions/request/__init__.py +0 -0
- lionagi/integrations/perplexity_/api_endpoints/chat_completions/request/request_body.py +0 -121
- lionagi/integrations/perplexity_/api_endpoints/chat_completions/response/__init__.py +0 -0
- lionagi/integrations/perplexity_/api_endpoints/chat_completions/response/response_body.py +0 -146
- lionagi/integrations/perplexity_/api_endpoints/data_models.py +0 -63
- lionagi/integrations/perplexity_/api_endpoints/match_response.py +0 -26
- lionagi/integrations/perplexity_/perplexity_max_output_token_data.yaml +0 -3
- lionagi/integrations/perplexity_/perplexity_price_data.yaml +0 -10
- lionagi/integrations/perplexity_/version.py +0 -1
- lionagi/integrations/pydantic_/__init__.py +0 -8
- lionagi/integrations/pydantic_/break_down_annotation.py +0 -81
- lionagi/integrations/pydantic_/new_model.py +0 -208
- lionagi/libs/constants.py +0 -98
- lionagi/libs/file/path.py +0 -301
- lionagi/libs/file/types.py +0 -22
- lionagi/libs/func/__init__.py +0 -0
- lionagi/libs/func/async_calls/__init__.py +0 -24
- lionagi/libs/func/async_calls/alcall.py +0 -210
- lionagi/libs/func/async_calls/bcall.py +0 -130
- lionagi/libs/func/async_calls/mcall.py +0 -134
- lionagi/libs/func/async_calls/pcall.py +0 -149
- lionagi/libs/func/async_calls/rcall.py +0 -217
- lionagi/libs/func/async_calls/tcall.py +0 -114
- lionagi/libs/func/async_calls/ucall.py +0 -85
- lionagi/libs/func/decorators.py +0 -277
- lionagi/libs/func/lcall.py +0 -57
- lionagi/libs/func/params.py +0 -64
- lionagi/libs/func/throttle.py +0 -119
- lionagi/libs/func/types.py +0 -39
- lionagi/libs/func/utils.py +0 -96
- lionagi/libs/package/types.py +0 -26
- lionagi/libs/parse/__init__.py +0 -1
- lionagi/libs/parse/flatten/__init__.py +0 -9
- lionagi/libs/parse/flatten/params.py +0 -52
- lionagi/libs/parse/json/__init__.py +0 -27
- lionagi/libs/parse/json/extract.py +0 -102
- lionagi/libs/parse/json/parse.py +0 -179
- lionagi/libs/parse/json/to_json.py +0 -71
- lionagi/libs/parse/nested/__init__.py +0 -33
- lionagi/libs/parse/nested/to_flat_list.py +0 -64
- lionagi/libs/parse/params.py +0 -0
- lionagi/libs/parse/string_parse/__init__.py +0 -11
- lionagi/libs/parse/type_convert/__init__.py +0 -19
- lionagi/libs/parse/type_convert/params.py +0 -145
- lionagi/libs/parse/type_convert/to_dict.py +0 -333
- lionagi/libs/parse/type_convert/to_list.py +0 -186
- lionagi/libs/parse/type_convert/to_num.py +0 -358
- lionagi/libs/parse/type_convert/to_str.py +0 -195
- lionagi/libs/parse/types.py +0 -9
- lionagi/libs/parse/validate/__init__.py +0 -14
- lionagi/libs/parse/validate/params.py +0 -62
- lionagi/libs/parse/xml/__init__.py +0 -10
- lionagi/libs/parse/xml/convert.py +0 -56
- lionagi/libs/parse/xml/parser.py +0 -93
- lionagi/libs/string_similarity/__init__.py +0 -32
- lionagi/libs/string_similarity/matcher.py +0 -102
- lionagi/libs/string_similarity/utils.py +0 -15
- lionagi/libs/utils.py +0 -266
- lionagi/protocols/adapters/__init__.py +0 -0
- lionagi/protocols/adapters/adapter.py +0 -79
- lionagi/protocols/adapters/json_adapter.py +0 -43
- lionagi/protocols/adapters/pandas_adapter.py +0 -96
- lionagi/protocols/configs/__init__.py +0 -0
- lionagi/protocols/configs/branch_config.py +0 -86
- lionagi/protocols/configs/id_config.py +0 -15
- lionagi/protocols/configs/imodel_config.py +0 -73
- lionagi/protocols/configs/log_config.py +0 -93
- lionagi/protocols/configs/retry_config.py +0 -29
- lionagi/protocols/configs/types.py +0 -15
- lionagi/protocols/operatives/instruct.py +0 -194
- lionagi/protocols/operatives/types.py +0 -19
- lionagi/protocols/registries/_component_registry.py +0 -23
- lionagi/protocols/registries/_pile_registry.py +0 -30
- lionagi/service/complete_request_info.py +0 -11
- lionagi/service/rate_limiter.py +0 -108
- lionagi/service/service.py +0 -41
- lionagi/service/service_match_util.py +0 -131
- lionagi/service/service_util.py +0 -72
- lionagi/service/token_calculator.py +0 -51
- lionagi/strategies/__init__.py +0 -0
- lionagi/strategies/types.py +0 -21
- lionagi-0.5.5.dist-info/RECORD +0 -374
- /lionagi/{core → libs/nested}/__init__.py +0 -0
- /lionagi/{core/action → libs/schema}/__init__.py +0 -0
- /lionagi/{core/communication → libs/validate}/__init__.py +0 -0
- /lionagi/{core/forms → operations/strategies}/__init__.py +0 -0
- /lionagi/{core/generic → operatives}/__init__.py +0 -0
- /lionagi/{core/session → operatives/action}/__init__.py +0 -0
- /lionagi/{integrations/anthropic_ → operatives/forms}/__init__.py +0 -0
- /lionagi/{core → operatives}/forms/utils.py +0 -0
- /lionagi/{integrations/anthropic_/api_endpoints → operatives/instruct}/__init__.py +0 -0
- /lionagi/{integrations/anthropic_/api_endpoints/messages → operatives/models}/__init__.py +0 -0
- /lionagi/{integrations/anthropic_/api_endpoints/messages/request → protocols/generic}/__init__.py +0 -0
- /lionagi/{integrations/groq_ → protocols/graph}/__init__.py +0 -0
- /lionagi/{integrations/litellm_ → protocols/mail}/__init__.py +0 -0
- /lionagi/{integrations/ollama_ → protocols/messages}/__init__.py +0 -0
- /lionagi/{core/communication → protocols/messages}/templates/README.md +0 -0
- /lionagi/{core/communication → protocols/messages}/templates/action_request.jinja2 +0 -0
- /lionagi/{core/communication → protocols/messages}/templates/action_response.jinja2 +0 -0
- /lionagi/{core/communication → protocols/messages}/templates/system_message.jinja2 +0 -0
- /lionagi/{core/communication → protocols/messages}/templates/tool_schemas.jinja2 +0 -0
- /lionagi/{integrations/ollama_/api_endpoints → service/endpoints}/__init__.py +0 -0
- /lionagi/{integrations/ollama_/api_endpoints/chat_completion → service/providers}/__init__.py +0 -0
- /lionagi/{integrations/ollama_/api_endpoints/model → service/providers/anthropic_}/__init__.py +0 -0
- /lionagi/{integrations/perplexity_ → service/providers/groq_}/__init__.py +0 -0
- /lionagi/{protocols/operatives → service/providers/openai_}/__init__.py +0 -0
- /lionagi/{protocols/registries → service/providers/openrouter_}/__init__.py +0 -0
- {lionagi-0.5.5.dist-info → lionagi-0.6.0.dist-info}/WHEEL +0 -0
- {lionagi-0.5.5.dist-info → lionagi-0.6.0.dist-info}/licenses/LICENSE +0 -0
@@ -1,325 +0,0 @@
|
|
1
|
-
# Copyright (c) 2023 - 2024, HaiyangLi <quantocean.li at gmail dot com>
|
2
|
-
#
|
3
|
-
# SPDX-License-Identifier: Apache-2.0
|
4
|
-
|
5
|
-
import warnings
|
6
|
-
from pathlib import Path
|
7
|
-
|
8
|
-
from dotenv import load_dotenv
|
9
|
-
from pydantic import (
|
10
|
-
BaseModel,
|
11
|
-
ConfigDict,
|
12
|
-
Field,
|
13
|
-
field_serializer,
|
14
|
-
model_validator,
|
15
|
-
)
|
16
|
-
|
17
|
-
from lionagi.service.rate_limiter import RateLimiter, RateLimitError
|
18
|
-
from lionagi.service.service_util import invoke_retry
|
19
|
-
from lionagi.service.token_calculator import TiktokenCalculator
|
20
|
-
|
21
|
-
from .api_endpoints.data_models import (
|
22
|
-
GroqChatCompletionRequest,
|
23
|
-
GroqEndpointRequestBody,
|
24
|
-
)
|
25
|
-
from .api_endpoints.groq_request import GroqRequest
|
26
|
-
from .api_endpoints.response_utils import match_response
|
27
|
-
|
28
|
-
load_dotenv()
|
29
|
-
path = Path(__file__).parent
|
30
|
-
|
31
|
-
price_config_file_name = path / "groq_price_data.yaml"
|
32
|
-
max_output_token_file_name = path / "groq_max_output_token_data.yaml"
|
33
|
-
rate_limits_file_name = path / "groq_rate_limits.yaml"
|
34
|
-
|
35
|
-
|
36
|
-
class _ModuleImportClass:
|
37
|
-
from lionagi.libs.package.imports import check_import
|
38
|
-
|
39
|
-
yaml = check_import("yaml", pip_name="pyyaml")
|
40
|
-
|
41
|
-
|
42
|
-
class GroqModel(BaseModel):
|
43
|
-
model: str = Field(description="ID of the model to use.")
|
44
|
-
request_model: GroqRequest = Field(description="Making requests")
|
45
|
-
rate_limiter: RateLimiter | None = Field(
|
46
|
-
default=None, description="Rate Limiter to track usage"
|
47
|
-
)
|
48
|
-
text_token_calculator: TiktokenCalculator | None = Field(
|
49
|
-
default=None, description="Token Calculator"
|
50
|
-
)
|
51
|
-
estimated_output_len: int = Field(
|
52
|
-
default=0, description="Expected output len before making request"
|
53
|
-
)
|
54
|
-
|
55
|
-
model_config = ConfigDict(extra="forbid")
|
56
|
-
|
57
|
-
@model_validator(mode="before")
|
58
|
-
@classmethod
|
59
|
-
def parse_input(cls, data: dict):
|
60
|
-
if not isinstance(data, dict):
|
61
|
-
raise ValueError("Invalid init param")
|
62
|
-
|
63
|
-
# Parse request model
|
64
|
-
request_model_params = {
|
65
|
-
"api_key": data.pop("api_key", None),
|
66
|
-
"endpoint": data.pop("endpoint", None),
|
67
|
-
"method": data.pop("method", None),
|
68
|
-
"content_type": data.pop("content_type", None),
|
69
|
-
}
|
70
|
-
data["request_model"] = GroqRequest(**request_model_params)
|
71
|
-
|
72
|
-
# Load rate limits from YAML
|
73
|
-
try:
|
74
|
-
with open(rate_limits_file_name) as file:
|
75
|
-
rate_limits = _ModuleImportClass.yaml.safe_load(file)
|
76
|
-
model_name = data.get("model")
|
77
|
-
model_limits = None
|
78
|
-
|
79
|
-
if model_name in rate_limits.get("text_models", {}):
|
80
|
-
model_limits = rate_limits["text_models"][model_name]
|
81
|
-
elif model_name in rate_limits.get("audio_models", {}):
|
82
|
-
model_limits = rate_limits["audio_models"][model_name]
|
83
|
-
|
84
|
-
if model_limits:
|
85
|
-
rate_limiter_params = {}
|
86
|
-
if limit_tokens := data.pop("limit_tokens", None):
|
87
|
-
rate_limiter_params["limit_tokens"] = limit_tokens
|
88
|
-
elif "tokens_per_minute" in model_limits:
|
89
|
-
rate_limiter_params["limit_tokens"] = model_limits[
|
90
|
-
"tokens_per_minute"
|
91
|
-
]
|
92
|
-
|
93
|
-
if limit_requests := data.pop("limit_requests", None):
|
94
|
-
rate_limiter_params["limit_requests"] = limit_requests
|
95
|
-
elif "requests_per_minute" in model_limits:
|
96
|
-
rate_limiter_params["limit_requests"] = model_limits[
|
97
|
-
"requests_per_minute"
|
98
|
-
]
|
99
|
-
|
100
|
-
if rate_limiter_params:
|
101
|
-
data["rate_limiter"] = RateLimiter(
|
102
|
-
**rate_limiter_params
|
103
|
-
)
|
104
|
-
except FileNotFoundError:
|
105
|
-
warnings.warn(
|
106
|
-
f"Rate limits file not found: {rate_limits_file_name}"
|
107
|
-
)
|
108
|
-
|
109
|
-
# Initialize token calculator
|
110
|
-
try:
|
111
|
-
text_calc = TiktokenCalculator(encoding_name="cl100k_base")
|
112
|
-
data["text_token_calculator"] = text_calc
|
113
|
-
except Exception as e:
|
114
|
-
warnings.warn(f"Failed to initialize token calculator: {str(e)}")
|
115
|
-
|
116
|
-
return data
|
117
|
-
|
118
|
-
@field_serializer("request_model")
|
119
|
-
def serialize_request_model(self, value: GroqRequest):
|
120
|
-
return value.model_dump(exclude_unset=True)
|
121
|
-
|
122
|
-
@invoke_retry(max_retries=3, base_delay=1, max_delay=60)
|
123
|
-
async def invoke(self, **kwargs):
|
124
|
-
"""Make a request to the Groq API."""
|
125
|
-
# Extract request body from kwargs
|
126
|
-
request_body = kwargs.get("request_body")
|
127
|
-
if not request_body:
|
128
|
-
raise ValueError("request_body is required")
|
129
|
-
|
130
|
-
# Extract other parameters
|
131
|
-
estimated_output_len = kwargs.get("estimated_output_len", 0)
|
132
|
-
output_file = kwargs.get("output_file")
|
133
|
-
parse_response = kwargs.get("parse_response", True)
|
134
|
-
|
135
|
-
if request_model := getattr(request_body, "model", None):
|
136
|
-
if request_model != self.model:
|
137
|
-
raise ValueError(
|
138
|
-
f"Request model does not match. Model is {self.model}, but request is made for {request_model}."
|
139
|
-
)
|
140
|
-
|
141
|
-
# Check rate limits if enabled
|
142
|
-
if self.rate_limiter:
|
143
|
-
input_token_len = await self.get_input_token_len(request_body)
|
144
|
-
if not self.verify_invoke_viability(
|
145
|
-
input_tokens_len=input_token_len,
|
146
|
-
estimated_output_len=estimated_output_len,
|
147
|
-
):
|
148
|
-
raise RateLimitError("Rate limit reached")
|
149
|
-
|
150
|
-
try:
|
151
|
-
if getattr(request_body, "stream", False):
|
152
|
-
return await self.stream(
|
153
|
-
request_body=request_body,
|
154
|
-
output_file=output_file,
|
155
|
-
parse_response=parse_response,
|
156
|
-
)
|
157
|
-
|
158
|
-
response_body, response_headers = await self.request_model.invoke(
|
159
|
-
request_body=request_body,
|
160
|
-
output_file=output_file,
|
161
|
-
with_response_header=True,
|
162
|
-
parse_response=False,
|
163
|
-
)
|
164
|
-
|
165
|
-
if response_body:
|
166
|
-
# Update rate limits based on usage
|
167
|
-
if self.rate_limiter:
|
168
|
-
if usage := response_body.get("usage"):
|
169
|
-
total_tokens = usage.get("total_tokens", 0)
|
170
|
-
self.rate_limiter.update_rate_limit(
|
171
|
-
response_headers.get("Date"), total_tokens
|
172
|
-
)
|
173
|
-
else:
|
174
|
-
self.rate_limiter.update_rate_limit(
|
175
|
-
response_headers.get("Date")
|
176
|
-
)
|
177
|
-
|
178
|
-
if parse_response:
|
179
|
-
return match_response(self.request_model, response_body)
|
180
|
-
return response_body
|
181
|
-
|
182
|
-
except Exception as e:
|
183
|
-
raise e
|
184
|
-
|
185
|
-
async def stream(
|
186
|
-
self,
|
187
|
-
request_body: GroqEndpointRequestBody,
|
188
|
-
output_file: str | None = None,
|
189
|
-
parse_response: bool = True,
|
190
|
-
):
|
191
|
-
"""Stream response from the Groq API."""
|
192
|
-
response_chunks = []
|
193
|
-
response_headers = None
|
194
|
-
|
195
|
-
async for chunk in self.request_model.stream(
|
196
|
-
request_body=request_body,
|
197
|
-
output_file=output_file,
|
198
|
-
with_response_header=True,
|
199
|
-
):
|
200
|
-
if isinstance(chunk, dict):
|
201
|
-
if "choices" in chunk or "usage" in chunk:
|
202
|
-
response_chunks.append(chunk)
|
203
|
-
elif "headers" in chunk:
|
204
|
-
response_headers = chunk["headers"]
|
205
|
-
|
206
|
-
# Update rate limits if usage information is available
|
207
|
-
if self.rate_limiter and response_chunks:
|
208
|
-
last_chunk = response_chunks[-1]
|
209
|
-
if usage := last_chunk.get("usage"):
|
210
|
-
total_tokens = usage.get("total_tokens", 0)
|
211
|
-
if response_headers:
|
212
|
-
self.rate_limiter.update_rate_limit(
|
213
|
-
response_headers.get("Date"), total_tokens
|
214
|
-
)
|
215
|
-
|
216
|
-
if parse_response:
|
217
|
-
return match_response(self.request_model, response_chunks)
|
218
|
-
return response_chunks
|
219
|
-
|
220
|
-
async def get_input_token_len(
|
221
|
-
self, request_body: GroqEndpointRequestBody | dict
|
222
|
-
) -> int:
|
223
|
-
"""Calculate the number of input tokens."""
|
224
|
-
if not isinstance(request_body, (GroqEndpointRequestBody, dict)):
|
225
|
-
return 0
|
226
|
-
|
227
|
-
if isinstance(request_body, dict):
|
228
|
-
request_body = GroqChatCompletionRequest(**request_body)
|
229
|
-
|
230
|
-
if not self.text_token_calculator:
|
231
|
-
warnings.warn(
|
232
|
-
"Token calculator not available, using approximate token count"
|
233
|
-
)
|
234
|
-
# Approximate token count (1 token ≈ 4 characters)
|
235
|
-
if isinstance(request_body, GroqChatCompletionRequest):
|
236
|
-
messages_text = "\n".join(
|
237
|
-
msg.content for msg in request_body.messages
|
238
|
-
)
|
239
|
-
return len(messages_text) // 4
|
240
|
-
return 0
|
241
|
-
|
242
|
-
total_tokens = 0
|
243
|
-
if isinstance(request_body, GroqChatCompletionRequest):
|
244
|
-
for message in request_body.messages:
|
245
|
-
total_tokens += self.text_token_calculator.calculate(
|
246
|
-
message.content
|
247
|
-
)
|
248
|
-
|
249
|
-
return total_tokens
|
250
|
-
|
251
|
-
def verify_invoke_viability(
|
252
|
-
self, input_tokens_len: int = 0, estimated_output_len: int = 0
|
253
|
-
) -> bool:
|
254
|
-
"""Check if the request can be made within rate limits."""
|
255
|
-
if not self.rate_limiter:
|
256
|
-
return True
|
257
|
-
|
258
|
-
self.rate_limiter.release_tokens()
|
259
|
-
|
260
|
-
estimated_output_len = (
|
261
|
-
estimated_output_len
|
262
|
-
if estimated_output_len != 0
|
263
|
-
else self.estimated_output_len
|
264
|
-
)
|
265
|
-
|
266
|
-
if estimated_output_len == 0:
|
267
|
-
try:
|
268
|
-
with open(max_output_token_file_name) as file:
|
269
|
-
output_token_config = _ModuleImportClass.yaml.safe_load(
|
270
|
-
file
|
271
|
-
)
|
272
|
-
estimated_output_len = output_token_config.get(
|
273
|
-
self.model, 2048
|
274
|
-
) # Default to 2048
|
275
|
-
self.estimated_output_len = estimated_output_len
|
276
|
-
except FileNotFoundError:
|
277
|
-
warnings.warn(
|
278
|
-
f"Max output token file not found: {max_output_token_file_name}"
|
279
|
-
)
|
280
|
-
# Use a conservative default
|
281
|
-
estimated_output_len = 2048
|
282
|
-
self.estimated_output_len = estimated_output_len
|
283
|
-
|
284
|
-
return self.rate_limiter.check_availability(
|
285
|
-
input_tokens_len, estimated_output_len
|
286
|
-
)
|
287
|
-
|
288
|
-
def estimate_text_price(
|
289
|
-
self,
|
290
|
-
input_text: str,
|
291
|
-
estimated_num_of_output_tokens: int = 0,
|
292
|
-
) -> float:
|
293
|
-
"""Estimate the cost of processing text."""
|
294
|
-
if not self.text_token_calculator:
|
295
|
-
warnings.warn(
|
296
|
-
"Token calculator not available, using approximate token count"
|
297
|
-
)
|
298
|
-
# Approximate token count (1 token ≈ 4 characters)
|
299
|
-
num_of_input_tokens = len(input_text) // 4
|
300
|
-
else:
|
301
|
-
num_of_input_tokens = self.text_token_calculator.calculate(
|
302
|
-
input_text
|
303
|
-
)
|
304
|
-
|
305
|
-
try:
|
306
|
-
with open(price_config_file_name) as file:
|
307
|
-
price_config = _ModuleImportClass.yaml.safe_load(file)
|
308
|
-
except FileNotFoundError:
|
309
|
-
raise ValueError(
|
310
|
-
f"Price config file not found: {price_config_file_name}"
|
311
|
-
)
|
312
|
-
|
313
|
-
if self.model not in price_config.get("model", {}):
|
314
|
-
raise ValueError(
|
315
|
-
f"No price information found for model: {self.model}"
|
316
|
-
)
|
317
|
-
|
318
|
-
model_price_info = price_config["model"][self.model]
|
319
|
-
estimated_price = (
|
320
|
-
model_price_info["input_tokens"] * num_of_input_tokens
|
321
|
-
+ model_price_info["output_tokens"]
|
322
|
-
* estimated_num_of_output_tokens
|
323
|
-
)
|
324
|
-
|
325
|
-
return estimated_price
|
@@ -1,156 +0,0 @@
|
|
1
|
-
# Copyright (c) 2023 - 2024, HaiyangLi <quantocean.li at gmail dot com>
|
2
|
-
#
|
3
|
-
# SPDX-License-Identifier: Apache-2.0
|
4
|
-
|
5
|
-
import inspect
|
6
|
-
|
7
|
-
from dotenv import load_dotenv
|
8
|
-
|
9
|
-
from lionagi.service import Service, register_service
|
10
|
-
|
11
|
-
from .api_endpoints.data_models import (
|
12
|
-
GroqAudioRequest,
|
13
|
-
GroqChatCompletionRequest,
|
14
|
-
)
|
15
|
-
from .GroqModel import GroqModel
|
16
|
-
|
17
|
-
load_dotenv()
|
18
|
-
|
19
|
-
|
20
|
-
@register_service
|
21
|
-
class GroqService(Service):
|
22
|
-
def __init__(
|
23
|
-
self,
|
24
|
-
api_key: str,
|
25
|
-
name: str | None = None,
|
26
|
-
):
|
27
|
-
"""Initialize the Groq service."""
|
28
|
-
super().__setattr__("_initialized", False)
|
29
|
-
self.api_key = api_key
|
30
|
-
self.name = name
|
31
|
-
self.rate_limiters = {} # model: RateLimiter
|
32
|
-
super().__setattr__("_initialized", True)
|
33
|
-
|
34
|
-
def __setattr__(self, key, value):
|
35
|
-
"""Prevent modification of critical attributes after initialization."""
|
36
|
-
if getattr(self, "_initialized", False) and key in ["api_key"]:
|
37
|
-
raise AttributeError(
|
38
|
-
f"Cannot modify '{key}' after initialization. "
|
39
|
-
f"Please create a new service instance for different credentials."
|
40
|
-
)
|
41
|
-
super().__setattr__(key, value)
|
42
|
-
|
43
|
-
def check_rate_limiter(
|
44
|
-
self,
|
45
|
-
groq_model: GroqModel,
|
46
|
-
limit_requests: int | None = None,
|
47
|
-
limit_tokens: int | None = None,
|
48
|
-
) -> GroqModel:
|
49
|
-
"""Check and update rate limiter for the model."""
|
50
|
-
if groq_model.model not in self.rate_limiters:
|
51
|
-
if groq_model.rate_limiter:
|
52
|
-
self.rate_limiters[groq_model.model] = groq_model.rate_limiter
|
53
|
-
else:
|
54
|
-
groq_model.rate_limiter = self.rate_limiters[groq_model.model]
|
55
|
-
if limit_requests is not None:
|
56
|
-
groq_model.rate_limiter.limit_requests = limit_requests
|
57
|
-
if limit_tokens is not None:
|
58
|
-
groq_model.rate_limiter.limit_tokens = limit_tokens
|
59
|
-
|
60
|
-
return groq_model
|
61
|
-
|
62
|
-
@staticmethod
|
63
|
-
def match_data_model(task_name: str) -> dict:
|
64
|
-
"""Match task name to appropriate request model mapping."""
|
65
|
-
if task_name in ["chat/completions", "create_chat_completion"]:
|
66
|
-
return {"request_body": GroqChatCompletionRequest}
|
67
|
-
elif task_name in ["audio/transcriptions", "create_transcription"]:
|
68
|
-
return {"request_body": GroqAudioRequest}
|
69
|
-
elif task_name in ["audio/translations", "create_translation"]:
|
70
|
-
return {"request_body": GroqAudioRequest}
|
71
|
-
raise ValueError(f"Unknown task: {task_name}")
|
72
|
-
|
73
|
-
@classmethod
|
74
|
-
def list_tasks(cls) -> list[str]:
|
75
|
-
"""List available tasks."""
|
76
|
-
methods = []
|
77
|
-
for name, member in inspect.getmembers(
|
78
|
-
cls, predicate=inspect.isfunction
|
79
|
-
):
|
80
|
-
if name not in [
|
81
|
-
"__init__",
|
82
|
-
"__setattr__",
|
83
|
-
"check_rate_limiter",
|
84
|
-
"match_data_model",
|
85
|
-
"list_tasks",
|
86
|
-
]:
|
87
|
-
methods.append(name)
|
88
|
-
return methods
|
89
|
-
|
90
|
-
# Chat Completions
|
91
|
-
def create_chat_completion(
|
92
|
-
self,
|
93
|
-
model: str,
|
94
|
-
limit_tokens: int | None = None,
|
95
|
-
limit_requests: int | None = None,
|
96
|
-
) -> GroqModel:
|
97
|
-
"""Create a chat completion model."""
|
98
|
-
model_obj = GroqModel(
|
99
|
-
model=model,
|
100
|
-
api_key=self.api_key,
|
101
|
-
endpoint="chat/completions",
|
102
|
-
method="POST",
|
103
|
-
content_type="application/json",
|
104
|
-
)
|
105
|
-
|
106
|
-
return self.check_rate_limiter(
|
107
|
-
model_obj,
|
108
|
-
limit_requests=limit_requests,
|
109
|
-
limit_tokens=limit_tokens,
|
110
|
-
)
|
111
|
-
|
112
|
-
# Audio
|
113
|
-
def create_transcription(
|
114
|
-
self,
|
115
|
-
model: str,
|
116
|
-
limit_requests: int | None = None,
|
117
|
-
) -> GroqModel:
|
118
|
-
"""Create an audio transcription model."""
|
119
|
-
model_obj = GroqModel(
|
120
|
-
model=model,
|
121
|
-
api_key=self.api_key,
|
122
|
-
endpoint="audio/transcriptions",
|
123
|
-
method="POST",
|
124
|
-
)
|
125
|
-
|
126
|
-
return self.check_rate_limiter(
|
127
|
-
model_obj,
|
128
|
-
limit_requests=limit_requests,
|
129
|
-
)
|
130
|
-
|
131
|
-
def create_translation(
|
132
|
-
self,
|
133
|
-
model: str,
|
134
|
-
limit_requests: int | None = None,
|
135
|
-
) -> GroqModel:
|
136
|
-
"""Create an audio translation model."""
|
137
|
-
model_obj = GroqModel(
|
138
|
-
model=model,
|
139
|
-
api_key=self.api_key,
|
140
|
-
endpoint="audio/translations",
|
141
|
-
method="POST",
|
142
|
-
)
|
143
|
-
|
144
|
-
return self.check_rate_limiter(
|
145
|
-
model_obj,
|
146
|
-
limit_requests=limit_requests,
|
147
|
-
)
|
148
|
-
|
149
|
-
@property
|
150
|
-
def allowed_roles(self):
|
151
|
-
return ["user", "assistant", "system"]
|
152
|
-
|
153
|
-
@property
|
154
|
-
def sequential_exchange(self):
|
155
|
-
"""whether the service requires user/assistant exchange"""
|
156
|
-
return True
|
File without changes
|
@@ -1,187 +0,0 @@
|
|
1
|
-
# Copyright (c) 2023 - 2024, HaiyangLi <quantocean.li at gmail dot com>
|
2
|
-
#
|
3
|
-
# SPDX-License-Identifier: Apache-2.0
|
4
|
-
|
5
|
-
from pydantic import BaseModel, ConfigDict, Field, model_validator
|
6
|
-
|
7
|
-
|
8
|
-
class GroqEndpointRequestBody(BaseModel):
|
9
|
-
model_config = ConfigDict(
|
10
|
-
extra="forbid",
|
11
|
-
use_enum_values=True,
|
12
|
-
validate_assignment=True,
|
13
|
-
arbitrary_types_allowed=True,
|
14
|
-
)
|
15
|
-
|
16
|
-
|
17
|
-
class GroqEndpointResponseBody(BaseModel):
|
18
|
-
model_config = ConfigDict(
|
19
|
-
use_enum_values=True,
|
20
|
-
validate_assignment=True,
|
21
|
-
arbitrary_types_allowed=True,
|
22
|
-
)
|
23
|
-
|
24
|
-
|
25
|
-
class GroqEndpointQueryParam(BaseModel):
|
26
|
-
model_config = ConfigDict(
|
27
|
-
extra="forbid",
|
28
|
-
use_enum_values=True,
|
29
|
-
validate_assignment=True,
|
30
|
-
arbitrary_types_allowed=True,
|
31
|
-
)
|
32
|
-
|
33
|
-
|
34
|
-
class GroqEndpointPathParam(BaseModel):
|
35
|
-
model_config = ConfigDict(
|
36
|
-
extra="forbid",
|
37
|
-
use_enum_values=True,
|
38
|
-
validate_assignment=True,
|
39
|
-
arbitrary_types_allowed=True,
|
40
|
-
)
|
41
|
-
|
42
|
-
|
43
|
-
class GroqChatMessage(BaseModel):
|
44
|
-
role: str = Field(description="The role of the message sender")
|
45
|
-
content: str = Field(description="The content of the message")
|
46
|
-
name: str | None = Field(
|
47
|
-
default=None, description="Optional name for the message sender"
|
48
|
-
)
|
49
|
-
|
50
|
-
|
51
|
-
class GroqChatCompletionRequest(GroqEndpointRequestBody):
|
52
|
-
messages: list[GroqChatMessage] = Field(
|
53
|
-
description="List of messages in the conversation"
|
54
|
-
)
|
55
|
-
model: str = Field(description="ID of the model to use")
|
56
|
-
temperature: float | None = Field(
|
57
|
-
default=1.0,
|
58
|
-
description="Sampling temperature between 0 and 2",
|
59
|
-
ge=0.0,
|
60
|
-
le=2.0,
|
61
|
-
)
|
62
|
-
top_p: float | None = Field(
|
63
|
-
default=1.0,
|
64
|
-
description="Nucleus sampling threshold",
|
65
|
-
ge=0.0,
|
66
|
-
le=1.0,
|
67
|
-
)
|
68
|
-
n: int | None = Field(
|
69
|
-
default=1,
|
70
|
-
description="Number of completions to generate",
|
71
|
-
ge=1,
|
72
|
-
)
|
73
|
-
stream: bool | None = Field(
|
74
|
-
default=False,
|
75
|
-
description="Whether to stream the response",
|
76
|
-
)
|
77
|
-
stop: str | list[str] | None = Field(
|
78
|
-
default=None,
|
79
|
-
description="Sequences where the API will stop generating",
|
80
|
-
)
|
81
|
-
max_tokens: int | None = Field(
|
82
|
-
default=None,
|
83
|
-
description="Maximum number of tokens to generate",
|
84
|
-
ge=1,
|
85
|
-
)
|
86
|
-
presence_penalty: float | None = Field(
|
87
|
-
default=0.0,
|
88
|
-
description="Presence penalty",
|
89
|
-
ge=-2.0,
|
90
|
-
le=2.0,
|
91
|
-
)
|
92
|
-
frequency_penalty: float | None = Field(
|
93
|
-
default=0.0,
|
94
|
-
description="Frequency penalty",
|
95
|
-
ge=-2.0,
|
96
|
-
le=2.0,
|
97
|
-
)
|
98
|
-
logit_bias: dict[str, float] | None = Field(
|
99
|
-
default=None,
|
100
|
-
description="Modify token likelihoods",
|
101
|
-
)
|
102
|
-
user: str | None = Field(
|
103
|
-
default=None,
|
104
|
-
description="Unique identifier for the end user",
|
105
|
-
)
|
106
|
-
|
107
|
-
@model_validator(mode="after")
|
108
|
-
def validate_messages(self):
|
109
|
-
if not self.messages:
|
110
|
-
raise ValueError("Messages list cannot be empty")
|
111
|
-
|
112
|
-
# Validate roles
|
113
|
-
valid_roles = {"system", "user", "assistant"}
|
114
|
-
for msg in self.messages:
|
115
|
-
if msg.role not in valid_roles:
|
116
|
-
raise ValueError(
|
117
|
-
f"Invalid role: {msg.role}. Must be one of {valid_roles}"
|
118
|
-
)
|
119
|
-
|
120
|
-
return self
|
121
|
-
|
122
|
-
|
123
|
-
class GroqAudioRequest(GroqEndpointRequestBody):
|
124
|
-
model: str = Field(description="ID of the model to use")
|
125
|
-
file: str = Field(description="Audio file to process")
|
126
|
-
language: str | None = Field(
|
127
|
-
default=None,
|
128
|
-
description="Language of the audio (ISO-639-1)",
|
129
|
-
)
|
130
|
-
prompt: str | None = Field(
|
131
|
-
default=None,
|
132
|
-
description="Text to guide the model",
|
133
|
-
)
|
134
|
-
response_format: str | None = Field(
|
135
|
-
default="json",
|
136
|
-
description="Response format (json, text, or verbose_json)",
|
137
|
-
)
|
138
|
-
temperature: float | None = Field(
|
139
|
-
default=0,
|
140
|
-
description="Sampling temperature",
|
141
|
-
ge=0.0,
|
142
|
-
le=1.0,
|
143
|
-
)
|
144
|
-
timestamp_granularities: list[str] | None = Field(
|
145
|
-
default=["segment"],
|
146
|
-
description="Timestamp granularities (word or segment)",
|
147
|
-
)
|
148
|
-
|
149
|
-
|
150
|
-
class GroqChatCompletionResponse(GroqEndpointResponseBody):
|
151
|
-
id: str = Field(description="Unique identifier for the completion")
|
152
|
-
object: str = Field(description="Object type")
|
153
|
-
created: int = Field(description="Unix timestamp of creation")
|
154
|
-
model: str = Field(description="Model used")
|
155
|
-
choices: list[dict] = Field(description="Generated completions")
|
156
|
-
usage: dict = Field(description="Token usage information")
|
157
|
-
system_fingerprint: str | None = Field(
|
158
|
-
description="System fingerprint for deterministic results"
|
159
|
-
)
|
160
|
-
|
161
|
-
|
162
|
-
class GroqAudioResponse(GroqEndpointResponseBody):
|
163
|
-
text: str = Field(description="Transcribed or translated text")
|
164
|
-
x_groq: dict = Field(description="Groq-specific metadata")
|
165
|
-
|
166
|
-
|
167
|
-
# Request model mapping for iModel
|
168
|
-
GROQ_REQUEST_MODELS = {
|
169
|
-
"create_chat_completion": {
|
170
|
-
"request_body": GroqChatCompletionRequest,
|
171
|
-
},
|
172
|
-
"create_transcription": {
|
173
|
-
"request_body": GroqAudioRequest,
|
174
|
-
},
|
175
|
-
"create_translation": {
|
176
|
-
"request_body": GroqAudioRequest,
|
177
|
-
},
|
178
|
-
"chat/completions": {
|
179
|
-
"request_body": GroqChatCompletionRequest,
|
180
|
-
},
|
181
|
-
"audio/transcriptions": {
|
182
|
-
"request_body": GroqAudioRequest,
|
183
|
-
},
|
184
|
-
"audio/translations": {
|
185
|
-
"request_body": GroqAudioRequest,
|
186
|
-
},
|
187
|
-
}
|