aiecs 1.0.1__py3-none-any.whl → 1.7.17__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of aiecs has been flagged as potentially problematic.
- aiecs/__init__.py +13 -16
- aiecs/__main__.py +7 -7
- aiecs/aiecs_client.py +269 -75
- aiecs/application/executors/operation_executor.py +79 -54
- aiecs/application/knowledge_graph/__init__.py +7 -0
- aiecs/application/knowledge_graph/builder/__init__.py +37 -0
- aiecs/application/knowledge_graph/builder/data_quality.py +302 -0
- aiecs/application/knowledge_graph/builder/data_reshaping.py +293 -0
- aiecs/application/knowledge_graph/builder/document_builder.py +369 -0
- aiecs/application/knowledge_graph/builder/graph_builder.py +490 -0
- aiecs/application/knowledge_graph/builder/import_optimizer.py +396 -0
- aiecs/application/knowledge_graph/builder/schema_inference.py +462 -0
- aiecs/application/knowledge_graph/builder/schema_mapping.py +563 -0
- aiecs/application/knowledge_graph/builder/structured_pipeline.py +1384 -0
- aiecs/application/knowledge_graph/builder/text_chunker.py +317 -0
- aiecs/application/knowledge_graph/extractors/__init__.py +27 -0
- aiecs/application/knowledge_graph/extractors/base.py +98 -0
- aiecs/application/knowledge_graph/extractors/llm_entity_extractor.py +422 -0
- aiecs/application/knowledge_graph/extractors/llm_relation_extractor.py +347 -0
- aiecs/application/knowledge_graph/extractors/ner_entity_extractor.py +241 -0
- aiecs/application/knowledge_graph/fusion/__init__.py +78 -0
- aiecs/application/knowledge_graph/fusion/ab_testing.py +395 -0
- aiecs/application/knowledge_graph/fusion/abbreviation_expander.py +327 -0
- aiecs/application/knowledge_graph/fusion/alias_index.py +597 -0
- aiecs/application/knowledge_graph/fusion/alias_matcher.py +384 -0
- aiecs/application/knowledge_graph/fusion/cache_coordinator.py +343 -0
- aiecs/application/knowledge_graph/fusion/entity_deduplicator.py +433 -0
- aiecs/application/knowledge_graph/fusion/entity_linker.py +511 -0
- aiecs/application/knowledge_graph/fusion/evaluation_dataset.py +240 -0
- aiecs/application/knowledge_graph/fusion/knowledge_fusion.py +632 -0
- aiecs/application/knowledge_graph/fusion/matching_config.py +489 -0
- aiecs/application/knowledge_graph/fusion/name_normalizer.py +352 -0
- aiecs/application/knowledge_graph/fusion/relation_deduplicator.py +183 -0
- aiecs/application/knowledge_graph/fusion/semantic_name_matcher.py +464 -0
- aiecs/application/knowledge_graph/fusion/similarity_pipeline.py +534 -0
- aiecs/application/knowledge_graph/pattern_matching/__init__.py +21 -0
- aiecs/application/knowledge_graph/pattern_matching/pattern_matcher.py +342 -0
- aiecs/application/knowledge_graph/pattern_matching/query_executor.py +366 -0
- aiecs/application/knowledge_graph/profiling/__init__.py +12 -0
- aiecs/application/knowledge_graph/profiling/query_plan_visualizer.py +195 -0
- aiecs/application/knowledge_graph/profiling/query_profiler.py +223 -0
- aiecs/application/knowledge_graph/reasoning/__init__.py +27 -0
- aiecs/application/knowledge_graph/reasoning/evidence_synthesis.py +341 -0
- aiecs/application/knowledge_graph/reasoning/inference_engine.py +500 -0
- aiecs/application/knowledge_graph/reasoning/logic_form_parser.py +163 -0
- aiecs/application/knowledge_graph/reasoning/logic_parser/__init__.py +79 -0
- aiecs/application/knowledge_graph/reasoning/logic_parser/ast_builder.py +513 -0
- aiecs/application/knowledge_graph/reasoning/logic_parser/ast_nodes.py +913 -0
- aiecs/application/knowledge_graph/reasoning/logic_parser/ast_validator.py +866 -0
- aiecs/application/knowledge_graph/reasoning/logic_parser/error_handler.py +475 -0
- aiecs/application/knowledge_graph/reasoning/logic_parser/parser.py +396 -0
- aiecs/application/knowledge_graph/reasoning/logic_parser/query_context.py +208 -0
- aiecs/application/knowledge_graph/reasoning/logic_query_integration.py +170 -0
- aiecs/application/knowledge_graph/reasoning/query_planner.py +855 -0
- aiecs/application/knowledge_graph/reasoning/reasoning_engine.py +518 -0
- aiecs/application/knowledge_graph/retrieval/__init__.py +27 -0
- aiecs/application/knowledge_graph/retrieval/query_intent_classifier.py +211 -0
- aiecs/application/knowledge_graph/retrieval/retrieval_strategies.py +592 -0
- aiecs/application/knowledge_graph/retrieval/strategy_types.py +23 -0
- aiecs/application/knowledge_graph/search/__init__.py +59 -0
- aiecs/application/knowledge_graph/search/hybrid_search.py +457 -0
- aiecs/application/knowledge_graph/search/reranker.py +293 -0
- aiecs/application/knowledge_graph/search/reranker_strategies.py +535 -0
- aiecs/application/knowledge_graph/search/text_similarity.py +392 -0
- aiecs/application/knowledge_graph/traversal/__init__.py +15 -0
- aiecs/application/knowledge_graph/traversal/enhanced_traversal.py +305 -0
- aiecs/application/knowledge_graph/traversal/path_scorer.py +271 -0
- aiecs/application/knowledge_graph/validators/__init__.py +13 -0
- aiecs/application/knowledge_graph/validators/relation_validator.py +239 -0
- aiecs/application/knowledge_graph/visualization/__init__.py +11 -0
- aiecs/application/knowledge_graph/visualization/graph_visualizer.py +313 -0
- aiecs/common/__init__.py +9 -0
- aiecs/common/knowledge_graph/__init__.py +17 -0
- aiecs/common/knowledge_graph/runnable.py +471 -0
- aiecs/config/__init__.py +20 -5
- aiecs/config/config.py +762 -31
- aiecs/config/graph_config.py +131 -0
- aiecs/config/tool_config.py +435 -0
- aiecs/core/__init__.py +29 -13
- aiecs/core/interface/__init__.py +2 -2
- aiecs/core/interface/execution_interface.py +22 -22
- aiecs/core/interface/storage_interface.py +37 -88
- aiecs/core/registry/__init__.py +31 -0
- aiecs/core/registry/service_registry.py +92 -0
- aiecs/domain/__init__.py +270 -1
- aiecs/domain/agent/__init__.py +191 -0
- aiecs/domain/agent/base_agent.py +3949 -0
- aiecs/domain/agent/exceptions.py +99 -0
- aiecs/domain/agent/graph_aware_mixin.py +569 -0
- aiecs/domain/agent/hybrid_agent.py +1731 -0
- aiecs/domain/agent/integration/__init__.py +29 -0
- aiecs/domain/agent/integration/context_compressor.py +216 -0
- aiecs/domain/agent/integration/context_engine_adapter.py +587 -0
- aiecs/domain/agent/integration/protocols.py +281 -0
- aiecs/domain/agent/integration/retry_policy.py +218 -0
- aiecs/domain/agent/integration/role_config.py +213 -0
- aiecs/domain/agent/knowledge_aware_agent.py +1892 -0
- aiecs/domain/agent/lifecycle.py +291 -0
- aiecs/domain/agent/llm_agent.py +692 -0
- aiecs/domain/agent/memory/__init__.py +12 -0
- aiecs/domain/agent/memory/conversation.py +1124 -0
- aiecs/domain/agent/migration/__init__.py +14 -0
- aiecs/domain/agent/migration/conversion.py +163 -0
- aiecs/domain/agent/migration/legacy_wrapper.py +86 -0
- aiecs/domain/agent/models.py +894 -0
- aiecs/domain/agent/observability.py +479 -0
- aiecs/domain/agent/persistence.py +449 -0
- aiecs/domain/agent/prompts/__init__.py +29 -0
- aiecs/domain/agent/prompts/builder.py +159 -0
- aiecs/domain/agent/prompts/formatters.py +187 -0
- aiecs/domain/agent/prompts/template.py +255 -0
- aiecs/domain/agent/registry.py +253 -0
- aiecs/domain/agent/tool_agent.py +444 -0
- aiecs/domain/agent/tools/__init__.py +15 -0
- aiecs/domain/agent/tools/schema_generator.py +377 -0
- aiecs/domain/community/__init__.py +155 -0
- aiecs/domain/community/agent_adapter.py +469 -0
- aiecs/domain/community/analytics.py +432 -0
- aiecs/domain/community/collaborative_workflow.py +648 -0
- aiecs/domain/community/communication_hub.py +634 -0
- aiecs/domain/community/community_builder.py +320 -0
- aiecs/domain/community/community_integration.py +796 -0
- aiecs/domain/community/community_manager.py +803 -0
- aiecs/domain/community/decision_engine.py +849 -0
- aiecs/domain/community/exceptions.py +231 -0
- aiecs/domain/community/models/__init__.py +33 -0
- aiecs/domain/community/models/community_models.py +234 -0
- aiecs/domain/community/resource_manager.py +461 -0
- aiecs/domain/community/shared_context_manager.py +589 -0
- aiecs/domain/context/__init__.py +40 -10
- aiecs/domain/context/context_engine.py +1910 -0
- aiecs/domain/context/conversation_models.py +87 -53
- aiecs/domain/context/graph_memory.py +582 -0
- aiecs/domain/execution/model.py +12 -4
- aiecs/domain/knowledge_graph/__init__.py +19 -0
- aiecs/domain/knowledge_graph/models/__init__.py +52 -0
- aiecs/domain/knowledge_graph/models/entity.py +148 -0
- aiecs/domain/knowledge_graph/models/evidence.py +178 -0
- aiecs/domain/knowledge_graph/models/inference_rule.py +184 -0
- aiecs/domain/knowledge_graph/models/path.py +171 -0
- aiecs/domain/knowledge_graph/models/path_pattern.py +171 -0
- aiecs/domain/knowledge_graph/models/query.py +261 -0
- aiecs/domain/knowledge_graph/models/query_plan.py +181 -0
- aiecs/domain/knowledge_graph/models/relation.py +202 -0
- aiecs/domain/knowledge_graph/schema/__init__.py +23 -0
- aiecs/domain/knowledge_graph/schema/entity_type.py +131 -0
- aiecs/domain/knowledge_graph/schema/graph_schema.py +253 -0
- aiecs/domain/knowledge_graph/schema/property_schema.py +143 -0
- aiecs/domain/knowledge_graph/schema/relation_type.py +163 -0
- aiecs/domain/knowledge_graph/schema/schema_manager.py +691 -0
- aiecs/domain/knowledge_graph/schema/type_enums.py +209 -0
- aiecs/domain/task/dsl_processor.py +172 -56
- aiecs/domain/task/model.py +20 -8
- aiecs/domain/task/task_context.py +27 -24
- aiecs/infrastructure/__init__.py +0 -2
- aiecs/infrastructure/graph_storage/__init__.py +11 -0
- aiecs/infrastructure/graph_storage/base.py +837 -0
- aiecs/infrastructure/graph_storage/batch_operations.py +458 -0
- aiecs/infrastructure/graph_storage/cache.py +424 -0
- aiecs/infrastructure/graph_storage/distributed.py +223 -0
- aiecs/infrastructure/graph_storage/error_handling.py +380 -0
- aiecs/infrastructure/graph_storage/graceful_degradation.py +294 -0
- aiecs/infrastructure/graph_storage/health_checks.py +378 -0
- aiecs/infrastructure/graph_storage/in_memory.py +1197 -0
- aiecs/infrastructure/graph_storage/index_optimization.py +446 -0
- aiecs/infrastructure/graph_storage/lazy_loading.py +431 -0
- aiecs/infrastructure/graph_storage/metrics.py +344 -0
- aiecs/infrastructure/graph_storage/migration.py +400 -0
- aiecs/infrastructure/graph_storage/pagination.py +483 -0
- aiecs/infrastructure/graph_storage/performance_monitoring.py +456 -0
- aiecs/infrastructure/graph_storage/postgres.py +1563 -0
- aiecs/infrastructure/graph_storage/property_storage.py +353 -0
- aiecs/infrastructure/graph_storage/protocols.py +76 -0
- aiecs/infrastructure/graph_storage/query_optimizer.py +642 -0
- aiecs/infrastructure/graph_storage/schema_cache.py +290 -0
- aiecs/infrastructure/graph_storage/sqlite.py +1373 -0
- aiecs/infrastructure/graph_storage/streaming.py +487 -0
- aiecs/infrastructure/graph_storage/tenant.py +412 -0
- aiecs/infrastructure/messaging/celery_task_manager.py +92 -54
- aiecs/infrastructure/messaging/websocket_manager.py +51 -35
- aiecs/infrastructure/monitoring/__init__.py +22 -0
- aiecs/infrastructure/monitoring/executor_metrics.py +45 -11
- aiecs/infrastructure/monitoring/global_metrics_manager.py +212 -0
- aiecs/infrastructure/monitoring/structured_logger.py +3 -7
- aiecs/infrastructure/monitoring/tracing_manager.py +63 -35
- aiecs/infrastructure/persistence/__init__.py +14 -1
- aiecs/infrastructure/persistence/context_engine_client.py +184 -0
- aiecs/infrastructure/persistence/database_manager.py +67 -43
- aiecs/infrastructure/persistence/file_storage.py +180 -103
- aiecs/infrastructure/persistence/redis_client.py +74 -21
- aiecs/llm/__init__.py +73 -25
- aiecs/llm/callbacks/__init__.py +11 -0
- aiecs/llm/{custom_callbacks.py → callbacks/custom_callbacks.py} +26 -19
- aiecs/llm/client_factory.py +230 -37
- aiecs/llm/client_resolver.py +155 -0
- aiecs/llm/clients/__init__.py +38 -0
- aiecs/llm/clients/base_client.py +328 -0
- aiecs/llm/clients/google_function_calling_mixin.py +415 -0
- aiecs/llm/clients/googleai_client.py +314 -0
- aiecs/llm/clients/openai_client.py +158 -0
- aiecs/llm/clients/openai_compatible_mixin.py +367 -0
- aiecs/llm/clients/vertex_client.py +1186 -0
- aiecs/llm/clients/xai_client.py +201 -0
- aiecs/llm/config/__init__.py +51 -0
- aiecs/llm/config/config_loader.py +272 -0
- aiecs/llm/config/config_validator.py +206 -0
- aiecs/llm/config/model_config.py +143 -0
- aiecs/llm/protocols.py +149 -0
- aiecs/llm/utils/__init__.py +10 -0
- aiecs/llm/utils/validate_config.py +89 -0
- aiecs/main.py +140 -121
- aiecs/scripts/aid/VERSION_MANAGEMENT.md +138 -0
- aiecs/scripts/aid/__init__.py +19 -0
- aiecs/scripts/aid/module_checker.py +499 -0
- aiecs/scripts/aid/version_manager.py +235 -0
- aiecs/scripts/{DEPENDENCY_SYSTEM_SUMMARY.md → dependance_check/DEPENDENCY_SYSTEM_SUMMARY.md} +1 -0
- aiecs/scripts/{README_DEPENDENCY_CHECKER.md → dependance_check/README_DEPENDENCY_CHECKER.md} +1 -0
- aiecs/scripts/dependance_check/__init__.py +15 -0
- aiecs/scripts/dependance_check/dependency_checker.py +1835 -0
- aiecs/scripts/{dependency_fixer.py → dependance_check/dependency_fixer.py} +192 -90
- aiecs/scripts/{download_nlp_data.py → dependance_check/download_nlp_data.py} +203 -71
- aiecs/scripts/dependance_patch/__init__.py +7 -0
- aiecs/scripts/dependance_patch/fix_weasel/__init__.py +11 -0
- aiecs/scripts/{fix_weasel_validator.py → dependance_patch/fix_weasel/fix_weasel_validator.py} +21 -14
- aiecs/scripts/{patch_weasel_library.sh → dependance_patch/fix_weasel/patch_weasel_library.sh} +1 -1
- aiecs/scripts/knowledge_graph/__init__.py +3 -0
- aiecs/scripts/knowledge_graph/run_threshold_experiments.py +212 -0
- aiecs/scripts/migrations/multi_tenancy/README.md +142 -0
- aiecs/scripts/tools_develop/README.md +671 -0
- aiecs/scripts/tools_develop/README_CONFIG_CHECKER.md +273 -0
- aiecs/scripts/tools_develop/TOOLS_CONFIG_GUIDE.md +1287 -0
- aiecs/scripts/tools_develop/TOOL_AUTO_DISCOVERY.md +234 -0
- aiecs/scripts/tools_develop/__init__.py +21 -0
- aiecs/scripts/tools_develop/check_all_tools_config.py +548 -0
- aiecs/scripts/tools_develop/check_type_annotations.py +257 -0
- aiecs/scripts/tools_develop/pre-commit-schema-coverage.sh +66 -0
- aiecs/scripts/tools_develop/schema_coverage.py +511 -0
- aiecs/scripts/tools_develop/validate_tool_schemas.py +475 -0
- aiecs/scripts/tools_develop/verify_executor_config_fix.py +98 -0
- aiecs/scripts/tools_develop/verify_tools.py +352 -0
- aiecs/tasks/__init__.py +0 -1
- aiecs/tasks/worker.py +115 -47
- aiecs/tools/__init__.py +194 -72
- aiecs/tools/apisource/__init__.py +99 -0
- aiecs/tools/apisource/intelligence/__init__.py +19 -0
- aiecs/tools/apisource/intelligence/data_fusion.py +632 -0
- aiecs/tools/apisource/intelligence/query_analyzer.py +417 -0
- aiecs/tools/apisource/intelligence/search_enhancer.py +385 -0
- aiecs/tools/apisource/monitoring/__init__.py +9 -0
- aiecs/tools/apisource/monitoring/metrics.py +330 -0
- aiecs/tools/apisource/providers/__init__.py +112 -0
- aiecs/tools/apisource/providers/base.py +671 -0
- aiecs/tools/apisource/providers/census.py +397 -0
- aiecs/tools/apisource/providers/fred.py +535 -0
- aiecs/tools/apisource/providers/newsapi.py +409 -0
- aiecs/tools/apisource/providers/worldbank.py +352 -0
- aiecs/tools/apisource/reliability/__init__.py +12 -0
- aiecs/tools/apisource/reliability/error_handler.py +363 -0
- aiecs/tools/apisource/reliability/fallback_strategy.py +376 -0
- aiecs/tools/apisource/tool.py +832 -0
- aiecs/tools/apisource/utils/__init__.py +9 -0
- aiecs/tools/apisource/utils/validators.py +334 -0
- aiecs/tools/base_tool.py +415 -21
- aiecs/tools/docs/__init__.py +121 -0
- aiecs/tools/docs/ai_document_orchestrator.py +607 -0
- aiecs/tools/docs/ai_document_writer_orchestrator.py +2350 -0
- aiecs/tools/docs/content_insertion_tool.py +1320 -0
- aiecs/tools/docs/document_creator_tool.py +1464 -0
- aiecs/tools/docs/document_layout_tool.py +1160 -0
- aiecs/tools/docs/document_parser_tool.py +1016 -0
- aiecs/tools/docs/document_writer_tool.py +2008 -0
- aiecs/tools/knowledge_graph/__init__.py +17 -0
- aiecs/tools/knowledge_graph/graph_reasoning_tool.py +807 -0
- aiecs/tools/knowledge_graph/graph_search_tool.py +944 -0
- aiecs/tools/knowledge_graph/kg_builder_tool.py +524 -0
- aiecs/tools/langchain_adapter.py +300 -138
- aiecs/tools/schema_generator.py +455 -0
- aiecs/tools/search_tool/__init__.py +100 -0
- aiecs/tools/search_tool/analyzers.py +581 -0
- aiecs/tools/search_tool/cache.py +264 -0
- aiecs/tools/search_tool/constants.py +128 -0
- aiecs/tools/search_tool/context.py +224 -0
- aiecs/tools/search_tool/core.py +778 -0
- aiecs/tools/search_tool/deduplicator.py +119 -0
- aiecs/tools/search_tool/error_handler.py +242 -0
- aiecs/tools/search_tool/metrics.py +343 -0
- aiecs/tools/search_tool/rate_limiter.py +172 -0
- aiecs/tools/search_tool/schemas.py +275 -0
- aiecs/tools/statistics/__init__.py +80 -0
- aiecs/tools/statistics/ai_data_analysis_orchestrator.py +646 -0
- aiecs/tools/statistics/ai_insight_generator_tool.py +508 -0
- aiecs/tools/statistics/ai_report_orchestrator_tool.py +684 -0
- aiecs/tools/statistics/data_loader_tool.py +555 -0
- aiecs/tools/statistics/data_profiler_tool.py +638 -0
- aiecs/tools/statistics/data_transformer_tool.py +580 -0
- aiecs/tools/statistics/data_visualizer_tool.py +498 -0
- aiecs/tools/statistics/model_trainer_tool.py +507 -0
- aiecs/tools/statistics/statistical_analyzer_tool.py +472 -0
- aiecs/tools/task_tools/__init__.py +49 -36
- aiecs/tools/task_tools/chart_tool.py +200 -184
- aiecs/tools/task_tools/classfire_tool.py +268 -267
- aiecs/tools/task_tools/image_tool.py +220 -141
- aiecs/tools/task_tools/office_tool.py +226 -146
- aiecs/tools/task_tools/pandas_tool.py +477 -121
- aiecs/tools/task_tools/report_tool.py +390 -142
- aiecs/tools/task_tools/research_tool.py +149 -79
- aiecs/tools/task_tools/scraper_tool.py +339 -145
- aiecs/tools/task_tools/stats_tool.py +448 -209
- aiecs/tools/temp_file_manager.py +26 -24
- aiecs/tools/tool_executor/__init__.py +18 -16
- aiecs/tools/tool_executor/tool_executor.py +364 -52
- aiecs/utils/LLM_output_structor.py +74 -48
- aiecs/utils/__init__.py +14 -3
- aiecs/utils/base_callback.py +0 -3
- aiecs/utils/cache_provider.py +696 -0
- aiecs/utils/execution_utils.py +50 -31
- aiecs/utils/prompt_loader.py +1 -0
- aiecs/utils/token_usage_repository.py +37 -11
- aiecs/ws/socket_server.py +14 -4
- {aiecs-1.0.1.dist-info → aiecs-1.7.17.dist-info}/METADATA +52 -15
- aiecs-1.7.17.dist-info/RECORD +337 -0
- aiecs-1.7.17.dist-info/entry_points.txt +13 -0
- aiecs/config/registry.py +0 -19
- aiecs/domain/context/content_engine.py +0 -982
- aiecs/llm/base_client.py +0 -99
- aiecs/llm/openai_client.py +0 -125
- aiecs/llm/vertex_client.py +0 -186
- aiecs/llm/xai_client.py +0 -184
- aiecs/scripts/dependency_checker.py +0 -857
- aiecs/scripts/quick_dependency_check.py +0 -269
- aiecs/tools/task_tools/search_api.py +0 -7
- aiecs-1.0.1.dist-info/RECORD +0 -90
- aiecs-1.0.1.dist-info/entry_points.txt +0 -7
- /aiecs/scripts/{setup_nlp_data.sh → dependance_check/setup_nlp_data.sh} +0 -0
- /aiecs/scripts/{README_WEASEL_PATCH.md → dependance_patch/fix_weasel/README_WEASEL_PATCH.md} +0 -0
- /aiecs/scripts/{fix_weasel_validator.sh → dependance_patch/fix_weasel/fix_weasel_validator.sh} +0 -0
- /aiecs/scripts/{run_weasel_patch.sh → dependance_patch/fix_weasel/run_weasel_patch.sh} +0 -0
- {aiecs-1.0.1.dist-info → aiecs-1.7.17.dist-info}/WHEEL +0 -0
- {aiecs-1.0.1.dist-info → aiecs-1.7.17.dist-info}/licenses/LICENSE +0 -0
- {aiecs-1.0.1.dist-info → aiecs-1.7.17.dist-info}/top_level.txt +0 -0
aiecs/tools/task_tools/classfire_tool.py

@@ -1,53 +1,63 @@
+from aiecs.tools import register_tool
+from aiecs.tools.tool_executor import (
+    validate_input,
+)
+from aiecs.tools.base_tool import BaseTool
 import os
 import re
 import logging
 import asyncio
 import time
-from typing import Dict, Any, List, Optional,
+from typing import Dict, Any, List, Optional, Tuple
 from enum import Enum

-from pydantic import BaseModel, Field, field_validator
+from pydantic import BaseModel, Field, field_validator
+from pydantic_settings import BaseSettings, SettingsConfigDict

 # Lazy imports for heavy dependencies
 rake_nltk = None
 spacy = None

+
 def _init_heavy_dependencies():
     """Initialize heavy dependencies when actually needed"""
     global rake_nltk, spacy
-
+
     if rake_nltk is None:
         try:
-            import rake_nltk as _rake_nltk
+            import rake_nltk as _rake_nltk  # type: ignore[import-untyped]
+
             rake_nltk = _rake_nltk
         except ImportError:
             import logging
+
             logging.getLogger(__name__).error("rake_nltk not available")
-
+
     if spacy is None:
         try:
             import spacy as _spacy
+
             spacy = _spacy
         except ImportError:
             import logging
+
             logging.getLogger(__name__).warning("spacy not available (optional)")

-from aiecs.tools import register_tool
-from aiecs.tools.base_tool import BaseTool
-from aiecs.tools.tool_executor import (
-    validate_input,
-)

 # Enums for configuration options
+
+
 class Language(str, Enum):
     ENGLISH = "en"
     CHINESE = "zh"
     AUTO = "auto"

+
 class ModelType(str, Enum):
     SPACY_ENGLISH = "en_core_web_sm"
     SPACY_CHINESE = "zh_core_web_sm"

+
 @register_tool("classifier")
 class ClassifierTool(BaseTool):
     """
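The refactor moves the aiecs imports to the top of the module but keeps `rake_nltk` and `spacy` behind the `_init_heavy_dependencies()` gate, so importing the tool stays cheap. A minimal standalone sketch of that sentinel pattern (`heavy_lib` is a placeholder name, not an aiecs symbol; `json` stands in for a genuinely slow import):

```python
# Module-level sentinel: stays None until the dependency is first needed.
heavy_lib = None

def _init_heavy_lib():
    """Import the heavy dependency on first use and cache it globally."""
    global heavy_lib
    if heavy_lib is None:
        try:
            import json as _heavy_lib  # stand-in for a slow import
            heavy_lib = _heavy_lib
        except ImportError:
            heavy_lib = None  # caller decides whether this is fatal

def first_use() -> str:
    _init_heavy_lib()  # pays the import cost exactly once
    if heavy_lib is None:
        raise ImportError("heavy_lib not available")
    return heavy_lib.dumps({"ok": True})

print(first_use())  # {"ok": true}
```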
@@ -69,182 +79,126 @@ class ClassifierTool(BaseTool):
     """

     # Configuration schema
-    class Config(
-        """Configuration for the classifier tool
+    class Config(BaseSettings):
+        """Configuration for the classifier tool
+
+        Automatically reads from environment variables with CLASSIFIER_TOOL_ prefix.
+        Example: CLASSIFIER_TOOL_MAX_WORKERS -> max_workers
+        """
+
+        model_config = SettingsConfigDict(env_prefix="CLASSIFIER_TOOL_")
+
         max_workers: int = Field(
             default=min(32, (os.cpu_count() or 4) * 2),
-            description="Maximum number of worker threads"
+            description="Maximum number of worker threads",
         )
         pipeline_cache_ttl: int = Field(
             default=3600,
-            description="Time-to-live for pipeline cache in seconds"
-        )
-        pipeline_cache_size: int = Field(
-            default=10,
-            description="Maximum number of pipeline cache entries"
-        )
-        max_text_length: int = Field(
-            default=10_000,
-            description="Maximum text length in characters"
-        )
-        spacy_model_en: str = Field(
-            default="en_core_web_sm",
-            description="spaCy model for English"
-        )
-        spacy_model_zh: str = Field(
-            default="zh_core_web_sm",
-            description="spaCy model for Chinese"
+            description="Time-to-live for pipeline cache in seconds",
         )
+        pipeline_cache_size: int = Field(default=10, description="Maximum number of pipeline cache entries")
+        max_text_length: int = Field(default=10_000, description="Maximum text length in characters")
+        spacy_model_en: str = Field(default="en_core_web_sm", description="spaCy model for English")
+        spacy_model_zh: str = Field(default="zh_core_web_sm", description="spaCy model for Chinese")
         allowed_models: List[str] = Field(
-            default=[
-
-                "zh_core_web_sm"
-            ],
-            description="List of allowed spaCy models"
-        )
-        rate_limit_enabled: bool = Field(
-            default=True,
-            description="Enable rate limiting"
+            default=["en_core_web_sm", "zh_core_web_sm"],
+            description="List of allowed spaCy models",
         )
-
-
-
-        )
-        rate_limit_window: int = Field(
-            default=60,
-            description="Rate limit window in seconds"
-        )
-        use_rake_for_english: bool = Field(
-            default=True,
-            description="Use RAKE for English phrase extraction"
-        )
-
-        model_config = ConfigDict(env_prefix="CLASSIFIER_TOOL_")
+        rate_limit_enabled: bool = Field(default=True, description="Enable rate limiting")
+        rate_limit_requests: int = Field(default=100, description="Maximum requests per window")
+        rate_limit_window: int = Field(default=60, description="Rate limit window in seconds")
+        use_rake_for_english: bool = Field(default=True, description="Use RAKE for English phrase extraction")

     # Base schema for text operations
     class BaseTextSchema(BaseModel):
         """Base schema for text operations"""
-
-
-        )
+
+        text: str = Field(description="Text to process")

         @field_validator("text")
         @classmethod
         def check_length_and_content(cls, v: str) -> str:
             if len(v) > 10_000:  # Using a constant here for validation
-                raise ValueError(
+                raise ValueError("Text length exceeds 10,000 characters")
             # Check for malicious patterns (e.g., SQL injection)
-            if re.search(
+            if re.search(
+                r"(\bSELECT\b|\bINSERT\b|\bDELETE\b|--|;|/\*)",
+                v,
+                re.IGNORECASE,
+            ):
                 raise ValueError("Text contains potentially malicious content")
             return v

     # Input schemas for operations
     class ClassifySchema(BaseTextSchema):
-        """Schema for
-
-
-
-        )
-        language: Optional[Language] = Field(
-            default=None,
-            description="Language of the text"
-        )
+        """Schema for classify operation"""
+
+        model: Optional[str] = Field(default=None, description="Model to use for classification")
+        language: Optional[Language] = Field(default=None, description="Language of the text")

         @field_validator("model")
         @classmethod
         def check_model(cls, v: Optional[str]) -> Optional[str]:
-            allowed_models = [
-                "en_core_web_sm",
-                "zh_core_web_sm"
-            ]
+            allowed_models = ["en_core_web_sm", "zh_core_web_sm"]
             if v and v not in allowed_models:
                 raise ValueError(f"Model '{v}' not in allowed spaCy models: {allowed_models}")
             return v

     class TokenizeSchema(BaseTextSchema):
-        """Schema for
-        language: Optional[Language] = Field(
-            default=None,
-            description="Language of the text"
-        )
+        """Schema for tokenize operation"""

-
-
-
-
-
-        )
+        language: Optional[Language] = Field(default=None, description="Language of the text")
+
+    class Pos_tagSchema(BaseTextSchema):
+        """Schema for pos_tag operation"""
+
+        language: Optional[Language] = Field(default=None, description="Language of the text")

     class NERSchema(BaseTextSchema):
-        """Schema for
-
-
-            description="Language of the text"
-        )
+        """Schema for ner operation"""
+
+        language: Optional[Language] = Field(default=None, description="Language of the text")

     class LemmatizeSchema(BaseTextSchema):
-        """Schema for
-        language: Optional[Language] = Field(
-            default=None,
-            description="Language of the text"
-        )
+        """Schema for lemmatize operation"""

-
-        """Schema for dependency parsing"""
-        language: Optional[Language] = Field(
-            default=None,
-            description="Language of the text"
-        )
+        language: Optional[Language] = Field(default=None, description="Language of the text")

-    class
-        """Schema for
-
-
-
-
-
-
-
-        )
+    class Dependency_parseSchema(BaseTextSchema):
+        """Schema for dependency_parse operation"""
+
+        language: Optional[Language] = Field(default=None, description="Language of the text")
+
+    class Keyword_extractSchema(BaseTextSchema):
+        """Schema for keyword_extract operation"""
+
+        top_k: int = Field(default=10, description="Number of keywords to extract")
+        language: Optional[Language] = Field(default=None, description="Language of the text")
         extract_phrases: bool = Field(
             default=True,
-            description="Whether to extract phrases or just keywords"
+            description="Whether to extract phrases or just keywords",
         )

     class SummarizeSchema(BaseTextSchema):
-        """Schema for
-
-
-
-        )
-        language: Optional[Language] = Field(
-            default=None,
-            description="Language of the text"
-        )
+        """Schema for summarize operation"""
+
+        max_length: int = Field(default=150, description="Maximum length of the summary")
+        language: Optional[Language] = Field(default=None, description="Language of the text")

-    class
+    class Batch_processSchema(BaseModel):
         """Schema for batch processing"""
-
-
-        )
-
-
-        )
-        language: Optional[Language] = Field(
-            default=None,
-            description="Language of the texts"
-        )
-        model: Optional[str] = Field(
-            default=None,
-            description="Model to use for processing"
-        )
+
+        texts: List[str] = Field(description="List of texts to process")
+        operation: str = Field(description="Operation to perform on each text")
+        language: Optional[Language] = Field(default=None, description="Language of the texts")
+        model: Optional[str] = Field(default=None, description="Model to use for processing")
         top_k: Optional[int] = Field(
             default=None,
-            description="Number of keywords to extract (for keyword_extract)"
+            description="Number of keywords to extract (for keyword_extract)",
         )
         max_length: Optional[int] = Field(
             default=None,
-            description="Maximum length of the summary (for summarize)"
+            description="Maximum length of the summary (for summarize)",
         )

         @field_validator("texts")
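The central change in this hunk is the move from a plain pydantic `BaseModel` with `ConfigDict` to pydantic-settings' `BaseSettings` with `SettingsConfigDict(env_prefix="CLASSIFIER_TOOL_")`, so every config field can now be overridden by a prefixed environment variable. A minimal sketch of the mechanism (hypothetical `DemoConfig`, not the aiecs class):

```python
import os

from pydantic import Field
from pydantic_settings import BaseSettings, SettingsConfigDict


class DemoConfig(BaseSettings):
    """Reads DEMO_TOOL_-prefixed environment variables."""

    model_config = SettingsConfigDict(env_prefix="DEMO_TOOL_")

    max_workers: int = Field(default=8, description="Maximum number of worker threads")


os.environ["DEMO_TOOL_MAX_WORKERS"] = "4"
print(DemoConfig().max_workers)  # 4: the environment variable overrides the default
```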
@@ -252,8 +206,12 @@ class ClassifierTool(BaseTool):
         def check_texts(cls, v: List[str]) -> List[str]:
             for text in v:
                 if len(text) > 10_000:  # Using a constant here for validation
-                    raise ValueError(
-                if re.search(
+                    raise ValueError("Text length exceeds 10,000 characters")
+                if re.search(
+                    r"(\bSELECT\b|\bINSERT\b|\bDELETE\b|--|;|/\*)",
+                    text,
+                    re.IGNORECASE,
+                ):
                     raise ValueError("Text contains potentially malicious content")
             return v

@@ -266,24 +224,31 @@ class ClassifierTool(BaseTool):

         Raises:
             ValueError: If config contains invalid settings.
+
+        Configuration is automatically loaded by BaseTool from:
+        1. Explicit config dict (highest priority)
+        2. YAML config files (config/tools/classifier.yaml)
+        3. Environment variables (via dotenv from .env files)
+        4. Tool defaults (lowest priority)
         """
         super().__init__(config)

-        #
-
+        # Configuration is automatically loaded by BaseTool into self._config_obj
+        # Access config via self._config_obj (BaseSettings instance)
+        self.config = self._config_obj if self._config_obj else self.Config()

         # Set up logger
         self.logger = logging.getLogger(__name__)
         if not self.logger.handlers:
             handler = logging.StreamHandler()
-            handler.setFormatter(logging.Formatter(
+            handler.setFormatter(logging.Formatter("%(asctime)s %(levelname)s %(message)s"))
             self.logger.addHandler(handler)
             self.logger.setLevel(logging.INFO)

         # Initialize resources
-        self._spacy_nlp = {}  # Language -> spaCy pipeline
-        self._metrics = {
-        self._request_timestamps = []
+        self._spacy_nlp: Dict[str, Any] = {}  # Language -> spaCy pipeline
+        self._metrics = {"requests": 0, "cache_hits": 0, "processing_time": []}
+        self._request_timestamps: List[float] = []

     def _get_sentiment_lexicon(self, language: str) -> Dict[str, float]:
         """
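The new constructor docstring documents a four-level precedence for tool configuration. The BaseTool loader itself is not part of this diff; a toy dict-merge illustration of the documented order (hypothetical values only):

```python
# Merged last wins, so the explicit config dict takes the highest priority.
defaults = {"max_workers": 8, "rate_limit_enabled": True}  # 4. tool defaults
env_vars = {"max_workers": 16}                             # 3. environment variables
yaml_cfg = {"rate_limit_enabled": False}                   # 2. YAML config file
explicit = {"max_workers": 4}                              # 1. explicit config dict

merged = {**defaults, **env_vars, **yaml_cfg, **explicit}
print(merged)  # {'max_workers': 4, 'rate_limit_enabled': False}
```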
@@ -295,22 +260,66 @@ class ClassifierTool(BaseTool):
         Returns:
             Dict[str, float]: Sentiment lexicon with word -> score mapping.
         """
-        if language ==
+        if language == "en":
             # Simple English sentiment lexicon
             return {
-
-
-
-
-
-
+                "good": 1.0,
+                "great": 1.5,
+                "excellent": 2.0,
+                "amazing": 2.0,
+                "wonderful": 1.5,
+                "fantastic": 2.0,
+                "awesome": 1.5,
+                "perfect": 2.0,
+                "love": 1.5,
+                "like": 1.0,
+                "happy": 1.5,
+                "pleased": 1.0,
+                "satisfied": 1.0,
+                "positive": 1.0,
+                "best": 2.0,
+                "bad": -1.0,
+                "terrible": -2.0,
+                "awful": -2.0,
+                "horrible": -2.0,
+                "hate": -2.0,
+                "dislike": -1.0,
+                "sad": -1.5,
+                "angry": -1.5,
+                "disappointed": -1.5,
+                "negative": -1.0,
+                "worst": -2.0,
+                "poor": -1.0,
+                "fail": -1.5,
+                "wrong": -1.0,
+                "problem": -1.0,
             }
         else:  # Chinese
             return {
-
-
-
-
+                "好": 1.0,
+                "很好": 1.5,
+                "非常好": 2.0,
+                "棒": 1.5,
+                "优秀": 2.0,
+                "完美": 2.0,
+                "喜欢": 1.5,
+                "爱": 2.0,
+                "满意": 1.0,
+                "开心": 1.5,
+                "高兴": 1.5,
+                "积极": 1.0,
+                "坏": -1.0,
+                "很坏": -1.5,
+                "糟糕": -2.0,
+                "讨厌": -2.0,
+                "恨": -2.0,
+                "失望": -1.5,
+                "生气": -1.5,
+                "愤怒": -2.0,
+                "消极": -1.0,
+                "问题": -1.0,
+                "错误": -1.0,
+                "失败": -1.5,
             }

     def _get_spacy(self, language: str) -> Any:
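`classify` (unchanged in this hunk) scores text against these lexicons by summing per-token values and labelling by the sign. An illustrative sketch of that lexicon approach, not the exact aiecs scoring code:

```python
def lexicon_sentiment(tokens: list[str], lexicon: dict[str, float]) -> tuple[str, float]:
    """Sum per-token lexicon scores; the sign of the total gives the label."""
    score = sum(lexicon.get(tok.lower(), 0.0) for tok in tokens)
    label = "positive" if score > 0 else "negative" if score < 0 else "neutral"
    return label, score


lexicon = {"good": 1.0, "terrible": -2.0}
print(lexicon_sentiment(["a", "good", "day"], lexicon))  # ('positive', 1.0)
```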
@@ -327,11 +336,12 @@ class ClassifierTool(BaseTool):
         if spacy is None:
             try:
                 import spacy as spacy_module
+
                 spacy = spacy_module
             except ImportError:
                 raise ImportError("spaCy is required but not installed. Please install it with: pip install spacy")

-        model = self.config.spacy_model_zh if language ==
+        model = self.config.spacy_model_zh if language == "zh" else self.config.spacy_model_en
         return spacy.load(model, disable=["textcat"])

     def _detect_language(self, text: str) -> str:
@@ -346,17 +356,17 @@ class ClassifierTool(BaseTool):
         """
         try:
             # Count Chinese characters (CJK Unified Ideographs)
-            chinese_chars = sum(1 for char in text if
+            chinese_chars = sum(1 for char in text if "\u4e00" <= char <= "\u9fff")
             total_chars = len([char for char in text if char.isalpha()])

             if total_chars == 0:
-                return
+                return "en"

             # If more than 30% are Chinese characters, consider it Chinese
             chinese_ratio = chinese_chars / total_chars
-            return
+            return "zh" if chinese_ratio > 0.3 else "en"
         except Exception:
-            return
+            return "en"

     def _check_rate_limit(self) -> bool:
         """
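The restored string literals make the heuristic explicit: characters in the CJK Unified Ideographs block (U+4E00 to U+9FFF) are counted, and the text is treated as Chinese once they exceed 30% of the alphabetic characters. The same logic as a standalone function:

```python
def detect_language(text: str) -> str:
    """Return "zh" when more than 30% of alphabetic chars are CJK ideographs."""
    chinese_chars = sum(1 for ch in text if "\u4e00" <= ch <= "\u9fff")
    total_chars = len([ch for ch in text if ch.isalpha()])
    if total_chars == 0:
        return "en"
    return "zh" if chinese_chars / total_chars > 0.3 else "en"


print(detect_language("今天天气很好"))         # zh
print(detect_language("The weather is nice"))  # en
```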
@@ -373,8 +383,7 @@ class ClassifierTool(BaseTool):
         # Get lock from executor
         with self._executor.get_lock("rate_limit"):
             # Remove timestamps outside the window
-            self._request_timestamps = [ts for ts in self._request_timestamps
-                                        if current_time - ts <= self.config.rate_limit_window]
+            self._request_timestamps = [ts for ts in self._request_timestamps if current_time - ts <= self.config.rate_limit_window]

             # Check if we're at the limit
             if len(self._request_timestamps) >= self.config.rate_limit_requests:
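`_check_rate_limit` is a sliding-window limiter: timestamps older than the window are pruned, then the remainder is compared against `rate_limit_requests`. A self-contained sketch of the same idea (the aiecs version additionally serializes access through a lock obtained from its executor):

```python
import time


class SlidingWindowLimiter:
    def __init__(self, max_requests: int = 100, window_s: int = 60):
        self.max_requests = max_requests
        self.window_s = window_s
        self._timestamps: list[float] = []

    def allow(self) -> bool:
        now = time.time()
        # Drop timestamps that fell out of the window
        self._timestamps = [ts for ts in self._timestamps if now - ts <= self.window_s]
        if len(self._timestamps) >= self.max_requests:
            return False
        self._timestamps.append(now)
        return True


limiter = SlidingWindowLimiter(max_requests=2, window_s=60)
print([limiter.allow() for _ in range(3)])  # [True, True, False]
```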
@@ -398,10 +407,10 @@ class ClassifierTool(BaseTool):
         try:
             # Initialize heavy dependencies if needed
             _init_heavy_dependencies()
-
+
             if rake_nltk is None:
                 raise ImportError("rake_nltk not available")
-
+
             rake = rake_nltk.Rake()
             rake.extract_keywords_from_text(text)
             phrases = rake.get_ranked_phrases()[:top_k]
@@ -409,9 +418,9 @@ class ClassifierTool(BaseTool):
         except Exception as e:
             self.logger.error(f"Error extracting English phrases: {e}")
             # Fallback to simple keyword extraction
-            nlp = self._get_spacy(
+            nlp = self._get_spacy("en")
             doc = nlp(text)
-            keywords = [token.text for token in doc if token.pos_ in (
+            keywords = [token.text for token in doc if token.pos_ in ("NOUN", "PROPN")][:top_k]
             return keywords

     def _extract_chinese_phrases(self, text: str, top_k: int) -> List[str]:
@@ -426,7 +435,7 @@ class ClassifierTool(BaseTool):
             List[str]: Extracted phrases.
         """
         try:
-            nlp = self._get_spacy(
+            nlp = self._get_spacy("zh")
             doc = nlp(text)

             # Extract noun phrases and named entities
@@ -444,7 +453,7 @@ class ClassifierTool(BaseTool):

             # Add important nouns and proper nouns
             for token in doc:
-                if token.pos_ in (
+                if token.pos_ in ("NOUN", "PROPN") and len(token.text.strip()) > 1:
                     phrases.append(token.text.strip())

             # Remove duplicates and return top_k
@@ -455,9 +464,9 @@ class ClassifierTool(BaseTool):
             self.logger.error(f"Error extracting Chinese phrases with spaCy: {e}")
             # Fallback to simple noun extraction
             try:
-                nlp = self._get_spacy(
+                nlp = self._get_spacy("zh")
                 doc = nlp(text)
-                nouns = [token.text for token in doc if token.pos_ in (
+                nouns = [token.text for token in doc if token.pos_ in ("NOUN", "PROPN")]
                 return nouns[:top_k]
             except Exception:
                 return []
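English phrase extraction runs rake_nltk's `Rake` and falls back to spaCy noun and proper-noun tokens on any failure. A compact sketch of that try/fallback shape (assumes the `en_core_web_sm` model and NLTK stopword data are installed):

```python
def extract_phrases(text: str, top_k: int = 10) -> list[str]:
    try:
        from rake_nltk import Rake
        rake = Rake()
        rake.extract_keywords_from_text(text)
        return rake.get_ranked_phrases()[:top_k]
    except Exception:
        # Fallback: keep nouns and proper nouns via spaCy POS tags
        import spacy
        doc = spacy.load("en_core_web_sm")(text)
        return [tok.text for tok in doc if tok.pos_ in ("NOUN", "PROPN")][:top_k]


print(extract_phrases("Rapid keyword extraction works on short documents."))
```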
@@ -478,14 +487,20 @@ class ClassifierTool(BaseTool):
             ValueError: If the pipeline creation fails.
         """
         try:
-            from transformers import pipeline
+            from transformers import pipeline  # type: ignore[import-not-found]
+
             return pipeline(task, model=model)
         except ImportError:
             raise ImportError("transformers library is required for summarization but not installed. Please install it with: pip install transformers")
         except Exception as e:
             raise ValueError(f"Error creating pipeline for task '{task}' with model '{model}': {e}")

-    async def classify(
+    async def classify(
+        self,
+        text: str,
+        model: Optional[str] = None,
+        language: Optional[str] = None,
+    ) -> List[Dict[str, Any]]:
         """
         Perform sentiment classification on text using spaCy and lexicon-based approach.

@@ -503,16 +518,12 @@ class ClassifierTool(BaseTool):
         language = language or self._detect_language(text)

         # Get spaCy pipeline and sentiment lexicon
-        nlp = await asyncio.get_event_loop().run_in_executor(
-            None, self._get_spacy, language
-        )
+        nlp = await asyncio.get_event_loop().run_in_executor(None, self._get_spacy, language)

         sentiment_lexicon = self._get_sentiment_lexicon(language)

         # Process text with spaCy
-        doc = await asyncio.get_event_loop().run_in_executor(
-            None, nlp, text
-        )
+        doc = await asyncio.get_event_loop().run_in_executor(None, nlp, text)

         # Calculate sentiment score
         sentiment_score = 0.0
@@ -556,13 +567,9 @@ class ClassifierTool(BaseTool):

         language = language or self._detect_language(text)

-        nlp = await asyncio.get_event_loop().run_in_executor(
-            None, self._get_spacy, language
-        )
+        nlp = await asyncio.get_event_loop().run_in_executor(None, self._get_spacy, language)

-        doc = await asyncio.get_event_loop().run_in_executor(
-            None, nlp, text
-        )
+        doc = await asyncio.get_event_loop().run_in_executor(None, nlp, text)

         return [token.text for token in doc]

@@ -582,18 +589,12 @@ class ClassifierTool(BaseTool):

         language = language or self._detect_language(text)

-        nlp = await asyncio.get_event_loop().run_in_executor(
-            None, self._get_spacy, language
-        )
+        nlp = await asyncio.get_event_loop().run_in_executor(None, self._get_spacy, language)

-        doc = await asyncio.get_event_loop().run_in_executor(
-            None, nlp, text
-        )
+        doc = await asyncio.get_event_loop().run_in_executor(None, nlp, text)

         return [(token.text, token.pos_) for token in doc]

-    @validate_input(NERSchema)
-
     async def ner(self, text: str, language: Optional[str] = None) -> List[Dict[str, Any]]:
         """
         Perform named entity recognition.
@@ -610,21 +611,20 @@ class ClassifierTool(BaseTool):

         language = language or self._detect_language(text)

-        nlp = await asyncio.get_event_loop().run_in_executor(
-            None, self._get_spacy, language
-        )
+        nlp = await asyncio.get_event_loop().run_in_executor(None, self._get_spacy, language)

-        doc = await asyncio.get_event_loop().run_in_executor(
-            None, nlp, text
-        )
+        doc = await asyncio.get_event_loop().run_in_executor(None, nlp, text)

         return [
-            {
+            {
+                "text": ent.text,
+                "label": ent.label_,
+                "start": ent.start_char,
+                "end": ent.end_char,
+            }
             for ent in doc.ents
         ]

-    @validate_input(LemmatizeSchema)
-
     async def lemmatize(self, text: str, language: Optional[str] = None) -> List[str]:
         """
         Lemmatize tokens in text using spaCy.
@@ -641,19 +641,14 @@ class ClassifierTool(BaseTool):

         language = language or self._detect_language(text)

-        nlp = await asyncio.get_event_loop().run_in_executor(
-            None, self._get_spacy, language
-        )
+        nlp = await asyncio.get_event_loop().run_in_executor(None, self._get_spacy, language)

-        doc = await asyncio.get_event_loop().run_in_executor(
-            None, nlp, text
-        )
+        doc = await asyncio.get_event_loop().run_in_executor(None, nlp, text)

-        # For Chinese, lemma might be the same as text, but spaCy handles it
+        # For Chinese, lemma might be the same as text, but spaCy handles it
+        # consistently
         return [token.lemma_ for token in doc]

-    @validate_input(DependencyParseSchema)
-
     async def dependency_parse(self, text: str, language: Optional[str] = None) -> List[Dict[str, Any]]:
         """
         Perform dependency parsing using spaCy (supports both English and Chinese).
@@ -670,27 +665,27 @@ class ClassifierTool(BaseTool):

         language = language or self._detect_language(text)

-        nlp = await asyncio.get_event_loop().run_in_executor(
-            None, self._get_spacy, language
-        )
+        nlp = await asyncio.get_event_loop().run_in_executor(None, self._get_spacy, language)

-        doc = await asyncio.get_event_loop().run_in_executor(
-            None, nlp, text
-        )
+        doc = await asyncio.get_event_loop().run_in_executor(None, nlp, text)

         return [
             {
                 "text": token.text,
                 "head": token.head.text,
                 "dep": token.dep_,
-                "pos": token.pos_
+                "pos": token.pos_,
             }
             for token in doc
         ]

-
-
-
+    async def keyword_extract(
+        self,
+        text: str,
+        top_k: int = 10,
+        language: Optional[str] = None,
+        extract_phrases: bool = True,
+    ) -> List[str]:
         """
         Extract keywords or key phrases from text using spaCy.

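Across these methods the blocking spaCy work was already pushed off the event loop with `run_in_executor`; the refactor collapses each call onto one line and drops several `@validate_input(...)` decorators. A minimal standalone sketch of the executor pattern (`blocking_nlp` is a stand-in for a CPU-bound spaCy call):

```python
import asyncio


def blocking_nlp(text: str) -> list[str]:
    """Stand-in for a CPU-bound spaCy call."""
    return text.split()


async def tokenize(text: str) -> list[str]:
    loop = asyncio.get_event_loop()
    # Runs the sync function in the default thread pool executor
    return await loop.run_in_executor(None, blocking_nlp, text)


print(asyncio.run(tokenize("hello async world")))  # ['hello', 'async', 'world']
```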
@@ -708,42 +703,28 @@ class ClassifierTool(BaseTool):

         language = language or self._detect_language(text)

-        if language ==
+        if language == "zh":
             if extract_phrases:
-                return await asyncio.get_event_loop().run_in_executor(
-                    None, self._extract_chinese_phrases, text, top_k
-                )
+                return await asyncio.get_event_loop().run_in_executor(None, self._extract_chinese_phrases, text, top_k)
             else:
                 # Extract simple keywords using spaCy
-                nlp = await asyncio.get_event_loop().run_in_executor(
-                    None, self._get_spacy, language
-                )
+                nlp = await asyncio.get_event_loop().run_in_executor(None, self._get_spacy, language)

-                doc = await asyncio.get_event_loop().run_in_executor(
-                    None, nlp, text
-                )
+                doc = await asyncio.get_event_loop().run_in_executor(None, nlp, text)

-                keywords = [token.text for token in doc if token.pos_ in (
+                keywords = [token.text for token in doc if token.pos_ in ("NOUN", "PROPN")][:top_k]
                 return keywords
         else:  # English or other languages
             if extract_phrases and self.config.use_rake_for_english:
-                return await asyncio.get_event_loop().run_in_executor(
-                    None, self._extract_english_phrases, text, top_k
-                )
+                return await asyncio.get_event_loop().run_in_executor(None, self._extract_english_phrases, text, top_k)
             else:
-                nlp = await asyncio.get_event_loop().run_in_executor(
-                    None, self._get_spacy, language
-                )
+                nlp = await asyncio.get_event_loop().run_in_executor(None, self._get_spacy, language)

-                doc = await asyncio.get_event_loop().run_in_executor(
-                    None, nlp, text
-                )
+                doc = await asyncio.get_event_loop().run_in_executor(None, nlp, text)

-                keywords = [token.text for token in doc if token.pos_ in (
+                keywords = [token.text for token in doc if token.pos_ in ("NOUN", "PROPN")][:top_k]
                 return keywords

-    @validate_input(SummarizeSchema)
-
     async def summarize(self, text: str, max_length: int = 150, language: Optional[str] = None) -> str:
         """
         Summarize text.
@@ -761,22 +742,21 @@ class ClassifierTool(BaseTool):

         language = language or self._detect_language(text)
         # Use appropriate models for summarization
-        if language ==
+        if language == "en":
             model = "facebook/bart-large-cnn"
         else:
             # For Chinese and other languages, use a multilingual model
-            # For now, use t5-base, but consider using a Chinese-specific model
+            # For now, use t5-base, but consider using a Chinese-specific model
+            # in the future
             model = "t5-base"

-        pipe = await asyncio.get_event_loop().run_in_executor(
-            None, self._get_hf_pipeline, "summarization", model
-        )
+        pipe = await asyncio.get_event_loop().run_in_executor(None, self._get_hf_pipeline, "summarization", model)

         # Different models use different parameter names for length control
         if model.startswith("t5"):
             # T5 models use max_new_tokens instead of max_length
             # For Chinese text, use a more conservative approach
-            if language ==
+            if language == "zh":
                 # Chinese text: use character count and be more conservative
                 input_chars = len(text)
                 max_new_tokens = min(max_length, max(input_chars // 4, 5))
@@ -786,13 +766,21 @@ class ClassifierTool(BaseTool):
                 input_words = len(text.split())
                 max_new_tokens = min(max_length, max(input_words // 2, 10))
                 min_new_tokens = 5
-
+
             result = await asyncio.get_event_loop().run_in_executor(
-                None,
+                None,
+                lambda: pipe(
+                    text,
+                    max_new_tokens=max_new_tokens,
+                    min_new_tokens=min_new_tokens,
+                    do_sample=False,
+                )[
+                    0
+                ]["summary_text"],
             )
         else:
             # BART and other models use max_length
-            if language ==
+            if language == "zh":
                 # Chinese text: use character count
                 input_chars = len(text)
                 max_len = min(max_length, max(input_chars // 4, 10))
@@ -802,18 +790,30 @@ class ClassifierTool(BaseTool):
                 input_words = len(text.split())
                 max_len = min(max_length, max(input_words // 2, 20))
                 min_len = 10
-
+
             result = await asyncio.get_event_loop().run_in_executor(
-                None,
+                None,
+                lambda: pipe(
+                    text,
+                    max_length=max_len,
+                    min_length=min_len,
+                    do_sample=False,
+                )[
+                    0
+                ]["summary_text"],
             )

         return result

-
-
-
-
-
+    async def batch_process(
+        self,
+        texts: List[str],
+        operation: str,
+        language: Optional[str] = None,
+        model: Optional[str] = None,
+        top_k: Optional[int] = None,
+        max_length: Optional[int] = None,
+    ) -> List[Any]:
         """
         Process multiple texts with the specified operation.

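`summarize` branches on the model family because the two summarizers take different length controls: the T5 path passes `max_new_tokens`/`min_new_tokens`, while the BART path keeps `max_length`/`min_length`. A sketch mirroring the two call shapes from the diff (downloads both models on first run):

```python
from transformers import pipeline

text = "Long input text to be summarized " * 20

# BART-style: length bounds cover the total output
bart = pipeline("summarization", model="facebook/bart-large-cnn")
print(bart(text, max_length=40, min_length=10, do_sample=False)[0]["summary_text"])

# T5-style: bound only the newly generated tokens
t5 = pipeline("summarization", model="t5-base")
print(t5(text, max_new_tokens=40, min_new_tokens=5, do_sample=False)[0]["summary_text"])
```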
@@ -834,7 +834,7 @@ class ClassifierTool(BaseTool):
         # Prepare operations to execute in batch
         operations = []
         for text in texts:
-            kwargs = {"text": text}
+            kwargs: Dict[str, Any] = {"text": text}
             if language:
                 kwargs["language"] = language
             if model and operation == "classify":
@@ -861,23 +861,24 @@ class ClassifierTool(BaseTool):
             "metrics": {
                 "requests": self._metrics["requests"],
                 "cache_hits": self._metrics["cache_hits"],
-                "avg_processing_time":
-
+                "avg_processing_time": (
+                    sum(float(t) for t in processing_times) / len(processing_times)
+                    if (processing_times := self._metrics.get("processing_time")) and isinstance(processing_times, list) and len(processing_times) > 0
+                    else 0.0
+                ),
             },
             "config": {
                 "max_workers": self.config.max_workers,
                 "pipeline_cache_size": self.config.pipeline_cache_size,
                 "rate_limit_enabled": self.config.rate_limit_enabled,
                 "rate_limit_requests": self.config.rate_limit_requests,
-                "rate_limit_window": self.config.rate_limit_window
-            }
+                "rate_limit_window": self.config.rate_limit_window,
+            },
         }

         # Check if models can be loaded
         try:
-            await asyncio.get_event_loop().run_in_executor(
-                None, self._get_spacy, "en"
-            )
+            await asyncio.get_event_loop().run_in_executor(None, self._get_spacy, "en")
             result["models"] = {"spacy_en": "ok"}
         except Exception as e:
             result["status"] = "warning"
@@ -893,7 +894,7 @@ class ClassifierTool(BaseTool):
         self._spacy_nlp.clear()

         # Clear metrics
-        self._metrics = {
+        self._metrics = {"requests": 0, "cache_hits": 0, "processing_time": []}

         # Clear rate limiting data
         self._request_timestamps = []