crawlo 1.4.1__tar.gz → 1.4.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of crawlo might be problematic. Click here for more details.
- {crawlo-1.4.1/crawlo.egg-info → crawlo-1.4.2}/PKG-INFO +1 -1
- crawlo-1.4.2/crawlo/__version__.py +1 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/commands/run.py +1 -1
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/downloader/aiohttp_downloader.py +7 -2
- {crawlo-1.4.1 → crawlo-1.4.2/crawlo.egg-info}/PKG-INFO +1 -1
- crawlo-1.4.1/crawlo/__version__.py +0 -1
- {crawlo-1.4.1 → crawlo-1.4.2}/LICENSE +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/MANIFEST.in +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/README.md +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/cli.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/commands/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/commands/check.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/commands/genspider.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/commands/help.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/commands/list.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/commands/startproject.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/commands/stats.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/commands/utils.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/config.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/config_validator.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/core/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/core/engine.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/core/processor.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/core/scheduler.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/crawler.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/data/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/data/user_agents.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/downloader/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/downloader/cffi_downloader.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/downloader/httpx_downloader.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/downloader/hybrid_downloader.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/downloader/playwright_downloader.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/downloader/selenium_downloader.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/event.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/exceptions.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/extension/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/extension/health_check.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/extension/log_interval.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/extension/log_stats.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/extension/logging_extension.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/extension/memory_monitor.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/extension/performance_profiler.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/extension/request_recorder.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/factories/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/factories/base.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/factories/crawler.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/factories/registry.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/filters/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/filters/aioredis_filter.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/filters/memory_filter.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/framework.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/initialization/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/initialization/built_in.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/initialization/context.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/initialization/core.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/initialization/phases.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/initialization/registry.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/items/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/items/base.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/items/fields.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/items/items.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/logging/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/logging/config.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/logging/factory.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/logging/manager.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/middleware/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/middleware/default_header.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/middleware/download_delay.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/middleware/middleware_manager.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/middleware/offsite.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/middleware/proxy.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/middleware/request_ignore.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/middleware/response_code.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/middleware/response_filter.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/middleware/retry.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/middleware/simple_proxy.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/mode_manager.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/network/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/network/request.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/network/response.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/pipelines/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/pipelines/bloom_dedup_pipeline.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/pipelines/console_pipeline.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/pipelines/csv_pipeline.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/pipelines/database_dedup_pipeline.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/pipelines/json_pipeline.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/pipelines/memory_dedup_pipeline.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/pipelines/mongo_pipeline.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/pipelines/mysql_pipeline.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/pipelines/pipeline_manager.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/pipelines/redis_dedup_pipeline.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/project.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/queue/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/queue/pqueue.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/queue/queue_manager.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/queue/redis_priority_queue.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/settings/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/settings/default_settings.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/settings/setting_manager.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/spider/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/stats_collector.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/subscriber.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/task_manager.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/crawlo.cfg.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/project/__init__.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/project/items.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/project/middlewares.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/project/pipelines.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/project/settings.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/project/settings_distributed.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/project/settings_gentle.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/project/settings_high_performance.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/project/settings_minimal.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/project/settings_simple.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/project/spiders/__init__.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/run.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/spider/spider.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/templates/spiders_init.py.tmpl +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/anti_crawler.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/authenticated_proxy.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/data_formatter.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/data_validator.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/date_tools.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/distributed_coordinator.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/encoding_converter.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/network_diagnostic.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/request_tools.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/retry_mechanism.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/scenario_adapter.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/tools/text_cleaner.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/batch_processor.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/class_loader.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/controlled_spider_mixin.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/db_helper.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/enhanced_error_handler.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/env_config.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/error_handler.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/fingerprint.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/func_tools.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/large_scale_config.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/large_scale_helper.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/log.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/performance_monitor.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/queue_helper.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/redis_connection_pool.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/redis_key_validator.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/request.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/request_serializer.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/spider_loader.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/system.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/tools.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo/utils/url.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo.egg-info/SOURCES.txt +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo.egg-info/dependency_links.txt +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo.egg-info/entry_points.txt +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo.egg-info/requires.txt +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/crawlo.egg-info/top_level.txt +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/examples/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/examples/test_project/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/examples/test_project/run.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/examples/test_project/test_project/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/examples/test_project/test_project/items.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/examples/test_project/test_project/middlewares.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/examples/test_project/test_project/pipelines.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/examples/test_project/test_project/settings.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/examples/test_project/test_project/spiders/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/examples/test_project/test_project/spiders/of_week_dis.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/pyproject.toml +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/requirements.txt +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/setup.cfg +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/__init__.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/advanced_tools_example.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/authenticated_proxy_example.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/baidu_performance_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/baidu_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/cleaners_example.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/comprehensive_framework_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/comprehensive_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/comprehensive_testing_summary.md +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/config_validation_demo.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/controlled_spider_example.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/date_tools_example.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/debug_configure.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/debug_framework_logger.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/debug_log_config.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/debug_log_levels.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/debug_pipelines.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/detailed_log_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/distributed_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/distributed_test_debug.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/dynamic_loading_example.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/dynamic_loading_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/env_config_example.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/error_handling_example.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/final_command_test_report.md +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/final_comprehensive_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/final_log_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/final_validation_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/fix_log_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/framework_performance_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/log_buffering_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/log_generation_timing_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/optimized_performance_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/performance_comparison.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/queue_blocking_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/queue_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/redis_key_validation_demo.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/request_params_example.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/response_improvements_example.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/scrapy_comparison/ofweek_scrapy.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/scrapy_comparison/scrapy_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/simple_command_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/simple_crawlo_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/simple_log_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/simple_log_test2.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/simple_optimization_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/simple_queue_type_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/simple_spider_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/simple_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/spider_log_timing_test.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_advanced_tools.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_all_commands.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_all_pipeline_fingerprints.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_all_redis_key_configs.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_authenticated_proxy.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_batch_processor.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_cleaners.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_component_factory.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_comprehensive.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_config_consistency.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_config_merge.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_config_validator.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_controlled_spider_mixin.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_crawlo_proxy_integration.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_date_tools.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_dedup_fix.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_default_header_middleware.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_distributed.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_double_crawlo_fix.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_double_crawlo_fix_simple.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_download_delay_middleware.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_downloader_proxy_compatibility.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_dynamic_downloaders_proxy.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_dynamic_proxy.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_dynamic_proxy_config.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_dynamic_proxy_real.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_edge_cases.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_enhanced_error_handler.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_enhanced_error_handler_comprehensive.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_env_config.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_error_handler_compatibility.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_factories.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_final_validation.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_fingerprint_consistency.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_fingerprint_simple.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_framework_env_usage.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_framework_logger.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_framework_startup.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_get_component_logger.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_hash_performance.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_integration.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_item_dedup_redis_key.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_large_scale_config.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_large_scale_helper.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_logging_system.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_mode_change.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_mode_consistency.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_offsite_middleware.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_offsite_middleware_simple.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_parsel.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_performance.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_performance_monitor.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_pipeline_fingerprint_consistency.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_proxy_api.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_proxy_health_check.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_proxy_middleware.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_proxy_middleware_enhanced.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_proxy_middleware_integration.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_proxy_middleware_refactored.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_proxy_providers.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_proxy_stats.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_proxy_strategies.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_queue_empty_check.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_queue_manager_double_crawlo.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_queue_manager_redis_key.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_queue_naming.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_queue_type.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_random_user_agent.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_real_scenario_proxy.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_redis_config.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_redis_connection_pool.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_redis_key_naming.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_redis_key_validator.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_redis_queue.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_redis_queue_name_fix.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_request_ignore_middleware.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_request_params.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_request_serialization.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_response_code_middleware.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_response_filter_middleware.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_response_improvements.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_retry_middleware.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_scheduler.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_scheduler_config_update.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_simple_response.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_telecom_spider_redis_key.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_template_content.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_template_redis_key.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_tools.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/test_user_agents.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/tools_example.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/untested_features_report.md +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/verify_debug.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/verify_distributed.py +0 -0
- {crawlo-1.4.1 → crawlo-1.4.2}/tests/verify_log_fix.py +0 -0
|
@@ -0,0 +1 @@
|
|
|
1
|
+
__version__ = '1.4.2'
|
|
@@ -23,7 +23,7 @@ from crawlo.crawler import CrawlerProcess
|
|
|
23
23
|
from crawlo.project import get_settings, _find_project_root
|
|
24
24
|
# 使用新的统一初始化系统
|
|
25
25
|
from crawlo.initialization import initialize_framework
|
|
26
|
-
from crawlo.
|
|
26
|
+
from crawlo.core import get_framework_initializer
|
|
27
27
|
from crawlo.utils.log import get_logger
|
|
28
28
|
|
|
29
29
|
# 延迟获取logger,确保在日志系统配置之后获取
|
|
@@ -55,8 +55,13 @@ class AioHttpDownloader(DownloaderBase):
|
|
|
55
55
|
family=0, # 允许IPv4和IPv6
|
|
56
56
|
)
|
|
57
57
|
|
|
58
|
-
# 超时控制
|
|
59
|
-
timeout = ClientTimeout(
|
|
58
|
+
# 超时控制 - 增加更多超时设置
|
|
59
|
+
timeout = ClientTimeout(
|
|
60
|
+
total=timeout_secs,
|
|
61
|
+
connect=timeout_secs/2, # 连接超时
|
|
62
|
+
sock_read=timeout_secs, # 读取超时
|
|
63
|
+
sock_connect=timeout_secs/2 # socket连接超时
|
|
64
|
+
)
|
|
60
65
|
|
|
61
66
|
# 请求追踪
|
|
62
67
|
trace_config = TraceConfig()
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
__version__ = '1.4.1'
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|